0% found this document useful (0 votes)

10 views5 pages

Naive Bayes

Uploaded by

trishakhimesra

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as ODT, PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

10 views5 pages

Naive Bayes

Uploaded by

trishakhimesra

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as ODT, PDF, TXT or read online on Scribd

You are on page 1/ 5

import pandas as pd

from sklearn.model_selection import train_test_split

from sklearn.preprocessing import LabelEncoder
from sklearn.naive_bayes import GaussianNB
from sklearn.metrics import accuracy_score, classification_report
from sklearn.preprocessing import StandardScaler

# Load the Social Network Ads dataset.
# The path literal is kept on a single line: splitting it across two lines
# leaves an unterminated string and the script fails to parse.
file_path = '../ML Prac/LP-1 Dataset/Decision Tree & Naive Bayes Classification/Social_Network_Ads.csv'
df = pd.read_csv(file_path)

# Preprocess the data

# Encode the categorical 'Gender' column as integers. The fitted encoder is
# kept so that user input can be encoded with the same mapping later on.
label_encoder = LabelEncoder()
df['Gender'] = label_encoder.fit_transform(df['Gender'])

# Separate features (X) and labels (y)
X = df[['Gender', 'Age', 'EstimatedSalary']]  # Features
y = df['Purchased']  # Labels

# Split BEFORE scaling. Fitting the scaler on the whole dataset would let the
# test rows contribute to the mean/std used for preprocessing (data leakage).
# The same random_state and row count give the same train/test partition as
# splitting the already-scaled matrix did.
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Learn the scaling statistics from the training rows only, then apply the
# same transformation to the held-out rows.
scaler = StandardScaler()
X_train = scaler.fit_transform(X_train)
X_test = scaler.transform(X_test)

# Full feature matrix on the training scale, kept under its original name for
# any later code that still refers to X_scaled.
X_scaled = scaler.transform(X)

# Fit a Gaussian Naive Bayes model on the training split; fit() returns the
# estimator itself, so construction and training can be chained.
nb_classifier = GaussianNB().fit(X_train, y_train)

# Score the held-out split.
y_pred = nb_classifier.predict(X_test)
accuracy = accuracy_score(y_test, y_pred)
# zero_division=1 is passed so that a metric with a zero denominator is
# reported as 1 by classification_report.
report = classification_report(y_test, y_pred, zero_division=1)

# Emit the accuracy, a heading and the per-class report, one per line.
print(f'Accuracy: {accuracy}', 'Classification Report:', report, sep='\n')

# Take input from the user for prediction (for demonstration purposes)
# Get gender as 'Male' or 'Female', and age and salary
user_gender = input("Enter Gender (Male/Female): ")
user_age = float(input("Enter Age: "))
user_salary = float(input("Enter Estimated Salary: "))

# Encode gender with the encoder fitted on the dataset. LabelEncoder assigns
# codes in sorted label order (so Female=0, Male=1 if those are the labels in
# the CSV). The lookup is case- and whitespace-insensitive so that "male" or
# " Male " is accepted instead of failing as an unseen label.
known_genders = {str(label).strip().lower(): label for label in label_encoder.classes_}
gender_key = user_gender.strip().lower()
if gender_key not in known_genders:
    raise ValueError(
        f"Unknown gender {user_gender!r}; expected one of {list(label_encoder.classes_)}"
    )
user_gender_encoded = label_encoder.transform([known_genders[gender_key]])[0]

# Scale the user's input. The scaler was fitted on a DataFrame, so the single
# row is passed with the same column names; a bare nested list triggers
# scikit-learn's "X does not have valid feature names" warning.
user_features = pd.DataFrame(
    [[user_gender_encoded, user_age, user_salary]],
    columns=X.columns,
)
user_input = scaler.transform(user_features)

# Predict whether the user will purchase
user_prediction = nb_classifier.predict(user_input)

# Print the prediction result
print(f"Prediction: {'Purchased' if user_prediction[0] == 1 else 'Not Purchased'}")

# Import necessary libraries

import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler
from sklearn.naive_bayes import GaussianNB
from sklearn.metrics import accuracy_score, classification_report

# Load the CSV file, skipping the initial lines with descriptions.
# The path literal is kept on a single line: splitting it across two lines
# leaves an unterminated string and the script fails to parse.
file_path = '../ML Prac/LP-1 Dataset/Decision Tree & Naive Bayes Classification/pima-indians-diabetes.csv'
df = pd.read_csv(file_path, header=None, skiprows=9)

# Assign column names based on dataset attributes. The names are written
# without surrounding whitespace, so no separate strip step is needed.
df.columns = [
    'Pregnancies', 'Glucose', 'BloodPressure', 'SkinThickness', 'Insulin',
    'BMI', 'DiabetesPedigreeFunction', 'Age', 'Outcome',
]

# Handle missing values (drop rows with missing values for simplicity)
df = df.dropna()

# Separate features (X) and labels (y)
X = df[['Pregnancies', 'Glucose', 'BloodPressure', 'SkinThickness', 'Insulin',
        'BMI', 'DiabetesPedigreeFunction', 'Age']]  # Features
y = df['Outcome']  # Labels

# Split BEFORE scaling. Fitting the scaler on the whole dataset would let the
# test rows contribute to the mean/std used for preprocessing (data leakage).
# The same random_state and row count give the same train/test partition as
# splitting the already-scaled matrix did.
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Learn the scaling statistics from the training rows only, then apply the
# same transformation to the held-out rows.
scaler = StandardScaler()
X_train = scaler.fit_transform(X_train)
X_test = scaler.transform(X_test)

# Full feature matrix on the training scale, kept under its original name for
# any later code that still refers to X_scaled.
X_scaled = scaler.transform(X)

# Build the Gaussian Naive Bayes model and train it on the training split.
nb_classifier = GaussianNB()
nb_classifier.fit(X_train, y_train)

# Predict the held-out split once and derive both metrics from it.
y_pred = nb_classifier.predict(X_test)
accuracy = accuracy_score(y_test, y_pred)
# zero_division=1 is passed so that a metric with a zero denominator is
# reported as 1 by classification_report.
report = classification_report(y_test, y_pred, zero_division=1)

# Print the accuracy line, the heading, then the report itself.
for output_line in (f'Accuracy: {accuracy}', 'Classification Report:', report):
    print(output_line)

# Take input from the user for prediction (for demonstration purposes)
user_pregnancies = int(input("Enter Number of Pregnancies: "))
user_glucose = int(input("Enter Plasma Glucose Concentration (2 hours in OGTT): "))
user_blood_pressure = int(input("Enter Diastolic Blood Pressure (mm Hg): "))
user_skin_thickness = int(input("Enter Triceps Skin Fold Thickness (mm): "))
user_insulin = int(input("Enter 2-Hour Serum Insulin (mu U/ml): "))
user_bmi = float(input("Enter Body Mass Index (BMI): "))
user_diabetes_pedigree = float(input("Enter Diabetes Pedigree Function: "))
user_age = int(input("Enter Age (years): "))

# Build a one-row frame for the user input, in the same column order as the
# training features. The scaler was fitted on a DataFrame, so passing the row
# with matching column names avoids scikit-learn's "X does not have valid
# feature names" warning that a bare nested list triggers.
user_input = pd.DataFrame(
    [[user_pregnancies, user_glucose, user_blood_pressure, user_skin_thickness,
      user_insulin, user_bmi, user_diabetes_pedigree, user_age]],
    columns=X.columns,
)

# Scale the user's input with the statistics learned during training
user_input_scaled = scaler.transform(user_input)

# Predict whether the user has diabetes
user_prediction = nb_classifier.predict(user_input_scaled)

# Print the prediction result
print(f"Prediction: {'Diabetic' if user_prediction[0] == 1 else 'Not Diabetic'}")
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import LabelEncoder
from sklearn.naive_bayes import GaussianNB
from sklearn.metrics import accuracy_score, classification_report
from sklearn.preprocessing import StandardScaler

# Load the CSV file.
# Adjust the path below so that it points at your copy of NaiveBayes.csv.
file_path = '../ML Prac/LP-1 Dataset/Decision Tree & Naive Bayes Classification/NaiveBayes.csv'
df = pd.read_csv(file_path)

# Strip any leading/trailing spaces from the column names so the lookups
# below match even if the CSV header is padded.
df.columns = df.columns.str.strip()

# Separate features (X) and labels (y)
X = df[['Age', 'Salary']]  # Features: Age and Salary
y = df['Purchased']  # Labels: Purchased

# Split BEFORE scaling. Fitting the scaler on the whole dataset would let the
# test rows contribute to the mean/std used for preprocessing (data leakage).
# The same random_state and row count give the same train/test partition as
# splitting the already-scaled matrix did.
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Learn the scaling statistics from the training rows only, then apply the
# same transformation to the held-out rows.
scaler = StandardScaler()
X_train = scaler.fit_transform(X_train)
X_test = scaler.transform(X_test)

# Full feature matrix on the training scale, kept under its original name for
# any later code that still refers to X_scaled.
X_scaled = scaler.transform(X)

# Train Gaussian Naive Bayes on the training split (fit() hands back the
# fitted estimator, so it can be bound directly).
nb_classifier = GaussianNB().fit(X_train, y_train)

# Predictions for the held-out split.
y_pred = nb_classifier.predict(X_test)

# Overall accuracy plus the per-class precision/recall/F1 table.
# zero_division=1 is passed so that a metric with a zero denominator is
# reported as 1 by classification_report.
accuracy = accuracy_score(y_test, y_pred)
report = classification_report(y_test, y_pred, zero_division=1)

# Write the results as three newline-separated pieces, ending with a newline.
print('\n'.join([f'Accuracy: {accuracy}', 'Classification Report:', str(report)]))

Decision Trees
No ratings yet
Decision Trees
28 pages
Diabetes Case Study - Jupyter Notebook
100% (1)
Diabetes Case Study - Jupyter Notebook
10 pages
ML Cheatsheet
No ratings yet
ML Cheatsheet
4 pages
Machine Learning
100% (1)
Machine Learning
21 pages
AI and ML Lab Manual
No ratings yet
AI and ML Lab Manual
29 pages
Lab Manual - MachineLearningLaboratory-DR - Vaishnavi
No ratings yet
Lab Manual - MachineLearningLaboratory-DR - Vaishnavi
71 pages
ML Lab Experiments (1) - Pages-3
No ratings yet
ML Lab Experiments (1) - Pages-3
11 pages
Logistic Regression vs. SVMs - Solution
No ratings yet
Logistic Regression vs. SVMs - Solution
7 pages
ML File External File
No ratings yet
ML File External File
25 pages
20MIS7043 (LAB 7) .Ipynb Colaboratory
No ratings yet
20MIS7043 (LAB 7) .Ipynb Colaboratory
4 pages
20MIS7095 (LAB 7) .Ipynb Colaboratory
No ratings yet
20MIS7095 (LAB 7) .Ipynb Colaboratory
4 pages
Ai 5
No ratings yet
Ai 5
7 pages
Example - 1
No ratings yet
Example - 1
5 pages
Naive Bayes
No ratings yet
Naive Bayes
9 pages
Generative AI Binary Classification
No ratings yet
Generative AI Binary Classification
7 pages
Diabetes Classification Report
No ratings yet
Diabetes Classification Report
17 pages
ML Lab PT
No ratings yet
ML Lab PT
25 pages
Data Mining Journal 5 Kashan
No ratings yet
Data Mining Journal 5 Kashan
7 pages
Diabetic Prediction Using LogicalRegression
No ratings yet
Diabetic Prediction Using LogicalRegression
9 pages
Naive Bayes Numericals
No ratings yet
Naive Bayes Numericals
9 pages
Classification Demo
No ratings yet
Classification Demo
4 pages
SL Classification For Data Science..
No ratings yet
SL Classification For Data Science..
4 pages
Assignment 2
No ratings yet
Assignment 2
4 pages
Machine NB + Lda Second Try
No ratings yet
Machine NB + Lda Second Try
5 pages
Mllabprog 5
No ratings yet
Mllabprog 5
6 pages
Allcodesml 2
No ratings yet
Allcodesml 2
10 pages
AI ML - Cycle 2 Programs
No ratings yet
AI ML - Cycle 2 Programs
15 pages
Import As From Import From Import From Import From Import From Import From Import From Import From Import From Import From Import Import As
No ratings yet
Import As From Import From Import From Import From Import From Import From Import From Import From Import From Import From Import Import As
8 pages
Practical 3
No ratings yet
Practical 3
11 pages
Class-Work-Naive-Bayes (21-10-2024)
No ratings yet
Class-Work-Naive-Bayes (21-10-2024)
5 pages
Bacdeaf 23032025 115708 Split 1
No ratings yet
Bacdeaf 23032025 115708 Split 1
37 pages
Aiml Ex 4-7
No ratings yet
Aiml Ex 4-7
8 pages
Assignment - 01
No ratings yet
Assignment - 01
4 pages
Sodapdf
No ratings yet
Sodapdf
1 page
Naive Bayes Classification
No ratings yet
Naive Bayes Classification
8 pages
W8 Naive Bayes Lab
No ratings yet
W8 Naive Bayes Lab
4 pages
Atul MLT Exp 4-11
No ratings yet
Atul MLT Exp 4-11
17 pages
Amlnew
No ratings yet
Amlnew
25 pages
Purva Rawale - BDA Practical No 2
No ratings yet
Purva Rawale - BDA Practical No 2
9 pages
Prediction Diabetic NBayes
No ratings yet
Prediction Diabetic NBayes
3 pages
Deep Learning Approach For Diabetes Prediction Using PIMA Indian Dataset
No ratings yet
Deep Learning Approach For Diabetes Prediction Using PIMA Indian Dataset
3 pages
Data Pipeline in ML
No ratings yet
Data Pipeline in ML
3 pages
23UCC554
No ratings yet
23UCC554
9 pages
Naive Bayes Program Machine Learning
No ratings yet
Naive Bayes Program Machine Learning
1 page
DA Pr6 Output
No ratings yet
DA Pr6 Output
1 page
Aiml Programs
No ratings yet
Aiml Programs
12 pages
Exp 4 ML
No ratings yet
Exp 4 ML
3 pages
Untitled5.Ipynb - Colab
No ratings yet
Untitled5.Ipynb - Colab
1 page
LAB08 Bayes Theory
No ratings yet
LAB08 Bayes Theory
4 pages
Liner Regression Chapter N3
No ratings yet
Liner Regression Chapter N3
2 pages
AI Assignment-6
No ratings yet
AI Assignment-6
7 pages
ML External Xerox
No ratings yet
ML External Xerox
1 page
P 7
No ratings yet
P 7
5 pages
Prog 6
No ratings yet
Prog 6
3 pages
BTVN6 Code
No ratings yet
BTVN6 Code
2 pages
ML Lab Exp
No ratings yet
ML Lab Exp
7 pages
Dia PGM
No ratings yet
Dia PGM
2 pages
Bagging Codes
No ratings yet
Bagging Codes
1 page
Diabeties SVM
No ratings yet
Diabeties SVM
2 pages

Naive Bayes

Uploaded by

Naive Bayes

Uploaded by

import pandas as pd

from sklearn.model_selection import train_test_split

# Load the CSV file

# Preprocess the data

# Separate features (X) and labels (y)

# Scale the features for better model performance

# Split the data into training and testing sets

# Train the Naive Bayes classifier (GaussianNB for numerical data)

# Predict on the test set

# Evaluate the model's performance

# Print the results

# Encode gender (Male=1, Female=0)

# Predict whether the user will purchase

# Print the prediction result

# Import necessary libraries

# Assign column names based on dataset attributes

# Strip any leading/trailing spaces from the column names

# Separate features (X) and labels (y)

# Split the data into training and testing sets

# Train the Naive Bayes classifier (GaussianNB for numerical data)

# Predict on the test set

# Evaluate the model's performance

# Print the results

# Create a list for the user input

# Scale the user's input

# Predict whether the user has diabetes

# Print the prediction result

# Load the CSV file

# Strip any leading/trailing spaces from the column names

# Separate features (X) and labels (y)

# Scale the features for better model performance

# Split the data into training and testing sets

# Train the Naive Bayes classifier (GaussianNB for numerical data)

# Predict on the test set

# Evaluate the model's performance

# Print the results

You might also like