Btech1007022 Lab5.1

The document contains three programs demonstrating data analysis and machine learning techniques using Python. Program 1 performs linear regression on salary data based on experience, Program 2 applies linear regression to an insurance dataset, and Program 3 implements logistic regression on the Iris dataset. Each program includes data loading, preprocessing, model training, and evaluation steps.


Name-Md Arbab

Roll - BTECH/10070/22

LAB-5

Program1:

import csv
import numpy as np
import matplotlib.pyplot as plt

# Load the data
data = []
with open('Salary_data.csv', 'r') as file:
    reader = csv.reader(file)
    next(reader)  # Skip header
    for row in reader:
        data.append([float(row[0]), float(row[1])])

# Separate the data into Experience (X) and Salary (Y)
X = np.array([row[0] for row in data])
Y = np.array([row[1] for row in data])

# Plot Experience vs. Salary
plt.scatter(X, Y, color='blue')
plt.xlabel('Experience (years)')
plt.ylabel('Salary')
plt.title('Experience vs. Salary')
plt.show()
# Initialize parameters
m = 0  # Slope
b = 0  # Intercept
learning_rate = 0.01
iterations = 1000
n = len(X)

# Function to compute Mean Squared Error
def compute_mse(X, Y, m, b):
    total_error = 0
    for i in range(len(X)):
        total_error += (Y[i] - (m * X[i] + b)) ** 2
    return total_error / n

# Gradient Descent
errors = []
for _ in range(iterations):
    m_grad = 0
    b_grad = 0
    for i in range(len(X)):
        m_grad += -2 * X[i] * (Y[i] - (m * X[i] + b))
        b_grad += -2 * (Y[i] - (m * X[i] + b))
    m -= (m_grad / n) * learning_rate
    b -= (b_grad / n) * learning_rate
    mse = compute_mse(X, Y, m, b)
    errors.append(mse)

print(f"Final Parameters: m = {m}, b = {b}")

# Plot Training Error at Each Iteration
plt.plot(range(iterations), errors, color='red')
plt.xlabel('Iteration')
plt.ylabel('Mean Squared Error')
plt.title('Training Error at Each Iteration')
plt.show()

# Plot Experience vs. Salary with Best Fit Line
plt.scatter(X, Y, color='blue')
plt.plot(X, [m * x + b for x in X], color='red')  # Best fit line
plt.xlabel('Experience (years)')
plt.ylabel('Salary')
plt.title('Experience vs. Salary with Best Fit Line')
plt.show()
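As a quick sanity check on the gradient-descent result (not part of the lab code), the same line can be fitted in closed form with NumPy's standard np.polyfit, assuming the X and Y arrays defined above:

# Closed-form least-squares fit for comparison; np.polyfit returns the
# coefficients of a degree-1 polynomial, highest power first: [slope, intercept]
m_ols, b_ols = np.polyfit(X, Y, 1)
print(f"Closed-form OLS: m = {m_ols}, b = {b_ols}")

If gradient descent has converged, m and b should be close to these values.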

OUTPUT:

Program2:

import pandas as pd
from sklearn.preprocessing import MinMaxScaler
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LinearRegression
from sklearn.metrics import mean_squared_error
# Load the dataset
data = pd.read_csv('insurance.csv')

# Display the top 10 samples of the dataset
print(data.head(10))

# Display the features and label
features = data.columns[:-1]
label = data.columns[-1]
print("Features (Independent Variables):", features.tolist())
print("Label (Dependent Variable):", label)

# Remove missing value samples
data = data.dropna()
print("Number of samples after removing missing values:", len(data))

# Convert categorical variables to numeric using one-hot encoding
data = pd.get_dummies(data, columns=['sex', 'smoker', 'region'], drop_first=True)

# Update the features to reflect the one-hot encoded columns.
# Note: get_dummies appends the new columns at the end, so the label is no
# longer the last column; select every column except the label instead of
# columns[:-1], which would leak the label into the feature set.
features = data.columns.drop(label)

# Normalize the feature set
scaler = MinMaxScaler()
data[features] = scaler.fit_transform(data[features])
print("Normalized feature set:")
print(data.head(10))
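To see what drop_first=True does, here is a small illustration on a made-up toy frame (not part of the lab data):

# Toy example: a 'smoker' column with values yes/no becomes one 0/1 column
toy = pd.DataFrame({'smoker': ['yes', 'no', 'yes']})
print(pd.get_dummies(toy, columns=['smoker'], drop_first=True))
# Only 'smoker_yes' remains; the dropped level ('no') acts as the baseline,
# which avoids redundant, perfectly correlated dummy columns.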

# Split the data into training and testing sets
X = data[features]
y = data[label]
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)
print("Number of training samples:", len(X_train))
print("Number of testing samples:", len(X_test))

# Train the regression model
model = LinearRegression()
model.fit(X_train, y_train)
print("Model coefficients:", model.coef_)
print("Model intercept:", model.intercept_)

# Predict the test data
y_pred = model.predict(X_test)

# Calculate and display the testing error (Mean Squared Error)
mse = mean_squared_error(y_test, y_pred)
print("Testing Error (Mean Squared Error):", mse)

OUTPUT:
Program3:

import pandas as pd
import numpy as np
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import LabelEncoder
from sklearn.metrics import accuracy_score

# Load the Iris dataset from the local CSV file
data = pd.read_csv('iris.csv')

# Display the top 10 samples of the dataset
print(data.head(10))

# Check the column names to identify the target variable
print("Column names:", data.columns)

# The target variable column name is 'Species'
target_variable = 'Species'

# Encode the class labels into numeric values
label_encoder = LabelEncoder()
data[target_variable] = label_encoder.fit_transform(data[target_variable])

# Split the data into features (X) and labels (y)
X = data.iloc[:, 1:-1]  # Exclude the 'Id' column and the target variable column
y = data.iloc[:, -1]

# Split the data into training and testing sets (80% training, 20% testing)
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)
# Logistic Regression implementation
# Note: this is a binary (single sigmoid output) logistic regression
# written from scratch and trained by gradient descent.
class LogisticRegression:

    def __init__(self, learning_rate=0.01, iterations=1000):
        self.learning_rate = learning_rate
        self.iterations = iterations

    def sigmoid(self, z):
        return 1 / (1 + np.exp(-z))

    def fit(self, X, y):
        self.m, self.n = X.shape
        self.weights = np.zeros(self.n)
        self.bias = 0
        self.errors = []
        epsilon = 1e-7  # Small epsilon value to avoid log(0)
        for _ in range(self.iterations):
            linear_model = np.dot(X, self.weights) + self.bias
            y_pred = self.sigmoid(linear_model)
            dw = (1 / self.m) * np.dot(X.T, (y_pred - y))
            db = (1 / self.m) * np.sum(y_pred - y)
            self.weights -= self.learning_rate * dw
            self.bias -= self.learning_rate * db
            loss = -(1 / self.m) * np.sum(y * np.log(y_pred + epsilon)
                                          + (1 - y) * np.log(1 - y_pred + epsilon))
            self.errors.append(loss)
    def predict(self, X):
        linear_model = np.dot(X, self.weights) + self.bias
        y_pred = self.sigmoid(linear_model)
        return [1 if i > 0.5 else 0 for i in y_pred]
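For reference, the quantity tracked in self.errors is the average binary cross-entropy, and the dw and db expressions in fit are its gradients, with \(\hat{y} = \sigma(Xw + b)\):

\[
L(w, b) = -\frac{1}{m}\sum_{i=1}^{m}\left[y_i \log \hat{y}_i + (1 - y_i)\log(1 - \hat{y}_i)\right], \qquad
\frac{\partial L}{\partial w} = \frac{1}{m} X^{\top}(\hat{y} - y), \qquad
\frac{\partial L}{\partial b} = \frac{1}{m}\sum_{i=1}^{m}(\hat{y}_i - y_i)
\]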

# Train the logistic regression model
log_reg = LogisticRegression(learning_rate=0.01, iterations=1000)
log_reg.fit(X_train, y_train)
print("Model weights:", log_reg.weights)
print("Model bias:", log_reg.bias)

# Predict the test data
y_pred = log_reg.predict(X_test)

# Calculate and display the accuracy
accuracy = accuracy_score(y_test, y_pred)
print("Accuracy:", accuracy)

OUTPUT:
