Btech1007022 Lab5

The document contains three separate programs focused on data analysis and machine learning. Program 1 implements linear regression to predict salary based on experience, Program 2 uses linear regression on an insurance dataset, and Program 3 applies logistic regression to classify species in the Iris dataset. Each program includes data loading, preprocessing, model training, and evaluation steps.


Name - Ankit Kumar

Roll - BTECH/10066/22

LAB-5

Program 1:

import csv
import numpy as np
import matplotlib.pyplot as plt

# Load the data
data = []
with open('Salary_data.csv', 'r') as file:
    reader = csv.reader(file)
    next(reader)  # Skip header
    for row in reader:
        data.append([float(row[0]), float(row[1])])

# Separate the data into Experience (X) and Salary (Y)
X = np.array([row[0] for row in data])
Y = np.array([row[1] for row in data])

# Plot Experience vs. Salary
plt.scatter(X, Y, color='blue')
plt.xlabel('Experience (years)')
plt.ylabel('Salary')
plt.title('Experience vs. Salary')
plt.show()

# Initialize parameters
m = 0  # Slope
b = 0  # Intercept
learning_rate = 0.01
iterations = 1000
n = len(X)

# Function to compute Mean Squared Error
def compute_mse(X, Y, m, b):
    total_error = 0
    for i in range(len(X)):
        total_error += (Y[i] - (m * X[i] + b)) ** 2
    return total_error / n

# Gradient Descent
errors = []
for _ in range(iterations):
    m_grad = 0
    b_grad = 0
    for i in range(len(X)):
        m_grad += -2 * X[i] * (Y[i] - (m * X[i] + b))
        b_grad += -2 * (Y[i] - (m * X[i] + b))
    m -= (m_grad / n) * learning_rate
    b -= (b_grad / n) * learning_rate
    mse = compute_mse(X, Y, m, b)
    errors.append(mse)

print(f"Final Parameters: m = {m}, b = {b}")

# Plot Training Error at Each Iteration
plt.plot(range(iterations), errors, color='red')
plt.xlabel('Iteration')
plt.ylabel('Mean Squared Error')
plt.title('Training Error at Each Iteration')
plt.show()

# Plot Experience vs. Salary with Best Fit Line
plt.scatter(X, Y, color='blue')
plt.plot(X, [m * x + b for x in X], color='red')  # Best fit line
plt.xlabel('Experience (years)')
plt.ylabel('Salary')
plt.title('Experience vs. Salary with Best Fit Line')
plt.show()
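Once training has finished, predicting a salary for an unseen experience value is just the fitted line evaluated at that point. A small illustrative example (the value of 5 years is hypothetical, not taken from the dataset):

# Hypothetical example: predict the salary for 5 years of experience using the fitted line
years = 5
predicted_salary = m * years + b
print(f"Predicted salary for {years} years of experience: {predicted_salary:.2f}")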

OUTPUT:
Program 2:
import pandas as pd
from sklearn.preprocessing import MinMaxScaler
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LinearRegression
from sklearn.metrics import mean_squared_error

# Load the dataset
data = pd.read_csv('insurance.csv')

# Display the top 10 samples of the dataset
print(data.head(10))

# Display the features and label
features = data.columns[:-1]
label = data.columns[-1]
print("Features (Independent Variables):", features.tolist())
print("Label (Dependent Variable):", label)

# Remove missing value samples
data = data.dropna()
print("Number of samples after removing missing values:", len(data))

# Convert categorical variables to numeric using one-hot encoding
data = pd.get_dummies(data, columns=['sex', 'smoker', 'region'], drop_first=True)
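
# Illustrative aside (not part of the original lab code): what get_dummies with
# drop_first=True does on a tiny made-up frame. Each categorical column is replaced
# by indicator columns for all but its first category.
toy = pd.DataFrame({'sex': ['male', 'female'], 'smoker': ['yes', 'no'], 'charges': [200.0, 150.0]})
print(pd.get_dummies(toy, columns=['sex', 'smoker'], drop_first=True))  # columns: charges, sex_male, smoker_yes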

# Update the features to reflect the one-hot encoded columns
# (take every column except the label, since get_dummies appends the new
# indicator columns after the original numeric columns)
features = data.columns.drop(label)

# Normalize the feature set
scaler = MinMaxScaler()
data[features] = scaler.fit_transform(data[features])
print("Normalized feature set:")
print(data.head(10))

# Split the data into training and testing sets
X = data[features]
y = data[label]
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)
print("Number of training samples:", len(X_train))
print("Number of testing samples:", len(X_test))

# Train the regression model
model = LinearRegression()
model.fit(X_train, y_train)
print("Model coefficients:", model.coef_)
print("Model intercept:", model.intercept_)

# Predict the test data
y_pred = model.predict(X_test)

# Calculate and display the testing error (Mean Squared Error)
mse = mean_squared_error(y_test, y_pred)
print("Testing Error (Mean Squared Error):", mse)

OUTPUT:
Program 3:
import pandas as pd
import numpy as np
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import LabelEncoder
from sklearn.metrics import accuracy_score

# Load the Iris dataset from the local CSV file
data = pd.read_csv('iris.csv')

# Display the top 10 samples of the dataset
print(data.head(10))

# Check the column names to identify the target variable
print("Column names:", data.columns)

# The target variable column name is 'Species'
target_variable = 'Species'

# Encode the class labels into numeric values
label_encoder = LabelEncoder()
data[target_variable] = label_encoder.fit_transform(data[target_variable])

# Split the data into features (X) and labels (y)
X = data.iloc[:, 1:-1]  # Exclude the 'Id' column and the target variable column
y = data.iloc[:, -1]

# Split the data into training and testing sets (80% training, 20% testing)
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Logistic Regression implementation
class LogisticRegression:
    def __init__(self, learning_rate=0.01, iterations=1000):
        self.learning_rate = learning_rate
        self.iterations = iterations

    def sigmoid(self, z):
        return 1 / (1 + np.exp(-z))

    def fit(self, X, y):
        self.m, self.n = X.shape
        self.weights = np.zeros(self.n)
        self.bias = 0
        self.errors = []
        epsilon = 1e-7  # Small epsilon value to avoid log(0)

        for _ in range(self.iterations):
            linear_model = np.dot(X, self.weights) + self.bias
            y_pred = self.sigmoid(linear_model)

            # Gradients of the binary cross-entropy loss
            dw = (1 / self.m) * np.dot(X.T, (y_pred - y))
            db = (1 / self.m) * np.sum(y_pred - y)

            self.weights -= self.learning_rate * dw
            self.bias -= self.learning_rate * db

            # Binary cross-entropy loss for this iteration
            loss = -(1 / self.m) * np.sum(y * np.log(y_pred + epsilon) + (1 - y) * np.log(1 - y_pred + epsilon))
            self.errors.append(loss)

    def predict(self, X):
        linear_model = np.dot(X, self.weights) + self.bias
        y_pred = self.sigmoid(linear_model)
        return [1 if i > 0.5 else 0 for i in y_pred]
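The fit method above performs gradient descent on the binary cross-entropy loss. With predictions $\hat{y} = \sigma(Xw + b)$, the quantities computed in the loop correspond to

$$
L = -\frac{1}{m}\sum_{i=1}^{m}\Bigl[y_i\log\hat{y}_i + (1-y_i)\log(1-\hat{y}_i)\Bigr],
\qquad
\nabla_w L = \frac{1}{m}X^{\top}(\hat{y}-y),
\qquad
\frac{\partial L}{\partial b} = \frac{1}{m}\sum_{i=1}^{m}(\hat{y}_i - y_i).
$$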

# Train the logistic regression model
log_reg = LogisticRegression(learning_rate=0.01, iterations=1000)
log_reg.fit(X_train, y_train)
print("Model weights:", log_reg.weights)
print("Model bias:", log_reg.bias)

# Predict the test data
y_pred = log_reg.predict(X_test)

# Calculate and display the accuracy
accuracy = accuracy_score(y_test, y_pred)
print("Accuracy:", accuracy)

OUTPUT:
