
Mlee Lab1

The document contains Python code for implementing various gradient descent algorithms (batch, stochastic, and mini-batch) for linear regression using a dataset loaded from a CSV file. It includes functions for calculating cost, mean absolute error, mean square error, correlation coefficient, and R-squared value, along with data normalization and splitting into training and testing sets. The code visualizes the cost over iterations and compares predicted outputs against actual outputs using various metrics.
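For reference, the objective the code minimizes is the ordinary least-squares cost, and batch gradient descent updates the weights with the averaged gradient. This is only a summary of what cost_function and batch_gradient_descent below compute, with m, alpha, X, y, and w used as in the code:

J(w) = \frac{1}{2m} \sum_{i=1}^{m} \left( x^{(i)} w - y^{(i)} \right)^{2}

w \leftarrow w - \frac{\alpha}{m} X^{\top} (X w - y)

Stochastic gradient descent applies the same update using a single randomly chosen sample (m = 1), and mini-batch gradient descent uses a randomly chosen contiguous slice of batch_size samples.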


from google.colab import drive
drive.mount('/content/drive')   # mount Google Drive so the CSV below is reachable

filepath = '/content/drive/MyDrive/data.csv'

import pandas as pd
import numpy as np
import matplotlib.pyplot as plt

data=pd.read_csv(filepath)

# Separate features (all columns but the last) from the target (last column)
X = data.iloc[:, :-1].values
y = data.iloc[:, -1].values

def cost_function(X, y, w):
    hypothesis = np.dot(X, w.T)
    J = (1 / (2 * len(y))) * np.sum((hypothesis - y) ** 2)
    return J

def batch_gradient_descent(X, y, w, alpha, iters):
    cost_history = np.zeros(iters)
    for i in range(iters):
        hypothesis = np.dot(X, w.T)
        w = w - (alpha / len(y)) * np.dot(hypothesis - y, X)
        cost_history[i] = cost_function(X, y, w)
    return w, cost_history

def stochastic_gradient_descent(X, y, w, alpha, iters):
    cost_history = np.zeros(iters)
    for i in range(iters):
        rand_index = np.random.randint(len(y))   # pick one random training sample
        ind_x = X[rand_index:rand_index + 1]
        ind_y = y[rand_index:rand_index + 1]
        w = w - alpha * np.dot(np.dot(ind_x, w.T) - ind_y, ind_x)
        cost_history[i] = cost_function(ind_x, ind_y, w)
    return w, cost_history

def MB_gradient_descent(X, y, w, alpha, iters, batch_size):
    cost_history = np.zeros(iters)
    for i in range(iters):
        # pick the start of a contiguous mini-batch (+1 keeps the last full batch reachable)
        rand_index = np.random.randint(len(y) - batch_size + 1)
        ind_x = X[rand_index:rand_index + batch_size]
        ind_y = y[rand_index:rand_index + batch_size]
        w = w - (alpha / batch_size) * (ind_x.T.dot(ind_x.dot(w) - ind_y))
        cost_history[i] = cost_function(ind_x, ind_y, w)
    return w, cost_history

def mean_abs_error(Ypred, Yact):
    abs_error = np.abs(Yact - Ypred)
    ma_error = np.sum(abs_error) / Ypred.shape[0]
    return ma_error

def mean_square_error(Ypred, Yact):
    # vectorized; the original per-sample loop recomputed the same array on every pass
    sq_error = (Yact - Ypred) ** 2
    ms_error = np.sum(sq_error) / Ypred.shape[0]
    return ms_error

def r_squared(y_true, y_pred):
    ss_total = np.sum((y_true - np.mean(y_true)) ** 2)
    ss_residual = np.sum((y_true - y_pred) ** 2)
    return 1 - (ss_residual / ss_total)

def correcoff(Ypred, Yact):
    ypm = np.mean(Ypred)   # mean of predicted values
    yam = np.mean(Yact)    # mean of actual values
    sum_numerator = np.sum((Yact - yam) * (Ypred - ypm))
    sum_d1 = np.sqrt(np.sum((Yact - yam) ** 2))
    sum_d2 = np.sqrt(np.sum((Ypred - ypm) ** 2))
    th_error = sum_numerator / (sum_d1 * sum_d2)
    return th_error
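As a quick sanity check, these hand-written metrics can be compared against library implementations. The snippet below is a minimal sketch with made-up placeholder arrays; scikit-learn is not used anywhere else in this notebook and is only an assumed optional dependency here:

import numpy as np
from sklearn.metrics import mean_absolute_error, mean_squared_error, r2_score

# placeholder arrays standing in for actual and predicted outputs
y_true = np.array([3.0, 2.5, 4.1, 3.7])
y_pred = np.array([2.8, 2.7, 3.9, 3.5])

print(mean_absolute_error(y_true, y_pred))   # should match mean_abs_error(y_pred, y_true)
print(mean_squared_error(y_true, y_pred))    # should match mean_square_error(y_pred, y_true)
print(r2_score(y_true, y_pred))              # should match r_squared(y_true, y_pred)
print(np.corrcoef(y_true, y_pred)[0, 1])     # should match correcoff(y_pred, y_true)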

X = data.iloc[:, :-1]   # all rows, all columns except the last
y = data.iloc[:, -1]    # the last column is the target

X = np.asarray(X)
y = np.asarray(y)

m = X.shape[0]
xmin = np.min(X, axis=0)
xmax = np.max(X, axis=0)
X_normalized = (X - xmin) / (xmax - xmin)   # min-max scale each feature to [0, 1]

ymin = np.min(y, axis=0)
ymax = np.max(y, axis=0)
y_normalized = (y - ymin) / (ymax - ymin)   # min-max scale the target to [0, 1]

m = X_normalized.shape[0]
pp = np.ones([m, 1])
X_normalized = np.append(pp, X_normalized, axis=1)   # prepend a bias column of ones

train_percentage = 0.70
train_size = int(len(X) * train_percentage)
# split the data into training and testing
X_train = X_normalized[:train_size]
y_train = y_normalized[:train_size]
X_test = X_normalized[train_size:]
y_test = y_normalized[train_size:]
print("Training Features Shape:", X_train.shape)
print("Testing Features Shape:", X_test.shape)
print("Training Target Shape:", y_train.shape)
print("Testing Target Shape:", y_test.shape)

Training Features Shape: (56, 9)
Testing Features Shape: (25, 9)
Training Target Shape: (56,)
Testing Target Shape: (25,)

w = np.zeros(X_normalized.shape[1])   # weight initialization
w.shape

(9,)

alpha = 0.4    # learning rate
iters = 1500   # iterations
batch_w,J_his = batch_gradient_descent(X_train,y_train,w,alpha,iters)
plt.plot(range(iters),J_his)
plt.xlabel('Iterations')
plt.ylabel('Cost')
plt.title('BGD Cost vs Iterations')
plt.show()
bgd=batch_w
print("WEIGHT VECTOR",bgd)

y_pred_bgd=X_test.dot(bgd.T)

WEIGHT VECTOR [0.21794334 0.10606424 0.0478828  0.03935448 0.03229864 0.03136558
 0.11796494 0.06546174 0.03341064]

yp_unnorm=(y_pred_bgd*(ymax-ymin))+ymin
y_test_unnorm=(y_test*(ymax-ymin))+ymin

a=mean_abs_error(yp_unnorm,y_test_unnorm)
print("MEAN ABSOLUTE ERROR",a)

MEAN ABSOLUTE ERROR 1.1326579129012353

b=mean_square_error(yp_unnorm,y_test_unnorm)
print("MEAN SQUARE ERROR:",b)

MEAN SQUARE ERROR: 1.819265635873902

c=correcoff(yp_unnorm,y_test_unnorm)
print("CORRELATION COEFF:",c)

CORRELATION COEFF: 0.2602600569650748

d=r_squared(y_test_unnorm, yp_unnorm)   # r_squared expects (y_true, y_pred)
print("R2:",d)

R2: -226.79600202581813

plt.figure(figsize=(8, 6))
plt.plot(y_test_unnorm, label='Actual Output', color='blue',
marker='o')
plt.plot(yp_unnorm, label='Predicted Output', color='red', marker='x')
plt.xlabel('Sample Index')
plt.ylabel('Output Value')
plt.title('Predicted vs Actual Output (Line Plot)')
plt.legend()
plt.show()
alpha=0.4
iters=5000 ###iterations
w_n_l2,J_sgd_l2 = stochastic_gradient_descent(X_train,y_train,w,alpha,
iters)
plt.plot(range(iters),J_sgd_l2)
plt.xlabel('Iterations')
plt.ylabel('Cost')
plt.title('SGD Cost vs Iterations')
plt.show()
sgd=w_n_l2
print("WEIGHT VECTOR",bgd)
y_pred_sgd=X_test.dot(sgd.T)
yp_unnorm=(y_pred_sgd*(ymax-ymin))+ymin
y_test_unnorm=(y_test*(ymax-ymin))+ymin
a=mean_abs_error(yp_unnorm,y_test_unnorm)
print("MEAN ABSOLUTE ERROR",a)

b=mean_square_error(yp_unnorm,y_test_unnorm)
print("MEAN SQUARE ERROR:",b)
c=correcoff(y_test_unnorm, yp_unnorm)
print("CORRELATION COEFF:",c)
d=r_squared(y_test_unnorm, yp_unnorm)   # r_squared expects (y_true, y_pred)
print("R2:",d)
plt.figure(figsize=(8, 6))
plt.plot(y_test_unnorm, label='Actual Output', color='blue',
marker='o')
plt.plot(yp_unnorm, label='Predicted Output', color='red', marker='x')
plt.xlabel('Sample Index')
plt.ylabel('Output Value')
plt.title('Predicted vs Actual Output (Line Plot)')
plt.legend()
plt.show()

WEIGHT VECTOR [0.21794334 0.10606424 0.0478828  0.03935448 0.03229864 0.03136558
 0.11796494 0.06546174 0.03341064]
MEAN ABSOLUTE ERROR 0.9617008469068318
MEAN SQUARE ERROR: 1.6948874101095208
CORRELATION COEFF: 0.7968621371120339
R2: -6.284048634553031
alpha=0.4
iters=2000 ###iterations
batch_size=15
mb_w_l1,J_mb_l1 = MB_gradient_descent(X_train,y_train,w,alpha, iters,
batch_size)
plt.plot(range(iters),J_mb_l1)
plt.xlabel('Iterations')
plt.ylabel('Cost')
plt.title('MBGD Cost vs Iterations')
plt.show()
mbgd=mb_w_l1

print("WEIGHT VECTOR",bgd)
y_pred_mbgd=X_test.dot(mbgd.T)
yp_unnorm=(y_pred_mbgd*(ymax-ymin))+ymin
y_test_unnorm=(y_test*(ymax-ymin))+ymin
a=mean_abs_error(yp_unnorm,y_test_unnorm)
print("MEAN ABSOLUTE ERROR",a)
b=mean_square_error(yp_unnorm,y_test_unnorm)
print("MEAN SQUARE ERROR:",b)
c=correcoff(yp_unnorm,y_test_unnorm)
print("CORRELATION COEFF:",c)
d=r_squared(y_test_unnorm, yp_unnorm)   # r_squared expects (y_true, y_pred)
print("R2:",d)
plt.figure(figsize=(8, 6))
plt.plot(y_test_unnorm, label='Actual Output', color='blue',
marker='o')
plt.plot(yp_unnorm, label='Predicted Output', color='red', marker='x')
plt.xlabel('Sample Index')
plt.ylabel('Output Value')
plt.title('Predicted vs Actual Output')
plt.legend()
plt.show()

WEIGHT VECTOR [0.21794334 0.10606424 0.0478828  0.03935448 0.03229864 0.03136558
 0.11796494 0.06546174 0.03341064]
MEAN ABSOLUTE ERROR 1.0860545963179458
MEAN SQUARE ERROR: 1.7247709330182672
CORRELATION COEFF: 0.39688976236696366
R2: -293.6095175999243
