
ADALINE with Stochastic Gradient Descent (Minibatch)

In this notebook, we implement ADALINE "by hand," without using PyTorch's autograd capabilities. In Lecture 06, we will use automatic differentiation (also known as "autodiff"; autograd in PyTorch) to implement ADALINE more compactly. The reason we avoid autodiff here is that it is useful to understand what is going on under the hood.
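
For reference (a brief recap in standard notation, not part of the original notebook): ADALINE computes a linear net input and is trained by minimizing the mean squared error, so the gradients implemented manually below follow directly from the chain rule:

$$\hat{\mathbf{y}} = \mathbf{X}\mathbf{w} + b, \qquad \mathcal{L}(\mathbf{w}, b) = \frac{1}{n}\sum_{i=1}^{n}\bigl(\hat{y}^{(i)} - y^{(i)}\bigr)^2$$

$$\frac{\partial \mathcal{L}}{\partial \mathbf{w}} = \frac{2}{n}\,\mathbf{X}^\top\bigl(\hat{\mathbf{y}} - \mathbf{y}\bigr), \qquad \frac{\partial \mathcal{L}}{\partial b} = \frac{2}{n}\sum_{i=1}^{n}\bigl(\hat{y}^{(i)} - y^{(i)}\bigr)$$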

import pandas as pd
import matplotlib.pyplot as plt
import torch
%matplotlib inline

Load & Prepare a Toy Dataset


df = pd.read_csv('./datasets/iris.data', index_col=None, header=None)
df.columns = ['x1', 'x2', 'x3', 'x4', 'y']

# Keep only the Iris-versicolor and Iris-virginica rows (a binary problem)
df = df.iloc[50:150]
df['y'] = df['y'].apply(lambda x: 0 if x == 'Iris-versicolor' else 1)
df.tail()

      x1   x2   x3   x4  y
145  6.7  3.0  5.2  2.3  1
146  6.3  2.5  5.0  1.9  1
147  6.5  3.0  5.2  2.0  1
148  6.2  3.4  5.4  2.3  1
149  5.9  3.0  5.1  1.8  1
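
If the local ./datasets/iris.data file is not available, the same subset can be rebuilt from scikit-learn's bundled copy of the Iris dataset (a sketch, not part of the original notebook; it assumes scikit-learn is installed):

from sklearn.datasets import load_iris

# Rebuild the same DataFrame layout from scikit-learn's copy of Iris
iris = load_iris()
df = pd.DataFrame(iris.data, columns=['x1', 'x2', 'x3', 'x4'])
df['y'] = iris.target
df = df.iloc[50:150]                   # keep versicolor (1) and virginica (2)
df['y'] = (df['y'] == 2).astype(int)   # versicolor -> 0, virginica -> 1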

# Assign features and target
X = torch.tensor(df[['x2', 'x3']].values, dtype=torch.float)
y = torch.tensor(df['y'].values, dtype=torch.int)

# Shuffling & train/test split
torch.manual_seed(123)
shuffle_idx = torch.randperm(y.size(0), dtype=torch.long)

X, y = X[shuffle_idx], y[shuffle_idx]

percent70 = int(shuffle_idx.size(0)*0.7)

X_train, X_test = X[shuffle_idx[:percent70]], X[shuffle_idx[percent70:]]
y_train, y_test = y[shuffle_idx[:percent70]], y[shuffle_idx[percent70:]]

# Normalize (mean zero, unit variance)
mu, sigma = X_train.mean(dim=0), X_train.std(dim=0)

# Use the training-set statistics for both splits to avoid test-set leakage
X_train = (X_train - mu) / sigma
X_test = (X_test - mu) / sigma
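
A quick sanity check (not in the original) confirms the standardization:

# Training features should now have mean ~0 and standard deviation ~1
print(X_train.mean(dim=0))  # expected: values close to 0
print(X_train.std(dim=0))   # expected: values close to 1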

plt.scatter(X_train[y_train == 0, 0], X_train[y_train == 0, 1], label='class 0')
plt.scatter(X_train[y_train == 1, 0], X_train[y_train == 1, 1], label='class 1')
plt.legend()
plt.show()

plt.scatter(X_test[y_test == 0, 0], X_test[y_test == 0, 1], label='class 0')
plt.scatter(X_test[y_test == 1, 0], X_test[y_test == 1, 1], label='class 1')
plt.legend()
plt.show()

Implement ADALINE Model


class Adaline1():
    def __init__(self, num_features):
        self.num_features = num_features
        self.weights = torch.zeros(num_features, 1, dtype=torch.float)
        self.bias = torch.zeros(1, dtype=torch.float)

    def forward(self, x):
        # Linear net input; ADALINE uses the identity activation
        netinputs = torch.add(torch.mm(x, self.weights), self.bias)
        activations = netinputs
        return activations.view(-1)

    def backward(self, x, yhat, y):
        # Derivative of the MSE loss w.r.t. the predictions
        grad_loss_yhat = 2*(yhat - y)

        # Derivatives of the predictions w.r.t. weights and bias
        grad_yhat_weights = x
        grad_yhat_bias = 1.

        # Chain rule: inner times outer, averaged over the minibatch
        grad_loss_weights = torch.mm(grad_yhat_weights.t(),
                                     grad_loss_yhat.view(-1, 1)) / y.size(0)
        grad_loss_bias = torch.sum(grad_yhat_bias*grad_loss_yhat) / y.size(0)

        # Return the negative gradient for the gradient *descent* update
        return (-1)*grad_loss_weights, (-1)*grad_loss_bias
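
As a sanity check (a sketch, not part of the original notebook), the manual gradients can be compared against PyTorch's autograd on a small minibatch; the two should agree up to floating-point error:

# Compare manual gradients with autograd on one minibatch
model_check = Adaline1(num_features=2)
x_batch, y_batch = X_train[:10], y_train[:10].float()

yhat = model_check.forward(x_batch)
neg_grad_w, neg_grad_b = model_check.backward(x_batch, yhat, y_batch)

# Same computation via autograd
w = model_check.weights.clone().requires_grad_(True)
b = model_check.bias.clone().requires_grad_(True)
mse = torch.mean(((torch.mm(x_batch, w) + b).view(-1) - y_batch)**2)
mse.backward()

print(torch.allclose(-neg_grad_w, w.grad))  # expected: True
print(torch.allclose(-neg_grad_b, b.grad))  # expected: True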

Define Training and Evaluation Functions


####################################################
##### Training and evaluation wrappers
####################################################

def loss(yhat, y):
    # Mean squared error
    return torch.mean((yhat - y)**2)


def train(model, x, y, num_epochs,
          learning_rate=0.01, seed=123, minibatch_size=10):
    cost = []
    torch.manual_seed(seed)
    for e in range(num_epochs):

        #### Shuffle epoch
        shuffle_idx = torch.randperm(y.size(0), dtype=torch.long)
        minibatches = torch.split(shuffle_idx, minibatch_size)

        for minibatch_idx in minibatches:

            #### Compute outputs ####
            yhat = model.forward(x[minibatch_idx])

            #### Compute gradients ####
            negative_grad_w, negative_grad_b = \
                model.backward(x[minibatch_idx], yhat, y[minibatch_idx])

            #### Update weights ####
            model.weights += learning_rate * negative_grad_w
            model.bias += learning_rate * negative_grad_b

            #### Logging ####
            minibatch_loss = loss(yhat, y[minibatch_idx])
            print('    Minibatch MSE: %.3f' % minibatch_loss)

        #### Logging ####
        yhat = model.forward(x)
        curr_loss = loss(yhat, y)
        print('Epoch: %03d' % (e+1), end="")
        print(' | MSE: %.5f' % curr_loss)
        cost.append(curr_loss.item())  # store a plain Python float for plotting

    return cost

Train Model
model = Adaline1(num_features=X_train.size(1))
cost = train(model,
             X_train, y_train.float(),
             num_epochs=20,
             learning_rate=0.1,
             seed=123,
             minibatch_size=10)

Evaluate ADALINE Model

Plot Loss (MSE)

plt.plot(range(len(cost)), cost)
plt.ylabel('Mean Squared Error')
plt.xlabel('Epoch')
plt.show()

Compare with analytical solution

print('Weights', model.weights)
print('Bias', model.bias)

Weights tensor([[-0.0763],
[ 0.4181]])
Bias tensor([0.4888])
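
For reference, the analytical_solution function below solves the ordinary least-squares normal equations on the bias-augmented design matrix $\mathbf{X}_b = [\mathbf{1} \;\; \mathbf{X}]$:

$$\begin{pmatrix} b \\ \mathbf{w} \end{pmatrix} = \bigl(\mathbf{X}_b^\top \mathbf{X}_b\bigr)^{-1} \mathbf{X}_b^\top \mathbf{y}$$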

def analytical_solution(x, y):
    # Closed-form least squares: prepend a column of ones for the bias
    Xb = torch.cat((torch.ones((x.size(0), 1)), x), dim=1)
    z = torch.inverse(torch.matmul(Xb.t(), Xb))
    params = torch.matmul(z, torch.matmul(Xb.t(), y))
    b, w = params[0].view(1), params[1:].view(x.size(1), 1)
    return w, b

w, b = analytical_solution(X_train, y_train.float())
print('Analytical weights', w)
print('Analytical bias', b)

Analytical weights tensor([[-0.0703],
        [ 0.4219]])
Analytical bias tensor([0.4857])

Evaluate Prediction Accuracy
ones = torch.ones(y_train.size())
zeros = torch.zeros(y_train.size())
train_pred = model.forward(X_train)
train_acc = torch.mean(
    (torch.where(train_pred > 0.5,
                 ones,
                 zeros).int() == y_train).float())

ones = torch.ones(y_test.size())
zeros = torch.zeros(y_test.size())
test_pred = model.forward(X_test)
test_acc = torch.mean(
    (torch.where(test_pred > 0.5,
                 ones,
                 zeros).int() == y_test).float())
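
Equivalently (a more compact formulation, not in the original), the ones/zeros tensors can be dropped, since the comparison itself already yields 0/1 values:

train_acc = ((model.forward(X_train) > 0.5).int() == y_train).float().mean()
test_acc = ((model.forward(X_test) > 0.5).int() == y_test).float().mean()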

print('Training Accuracy: %.2f' % (train_acc*100))
print('Test Accuracy: %.2f' % (test_acc*100))

Training Accuracy: 90.00
Test Accuracy: 96.67

Decision Boundary
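
Predictions are thresholded at 0.5, so the decision boundary is the line where the net input equals 0.5; this is why 0.5 is subtracted from the bias below:

$$w_1 x_1 + w_2 x_2 + b = 0.5 \quad\Longrightarrow\quad x_2 = \frac{0.5 - b - w_1 x_1}{w_2}$$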
##########################
### 2D Decision Boundary
##########################

w, b = model.weights, model.bias - 0.5  # shift bias so the line sits at the 0.5 threshold

x_min = -3
y_min = (-(w[0] * x_min) - b[0]) / w[1]

x_max = 3
y_max = (-(w[0] * x_max) - b[0]) / w[1]

fig, ax = plt.subplots(1, 2, sharex=True, figsize=(7, 3))

ax[0].plot([x_min, x_max], [y_min, y_max])
ax[1].plot([x_min, x_max], [y_min, y_max])

ax[0].scatter(X_train[y_train==0, 0], X_train[y_train==0, 1], label='class 0', marker='o')
ax[0].scatter(X_train[y_train==1, 0], X_train[y_train==1, 1], label='class 1', marker='s')
ax[1].scatter(X_test[y_test==0, 0], X_test[y_test==0, 1], label='class 0', marker='o')
ax[1].scatter(X_test[y_test==1, 0], X_test[y_test==1, 1], label='class 1', marker='s')

ax[1].legend(loc='upper left')
plt.show()
