
Softmax Regression

Implementation of classic softmax regression (multinomial logistic regression).
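Given an input vector $\mathbf{x}$, the model computes one linear score (logit) per class and converts the scores into class probabilities with the softmax function; training minimizes the average cross-entropy between these probabilities and the one-hot encoded labels. For reference, in the notation used by the code below (weight matrix $\mathbf{W}$, bias $\mathbf{b}$, $h$ classes, $n$ training examples):

$$p(y=k \mid \mathbf{x}) = \frac{\exp(\mathbf{w}_k^\top \mathbf{x} + b_k)}{\sum_{j=1}^{h} \exp(\mathbf{w}_j^\top \mathbf{x} + b_j)}, \qquad \mathcal{L}(\mathbf{W}, \mathbf{b}) = -\frac{1}{n} \sum_{i=1}^{n} \sum_{k=1}^{h} y_{i,k} \, \log p(y=k \mid \mathbf{x}_i)$$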

Imports
%matplotlib inline
import matplotlib.pyplot as plt
import pandas as pd
import torch
import torch.nn.functional as F

Preparing a dataset
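The code below expects the classic UCI Iris file at ./data/iris.data, a header-less CSV with four measurements followed by the species name on each row; the rows look roughly like this (values shown only to illustrate the format):

5.1,3.5,1.4,0.2,Iris-setosa
7.0,3.2,4.7,1.4,Iris-versicolor
6.3,3.3,6.0,2.5,Iris-virginica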
##########################
### DATASET
##########################

df = pd.read_csv('./data/iris.data', index_col=None, header=None)


df.columns = ['x1', 'x2', 'x3', 'x4', 'y']

d = {'Iris-versicolor': 1,
'Iris-virginica': 2,
'Iris-setosa': 0,
}

df['y'] = df['y'].map(d)

# Assign features and target

X = torch.tensor(df[['x2', 'x4']].values, dtype=torch.float)


y = torch.tensor(df['y'].values, dtype=torch.int)

# Shuffling & train/test split

torch.manual_seed(123)
shuffle_idx = torch.randperm(y.size(0), dtype=torch.long)

X, y = X[shuffle_idx], y[shuffle_idx]

percent80 = int(shuffle_idx.size(0)*0.8)

X_train, X_test = X[shuffle_idx[:percent80]], X[shuffle_idx[percent80:]]


y_train, y_test = y[shuffle_idx[:percent80]], y[shuffle_idx[percent80:]]

# Normalize (mean zero, unit variance)

mu, sigma = X_train.mean(dim=0), X_train.std(dim=0)


X_train = (X_train - mu) / sigma
X_test = (X_test - mu) / sigma

fig, ax = plt.subplots(1, 2, figsize=(7, 2.5))


ax[0].scatter(X_train[y_train == 2, 0], X_train[y_train == 2, 1])
ax[0].scatter(X_train[y_train == 1, 0], X_train[y_train == 1, 1], marker='v')
ax[0].scatter(X_train[y_train == 0, 0], X_train[y_train == 0, 1], marker='s')
ax[1].scatter(X_test[y_test == 2, 0], X_test[y_test == 2, 1])
ax[1].scatter(X_test[y_test == 1, 0], X_test[y_test == 1, 1], marker='v')
ax[1].scatter(X_test[y_test == 0, 0], X_test[y_test == 0, 1], marker='s')
plt.show()

Low-level implementation with manual gradients


DEVICE = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")


def to_onehot(y, num_classes):
    # Convert integer class labels into a one-hot matrix of shape (n, num_classes)
    y_onehot = torch.FloatTensor(y.size(0), num_classes)
    y_onehot.zero_()
    y_cpu = y.to(torch.device('cpu'))
    y_onehot.scatter_(1, y_cpu.view(-1, 1).long(), 1)
    return y_onehot.to(DEVICE)


def softmax(z):
    # Row-wise softmax of the logits z (shape: n x num_classes)
    return (torch.exp(z.t()) / torch.sum(torch.exp(z), dim=1)).t()


def cross_entropy(softmax, y_target):
    # Per-example cross-entropy between predicted probabilities and one-hot targets
    return -torch.sum(torch.log(softmax) * (y_target), dim=1)
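As a side note, exponentiating large logits can overflow in float32. A common, numerically more stable variant (a minimal sketch, not part of the original notebook) subtracts the row-wise maximum before exponentiating, which leaves the softmax output unchanged:

def softmax_stable(z):
    # subtracting the row-wise max does not change the result,
    # but keeps torch.exp from overflowing for large logits
    z_shifted = z - z.max(dim=1, keepdim=True).values
    e = torch.exp(z_shifted)
    return e / e.sum(dim=1, keepdim=True)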

class SoftmaxRegression1():
    def __init__(self, num_features, num_classes):
        self.num_features = num_features
        self.num_classes = num_classes
        self.weights = torch.zeros(num_classes, num_features,  # h x m
                                   dtype=torch.float32, device=DEVICE)
        self.bias = torch.zeros(num_classes, dtype=torch.float32, device=DEVICE)  # h

    def forward(self, x):
        logits = torch.mm(x, self.weights.t()) + self.bias  # net inputs
        probas = softmax(logits)  # activations
        return logits, probas

    def backward(self, x, y, probas):
        # Gradients of the cross-entropy loss w.r.t. weights and bias
        # (y is the one-hot target matrix, probas are the softmax outputs)
        grad_loss_wrt_w = -torch.mm(x.t(), y - probas).t()
        grad_loss_wrt_b = -torch.sum(y - probas, dim=0)
        return grad_loss_wrt_w, grad_loss_wrt_b

    def predict_labels(self, x):
        logits, probas = self.forward(x)
        labels = torch.argmax(probas, dim=1)
        return labels

    def evaluate(self, x, y):
        labels = self.predict_labels(x).float()
        accuracy = torch.sum(labels.view(-1) == y.float()).item() / y.size(0)
        return accuracy

    def train(self, x, y, num_epochs, learning_rate=0.01):
        epoch_cost = []
        for e in range(num_epochs):

            y_onehot = to_onehot(y, num_classes=self.num_classes)

            #### Compute outputs ####
            logits, probas = self.forward(x)

            #### Compute gradients ####
            grad_w, grad_b = self.backward(x, y_onehot, probas)

            #### Update weights ####
            self.weights -= learning_rate * grad_w / y.size(0)
            self.bias -= learning_rate * grad_b / y.size(0)

            #### Logging ####
            logits, probas = self.forward(x)
            cost = torch.mean(cross_entropy(probas, y_onehot))
            print('Epoch: %03d' % (e+1), end="")
            print(' | Train ACC: %.3f' % self.evaluate(x, y), end="")
            print(' | Cost: %.3f' % cost)
            epoch_cost.append(cost)
        return epoch_cost
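For reference (the derivation is not spelled out in the code), the update rule above is gradient descent on the mean cross-entropy: with the one-hot target matrix $\mathbf{Y}$ and predicted probabilities $\mathbf{P} = \mathrm{softmax}(\mathbf{X}\mathbf{W}^\top + \mathbf{b})$, the gradients returned by backward() are

$$\frac{\partial \mathcal{L}}{\partial \mathbf{W}} = -(\mathbf{Y} - \mathbf{P})^\top \mathbf{X}, \qquad \frac{\partial \mathcal{L}}{\partial \mathbf{b}} = -\sum_{i=1}^{n} (\mathbf{y}_i - \mathbf{p}_i),$$

each divided by the number of training examples $n$ in train() before the learning rate is applied.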

X_train = X_train.to(DEVICE)
y_train = y_train.to(DEVICE)

model1 = SoftmaxRegression1(num_features=2, num_classes=3)


epoch_cost = model1.train(X_train, y_train,
                          num_epochs=50,
                          learning_rate=0.1)

print('\nModel parameters:')
print(' Weights: %s' % model1.weights)
print(' Bias: %s' % model1.bias)

Evaluating the Model


plt.plot(epoch_cost)
plt.ylabel('Negative Log Likelihood Loss')
plt.xlabel('Epoch')
plt.show()

X_test = X_test.to(DEVICE)
y_test = y_test.to(DEVICE)

test_acc = model1.evaluate(X_test, y_test)


print('Test set accuracy: %.2f%%' % (test_acc*100))

Test set accuracy: 80.00%

from matplotlib.colors import ListedColormap
import numpy as np


def plot_decision_regions(X, y, classifier, resolution=0.02):

    # setup marker generator and color map
    markers = ('s', 'x', 'o', '^', 'v')
    colors = ('red', 'blue', 'lightgreen', 'gray', 'cyan')
    cmap = ListedColormap(colors[:len(np.unique(y))])

    # plot the decision surface
    x1_min, x1_max = X[:, 0].min() - 1, X[:, 0].max() + 1
    x2_min, x2_max = X[:, 1].min() - 1, X[:, 1].max() + 1
    xx1, xx2 = np.meshgrid(np.arange(x1_min, x1_max, resolution),
                           np.arange(x2_min, x2_max, resolution))
    tensor = torch.tensor(np.array([xx1.ravel(), xx2.ravel()]).T).float()
    logits, probas = classifier.forward(tensor)
    Z = np.argmax(probas.detach().numpy(), axis=1)

    Z = Z.reshape(xx1.shape)
    plt.contourf(xx1, xx2, Z, alpha=0.4, cmap=cmap)
    plt.xlim(xx1.min(), xx1.max())
    plt.ylim(xx2.min(), xx2.max())

    # plot class samples
    for idx, cl in enumerate(np.unique(y)):
        plt.scatter(x=X[y == cl, 0], y=X[y == cl, 1],
                    alpha=0.8, color=cmap(idx),
                    edgecolor='black',
                    marker=markers[idx],
                    label=cl)

plot_decision_regions(X_train, y_train, classifier=model1)


plt.xlabel('sepal width [standardized]')
plt.ylabel('petal width [standardized]')
plt.legend(loc='upper left')

plt.tight_layout()
plt.show()
High-level implementation using the nn.Module API

class SoftmaxRegression2(torch.nn.Module):

    def __init__(self, num_features, num_classes):
        super(SoftmaxRegression2, self).__init__()
        self.linear = torch.nn.Linear(num_features, num_classes)

        # initialize weights to zeros here,
        # since we used zero weights in the
        # manual approach
        self.linear.weight.detach().zero_()
        self.linear.bias.detach().zero_()
        # Note: the trailing underscore
        # means "in-place operation" in the context
        # of PyTorch

    def forward(self, x):
        logits = self.linear(x)
        probas = F.softmax(logits, dim=1)
        return logits, probas
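One detail worth noting: F.cross_entropy combines log-softmax and negative log-likelihood internally, so the training loop below passes it the raw logits; the explicit F.softmax in forward() is only needed to obtain probabilities for prediction and plotting. A minimal sketch (with made-up example tensors) illustrating the equivalence:

example_logits = torch.tensor([[2.0, 0.5, -1.0]])  # hypothetical logits for one sample
example_target = torch.tensor([0])                 # hypothetical true class index

loss_a = F.cross_entropy(example_logits, example_target)
loss_b = F.nll_loss(F.log_softmax(example_logits, dim=1), example_target)
# loss_a and loss_b hold the same value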

model2 = SoftmaxRegression2(num_features=2, num_classes=3).to(DEVICE)


optimizer = torch.optim.SGD(model2.parameters(), lr=0.1)

def comp_accuracy(true_labels, pred_labels):
    accuracy = torch.sum(true_labels.view(-1).float() ==
                         pred_labels.float()).item() / true_labels.size(0)
    return accuracy

X_train = X_train.to(DEVICE)
y_train = y_train.to(DEVICE)
X_test = X_test.to(DEVICE)
y_test = y_test.to(DEVICE)

num_epochs = 50
for epoch in range(num_epochs):

    #### Compute outputs ####
    logits, probas = model2(X_train)

    #### Compute gradients ####
    cost = F.cross_entropy(logits, y_train.long())
    optimizer.zero_grad()
    cost.backward()

    #### Update weights ####
    optimizer.step()

    #### Logging ####
    logits, probas = model2(X_train)
    acc = comp_accuracy(y_train, torch.argmax(probas, dim=1))
    print('Epoch: %03d' % (epoch + 1), end="")
    print(' | Train ACC: %.3f' % acc, end="")
    print(' | Cost: %.3f' % F.cross_entropy(logits, y_train.long()))

print('\nModel parameters:')
print(' Weights: %s' % model2.linear.weight)
print(' Bias: %s' % model2.linear.bias)
X_test = X_test.to(DEVICE)
y_test = y_test.to(DEVICE)

logits, probas = model2(X_test)
test_acc = comp_accuracy(y_test, torch.argmax(probas, dim=1))


print('Test set accuracy: %.2f%%' % (test_acc*100))

Test set accuracy: 80.00%

plot_decision_regions(X_train, y_train, classifier=model2)


plt.xlabel('sepal width [standardized]')
plt.ylabel('petal width [standardized]')
plt.legend(loc='upper left')

plt.tight_layout()
plt.show()

