
KNN/SVM

Harsh Kumar

Roll No. 12112011

Batch CS-A-01

import math
from collections import Counter
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

# Load the dataset and encode the target: malignant (M) = 1, benign (B) = 0
df = pd.read_csv('data.csv')

X = df.drop(columns=['id', 'diagnosis'])
y = df['diagnosis'].map({'M': 1, 'B': 0})

# 80/20 train/test split on the rows as they appear in the file (no shuffling)
split_index = int(0.8 * len(df))

X_train = X[:split_index].values
y_train = y[:split_index].values
X_test = X[split_index:].values
y_test = y[split_index:].values

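Both KNN and the linear SVM below compare raw feature values, so features measured on large scales can dominate the distance and the margin. A minimal optional sketch of standardizing with training-set statistics is shown here; the names mu, sigma, X_train_scaled and X_test_scaled are assumptions for illustration and are not part of the original pipeline.

# Optional (not in the original code): standardize features using
# statistics computed on the training split only, to avoid leakage.
mu = X_train.mean(axis=0)
sigma = X_train.std(axis=0) + 1e-8  # small constant avoids division by zero
X_train_scaled = (X_train - mu) / sigma
X_test_scaled = (X_test - mu) / sigma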
def euclidean_distance(point1, point2):
    return math.sqrt(sum((x - y) ** 2 for x, y in zip(point1, point2)))

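A quick sanity check on hypothetical toy points (not from the dataset): the 3-4-5 right triangle gives a distance of 5.

# Hypothetical check: distance between (0, 0) and (3, 4) is 5.0
print(euclidean_distance([0, 0], [3, 4]))  # 5.0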
def knn_predict(X_train, y_train, X_test, k=5):
    predictions = []
    for test_point in X_test:
        # Distance from the test point to every training point, paired with its label
        distances = [(euclidean_distance(test_point, train_point), label)
                     for train_point, label in zip(X_train, y_train)]
        # Keep the k closest neighbours and take a majority vote over their labels
        k_nearest_neighbors = sorted(distances, key=lambda x: x[0])[:k]
        k_nearest_labels = [label for _, label in k_nearest_neighbors]
        most_common = Counter(k_nearest_labels).most_common(1)[0][0]
        predictions.append(most_common)
    return predictions

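For illustration only (hypothetical toy arrays, not the breast-cancer data), the function returns the majority label among the k closest training points:

# Hypothetical toy example: two clusters around (0, 0) and (5, 5)
toy_X = [[0, 0], [0, 1], [1, 0], [5, 5], [5, 6], [6, 5]]
toy_y = [0, 0, 0, 1, 1, 1]
print(knn_predict(toy_X, toy_y, [[0.5, 0.5], [5.5, 5.5]], k=3))
# Expected: [0, 1]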
def accuracy(y_true, y_pred):
    correct = sum(1 for true, pred in zip(y_true, y_pred) if true == pred)
    return correct / len(y_true)

def precision_recall_f1(y_true, y_pred):
    tp = sum(1 for true, pred in zip(y_true, y_pred) if true == pred == 1)
    fp = sum(1 for true, pred in zip(y_true, y_pred) if true == 0 and pred == 1)
    fn = sum(1 for true, pred in zip(y_true, y_pred) if true == 1 and pred == 0)
    tn = sum(1 for true, pred in zip(y_true, y_pred) if true == 0 and pred == 0)

    precision = tp / (tp + fp) if (tp + fp) > 0 else 0
    recall = tp / (tp + fn) if (tp + fn) > 0 else 0
    f1 = 2 * precision * recall / (precision + recall) if (precision + recall) > 0 else 0

    return precision, recall, f1, tp, tn, fp, fn

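A small hand-checkable example with hypothetical labels: two true positives, one false positive and one false negative give precision, recall and F1 all equal to 2/3.

# Hypothetical check: tp=2, fp=1, fn=1, tn=0
p, r, f1, tp, tn, fp, fn = precision_recall_f1([1, 0, 1, 1], [1, 1, 0, 1])
print(p, r, f1)  # 0.6667, 0.6667, 0.6667 (approximately)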
def plot_confusion_matrix(tp, tn, fp, fn, title="Confusion Matrix"):
    cm = np.array([[tn, fp], [fn, tp]])
    sns.heatmap(cm, annot=True, fmt='d', cmap='Blues', cbar=False,
                xticklabels=["Pred: Benign", "Pred: Malignant"],
                yticklabels=["Actual: Benign", "Actual: Malignant"])
    plt.title(title)
    plt.show()

print("Running K-Nearest Neighbors (KNN)...")


y_pred_knn = knn_predict(X_train, y_train, X_test, k=5)
knn_acc = accuracy(y_test, y_pred_knn)
knn_prec, knn_recall, knn_f1, knn_tp, knn_tn, knn_fp, knn_fn =
precision_recall_f1(y_test, y_pred_knn)

print(f"KNN Accuracy: {knn_acc:.4f}")


print(f"KNN Precision: {knn_prec:.4f}")
print(f"KNN Recall: {knn_recall:.4f}")
print(f"KNN F1-Score: {knn_f1:.4f}")

plot_confusion_matrix(knn_tp, knn_tn, knn_fp, knn_fn, title="KNN


Confusion Matrix")

class SVM:
    def __init__(self, learning_rate=0.001, lambda_param=0.01, n_iters=1000):
        self.lr = learning_rate
        self.lambda_param = lambda_param
        self.n_iters = n_iters
        self.w = None
        self.b = None

    def fit(self, X, y):
        # Relabel targets from (0, 1) to (-1, 1) as required by the hinge loss
        y_ = np.where(y <= 0, -1, 1)
        n_samples, n_features = X.shape
        self.w = np.zeros(n_features)
        self.b = 0

        # Per-sample (stochastic) subgradient descent
        for _ in range(self.n_iters):
            for idx, x_i in enumerate(X):
                condition = y_[idx] * (np.dot(x_i, self.w) - self.b) >= 1
                if condition:
                    # Margin satisfied: only the regularization term contributes
                    self.w -= self.lr * (2 * self.lambda_param * self.w)
                else:
                    # Margin violated: include the hinge-loss gradient as well
                    self.w -= self.lr * (2 * self.lambda_param * self.w - np.dot(x_i, y_[idx]))
                    self.b -= self.lr * y_[idx]

    def predict(self, X):
        linear_output = np.dot(X, self.w) - self.b
        return np.sign(linear_output)

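The fit loop is a per-sample subgradient descent on the soft-margin objective lambda * ||w||^2 + (1/n) * sum_i max(0, 1 - y_i * (w . x_i - b)). When a sample satisfies the margin, y_i * (w . x_i - b) >= 1, the hinge term is zero and only the regularization term shrinks w; otherwise the update also pushes w toward y_i * x_i and nudges b, moving the decision boundary to reduce the violation.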
print("Running Support Vector Machine (SVM)...")


svm = SVM()
svm.fit(X_train, y_train)
y_pred_svm = svm.predict(X_test)
y_pred_svm_binary = np.where(y_pred_svm <= 0, 0, 1) # Convert to (0,
1)

svm_acc = accuracy(y_test, y_pred_svm_binary)


svm_prec, svm_recall, svm_f1, svm_tp, svm_tn, svm_fp, svm_fn =
precision_recall_f1(y_test, y_pred_svm_binary)

print(f"SVM Accuracy: {svm_acc:.4f}")


print(f"SVM Precision: {svm_prec:.4f}")
print(f"SVM Recall: {svm_recall:.4f}")
print(f"SVM F1-Score: {svm_f1:.4f}")

plot_confusion_matrix(svm_tp, svm_tn, svm_fp, svm_fn, title="SVM


Confusion Matrix")

print("\n--- Final Model Comparison ---")


print(f"KNN Accuracy: {knn_acc:.4f}, Precision: {knn_prec:.4f},
Recall: {knn_recall:.4f}, F1-Score: {knn_f1:.4f}")
print(f"SVM Accuracy: {svm_acc:.4f}, Precision: {svm_prec:.4f},
Recall: {svm_recall:.4f}, F1-Score: {svm_f1:.4f}")

Running K-Nearest Neighbors (KNN)...
KNN Accuracy: 0.2281
KNN Precision: 0.2281
KNN Recall: 1.0000
KNN F1-Score: 0.3714
Running Support Vector Machine (SVM)...
SVM Accuracy: 0.2281
SVM Precision: 0.2281
SVM Recall: 1.0000
SVM F1-Score: 0.3714

--- Final Model Comparison ---
KNN Accuracy: 0.2281, Precision: 0.2281, Recall: 1.0000, F1-Score: 0.3714
SVM Accuracy: 0.2281, Precision: 0.2281, Recall: 1.0000, F1-Score: 0.3714

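A recall of 1.0000 together with precision and accuracy both equal to 0.2281 is only possible when every test sample is predicted as malignant, so 0.2281 is simply the malignant fraction of the unshuffled last 20% of rows. One plausible remedy, sketched here as an assumption rather than part of the original submission, is to shuffle the rows before the 80/20 split (and optionally standardize the features as noted earlier); df_shuffled and random_state=42 are illustrative choices.

# Hypothetical fix (not in the original run): shuffle before splitting
df_shuffled = df.sample(frac=1, random_state=42).reset_index(drop=True)
X = df_shuffled.drop(columns=['id', 'diagnosis'])
y = df_shuffled['diagnosis'].map({'M': 1, 'B': 0})
split_index = int(0.8 * len(df_shuffled))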
import numpy as np

class SVM:
    def __init__(self, learning_rate=0.001, lambda_param=0.01, n_iters=1000):
        self.lr = learning_rate
        self.lambda_param = lambda_param
        self.n_iters = n_iters
        self.w = None
        self.b = None

    def fit(self, X, y):
        # Convert y from (0, 1) to (-1, 1)
        y_ = np.where(y <= 0, -1, 1)

        n_samples, n_features = X.shape
        self.w = np.zeros(n_features)
        self.b = 0

        # Gradient Descent
        for _ in range(self.n_iters):
            for idx, x_i in enumerate(X):
                condition = y_[idx] * (np.dot(x_i, self.w) - self.b) >= 1
                if condition:
                    self.w -= self.lr * (2 * self.lambda_param * self.w)
                else:
                    self.w -= self.lr * (2 * self.lambda_param * self.w - np.dot(x_i, y_[idx]))
                    self.b -= self.lr * y_[idx]

    def predict(self, X):
        linear_output = np.dot(X, self.w) - self.b
        return np.sign(linear_output)

X_train = X[:split_index].values
y_train = y[:split_index].values
X_test = X[split_index:].values
y_test = y[split_index:].values

svm = SVM()
svm.fit(X_train, y_train)

y_pred_svm = svm.predict(X_test)

y_pred_svm_binary = np.where(y_pred_svm <= 0, 0, 1)  # Convert back from (-1, 1) to (0, 1)
print(f"SVM Accuracy: {accuracy(y_test, y_pred_svm_binary)}")

SVM Accuracy: 0.22807017543859648
