Assignment 5 - SourceCode - Ipynb - Colab
Assignment 5 - SourceCode - Ipynb - Colab
ipynb - Colab
import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import seaborn as sns
from sklearn.metrics import ConfusionMatrixDisplay, classification_report
from sklearn.neighbors import KNeighborsClassifier
# Load the diabetes dataset and show its column names.
csv_path = 'C:/Users/Admin/Desktop/lp3/diabetes.csv'
df = pd.read_csv(csv_path)
df.columns

# Target is the 'Outcome' column; the features are every other column.
y = df['Outcome']
x = df.drop(columns=['Outcome'])

# Plot and tabulate how many rows fall into each Outcome class.
sns.countplot(x=y)
y.value_counts()
0 500
1 268
Name: Outcome, dtype: int64
# Hold-out split followed by min-max scaling.
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import MinMaxScaler

# Split BEFORE scaling so the test rows never influence the scaler's
# min/max (fitting on the full dataset leaks test information into training).
# random_state makes the split reproducible; stratify=y keeps the class
# ratio of the imbalanced Outcome column the same in both partitions.
x_train_raw, x_test_raw, y_train, y_test = train_test_split(
    x, y, test_size=0.25, random_state=42, stratify=y
)

# Learn the scaling parameters from the training rows only, then apply the
# same transformation to the test rows.
scaler = MinMaxScaler()
x_train = scaler.fit_transform(x_train_raw)
x_test = scaler.transform(x_test_raw)

# Whole dataset scaled with the training-set parameters, kept for
# inspection only; values can fall slightly outside [0, 1].
x_scaled = scaler.transform(x)
x_scaled
# Shape of the full feature matrix. The line following each expression is
# the output recorded in the notebook export.
x.shape
(768, 8)
# Shape of the training features produced by the split.
x_train.shape
(576, 8)
# Shape of the test features produced by the split.
x_test.shape
(192, 8)
# Baseline model: k-nearest-neighbours classifier with k=5, trained on the
# training partition. fit() returns the estimator itself, so the chained
# form binds the same fitted object to `knn`.
knn = KNeighborsClassifier(n_neighbors=5).fit(x_train, y_train)
knn
▾ KNeighborsClassifier
KNeighborsClassifier()
# Predict labels for the test features with the fitted classifier.
y_pred=knn.predict(x_test)
# Draw the confusion matrix of true vs. predicted test labels.
# (The line after the call is the notebook's recorded repr of the returned
# display object.)
ConfusionMatrixDisplay.from_predictions(y_test,y_pred)
<sklearn.metrics._plot.confusion_matrix.ConfusionMatrixDisplay at 0x27aeb73add0>
# Print scikit-learn's text classification report for the same predictions.
print(classification_report(y_test,y_pred))
# Misclassification rate on the test partition for every k from 1 to 19.
# Each iteration refits a fresh classifier; after the loop `knn` and
# `y_pred` hold the model and predictions for the last k tried.
error = []
for i in range(1, 20):
    knn = KNeighborsClassifier(n_neighbors=i)
    knn.fit(x_train, y_train)
    y_pred = knn.predict(x_test)
    # Mean of the element-wise mismatch mask = fraction of wrong predictions.
    error.append(np.mean(y_pred != y_test))
error
[0.296875,
0.2708333333333333,
0.23958333333333334,
0.24479166666666666,
0.25,
0.24479166666666666,
0.21875,
0.21875,
0.2708333333333333,
0.25,
0.2604166666666667,
0.22395833333333334,
0.2604166666666667,
0.23958333333333334,
0.25,
0.23958333333333334,
0.22916666666666666,
0.22916666666666666,
0.22395833333333334]
# Plot the test error rate against k on a 16x9 inch figure, with one x tick
# per candidate k and a background grid.
k_values = range(1, 20)
fig, ax = plt.subplots(figsize=(16, 9))
ax.set_xlabel('value of k')
ax.set_ylabel('error')
ax.grid()
ax.set_xticks(k_values)
ax.plot(k_values, error, marker='.')
[<matplotlib.lines.Line2D at 0x27af324cdd0>]
https://colab.research.google.com/drive/1nmAB7PbwkK0rh3LpASgDETFy67xlrTEg#printMode=true 3/4
10/15/24, 9:52 AM Assignment 5_SourceCode.ipynb - Colab
https://colab.research.google.com/drive/1nmAB7PbwkK0rh3LpASgDETFy67xlrTEg#printMode=true 4/4