
push_table-Copy2

In [30]: # importing the estimators, the dataset loader, the metrics and the supporting libraries


from sklearn.ensemble import BaggingClassifier
from sklearn.ensemble import RandomForestClassifier
from sklearn.ensemble import AdaBoostClassifier
from sklearn.ensemble import GradientBoostingClassifier

from sklearn.tree import DecisionTreeClassifier


from sklearn.linear_model import LogisticRegression
from sklearn.neighbors import KNeighborsClassifier

from sklearn.datasets import load_breast_cancer

from sklearn.metrics import accuracy_score


from sklearn.model_selection import train_test_split
from sklearn.metrics import auc

import matplotlib.pyplot as plt


import numpy as np
import pandas as pd
import warnings
warnings.filterwarnings('ignore', category=DeprecationWarning)

In [31]: # loading the breast_cancer dataset and splitting it into features and target
data = load_breast_cancer()
data_to_process = pd.DataFrame(data.data, columns=data.feature_names)
target_value = pd.Series(data.target)

In [32]: # splitting the dataset into a train set and a test set
x_train, x_test, y_train, y_test = train_test_split(data_to_process, target_value)

In [33]: x_train.head()

Out[33]:
      mean radius  mean texture  mean perimeter  mean area  mean smoothness  mean compactness  mean concavity  mean concave points
276         11.33         14.16           71.79      396.6          0.09379           0.03872        0.001487             0.003333
56          19.21         18.57          125.50     1152.0          0.10530           0.12670        0.132300             0.089940
16          14.68         20.13           94.74      684.5          0.09867           0.07200        0.073950             0.052590
352         25.73         17.46          174.20     2010.0          0.11490           0.23630        0.336800             0.191300
250         20.94         23.56          138.90     1364.0          0.10070           0.16060        0.271200             0.131000

5 rows × 30 columns (only the first eight of the 30 feature columns are shown)

In [34]: # classification with BaggingClassifier, base estimator is KNeighborsClassifier


bclf = BaggingClassifier(base_estimator=KNeighborsClassifier(), n_estimators=10,
                         max_samples=0.5, max_features=1.0, random_state=12)
bclf.fit(x_train, y_train)


y_pred = bclf.predict(x_test)
#bscore = accuracy_score(y_pred, y_test)

In [35]: # RandomForestClassifier


forest = RandomForestClassifier(n_estimators=10, max_depth=4, random_state=5)
forest.fit(x_train, y_train)
y_pred = forest.predict(x_test)
#fscore = accuracy_score(y_pred, y_test)

In [36]: # AdaBoostClassifier, base estimator is LogisticRegression


adaB = AdaBoostClassifier(base_estimator=LogisticRegression(solver='newton-cg'))
adaB.fit(x_train, y_train)
y_pred = adaB.predict(x_test)
#abscore = accuracy_score(y_pred, y_test)

In [37]: #GradientBoostingClassifier
gbclf = GradientBoostingClassifier(n_estimators=100, random_state=12)
gbclf.fit(x_train, y_train)
y_pred = gbclf.predict(x_test)
#gbscore = accuracy_score(y_pred, y_test)

In [38]: # DecisionTreeClassifier
dtclf = DecisionTreeClassifier()
dtclf.fit(x_train, y_train)
y_pred = dtclf.predict(x_test)
#dtclfscore = accuracy_score(y_pred, y_test)

In [39]: #LogisticRegression
lr = LogisticRegression(solver='newton-cg')
lr.fit(x_train, y_train)
y_pred = lr.predict(x_test)
#lrscore = accuracy_score(y_test, y_pred)

In [40]: # KNeighborsClassifier
knn = KNeighborsClassifier(n_neighbors=20)
knn.fit(x_train, y_train)
y_pred = knn.predict(x_test)
#knn_score = accuracy_score(y_pred, y_test)

In [41]: ############################################################################
# calculating the coordinates of the ROC curve

In [42]: # function that returns the name of a given classifier


def return_class_name(given_class):
    given_class_to_string = str(given_class.__class__).split('.')[-1].rstrip("'>")
    return given_class_to_string

In [51]: def TruePosRate(y_true, y_pred):
    # align the predictions with the index of y_true so that label-based lookups work
    y_pred_test = pd.Series(y_pred, index=y_true.index)
    TP = FP = FN = TN = 0
    for i in y_true.index:
        if y_true[i] == y_pred_test[i] == 1:
            TP += 1
        if y_pred_test[i] == 1 and y_true[i] != y_pred_test[i]:
            FP += 1
        if y_pred_test[i] == 0 and y_pred_test[i] != y_true[i]:
            FN += 1
        if y_true[i] == y_pred_test[i] == 0:
            TN += 1

    try:
        FPR = FP / (FP + TN)
    except ZeroDivisionError:
        FPR = 1

    try:
        recall = TP / (TP + FN)
    except ZeroDivisionError:
        recall = 1

    return FPR, recall


TruePosRate(y_test, y_pred)
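As a quick sanity check (an addition, not part of the original notebook), the FPR and recall returned by TruePosRate can be compared with the counts from sklearn's confusion_matrix; this sketch assumes y_pred still holds the KNN predictions from cell In [40].

In [ ]: # added cross-check: confusion_matrix returns TN, FP, FN, TP for binary labels
from sklearn.metrics import confusion_matrix

tn, fp, fn, tp = confusion_matrix(y_test, y_pred).ravel()
print('FPR =', fp / (fp + tn), ' recall =', tp / (tp + fn))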

In [44]: # varying the probability threshold to trace out the ROC curve


def FPR_recall_scores_list(estimator):
    y_test_probs = estimator.predict_proba(x_test)[:, 1]
    FPR_scores = list()
    recall1_scores = list()
    probability_thresholds = np.linspace(0, 1, num=100)
    for p in probability_thresholds:
        y_test_pred = list()
        for prob in y_test_probs:
            if prob > p:
                y_test_pred.append(1)
            else:
                y_test_pred.append(0)
        FPR, recall = TruePosRate(y_test, y_test_pred)

        FPR_scores.append(FPR)
        recall1_scores.append(recall)
    return FPR_scores, recall1_scores

FPR_score_list, recall_score_list = FPR_recall_scores_list(knn)
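The same coordinates can also be obtained directly from sklearn's roc_curve, which sweeps the thresholds implied by the predicted probabilities; a minimal cross-check sketch (an addition, assuming the fitted knn from cell In [40]).

In [ ]: # added cross-check: roc_curve returns FPR and TPR for every useful threshold
from sklearn.metrics import roc_curve

fpr_sk, tpr_sk, thresholds = roc_curve(y_test, knn.predict_proba(x_test)[:, 1])
print(len(thresholds), 'thresholds evaluated by roc_curve')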

In [ ]:

In [46]: fig, ax = plt.subplots(figsize=(7,7))


ax.plot(FPR_score_list, recall_score_list, label='knn')
ax.plot([0, 1], [0, 1], ls='--', label='Baseline')
ax.set_xlabel('False Positive Rate')
ax.set_ylabel('True Positive Rate (Recall)')
ax.legend(loc='center left')

Out[46]: <matplotlib.legend.Legend at 0x7ff5b1748850>


In [ ]:

In [47]: listClassifier = [bclf, forest, adaB, gbclf, dtclf, lr, knn]

def classifier_and_score(listClassifier):
    data = list()
    for classifier in listClassifier:
        classifier.fit(x_train, y_train)
        y_pred = classifier.predict(x_test)
        score = round(accuracy_score(y_pred, y_test) * 100, 2)
        name = return_class_name(classifier)
        FPR_scores, recall_scores = FPR_recall_scores_list(classifier)
        auc_score = auc(FPR_scores, recall_scores)
        data.append([name, score, auc_score])
    return data

data = classifier_and_score(listClassifier)
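For comparison (an added sketch, not the author's cell), sklearn's roc_auc_score computes the same area directly from the predicted probabilities, which gives a quick way to validate the trapezoidal AUC above.

In [ ]: # added cross-check: ROC AUC straight from the predicted probabilities
from sklearn.metrics import roc_auc_score

for clf in listClassifier:
    print(return_class_name(clf),
          round(roc_auc_score(y_test, clf.predict_proba(x_test)[:, 1]), 4))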

In [ ]:

In [48]: from tabulate import tabulate

datat = data
col_name = ['algorithm_name', 'accuracy(%)', 'AUC']
print(tabulate(datat, headers=col_name))

In [ ]: # computing the ROC curve for all the algorithms

In [ ]:
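The comment above marks a cell that was never written; below is a minimal sketch of what it could contain, reusing FPR_recall_scores_list and return_class_name from earlier cells (an added illustration of the stated intent, not the author's code).

In [ ]: # added sketch: overlay the ROC curve of every fitted classifier
fig, ax = plt.subplots(figsize=(7, 7))
for clf in listClassifier:
    fpr_list, tpr_list = FPR_recall_scores_list(clf)
    ax.plot(fpr_list, tpr_list, label=return_class_name(clf))
ax.plot([0, 1], [0, 1], ls='--', label='Baseline')
ax.set_xlabel('False Positive Rate')
ax.set_ylabel('True Positive Rate (Recall)')
ax.legend(loc='lower right')
plt.show()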

