# Assignment 2
import numpy as np
import pandas as pd
# --- Iris: load the data and encode the species labels ---
# read_csv already returns a DataFrame, so no extra pd.DataFrame(...) wrap
# is needed.
dataset = pd.read_csv('IRIS.csv')

# Encode the species names *before* slicing out X and Y: selecting columns
# with a list of positions yields a separate object, so a replace done
# afterwards on `dataset` would not be reflected in Y.
# (The 'Iris-versicolor' literal was previously broken across two lines,
# which is a syntax error.)
dataset.replace(
    to_replace=['Iris-setosa', 'Iris-virginica', 'Iris-versicolor'],
    value=['1', '2', '3'],
    inplace=True,
)

# Columns 0-3 are taken as the features, column 4 as the target.
X = dataset.iloc[:, [0, 1, 2, 3]]
Y = dataset.iloc[:, [4]]

# Preview of the first rows (only rendered in an interactive session).
dataset.head()
# --- Iris: decision tree classifier ---
# These names are used below but are otherwise only imported in later
# sections of the file, so bring them into scope here.
import matplotlib.pyplot as plt
from sklearn import tree
from sklearn.metrics import accuracy_score
from sklearn.model_selection import train_test_split
from sklearn.tree import DecisionTreeClassifier

df = pd.read_csv('./IRIS.csv')

# First four columns are the features, 'species' is the label (same
# selection as the random-forest section of this file).
X = df.iloc[:, [0, 1, 2, 3]].values
y = df['species']

# Hold out part of the data for evaluation.
# NOTE(review): the original split parameters are not visible in this file;
# the default test size with a fixed seed is used here - adjust as needed.
X_train, X_test, y_train, y_test = train_test_split(X, y, random_state=5)

clf = DecisionTreeClassifier()
clf.fit(X_train, y_train)
y_pred = clf.predict(X_test)

# Draw the fitted tree.
plt.figure(figsize=(10, 10))
tree.plot_tree(clf)

# Accuracy of the model (printed like in the other sections).
ac = accuracy_score(y_test, y_pred)
print("Accuracy: ", ac*100)
# --- Iris: random forest classifier ---
# Imported locally because the file only imports these names in later
# sections (confusion_matrix is not imported anywhere else).
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import accuracy_score, confusion_matrix
from sklearn.model_selection import train_test_split

df = pd.read_csv('./IRIS.csv')

# First four columns are the features, 'species' is the label.
X = df.iloc[:, [0, 1, 2, 3]].values
y = df['species']

# Split the freshly loaded X / y; previously they were never used.
# NOTE(review): the original split parameters are not visible in this file;
# the default test size with a fixed seed is used here - adjust as needed.
X_train, X_test, y_train, y_test = train_test_split(X, y, random_state=5)

# Train and evaluate the forest itself. The earlier code built
# `rand_forest` but then fitted and predicted with `clf` (the decision
# tree), so the forest was never used.
rand_forest = RandomForestClassifier(n_estimators=10)
rand_forest.fit(X_train, y_train)
y_pred = rand_forest.predict(X_test)

ac = accuracy_score(y_test, y_pred)
print("Accuracy: ", ac*100)
print(confusion_matrix(y_test, y_pred))
# Titanic Naive Bayes
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.naive_bayes import GaussianNB
from sklearn.metrics import accuracy_score
# confusion_matrix is called below but was never imported.
from sklearn.metrics import confusion_matrix

df = pd.read_csv('./titanic.csv')

# Keep only the rows that have an 'Age' value.
dataset = df[df['Age'].notna()]

# Shuffle reproducibly and renumber the rows; drop=True discards the old
# index directly instead of adding an 'index' column and dropping it again.
dataset = dataset.sample(frac=1, random_state=5).reset_index(drop=True)

# NOTE(review): the step that turns `dataset` into X_train / X_test /
# y_train / y_test (feature selection + train_test_split) is not visible in
# this file. Restore it here before fitting - the feature and target column
# names cannot be determined from the visible code.
clf = GaussianNB()
clf.fit(X_train, y_train)
y_pred = clf.predict(X_test)

ac = accuracy_score(y_test, y_pred)
print('\nAccuracy = ', ac*100,'%')
print(confusion_matrix(y_test, y_pred))
# Titanic ID3
import pandas as pd
import matplotlib.pyplot as plt
from sklearn.model_selection import train_test_split
from sklearn.tree import DecisionTreeClassifier
from sklearn import tree
from sklearn.metrics import accuracy_score
# confusion_matrix is called below but was never imported.
from sklearn.metrics import confusion_matrix

# ID3 chooses splits by information gain, so use the entropy criterion
# rather than the default Gini impurity.
# NOTE(review): X_train / X_test / y_train / y_test are not defined in this
# section; they are presumably the Titanic split from an earlier step -
# confirm.
cls = DecisionTreeClassifier(criterion='entropy')
cls.fit(X_train, y_train)
y_pred = cls.predict(X_test)

# Draw the fitted tree.
plt.figure(figsize=(15, 15))
tree.plot_tree(cls)

ac = accuracy_score(y_test, y_pred)
print("\nAccuracy: ", ac*100)
print(confusion_matrix(y_test, y_pred))
# Titanic Random Forest
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import accuracy_score
# confusion_matrix is called below but was never imported.
from sklearn.metrics import confusion_matrix

df = pd.read_csv('./titanic.csv')

# Actually build a random forest. Previously no classifier was created in
# this section, so `clf` still referred to whatever model an earlier
# section had assigned. n_estimators=10 matches the Iris random forest.
# NOTE(review): X_train / X_test / y_train / y_test are not derived from
# `df` in the visible code; they are presumably the Titanic split from an
# earlier step - confirm.
clf = RandomForestClassifier(n_estimators=10)
clf.fit(X_train, y_train)
y_pred = clf.predict(X_test)

ac = accuracy_score(y_test, y_pred)
print("Accuracy: ", ac*100)
print(confusion_matrix(y_test, y_pred))