Sample code
Sample code
import time
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
#import seaborn as sns
from keras.utils.vis_utils import plot_model
import tkinter as tk
from tkinter.filedialog import askopenfilename
# Module-level placeholders; gettraindata() rebinds all three once a CSV
# file has been chosen.  np.empty leaves the array contents uninitialised.
x = np.empty((569, 30))
y = np.empty((569, 1))
dataset = pd.DataFrame().fillna(0)
def gettraindata():
    """Ask the user for a CSV file and load it into the module globals.

    Opens a file-selection dialog, shows the chosen path through the
    ``v`` string variable, reads the file into ``dataset`` and then
    rebinds ``x`` to the values of columns 2 onward and ``y`` to the
    values of column 1.

    If the dialog is dismissed without a selection, nothing is modified.
    """
    global dataset, x, y

    csv_file_path = askopenfilename()
    if not csv_file_path:
        # A cancelled dialog yields an empty value; passing that to
        # read_csv would raise, so keep whatever data is already loaded.
        return

    print(csv_file_path)
    v.set(csv_file_path)

    dataset = pd.read_csv(csv_file_path)
    x = dataset.iloc[:, 2:].values
    y = dataset.iloc[:, 1].values
def ccdata():
    """Label-encode the global target ``y`` and display the result.

    Rebinds ``y`` to the integer codes produced by scikit-learn's
    ``LabelEncoder`` and inserts them into a new scrolled text widget
    placed at grid column 3, row 3 of ``root``.
    """
    global y
    from sklearn.preprocessing import LabelEncoder
    from tkinter import scrolledtext

    labelencoder_X_1 = LabelEncoder()
    y = labelencoder_X_1.fit_transform(y)

    txt2 = scrolledtext.ScrolledText(root, width=10, height=10, wrap=tk.WORD)
    txt2.grid(column=3, row=3)
    txt2.insert(tk.INSERT, y)
# Empty placeholders for the train/test partitions; tts() rebinds them.
x_train, x_test, y_train, y_test = [], [], [], []
def tts():
    """Split the global ``x``/``y`` into training and test partitions.

    Holds out 10% of the samples for testing with a fixed random seed of
    0 and stores the result in the module-level ``x_train``, ``x_test``,
    ``y_train`` and ``y_test``.
    """
    # x and y are only read here, so only the outputs need ``global``.
    global x_train, x_test, y_train, y_test
    from sklearn.model_selection import train_test_split

    x_train, x_test, y_train, y_test = train_test_split(
        x, y, test_size=0.1, random_state=0
    )
def fs():
    """Standardise the feature partitions and display them in the GUI.

    Fits a ``StandardScaler`` on the global ``x_train``, applies the same
    fitted scaler to ``x_test``, rebinds both globals to the scaled
    arrays, and shows each one in its own scrolled text widget on grid
    row 5 of ``root`` (training data in column 3, test data in column 4).
    """
    global x_train, x_test
    from sklearn.preprocessing import StandardScaler
    from tkinter import scrolledtext

    sc = StandardScaler()
    # The scaler is fitted on the training split only and then reused
    # unchanged for the test split.
    x_train = sc.fit_transform(x_train)
    x_test = sc.transform(x_test)

    for column, values in ((3, x_train), (4, x_test)):
        box = scrolledtext.ScrolledText(root, width=10, height=10, wrap=tk.WORD)
        box.grid(column=column, row=5)
        box.insert(tk.INSERT, values)
def bm():
    """Seed NumPy's random generator and import the Keras building blocks.

    NOTE(review): as it stands this body only seeds the RNG, imports
    Keras and declares the data globals; no model is constructed,
    compiled or trained here.  Presumably the remainder of the original
    implementation is missing -- confirm against the intended design.
    """
    global x, y, x_train, x_test, y_train, y_test
    from numpy.random import seed

    # Fixed seed (1) for NumPy's global random generator.
    seed(1)

    import keras
    from keras.models import Sequential
    from keras.layers import Dense, Dropout
# Build the main window and wire each pipeline step to a button.
root = tk.Tk()
start_time = time.time()
#tk.Label(root, text='File Path').grid(row=0, column=0)

# Holds the path of the selected CSV file; displayed by the entry below.
v = tk.StringVar()

# grid() returns None, so the widget is created first and laid out in a
# separate call; otherwise ``entry`` would be bound to None.
entry = tk.Entry(root, textvariable=v)
entry.grid(row=0, column=0)

tk.Button(root, text='Select Data File', command=gettraindata).grid(row=0, column=2)
tk.Button(root, text='Convert Categorical Data', command=ccdata).grid(row=3, column=2)
tk.Button(root, text='Train Test Split', command=tts).grid(row=4, column=2)
tk.Button(root, text='Feature Scaling', command=fs).grid(row=5, column=2)
tk.Button(root, text='Build Model', command=bm).grid(row=6, column=2)

# Blocks until the window is closed.
root.mainloop()
Machine Learning Models
import time
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
from keras.utils.vis_utils import plot_model
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import LabelEncoder

# Load the CSV: features are taken from columns 2 onward, the target
# from column 1.
data = pd.read_csv('data.csv')
# del data['Unnamed: 32']
X = data.iloc[:, 2:].values

# Encode the target labels as integers.
labelencoder_X_1 = LabelEncoder()
y = labelencoder_X_1.fit_transform(data.iloc[:, 1].values)

# Hold out 20% of the samples for testing, with a fixed seed.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=0
)
#Feature Scaling
# from sklearn.preprocessing import StandardScaler
# sc = StandardScaler()
# X_train = sc.fit_transform(X_train)
# X_test = sc.transform(X_test)
# --- Logistic regression ---
print("==================LOGISTIC REGRESSION===============")
from sklearn import metrics
from sklearn.linear_model import LogisticRegression
from sklearn.metrics import accuracy_score, classification_report

# Fit on the training split, then predict the held-out split.
model = LogisticRegression()
model.fit(X_train, y_train)
y_pred = model.predict(X_test)

acc_sco = accuracy_score(y_test, y_pred)
print("ACCURACY", acc_sco)

cr = classification_report(y_test, y_pred)
print("Classification report", cr)
# --- Decision tree ---
print("==========DECISION TREE================")
from sklearn import tree
from sklearn.metrics import accuracy_score, classification_report
from sklearn.tree import DecisionTreeClassifier

# Fit on the training split, then predict the held-out split.
model1 = DecisionTreeClassifier()
model1.fit(X_train, y_train)
y_pred1 = model1.predict(X_test)

acc_sco1 = accuracy_score(y_test, y_pred1)
print("ACCURACY", acc_sco1)

cr = classification_report(y_test, y_pred1)
print("Classification report", cr)
# --- Random forest ---
print("====================Random Forest================")
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import accuracy_score, classification_report

# Fit on the training split, then predict the held-out split.
model2 = RandomForestClassifier()
model2.fit(X_train, y_train)
y_pred2 = model2.predict(X_test)

acc_sco2 = accuracy_score(y_test, y_pred2)
print("ACCURACY", acc_sco2)

cr = classification_report(y_test, y_pred2)
print("Classification report", cr)