0% found this document useful (0 votes)

76 views

Sample Code

This document contains the code for a fake news detection application. It uses natural language processing techniques like cleaning, tokenization, and TF-IDF to preprocess text data. It then trains an LSTM neural network model to classify news articles as genuine or fake. The code provides functions for uploading and preprocessing data, running the LSTM algorithm, viewing training accuracy and loss graphs, and testing the model on new data. A GUI is created using Tkinter to allow users to interact with the various functions of the application.

Uploaded by

Dudhipala Deepak Reddy

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as DOCX, PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

76 views

Sample Code

Uploaded by

Dudhipala Deepak Reddy

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as DOCX, PDF, TXT or read online on Scribd

You are on page 1/ 8

SAMPLE CODE

Main.py

from tkinter import messagebox

from tkinter import *
from tkinter import simpledialog
import tkinter
import matplotlib.pyplot as plt
import numpy as np
from tkinter import ttk
from tkinter import filedialog
import pandas as pd
from sklearn.model_selection import train_test_split
from string import punctuation
from nltk.corpus import stopwords
import nltk
from nltk.stem import WordNetLemmatizer
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.preprocessing import LabelEncoder
from keras.models import Sequential
from keras.layers.core import Dense,Activation,Dropout
from sklearn.preprocessing import OneHotEncoder
import keras.layers
from keras.models import model_from_json
import pickle
import os
from sklearn.preprocessing import normalize

from keras.models import Sequential

from keras.layers import Dense, Dropout, Flatten, LSTM

# --- Application window and shared module state ---------------------------
main = Tk()
# The title is one string; adjacent literals are concatenated by Python so the
# long caption can be wrapped in the source without breaking the literal.
main.title("DETECTION OF FAKE NEWS THROUGH "
           "IMPLEMENTATION OF DATA SCIENCE APPLICATION")
main.geometry("1300x1200")

# The button callbacks below share state through module-level names which they
# declare with ``global`` and assign when they run:
#   filename                     - dataset path chosen in uploadDataset()
#   X, Y                         - feature / label arrays built by preprocess()
#   tfidf_X_train, tfidf_X_test,
#   tfidf_y_train, tfidf_y_test  - train/test split built by preprocess()
#   tfidf_vectorizer             - TfidfVectorizer fitted by preprocess()
#   classifier                   - model set by runLSTM()
# A ``global`` statement at module scope has no effect, so none is written
# here; the names come into existence when the callbacks first assign them.

# English stop words as a set for O(1) membership tests in cleanPost().
stop_words = set(stopwords.words('english'))
lemmatizer = WordNetLemmatizer()

# Cleaned posts and their integer labels, filled by uploadDataset().
textdata = []
labels = []

def cleanPost(doc):
    """Return *doc* reduced to a space-separated string of lemmatised words.

    The text is split on whitespace and punctuation characters are removed
    from every token. A token is kept only if what remains is purely
    alphabetic, is not in the module-level ``stop_words`` set and is longer
    than one character. Surviving tokens are lemmatised with the module-level
    ``lemmatizer`` and joined with single spaces.
    """
    strip_punctuation = str.maketrans('', '', punctuation)
    kept = []
    for raw_token in doc.split():
        word = raw_token.translate(strip_punctuation)
        if not word.isalpha():
            continue
        if word in stop_words or len(word) <= 1:
            continue
        kept.append(lemmatizer.lemmatize(word))
    return ' '.join(kept)

def uploadDataset():
    """Ask for a CSV dataset, clean every row and list the result in the GUI.

    The chosen file is read with pandas; its ``text`` column supplies the
    posts and its ``target`` column the labels (each converted with ``int``).
    Every post is lower-cased, passed through ``cleanPost`` and appended to
    the module-level ``textdata`` list, with its label appended to ``labels``.
    Both lists are emptied first, so a new upload replaces the previous one.

    If the file dialog is dismissed nothing is loaded and the previously
    loaded data is left untouched.
    """
    global filename
    text.delete('1.0', END)
    chosen = filedialog.askopenfilename(initialdir="TwitterNewsData")
    if not chosen:
        # Dialog cancelled: there is no path to hand to read_csv().
        return
    filename = chosen
    textdata.clear()
    labels.clear()
    dataset = pd.read_csv(filename)
    dataset = dataset.fillna(' ')
    # DataFrame.get_value() is not available in current pandas; walking the two
    # columns in lockstep reads the same cells row by row.
    for msg, label in zip(dataset['text'], dataset['target']):
        msg = str(msg).strip().lower()
        labels.append(int(label))
        clean = cleanPost(msg)
        textdata.append(clean)
        text.insert(END, clean + " ==== " + str(label) + "\n")

def preprocess():
    """Turn the cleaned posts into TF-IDF features and a train/test split.

    Fits a ``TfidfVectorizer`` (unigrams and bigrams, at most 200 features)
    on the module-level ``textdata`` and stores it in ``tfidf_vectorizer``.
    The feature rows are L2-normalised, shuffled together with the encoded
    labels and reshaped to ``(samples, features, 1)`` before being stored in
    the globals ``X`` and ``Y`` (``Y`` has shape ``(samples, 1)``). An 80/20
    split of those arrays is stored in ``tfidf_X_train``, ``tfidf_X_test``,
    ``tfidf_y_train`` and ``tfidf_y_test``. A summary is written to the GUI
    text box and the array shapes are printed to the console.

    If no dataset has been uploaded yet a message is shown and nothing else
    happens.
    """
    global X, Y
    global tfidf_vectorizer
    global tfidf_X_train, tfidf_X_test, tfidf_y_train, tfidf_y_test
    text.delete('1.0', END)
    if not textdata:
        # fit_transform() cannot build a vocabulary from an empty corpus.
        text.insert(END, "No dataset loaded. Upload a dataset before preprocessing.\n")
        return

    # Use a distinct local name so the imported ``stopwords`` module is not
    # shadowed inside this function.
    english_stopwords = nltk.corpus.stopwords.words("english")
    tfidf_vectorizer = TfidfVectorizer(
        stop_words=english_stopwords,
        use_idf=True,
        ngram_range=(1, 2),
        smooth_idf=False,
        norm=None,
        decode_error='replace',
        max_features=200,
    )
    tfidf = tfidf_vectorizer.fit_transform(textdata).toarray()

    # Newer scikit-learn only offers get_feature_names_out(); fall back to the
    # older spelling when running against a release that predates it.
    if hasattr(tfidf_vectorizer, 'get_feature_names_out'):
        feature_names = tfidf_vectorizer.get_feature_names_out()
    else:
        feature_names = tfidf_vectorizer.get_feature_names()
    df = pd.DataFrame(tfidf, columns=feature_names)
    text.insert(END, str(df))
    print(df.shape)

    X = normalize(df.values)
    Y = LabelEncoder().fit_transform(np.asarray(labels))

    # Shuffle features and labels with the same permutation.
    indices = np.arange(X.shape[0])
    np.random.shuffle(indices)
    X = X[indices]
    Y = Y[indices]
    Y = Y.reshape(-1, 1)
    print(X.shape)

    # Add a trailing axis: the LSTM in runLSTM() takes X.shape[1:] as its
    # input shape, i.e. (features, 1).
    X = X.reshape((X.shape[0], X.shape[1], 1))
    print(Y)
    print(Y.shape)
    print(X.shape)

    tfidf_X_train, tfidf_X_test, tfidf_y_train, tfidf_y_test = train_test_split(
        X, Y, test_size=0.2)
    text.insert(END, "\n\nTotal News found in dataset : " + str(len(X)) + "\n")
    text.insert(END, "Total records used to train machine learning algorithms : "
                + str(len(tfidf_X_train)) + "\n")
    text.insert(END, "Total records used to test machine learning algorithms : "
                + str(len(tfidf_X_test)) + "\n")

def runLSTM():
    """Load the saved LSTM model if present, otherwise train and save one.

    When ``model/model.json`` exists, the architecture is rebuilt from it,
    weights are loaded from ``model/model_weights.h5`` and the training
    history is read from ``model/history.pckl``. If ``model/model.txt`` also
    exists, the object pickled in it replaces the loaded model as the global
    ``classifier`` (this mirrors the original behaviour; the file is not
    written anywhere in this script).

    Otherwise a two-layer LSTM network is built for inputs of shape
    ``X.shape[1:]``, trained for 10 epochs on the training split produced by
    ``preprocess`` and validated on the test split. The architecture, weights
    and history are then written to the ``model`` directory.

    In both cases the accuracy recorded for the last epoch is shown in the
    GUI text box and the layer summary is printed to the console.
    """
    global classifier
    text.delete('1.0', END)
    if os.path.exists('model/model.json'):
        with open('model/model.json', "r") as json_file:
            loaded_model_json = json_file.read()
        classifier = model_from_json(loaded_model_json)
        classifier.load_weights("model/model_weights.h5")
        # _make_predict_function() is a private Keras hook that is not present
        # on every Keras version, so only call it when the model offers it.
        if hasattr(classifier, '_make_predict_function'):
            classifier._make_predict_function()
        classifier.summary()
        with open('model/history.pckl', 'rb') as f:
            data = pickle.load(f)
        # Last recorded epoch, independent of how many epochs were trained.
        acc = data['accuracy'][-1] * 100
        text.insert(END, "LSTM Fake News Detection Accuracy : " + str(acc) + "\n\n")
        text.insert(END, 'LSTM Model Summary can be seen in black console for layer details\n')
        # The training branch below never writes model/model.txt, so only use
        # it when it is actually there instead of failing on a fresh model.
        # NOTE(security): pickle.load executes code embedded in the file; only
        # keep model files from a trusted source in this directory.
        if os.path.exists('model/model.txt'):
            with open('model/model.txt', 'rb') as file:
                classifier = pickle.load(file)
    else:
        lstm_model = Sequential()
        lstm_model.add(LSTM(128, input_shape=(X.shape[1:]),
                            activation='relu', return_sequences=True))
        lstm_model.add(Dropout(0.2))

        lstm_model.add(LSTM(128, activation='relu'))
        lstm_model.add(Dropout(0.2))

        lstm_model.add(Dense(32, activation='relu'))
        lstm_model.add(Dropout(0.2))

        lstm_model.add(Dense(2, activation='softmax'))
        lstm_model.compile(loss='sparse_categorical_crossentropy',
                           optimizer='adam', metrics=['accuracy'])
        # Fit on the training split only; fitting on the full X/Y would let the
        # model see the rows that are used as validation data.
        hist = lstm_model.fit(tfidf_X_train, tfidf_y_train, epochs=10,
                              validation_data=(tfidf_X_test, tfidf_y_test))
        classifier = lstm_model

        # Make sure the output directory exists before writing into it.
        os.makedirs('model', exist_ok=True)
        classifier.save_weights('model/model_weights.h5')
        model_json = classifier.to_json()
        with open("model/model.json", "w") as json_file:
            json_file.write(model_json)
        history = hist.history
        with open('model/history.pckl', 'wb') as f:
            pickle.dump(history, f)
        acc = history['accuracy'][-1] * 100
        text.insert(END, "LSTM Accuracy : " + str(acc) + "\n\n")
        text.insert(END, 'LSTM Model Summary can be seen in black console for layer details\n')
        lstm_model.summary()

def graph():
    """Plot the per-epoch accuracy and loss stored by ``runLSTM``.

    Reads the pickled history dictionary from ``model/history.pckl`` and
    draws its ``'accuracy'`` values in green and its ``'loss'`` values in
    blue on one figure, then shows the figure.
    """
    # NOTE(security): pickle.load executes code embedded in the file; the
    # history file is expected to be the one written by runLSTM().
    with open('model/history.pckl', 'rb') as f:
        data = pickle.load(f)
    acc = data['accuracy']
    loss = data['loss']
    plt.figure(figsize=(10, 6))
    plt.grid(True)
    plt.xlabel('Epochs')
    plt.ylabel('Accuracy/Loss')
    # The format string carries only marker and line style; the colour comes
    # from the keyword so the two do not contradict each other.
    plt.plot(acc, 'o-', color='green')
    plt.plot(loss, 'o-', color='blue')
    plt.legend(['Accuracy', 'Loss'], loc='upper left')
    plt.title('LSTM Model Accuracy & Loss Graph')
    plt.show()

def predict():
    """Classify every post in a user-chosen CSV file and list the verdicts.

    The first column of the chosen file supplies the posts. Each one is
    lower-cased, cleaned with ``cleanPost`` and vectorised with the global
    ``tfidf_vectorizer``; the global ``classifier`` then predicts its class.
    Class 0 is reported as GENUINE, anything else as FAKE.

    The classifier may return either class labels (one value per row) or
    per-class scores (several values per row); in the latter case the class
    with the highest score is used. If the file dialog is dismissed nothing
    happens.
    """
    testfile = filedialog.askopenfilename(initialdir="TwitterNewsData")
    if not testfile:
        # Dialog cancelled: there is no path to hand to read_csv().
        return
    testData = pd.read_csv(testfile)
    text.delete('1.0', END)
    testData = testData.values[:, 0]
    print(testData)

    # A model that declares a rank-3 input shape (such as the LSTM built in
    # runLSTM()) needs its features prepared the way preprocess() does it.
    # NOTE(review): a classifier unpickled from model/model.txt is fed the raw
    # TF-IDF row as before - confirm how that model was trained.
    input_shape = getattr(classifier, 'input_shape', None)
    wants_sequence = input_shape is not None and len(input_shape) == 3

    for raw in testData:
        # Cells may hold non-string values (e.g. NaN for an empty cell).
        msg = str(raw)
        print(msg)
        review = cleanPost(msg.strip().lower())
        features = tfidf_vectorizer.transform([review]).toarray()
        if wants_sequence:
            features = normalize(features)
            features = features.reshape((features.shape[0], features.shape[1], 1))
        output = np.asarray(classifier.predict(features))
        print(output)
        if output.ndim > 1 and output.shape[-1] > 1:
            # Per-class scores: take the index of the largest one.
            label = int(np.argmax(output, axis=-1).ravel()[0])
        else:
            label = output.ravel()[0]
        if label == 0:
            text.insert(END, msg + " === Given news predicted as GENUINE\n\n")
        else:
            text.insert(END, msg + " == Given news predicted as FAKE\n\n")

# --- Widget layout ---------------------------------------------------------
font = ('times', 15, 'bold')    # banner caption
ff = ('times', 12, 'bold')      # buttons
font1 = ('times', 12, 'bold')   # output text box

# Banner across the top of the window. Adjacent literals are concatenated by
# Python so the long caption stays a single string.
title = Label(main, text='DETECTION OF FAKE NEWS '
                         'THROUGH IMPLEMENTATION OF DATA SCIENCE '
                         'APPLICATION')
title.config(bg='gold2', fg='thistle1')
title.config(font=font)
title.config(height=3, width=120)
title.place(x=0, y=5)

# One button per step of the workflow, stacked down the left-hand side.
uploadButton = Button(main, text="Upload Fake News Dataset",
                      command=uploadDataset)
uploadButton.place(x=20, y=100)
uploadButton.config(font=ff)

processButton = Button(main, text="Preprocess Dataset",
                       command=preprocess)
processButton.place(x=20, y=150)
processButton.config(font=ff)

dtButton = Button(main, text="Run LSTM Algorithm",
                  command=runLSTM)
dtButton.place(x=20, y=200)
dtButton.config(font=ff)

graphButton = Button(main, text="Accuracy & Loss Graph",
                     command=graph)
graphButton.place(x=20, y=250)
graphButton.config(font=ff)

predictButton = Button(main, text="Test News Detection",
                       command=predict)
predictButton.place(x=20, y=300)
predictButton.config(font=ff)

# Output area that every callback writes to through the global ``text``.
text = Text(main, height=30, width=100)
# NOTE(review): the scrollbar is created and receives the text box's scroll
# position, but it is never placed in the window nor given a command, so it
# is not visible or usable - confirm whether that is intended.
scroll = Scrollbar(text)
text.configure(yscrollcommand=scroll.set)
text.place(x=330, y=100)
text.config(font=font1)

main.config(bg='DarkSlateGray1')
main.mainloop()

LSTM From Scratch in Python
No ratings yet
LSTM From Scratch in Python
11 pages
2nd Sem VTU Python Lab Manual
No ratings yet
2nd Sem VTU Python Lab Manual
40 pages
SlotDesigner Manual
No ratings yet
SlotDesigner Manual
142 pages
R
No ratings yet
R
4 pages
FND Imp Points
No ratings yet
FND Imp Points
6 pages
Sentence Embedding Code
No ratings yet
Sentence Embedding Code
9 pages
code text
No ratings yet
code text
4 pages
Untitled 10
No ratings yet
Untitled 10
6 pages
DL_3
No ratings yet
DL_3
6 pages
sentiment analysis using LSTM (1)
No ratings yet
sentiment analysis using LSTM (1)
5 pages
Sample
No ratings yet
Sample
6 pages
vertopal.com_movie review classification
No ratings yet
vertopal.com_movie review classification
5 pages
751_DNN_Assn 01
No ratings yet
751_DNN_Assn 01
8 pages
twins code
No ratings yet
twins code
4 pages
unit4 (1)
No ratings yet
unit4 (1)
23 pages
DL
No ratings yet
DL
17 pages
School of Engineering: Lab Manual On Machine Learning Lab
No ratings yet
School of Engineering: Lab Manual On Machine Learning Lab
23 pages
Cv prince
No ratings yet
Cv prince
120 pages
QLSTMvs LSTM
No ratings yet
QLSTMvs LSTM
7 pages
vit32_gptMD
No ratings yet
vit32_gptMD
6 pages
Final Code
No ratings yet
Final Code
16 pages
ccc
No ratings yet
ccc
25 pages
Medical Text Classifier GabrieldeOlaguibel
No ratings yet
Medical Text Classifier GabrieldeOlaguibel
12 pages
Dl 5 Excuted
No ratings yet
Dl 5 Excuted
13 pages
vertopal.com_HandWritten
No ratings yet
vertopal.com_HandWritten
13 pages
IRT Lab Programs
No ratings yet
IRT Lab Programs
9 pages
malaria_1735833704
No ratings yet
malaria_1735833704
14 pages
Pdf
No ratings yet
Pdf
41 pages
cyberbullying code
No ratings yet
cyberbullying code
6 pages
566f0619-9145-4b8f-b12b-cb8a5b0cd30d
No ratings yet
566f0619-9145-4b8f-b12b-cb8a5b0cd30d
17 pages
Fake News Classification - Ipynb - Colaboratory
No ratings yet
Fake News Classification - Ipynb - Colaboratory
6 pages
Document
No ratings yet
Document
3 pages
Train Edu Bert
No ratings yet
Train Edu Bert
3 pages
Neural Network
No ratings yet
Neural Network
10 pages
Import As Import As Import As Import As From Import From Import From Import From Import From Import From Import From Import From Import From Import
No ratings yet
Import As Import As Import As Import As From Import From Import From Import From Import From Import From Import From Import From Import From Import
8 pages
ML Report Fake News Detection
No ratings yet
ML Report Fake News Detection
15 pages
ML Week10.1
No ratings yet
ML Week10.1
5 pages
Super Visionado VSRegras
No ratings yet
Super Visionado VSRegras
6 pages
GloVe Embedding code
No ratings yet
GloVe Embedding code
3 pages
Assingment-3 NLP
No ratings yet
Assingment-3 NLP
5 pages
gpt-2 code
No ratings yet
gpt-2 code
2 pages
Deep Learning
No ratings yet
Deep Learning
46 pages
Lab 2 Assignment_W2022
No ratings yet
Lab 2 Assignment_W2022
8 pages
Null 0
No ratings yet
Null 0
6 pages
A5 - Jupyter Notebook PDF
No ratings yet
A5 - Jupyter Notebook PDF
4 pages
Random Forest
No ratings yet
Random Forest
5 pages
Aped For Fake News
No ratings yet
Aped For Fake News
6 pages
Lab5 Example Fall 23
No ratings yet
Lab5 Example Fall 23
4 pages
import numpy as np
No ratings yet
import numpy as np
3 pages
MNIST Classification Using CNN
No ratings yet
MNIST Classification Using CNN
5 pages
0.0.1 Implementation of Recurrent Neural Network: #Importing The Required Libraries
No ratings yet
0.0.1 Implementation of Recurrent Neural Network: #Importing The Required Libraries
9 pages
Import Numpy as Np
No ratings yet
Import Numpy as Np
5 pages
hatespeech_code_ipynb
No ratings yet
hatespeech_code_ipynb
31 pages
Assignment 3 DS5620
No ratings yet
Assignment 3 DS5620
11 pages
Report On - Social Media Research Topic Modeling
No ratings yet
Report On - Social Media Research Topic Modeling
26 pages
Import Library Python
No ratings yet
Import Library Python
10 pages
Keras Cheat Sheet Python
No ratings yet
Keras Cheat Sheet Python
1 page
NER_Brahui_NLP_Project (1)
No ratings yet
NER_Brahui_NLP_Project (1)
12 pages
Python CA 4
No ratings yet
Python CA 4
9 pages
Profound Python Data Science
From Everand
Profound Python Data Science
Onder Teker
No ratings yet
The Essential R Reference
From Everand
The Essential R Reference
Mark Gardener
No ratings yet
Computer Engineering Laboratory Solution Primer
From Everand
Computer Engineering Laboratory Solution Primer
Karan Bhandari
No ratings yet
Advanced C Concepts and Programming: First Edition
From Everand
Advanced C Concepts and Programming: First Edition
Gayatri
3/5 (1)
Jake Ryan: Southwestern University Blinn College
No ratings yet
Jake Ryan: Southwestern University Blinn College
1 page
Cs506 Solved Mcqs Final Term by Junaid
No ratings yet
Cs506 Solved Mcqs Final Term by Junaid
53 pages
Assembly Language Programs
No ratings yet
Assembly Language Programs
33 pages
Nested Loops
No ratings yet
Nested Loops
11 pages
Usb Cam Log
No ratings yet
Usb Cam Log
5 pages
FND Debug09feb
No ratings yet
FND Debug09feb
557 pages
TechNucleus - SQL Queries
No ratings yet
TechNucleus - SQL Queries
39 pages
12 CS 2024-25 SQP 3
No ratings yet
12 CS 2024-25 SQP 3
7 pages
Ques
No ratings yet
Ques
5 pages
Linked List Cheat Sheet
No ratings yet
Linked List Cheat Sheet
3 pages
Cambridge O Level: Computer Science 2210/22
No ratings yet
Cambridge O Level: Computer Science 2210/22
16 pages
C - Opengl - Question About glutMainLoop - Stack Overflow
No ratings yet
C - Opengl - Question About glutMainLoop - Stack Overflow
2 pages
Job Title: Software Development & Support Reports To: Senior Manager Location: Toronto, ON
No ratings yet
Job Title: Software Development & Support Reports To: Senior Manager Location: Toronto, ON
1 page
CS3361 Data Science Lab Manual
No ratings yet
CS3361 Data Science Lab Manual
43 pages
rohini_52749330676
No ratings yet
rohini_52749330676
14 pages
Chapter 1: Creating Relational Database (8 Marks) : Data
No ratings yet
Chapter 1: Creating Relational Database (8 Marks) : Data
11 pages
Python Module 1 2 3 CIE 1 Complete Solutions
No ratings yet
Python Module 1 2 3 CIE 1 Complete Solutions
48 pages
JBilling 3.2 Integration Guide
No ratings yet
JBilling 3.2 Integration Guide
90 pages
Crystal Reports in
No ratings yet
Crystal Reports in
21 pages
COMP1112 Lab6
No ratings yet
COMP1112 Lab6
9 pages
Katoch2021 Article AReviewOnGeneticAlgorithmPastP
No ratings yet
Katoch2021 Article AReviewOnGeneticAlgorithmPastP
37 pages
Chapter - 5 Concurrency Control PDF
No ratings yet
Chapter - 5 Concurrency Control PDF
57 pages
How To Debug Transfer Rules and Update Rules
No ratings yet
How To Debug Transfer Rules and Update Rules
6 pages
Visual Basic Language Companion PDF
No ratings yet
Visual Basic Language Companion PDF
139 pages
OS Interview Questions
No ratings yet
OS Interview Questions
29 pages
CS8661 - IP Lab Manual Final
No ratings yet
CS8661 - IP Lab Manual Final
86 pages
Computer Applications
No ratings yet
Computer Applications
17 pages

Sample Code

Uploaded by

Sample Code

Uploaded by

SAMPLE CODE

from tkinter import messagebox

from keras.models import Sequential

font = ('times', 15, 'bold')

font1 = ('times', 13, 'bold')

uploadButton = Button(main, text="Upload Fake News Dataset",

dtButton = Button(main, text="Run LSTM Algorithm",

graphButton = Button(main, text="Accuracy & Loss Graph",

predictButton = Button(main, text="Test News Detection",

font1 = ('times', 12, 'bold')

You might also like