Supervised vs. Rule-Based
import pandas as pd
from google.colab import files
import numpy as np
import nltk
from nltk.sentiment.vader import SentimentIntensityAnalyzer
from tensorflow.keras.preprocessing.text import Tokenizer
from tensorflow.keras.preprocessing.sequence import pad_sequences
from tensorflow.keras.utils import to_categorical
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Embedding, SpatialDropout1D, LSTM, Dense
from sklearn.preprocessing import LabelEncoder
nltk.download("vader_lexicon")
True
files.upload()
Tweets = pd.read_csv("Tweets2.csv")
Tweets.shape
(74682, 4)
Tweets.head()
Tweets.groupby(['sentiment']).size()
sentiment
Irrelevant 12990
Negative 22542
Neutral 18318
Positive 20832
dtype: int64
# fold the 'Irrelevant' class into 'Neutral', leaving three classes
Tweets.loc[Tweets['sentiment'] == 'Irrelevant', 'sentiment'] = 'Neutral'
Tweets = Tweets.dropna(subset=['text'])   # drop rows with missing tweet text
Tweets.reset_index(drop=True, inplace=True)
Tweets.shape
(73996, 4)
Tweets.groupby(['sentiment']).size()
sentiment
Negative 22358
Neutral 30983
Positive 20655
dtype: int64
Supervised
token = Tokenizer(num_words=100)   # keep only the 100 most frequent words
token.fit_on_texts(Tweets['text'].values)
X = token.texts_to_sequences(Tweets['text'].values)
X = pad_sequences(X, padding="post", maxlen=100)   # pad/truncate every tweet to 100 tokens
labelencoder = LabelEncoder()
y = labelencoder.fit_transform(Tweets['sentiment'])   # Negative=0, Neutral=1, Positive=2
print(y)
[2 2 2 ... 2 2 2]
y = to_categorical(y)   # one-hot encode the integer labels
print(y)
[[0. 0. 1.]
[0. 0. 1.]
[0. 0. 1.]
...
[0. 0. 1.]
[0. 0. 1.]
[0. 0. 1.]]
modelo = Sequential()
# with num_words=100 the token ids never exceed 99, so this input_dim is larger
# than strictly needed; input_length is deprecated in recent Keras (see warning)
modelo.add(Embedding(input_dim=len(token.word_index), output_dim=128,
                     input_length=X.shape[1]))
modelo.add(SpatialDropout1D(0.2))
modelo.add(LSTM(units=196, dropout=0.2, recurrent_dropout=0,
                activation='tanh', recurrent_activation='sigmoid',
                unroll=False, use_bias=True))
modelo.add(Dense(units=3, activation="softmax"))   # one unit per sentiment class
/usr/local/lib/python3.10/dist-packages/keras/src/layers/core/embedding.py:90:
UserWarning: Argument `input_length` is deprecated. Just remove it.
  warnings.warn(
modelo.compile(loss='categorical_crossentropy', optimizer='adam',
               metrics=['accuracy'])
print(modelo.summary())
Model: "sequential_1"
┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━┓
┃ Layer (type)                    ┃ Output Shape        ┃     Param # ┃
┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━┩
│ embedding_1 (Embedding)         │ ?                   │ 0 (unbuilt) │
├─────────────────────────────────┼─────────────────────┼─────────────┤
│ spatial_dropout1d_1             │ ?                   │ 0 (unbuilt) │
│ (SpatialDropout1D)              │                     │             │
├─────────────────────────────────┼─────────────────────┼─────────────┤
│ lstm_1 (LSTM)                   │ ?                   │ 0 (unbuilt) │
├─────────────────────────────────┼─────────────────────┼─────────────┤
│ dense_1 (Dense)                 │ ?                   │ 0 (unbuilt) │
└─────────────────────────────────┴─────────────────────┴─────────────┘
None
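The cell that splits the data and trains the model is not preserved in the transcript. A minimal sketch consistent with the step counts in the logs (89 training batches per epoch below, 925 evaluation batches later) would be the following, where test_size=0.4 and batch_size=500 are inferred from those counts, not confirmed:

from sklearn.model_selection import train_test_split

# Assumed cell (not in the transcript): a 60/40 split leaves ~44.4k training
# rows, and batch_size=500 yields the 89 steps/epoch seen in the log below.
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.4,
                                                    random_state=0)
modelo.fit(X_train, y_train, epochs=5, batch_size=500)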
Epoch 1/5
89/89 ━━━━━━━━━━━━━━━━━━━━ 6s 46ms/step - accuracy: 0.4188 - loss: 1.0838
Epoch 2/5
89/89 ━━━━━━━━━━━━━━━━━━━━ 4s 44ms/step - accuracy: 0.4183 - loss: 1.0831
Epoch 3/5
89/89 ━━━━━━━━━━━━━━━━━━━━ 5s 45ms/step - accuracy: 0.4200 - loss: 1.0821
Epoch 4/5
89/89 ━━━━━━━━━━━━━━━━━━━━ 4s 46ms/step - accuracy: 0.4156 - loss: 1.0837
Epoch 5/5
89/89 ━━━━━━━━━━━━━━━━━━━━ 4s 45ms/step - accuracy: 0.4183 - loss: 1.0825
<keras.src.callbacks.history.History at 0x7d98d00fe200>
_, accuracy = modelo.evaluate(X_test, y_test)
print("Accuracy: ", accuracy)
925/925 ━━━━━━━━━━━━━━━━━━━━ 4s 4ms/step - accuracy: 0.4207 - loss: 1.0815
Accuracy:  0.41920334100723267
VADER
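As background for the loop below, polarity_scores returns the fraction of negative, neutral, and positive content in a text plus an aggregate compound score; dropping compound and taking the largest remaining key turns the scores into a categorical label. A quick sketch (the numeric values here are illustrative, not actual output):

mas = SentimentIntensityAnalyzer()
scores = mas.polarity_scores("I love this game")
# scores is a dict like {'neg': 0.0, 'neu': 0.33, 'pos': 0.67, 'compound': 0.64}
del scores['compound']
print(max(scores, key=scores.get))   # -> 'pos' for a clearly positive sentence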
mas = SentimentIntensityAnalyzer()
Tweets['vader_sentiment'] = ''
for i in range(len(Tweets.index)):
    scores = mas.polarity_scores(Tweets['text'].iloc[i])
    del scores['compound']   # keep only the neg/neu/pos proportions
    # label each tweet with whichever proportion is largest
    Tweets.loc[i, 'vader_sentiment'] = max(scores, key=scores.get)
Tweets.groupby(['vader_sentiment']).size()
vader_sentiment
neg     3660
neu    65581
pos     4755
dtype: int64
Tweets.groupby(['sentiment']).size()
sentiment
Negative 22358
Neutral 30983
Positive 20655
dtype: int64
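Between this tally and the next, the VADER labels switch from neg/neu/pos to the dataset's Negative/Neutral/Positive naming. The remapping cell is missing from the transcript, but a one-liner like this (assumed, not confirmed) produces the counts below:

# Assumed cell: rename VADER's labels to match the dataset's
Tweets['vader_sentiment'] = Tweets['vader_sentiment'].map(
    {'neg': 'Negative', 'neu': 'Neutral', 'pos': 'Positive'})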
Tweets.groupby(['vader_sentiment']).size()
vader_sentiment
Negative     3660
Neutral     65581
Positive     4755
dtype: int64
from sklearn.metrics import confusion_matrix, accuracy_score
y_pred = Tweets['vader_sentiment']
y_test = Tweets['sentiment']
cm = confusion_matrix(y_test, y_pred)
print(cm)                                # matrix printout not preserved here
print(accuracy_score(y_test, y_pred))    # overall agreement with the given labels
0.44886210065408944
On these numbers, rule-based VADER (≈0.449 agreement over the full dataset) edges out the supervised LSTM (≈0.419 test accuracy), though both remain close to chance for three classes.