Word2Vec code

Uploaded by

valachi b-boy

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT, PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

1 views

Word2Vec code

Uploaded by

valachi b-boy

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT, PDF, TXT or read online on Scribd

You are on page 1/ 2

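# Word2Vec + BiLSTM
# NOTE(review): despite the title, no pretrained Word2Vec vectors are loaded in
# this script; the Embedding layer is trained from scratch and feeds a
# CNN + BiLSTM classifier.

# Code version 0, updated with early stopping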

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
from tensorflow.keras.callbacks import EarlyStopping
from tensorflow.keras.layers import (
    Bidirectional,
    Concatenate,
    Conv1D,
    Dense,
    Dropout,
    Embedding,
    Input,
    LSTM,
    MaxPooling1D,
)
from tensorflow.keras.models import Model
from tensorflow.keras.optimizers import Adam
from tensorflow.keras.preprocessing.sequence import pad_sequences
from tensorflow.keras.preprocessing.text import Tokenizer
print("import done")

# Hyperparameters shared by the preprocessing, model and training steps.
MAX_SEQ_LENGTH = 100     # every tweet is padded/truncated to this many tokens
MAX_NB_WORDS = 20_000    # vocabulary cap handed to the tokenizer (num_words)
EMBEDDING_DIM = 100      # width of each learned word vector
FILTER_SIZES = [3, 4, 5]  # one Conv1D branch is built per kernel size
NUM_FILTERS = 128        # filters in each Conv1D branch
LSTM_UNITS = 64          # units per direction of the bidirectional LSTM
DENSE_UNITS = 1          # single sigmoid output for binary sentiment
DROPOUT_RATE = 0.5       # dropout applied just before the output layer
PATIENCE = 10            # early-stopping patience, in epochs
EPOCHS = 50              # upper bound on training epochs
print("config done")

# load data
# The CSV has no header row, so all six column names are supplied here and
# only the two columns the script uses are actually parsed; this avoids
# holding four unused columns for 1.6M rows in memory.
df = pd.read_csv(
    "/kaggle/input/sentiment140/training.1600000.processed.noemoticon.csv",
    encoding='latin-1',
    header=None,
    names=["sentiment", "id", "date", "query", "user", "text"],
    usecols=["sentiment", "text"],
)
df = df[["sentiment", "text"]]  # keep the original column order
# Raw polarity codes: 0 -> negative, 4 -> positive.
df["sentiment"] = df["sentiment"].replace({0: "negative", 4: "positive"})
texts = df["text"].values
# Vectorised 0/1 encoding (1 = positive, anything else = 0), replacing a
# per-row Python loop over the whole dataset.
labels = (df["sentiment"] == "positive").values.astype(int)
print(df.head(10))

# preprocess text data

# Fit a word-level tokenizer on the whole corpus, capped at MAX_NB_WORDS.
tokenizer = Tokenizer(num_words=MAX_NB_WORDS)
tokenizer.fit_on_texts(texts)
word_index = tokenizer.word_index

# Turn every text into a list of word indices, then pad/truncate each list
# to exactly MAX_SEQ_LENGTH entries.
sequences = tokenizer.texts_to_sequences(texts)
data = pad_sequences(
    sequences,
    maxlen=MAX_SEQ_LENGTH,
)
print('preprocessing done')

# define model architecture

# The tokenizer was created with num_words=MAX_NB_WORDS, so the sequences it
# produces only contain indices below MAX_NB_WORDS (0 is the padding value).
# Sizing the embedding table to the full word_index would allocate rows that
# can never be looked up.
vocab_size = min(MAX_NB_WORDS, len(word_index) + 1)

inputs = Input(shape=(MAX_SEQ_LENGTH,))
# `input_length` is omitted: the Input layer already fixes the sequence
# length, and newer Keras releases deprecate that argument.
embedding = Embedding(input_dim=vocab_size, output_dim=EMBEDDING_DIM)(inputs)

# One convolution + max-pool branch per kernel size.
conv_layers = []
for filter_size in FILTER_SIZES:
    conv = Conv1D(
        filters=NUM_FILTERS,
        kernel_size=filter_size,
        activation='relu',
    )(embedding)
    # With the default (unpadded) convolution the branch output has
    # MAX_SEQ_LENGTH - filter_size + 1 time steps, so this pool window spans
    # the whole sequence and leaves a single time step per branch.
    pool = MaxPooling1D(pool_size=MAX_SEQ_LENGTH - filter_size + 1)(conv)
    conv_layers.append(pool)

# Branches are joined on the channel axis.
concat = Concatenate()(conv_layers)
# NOTE(review): because each branch was pooled down to one time step, the
# BiLSTM below appears to run over a length-1 sequence — confirm this is the
# intended architecture.
lstm = Bidirectional(LSTM(units=LSTM_UNITS))(concat)
dropout = Dropout(rate=DROPOUT_RATE)(lstm)
outputs = Dense(units=DENSE_UNITS, activation='sigmoid')(dropout)

model = Model(inputs=inputs, outputs=outputs)
model.compile(optimizer=Adam(), loss='binary_crossentropy', metrics=['accuracy'])
model.summary()

# train the model with early stopping

# Keras carves the validation split off the *end* of the arrays before any
# shuffling happens. The rows are still in CSV order at this point, and the
# Sentiment140 file appears to be grouped by polarity (verify against the
# data), in which case the last 40% would contain a single class. Shuffle
# once, with a fixed seed for reproducibility, so that the training and
# validation parts both see a mix of labels.
# Note: fancy indexing makes a shuffled copy of `data` and `labels`.
shuffle_idx = np.random.default_rng(42).permutation(len(data))

# NOTE(review): with baseline=0.85, epochs whose val_accuracy stays at or
# below 0.85 presumably do not count as improvements, so training may stop
# after PATIENCE epochs — confirm this threshold is intended.
es = EarlyStopping(
    monitor='val_accuracy',
    patience=PATIENCE,
    mode='max',
    min_delta=0.01,
    baseline=0.85,
)
history = model.fit(
    data[shuffle_idx],
    labels[shuffle_idx],
    epochs=EPOCHS,
    validation_split=0.4,
    callbacks=[es],
)

# Plot accuracy
# Draw the training curve first, then the validation curve, on the current
# axes, so the legend entries below line up with the plotted series.
ax = plt.gca()
for metric in ('accuracy', 'val_accuracy'):
    ax.plot(history.history[metric])
ax.set_title('Model Accuracy')
ax.set_xlabel('Epoch')
ax.set_ylabel('Accuracy')
ax.legend(['Train', 'Validation'], loc='upper left')
plt.show()

# Make predictions on new data

# Sample tweets to score. Long literals are split with implicit string
# concatenation inside parentheses so that no literal spans a physical line
# break.
new_texts = [
    (
        "is upset that he can't update his Facebook by texting it... and might "
        "cry as a result School today ..."
    ),
    (
        "@Kenichan I dived many times for the ball. Managed to save 50% The "
        "rest go out of bounds"
    ),
    "my whole body feels itchy and like its on fire",
    (
        "@nationwideclass no, it's not behaving at all. i'm mad. why am i "
        "here? because I can't see you all o..."
    ),
    "@Kwesidei not the whole crew",
    "@LettyA ahh ive always wanted to see rent love the soundtrack!!",
    (
        "@FakerPattyPattz Oh dear. Were you drinking out of the forgotten "
        "table drinks? "
    ),
]
# Reuse the tokenizer fitted on the training corpus and the same padding
# length, so the inputs match what the model was trained on.
new_sequences = tokenizer.texts_to_sequences(new_texts)
new_data = pad_sequences(new_sequences, maxlen=MAX_SEQ_LENGTH)
predictions = model.predict(new_data)

# Evaluate the model

# Round the sigmoid outputs to hard 0/1 predictions.
y_pred = np.round(predictions)
y_true = np.array([0, 0, 0, 0, 0, 0, 0])  # true labels of new data

# `confusion_matrix` was never imported in this script, so the counts are
# built directly with numpy. Rows are the true class and columns the
# predicted class; the matrix is always 2x2, even when only one class
# occurs in y_true or y_pred.
pred_classes = y_pred.astype(int).ravel()
cm = np.zeros((2, 2), dtype=int)
for true_class, pred_class in zip(y_true, pred_classes):
    cm[true_class, pred_class] += 1
print(cm)

Astm E1245-2003-R-2008
100% (1)
Astm E1245-2003-R-2008
8 pages
gpt-2 code
No ratings yet
gpt-2 code
2 pages
GloVe Embedding code
No ratings yet
GloVe Embedding code
3 pages
bertweet tokenizer
No ratings yet
bertweet tokenizer
2 pages
sentiment analysis using LSTM (1)
No ratings yet
sentiment analysis using LSTM (1)
5 pages
566f0619-9145-4b8f-b12b-cb8a5b0cd30d
No ratings yet
566f0619-9145-4b8f-b12b-cb8a5b0cd30d
17 pages
Importing Packages: Id Label Tweet 0 1 2 3 4
No ratings yet
Importing Packages: Id Label Tweet 0 1 2 3 4
8 pages
1729401471516
No ratings yet
1729401471516
98 pages
NLP
No ratings yet
NLP
45 pages
DL
No ratings yet
DL
17 pages
LSTM Flow
No ratings yet
LSTM Flow
3 pages
NLP Assignment 2
No ratings yet
NLP Assignment 2
3 pages
Adobe Scan 08 Jan 2025
No ratings yet
Adobe Scan 08 Jan 2025
7 pages
2023 Aug How To Produce Data For A Neural networkORG
No ratings yet
2023 Aug How To Produce Data For A Neural networkORG
6 pages
Sample Code
No ratings yet
Sample Code
8 pages
Hugging Face
No ratings yet
Hugging Face
1 page
PHASE 2 IBM
No ratings yet
PHASE 2 IBM
5 pages
Twitter Sentiment Analysis Dss
No ratings yet
Twitter Sentiment Analysis Dss
14 pages
DL 6th Exp Program
No ratings yet
DL 6th Exp Program
3 pages
unit4 (1)
No ratings yet
unit4 (1)
23 pages
Sample
No ratings yet
Sample
6 pages
Prac 5
No ratings yet
Prac 5
3 pages
code text
No ratings yet
code text
4 pages
A3_44_DL_TA
No ratings yet
A3_44_DL_TA
10 pages
intent_recognizer
No ratings yet
intent_recognizer
5 pages
Super Visionado VSRegras
No ratings yet
Super Visionado VSRegras
6 pages
2023 Aug How To Prepare Data For A Neural Network A Step-by-Step Guide
No ratings yet
2023 Aug How To Prepare Data For A Neural Network A Step-by-Step Guide
7 pages
Exp 7 Text Sequence Generator LSTM
No ratings yet
Exp 7 Text Sequence Generator LSTM
12 pages
new 2
No ratings yet
new 2
2 pages
Sentence Embedding Code
No ratings yet
Sentence Embedding Code
9 pages
NLP Lab
No ratings yet
NLP Lab
18 pages
Dl lab answers batch 2
No ratings yet
Dl lab answers batch 2
27 pages
Tweet-Sentiment-Extraction - Bidirectional-LSTM Model
No ratings yet
Tweet-Sentiment-Extraction - Bidirectional-LSTM Model
57 pages
Exp 8 Machine Translation
No ratings yet
Exp 8 Machine Translation
11 pages
Assingment-3 NLP
No ratings yet
Assingment-3 NLP
5 pages
Sentimental Analysis
No ratings yet
Sentimental Analysis
3 pages
DL 4
No ratings yet
DL 4
5 pages
Computer Organization: National Institute of Technology Hamirpur
No ratings yet
Computer Organization: National Institute of Technology Hamirpur
8 pages
Next Word Prediction With NLP and Deep Learning
No ratings yet
Next Word Prediction With NLP and Deep Learning
13 pages
HateSpeech.ipynb - Colab
No ratings yet
HateSpeech.ipynb - Colab
8 pages
IRT Lab Programs
No ratings yet
IRT Lab Programs
9 pages
DL Programs
No ratings yet
DL Programs
13 pages
Rajeek 7
No ratings yet
Rajeek 7
3 pages
cyberbullying code
No ratings yet
cyberbullying code
6 pages
Artificial Neural Network Code
No ratings yet
Artificial Neural Network Code
3 pages
NLP
No ratings yet
NLP
4 pages
Sentiment Analysis On User-Generated Tweets
No ratings yet
Sentiment Analysis On User-Generated Tweets
15 pages
Recurring Neural Networks For Sequence - Sentiment Analysis With The IMDb Dataset - Ipynb - Colaboratory
No ratings yet
Recurring Neural Networks For Sequence - Sentiment Analysis With The IMDb Dataset - Ipynb - Colaboratory
16 pages
phase 3 IBM project
No ratings yet
phase 3 IBM project
4 pages
Image Caption2
No ratings yet
Image Caption2
9 pages
Word2vec Flow
No ratings yet
Word2vec Flow
2 pages
ML Week10.1
No ratings yet
ML Week10.1
5 pages
hatespeech_code_ipynb
No ratings yet
hatespeech_code_ipynb
31 pages
NLP Group 22
No ratings yet
NLP Group 22
8 pages
Import As Import As Import As Import As From Import From Import From Import From Import From Import From Import From Import From Import From Import
No ratings yet
Import As Import As Import As Import As From Import From Import From Import From Import From Import From Import From Import From Import From Import
8 pages
NLP PDF
No ratings yet
NLP PDF
17 pages
Image_Captioning_with_Visual_Attention.pdf
No ratings yet
Image_Captioning_with_Visual_Attention.pdf
16 pages
Assignment 7
No ratings yet
Assignment 7
10 pages
Neural Networks
No ratings yet
Neural Networks
8 pages
SQL Server: Tips and Tricks - 1
From Everand
SQL Server: Tips and Tricks - 1
Priyanka Agarwal
5/5 (1)
Reason Tool Docs
No ratings yet
Reason Tool Docs
17 pages
Ds1922E Ibutton High-Temperature Logger With 8Kb Datalog Memory
No ratings yet
Ds1922E Ibutton High-Temperature Logger With 8Kb Datalog Memory
44 pages
Carroll - Ostlie 02.15
No ratings yet
Carroll - Ostlie 02.15
5 pages
Bms Battery Charging
No ratings yet
Bms Battery Charging
12 pages
Kalman Filtering Approach To Market Price Forecasting
No ratings yet
Kalman Filtering Approach To Market Price Forecasting
117 pages
7066 - Sni 7648-2010
100% (1)
7066 - Sni 7648-2010
22 pages
MSZ DW
No ratings yet
MSZ DW
2 pages
Assignment
No ratings yet
Assignment
2 pages
Carbazole Violet
No ratings yet
Carbazole Violet
1 page
B-Tree Insert and Delete
No ratings yet
B-Tree Insert and Delete
22 pages
Homogeneous
No ratings yet
Homogeneous
10 pages
Pass Guide: 100% Pass Your Exam Test With Our Valid and Useful Exam Study Guide
No ratings yet
Pass Guide: 100% Pass Your Exam Test With Our Valid and Useful Exam Study Guide
6 pages
Intelligent Energy Management in Hybrid Electric Vehicles
No ratings yet
Intelligent Energy Management in Hybrid Electric Vehicles
32 pages
Botler, Jiménez - 2017 - On Path Decompositions of 2k-Regular Graphs
No ratings yet
Botler, Jiménez - 2017 - On Path Decompositions of 2k-Regular Graphs
7 pages
Vishal Kumar Singh CV_2024
No ratings yet
Vishal Kumar Singh CV_2024
3 pages
Siddhanta Shiromani CH 14 Translated
No ratings yet
Siddhanta Shiromani CH 14 Translated
3 pages
Public-Key Cryptography Standards: PKCS: Yongge Wang, PH.D., University of North Carolina at Charlotte
No ratings yet
Public-Key Cryptography Standards: PKCS: Yongge Wang, PH.D., University of North Carolina at Charlotte
19 pages
Introduction To C Language
No ratings yet
Introduction To C Language
55 pages
Cosmetic Automation Sorav
No ratings yet
Cosmetic Automation Sorav
21 pages
Resumen CCNA Data Center 200-155
No ratings yet
Resumen CCNA Data Center 200-155
15 pages
Opgw - 24g652-Ast-177 (69.8 - 256.7)
No ratings yet
Opgw - 24g652-Ast-177 (69.8 - 256.7)
9 pages
Mack III 8 211 V Service Manual
100% (55)
Mack III 8 211 V Service Manual
20 pages
On Fly Ash by Sumit Suman
100% (3)
On Fly Ash by Sumit Suman
20 pages
PolyU CVS Lab Report
No ratings yet
PolyU CVS Lab Report
6 pages
Composites and Applications
No ratings yet
Composites and Applications
46 pages
Cowan Reines Experiment
No ratings yet
Cowan Reines Experiment
13 pages
Hughes2021 Book QuantumComputingForTheQuantumC
100% (6)
Hughes2021 Book QuantumComputingForTheQuantumC
159 pages
23
No ratings yet
23
70 pages
Journal of Trading - Behind Stock Price Movement
No ratings yet
Journal of Trading - Behind Stock Price Movement
12 pages

Word2Vec code

Uploaded by

Word2Vec code

Uploaded by

#Word2Vec + BiLSTM

#code 0 updated with early stop

# preprocess text data

# define model architecture

# train the model with early stopping

# Make predictions on new data

# Evaluate the model

You might also like