# gpt-2 code

import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import torch
from sklearn.metrics import confusion_matrix
from tensorflow.keras.preprocessing.sequence import pad_sequences
from tensorflow.keras.layers import (Input, Conv1D, MaxPooling1D, GRU,
                                     Dense, Dropout, Concatenate)
from tensorflow.keras.models import Model
from tensorflow.keras.optimizers import Adam
from tensorflow.keras.callbacks import EarlyStopping
from transformers import GPT2Tokenizer, GPT2Model

print('import done')

# Define hyperparameters
MAX_SEQ_LENGTH = 100
GPT2_HIDDEN_SIZE = 768        # hidden size of the pretrained "gpt2" checkpoint
FILTER_SIZES = [3, 5, 7]
NUM_FILTERS = 256
GRU_UNITS = 256
DENSE_UNITS = 1
DROPOUT_RATE = 0.8
print('config done')

# Load the dataset
df = pd.read_csv("/kaggle/input/sentiment140/training.1600000.processed.noemoticon.csv",
                 encoding='latin-1', header=None)
df.columns = ["sentiment", "id", "date", "query", "user", "text"]
df = df[["sentiment", "text"]]
df["sentiment"] = df["sentiment"].replace({0: "negative", 4: "positive"})
# Sentiment140 is ordered by label (all negatives first, then positives),
# so shuffle; otherwise validation_split below would hold out only one class.
df = df.sample(frac=1, random_state=42).reset_index(drop=True)
texts = df["text"].values
labels = df["sentiment"].values
labels = np.array([1 if label == "positive" else 0 for label in labels])
print(df.head(10))

# Preprocess text data: use a frozen pretrained GPT-2 as the feature extractor
tokenizer = GPT2Tokenizer.from_pretrained("gpt2")
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
gpt_model = GPT2Model.from_pretrained("gpt2").to(device)
gpt_model.eval()  # inference only; disables dropout inside GPT-2

def extract_gpt_features(text):
    # Tokenize and truncate to MAX_SEQ_LENGTH tokens so no sequence
    # exceeds the length the classifier below is padded to.
    inputs = tokenizer.encode_plus(text, add_special_tokens=True,
                                   truncation=True, max_length=MAX_SEQ_LENGTH,
                                   return_tensors="pt")
    inputs = inputs.to(device)

    with torch.no_grad():
        outputs = gpt_model(**inputs)[0]  # (1, seq_len, 768) hidden states

    # Keep the full per-token sequence (not just the first token) so the
    # Conv1D/GRU layers below have a real time axis to work over.
    features = outputs.squeeze(0).cpu().numpy()  # (seq_len, 768)
    return features

# Keep this as a list: per-tweet lengths differ, so it is ragged until padded.
# Calling GPT-2 once per tweet over 1.6M rows is slow; see the batched sketch below.
sequences = [extract_gpt_features(text) for text in texts]
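
# Illustrative sketch, not part of the original script: a batched variant of
# the extractor above (the name extract_gpt_features_batched is ours). GPT-2
# has no pad token by default, so we reuse the EOS token for padding and strip
# the padded positions afterwards via the attention mask.
tokenizer.pad_token = tokenizer.eos_token

def extract_gpt_features_batched(batch_texts):
    enc = tokenizer(list(batch_texts), return_tensors="pt", padding=True,
                    truncation=True, max_length=MAX_SEQ_LENGTH).to(device)
    with torch.no_grad():
        hidden = gpt_model(**enc)[0]  # (batch, padded_len, 768)
    # GPT2Tokenizer pads on the right, so the real tokens of each example
    # are the first mask.sum() positions.
    return [h[:int(m.sum())].cpu().numpy()
            for h, m in zip(hidden, enc["attention_mask"])]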


# Pad/truncate the float feature sequences to a fixed length
data = pad_sequences(sequences, maxlen=MAX_SEQ_LENGTH, dtype='float32',
                     padding='post', truncating='post')  # (N, 100, 768)

# Define model architecture
# The GPT-2 hidden states already act as embeddings, so no Embedding layer
# (or word index) is needed; the input is the feature sequence itself.
inputs = Input(shape=(MAX_SEQ_LENGTH, GPT2_HIDDEN_SIZE))
conv_layers = []
for filter_size in FILTER_SIZES:
    conv = Conv1D(filters=NUM_FILTERS, kernel_size=filter_size,
                  activation='relu')(inputs)
    pool = MaxPooling1D(pool_size=MAX_SEQ_LENGTH - filter_size + 1)(conv)
    conv_layers.append(pool)
concat = Concatenate()(conv_layers)
gru = GRU(units=GRU_UNITS)(concat)
dropout = Dropout(rate=DROPOUT_RATE)(gru)
outputs = Dense(units=DENSE_UNITS, activation='sigmoid')(dropout)
model = Model(inputs=inputs, outputs=outputs)
model.compile(optimizer=Adam(), loss='binary_crossentropy', metrics=['accuracy'])
model.summary()
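
# Quick sanity check (illustrative, not in the original script): confirm the
# feature tensor matches the model's expected input shape before training.
print(data.shape)         # expected: (len(texts), MAX_SEQ_LENGTH, GPT2_HIDDEN_SIZE)
print(model.input_shape)  # expected: (None, MAX_SEQ_LENGTH, GPT2_HIDDEN_SIZE)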

# Train the model with early stopping
es = EarlyStopping(monitor='val_accuracy', patience=5, mode='max',
                   min_delta=0.01, baseline=0.85)
history = model.fit(data, labels, epochs=50, validation_split=0.3,
                    callbacks=[es])

# Plot accuracy
plt.plot(history.history['accuracy'])
plt.plot(history.history['val_accuracy'])
plt.title('Model Accuracy')
plt.xlabel('Epoch')
plt.ylabel('Accuracy')
plt.legend(['Train', 'Validation'], loc='upper left')
plt.show()
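
# Optional addition (not in the original script): plot the loss curves the
# same way; 'loss' and 'val_loss' are always present in history.history.
plt.plot(history.history['loss'])
plt.plot(history.history['val_loss'])
plt.title('Model Loss')
plt.xlabel('Epoch')
plt.ylabel('Loss')
plt.legend(['Train', 'Validation'], loc='upper left')
plt.show()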

# Make predictions on new data
new_texts = ["is upset that he can't update his Facebook by texting it... and might cry as a result School today ...",
             "@Kenichan I dived many times for the ball. Managed to save 50% The rest go out of bounds",
             "my whole body feels itchy and like its on fire",
             "@nationwideclass no, it's not behaving at all. i'm mad. why am i here? because I can't see you all o...",
             "@Kwesidei not the whole crew",
             "@LettyA ahh ive always wanted to see rent love the soundtrack!!",
             "@FakerPattyPattz Oh dear. Were you drinking out of the forgotten table drinks? "]

new_sequences = [extract_gpt_features(text) for text in new_texts]


# Pad with the same settings as the training data
new_data = pad_sequences(new_sequences, maxlen=MAX_SEQ_LENGTH, dtype='float32',
                         padding='post', truncating='post')
predictions = model.predict(new_data)
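
# Illustrative addition (not in the original script): map the sigmoid scores
# to readable labels for a quick qualitative check of the predictions.
for text, score in zip(new_texts, predictions[:, 0]):
    label = "positive" if score >= 0.5 else "negative"
    print(f"{score:.3f} {label}: {text[:60]}")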

# Evaluate the model
y_pred = np.round(predictions).astype(int).flatten()  # (7,) class labels
y_true = np.array([0, 0, 0, 0, 0, 0, 0])  # True labels of the new texts
cm = confusion_matrix(y_true, y_pred, labels=[0, 1])  # fix labels so cm is 2x2
print(cm)
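
# Optional fuller summary (illustrative, not in the original script); passing
# labels explicitly keeps it working even if only one class is predicted.
from sklearn.metrics import classification_report
print(classification_report(y_true, y_pred, labels=[0, 1],
                            target_names=["negative", "positive"],
                            zero_division=0))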
