0% found this document useful (0 votes)
13 views3 pages

RNN Text Generation

Rnn

Uploaded by

kishoranbu14
Copyright
© All Rights Reserved
We take content rights seriously. If you suspect this is your content, claim it here.
Available Formats
Download as DOCX, PDF, TXT or read online on Scribd
0% found this document useful (0 votes)
13 views3 pages

RNN Text Generation

Rnn

Uploaded by

kishoranbu14
Copyright
© All Rights Reserved
We take content rights seriously. If you suspect this is your content, claim it here.
Available Formats
Download as DOCX, PDF, TXT or read online on Scribd
You are on page 1/ 3

RNN Language Model for Text Generation

Python Code:

# Step 1: Preprocessing Text


def preprocess_text(text):
    """Normalize *text* into a list of lowercase word tokens.

    Strips every character that is not alphanumeric or whitespace,
    lowercases the result, and splits on whitespace.
    """
    cleaned = re.sub(r'[^a-zA-Z0-9\s]', '', text)
    return cleaned.lower().split()

# Sample text (use a larger corpus for better results)
corpus = """
Joseph Vijay Chandrasekhar (born 22 June 1974), known professionally as Vijay, is an
Indian actor and playback singer who works in Tamil cinema. ...
"""

# Tokenize the corpus and build the two word<->index lookup tables.
words = preprocess_text(corpus)
vocab = sorted(set(words))
word_to_idx = {}
idx_to_word = {}
for position, token in enumerate(vocab):
    word_to_idx[token] = position
    idx_to_word[position] = token

# Represent the whole corpus as a sequence of vocabulary indices.
encoded = [word_to_idx[token] for token in words]

# Step 2: Dataset Preparation


# Size of the sliding context window: the model sees this many words
# and is trained to predict the one that follows.
sequence_length = 5 # Number of words in input sequence

class TextDataset(Dataset):
    """Sliding-window next-word dataset.

    Every item pairs a window of ``sequence_length`` consecutive word
    indices with the index of the word that immediately follows it.
    """

    def __init__(self, encoded_text, sequence_length):
        # Precompute all (context, target) pairs up front.
        self.data = [
            (encoded_text[start:start + sequence_length],
             encoded_text[start + sequence_length])
            for start in range(len(encoded_text) - sequence_length)
        ]

    def __len__(self):
        return len(self.data)

    def __getitem__(self, idx):
        context, target = self.data[idx]
        return torch.tensor(context), torch.tensor(target)
# Materialize all (context, next-word) pairs and wrap them in shuffled
# mini-batches of 16 for training.
dataset = TextDataset(encoded, sequence_length)
dataloader = DataLoader(dataset, batch_size=16, shuffle=True)

# Step 3: Define the RNN Model


class RNNLanguageModel(nn.Module):
    """Word-level RNN language model: embedding -> vanilla RNN -> linear head.

    Given a (batch, seq_len) tensor of word indices, ``forward`` returns
    logits over the vocabulary for the word following the sequence, plus
    the updated hidden state.
    """

    def __init__(self, vocab_size, embedding_dim, hidden_dim):
        super(RNNLanguageModel, self).__init__()
        # Bug fix: remember hidden_dim on the instance. init_hidden()
        # previously read the module-level global `hidden_dim`, which
        # breaks if the model is built with a different size (or before
        # that global exists).
        self.hidden_dim = hidden_dim
        self.embedding = nn.Embedding(vocab_size, embedding_dim)
        self.rnn = nn.RNN(embedding_dim, hidden_dim, batch_first=True)
        self.fc = nn.Linear(hidden_dim, vocab_size)

    def forward(self, x, hidden):
        """Return (logits, new_hidden) for input indices x of shape (batch, seq_len)."""
        embedded = self.embedding(x)              # (batch, seq_len, embedding_dim)
        out, hidden = self.rnn(embedded, hidden)  # (batch, seq_len, hidden_dim)
        out = self.fc(out[:, -1, :])              # logits from the last time step only
        return out, hidden

    def init_hidden(self, batch_size):
        """Return a zero hidden state shaped (num_layers=1, batch, hidden_dim)."""
        return torch.zeros(1, batch_size, self.hidden_dim)

# Hyperparameters
embedding_dim = 64
hidden_dim = 128
learning_rate = 0.01
epochs = 20
# Bug fix: `vocab_size` was used below but never defined anywhere in the
# script (NameError at runtime). Derive it from the vocabulary built above.
vocab_size = len(vocab)

# Initialize model, loss criterion, and optimizer.
model = RNNLanguageModel(vocab_size, embedding_dim, hidden_dim)
criterion = nn.CrossEntropyLoss()
optimizer = optim.Adam(model.parameters(), lr=learning_rate)

# Step 4: Training the Model


# Train for `epochs` full passes over the dataloader, reporting the mean
# batch loss after each epoch.
for epoch in range(epochs):
    total_loss = 0
    for inputs, targets in dataloader:
        # Fresh zero hidden state sized to this mini-batch.
        hidden = model.init_hidden(inputs.size(0))

        # Forward: logits for the word following each context window.
        outputs, hidden = model(inputs, hidden)
        loss = criterion(outputs, targets)

        # Backward + parameter update.
        optimizer.zero_grad()
        loss.backward()
        optimizer.step()

        total_loss += loss.item()

    print(f"Epoch {epoch+1}/{epochs}, Loss: {total_loss / len(dataloader):.4f}")

# Step 5: Text Generation


def generate_text(model, start_sequence, num_words):
    """Greedily extend *start_sequence* by *num_words* predicted words.

    The seed is tokenized with the same preprocessing as training data,
    fed through the model once, and then each argmax prediction is fed
    back in one token at a time while the hidden state is carried along.
    Raises KeyError if a seed word is not in the training vocabulary.
    """
    model.eval()
    seed_indices = [word_to_idx[w] for w in preprocess_text(start_sequence)]
    generated = start_sequence

    hidden = model.init_hidden(1)
    current = torch.tensor(seed_indices).unsqueeze(0)  # (1, seq_len) batch

    for _ in range(num_words):
        with torch.no_grad():
            logits, hidden = model(current, hidden)
        best_idx = torch.argmax(logits, dim=1).item()

        generated += " " + idx_to_word[best_idx]
        current = torch.tensor([[best_idx]])  # feed the prediction back in

    return generated

# Generate a 20-word continuation from the seed word and print it.
start_sequence = "Vijay"
num_words = 20
generated_text = generate_text(model, start_sequence, num_words)
print("\nGenerated Text:", generated_text, sep="\n")

You might also like