EX 7: Machine Translation using Encoder-Decoder model

This exercise implements machine translation with an Encoder-Decoder (sequence-to-sequence) model in TensorFlow/Keras. The program below defines the hyperparameters, a small sample vocabulary, dummy training data, the model architecture, the training step, and functions for encoding and decoding sentences; it demonstrates translating the input sentence "I am learning" into French as "J'apprends".

Program:

import tensorflow as tf
from tensorflow.keras.models import Model
from tensorflow.keras.layers import Input, LSTM, Dense
import numpy as np

# ------------------- HYPERPARAMETERS -------------------
latent_dim = 256             # Size of the LSTM hidden state
num_encoder_tokens = 5       # Small vocab for demo purposes
num_decoder_tokens = 5
max_encoder_seq_length = 5   # Small sequence length
max_decoder_seq_length = 5

# ------------------- SAMPLE VOCABULARY -------------------
input_token_index = {'I': 0, 'am': 1, 'learning': 2, '<PAD>': 3}
target_token_index = {'<START>': 0, "J'apprends": 1, '<END>': 2, '<PAD>': 3}
reverse_target_token_index = {0: '<START>', 1: "J'apprends", 2: '<END>', 3: '<PAD>'}

# ------------------- DUMMY DATA (Simple Training Example) -------------------
encoder_input_data = np.zeros((1, max_encoder_seq_length, num_encoder_tokens))
decoder_input_data = np.zeros((1, max_decoder_seq_length, num_decoder_tokens))
decoder_target_data = np.zeros((1, max_decoder_seq_length, num_decoder_tokens))

# Example input: "I am learning"
encoder_input_data[0, 0, 0] = 1   # "I"
encoder_input_data[0, 1, 1] = 1   # "am"
encoder_input_data[0, 2, 2] = 1   # "learning"

# Example output: "<START> J'apprends <END>"
decoder_input_data[0, 0, 0] = 1    # "<START>"
decoder_target_data[0, 0, 1] = 1   # "J'apprends"
decoder_target_data[0, 1, 2] = 1   # "<END>"
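Note: the decoder input and target above follow the teacher-forcing convention: during training the decoder is fed the target sequence starting from <START>, while the training target is the same sequence shifted one step earlier. A minimal sketch (not part of the program above, reusing target_token_index) of how a longer target pair would be vectorised:

# Sketch only: teacher-forcing vectorisation for a hypothetical target sequence
target_tokens = [0, 1, 2]   # "<START>", "J'apprends", "<END>" from target_token_index
for t, tok in enumerate(target_tokens):
    decoder_input_data[0, t, tok] = 1.0           # decoder input starts at <START>
    if t > 0:
        decoder_target_data[0, t - 1, tok] = 1.0  # targets are the same tokens, one step ahead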

# ------------------- MODEL ARCHITECTURE -------------------
# Encoder
encoder_inputs = Input(shape=(None, num_encoder_tokens))
encoder_lstm = LSTM(latent_dim, return_state=True)
_, state_h, state_c = encoder_lstm(encoder_inputs)
encoder_states = [state_h, state_c]

# Decoder
decoder_inputs = Input(shape=(None, num_decoder_tokens))
decoder_lstm = LSTM(latent_dim, return_sequences=True, return_state=True)
decoder_outputs, _, _ = decoder_lstm(decoder_inputs, initial_state=encoder_states)
decoder_dense = Dense(num_decoder_tokens, activation='softmax')
decoder_outputs = decoder_dense(decoder_outputs)

# Full training model
model = Model([encoder_inputs, decoder_inputs], decoder_outputs)
model.compile(optimizer='rmsprop', loss='categorical_crossentropy')
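Optionally (not in the original listing), the assembled graph can be inspected before training; the summary lists the two Input layers, the encoder LSTM, the decoder LSTM and the softmax Dense output layer with their shapes and parameter counts.

model.summary()   # optional: print layer shapes and parameter counts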

# ------------------- TRAINING -------------------
model.fit([encoder_input_data, decoder_input_data], decoder_target_data,
          batch_size=1, epochs=10)
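If the trained weights are needed in a later session (optional; the file name below is only an illustration), recent Keras versions allow saving and reloading the full model:

model.save('seq2seq_demo.keras')                          # hypothetical file name
model = tf.keras.models.load_model('seq2seq_demo.keras')

The inference models below are built from the same in-memory layers, so saving is only required when the weights must survive across runs.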

# ------------------- INFERENCE MODE -------------------
# Encoder model for inference
encoder_model = Model(encoder_inputs, encoder_states)

# Decoder model for inference
decoder_state_input_h = Input(shape=(latent_dim,))
decoder_state_input_c = Input(shape=(latent_dim,))
decoder_states_inputs = [decoder_state_input_h, decoder_state_input_c]
decoder_outputs, state_h, state_c = decoder_lstm(
    decoder_inputs, initial_state=decoder_states_inputs)
decoder_states = [state_h, state_c]
decoder_outputs = decoder_dense(decoder_outputs)
decoder_model = Model([decoder_inputs] + decoder_states_inputs,
                      [decoder_outputs] + decoder_states)

# ------------------- ENCODING FUNCTION -------------------
def encode_input_sentence(sentence):
    """Encodes an input sentence into a padded sequence of one-hot tokens."""
    tokens = [input_token_index.get(word, 3) for word in sentence.split()]  # Default to <PAD>
    encoder_input = np.zeros((1, max_encoder_seq_length, num_encoder_tokens))
    for t, token in enumerate(tokens):
        encoder_input[0, t, token] = 1.0
    return encoder_input
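A quick sanity check (not part of the original program): the array returned for the sample sentence has shape (1, max_encoder_seq_length, num_encoder_tokens), and its first three time steps are one-hot vectors for "I", "am" and "learning".

vec = encode_input_sentence("I am learning")
print(vec.shape)                    # (1, 5, 5)
print(vec[0, :3].argmax(axis=-1))   # [0 1 2]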

# ------------------- DECODING FUNCTION -------------------
def decode_sequence(input_seq):
    """Generates the output sentence word-by-word using the decoder."""
    states_value = encoder_model.predict(input_seq)

    # Start with the <START> token
    target_seq = np.zeros((1, 1, num_decoder_tokens))
    target_seq[0, 0, target_token_index['<START>']] = 1.0

    decoded_sentence = ''
    stop_condition = False
    while not stop_condition:
        output_tokens, h, c = decoder_model.predict([target_seq] + states_value)
        sampled_token_index = np.argmax(output_tokens[0, -1, :])
        sampled_word = reverse_target_token_index.get(sampled_token_index, '<UNK>')

        if sampled_word == '<END>' or len(decoded_sentence.split()) > max_decoder_seq_length:
            stop_condition = True
        else:
            decoded_sentence += ' ' + sampled_word

        # Update the target sequence and states
        target_seq = np.zeros((1, 1, num_decoder_tokens))
        target_seq[0, 0, sampled_token_index] = 1.0
        states_value = [h, c]

    return decoded_sentence.strip()

# ------------------- TEST TRANSLATION -------------------
input_sentence = "I am learning"
input_seq = encode_input_sentence(input_sentence)
translated_sentence = decode_sequence(input_seq)
print(f"Input: {input_sentence}")
print(f"Translated: {translated_sentence}")

Output:
