*********************Practical – 1 Write a program to implement tokenization.************
import nltk
nltk.download('punkt')
doc= "An eight-time Olympic gold medalist, Bolt is the only sprinter to win Olympic
100 m and 200 m titles at three consecutive Olympics (2008, 2012, and 2016). He
also won two 4 × 100 relay gold medals."
tokens= nltk.word_tokenize(doc)
print(tokens)
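The same document can also be split at sentence level; a small sketch using NLTK's sent_tokenize (an addition, not part of the original listing):
from nltk.tokenize import sent_tokenize
# Split the same document into sentences rather than words.
sentences = sent_tokenize(doc)
print(sentences)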
*********************Practical – 2 Write a program to implement stemming and lemmatization.************
import nltk
from nltk.stem import WordNetLemmatizer
from nltk.stem import PorterStemmer
from nltk.tokenize import word_tokenize
nltk.download('wordnet')
ps = PorterStemmer()
words= ["program", "programs", "programmer", "programming", "programmers"]
for w in words:
print(w, ":" , ps.stem(w))
lemmatizer = WordNetLemmatizer()
print("rocks:", lemmatizer.lemmatize("rocks"))
*********************Practical – 3 Write a program to implement an n-gram model and text generation.************
import nltk
import markovify
import os
from collections import Counter
nltk.download('punkt')
content = []
for filename in os.listdir("trigram/"):
    with open(f'trigram/{filename}') as f:
        content.append(f.read())
corpus = []
for item in content:
    corpus.extend(
        [word.lower() for word in nltk.word_tokenize(item) if any(c.isalpha() for c in word)])
ngrams = Counter(nltk.ngrams(corpus, 3))
for ngram, freq in ngrams.most_common(10):
    print(f'{freq}:{ngram}')
with open('Usain.txt') as f:
    text = f.read()
model = markovify.Text(text)
sent = model.make_sentence()
print(sent)
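make_sentence() returns None when markovify cannot build a sentence that differs enough from the corpus; a small defensive sketch (an addition, not part of the original listing):
# Retry more times and fall back to a short sentence if generation fails.
sent = model.make_sentence(tries=100)
if sent is None:
    sent = model.make_short_sentence(140)
print(sent)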
*********************Practical – 4 Write a program to implement part-of-speech tagging using a Hidden Markov Model.************
import pandas as pd
from tabulate import tabulate

def pretty_print_probs(distribs):
    print(distribs)
    rows = set()
    cols = set()
    for val in distribs.keys():
        temp = val.split("|")
        rows.add(temp[0])
        cols.add(temp[1])
    rows = list(rows)
    cols = list(cols)
    df = []
    for i in range(len(rows)):
        temp = []
        for j in range(len(cols)):
            temp.append(distribs[rows[i] + "|" + cols[j]])
        df.append(temp)
    l = pd.Index(rows, name="rows")
    C = pd.Index(cols, name="cols")
    df = pd.DataFrame(data=df, index=l, columns=C)
    print(tabulate(df, headers="keys", tablefmt="psql"))
def initializeSequences(_obs):
    # Generate the list of candidate tag sequences
    seqlen = len(_obs)
    seqs = generate_sequence(states, seqlen)
    # Score each candidate sequence against the observations
    seq_scores = score_sequences(seqs, initial_probs, transition_probs,
                                 emission_probs, _obs)
    return (seqlen, seqs, seq_scores)
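# NOTE: generate_sequence and score_sequences are not defined in the original
# listing; the following is a minimal brute-force sketch consistent with how
# initializeSequences calls them and with the "next|previous" / "word|tag"
# key format of the probability tables below.
import itertools

def generate_sequence(_states, _length):
    # Enumerate every possible tag sequence of the given length.
    return [list(seq) for seq in itertools.product(_states, repeat=_length)]

def score_sequences(_seqs, _initial, _transitions, _emissions, _obs):
    # Score = P(tag1) * P(word1|tag1) * prod_i P(tag_i|tag_{i-1}) * P(word_i|tag_i)
    scores = []
    for seq in _seqs:
        score = _initial[seq[0]] * _emissions[_obs[0] + "|" + seq[0]]
        for i in range(1, len(seq)):
            score *= _transitions[seq[i] + "|" + seq[i - 1]]
            score *= _emissions[_obs[i] + "|" + seq[i]]
        scores.append(score)
    return scores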
states = ["Noun","Verb","Determiner"]
initial_probs = {"Noun":0.9, "Verb":0.05, "Determiner":0.05}
transition_probs = {"Noun|Noun":0.2, "Noun|Verb": 0.1, "Noun|Determiner":0.8,
"Verb|Noun":0.8,"Verb|Verb":0.1, "Verb|Determiner":0.1, "Determiner|Noun":0.1,
"Determiner|Verb":0.8, "Determiner|Determiner":0.1}
emission_probs = {"Vimal|Noun":0.9,"taught|Noun":0.05, "the|Noun": 0.05,"class|
Noun":0.9, "Vimal|Verb":0.05, "taught|Verb":0.9, "the|Verb":0.05, "class|
Verb":0.05, "Vimal|Determiner":0.05, "taught|Determiner":0.05, "the|
Determiner":0.9, "class|Determiner":0.05}
print("Initial Distributions")
print(initial_probs)
print("Transition Probabilities")
pretty_print_probs(transition_probs)
print("Emission Probabilities")
pretty_print_probs(emission_probs)
obs = ["Vimal","taught","the",'class']
print("Scores")
sequence_length, sequences, sequence_scores = initializeSequences(obs)
for i in range(len(sequences)):
print("Sequence:%-60s Score:%0.6f" % (sequences[i],sequence_scores[i]))
print("Best Sequence")
print(sequences[sequence_scores.index(max(sequence_scores))], max(sequence_scores))
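Brute-force scoring enumerates |states|^n sequences (81 here); a Viterbi-style dynamic-programming sketch over the same probability tables (an addition, not part of the original listing):
def viterbi(_obs, _states, _initial, _transitions, _emissions):
    # best[t][s] = (probability of the best path ending in state s at step t, backpointer)
    best = [{s: (_initial[s] * _emissions[_obs[0] + "|" + s], None) for s in _states}]
    for t in range(1, len(_obs)):
        layer = {}
        for s in _states:
            prob, prev = max(
                (best[t - 1][p][0] * _transitions[s + "|" + p] * _emissions[_obs[t] + "|" + s], p)
                for p in _states)
            layer[s] = (prob, prev)
        best.append(layer)
    # Backtrack from the most probable final state.
    state, (prob, _) = max(best[-1].items(), key=lambda kv: kv[1][0])
    path = [state]
    for t in range(len(_obs) - 1, 0, -1):
        state = best[t][state][1]
        path.append(state)
    return list(reversed(path)), prob

print(viterbi(obs, states, initial_probs, transition_probs, emission_probs))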
*********************Practical – 5 Write a program to implement chunking of a text.************
import nltk
nltk.download('punkt')
nltk.download('averaged_perceptron_tagger')
from nltk import pos_tag, word_tokenize, RegexpParser
sample_text = "Usain Bolt is the only sprinter to win Olympic 100 m and 200 m
titles at three consecutive Olympics (2008, 2012, and 2016)."
tagged = pos_tag(word_tokenize(sample_text))
print(tagged)
grammar= r"""
NP: {<DT>?<JJ>*<NN>} #To e xtract Noun Phroscs
P: {<IN>} #To extract Verbs
PP: {<p> <NP>} #To extract Prc1>0s1t1onal Phrases
VP: {<V> <NP|PP>*} #To extract Verb Phrases
"""
chunker = RegexpParser(grammar)
output = chunker.parse(tagged)
print(" After Extracting\n", output)
output.draw()
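To work with the chunks programmatically rather than through the drawing window, the subtrees of the parse can be filtered by label; a small sketch (an addition, not part of the original listing):
# Print just the noun-phrase chunks as plain strings.
for subtree in output.subtrees(filter=lambda t: t.label() == 'NP'):
    print(" ".join(word for word, tag in subtree.leaves()))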
*********************Practical – 6 Write a program to implement a dependency parsing of a text.************
import spacy
from spacy import displacy
nlp = spacy.load("en_core_web_sm")
sentence = "Usain Bolt is the fastest sprinter in the world."
doc = nlp(sentence)
print("{:<15} | {:<8} | {:<15} | {:<20}".format('Token', 'Relation', 'Head', 'Children'))
print("-" * 70)
for token in doc:
    print("{:<15} | {:<8} | {:<15} | {:<20}".format(
        str(token.text), str(token.dep_), str(token.head.text),
        str([child for child in token.children])))
displacy.render(doc, style='dep', jupyter=True, options={'distance': 120})
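jupyter=True only renders inside a notebook; when the script is run from the command line, the markup can be saved to a file instead (a sketch, not part of the original listing; the output file name is chosen here):
# Outside Jupyter: get the SVG markup and save it to disk.
svg = displacy.render(doc, style='dep', jupyter=False, options={'distance': 120})
with open('dependency_parse.svg', 'w', encoding='utf-8') as f:  # file name chosen for this example
    f.write(svg)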
*********************Practical – 7 Write a program to implement named entity recognition.************
import spacy
nlp = spacy.load("en_core_web_sm")
sentence = "World's Fastest sprinter Usain Bolt has the record for 100m in 9.58s"
doc = nlp(sentence)
for ent in doc.ents:
    print(ent.text, ent.start_char, ent.end_char, ent.label_)
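The label codes can be expanded into readable descriptions with spacy.explain (an addition, not part of the original listing):
# Show what each entity label means, e.g. PERSON, QUANTITY, TIME.
for ent in doc.ents:
    print(ent.text, "->", ent.label_, "=", spacy.explain(ent.label_))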
*********************Practical – 8 Write a program to implement text summarization.************
import nltk
from nltk.corpus import stopwords
from nltk.cluster.util import cosine_distance
import numpy as np
import networkx as nx
nltk.download('stopwords')
def read_article(file_name):
    file = open(file_name, "r")
    filedata = file.readlines()
    article = filedata[0].split(". ")
    sentences = []
    for sentence in article:
        print(sentence)
        # str.replace treats the pattern as a literal string, not a regex
        sentences.append(sentence.replace("[^a-zA-Z]", " ").split(" "))
    sentences.pop()
    return sentences
def build_similarity_matrix(sentences, stop_words):
    similarity_matrix = np.zeros((len(sentences), len(sentences)))
    for idx1 in range(len(sentences)):
        for idx2 in range(len(sentences)):
            if idx1 == idx2:
                continue
            similarity_matrix[idx1][idx2] = sentence_similarity(
                sentences[idx1], sentences[idx2], stop_words)
    return similarity_matrix
def sentence_similarity(sent1, sent2, stopwords=None):
    if stopwords is None:
        stopwords = []
    sent1 = [w.lower() for w in sent1]
    sent2 = [w.lower() for w in sent2]
    all_words = list(set(sent1 + sent2))
    vector1 = [0] * len(all_words)
    vector2 = [0] * len(all_words)
    for w in sent1:
        if w in stopwords:
            continue
        vector1[all_words.index(w)] += 1
    for w in sent2:
        if w in stopwords:
            continue
        vector2[all_words.index(w)] += 1
    return 1 - cosine_distance(vector1, vector2)
def generate_summary(file_name, top_n=5):
    stop_words = stopwords.words('english')
    summarize_text = []
    sentences = read_article(file_name)
    sentence_similarity_matrix = build_similarity_matrix(sentences, stop_words)
    sentence_similarity_graph = nx.from_numpy_array(sentence_similarity_matrix)
    scores = nx.pagerank(sentence_similarity_graph)
    ranked_sentence = sorted(((scores[i], s) for i, s in enumerate(sentences)), reverse=True)
    print("Indexes of top ranked_sentence order are", ranked_sentence)
    for i in range(top_n):
        summarize_text.append(" ".join(ranked_sentence[i][1]))
    print("Summarize Text: \n", " . ".join(summarize_text))

generate_summary('Usain.txt', 2)