# Editor Python Online - Contoh Source Code - Kode Program 1
# NLTK walkthrough, run top to bottom as a script: sentence/word
# tokenization, stop-word removal, stemming, lemmatization, POS tagging and
# parsing with a small context-free grammar.
import nltk
from nltk.corpus import stopwords
from nltk.stem import PorterStemmer, WordNetLemmatizer
from nltk.tokenize import sent_tokenize, word_tokenize

# Fetch the data packages before anything below tries to load them.
# NOTE(review): newer NLTK releases may ask for differently named packages;
# the LookupError raised at the point of use names the one to download.
for resource in (
    "punkt",
    "stopwords",
    "wordnet",
    "averaged_perceptron_tagger",
):
    nltk.download(resource)

# --- Tokenization ---------------------------------------------------------
# Adjacent literals are concatenated, so this is one single-line string.
text = (
    "Hello Mr. Smith, how are you doing today? The weather is "
    "great, and city is awesome. The sky is pinkish-blue. You shouldn't "
    "eat cardboard"
)

tokenized_text = sent_tokenize(text)
print(tokenized_text)

tokenized_word = word_tokenize(text)
print(tokenized_word)

# --- Stop-word removal ----------------------------------------------------
# A set gives constant-time membership tests inside the filter below.
stop_words = set(stopwords.words("english"))

# The filter works on the word tokens produced above.
tokenized_sent = tokenized_word
filtered_sent = [w for w in tokenized_sent if w not in stop_words]
print("Tokenized Sentence:", tokenized_sent)
print("Filtered Sentence:", filtered_sent)

# --- Stemming -------------------------------------------------------------
ps = PorterStemmer()
stemmed_words = [ps.stem(w) for w in filtered_sent]
print("Filtered Sentence:", filtered_sent)
print("Stemmed Sentence:", stemmed_words)

# --- Lexicon normalization: stemming vs. lemmatization ---------------------
lem = WordNetLemmatizer()
word = "flying"
# "v" tells the lemmatizer to treat the word as a verb.
print("Lemmatized Word:", lem.lemmatize(word, "v"))
print("Stemmed Word:", ps.stem(word))

# --- Part-of-speech tagging -------------------------------------------------
sent = "Albert Einstein was born in Ulm, Germany in 1879."
tokens = nltk.word_tokenize(sent)
print(tokens)
print(nltk.pos_tag(tokens))

# --- Parsing with a context-free grammar ------------------------------------
groucho_grammar = nltk.CFG.fromstring("""
S -> NP VP
PP -> P NP
NP -> Det N | Det N PP | 'I'
VP -> V NP | VP PP
Det -> 'an' | 'my'
N -> 'elephant' | 'pajamas'
V -> 'shot'
P -> 'in'
""")

# The parser can only handle words that appear as terminals in the grammar,
# so it is given a sentence built from that vocabulary instead of `text`.
groucho_sent = ["I", "shot", "an", "elephant", "in", "my", "pajamas"]

parser = nltk.ChartParser(groucho_grammar)
for tree in parser.parse(groucho_sent):
    print(tree)
    # Opens a GUI window for the tree; needs a display to be available.
    tree.draw()