NLP Exp 4
NLP Exp 4
ipynb - Colab
import nltk
from nltk.tokenize import word_tokenize
from nltk.stem import PorterStemmer, WordNetLemmatizer
from nltk.corpus import wordnet
def get_wordnet_pos(treebank_tag: str):
    """Convert a Penn Treebank POS tag to the matching WordNet POS constant.

    Only the leading letter of the tag is examined, so every tag in a family
    (for example ``VBG`` and ``VBP``) maps to the same WordNet category.

    Args:
        treebank_tag: POS tag string such as ``"NNS"`` or ``"VBG"``.

    Returns:
        ``wordnet.ADJ``, ``wordnet.VERB``, ``wordnet.NOUN`` or ``wordnet.ADV``
        for tags starting with ``J``, ``V``, ``N`` or ``R`` respectively, and
        ``None`` for every other tag (e.g. ``DT``, ``IN``, punctuation).
    """
    if treebank_tag.startswith('J'):
        return wordnet.ADJ
    if treebank_tag.startswith('V'):
        return wordnet.VERB
    if treebank_tag.startswith('N'):
        return wordnet.NOUN
    if treebank_tag.startswith('R'):
        return wordnet.ADV
    # No WordNet equivalent; the caller decides how to handle the token.
    return None
# Example text
text = "The dogs are running faster than the better-trained dog."

# NOTE: word_tokenize, nltk.pos_tag and WordNetLemmatizer rely on NLTK data
# packages that must already be downloaded (via nltk.download) before this runs.

# Split the sentence into tokens and attach a Penn Treebank POS tag to each.
tokens = word_tokenize(text)
tagged_tokens = nltk.pos_tag(tokens)

stemmer = PorterStemmer()
lemmatizer = WordNetLemmatizer()

for token, tag in tagged_tokens:
    wordnet_pos = get_wordnet_pos(tag)
    if wordnet_pos is None:
        # Tags with no WordNet category (determiners, prepositions,
        # punctuation, ...) are passed through unchanged.
        lemmatized = token
    else:
        lemmatized = lemmatizer.lemmatize(token, pos=wordnet_pos)
    stemmed = stemmer.stem(token)

    # Print results
    print(f"Token: {token}")
    print(f"POS Tag: {tag}")
    print(f"Lemmatized: {lemmatized}")
    print(f"Stemmed: {stemmed}")
    print()
Token: The
POS Tag: DT
Lemmatized: The
Stemmed: the
Token: dogs
POS Tag: NNS
Lemmatized: dog
Stemmed: dog
Token: are
POS Tag: VBP
Lemmatized: be
Stemmed: are
Token: running
POS Tag: VBG
Lemmatized: run
Stemmed: run
Token: faster
POS Tag: RBR
Lemmatized: faster
Stemmed: faster
Token: than
POS Tag: IN
Lemmatized: than
https://colab.research.google.com/drive/13Y1y7SMqzJNqb3cI_X29q0jPLciyaBBz#scrollTo=Wm2zkrGxLiuO&printMode=true 1/2
8/27/24, 3:04 PM Untitled5.ipynb - Colab
Stemmed: than
Token: the
POS Tag: DT
Lemmatized: the
Stemmed: the
Token: better-trained
POS Tag: JJ
Lemmatized: better-trained
Stemmed: better-train
Token: dog
POS Tag: NN
Lemmatized: dog
Stemmed: dog
Token: .
POS Tag: .
Lemmatized: .
Stemmed: .
https://colab.research.google.com/drive/13Y1y7SMqzJNqb3cI_X29q0jPLciyaBBz#scrollTo=Wm2zkrGxLiuO&printMode=true 2/2