GamerBhai02

NLP Exp 6

Oct 9th, 2025
118
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Python 1.07 KB | Source Code | 0 0
  1. import nltk
  2. from nltk.corpus import wordnet, stopwords
  3. from nltk.tokenize import word_tokenize
  4. from nltk.stem import WordNetLemmatizer
  5. from nltk import pos_tag
  6.  
  # Download each NLTK data package the script requests, in the original order.
  for _resource in (
      'punkt',
      'averaged_perceptron_tagger',
      'wordnet',
      'omw-1.4',
      'stopwords',
      'averaged_perceptron_tagger_eng',
  ):
      nltk.download(_resource)

  # Single shared lemmatizer instance used by the rest of the script.
  lemmatizer = WordNetLemmatizer()
  15.  
  def get_wordnet_pos(nltk_pos_tag):
      """Translate an NLTK POS tag string into a WordNet POS constant.

      Tags starting with 'J' map to ``wordnet.ADJ``, 'V' to ``wordnet.VERB``
      and 'R' to ``wordnet.ADV``. Every other tag (including those starting
      with 'N') maps to ``wordnet.NOUN``.
      """
      prefix_table = (
          ('J', wordnet.ADJ),
          ('V', wordnet.VERB),
          ('R', wordnet.ADV),
      )
      for prefix, wordnet_pos in prefix_table:
          if nltk_pos_tag.startswith(prefix):
              return wordnet_pos
      # Noun tags and anything unrecognised share the same fallback.
      return wordnet.NOUN
  27.  
  # Sample input; the leading and trailing newlines are part of the text.
  text = "\nThe striped bats are hanging on their feet for best.\n"

  # Split the text into tokens, then tag every token with its part of speech.
  tokens = word_tokenize(text)
  pos_tags = pos_tag(tokens)

  # Lemmatize each token using the WordNet POS derived from its NLTK tag.
  lemmatized_tokens = [
      lemmatizer.lemmatize(word, get_wordnet_pos(tag))
      for word, tag in pos_tags
  ]

  # Each heading is followed by its data on the next line.
  print("Original Tokens and POS Tags:", pos_tags, sep="\n")
  print("\nLemmatized Tokens:", lemmatized_tokens, sep="\n")
Tags: nlp
Advertisement
Add Comment
Please, Sign In to add comment