Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- >>> from nltk.corpus import wordnet as wn
- >>> from nltk.stem import PorterStemmer
- >>> from difflib import get_close_matches as gcm
- >>> from itertools import chain
- >>> dictionary = set(chain(*[i.lemma_names() for i in wn.all_synsets()]))
- >>> len(dictionary)
- 148730
- >>> porter = PorterStemmer()
- >>> stemmed = porter.stem('force')
- >>> gcm(stemmed, dictionary)
- [u'force', u'formic', u'forced']
- >>> gcm(stemmed, dictionary)[0]
- u'force'
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement