Guest User

Untitled

a guest
Oct 19th, 2017
82
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 1.24 KB | None | 0 0
  1. def word_count(self,List):
  2. > dictionary_text={}
  3. > for word in List:
  4. > if word in dictionary_text:
  5. > dictionary_text[word]+=1
  6. > else:
  7. > dictionary_text[word]=1
  8.  
  9. >
  10.  
  11. > > def text_process(self,string):
  12. > > from nltk.stem import WordNetLemmatizer
  13. > > from nltk.tokenize import word_tokenize
  14. > > lemmatizer = WordNetLemmatizer()
  15. > > New_text=word_tokenize(string)
  16. > > New_text_lem=[lemmatizer.lemmatize(words) for words in New_text]
  17. > > dictionary_text=self.word_count(New_text_lem)
  18. > > return dictionary_text
  19.  
  20. def main(self,Text):
  21. text_1=self.text_process(Text[0])
  22. text_2=self.text_process(Text[1])
  23. text_3=self.text_process(Text[2])
  24. final_dic={}
  25. for key in set(text_1.keys() + text_2.keys() + text_3.keys()):
  26. try:
  27. final_dic.setdefault(key,[]).append(text_1[key])
  28. except KeyError:
  29. pass
  30.  
  31. try:
  32. final_dic.setdefault(key,[]).append(text_2[key])
  33. except KeyError:
  34. pass
  35.  
  36. try:
  37. final_dic.setdefault(key,[]).append(text_3[key])
  38. except KeyError:
  39. pass
Add Comment
Please, Sign In to add comment