Guest User

Untitled

a guest
Jan 23rd, 2018
72
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 1.01 KB | None | 0 0
  1. from bs4 import BeautifulSoup
  2. from wordcloud import WordCloud, STOPWORDS, ImageColorGenerator
  3. from more_words import words
  4. from PIL import Image
  5. import numpy as np
  6.  
  7. msg_file_name = "175.html"
  8. u1 = u"A***** B*****"
  9. u2 = u"H***** B*******"
  10.  
  11. msg_file = open(msg_file_name)
  12.  
  13. soup = BeautifulSoup(msg_file, "html.parser")
  14.  
  15. u1_msgs = []
  16. u2_msgs = []
  17.  
  18. msg = soup.find("p")
  19.  
  20. while True:
  21. if msg == None:
  22. break
  23. name = msg.find_previous("div", class_="message").span.text
  24.  
  25. if u1 == name:
  26. u1_msgs.append(msg.text)
  27. elif u2 == name:
  28. u2_msgs.append(msg.text)
  29.  
  30. msg = msg.find_next("p")
  31.  
  32. stopwords = set(STOPWORDS)
  33. mask = np.array(Image.open("example.jpg"))
  34. image_colors = ImageColorGenerator(mask)
  35.  
  36. for x in words:
  37. stopwords.add(x)
  38. #stopwords.add("said")
  39.  
  40. wc = WordCloud(background_color="white", mask=mask, stopwords=stopwords)
  41. wc.generate(" ".join(u1_msgs))
  42. wc.recolor(color_func=image_colors)
  43. wc.to_file("u1.png")
  44.  
  45. wc.generate(" ".join(u2_msgs))
  46. wc.recolor(color_func=image_colors)
  47. wc.to_file("u2.png")
Add Comment
Please, Sign In to add comment