Guest User

Untitled

a guest
Dec 19th, 2018
107
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 0.60 KB | None | 0 0
  1. import numpy as np
  2. import pandas as pd
  3. from sklearn.naive_bayes import BernoulliNB
  4. from sklearn.naive_bayes import MultinomialNB
  5. from sklearn.feature_extraction.text import CountVectorizer
  6.  
  7. count_vect = CountVectorizer()
  8. values = []
  9. results = []
  10. tsv = pd.read_table("data.tsv").values.tolist()
  11. for row in tsv:
  12. values.append(row[-1])
  13. results.append(1 if row[1] == 'p' else 0)
  14. X = count_vect.fit_transform(values)
  15. y = np.array(results)
  16. b_clf = BernoulliNB()
  17. b_clf.fit(X, y)
  18. print(b_clf.score(X, y))
  19. #=> 0.7609423570921667
  20. m_clf = MultinomialNB()
  21. m_clf.fit(X, y)
  22. print(m_clf.score(X, y))
  23. #=> 0.7551450818115486
Add Comment
Please, Sign In to add comment