Advertisement
Guest User

Untitled

a guest
Jul 16th, 2019
79
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 0.63 KB | None | 0 0
  1. from sklearn.model_selection import train_test_split
  2. from sklearn.feature_extraction.text import CountVectorizer
  3. from sklearn.naive_bayes import MultinomialNB
  4.  
  5. df['mixed_feature'] = df['Text'] +' '+ df['Topic']
  6.  
  7. X_train, X_test, y_train, y_test = train_test_split(df['mixed_feature'], df['Sentiment'], test_size=0.2)
  8.  
  9. count_vect = CountVectorizer()
  10. X_train_counts = count_vect.fit_transform(X_train)
  11. tfidf_transformer = TfidfTransformer()
  12. X_train_tfidf = tfidf_transformer.fit_transform(X_train_counts)
  13. clf = MultinomialNB().fit(X_train_tfidf, y_train)
  14.  
  15. clf.predict(count_vect.transform([df['Text][i]])) ## For whatever text is in row i
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement