Guest User

Untitled

a guest
Feb 22nd, 2018
89
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 0.79 KB | None | 0 0
  1. model_ug_dmm = Doc2Vec.load('d2v_model_ug_dmm.doc2vec')
  2. model_ug_dmm.delete_temporary_training_data(keep_doctags_vectors=True, keep_inference=True)
  3.  
  4. def get_w2v_ugdbowdmm(tweet, size):
  5. vec = np.zeros(size).reshape((1, size))
  6. count = 0.
  7. for word in tweet.split():
  8. try:
  9. vec += np.append(model_ug_dbow[word],model_ug_dmm[word]).reshape((1, size))
  10. count += 1.
  11. except KeyError:
  12. continue
  13. if count != 0:
  14. vec /= count
  15. return vec
  16.  
  17. train_vecs_w2v_dbowdmm = np.concatenate([get_w2v_ugdbowdmm(z, 200) for z in x_train])
  18. validation_vecs_w2v_dbowdmm = np.concatenate([get_w2v_ugdbowdmm(z, 200) for z in x_validation])
  19.  
  20. clf = LogisticRegression()
  21. clf.fit(train_vecs_w2v_dbowdmm, y_train)
  22. clf.score(validation_vecs_w2v_dbowdmm, y_validation)
Add Comment
Please sign in to add a comment.