Advertisement
Guest User

tfidf

a guest
Jun 29th, 2017
66
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Python 0.93 KB | None | 0 0
  1. # Create tf–idf matrix
  2. from sklearn.feature_extraction.text import TfidfVectorizer
  3. vectorizer = TfidfVectorizer(stop_words = 'english')
  4. X = vectorizer.fit_transform(corpus)
  5. X.todense()
  6. Out[37]:
  7. matrix([[ 0.89469821,  0.        ,  0.        ,  0.        ,  0.        ,
  8.           0.23513012,  0.        ,  0.        ,  0.        ,  0.29823274,
  9.           0.        ,  0.23513012],
  10.         [ 0.        ,  0.        ,  0.        ,  0.70710678,  0.        ,
  11.           0.        ,  0.70710678,  0.        ,  0.        ,  0.        ,
  12.           0.        ,  0.        ],
  13.         [ 0.        ,  0.35415727,  0.35415727,  0.        ,  0.        ,
  14.           0.55844332,  0.        ,  0.        ,  0.        ,  0.        ,
  15.           0.35415727,  0.55844332],
  16.         [ 0.        ,  0.        ,  0.        ,  0.38274272,  0.48546061,
  17.           0.        ,  0.38274272,  0.48546061,  0.48546061,  0.        ,
  18.           0.        ,  0.        ]])
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement