Guest User

Untitled

a guest
Oct 23rd, 2018
82
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 0.76 KB | None | 0 0
  1. User Item
  2. Louis 1
  3. Louis 2
  4. Adam 1
  5. Adam 3
  6.  
  7. 1 2 3
  8. 1 0 1 1
  9. 2 1 0 0
  10. 3 1 0 0
  11.  
  12. import pandas as pd
  13. import numpy as np
  14. from scipy.sparse import csr_matrix, lil_matrix
  15. raw = pd.DataFrame(columns=['user','item'])
  16. raw['user']=['Louis','Louis','Adam','Adam']
  17. raw['item']=[1,2,1,3]
  18.  
  19. item_list = raw.item.unique().tolist()
  20. user_list = raw.user.unique().tolist()
  21. m = lil_matrix((len(raw.item.unique()),len(raw.item.unique())))
  22. for user in user_list:
  23. temp = raw.loc[np.in1d(raw['user'], user)].item
  24. if len(temp) > 1:
  25. for idx1, id1 in enumerate(temp[0:-1]):
  26. for id2 in temp[idx1+1:]:
  27. m[item_list.index(id1),item_list.index(id2)]+=1
  28. m[item_list.index(id2),item_list.index(id1)]+=1
  29. m.toarray()
Add Comment
Please, Sign In to add comment