Advertisement
Guest User

Untitled

a guest
Mar 18th, 2019
79
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Python 0.80 KB | None | 0 0
  1. import pandas
  2.  
  3.  
  4. def build_dataframe(user_rates_with_movies):
  5.     genres_list = list(set([item for sublist in user_rates_with_movies['genres'].tolist() for item in sublist]))
  6.     json_columns_list = list(['userID', 'movieID', 'rating'])
  7.     json_columns_list.extend(list(('genre-' + item) for item in genres_list))
  8.     elements = {}
  9.     iterator = 0
  10.  
  11.     for row in user_rates_with_movies[['userID', 'movieID', 'rating', 'genres']].to_dict(orient='records'):
  12.         element = [row['userID'], row['movieID'], row['rating']]
  13.  
  14.         for genre in genres_list:
  15.             element.extend([(genre in row['genres']) if int(1) else int(0)])
  16.  
  17.         elements[iterator] = element
  18.         iterator = iterator + 1
  19.  
  20.     return pandas.DataFrame.from_dict(elements, orient='index', columns=json_columns_list)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement