Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- import pandas
def build_dataframe(user_rates_with_movies):
    """Flatten user ratings into a frame with one 0/1 indicator column per genre.

    Args:
        user_rates_with_movies: pandas DataFrame providing the columns
            'userID', 'movieID', 'rating' and 'genres'. Each 'genres' cell
            must be an iterable of genre names (strings, since each name is
            concatenated onto the 'genre-' column prefix).

    Returns:
        A pandas DataFrame with the columns 'userID', 'movieID', 'rating'
        followed by one 'genre-<name>' column per distinct genre found in
        the input. Each genre column holds the integer 1 when the row's
        'genres' contains that genre and 0 otherwise. Rows keep the input
        order and are indexed 0..n-1.
    """
    # Sort the distinct genres so the column order is reproducible; plain
    # set iteration order changes between runs under string hash randomisation.
    genres = sorted(
        {genre for cell in user_rates_with_movies['genres'] for genre in cell}
    )
    columns = ['userID', 'movieID', 'rating'] + ['genre-' + genre for genre in genres]

    records = user_rates_with_movies[
        ['userID', 'movieID', 'rating', 'genres']
    ].to_dict(orient='records')

    # int(...) turns the membership test into a real 0/1 flag. The previous
    # `(genre in ...) if int(1) else int(0)` always evaluated to the boolean
    # itself because its condition was the constant 1.
    rows = [
        [record['userID'], record['movieID'], record['rating']]
        + [int(genre in record['genres']) for genre in genres]
        for record in records
    ]
    return pandas.DataFrame(rows, columns=columns)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement