Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- import random
- import redis
- import json
- import pandas as pd
- from wtiproj01_client import *
- import time
- #for x in range(10):
- # time.sleep(0.01)
- # random = get_dummy_randomized_dict()
- # push_dict_to_queue(random, "q")
def get_DFUserRatedMovies(nrows, path="user_ratedmovies.dat"):
    """Load the user/movie rating columns from a tab-separated ratings file.

    Only the ``userID``, ``movieID`` and ``rating`` columns are read; the
    first line of the file is treated as the column header.

    Args:
        nrows: Maximum number of data rows to read (passed to
            ``pandas.read_csv``; ``None`` reads the whole file).
        path: Location of the ratings file. Defaults to
            ``"user_ratedmovies.dat"`` in the current working directory.

    Returns:
        A ``pandas.DataFrame`` with the three selected columns.
    """
    return pd.read_csv(
        path,
        header=0,
        delimiter='\t',
        usecols=['userID', 'movieID', 'rating'],
        nrows=nrows,
    )
def ptd_bug(row_as_dict, list_of_keys_of_non_ints):
    """Cast every value to ``int`` except those under the listed keys.

    The dict is modified in place and also returned, so callers may use
    either the return value or the original reference.

    NOTE(review): the name suggests this works around pandas'
    ``Series.to_dict()`` handing back floats for integer columns of a
    mixed-dtype row -- confirm with the author.

    Args:
        row_as_dict: Mapping of column name to value for one row.
        list_of_keys_of_non_ints: Keys whose values must be left untouched.

    Returns:
        The same ``row_as_dict`` object, with the remaining values converted
        via ``int()``.

    Raises:
        ValueError, TypeError: If a value that should be converted is not
            accepted by ``int()``.
    """
    keys_of_non_ints = set(list_of_keys_of_non_ints)
    # Only existing keys are reassigned, so the dict's size never changes
    # and iterating over it while updating is safe.
    for key, value in row_as_dict.items():
        if key not in keys_of_non_ints:
            row_as_dict[key] = int(value)
    return row_as_dict
if __name__ == "__main__":
    # Demo producer: read the first 100 ratings and push them one by one,
    # as dicts, onto the queue, pausing half a second between pushes.
    queue_name = 'q'
    list_of_keys_of_non_ints = ["rating"]
    DFUserRatedMovies = get_DFUserRatedMovies(100)
    row_iterator = DFUserRatedMovies.iterrows()

    # Diagnostic peek at what iterrows() yields. Uses the built-in next():
    # Python 3 generators have no .next() method.
    # NOTE(review): this consumes the first row, so it is printed but never
    # pushed to the queue -- kept as in the original; confirm it is intended.
    row_from_csv = next(row_iterator)
    print(row_from_csv)
    print(type(row_from_csv))

    # iterrows() yields (index, Series) pairs; only the Series is needed.
    for diagnostic_row_index, (_, row) in enumerate(row_iterator):
        row_as_dict = row.to_dict()
        row_as_dict["diagnostic-index"] = diagnostic_row_index
        row_as_dict = ptd_bug(row_as_dict, list_of_keys_of_non_ints)
        push_dict_to_queue(row_as_dict, queue_name)
        time.sleep(0.5)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement