Guest User

Untitled

a guest
Jan 9th, 2018
106
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 1.94 KB | None | 0 0
  1. import pymysql
  2. import time
  3. import datetime
  4. import pprint
  5. from collections import defaultdict
  6.  
  # Calendar dates the script works from: the current local date and the
  # day immediately before it.
  today = datetime.date.today()
  yesterday = today - datetime.timedelta(days=1)
  13.  
  def get_start_time():
      """Return the Unix timestamp of yesterday's local midnight.

      Reads the module-level ``yesterday`` date and converts its 00:00:00
      local-time instant to whole seconds since the epoch.
      """
      midnight = yesterday.timetuple()
      return int(time.mktime(midnight))
  17. #print(get_start_time())
  def get_end_time():
      """Return the Unix timestamp one second before today's local midnight.

      Reads the module-level ``today`` date; the result is the last whole
      second that still belongs to the previous day.
      """
      today_midnight = int(time.mktime(today.timetuple()))
      return today_midnight - 1
  21.  
  22. #print(get_end_time())
  23.  
  # Open the connection to the crawler database.
  # NOTE(review): host and credentials are hard-coded here; consider moving
  # them to configuration or environment variables.
  conn = pymysql.connect(
      host='192.168.0.13',
      user='root',
      password='root',
      database='copyright_for_crawler',
      use_unicode=True,
      charset='utf8',
  )
  cur = conn.cursor()

  # Feedback rows whose cw_timestamp lies between get_start_time() and
  # get_end_time() (BETWEEN is inclusive on both ends). The bounds are handed
  # to the driver as query parameters instead of being interpolated into the
  # SQL text with the % operator.
  sql_two = (
      "SELECT id,dsp_id,cw_url,cw_timestamp "
      "FROM copyright_for_crawler.kanjian_ddex_album_release_feedback "
      "WHERE cw_timestamp BETWEEN %s AND %s;"
  )
  cur.execute(sql_two, (get_start_time(), get_end_time()))
  results = cur.fetchall()

  # Maps row id -> {"cw_url": ..., "dsp_id": ...} for every fetched row that
  # has a non-empty cw_url. Only the first row seen for a given id is kept.
  # NOTE(review): the key is the feedback table's own `id` column, yet later
  # code matches it against kanjian_ddex_album.id -- confirm that is intended.
  album_dict = defaultdict(dict)

  for row in results:
      if not row[2]:
          # No cw_url recorded for this row; nothing to report.
          continue
      album_id = row[0]
      if album_id not in album_dict:
          album_dict[album_id]["cw_url"] = row[2]
          album_dict[album_id]["dsp_id"] = row[1]
  48.  
  49. #pprint.pprint(album_dict)
  50.  
  51.  
  52. #pprint.pprint(dict(album_dict))
  # Attach the album name to every collected entry whose id also appears in
  # the kanjian_ddex_album table; ids that were not collected are ignored.
  sql_re = "SELECT id,name FROM copyright_for_crawler.kanjian_ddex_album;"
  cur.execute(sql_re)
  results_re = cur.fetchall()
  for row in results_re:
      album_id_re, album_name = row[0], row[1]
      if album_id_re not in album_dict:
          continue
      album_dict[album_id_re]["name"] = album_name
  60.  
  61. #pprint.pprint(album_dict)
  62.  
  # Replace each entry's dsp_id with the matching name from kanjian_ddexdsp,
  # then print the finished report.
  sql_ree = "SELECT id, name FROM copyright_for_crawler.kanjian_ddexdsp;"
  try:
      cur.execute(sql_ree)
      results_ree = cur.fetchall()
  finally:
      # This is the last query the script issues, so release the cursor and
      # the connection whether or not it succeeded.
      cur.close()
      conn.close()

  # Build an id -> name table once instead of rescanning every album entry
  # for every DSP row. setdefault keeps the first name seen for a repeated id.
  dsp_names = {}
  for row in results_ree:
      dsp_names.setdefault(row[0], row[1])

  # Each entry is translated exactly once against its original dsp_id, so a
  # value that has already been replaced by a name can never be matched again
  # by a later DSP row.
  for entry in album_dict.values():
      dsp_id = entry["dsp_id"]
      if dsp_id in dsp_names:
          entry["dsp_id"] = dsp_names[dsp_id]

  pprint.pprint(album_dict)
Add Comment
Please, Sign In to add comment