Advertisement
LibbyK

Untitled

Feb 19th, 2020
107
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 0.64 KB | None | 0 0
  1. import pandas as pd
  2. #import numpy as np
  3.  
  4. data = pd.read_csv('/datasets/visits_eng.csv', sep='\t')
  5. data['local_time'] = (
  6. pd.to_datetime(data['date_time'], format='%Y-%m-%dT%H:%M:%S')
  7. - pd.Timedelta(hours=7)
  8. )
  9. #print(data.head)
  10.  
  11. #data["too_fast"] = data["time_spent"].apply(lambda x: True if x <60 else False)
  12. data["too_fast"] = data["time_spent"]<60
  13.  
  14.  
  15. #print(data["too_fast"].mean())
  16. too_fast_stat = pd.pivot_table(data, values='too_fast', index=['id'])
  17. #print(too_fast_stat.head())
  18. too_fast_stat.hist(bins = 30)
  19.  
  20. data["too_slow"] =data["time_spent"]>1000
  21. data.pivot_table(values='too_slow', index=['id']).hist(bins = 30 )
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement