Advertisement
Guest User

Untitled

a guest
Apr 29th, 2017
71
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 0.81 KB | None | 0 0
  # Default location of the CTA monthly bus-ridership export read by getdata().
  CTA_RIDERSHIP_CSV = 'data/CTA_-_Ridership_-_Bus_Routes_-_Monthly_Day-Type_Averages___Totals.csv'

  # Columns kept from the raw export; everything else in the file is dropped.
  RIDERSHIP_COLUMNS = [
      'route',
      'routename',
      'Month_Beginning',
      'Avg_Weekday_Rides',
      'Avg_Saturday_Rides',
      'Avg_Sunday-Holiday_Rides',
      'MonthTotal',
  ]

  # Inclusive range of years that can be selected individually.
  FIRST_YEAR = 2001
  LAST_YEAR = 2015


  def getdata(year, path=CTA_RIDERSHIP_CSV):
      """Load CTA bus ridership rows, optionally restricted to a single year.

      Args:
          year: Year to select, as a number or a numeric string. When it lies
              in the inclusive range 2001-2015, only rows whose
              ``Month_Beginning`` falls in that year are returned and a
              ``month`` column is added. Any other value returns every row
              up to and including 2015, without a ``month`` column.
          path: File path or file-like object handed to ``pd.read_csv``.
              Defaults to the ridership CSV under ``data/``.

      Returns:
          A DataFrame indexed by ``('route', 'routename')`` holding the
          columns in ``RIDERSHIP_COLUMNS`` (minus the two index columns) plus
          ``year``, and ``month`` when a single year was selected.

      Raises:
          ValueError: If ``year`` is a string that is not an integer literal.
          KeyError: If the CSV lacks one of the expected columns.
      """
      # Convert string years up front so the range check below compares
      # numbers; comparing a str with an int raises TypeError on Python 3.
      if isinstance(year, str):
          year = int(year)

      df = pd.read_csv(path)[RIDERSHIP_COLUMNS].copy()

      # Parse the month-start dates once and reuse them for year and month.
      month_start = pd.DatetimeIndex(df['Month_Beginning'])
      df['year'] = month_start.year

      if FIRST_YEAR <= year <= LAST_YEAR:
          in_year = (df['year'] == int(year)).to_numpy()
          # .copy() makes the filtered frame independent, so adding a column
          # does not trigger pandas' SettingWithCopyWarning.
          df = df[in_year].copy()
          df['month'] = month_start[in_year].month
      else:
          # Out-of-range request: fall back to all data through LAST_YEAR.
          # NOTE(review): this branch returns no 'month' column, unlike the
          # single-year branch -- kept as in the original; confirm callers
          # rely on that difference before unifying.
          df = df[df['year'] <= LAST_YEAR]

      return df.set_index(['route', 'routename'])
  14.  
  # Driver: load a single year of ridership and preview the first rows.
  # The year passed below may be any value from 2001 to 2015.
  # When getdata lives in a separate module, import it first with:
  #     from cta_data import getdata
  df_ridership = getdata(year=2014)
  df_ridership.head(5)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement