Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
# Parse the trip start/end columns into datetime values up front.
# Bracket indexing is used for the assignment: attribute-style assignment
# (`trip.start_date = ...`) only sets a plain Python attribute when the column
# does not already exist.  `infer_datetime_format` is omitted because it is
# deprecated in pandas 2.x.
# NOTE(review): assumes `trip` is a DataFrame defined earlier in the session.
for _date_col in ('start_date', 'end_date'):
    trip[_date_col] = pd.to_datetime(trip[_date_col])
- import re
- import datetime
def add_datepart(df, fldname, drop=True, time=False):
    """Expand a date column of ``df`` into calendar feature columns, in place.

    The column ``fldname`` is converted with ``pd.to_datetime`` when it is not
    already a datetime column (the converted values are written back to
    ``df[fldname]``).  One new column is then added per calendar attribute,
    named ``<prefix><Attr>``, where ``<prefix>`` is ``fldname`` with a trailing
    ``date``/``Date`` removed (e.g. ``'start_date'`` -> ``'start_Year'``).

    Added columns: Year, Month, Week (ISO week number), Day, Dayofweek,
    Dayofyear, Is_month_end, Is_month_start, Is_quarter_end, Is_quarter_start,
    Is_year_end, Is_year_start, plus Hour, Minute, Second when ``time`` is
    true, and Elapsed (whole seconds since 1970-01-01; NaN for missing dates).

    Args:
        df: DataFrame to modify in place.
        fldname: Name of the date column to expand.
        drop: When true, remove ``fldname`` from ``df`` after expansion.
        time: When true, also add the Hour/Minute/Second columns.

    Returns:
        None. ``df`` is mutated.
    """
    fld = df[fldname]
    # Covers both naive and timezone-aware datetime columns, and does not
    # raise on extension dtypes such as categoricals.
    if not pd.api.types.is_datetime64_any_dtype(fld):
        df[fldname] = fld = pd.to_datetime(fld)

    targ_pre = re.sub(r'[Dd]ate$', '', fldname)
    attr = ['Year', 'Month', 'Week', 'Day', 'Dayofweek', 'Dayofyear',
            'Is_month_end', 'Is_month_start', 'Is_quarter_end',
            'Is_quarter_start', 'Is_year_end', 'Is_year_start']
    if time:
        attr = attr + ['Hour', 'Minute', 'Second']

    for n in attr:
        if n == 'Week' and hasattr(fld.dt, 'isocalendar'):
            # `Series.dt.week` was removed in pandas 2.0; isocalendar() is the
            # replacement.  Cast to the dtype of `dt.day` so the column matches
            # its sibling attributes (float when missing dates are present).
            values = fld.dt.isocalendar().week.astype(fld.dt.day.dtype)
        else:
            values = getattr(fld.dt, n.lower())
        df[targ_pre + n] = values

    # Timedelta arithmetic gives whole seconds regardless of the column's
    # storage resolution, and yields NaN (not a garbage integer) for NaT.
    epoch = pd.Timestamp(0) if fld.dt.tz is None else pd.Timestamp(0, tz='UTC')
    df[targ_pre + 'Elapsed'] = (fld - epoch) // pd.Timedelta(seconds=1)

    if drop:
        df.drop(fldname, axis=1, inplace=True)
# Expand both trip timestamps into calendar/time feature columns, keeping the
# original datetime columns (drop=False) and including hour/minute/second.
for _date_field in ('start_date', 'end_date'):
    add_datepart(trip, _date_field, drop=False, time=True)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement