Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
# Summarise `df` per query: first and last date seen, total clicks, total
# impressions and mean position, ordered with the highest-impression queries
# first.
# NOTE(review): assumes `df` has "query", "date", "clicks", "impressions" and
# "position" columns, and that "date" is datetime-like so it can be compared
# with a `datetime.datetime` below -- confirm against where `df` is built.
impressions_total = ("impressions", "sum")
last_seen = ("date", "max")
df_by_query_date = (
    df.groupby("query")
    .aggregate(
        {
            "date": ["min", "max"],
            "clicks": "sum",
            "impressions": "sum",
            "position": "mean",
        }
    )
    .sort_values(impressions_total, ascending=False)
)

# Keep only the queries whose total impressions are at or above the median.
median_impressions = df_by_query_date[impressions_total].quantile(0.50)
df_by_query_date = df_by_query_date[
    df_by_query_date[impressions_total] >= median_impressions
]

# Select up to five queries whose most recent date is more than 14 days before
# now. This is a bare expression: its value is only displayed when run
# interactively (e.g. as the last line of a notebook cell).
stale_cutoff = datetime.datetime.now() - datetime.timedelta(days=14)
df_by_query_date[df_by_query_date[last_seen] < stale_cutoff].head(5)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement