Guest User

Untitled

a guest
Aug 19th, 2018
85
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 1.30 KB | None | 0 0
  1. import pandas as pd
  2. from define_types import define_types
  3.  
  4. ARTISTS, SHOWS, ARTWORKS, ARTICLES, AUCTIONS, INQUIRIES, FRONT, GENES, GALLERIES, MUSEUMS = define_types()
  5.  
  6. def get_type():
  7.  
  8. # Load page views test data
  9. page_views_df = pd.read_csv('pageviews.csv')
  10.  
  11. # Delimit path into a list
  12. page_views_df['first_segment'] = page_views_df['path'].str.split("/", expand=False)
  13. page_views_df['first_segment'] = page_views_df.first_segment.map(lambda x: x[1])
  14.  
  15. # Determine which list the first path segment is found in
  16. # Assign type to first path segment
  17. def get_type(first_seg):
  18. if first_seg in ARTISTS:
  19. return 'artists'
  20. if first_seg in SHOWS:
  21. return 'shows'
  22. if first_seg in ARTWORKS:
  23. return 'artworks'
  24. if first_seg in ARTICLES:
  25. return 'articles'
  26. if first_seg in GALLERIES:
  27. return 'galleries'
  28. if first_seg in AUCTIONS:
  29. return 'auctions'
  30. if first_seg in INQUIRIES:
  31. return 'inquiries'
  32. if first_seg in FRONT:
  33. return 'front page'
  34. if first_seg in GENES:
  35. return 'genes'
  36. if first_seg in MUSEUMS:
  37. return 'museums'
  38. else:
  39. return 'undefined'
  40.  
  41.  
  42. # Add new column 'type'
  43. page_views_df['type'] = page_views_df['first_segment'].apply(lambda x: get_type(x))
  44. # Export dataframe to reveiew results
  45. page_views_df.to_csv('pageviews_withtype.csv',index=False)
  46.  
  47. return page_views_df
  48.  
  49.  
  50. get_type()
Add Comment
Please, Sign In to add comment