Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- import pandas as pd
- from define_types import define_types
- ARTISTS, SHOWS, ARTWORKS, ARTICLES, AUCTIONS, INQUIRIES, FRONT, GENES, GALLERIES, MUSEUMS = define_types()
def _classify_segment(first_seg):
    """Return the page-type label for a first path segment.

    The segment is tested for membership in each module-level type
    collection in a fixed order; the first match wins.

    Args:
        first_seg: First path segment of a page view. Anything that is not
            a string (e.g. NaN for a missing or slash-less path) is treated
            as unclassifiable.

    Returns:
        One of 'artists', 'shows', 'artworks', 'articles', 'galleries',
        'auctions', 'inquiries', 'front page', 'genes', 'museums', or
        'undefined' when nothing matches.
    """
    if not isinstance(first_seg, str):
        return 'undefined'

    # Order matters: a segment present in several collections gets the
    # label of the first collection listed here.
    type_labels = (
        (ARTISTS, 'artists'),
        (SHOWS, 'shows'),
        (ARTWORKS, 'artworks'),
        (ARTICLES, 'articles'),
        (GALLERIES, 'galleries'),
        (AUCTIONS, 'auctions'),
        (INQUIRIES, 'inquiries'),
        (FRONT, 'front page'),
        (GENES, 'genes'),
        (MUSEUMS, 'museums'),
    )
    for members, label in type_labels:
        if first_seg in members:
            return label
    return 'undefined'


def get_type(input_path='pageviews.csv', output_path='pageviews_withtype.csv'):
    """Label every page view in a CSV with a page type and save the result.

    Reads ``input_path`` (which must contain a 'path' column), adds a
    'first_segment' column holding the text between the first and second
    "/" of each path, adds a 'type' column derived from that segment, writes
    the frame to ``output_path`` without the index, and returns it.

    Args:
        input_path: CSV file of page views to read.
        output_path: CSV file the labelled page views are written to.

    Returns:
        The page-view DataFrame with 'first_segment' and 'type' columns added.
    """
    # Load page views test data
    page_views_df = pd.read_csv(input_path)

    # Split each path on "/" and keep element 1 (element 0 is the empty
    # string before the leading slash). .str.get yields NaN instead of
    # raising when the path is missing or has no "/" at all.
    page_views_df['first_segment'] = (
        page_views_df['path'].str.split("/", expand=False).str.get(1)
    )

    # Add new column 'type'
    page_views_df['type'] = page_views_df['first_segment'].apply(_classify_segment)

    # Export dataframe to review results
    page_views_df.to_csv(output_path, index=False)
    return page_views_df


get_type()
Add Comment
Please, Sign In to add comment