Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- import csv
- import os.path
- import matplotlib.pyplot as plt
- import matplotlib.patches as patches
- import seaborn as sns
- %matplotlib inline
- #data loading
- data = ....
- ------------------------------
def visualizeComedyByOtherGenres(data):
    """Bar-plot how often each remaining flag column is set among comedy rows.

    For every row whose 'Target' value is the string "1", each column that is
    not in the exclusion set is checked; columns equal to "1" are counted.
    The counts are drawn as a seaborn bar plot titled "By Genres" with the
    x tick labels rotated by 90 degrees.

    Args:
        data: Indexable sequence of dict-like rows. The columns to count are
            taken from the keys of the first row. Values are compared against
            the string "1" (presumably rows read via the csv module --
            confirm against the data-loading code).

    Returns:
        None. When ``data`` is empty nothing is plotted.

    Side effects:
        Assigns ``plt.rcParams['figure.figsize']`` and sets the seaborn
        plotting context, both of which persist after the call.
    """
    if not data:
        # No rows: nothing to plot, and data[0] below would raise IndexError.
        return

    isComedyKey = 'Target'
    keysToNotInclude = {'Id', 'Duration', 'Language', 'Country', 'Rating', 'Target', "Poster"}
    # Column order follows the first row so the bars keep the file's order.
    keys = [key for key in data[0].keys() if key not in keysToNotInclude]

    plotValues = dict.fromkeys(keys, 0)
    for item in data:
        if item[isComedyKey] != "1":
            continue
        for key in keys:
            if item[key] == "1":
                plotValues[key] += 1

    # The figure size and context must be configured BEFORE the plot is
    # created: rcParams only provides defaults for figures created afterwards.
    plt.rcParams['figure.figsize'] = (70, 40)
    sns.set_context("notebook", font_scale=10)

    gr = sns.barplot(x=list(plotValues.keys()), y=list(plotValues.values()))
    plt.setp(gr.get_xticklabels(), rotation=90)
    plt.title("By Genres")
- visualizeComedyByOtherGenres(data)
- ----------------------------------
def visualizeByLanguage(data):
    """Bar-plot, per language, the fraction of rows that are comedies.

    Rows are grouped by their 'Language' value. For each language the number
    of rows whose 'Target' equals the string "1" is divided by the total
    number of rows for that language, and the ratios are drawn as a seaborn
    bar plot titled "By Language(Normalized)" with x tick labels rotated by
    90 degrees.

    Args:
        data: Iterable of dict-like rows providing 'Language' and 'Target'
            keys. 'Target' is compared against the string "1".

    Returns:
        None. When ``data`` yields no rows nothing is plotted.

    Side effects:
        Assigns ``plt.rcParams['figure.figsize']`` and sets the seaborn
        plotting context, both of which persist after the call.
    """
    languageKey = "Language"

    # language -> (total rows, rows with Target == "1")
    langToNumComedies = {}
    for item in data:
        language = item[languageKey]
        numMovies, numComedies = langToNumComedies.get(language, (0, 0))
        if item['Target'] == "1":
            numComedies += 1
        langToNumComedies[language] = (numMovies + 1, numComedies)

    if not langToNumComedies:
        # No rows were seen, so there is nothing to plot.
        return

    xValues = list(langToNumComedies.keys())
    # numMovies is at least 1 for every stored language, so no division by zero.
    yValues = [
        numComedies / numMovies
        for numMovies, numComedies in langToNumComedies.values()
    ]

    # Configure size and font scaling BEFORE plotting so they apply to this
    # chart instead of relying on settings left behind by an earlier call.
    plt.rcParams['figure.figsize'] = (75, 30)
    sns.set_context("notebook", font_scale=10)

    gr = sns.barplot(x=xValues, y=yValues)
    plt.setp(gr.get_xticklabels(), rotation=90)
    plt.title("By Language(Normalized)")
- visualizeByLanguage(data)
- ------------------------------
- etc
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement