Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
"""Bucket the scores in gender_data.csv by the gender genderize.io predicts.

The CSV is read with ',' as delimiter and '|' as quote character; its first
row is skipped as a header.  Each remaining row is read as
(country code, score, full name).  A random sample of the rows is looked up
on https://api.genderize.io/ using the first space-separated word of the name
together with the country code, and the row's score is appended to the male
or the female list according to the answer.  Both lists are printed at the
end.

Written to run on both Python 2 (which the original script targeted) and
Python 3.
"""
import csv
import json
import random
import sys
from contextlib import closing

try:  # Python 3
    from urllib.parse import urlencode
    from urllib.request import urlopen
except ImportError:  # Python 2
    from urllib import urlencode
    from urllib2 import urlopen

CSV_PATH = 'gender_data.csv'
API_URL = 'https://api.genderize.io/'
# Probability with which a row is sent to the API.
# NOTE(review): presumably this keeps the run inside the API's rate limit --
# confirm before raising it.
SAMPLE_RATE = 0.1


def build_request_url(first_name, country_code):
    """Return the genderize.io lookup URL for a name and a country code.

    The values are percent-encoded, so names containing '&', '#', spaces or
    non-ASCII characters no longer corrupt the query string.  For plain
    ASCII input the URL is identical to simple concatenation.
    """
    query = urlencode([('name', first_name), ('country_id', country_code)])
    return API_URL + '?' + query


def parse_gender(body):
    """Extract the 'gender' field from a JSON response body.

    Args:
        body: the response body, as text or as UTF-8 encoded bytes.

    Returns:
        The value stored under 'gender'; this is None when the JSON value
        is null.

    Raises:
        ValueError: if the body is not valid JSON, or is valid JSON without
            a 'gender' field (for example an API error object).
    """
    if isinstance(body, bytes):
        body = body.decode('utf-8')
    # json, not ast.literal_eval: the body is JSON, and literal_eval rejects
    # JSON's null/true/false, so every "gender": null answer used to raise.
    payload = json.loads(body)
    try:
        return payload['gender']
    except (KeyError, TypeError):
        raise ValueError('no "gender" field in response: %r' % (payload,))


def fetch_gender(first_name, country_code):
    """Query the API for one name and return the parsed 'gender' value.

    Raises whatever urlopen raises on network/HTTP failure, and ValueError
    when the response cannot be interpreted (see parse_gender).
    """
    url = build_request_url(first_name, country_code)
    # closing(): Python 2's urlopen result is not a context manager, and the
    # response should be released even if read() fails.
    with closing(urlopen(url)) as response:
        body = response.read()
    return parse_gender(body)


def collect_scores(rows, lookup=fetch_gender, sample_rate=SAMPLE_RATE,
                   rng=random.random):
    """Split sampled rows' scores into male and female lists.

    Args:
        rows: iterable of CSV rows (sequences of strings) laid out as
            country code, score, full name.
        lookup: callable (first_name, country_code) -> gender.
        sample_rate: a row is looked up when rng() returns a value below it.
        rng: zero-argument callable returning a float; called once per
            well-formed row.

    Returns:
        (male_scores, female_scores).  Scores are kept exactly as read from
        the row (strings when the rows come from csv.reader).  Rows whose
        gender is neither 'male' nor 'female' contribute to neither list.
    """
    male_scores = []
    female_scores = []
    for row in rows:
        if len(row) < 3:
            # Blank or truncated line: report it instead of dying with an
            # IndexError halfway through the file.
            sys.stderr.write('skipping malformed row: %r\n' % (row,))
            continue
        country_code, score, full_name = row[0], row[1], row[2]
        if rng() >= sample_rate:
            continue
        first_name = full_name.split(' ')[0]
        try:
            gender = lookup(first_name, country_code)
        except Exception as exc:
            # Deliberately best-effort per row: one failed lookup must not
            # abort the whole run.  Unlike the former bare `except:` this
            # lets KeyboardInterrupt/SystemExit through and says what failed.
            sys.stderr.write('lookup failed for %r (%s): %s\n'
                             % (first_name, country_code, exc))
            continue
        if gender == 'male':
            male_scores.append(score)
        elif gender == 'female':
            female_scores.append(score)
    return male_scores, female_scores


def open_csv(path):
    """Open path the way the running interpreter's csv module expects."""
    if sys.version_info[0] < 3:
        return open(path, 'rb')
    # NOTE(review): assumes the file is UTF-8 encoded -- confirm.
    return open(path, newline='', encoding='utf-8')


def main():
    """Read the CSV, collect the sampled scores and print both lists."""
    with open_csv(CSV_PATH) as csvfile:
        csvreader = csv.reader(csvfile, delimiter=',', quotechar='|')
        next(csvreader, None)  # skip the header row
        male_scores, female_scores = collect_scores(csvreader)
    # Single-argument print(...) produces the same output on Python 2 and 3.
    print("males")
    print(male_scores)
    print("females")
    print(female_scores)


if __name__ == '__main__':
    main()
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement