Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
import codecs
import csv
import json
import pprint
import re
# Columns of the cities CSV whose value types are audited, in audit order.
FIELDS = [
    "name",
    "timeZone_label",
    "utcOffset",
    "homepage",
    "governmentType_label",
    "isPartOf_label",
    "areaCode",
    "populationTotal",
    "elevation",
    "maximumElevation",
    "minimumElevation",
    "populationDensity",
    "wgs84_pos#lat",
    "wgs84_pos#long",
    "areaLand",
    "areaMetro",
    "areaUrban",
]
def audit_file(filename='/Users/stephan/Desktop/cities.csv', fields=None):
    """Collect the set of value types seen in each audited CSV column.

    Args:
        filename: Path of the CSV file to audit. Defaults to the path the
            script originally hard-coded, so ``audit_file()`` still works.
        fields: Column names to audit. Defaults to the module-level FIELDS.

    Returns:
        A dict mapping each audited column name to the set of types that
        ``get_the_type`` reported for its cells. A column that is missing
        from the file maps to an empty set.
    """
    if fields is None:
        fields = FIELDS

    # One independent set per column; sharing a single set would report
    # the same merged result for every field.
    fieldtypes = {field: set() for field in fields}

    with open(filename, "r") as f:
        for row in csv.DictReader(f):
            for field in fields:
                # Columns absent from the header are skipped explicitly
                # instead of being hidden behind a swallowed KeyError.
                if field in row:
                    fieldtypes[field].add(get_the_type(row[field]))

    # Single-argument print(...) behaves the same on Python 2 and 3.
    print(fieldtypes)
    return fieldtypes
def get_the_type(value):
    """Return the Python type that a CSV cell value represents.

    Cells read through the csv module are always strings, so the text is
    parsed rather than checked with isinstance alone.

    Args:
        value: The raw cell value, normally a string.

    Returns:
        ``type(None)`` for ``"NULL"``, the empty string, or ``None``;
        ``list`` for text starting with ``"{"``;
        ``int`` or ``float`` for numeric text (or actual numbers);
        ``str`` for everything else.
    """
    if not isinstance(value, str):
        # csv.DictReader fills cells missing from a short row with None.
        if value is None:
            return type(None)
        # Values that are already numbers keep their own type.
        if isinstance(value, int):
            return int
        if isinstance(value, float):
            return float
        return str

    if value == "NULL" or value == "":
        return type(None)
    # Any cell that opens with a brace is treated as an array, not only a
    # cell consisting of the brace alone.
    if value.startswith("{"):
        return list

    try:
        int(value)
    except ValueError:
        pass
    else:
        return int

    try:
        number = float(value)
    except ValueError:
        return str
    # float() also accepts words such as "nan" and "inf"; in this data they
    # are far more likely to be names than measurements, so keep them text.
    if number != number or number in (float("inf"), float("-inf")):
        return str
    return float
# Run the audit only when executed as a script. The bare name `audit_file`
# merely referenced the function without ever calling it.
if __name__ == "__main__":
    audit_file()
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement