Advertisement
Guest User

Untitled

a guest
Apr 19th, 2015
272
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Python 0.99 KB | None | 0 0
  1. import codecs
  2. import csv
  3. import json
  4. import pprint
  5. import re
  6.  
  7.  
  8. FIELDS = ["name", "timeZone_label", "utcOffset", "homepage", "governmentType_label", "isPartOf_label", "areaCode", "populationTotal",
  9.         "elevation", "maximumElevation", "minimumElevation", "populationDensity", "wgs84_pos#lat", "wgs84_pos#long",
  10.         "areaLand", "areaMetro", "areaUrban"]
  11.  
  12. def audit_file():
  13.     with open('/Users/stephan/Desktop/cities.csv', "r") as f:
  14.         mycsv=csv.DictReader(f)
  15.         helper=set()
  16.         fieldtypes={}
  17.         headers=None
  18.         for row in mycsv:
  19.             for col in FIELDS:
  20.                 try:
  21.                     helper.add(get_the_type(row[col]))             
  22.                     #print(row[col])
  23.                     print helper
  24.                     except KeyError:
  25.                         pass
  26.                 fieldtypes[col]=helper
  27.                 print helper
  28.  
  29. def get_the_type(value):
  30.     if value== "NULL" or value=="":
  31.         return(type(None))
  32.     elif (value=="{"):
  33.         return (type([]))
  34.     elif isinstance(value,(int)):
  35.         return type(1)
  36.     elif isinstance(value,(float)):
  37.         return(type(1.1))
  38.     else:
  39.         return (type("bla"))
  40.  
  41. audit_file
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement