Advertisement
Guest User

Untitled

a guest
Nov 18th, 2019
133
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Python 0.99 KB | None | 0 0
  1. #!/opt/conda/envs/dsenv/bin/python
  2.  
  3. import sys, os
  4. import logging
  5. from joblib import load
  6. import pandas as pd
  7.  
  8. sys.path.append('.')
  9. from model import fields_2, fields, numeric_features, categorical_features
  10.  
  11. #
  12. # Init the logger
  13. #
  14. #logging.basicConfig(level=logging.DEBUG)
  15. #logging.info("CURRENT_DIR {}".format(os.getcwd()))
  16. ##logging.info("SCRIPT CALLED AS {}".format(sys.argv[0]))
  17. #logging.info("ARGS {}".format(sys.argv[1:]))
  18.  
  19. model = load("2.joblib")
  20.  
  21.  
  22. #fields = """doc_id,hotel_name,hotel_url,street,city,state,country,zip,class,price,
  23. #num_reviews,CLEANLINESS,ROOM,SERVICE,LOCATION,VALUE,COMFORT,overall_ratingsource""".replace("\n",'').split(",")
  24.  
  25. #read and infere
  26. read_opts=dict(
  27.         sep='\t', names= fields_2, index_col=False, header=None,
  28.         iterator=True, chunksize=10000, na_values = '\\N'
  29. )
  30.  
  31. for df in pd.read_csv(sys.stdin, **read_opts):
  32.     pred = model.predict_proba(df)[:,1]
  33.     out = zip(df.id, pred)
  34.     print("\n".join(["{0}\t{1}".format(*i) for i in out]))
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement