Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- #!/opt/conda/envs/dsenv/bin/python
- import sys, os
- import logging
- from joblib import load
- import pandas as pd
- sys.path.append('.')
- from model import fields_2, fields, numeric_features, categorical_features
- #
- # Init the logger
- #
- #logging.basicConfig(level=logging.DEBUG)
- #logging.info("CURRENT_DIR {}".format(os.getcwd()))
- ##logging.info("SCRIPT CALLED AS {}".format(sys.argv[0]))
- #logging.info("ARGS {}".format(sys.argv[1:]))
- model = load("2.joblib")
- #fields = """doc_id,hotel_name,hotel_url,street,city,state,country,zip,class,price,
- #num_reviews,CLEANLINESS,ROOM,SERVICE,LOCATION,VALUE,COMFORT,overall_ratingsource""".replace("\n",'').split(",")
- #read and infere
- read_opts=dict(
- sep='\t', names= fields_2, index_col=False, header=None,
- iterator=True, chunksize=10000, na_values = '\\N'
- )
- for df in pd.read_csv(sys.stdin, **read_opts):
- pred = model.predict_proba(df)[:,1]
- out = zip(df.id, pred)
- print("\n".join(["{0}\t{1}".format(*i) for i in out]))
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement