Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- import pandas as pd
- import numpy as np
- from sklearn.ensemble import RandomForestClassifier
- train = pd.read_json('train.json')
- test = pd.read_json('test.json')
- y = train.requester_received_pizza
- ids = test.request_id
- string_columns = [column for dtype, column in zip(list(test.dtypes), list(test.dtypes.index))
- if dtype == np.dtype('O')]
- test.drop(string_columns, inplace=True, axis=1)
- train = train[test.columns]
- clf = RandomForestClassifier(n_estimators=1000)
- clf.fit(train.values, y)
- predictions = clf.predict_proba(test.values)
- pd.Series(predictions[:, 1], index=ids, name='requester_received_pizza').to_csv('res.csv', header=True)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement