Advertisement
Guest User

Untitled

a guest
Jul 17th, 2018
68
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 0.50 KB | None | 0 0
  1. import pandas as pd
  2. import numpy as np
  3. from sklearn.preprocessing import Imputer
  4.  
  5. data = pd.read_csv('/home/josipa/Desktop/coffee_data/coffee_data.csv')
  6. #numerical data imputation
  7. for feature in ['opens', 'closes']:
  8. print(type(data[[feature]]))
  9. imputer = Imputer(missing_values=np.nan, strategy='median', axis=0)
  10. data[[feature]] = data[[feature]].replace('unknown', np.nan)
  11. print(data[[feature]])
  12. data[[feature]] = imputer.fit_transform(data[[feature]])
  13. print(data[[feature]])
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement