Guest User

Untitled

a guest
Jul 18th, 2018
79
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 0.71 KB | None | 0 0
  # Imports for the split -> reshape -> standardise preparation steps below.
import numpy as np
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import confusion_matrix
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler

# `sklearn.externals.joblib` was deprecated in scikit-learn 0.21 and removed
# in 0.23. Prefer the standalone `joblib` package and fall back to the
# vendored copy only on old installations.
try:
    import joblib
except ImportError:
    from sklearn.externals import joblib

# Feature column and target column.
# NOTE(review): `finalDf` is not defined in this snippet; it must already
# exist when this runs (presumably a pandas DataFrame -- confirm).
X = finalDf['size_in_mb']
y = finalDf['pop_categories']

# Hold out 25% of the rows for testing; the fixed seed makes the split
# reproducible between runs.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.25, random_state=21
)

# Only one feature column is selected above, so each split is turned into a
# single-column 2-D array (n_rows, 1), the layout the scaler is fed below.
npX_train = np.array(X_train).reshape(-1, 1)
npX_test = np.array(X_test).reshape(-1, 1)

# Standardise the feature. The scaler is fitted on the training split only and
# the same fitted statistics are then applied to the test split, so nothing
# about the test data leaks into the fit.
# NOTE(review): tree ensembles such as the imported RandomForestClassifier are
# generally insensitive to feature scale -- confirm this step is needed for
# the model actually trained downstream.
scaler = StandardScaler()
npX_train = scaler.fit_transform(npX_train)
npX_test = scaler.transform(npX_test)
Add Comment
Please, Sign In to add comment