Guest User

Untitled

a guest
Apr 20th, 2018
74
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 1.01 KB | None | 0 0
  1. def DTC(df,target):
  2. import numpy as np
  3. import pandas as pd
  4. from sklearn import grid_search
  5. from sklearn.tree import DecisionTreeClassifier
  6.  
  7. #Splitting the data into train and test
  8. x_train,x_test,y_train,y_test = ms.train_test_split(df,target,test_size=0.3,random_state=123)
  9.  
  10. dtc = DecisionTreeClassifier(criterion='gini',min_samples_split=2,random_state=123)
  11. dtc.fit(x_train,y_train)
  12.  
  13. pred_dt_train = dtc.predict(x_train)
  14. pred_dt_test=dtc.predict(x_test)
  15. print(dtc.score(x_train,y_train))
  16. print(dtc.score(x_test,y_test))
  17.  
  18. #parameter tuning using grid search
  19. parameters = {'max_depth': list(range(3,20)),'min_samples_leaf':list(range(2,8))}
  20. dtc_cv = grid_search.GridSearchCV(DecisionTreeClassifier(random_state=123), parameters)
  21. dtc_cv.fit(x_train,y_train)
  22. tree_model = dtc_cv.best_estimator_
  23. print("\n Tuning with Grid Search \n")
  24. print(tree_model)
  25. print ("\n best score \n",dtc_cv.best_score_,"\n best params \n", dtc_cv.best_params_)
Add Comment
Please, Sign In to add comment