Advertisement
Guest User

cocalc tree

a guest
Aug 31st, 2020
175
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 2.05 KB | None | 0 0
  1. # Load libraries
  2. # Atau: Panggil guru-guru yang relevan: pandas, sklearn
  3. import pandas as pd
  4. from sklearn.tree import DecisionTreeClassifier # Import Decision Tree Classifier
  5. from sklearn.model_selection import train_test_split # Import train_test_split function
  6. from sklearn import metrics #Import scikit-learn metrics module for accuracy calculation
  7.  
  8. # Beri nama kolom yang sesuai dengan data.csv yang kita gunakan juga kemarin
  9. col_names = ['pregnant', 'glucose', 'bp', 'skin', 'insulin', 'bmi', 'pedigree', 'age', 'label']
  10. # load dataset, mirip dengan yang sebelumnya
  11. pima = pd.read_csv("data.csv", header=None, names=col_names)
  12.  
  13. # split dataset in features and target variable
  14. # kita pisahkan berdasarkan nama kolom, pada sebelumnya kita pisahkan antara 8 kolom di kiri dan 1 kolom di kanan
  15. # kali ini kita pisahkan berdasarkan nama. Ini merupakan pendekatan yang berbeda dalam menyiapkan data
  16. feature_cols = ['pregnant', 'insulin', 'bmi', 'age','glucose','bp','pedigree']
  17. X = pima[feature_cols] # Features
  18. y = pima.label # Target variable
  19.  
  20. # Split dataset into training set and test set
  21. # kali ini kita memisahkan data yang banyak menjadi Training dan Test. Sebelumnya tidak kita lakukan
  22. X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.3, random_state=1) # 70% training and 30% test
  23.  
  24. # Create Decision Tree classifer object without Pre-Pruning above and with Pre-Pruning below, comment one of them
  25. clf = DecisionTreeClassifier() # without Pruning
  26. # clf = DecisionTreeClassifier(criterion="entropy", max_depth=3) # with Pruning
  27.  
  28. # Train the Decision Tree
  29. clf = clf.fit(X_train,y_train)
  30.  
  31. #Predict the response for test dataset
  32. y_pred = clf.predict(X_test)
  33.  
  34. # Model Accuracy, how often is the classifier correct?
  35. print("Accuracy:",metrics.accuracy_score(y_test, y_pred)*100,"%")
  36.  
  37. # Prepare the Plotter as Graph
  38. # Untuk menampilkan Grafik-nya
  39. from matplotlib import pyplot as plt
  40. from sklearn import tree
  41.  
  42. fig = plt.figure(figsize=(25,20))
  43.  
  44. _ = tree.plot_tree(clf,feature_names = feature_cols,class_names=['0','1'],filled=True)
  45.  
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement