Guest User

Untitled

a guest
Aug 19th, 2018
81
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 4.08 KB | None | 0 0
  import numpy
  from sklearn.tree import DecisionTreeClassifier
  from sklearn.metrics import accuracy_score
  from sklearn import tree
  from sklearn.model_selection import train_test_split

  # Train a depth-limited decision tree on the rows of diabetes.csv and write
  # the fitted tree to treeClassifier.txt as Graphviz DOT text.
  filename = 'diabetes.csv'
  # Read inside a context manager so the file handle is closed as soon as the
  # array is loaded; skiprows=1 skips the first line (presumably the header).
  with open(filename, 'rt') as raw_data:
      data = numpy.loadtxt(raw_data, delimiter=",", skiprows=1)
  print(data.shape)

  X = data[:, 0:8]  # columns 0-7 form the feature matrix
  Y = data[:, 9]  # column 9 is used as the target
  # NOTE(review): column 8 ends up in neither X nor Y -- confirm that is intended.
  print(X)
  print(Y)
  # Hold out 25% of the rows; no random_state is given, so the split differs
  # from run to run.
  X_train, X_test, Y_train, Y_test = train_test_split(
      X, Y, test_size=0.25)
  treeClassifier = DecisionTreeClassifier(max_depth=5)
  treeClassifier.fit(X_train, Y_train)
  with open("treeClassifier.txt", "w") as f:
      # With out_file set, export_graphviz writes into the handle and returns
      # None, so the result is deliberately not assigned back to `f`.
      tree.export_graphviz(treeClassifier, out_file=f)
  21.  
  22. (768, 10)
  23. [[ 6. 148. 72. ... 33.6 0.627 50. ]
  24. [ 1. 85. 66. ... 26.6 0.351 31. ]
  25. [ 8. 183. 64. ... 23.3 0.672 32. ]
  26. ...
  27. [ 5. 121. 72. ... 26.2 0.245 30. ]
  28. [ 1. 126. 60. ... 30.1 0.349 47. ]
  29. [ 1. 93. 70. ... 30.4 0.315 23. ]]
  30. [1. 0. 1. 0. 1. 0. 1. 0. 1. 1. 0. 1. 0. 1. 1. 1. 1. 1. 0. 1. 0. 0. 1. 1.
  31. 1. 1. 1. 0. 0. 0. 0. 1. 0. 0. 0. 0. 0. 1. 1. 1. 0. 0. 0. 1. 0. 1. 0. 0.
  32. 1. 0. 0. 0. 0. 1. 0. 0. 1. 0. 0. 0. 0. 1. 0. 0. 1. 0. 1. 0. 0. 0. 1. 0.
  33. 1. 0. 0. 0. 0. 0. 1. 0. 0. 0. 0. 0. 1. 0. 0. 0. 1. 0. 0. 0. 0. 1. 0. 0.
  34. 0. 0. 0. 1. 1. 0. 0. 0. 0. 0. 0. 0. 0. 1. 1. 1. 0. 0. 1. 1. 1. 0. 0. 0.
  35. 1. 0. 0. 0. 1. 1. 0. 0. 1. 1. 1. 1. 1. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 1.
  36. 0. 0. 0. 0. 0. 0. 0. 0. 1. 0. 1. 1. 0. 0. 0. 1. 0. 0. 0. 0. 1. 1. 0. 0.
  37. 0. 0. 1. 1. 0. 0. 0. 1. 0. 1. 0. 1. 0. 0. 0. 0. 0. 1. 1. 1. 1. 1. 0. 0.
  38. 1. 1. 0. 1. 0. 1. 1. 1. 0. 0. 0. 0. 0. 0. 1. 1. 0. 1. 0. 0. 0. 1. 1. 1.
  39. 1. 0. 1. 1. 1. 1. 0. 0. 0. 0. 0. 1. 0. 0. 1. 1. 0. 0. 0. 1. 1. 1. 1. 0.
  40. 0. 0. 1. 1. 0. 1. 0. 0. 0. 0. 0. 0. 0. 0. 1. 1. 0. 0. 0. 1. 0. 1. 0. 0.
  41. 1. 0. 1. 0. 0. 1. 1. 0. 0. 0. 0. 0. 1. 0. 0. 0. 1. 0. 0. 1. 1. 0. 0. 1.
  42. 0. 0. 0. 1. 1. 1. 0. 0. 1. 0. 1. 0. 1. 1. 0. 1. 0. 0. 1. 0. 1. 1. 0. 0.
  43. 1. 0. 1. 0. 0. 1. 0. 1. 0. 1. 1. 1. 0. 0. 1. 0. 1. 0. 0. 0. 1. 0. 0. 0.
  44. 0. 1. 1. 1. 0. 0. 0. 0. 0. 0. 0. 0. 0. 1. 0. 0. 0. 0. 0. 1. 1. 1. 0. 1.
  45. 1. 0. 0. 1. 0. 0. 1. 0. 0. 1. 1. 0. 0. 0. 0. 1. 0. 0. 1. 0. 0. 0. 0. 0.
  46. 0. 0. 1. 1. 1. 0. 0. 1. 0. 0. 1. 0. 0. 1. 0. 1. 1. 0. 1. 0. 1. 0. 1. 0.
  47. 1. 1. 0. 0. 0. 0. 1. 1. 0. 1. 0. 1. 0. 0. 0. 0. 1. 1. 0. 1. 0. 1. 0. 0.
  48. 0. 0. 0. 1. 0. 0. 0. 0. 1. 0. 0. 1. 1. 1. 0. 0. 1. 0. 0. 1. 0. 0. 0. 1.
  49. 0. 0. 1. 0. 0. 0. 0. 0. 0. 0. 0. 0. 1. 0. 0. 0. 0. 0. 0. 0. 1. 0. 0. 0.
  50. 1. 0. 0. 0. 1. 1. 0. 0. 0. 0. 0. 0. 0. 1. 0. 0. 0. 0. 1. 0. 0. 0. 1. 0.
  51. 0. 0. 1. 0. 0. 0. 1. 0. 0. 0. 0. 1. 1. 0. 0. 0. 0. 0. 0. 1. 0. 0. 0. 0.
  52. 0. 0. 0. 0. 0. 0. 0. 1. 0. 0. 0. 1. 1. 1. 1. 0. 0. 1. 1. 0. 0. 0. 0. 0.
  53. 0. 0. 0. 0. 0. 0. 0. 0. 1. 1. 0. 0. 0. 0. 0. 0. 0. 1. 0. 0. 0. 0. 0. 0.
  54. 0. 1. 0. 1. 1. 0. 0. 0. 1. 0. 1. 0. 1. 0. 1. 0. 1. 0. 0. 1. 0. 0. 1. 0.
  55. 0. 0. 0. 1. 1. 0. 1. 0. 0. 0. 0. 1. 1. 0. 1. 0. 0. 0. 1. 1. 0. 0. 0. 0.
  56. 0. 0. 0. 0. 0. 0. 1. 0. 0. 0. 0. 1. 0. 0. 1. 0. 0. 0. 1. 0. 0. 0. 1. 1.
  57. 1. 0. 0. 0. 0. 0. 0. 1. 0. 0. 0. 1. 0. 1. 1. 1. 1. 0. 1. 1. 0. 0. 0. 0.
  58. 0. 0. 0. 1. 1. 0. 1. 0. 0. 1. 0. 1. 0. 0. 0. 0. 0. 1. 0. 1. 0. 1. 0. 1.
  59. 1. 0. 0. 0. 0. 1. 1. 0. 0. 0. 1. 0. 1. 1. 0. 0. 1. 0. 0. 1. 1. 0. 0. 1.
  60. 0. 0. 1. 0. 0. 0. 0. 0. 0. 0. 1. 1. 1. 0. 0. 0. 0. 0. 0. 1. 1. 0. 0. 1.
  61. 0. 0. 1. 0. 1. 1. 1. 0. 0. 1. 1. 1. 0. 1. 0. 1. 0. 1. 0. 0. 0. 0. 1. 0.]
  62.  
  # Export call without class labels. It relies on `treeClassifier` and `f`,
  # neither of which this one-line snippet defines itself.
  63. tree.export_graphviz(treeClassifier, out_file=f)
  64.  
  # Same export call, additionally passing class_names=['0', '1']. It relies on
  # `treeClassifier` and `f`, neither of which this snippet defines itself.
  65. tree.export_graphviz(treeClassifier, class_names=['0', '1'], out_file=f)
  66.  
  import graphviz
  import numpy as np
  from sklearn.tree import DecisionTreeClassifier
  from sklearn import tree
  from sklearn.model_selection import train_test_split

  # Self-contained demo: fit a depth-5 decision tree on seeded random data and
  # render it with graphviz, labelling the two classes '0' and '1'.
  np.random.seed(42)  # fix NumPy's global RNG before any random draw

  # 100 samples with 8 uniform random features and a random binary label.
  X = np.random.random(size=(100, 8))
  Y = np.random.randint(0, 2, size=100)

  # Keep 25% of the samples aside as a test split.
  X_train, X_test, Y_train, Y_test = train_test_split(
      X,
      Y,
      test_size=0.25,
  )

  # fit() returns the estimator itself, so construction and training chain.
  tree_classifier = DecisionTreeClassifier(max_depth=5).fit(X_train, Y_train)

  # out_file=None makes export_graphviz return the DOT source as a string.
  dot_data = tree.export_graphviz(
      tree_classifier,
      out_file=None,
      class_names=['0', '1'],
  )
  graph = graphviz.Source(dot_data)
  # Bare expression: displays the rendered graph when run as the last line of
  # a notebook cell; it has no effect in a plain script.
  graph
  83.  
  # Export call that passes class_names plus the filled=True and rounded=True
  # styling flags. It uses the names `treeClassifier` and `f`, which the
  # preceding script (which defines `tree_classifier`) does not create.
  84. tree.export_graphviz(treeClassifier, class_names=['0', '1'],
  85. filled=True, rounded=True, out_file=f)
Add Comment
Please, Sign In to add comment