Advertisement
Guest User

Untitled

a guest
Nov 14th, 2019
137
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 1.05 KB | None | 0 0
  1. # -*- coding: utf-8 -*-
  2. """
  3. Created on Tue Nov 12 09:05:11 2019
  4.  
  5. @author: A6319
  6. """
  7.  
  8. import pandas as pd
  9. from sklearn.tree import DecisionTreeClassifier
  10. from sklearn.model_selection import train_test_split
  11. from sklearn import metrics
  12.  
  13. def readFile(file):
  14. f = pd.read_csv(file)
  15. X = f.loc[:,f.columns != "Outcome"]
  16. y = f.Outcome
  17. return X, y
  18.  
  19. def decisionTree(X, y):
  20. X_train, X_test, y_train, y_test = train_test_split(X, y, test_size = 0.2, random_state = 1)
  21.  
  22. """
  23. clf = DecisionTreeClassifier()
  24. clf = clf.fit(X_train, y_train)
  25. y_pred = clf.predict(X_test)
  26. print("Acuracy: ", metrics.accuracy_score(y_test, y_pred))
  27. """
  28.  
  29. clf = DecisionTreeClassifier(criterion="gini", max_depth=3)
  30. clf = clf.fit(X_train, y_train)
  31. y_pred = clf.predict(X_test)
  32. print("Acuracy: ", metrics.accuracy_score(y_test, y_pred))
  33. #print(clf.score(X_test,y_test))
  34.  
  35.  
  36. def main():
  37. X, y = readFile("diabetes.csv")
  38. decisionTree(X, y)
  39.  
  40.  
  41.  
  42. if __name__ == "__main__":
  43. main()
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement