Advertisement
Guest User

bbbb

a guest
Nov 15th, 2019
121
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 1.27 KB | None | 0 0
  1. import matplotlib.pyplot as plt #explanatory modeling
  2. import pandas
  3. from pandas.plotting import scatter_matrix
  4.  
  5. from sklearn import model_selection
  6. from sklearn.model_selection import train_test_split
  7.  
  8. from sklearn.naive_bayes import GaussianNB
  9. from sklearn import metrics
  10.  
  11. url="c:/Users/bmaxwel/Documents/winequality-red.csv"
  12.  
  13. names=['fixed acidity','volatile acidity ','citric acid' ,'residual sugar', 'chlorides','free sulfur dioxide','total sulfur dioxide',
  14. 'density','pH','sulphates','alcohol','quality']
  15. dataset = pandas.read_csv(url,names=names)
  16.  
  17. print(dataset.shape)
  18. print(dataset.head)
  19. print(dataset)
  20. print(dataset.describe())
  21.  
  22.  
  23. dataset.plot(kind='box',subplots=True,layout=(6,6),sharex=False, sharey=False)
  24. plt.show()
  25.  
  26. dataset.hist()
  27. plt.show()
  28.  
  29. scatter_matrix(dataset)
  30. plt.show()
  31.  
  32. array = dataset.values
  33. x = array[:,0:11]
  34. y = array[:,11]
  35.  
  36. validation_size =0.20
  37. seed =7
  38. x_train,x_test,y_train,y_test = model_selection.train_test_split\
  39. (x, y, test_size=validation_size, random_state=seed)
  40.  
  41. print("x_train",x_train)
  42. print("x_test",x_test)
  43. print("y_train",y_train)
  44. print("y_test",y_test)
  45.  
  46. model = GaussianNB()
  47. model = model.fit(x_train ,y_train)
  48.  
  49. y_predicted = model.predict(x_test)
  50. print(metrics.accuracy_score(y_test, y_predicted))
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement