Advertisement
Guest User

Untitled

a guest
Dec 9th, 2019
84
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Python 1.25 KB | None | 0 0
  1.  
  2. import pandas as pd
  3. import numpy as np
  4. from sklearn import preprocessing
  5. from sklearn.model_selection import train_test_split
  6. from sklearn.neighbors import KNeighborsClassifier
  7.  
  8.  
  9. wineData=pd.read_csv('winequality.csv')
  10. print(wineData.columns)
  11. quality=wineData['Quality']
  12. del wineData['Quality']
  13. wineDataArray=wineData.values
  14. min_max_scaler=preprocessing.MinMaxScaler()
  15. wineData_scaled=min_max_scaler.fit_transform(wineDataArray)
  16. wineData=pd.DataFrame(wineData_scaled,columns=wineData.columns)
  17. wineData['Quality']=quality
  18. print(wineData.head())
  19.  
  20. train_accuracy=np.empty(9)
  21. test_accuracy=np.empty(9)
  22. X=wineData.iloc[:,wineData.columns!='Quality']
  23. y=wineData['Quality']
  24. X_train,X_test,y_train,y_test=train_test_split(X,y,test_size=0.3,random_state=10,stratify=y)
  25.  
  26. max=0
  27. bestk=0
  28.  
  29. for k in range(1,10):
  30.     knn=KNeighborsClassifier(n_neighbors=k)
  31.     knn.fit(X_train,y_train)
  32.     y_pred=knn.predict(X_test)
  33.     train_accuracy[k-1]=knn.score(X_train,y_train)
  34.     test_accuracy[k-1]=knn.score(X_test,y_test)
  35.     if knn.score(X_train,y_train)>=max:
  36.         max=knn.score(X_train,y_train)
  37.         bestk=k
  38.         print(max)
  39.         print(bestk)
  40. print(train_accuracy)
  41. print(test_accuracy)
  42. print('k=',bestk,'produced the best accuracy')#part 4
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement