Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- # author Wojciech Jakub Jargielo & Michal Domagała
- import time
- import numpy as np
- import pandas as pd
- from sklearn.model_selection import train_test_split
- from sklearn.neighbors import KNeighborsClassifier
- from sklearn.preprocessing import MinMaxScaler
- from sklearn.preprocessing import StandardScaler
- def readcsv(filename):
- data = pd.read_csv(filename)
- return np.array(data)
- def getClassesFromFile(data):
- classesList = []
- for item in data:
- classesList.append(item[0])
- return classesList
- def standarization(data):
- scaler = StandardScaler()
- scaler.fit(data)
- # print(scaler.mean_)
- return scaler.transform(data)
- def minMax(data):
- scaler = MinMaxScaler()
- scaler.fit(data)
- # print(scaler.data_max_)
- return scaler.transform(data)
- def KNN(X, y):
- neigh = KNeighborsClassifier(n_neighbors=1,n_jobs=1)
- X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.33)
- neigh.fit(X_train, y_train)
- score = neigh.score(X_test, y_test)
- # print(score)
- if __name__ == "__main__":
- data = readcsv("xaa.csv")
- # print(data)ariterate
- # iterate
- # to do - get classes from csv
- # KNN(standarization(data), y)
- y = getClassesFromFile(data)
- for i in range(30):
- start = time.time()
- KNN(minMax(data), y)
- end = time.time()
- print(end-start)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement