Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- import numpy as np
- import pandas as pd
- from scipy.spatial import distance
- columns = ['комнаты', 'площадь', 'кухня', 'пл. жилая', 'этаж', 'всего этажей', 'кондиционер']
- df_train = pd.DataFrame([
- [1, 38.5, 6.9, 18.9, 3, 5, 1],
- [1, 38.0, 8.5, 19.2, 9, 17, 0],
- [1, 34.7, 10.3, 19.8, 1, 9, 0],
- [1, 45.9, 11.1, 17.5, 11, 23, 1],
- [1, 42.4, 10.0, 19.9, 6, 14, 0],
- [1, 46.0, 10.2, 20.5, 3, 12, 1],
- [2, 77.7, 13.2, 39.3, 3, 17, 1],
- [2, 69.8, 11.1, 31.4, 12, 23, 0],
- [2, 78.2, 19.4, 33.2, 4, 9, 0],
- [2, 55.5, 7.8, 29.6, 1, 25, 1],
- [2, 74.3, 16.0, 34.2, 14, 17, 1],
- [2, 78.3, 12.3, 42.6, 23, 23, 0],
- [2, 74.0, 18.1, 49.0, 8, 9, 0],
- [2, 91.4, 20.1, 60.4, 2, 10, 0],
- [3, 85.0, 17.8, 56.1, 14, 14, 1],
- [3, 79.8, 9.8, 44.8, 9, 10, 0],
- [3, 72.0, 10.2, 37.3, 7, 9, 1],
- [3, 95.3, 11.0, 51.5, 15, 23, 1],
- [3, 69.3, 8.5, 39.3, 4, 9, 0],
- [3, 89.8, 11.2, 58.2, 24, 25, 0],
- ], columns=columns)
- def nearest_neighbor_predict(train_features, train_target, new_features):
- distances = [distance.euclidean(train_features.loc[i].values, new_features) for i in range(train_features.shape[0])]
- best_index = np.array(distances).argsort()[1]
- return train_target.loc[best_index]
- train_features = df_train.drop('кондиционер', axis=1)
- train_target = df_train['кондиционер']
- new_apartment = np.array([2, 51.0, 8.2, 35.9, 5, 5])
- prediction = nearest_neighbor_predict(train_features, train_target, new_apartment)
- print(prediction)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement