Advertisement
Guest User

Untitled

a guest
Oct 23rd, 2019
94
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 0.68 KB | None | 0 0
  1. import pandas as pd
  2. from sklearn.cluster import MiniBatchKMeans
  3. from sklearn.model_selection import train_test_split
  4.  
  5.  
  6. pitch_data = pd.read_csv('/Users/juliekent/PycharmProjects/clusters/pitches.csv')
  7.  
  8. x = pitch_data['px'].round(2).dropna()
  9. z = pitch_data['pz'].round(2).dropna()
  10.  
  11. combined = pd.concat([x, z], axis=1)
  12. print(combined)
  13.  
  14. kmeans = MiniBatchKMeans(n_clusters=3, batch_size=1000)
  15. kmeans.fit(combined)
  16.  
  17. # cluster assignments
  18. print('{}\n'.format(repr(kmeans.labels_)))
  19.  
  20. # centroids
  21. print('{}\n'.format(repr(kmeans.cluster_centers_)))
  22.  
  23. import numpy as np
  24. new_obs = np.array([(0.5, 1.2), (0.42, 2.5), (-0.19, 2.0) ])
  25.  
  26. # predict clusters
  27. print('{}\n'.format(repr(kmeans.predict(new_obs))))
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement