Advertisement
Guest User

Dummy Classifier Workshop Thing

a guest
Nov 19th, 2019
150
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Python 1.20 KB | None | 0 0
  1. import pickle
  2. import os
  3. from sklearn.model_selection import train_test_split
  4. from sklearn.dummy import DummyRegressor
  5. import seaborn as sns
  6.  
  7. # Set a random seed so that we can see the difference between classifiers
  8. random_seed = 1
  9.  
  10. # Load data from the internet, or from cache if available on disk
  11. if not os.path.isfile("regression_data.pkl"):
  12.     df_mpg = sns.load_dataset('mpg')
  13.     df_mpg = df_mpg.dropna()
  14.     df_mpg = df_mpg.drop('origin', axis=1)
  15.     df_mpg = df_mpg.drop('name', axis=1)
  16.  
  17.     X = df_mpg.drop('mpg', axis=1)
  18.     y = df_mpg['mpg']
  19.  
  20.     pickle.dump((X, y), open("regression_data.pkl", "wb"))
  21. else:
  22.     print("Loading data...")
  23.     X, y = pickle.load(open("regression_data.pkl", "rb"))
  24.  
  25. # Separate train/test data from original data
  26. print("Splitting test and train data...")
  27. X_train, X_test, y_train, y_test = train_test_split(X, y, train_size=0.8, test_size=0.2, random_state=random_seed)
  28.  
  29. # Create your classifier
  30. classifier = DummyRegressor()
  31.  
  32. # Fit the classifier
  33. print("Fitting the classifier...")
  34. classifier.fit(X_train, y_train)
  35.  
  36. print("Training set score: %f" % classifier.score(X_train, y_train))
  37. print("Test set score: %f" % classifier.score(X_test, y_test))
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement