Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- import matplotlib.pyplot as plt
- import numpy as np
- import matplotlib.patches as patches
- from scipy import linalg
- from matplotlib import colors
- from sklearn.discriminant_analysis import LinearDiscriminantAnalysis, QuadraticDiscriminantAnalysis
- # #############################################################################
- # Colormap
- cmap = colors.LinearSegmentedColormap(
- 'red_blue_classes',
- {'red': [(0, 1, 1), (1, 0.7, 0.7)],
- 'green': [(0, 0.7, 0.7), (1, 0.7, 0.7)],
- 'blue': [(0, 0.7, 0.7), (1, 1, 1)]})
- plt.cm.register_cmap(cmap=cmap)
- # #############################################################################
- # Generate datasets
- def dataset_fixed_cov():
- n, dim = 300, 2
- np.random.seed(0)
- C = np.array([[0., -0.23], [0.83, .23]])
- X = np.r_[np.dot(np.random.randn(n, dim), C),
- np.dot(np.random.randn(n, dim), C) + np.array([1, 1])]
- y = np.hstack((np.zeros(n), np.ones(n)))
- return X, y
- def dataset_cov():
- n, dim = 300, 2
- np.random.seed(0)
- C = np.array([[0., -1.], [2.5, .7]]) * 2.
- X = np.r_[np.dot(np.random.randn(n, dim), C),
- np.dot(np.random.randn(n, dim), C.T) + np.array([1, 4])]
- y = np.hstack((np.zeros(n), np.ones(n)))
- return X, y
- # #############################################################################
- # Plot functions
- def plot_data(lda, X, y, y_pred, fig_index):
- splot = plt.subplot(2, 2, fig_index)
- if fig_index == 1:
- plt.title('Линейный дискриминантный анализ')
- plt.ylabel('Данные с\n фиксированной ковариацией')
- elif fig_index == 2:
- plt.title('Квадратичный дискриминантный анализ')
- elif fig_index == 3:
- plt.ylabel('Данные с\n изменяющимися ковариациями')
- tp = (y == y_pred)
- tp0, tp1 = tp[y == 0], tp[y == 1]
- X0, X1 = X[y == 0], X[y == 1]
- X0_tp, X0_fp = X0[tp0], X0[~tp0]
- X1_tp, X1_fp = X1[tp1], X1[~tp1]
- plt.scatter(X0_tp[:, 0], X0_tp[:, 1], marker='.', color='red')
- plt.scatter(X0_fp[:, 0], X0_fp[:, 1], marker='x', s=20, color='#990000')
- plt.scatter(X1_tp[:, 0], X1_tp[:, 1], marker='.', color='blue')
- plt.scatter(X1_fp[:, 0], X1_fp[:, 1], marker='x', s=20, color='#000099')
- # Вставляем код для построения эллипса для класса 0
- v, w = linalg.eigh(lda.covariance_)
- u = w[0] / linalg.norm(w[0])
- angle = np.arctan(u[1] / u[0])
- angle = 180 * angle / np.pi
- ell = patches.Ellipse(lda.means_[0], 2 * v[0] ** 0.5, 2 * v[1] ** 0.5,
- 180 + angle, facecolor='none', edgecolor='red', linewidth=2)
- splot.add_patch(ell)
- # Вставляем код для построения эллипса для класса 1
- v, w = linalg.eigh(lda.covariance_)
- u = w[0] / linalg.norm(w[0])
- angle = np.arctan(u[1] / u[0])
- angle = 180 * angle / np.pi
- ell = patches.Ellipse(lda.means_[1], 2 * v[0] ** 0.5, 2 * v[1] ** 0.5,
- 180 + angle, facecolor='none', edgecolor='blue', linewidth=2)
- splot.add_patch(ell)
- nx, ny = 200, 100
- x_min, x_max = plt.xlim()
- y_min, y_max = plt.ylim()
- xx, yy = np.meshgrid(np.linspace(x_min, x_max, nx),
- np.linspace(y_min, y_max, ny))
- Z = lda.predict_proba(np.c_[xx.ravel(), yy.ravel()])
- Z = Z[:, 1].reshape(xx.shape)
- plt.pcolormesh(xx, yy, Z, cmap='red_blue_classes', norm=colors.Normalize(0., 1.), zorder=0)
- plt.contour(xx, yy, Z, [0.5], linewidths=2., colors='white')
- plt.plot(lda.means_[0][0], lda.means_[0][1], '*', color='yellow', markersize=15, markeredgecolor='grey')
- plt.plot(lda.means_[1][0], lda.means_[1][1], '*', color='yellow', markersize=15, markeredgecolor='grey')
- splot.set_xticks(())
- splot.set_yticks(())
- # #############################################################################
- # Main Code
- plt.figure(figsize=(10, 8), facecolor='white')
- plt.suptitle('Линейный Дискриминантный Анализ vs Квадратичный Дискриминантный Анализ',
- y=0.98, fontsize=15)
- for i, (X, y) in enumerate([dataset_fixed_cov(), dataset_cov()]):
- lda = LinearDiscriminantAnalysis(solver="svd", store_covariance=True)
- y_pred = lda.fit(X, y).predict(X)
- splot = plot_data(lda, X, y, y_pred, fig_index=2 * i + 1)
- plt.axis('tight')
- qda = QuadraticDiscriminantAnalysis(store_covariance=True)
- y_pred = qda.fit(X, y).predict(X)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement