import numpy as np
import tensorflow as tf
from tensorflow import keras
from tensorflow.keras import backend as K
from tensorflow.keras.models import Sequential, load_model
from tensorflow.keras.layers import Dense, Dropout, Flatten
from tensorflow.keras.layers import Conv2D, MaxPooling2D, BatchNormalization
from tensorflow.keras.optimizers import Adam
from tensorflow.keras.utils import to_categorical
from tensorflow.keras import regularizers
from sklearn.metrics import precision_recall_fscore_support, confusion_matrix
# import load_data  # only needed for the commented-out loadall() path in main()
import matplotlib
matplotlib.use("Agg")  # render figures to files; no display required
from matplotlib import pyplot as plt
import itertools
import os

# use the GPU to train!
# os.environ["CUDA_VISIBLE_DEVICES"] = "0"

# Genre labels of the GTZAN dataset, used when plotting confusion matrices
song_labels = ["Blues", "Classical", "Country", "Disco", "Hip hop", "Jazz", "Metal", "Pop", "Reggae", "Rock"]
def plot_confusion_matrix(cm, classes, normalize=False, title='Confusion matrix', cmap=plt.cm.Blues):
    """
    This function prints and plots the confusion matrix.
    Normalization can be applied by setting `normalize=True`.
    """
    if normalize:
        cm = cm.astype('float') / cm.sum(axis=1)[:, np.newaxis]
        print("Normalized confusion matrix")
    else:
        print('Confusion matrix, without normalization')
    print(cm)

    plt.imshow(cm, interpolation='nearest', cmap=cmap)
    plt.title(title)
    plt.colorbar()
    tick_marks = np.arange(len(classes))
    plt.xticks(tick_marks, classes, rotation=45)
    plt.yticks(tick_marks, classes)

    fmt = '.1f' if normalize else 'd'
    thresh = cm.max() / 2.
    for i, j in itertools.product(range(cm.shape[0]), range(cm.shape[1])):
        plt.text(j, i, format(cm[i, j], fmt),
                 horizontalalignment="center",
                 color="white" if cm[i, j] > thresh else "black")

    plt.ylabel('True label')
    plt.xlabel('Predicted label')
    plt.tight_layout()
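
# Worked example (illustrative numbers, not from this project): row-normalizing
# the 2x2 count matrix [[5, 1], [2, 4]] gives [[0.83, 0.17], [0.33, 0.67]];
# each row then sums to 1 and the diagonal reads as per-class recall.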
def metric(y_true, y_pred):
    # top-1 categorical accuracy: fraction of samples whose predicted class matches the true class
    return K.mean(K.equal(K.argmax(y_true, axis=1), K.argmax(y_pred, axis=1)))
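
# Example (illustrative values only): with one-hot targets [[1, 0], [0, 1]] and
# predictions [[0.9, 0.1], [0.8, 0.2]], the argmaxes are [0, 1] vs. [0, 0],
# so metric() evaluates to 0.5.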
def cnn(num_genres=10, input_shape=(64, 173, 1)):
    model = Sequential()
    model.add(Conv2D(64, kernel_size=(4, 4),
                     activation='relu',  # kernel_regularizer=regularizers.l2(0.04),
                     input_shape=input_shape))
    model.add(BatchNormalization())
    model.add(MaxPooling2D(pool_size=(2, 4)))

    model.add(Conv2D(64, (3, 5), activation='relu', kernel_regularizer=regularizers.l2(0.04)))
    model.add(MaxPooling2D(pool_size=(2, 2)))
    model.add(Dropout(0.2))

    model.add(Conv2D(64, (2, 2), activation='relu'))  # kernel_regularizer=regularizers.l2(0.04)
    model.add(BatchNormalization())
    model.add(MaxPooling2D(pool_size=(2, 2)))
    model.add(Dropout(0.2))

    model.add(Flatten())
    model.add(Dense(64, activation='relu', kernel_regularizer=regularizers.l2(0.04)))
    model.add(Dropout(0.5))
    model.add(Dense(32, activation='relu', kernel_regularizer=regularizers.l2(0.04)))
    model.add(Dense(num_genres, activation='softmax'))

    model.compile(loss=keras.losses.categorical_crossentropy,
                  optimizer=Adam(learning_rate=0.001, beta_1=0.9, beta_2=0.999, epsilon=1e-08),
                  metrics=[metric])
    return model
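
# A minimal smoke test for the architecture above (a hypothetical helper, not
# part of the original paste): feed one zero-valued batch through the network
# and check that a single 10-way softmax row comes back. Assumes the default
# (64, 173, 1) mel-spectrogram input shape.
def _smoke_test_cnn():
    m = cnn()
    out = m.predict(np.zeros((1, 64, 173, 1), dtype=np.float32))
    assert out.shape == (1, 10)  # one probability per genre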
class MusicGenreCNN(object):
    # Main network wrapper used for training (renamed from `model` to avoid
    # shadowing the local variables of the same name)
    def __init__(self, ann_model):
        self.model = ann_model()

    def train_model(self, train_x, train_y, val_x=None, val_y=None,
                    small_batch_size=200,
                    max_iteration=300,
                    print_interval=1,
                    test_x=None, test_y=None):
        """
        The number of epochs is a hyperparameter that defines how many times
        the learning algorithm works through the entire training dataset.
        """
        m = len(train_x)

        for it in range(max_iteration):
            # reshuffle, then split the training data into even batches
            batch_idx = np.random.permutation(m)
            train_x = train_x[batch_idx]
            train_y = train_y[batch_idx]
            num_batches = m // small_batch_size  # a tail smaller than one batch is skipped
            for batch in range(num_batches):
                x_batch = train_x[batch * small_batch_size: (batch + 1) * small_batch_size]
                y_batch = train_y[batch * small_batch_size: (batch + 1) * small_batch_size]
                print("starting batch\t", batch, "\t Epoch:\t", it)
                self.model.train_on_batch(x_batch, y_batch)

            if it % print_interval == 0:
                validation_accuracy = self.model.evaluate(val_x, val_y)
                training_accuracy = self.model.evaluate(train_x, train_y)
                testing_accuracy = self.model.evaluate(test_x, test_y)
                # the test error should be looked at only after development of the model
                print("\nTraining accuracy: %f\t Validation accuracy: %f\t Testing Accuracy: %f" %
                      (training_accuracy[1], validation_accuracy[1], testing_accuracy[1]))
                print("\nTraining loss: %f \t Validation loss: %f \t Testing Loss: %f \n" %
                      (training_accuracy[0], validation_accuracy[0], testing_accuracy[0]))
                print()

                # if validation accuracy exceeds 0.81, save the model and plot a confusion matrix
                if validation_accuracy[1] > .81:
                    print("Saving confusion data...")
                    model_name = "model" + str(100 * validation_accuracy[1]) + str(100 * testing_accuracy[1]) + ".h5"
                    self.model.save(model_name)
                    # predict() returns softmax probabilities, so take the argmax to get
                    # class labels (predict_classes() was removed from recent Keras versions)
                    pred = np.argmax(self.model.predict(test_x, verbose=1), axis=1)
                    cnf_matrix = confusion_matrix(np.argmax(test_y, axis=1), pred)
                    np.set_printoptions(precision=2)
                    # visualization
                    plt.figure()
                    plot_confusion_matrix(cnf_matrix,
                                          classes=song_labels,
                                          normalize=True,
                                          title='Normalized confusion matrix')
                    print(precision_recall_fscore_support(np.argmax(test_y, axis=1), pred, average='macro'))
                    plt.savefig(str(it) + ".png", dpi=600)  # one figure per qualifying epoch
    # def model_predict(self, test_x, test_y):
    #     pred = np.argmax(self.model.predict(test_x, verbose=1), axis=1)
    #     cnf_matrix = confusion_matrix(np.argmax(test_y, axis=1), pred)
    #     np.set_printoptions(precision=2)
    #
    #     # visualization
    #     plt.figure()
    #     plot_confusion_matrix(cnf_matrix,
    #                           classes=song_labels,
    #                           normalize=True,
    #                           title='Normalized confusion matrix')
    #     print(precision_recall_fscore_support(np.argmax(test_y, axis=1), pred, average='macro'))
    #     plt.savefig("predict.png", dpi=600)
def main():
    # Load precomputed mel spectrograms and their genre labels
    # data = load_data.loadall('melspects.npz')
    tmp = np.load('melspects.npz')
    x_tr = tmp['x_tr']
    y_tr = tmp['y_tr']
    x_te = tmp['x_te']
    y_te = tmp['y_te']
    x_cv = tmp['x_cv']
    y_cv = tmp['y_cv']
    # data = {'x_tr': x_tr, 'y_tr': y_tr,
    #         'x_te': x_te, 'y_te': y_te,
    #         'x_cv': x_cv, 'y_cv': y_cv, }
    #
    # x_tr = data['x_tr']
    # y_tr = data['y_tr']
    # x_te = data['x_te']
    # y_te = data['y_te']
    # x_cv = data['x_cv']
    # y_cv = data['y_cv']

    # shuffle each split independently
    tr_idx = np.random.permutation(len(x_tr))
    te_idx = np.random.permutation(len(x_te))
    cv_idx = np.random.permutation(len(x_cv))
    x_tr = x_tr[tr_idx]
    y_tr = y_tr[tr_idx]
    x_te = x_te[te_idx]
    y_te = y_te[te_idx]
    x_cv = x_cv[cv_idx]
    y_cv = y_cv[cv_idx]

    # add a trailing channels axis for Conv2D: (n, 64, 173) -> (n, 64, 173, 1)
    x_tr = x_tr[:, :, :, np.newaxis]
    x_te = x_te[:, :, :, np.newaxis]
    x_cv = x_cv[:, :, :, np.newaxis]

    # one-hot encode the integer genre labels
    y_tr = to_categorical(y_tr)
    y_te = to_categorical(y_te)
    y_cv = to_categorical(y_cv)
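    # Shape check (values illustrative): to_categorical([0, 2, 1]) returns
    # [[1, 0, 0], [0, 0, 1], [0, 1, 0]]: one row per sample, one column per class.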
    # Alternative loading path from flattened GTZAN feature arrays:
    # training = np.load('gtzan/gtzan_tr.npy')
    # x_tr = np.delete(training, -1, 1)
    # label_tr = training[:, -1]
    # test = np.load('gtzan/gtzan_te.npy')
    # x_te = np.delete(test, -1, 1)
    # label_te = test[:, -1]
    # cv = np.load('gtzan/gtzan_cv.npy')
    # x_cv = np.delete(cv, -1, 1)
    # label_cv = cv[:, -1]
    # temp = np.zeros((len(label_tr), 10))
    # temp[np.arange(len(label_tr)), label_tr.astype(int)] = 1
    # y_tr = temp
    # temp = np.zeros((len(label_te), 10))
    # temp[np.arange(len(label_te)), label_te.astype(int)] = 1
    # y_te = temp
    # temp = np.zeros((len(label_cv), 10))
    # temp[np.arange(len(label_cv)), label_cv.astype(int)] = 1
    # y_cv = temp
    # del temp

    #################################################
    # Evaluation-only path for a previously saved model:
    # if True:
    #     model = keras.models.load_model('model84.082.0.h5', custom_objects={'metric': metric})
    #     print("Saving confusion data...")
    #     pred = np.argmax(model.predict(x_te, verbose=1), axis=1)
    #     cnf_matrix = confusion_matrix(np.argmax(y_te, axis=1), pred)
    #     np.set_printoptions(precision=1)
    #     plt.figure()
    #     plot_confusion_matrix(cnf_matrix, classes=song_labels, normalize=True, title='Normalized confusion matrix')
    #     print(precision_recall_fscore_support(np.argmax(y_te, axis=1), pred, average='macro'))
    #     plt.savefig("matrix", format='png', dpi=1000)
    #     raise SystemExit
    ann = MusicGenreCNN(cnn)
    ann.train_model(x_tr, y_tr, val_x=x_cv, val_y=y_cv, test_x=x_te, test_y=y_te)


if __name__ == '__main__':
    main()