"""Fisher linear discriminant classifier and list-based vector/matrix helpers."""

from ml import utilities
import numpy as np
import sys
from abc import ABC,abstractmethod
from functools import wraps

class ML(ABC):
    """Abstract interface for a model.

    Concrete subclasses must implement ``fit``, ``predict`` and ``score``.
    """

    # Class-level defaults. These are list objects stored on the class, so
    # every instance sees the same lists until it assigns its own attributes.
    intercept_ = []
    classes_ = []
    coef_ = []

    @abstractmethod
    def fit(self, X, y):
        """Train the model on samples ``X`` with targets ``y``."""

    @abstractmethod
    def predict(self, X):
        """Produce predictions for samples ``X``."""

    @abstractmethod
    def score(self, X, y):
        """Evaluate the model on samples ``X`` against targets ``y``."""


class FisherLinearDiscriminant(ML):
    '''
    One-vs-rest Fisher linear discriminant classifier.

    For every class c one discriminant is trained against the pooled samples
    of all the other classes ("rest"):

        w   = S_w^-1 * (m_rest - m_c)
        S_w = sum over n in c    of (x_n - m_c)    * (x_n - m_c)^T
            + sum over n in rest of (x_n - m_rest) * (x_n - m_rest)^T
        w0  = -w^T * (m_c + m_rest) / 2

    ``w^T x + w0`` is <= 0 at the mean of class c and >= 0 at the mean of the
    rest, so a sample is assigned to the class whose value is smallest.
    '''

    # Class-level default only; ``fit`` stores a fresh per-instance list.
    means_ = []

    def fit(self, X, y):
        """Fit one discriminant per class (one-vs-rest).

        Parameters
        ----------
        X : array-like, shape = (n_samples, n_features)
            Training data
        y : array-like, shape = (n_samples,)
            Target values, at least two distinct classes

        Returns
        -------
        self : returns an instance of self.

        Raises
        ------
        ValueError
            If X is not 2-D, if X and y differ in length, or if y holds
            fewer than two distinct classes.
        """
        samples = np.asarray(X, dtype=float)
        labels = list(y)
        if samples.ndim != 2:
            raise ValueError("X must have shape (n_samples, n_features)")
        if len(labels) != samples.shape[0]:
            raise ValueError("X and y must contain the same number of samples")
        classes = list(set(labels))
        if len(classes) < 2:
            raise ValueError("y must contain at least two distinct classes")

        # Rebind fresh lists on the instance. Appending to the inherited
        # class-level lists would leak fitted state across instances and
        # across repeated calls to fit().
        self.classes_ = classes
        self.means_ = []
        self.coef_ = []
        self.intercept_ = []

        for class_ in classes:
            in_class = np.array([label == class_ for label in labels], dtype=bool)
            class_samples = samples[in_class]
            rest_samples = samples[~in_class]

            class_mean = class_samples.mean(axis=0)
            # Mean over every sample outside the class, i.e. divided by the
            # number of those samples (not by the number of other classes).
            rest_mean = rest_samples.mean(axis=0)

            class_centered = class_samples - class_mean
            rest_centered = rest_samples - rest_mean
            # Sum of per-sample outer products == centered^T * centered.
            within_scatter = np.add(
                np.matmul(class_centered.T, class_centered),
                np.matmul(rest_centered.T, rest_centered),
            )

            # The pseudo-inverse keeps this usable when the scatter is singular.
            weights = np.matmul(np.linalg.pinv(within_scatter),
                                np.subtract(rest_mean, class_mean))
            midpoint = np.divide(np.add(rest_mean, class_mean), 2)

            self.means_.append(class_mean)
            self.coef_.append(weights)
            self.intercept_.append(-np.dot(weights, midpoint))
        return self

    def predict(self, X):
        """Perform classification on an array of test vectors X.

        Parameters
        ----------
        X : array-like, shape = (n_samples, n_features)

        Returns
        -------
        C : list, length n_samples
            Predicted target values for X, values are from ``classes_``

        Raises
        ------
        ValueError
            If the model has not been fitted or X is not 2-D.
        """
        return [self.classes_[index] for index in self._predict_indices(X)]

    def score(self, X, y):
        """Return the accuracy and the confusion matrix on the given data.

        Parameters
        ----------
        X : array-like, shape = (n_samples, n_features)
            Test samples.
        y : array-like, shape = (n_samples,)
            True labels for X; every label must be present in ``classes_``.

        Returns
        -------
        score : float
            Fraction of samples of X whose prediction equals the label in y.
        confusion_matrix : list of lists, n_classes x n_classes
            ``confusion_matrix[t][p]`` counts the samples whose true class
            index is ``t`` and predicted class index is ``p``, both indexing
            ``classes_``.

        Raises
        ------
        ValueError
            If X is empty, if X and y differ in length, if the model has not
            been fitted, or if a label of y is not in ``classes_``.
        """
        predicted_indices = self._predict_indices(X)
        labels = list(y)
        if not predicted_indices:
            raise ValueError("cannot score an empty set of samples")
        if len(labels) != len(predicted_indices):
            raise ValueError("X and y must contain the same number of samples")

        n_classes = len(self.classes_)
        confusion_matrix = [[0] * n_classes for _ in range(n_classes)]
        correct_predict = 0
        for label, predicted_index in zip(labels, predicted_indices):
            true_index = self.classes_.index(label)
            if true_index == predicted_index:
                correct_predict += 1
            confusion_matrix[true_index][predicted_index] += 1
        return float(correct_predict) / len(predicted_indices), confusion_matrix

    def _predict_indices(self, X):
        """Return, per sample of X, the index into ``classes_`` of the winner."""
        if len(X) == 0:
            return []
        if len(self.coef_) == 0:
            raise ValueError("the model must be fitted before predicting")
        samples = np.asarray(X, dtype=float)
        if samples.ndim != 2:
            raise ValueError("X must have shape (n_samples, n_features)")
        weights = np.asarray(self.coef_)        # (n_classes, n_features)
        offsets = np.asarray(self.intercept_)   # (n_classes,)
        scores = np.matmul(samples, weights.T) + offsets
        # argmin returns the first minimum, so ties go to the earliest class.
        return [int(index) for index in np.argmin(scores, axis=1)]

    def _sample_variance(self, class_mean, sample):
        """Return the outer product (sample - class_mean)(sample - class_mean)^T."""
        deviation = np.subtract(sample, class_mean)
        return np.matmul(np.transpose([deviation]), [deviation])

class LeastSquares(ML):
    """Placeholder model: none of its methods is implemented yet."""

    def fit(self, X, y):
        """Not implemented; does nothing and returns None."""
        pass

    def score(self, X, y):
        """Not implemented; does nothing and returns None."""
        pass

    def predict(self, X):
        """Not implemented; does nothing and returns None."""
        pass

def multipy_matrix(matrix_1, matrix_2):
    '''
    Matrix product of two 2-dimensional arrays
    ------------------------------------------
    matrix_1 :
        2 dimensional array (list of rows)
    matrix_2 :
        2 dimensional array (list of rows); it needs as many rows as
        matrix_1 has columns

    return :
        2 dimensional array with the rows of matrix_1 and the columns
        of matrix_2

    raises :
        ValueError when the columns of matrix_1 do not match the rows
        of matrix_2
    '''
    inner_size = len(matrix_2)
    if len(matrix_1[0]) != inner_size:
        raise ValueError('Number of column of vector 1 must equals Number of rows in second vector')

    n_rows = len(matrix_1)
    n_columns = len(matrix_2[0])

    # Rows of the transpose are the columns of matrix_2, so each cell is a
    # plain dot product of two rows.
    columns_of_2 = transpose_matrix(matrix_2)

    return [
        [dot_produnct(matrix_1[r], columns_of_2[c]) for c in range(n_columns)]
        for r in range(n_rows)
    ]


def transpose_matrix(matrix):
    '''
    Flip a matrix over its diagonal
    -------------------------------
    matrix :
            2 dimensional array (list of lists) or a flat vector

    return :
            transposed matrix as a list of lists; a flat vector of
            length n becomes n rows of one element each
    '''
    # Exact ``list`` check: a first element of any other type makes the
    # input be treated as a flat vector.
    if type(matrix[0]) is list:
        row_count = len(matrix[0])
    else:
        row_count = len(matrix)

    return [column(matrix, index) for index in range(row_count)]


def column(matrix, i):
    '''
    Extract one column
    ------------------
    matrix:
            2 dimensional array (list of lists) or a flat vector
    i :
        column index (element index for a flat vector)

    return :
        list with the i-th element of every row; for a flat vector a
        one-element list holding its i-th element
    '''
    # Exact ``list`` check: a first element of any other type makes the
    # input be treated as a flat vector.
    if type(matrix[0]) is list:
        return [line[i] for line in matrix]
    return [matrix[i]]

def dot_produnct(vector_1, vector_2):
    '''
    Dot product of two vectors
    --------------------------
    vector_1, vector_2 :
            sequences of numbers with the same length

    return :
            sum of the element-wise products (0 for empty vectors)

    raises :
            ValueError when the lengths differ
    '''
    size = len(vector_2)
    if len(vector_1) != size:
        raise ValueError('vector_1 and vector_2 must have the same lenght')

    total = 0
    for left, right in zip(vector_1, vector_2):
        total = total + left * right
    return total

def sum_two_vect(f_vect, s_vect):
    '''
    Element-wise sum of two vectors
    -------------------------------
    f_vect :
            array of first vector
    s_vect :
            array of second vector
    return
            list of pairwise sums; pairing stops at the end of the
            shorter vector
    '''
    totals = []
    for first, second in zip(f_vect, s_vect):
        totals.append(first + second)
    return totals

def subtract_two_vect(f_vect, s_vect):
    '''
    Element-wise difference of two vectors
    --------------------------------------
    f_vect :
            array of first vector (minuend)
    s_vect :
            array of second vector (subtrahend)
    return
            list of pairwise differences f_vect[i] - s_vect[i]; pairing
            stops at the end of the shorter vector
    '''
    differences = []
    for first, second in zip(f_vect, s_vect):
        differences.append(first - second)
    return differences

def sum_matrices(matrix_1, matrix_2):
    '''
    Element-wise sum of two matrices
    --------------------------------
    matrix_1 :
            2 dimensional array (list of rows)
    matrix_2 :
            2 dimensional array with the same size as matrix_1

    return :
            new 2 dimensional array holding matrix_1 + matrix_2

    raises :
            ValueError when the row counts differ or any pair of rows
            differs in length
    '''
    # The sizes are compared one at a time: combining two comparisons with
    # the bitwise ``|`` turns them into a chained comparison on
    # ``len(matrix_2) | len(matrix_1[0])``, which mis-detects sizes.
    if len(matrix_1) != len(matrix_2):
        raise ValueError("The two matrices must be the same size")

    result_matrix = []
    for row_1, row_2 in zip(matrix_1, matrix_2):
        # Checked per row so ragged input is rejected rather than truncated.
        if len(row_1) != len(row_2):
            raise ValueError("The two matrices must be the same size")
        result_matrix.append([x + y for x, y in zip(row_1, row_2)])

    return result_matrix

def div_arr_by_num(arr, num):
    '''
    Divide every element of an array by a number
    --------------------------------------------
    arr :
        array containing the numbers
    num :
        divisor applied to every element
    return :
        new list with each element of arr divided by num
    '''
    quotients = []
    for element in arr:
        quotients.append(element / num)
    return quotients

def matmult(a, b):
    '''
    Matrix product of two 2-dimensional arrays
    ------------------------------------------
    a :
        2 dimensional array (list of rows)
    b :
        2 dimensional array (list of rows)
    return :
        list of rows where cell [i][j] is the sum of the pairwise
        products of row i of a and column j of b
    '''
    # Materialise the columns of b once: zip() yields a one-shot iterator
    # in Python 3 and the columns are reused for every row of a.
    columns = list(zip(*b))

    product = []
    for row in a:
        product.append([sum(x * y for x, y in zip(row, col)) for col in columns])
    return product