beegie_b

LinearMAE

Nov 11th, 2013
__author__ = 'Miroslaw Horbal'
__email__ = 'miroslaw@gmail.com'
__date__ = '2013-03-09'

import numpy as np
from scipy import optimize

OPTIMIZATION_FUNCTIONS = {'cg':   optimize.fmin_cg,
                          'bfgs': optimize.fmin_bfgs}

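# NOTE: LinearMAE.fit below calls module-level `cost` and `grad` functions that are
# not included in the original paste. The two functions here are a minimal sketch of
# what they could look like -- mean absolute error plus l1/l2 penalties on the
# non-intercept weights -- and are an assumption, not the author's original code.

def cost(coef, X, y, l1=0.0, l2=0.0):
    """MAE of the linear model plus l1/l2 penalties (sketch).

    coef is the flattened (n+1, o) weight array; its first row is the intercept.
    """
    m, n = X.shape
    o = y.shape[1]
    coef = np.reshape(coef, (n + 1, o))
    pred = X.dot(coef[1:]) + coef[0]
    mae = np.mean(np.abs(pred - y))
    return mae + l1 * np.sum(np.abs(coef[1:])) + 0.5 * l2 * np.sum(coef[1:] ** 2)

def grad(coef, X, y, l1=0.0, l2=0.0):
    """Gradient of `cost` with respect to the flattened coef (sketch)."""
    m, n = X.shape
    o = y.shape[1]
    coef = np.reshape(coef, (n + 1, o))
    pred = X.dot(coef[1:]) + coef[0]
    # Derivative of mean(|pred - y|) with respect to each prediction
    dpred = np.sign(pred - y) / float(m * o)
    g = np.empty_like(coef)
    g[0] = dpred.sum(axis=0)                                  # intercept row
    g[1:] = X.T.dot(dpred) + l1 * np.sign(coef[1:]) + l2 * coef[1:]
    return g.flatten()
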
class LinearMAE(object):
    """Linear model with Mean Absolute Error loss"""
    def __init__(self, l1=0.0, l2=0.0, opt='bfgs', maxiter=1000,
                 tol=1e-4, verbose=False):
        """
        Parameters:
          l1 - magnitude of the l1 penalty (default 0.0)
          l2 - magnitude of the l2 penalty (default 0.0)
          opt - optimization algorithm to use for gradient descent;
                options are 'cg' and 'bfgs' (default 'bfgs')
          maxiter - maximum number of iterations (default 1000)
          tol - terminate optimization when the gradient norm is smaller than tol (default 1e-4)
          verbose - display convergence information at each iteration (default False)
        """
        self.opt = opt
        self.maxiter = maxiter
        self.tol = tol
        self.l1 = l1
        self.l2 = l2
        self.verbose = verbose

    @property
    def opt(self):
        """Optimization algorithm to use for gradient descent"""
        return self._opt

    @opt.setter
    def opt(self, o):
        """
        Set the optimization algorithm for gradient descent

        Parameters:
          o - 'cg' for conjugate gradient descent
              'bfgs' for the BFGS algorithm
        """
        if o not in OPTIMIZATION_FUNCTIONS:
            raise ValueError('Unknown optimization routine %s' % o)
        self._opt = o
        self._optimize = OPTIMIZATION_FUNCTIONS[o]

    def score(self, X, y):
        """
        Compute the MAE of the linear model prediction on X against y

        Must only be run after calling fit

        Parameters:
          X - data array for the linear model. Has shape (m,n)
          y - output target array for the linear model. Has shape (m,o)
        """
        y = _2d(y)
        pred = self.predict(X)
        return np.mean(np.abs(pred - y))

    def predict(self, X):
        """
        Compute the linear model prediction on X

        Must only be run after calling fit

        Parameters:
          X - data array for the linear model. Has shape (m,n)
        """
        return X.dot(self.coef_[1:]) + self.coef_[0]

    def fit(self, X, y, coef=None):
        """
        Fit the linear model using gradient descent methods

        Parameters:
          X - data array for the linear model. Has shape (m,n)
          y - output target array for the linear model. Has shape (m,o)
          coef - None or an initial weight array of shape (n+1, o)

        Sets attributes:
          coef_ - the weights of the linear model
        """
        y = _2d(y)
        m, n = X.shape
        m, o = y.shape
        if coef is None:
            coef = np.zeros((n+1, o))
        elif coef.shape != (n+1, o):
            raise ValueError('coef must be None or have shape %s' % str((n+1, o)))
        self._coef_shape = coef.shape
        coef = self._optimize(f=cost,
                              x0=coef.flatten(),
                              fprime=grad,
                              args=(X, y, self.l1, self.l2),
                              gtol=self.tol,
                              maxiter=self.maxiter,
                              disp=0,
                              callback=self._callback(X, y))
        self.coef_ = np.reshape(coef, self._coef_shape)
        return self

    def _callback(self, X, y):
        """
        Helper method that generates a callback function for the optimization
        algorithm opt when verbose is set to True
        """
        def callback(coef):
            self.i += 1
            self.coef_ = np.reshape(coef, self._coef_shape)
            score = self.score(X, y)
            print('iter %i | Score: %f' % (self.i, score))
        self.i = 0
        return callback if self.verbose else None

def _2d(a):
    """Return a 2d view of a, reshaping to (len(a), 1) if a is 1-dimensional"""
    if len(a.shape) == 1:
        # Reshape instead of mutating a.shape so the caller's array is left untouched
        a = a.reshape(len(a), 1)
    return a
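
# A hypothetical usage sketch (not part of the original paste): fit the model on
# synthetic data, then score and predict. The data and hyperparameter values are
# made up for illustration, and the run relies on the `cost`/`grad` sketch above.
if __name__ == '__main__':
    rng = np.random.RandomState(0)
    X = rng.randn(200, 5)
    true_coef = rng.randn(5, 1)
    y = X.dot(true_coef) + 0.1 * rng.randn(200, 1)

    model = LinearMAE(l1=0.0, l2=1e-4, opt='bfgs', maxiter=500, verbose=False)
    model.fit(X, y)
    print('train MAE: %f' % model.score(X, y))
    print('first 3 predictions: %s' % model.predict(X[:3]))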