Advertisement
Guest User

SAMUEL MIRA AQUI

a guest
Dec 11th, 2019
110
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Python 1.00 KB | None | 0 0
  1. from sklearn.base import BaseEstimator, TransformerMixin
  2. from sklearn.utils import check_array
  3.  
  4. # Elimina todas las variables que tengan un porcentaje de valores
  5. # iguales a 0 mayor que 0.4
  6. class MissingValuesTransformer(BaseEstimator, TransformerMixin):
  7.     def __init__(self, missing_values=0, missing_percentage=0.4):
  8.         self.missing_values = missing_values
  9.         self.missing_percentage = missing_percentage
  10.    
  11.     def fit(self, X, y=None):
  12.         X = check_array(X)
  13.         self.n_features_ = X.shape[1]
  14.         self.columns_ = np.sum(
  15.             X == self.missing_values,
  16.             axis=0) / X.shape[0] <= self.missing_percentage
  17.         return self
  18.    
  19.     def transform(self, X, y=None):
  20.         X = check_array(X)
  21.         if self.n_features_ != X.shape[1]:
  22.             raise ValueError("Se han recibido de entrada {} características cuando se esperaban {}.".format(X.shape[1],self.n_features_))
  23.         return X[:, self.columns_]
  24.  
  25. pima_remover = MissingValuesTransformer()
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement