Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
def outliers_zscore(data, col, col_zscores, outlier_thresh=3):
    """Drop the rows of ``data`` whose ``col`` value is a z-score outlier.

    A row is kept when ``abs((value - mean) / stdev) <= outlier_thresh``,
    where ``mean`` and ``stdev`` come from ``data[col].mean()`` and
    ``data[col].std()``. Rows whose ``col`` value is missing never satisfy
    that comparison and are therefore dropped as well.

    Args:
        data: pandas DataFrame to filter. It is not modified.
        col: Name of the numeric column to test for outliers.
        col_zscores: Name formerly used for a temporary z-score column.
            Kept for backward compatibility; a column with this name is
            never present in the result.
        outlier_thresh: Largest absolute z-score that is still kept.
            Defaults to 3.

    Returns:
        A new DataFrame holding only the rows that passed the filter.
    """
    deviations = data[col] - data[col].mean()
    stdev = data[col].std()

    # A zero or undefined spread (constant column, single row) means no value
    # deviates from the mean. Dividing would turn every z-score into NaN and
    # silently discard all rows, so the raw (all-zero) deviations are used.
    zscores = deviations / stdev if stdev > 0 else deviations

    # The z-scores live in their own Series instead of a scratch column, so
    # the caller's frame is never written to (no leaked column, no chained
    # assignment on a filtered slice).
    keep = zscores.abs() <= outlier_thresh

    # ``drop`` returns a new frame; ``errors="ignore"`` covers the usual case
    # where ``col_zscores`` does not exist in ``data``.
    return data[keep].drop(columns=[col_zscores], errors="ignore")
# Filter price outliers first, then odometer outliers on what remains, so the
# odometer statistics are computed from the already price-filtered rows.
autos_zscore = outliers_zscore(
    outliers_zscore(autos, 'price_dollar', 'price_zscores'),
    'odometer_km',
    'Odometer_zscores',
)
Add Comment
Please, Sign In to add comment