Advertisement
Guest User

asd

a guest
Feb 20th, 2020
175
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 0.92 KB | None | 0 0
  1. # -*- coding: utf-8 -*-
  2. """
  3. Created on Thu Feb 20 15:44:48 2020
  4.  
  5. @author: User
  6. """
  7.  
  8. import pandas
  9. import numpy as np
  10. from sklearn.impute import SimpleImputer
  11. # membaca file dan direktori tempat iris.data.missing.csv disimpan
  12. direktori = "bjir.csv"
  13. # memberi nama variabel
  14. names = ['class','age', 'sex','steroid','antiviral','fatigue', 'malaise','anorexia','liver-big','liver-firm', 'spleen-palpable','spiders','ascites','varices', 'bilirubin','alk-phosphate','sgot','albumin', 'protime','histology']
  15. # membaca data dengan library panda
  16. datamissing = pandas.read_csv(direktori, names=names, na_values=["?"])
  17. #panggil dataset
  18. array = datamissing.values
  19. # pisah input dan output
  20. x = array[:,0:19] #inputnya adalah kolom ke-0, 1, 2, 3
  21. y = array[:,0] #outputnya adalah kolom ke 4
  22. #imputasi mean
  23. imp = SimpleImputer(missing_values=np.nan, strategy="mean")
  24. #simpan hasil imputasi ke dalam variable X
  25. X = imp.fit_transform(x)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement