Guest User

Untitled

a guest
Nov 21st, 2018
167
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 3.68 KB | None | 0 0
  1. from random import seed
  2. from random import randrange
  3. from csv import reader
  4.  
  5. # fungsi load file CSV
  6. def load_csv(filename):
  7. dataset = list()
  8. with open(filename, 'r') as file:
  9. csv_reader = reader(file)
  10. for row in csv_reader:
  11. if not row:
  12. continue
  13. dataset.append(row)
  14. return dataset
  15.  
  16. # fungsi mengubah tipe data string kolom dataset ke float
  17. def str_column_to_float(dataset, column):
  18. for row in dataset:
  19. row[column] = float(row[column].strip())
  20.  
  21. # fungsi mengubah tipe data string kolom dataset ke integer
  22. def str_column_to_int(dataset, column):
  23. class_values = [row[column] for row in dataset]
  24. unique = set(class_values)
  25. lookup = dict()
  26. for i, value in enumerate(unique):
  27. lookup[value] = i
  28. for row in dataset:
  29. row[column] = lookup[row[column]]
  30. return lookup
  31.  
  32. # membagi dataset menjadi k folds
  33. def cross_validation_split(dataset, n_folds):
  34. dataset_split = list()
  35. dataset_copy = list(dataset)
  36. fold_size = int(len(dataset) / n_folds)
  37. for i in range(n_folds):
  38. fold = list()
  39. while len(fold) < fold_size:
  40. index = randrange(len(dataset_copy))
  41. fold.append(dataset_copy.pop(index))
  42. dataset_split.append(fold)
  43. return dataset_split
  44.  
  45. # kalkulasi persentase akurasi
  46. def accuracy_metric(actual, predicted):
  47. correct = 0
  48. for i in range(len(actual)):
  49. if actual[i] == predicted[i]:
  50. correct += 1
  51. return correct / float(len(actual)) * 100.0
  52.  
  53. # mengevaluasi sebuah algoritma memakai cross_validation_split
  54. def evaluate_algorithm(dataset, algorithm, n_folds, *args):
  55. folds = cross_validation_split(dataset, n_folds)
  56. scores = list()
  57. for fold in folds:
  58. train_set = list(folds)
  59. train_set.remove(fold)
  60. train_set = sum(train_set, [])
  61. test_set = list()
  62. for row in fold:
  63. row_copy = list(row)
  64. test_set.append(row_copy)
  65. row_copy[-1] = None
  66. predicted = algorithm(train_set, test_set, *args)
  67. actual = [row[-1] for row in fold]
  68. accuracy = accuracy_metric(actual, predicted)
  69. scores.append(accuracy)
  70. return scores
  71.  
  72. # membuat sebuah prediksi dengan bobot
  73. def predict(row, weights):
  74. activation = weights[0]
  75. for i in range(len(row)-1):
  76. activation += weights[i + 1] * row[i]
  77. return 1.0 if activation >= 0.0 else 0.0
  78.  
  79. # menentukan bobot perceptron menggunakan stochastic gradient descent
  80. def train_weights(train, l_rate, n_epoch):
  81. weights = [0.0 for i in range(len(train[0]))]
  82. for epoch in range(n_epoch):
  83. for row in train:
  84. prediction = predict(row, weights)
  85. error = row[-1] - prediction
  86. weights[0] = weights[0] + l_rate * error
  87. for i in range(len(row)-1):
  88. weights[i + 1] = weights[i + 1] + l_rate * error * row[i]
  89. return weights
  90.  
  91. # algo preceptron dengan memakai stochastic gradient descent
  92. def perceptron(train, test, l_rate, n_epoch):
  93. predictions = list()
  94. weights = train_weights(train, l_rate, n_epoch)
  95. for row in test:
  96. prediction = predict(row, weights)
  97. predictions.append(prediction)
  98. return(predictions)
  99.  
  100. # tes algoritma perceptron pada dataset diabetes
  101. seed(1)
  102.  
  103. # load dan siapkan data
  104. filename = 'diabetes.csv'
  105. dataset = load_csv(filename)
  106. for i in range(len(dataset[0])-1):
  107. str_column_to_float(dataset, i)
  108.  
  109. # ubah kelas string ke integers
  110. str_column_to_int(dataset, len(dataset[0])-1)
  111.  
  112. # evaluasi algoritma
  113. n_folds = 5
  114. l_rate = 0.01
  115. n_epoch = 1000
  116. scores = evaluate_algorithm(dataset, perceptron, n_folds, l_rate, n_epoch)
  117. print('Scores: %s' % scores)
  118. print('Mean Accuracy: %.3f%%' % (sum(scores)/float(len(scores))))
Add Comment
Please, Sign In to add comment