Advertisement
Guest User

Untitled

a guest
Nov 14th, 2018
102
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
R 5.09 KB | None | 0 0
  1.  
  2. set.seed(1234)
  3. #import datasets
  4. green <- read.csv("C:/Users/tiago/Desktop/CDados/dataset2/green.csv")
  5. hinselmann <- read.csv("C:/Users/tiago/Desktop/CDados/dataset2/hinselmann.csv")
  6. schiller <- read.csv("C:/Users/tiago/Desktop/CDados/dataset2/schiller.csv")
  7. group <- rbind(green,hinselmann,schiller)
  8. nb <- NULL
  9.  
  10.  
  11. #turn some variables factors
  12. factorize <- function(dataset){
  13.   dataset$experts..0 <- as.factor(dataset$experts..0)
  14.   dataset$experts..1 <- as.factor(dataset$experts..1)
  15.   dataset$experts..2 <- as.factor(dataset$experts..2)
  16.   dataset$experts..3 <- as.factor(dataset$experts..3)
  17.   dataset$experts..4 <- as.factor(dataset$experts..4)
  18.   dataset$experts..5 <- as.factor(dataset$experts..5)
  19.   dataset$consensus <- as.factor(dataset$consensus)
  20.  
  21.   return(dataset)
  22.  
  23. }
  24.  
  25. group <- factorize(group)
  26. green <- factorize(green)
  27. hinselmann <- factorize(hinselmann)
  28. schiller <- factorize(schiller)
  29.  
  30. #remove cervix_area because we will have problems in preProcess with it in future computations
  31. group$cervix_area <- NULL
  32. green$cervix_area <- NULL
  33. hinselmann$cervix_area <- NULL
  34. schiller$cervix_area <- NULL
  35.  
  36. # Random splitting of data as 70% train and 30%test datasets
  37.  
  38. #group
  39. indexC_group <- createDataPartition(group$consensus, p=0.70, list=FALSE)
  40. trainDataC_group = group[indexC_group,]
  41. testDataC_group = group[-indexC_group,]
  42.  
  43.  
  44.  
  45. #green
  46. indexC_green <- createDataPartition(green$consensus, p=0.70, list=FALSE)
  47. trainDataC_green = green[indexC_green,]
  48. testDataC_green = green[-indexC_green,]
  49.  
  50.  
  51. #hinselmann
  52. indexC_hinselmann <- createDataPartition(hinselmann$consensus, p=0.70, list=FALSE)
  53. trainDataC_hinselmann = hinselmann[indexC_hinselmann,]
  54. testDataC_hinselmann = hinselmann[-indexC_hinselmann,]
  55.  
  56.  
  57. #schiller
  58. indexC_schiller <- createDataPartition(schiller$consensus, p=0.70, list=FALSE)
  59. trainDataC_schiller = schiller[indexC_schiller,]
  60. testDataC_schiller = schiller[-indexC_schiller,]
  61.  
  62.  
  63. #clustering
  64. cl <- makeCluster(8, type="SOCK")
  65. registerDoSNOW(cl)
  66.  
  67. grid <- data.frame(fL=c(0.5,1.0), usekernel = TRUE, adjust=c(0.5,1.0))
  68.  
  69.  
  70. # define training control
  71. train_control <- trainControl(method="repeatedcv", number=10)
  72.  
  73. #train based on consensus with and without pp
  74. nb.model_nbC_group_cv = train(trainDataC_group[1:(length(trainDataC_group)-8)], trainDataC_group$consensus, method="nb", trControl=train_control, tuneGrid=grid)
  75. nb.model_nbC_group_pp_c_S_cv = train(trainDataC_group[1:(length(trainDataC_group)-8)], trainDataC_group$consensus, method="nb", trControl=train_control, tuneGrid=grid, preProcess=c("center", "scale"))
  76. nb.model_nbC_group_pp_pca_cv = train(trainDataC_group[1:(length(trainDataC_group)-8)], trainDataC_group$consensus, method="nb", trControl=train_control, tuneGrid=grid, preProcess=c("center", "scale","pca"))
  77.  
  78. nb.model_nbC_green_cv = train(trainDataC_green[1:(length(trainDataC_green)-8)], trainDataC_green$consensus, method="nb", trControl=train_control, tuneGrid=grid)
  79. nb.model_nbC_green_pp_c_S_cv = train(trainDataC_green[1:(length(trainDataC_green)-8)], trainDataC_green$consensus, method="nb", trControl=train_control, tuneGrid=grid, preProcess=c("center", "scale"))
  80. nb.model_nbC_green_pp_pca_cv = train(trainDataC_green[1:(length(trainDataC_green)-8)], trainDataC_green$consensus, method="nb", trControl=train_control, tuneGrid=grid, preProcess=c("center", "scale","pca"))
  81.  
  82. nb.model_nbC_hinselmann_cv = train(trainDataC_hinselmann[1:(length(trainDataC_hinselmann)-8)], trainDataC_hinselmann$consensus, method="nb", trControl=train_control, tuneGrid=grid)
  83. nb.model_nbC_hinselmann_pp_c_S_cv = train(trainDataC_hinselmann[1:(length(trainDataC_hinselmann)-8)], trainDataC_hinselmann$consensus, method="nb", trControl=train_control, tuneGrid=grid, preProcess=c("center", "scale"))
  84. nb.model_nbC_hinselmann_pp_pca_cv = train(trainDataC_hinselmann[1:(length(trainDataC_hinselmann)-8)], trainDataC_hinselmann$consensus, method="nb", trControl=train_control, tuneGrid=grid, preProcess=c("center", "scale","pca"))
  85.  
  86. nb.model_nbC_schiller_cv = train(trainDataC_schiller[1:(length(trainDataC_schiller)-8)], trainDataC_schiller$consensus, method="nb", trControl=train_control, tuneGrid=grid)
  87. nb.model_nbC_schiller_pp_c_S_cv = train(trainDataC_schiller[1:(length(trainDataC_schiller)-8)], trainDataC_schiller$consensus, method="nb", trControl=train_control, tuneGrid=grid, preProcess=c("center", "scale"))
  88. nb.model_nbC_schiller_pp_pca_cv = train(trainDataC_schiller[1:(length(trainDataC_schiller)-8)], trainDataC_schiller$consensus, method="nb", trControl=train_control, tuneGrid=grid, preProcess=c("center", "scale","pca"))
  89.  
  90. stopCluster(cl)
  91.  
  92. nb.model_nbC_group_cv$results$Accuracy
  93. nb.model_nbC_group_pp_c_S_cv$results$Accuracy
  94. nb.model_nbC_group_pp_pca_cv$results$Accuracy
  95.  
  96. nb.model_nbC_green_cv$results$Accuracy
  97. nb.model_nbC_green_pp_c_S_cv$results$Accuracy
  98. nb.model_nbC_green_pp_pca_cv$results$Accuracy
  99.  
  100. nb.model_nbC_hinselmann_cv$results$Accuracy
  101. nb.model_nbC_hinselmann_pp_c_S_cv$results$Accuracy
  102. nb.model_nbC_hinselmann_pp_pca_cv$results$Accuracy
  103.  
  104. nb.model_nbC_schiller_cv$results$Accuracy
  105. nb.model_nbC_schiller_pp_c_S_cv$results$Accuracy
  106. nb.model_nbC_schiller_pp_pca_cv$results$Accuracy
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement