Advertisement
Guest User

Untitled

a guest
May 20th, 2019
253
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
R 1.22 KB | None | 0 0
  1. library(dplyr)
  2. library(caret)
  3. library(randomForest)
  4. library(ModelMetrics)
  5. setwd("F:/pajtoon/lab 11")
  6. load('dataLeukemia.RData')
  7.  
  8. View(data[1:100,1:100])
  9. names(data)[1:10]
  10. unique(data$Leukemia.class)
  11.  
  12. set.data = data[data$Leukemia.class == "AML with normal karyotype + other abnormalities" |data$Leukemia.class == "CLL", -c(1,3)]
  13. set.data$Leukemia.class = as.numeric(set.data$Leukemia.class)/6-1
  14. View(set.data[,1:100])
  15. rm(data)
  16. v=1:length(set.data$Leukemia.class)
  17.  
  18. index.test = sample(v,round(length(set.data$Leukemia.class)/3))
  19. index.train = v[-index.test]
  20.  
  21. data.train = set.data[index.train,]
  22. data.test = set.data[index.test,]
  23.  
  24. result = randomForest(x=data.train[,-1], y=as.factor(data.train[,1]), importance = TRUE)
  25. var.imp = result$importance  # View(var.imp)
  26. var.imp100 = row.names(var.imp[order(var.imp[,4], decreasing = TRUE),])[1:100]
  27. View(var.imp[order(var.imp[,4], decreasing = TRUE),])
  28. var.pred.test = predict(result, x=data.test[,var.imp100])
  29. print(auc(as.factor(data.test[,1]), var.pred.test))
  30.  
  31. result2 = randomForest(x=data.train[,var.imp100], y=as.factor(data.train[,1]), importance = TRUE)
  32. var.pred.test = predict(result2, x=data.test[,var.imp100])
  33. print(auc(as.factor(data.test[,1]), var.pred.test))
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement