Advertisement
Guest User

Untitled

a guest
May 23rd, 2018
69
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 1.78 KB | None | 0 0
  1. load('dataLeukemia.RData')
  2.  
  3. names(data[.1:10])
  4. data$Leukemia.class = as.numeric(data$Leukemia.class)
  5. data = data[.-c(1,3)]
  6. dataSel = data[data$Leukemia.class ==11 |data$Leukemia.class ==15,]
  7. table(data_sel$Leukemia.class)
  8.  
  9. indexTrain = indexTest = list()
  10. indexAll = 1:391
  11. indexTest[[1]]= c(1:66,199:262)
  12. indexTrain[[1]]= indexAll[-c(1:66,199:262)]
  13. indexTest[[2]]= c(67:132,263:327)
  14. indexTrain[[2]]= indexAll[-c(67:132,263:327)]
  15. indexTest[[3]]= c(133:198,328:391)
  16. indexTrain[[3]]= indexAll[-c(133:198,328:391)]
  17.  
  18. dim(dataSel)
  19.  
  20. class = dataSel[,1]
  21. dataGenes = dataSel[,-1]
  22.  
  23. #resultTest = tTest(x =c(dataGenes[,1]), y=class.alternative = c("two.sided"), var.equal = TRUE)
  24. #usunac nadmiarowe dane, te niepotrzebne
  25.  
  26. tTest = function(m,dataGenes, class){
  27. resultTest =t.test(x =c(dataGenes[,1]), y=class, alternative = c("two.sided"), var.equal = TRUE)
  28. resultTestpValue = resultTest$p.value
  29. return(resultTest$p.value)
  30. }
  31.  
  32. dataGenes0 = dataGenes[indexTrain[[3]],]
  33. class0 = class[indexTrain[[3]]]
  34.  
  35. listpValue = list()
  36. for(i in 1:ncol(dataGenes0)){
  37. listpValue[[i]] = tTest(i,dataGenes0, class0)
  38. }
  39.  
  40. vecpValue = unlist(listpValue)
  41. nameGenepValue = cbind(names(dataGenes), vecpValue)
  42. nameGenepValueSort = nameGenepValue[order(nameGenepValue[,2]),]
  43. nameGenepValueSortAdj = cbind(nameGenepValueSort[.1], p.adjust(nameGenepValueSort[.2], method = 'BH'))
  44.  
  45. varImp<- nameGenepValueSortAdj[which(nameGenepValueSort[.2]<0.05),]
  46.  
  47. resultModel = randomForest:: randomForest(x= dataGenes[indexTrain[[3]]], varImp[1:100,1], y= as.factor(class[indexTrain[[3]]]),
  48. xtest = dataGenes[indexTest[[3]]], varImp[1:100,1], yTest = as.factor(class[indexTest[[3]]]),
  49. nTree = 500, importance = True)
  50.  
  51. resultModel$importance
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement