Advertisement
Guest User

Untitled

a guest
Apr 23rd, 2017
72
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
R 1.26 KB | None | 0 0
  1. library(caret)
  2.  
  3. library(ISLR)
  4.  
  5. library(caTools)
  6.  
  7. train_data <- read.csv('C:\\Users\\Yevhen\\Documents\\Courses\\Data Mining\\HW6\\train.csv', sep=',', header=TRUE)
  8. test_data <- read.csv('C:\\Users\\Yevhen\\Documents\\Courses\\Data Mining\\HW6\\test.csv', sep=',', header=TRUE)
  9. set.seed(101)
  10.  
  11. split = sample.split(train_data$agegroup, SplitRatio = 0.90)
  12. train = subset(train_data, split == TRUE)
  13. test = subset(train_data, split == FALSE)
  14. feats <- names(train[, 1:ncol(train)-1])
  15. f <- paste(feats,collapse=' + ')
  16. f <- paste('target ~',f)
  17. f <- as.formula(f)
  18.  
  19. # prepare training scheme
  20. control <- trainControl(method="repeatedcv", number=5, repeats=3)
  21. # train the GBM model
  22. set.seed(7)
  23. modelGbm <- train(f, data=train, method="gbm", trControl=control, verbose=FALSE)
  24. predvals <- predict(modelGbm, test[,1:ncol(test)-1])
  25.  
  26. n_test = nrow(test)
  27. rmse_ = sqrt(sum((test$target-predvals)^2) / n_test)
  28. rmse_
  29.  
  30.  
  31. modelGbm <- train(f, data=train, method="gbm", trControl=control, verbose=FALSE)
  32. test_pred_values <- as.data.frame(predict(modelGbm, newdata=test_data))
  33. predict <- data.frame(test_data$ID, test_pred_values)
  34. colnames(predict) <- c("ID", "target")
  35. write.csv(predict, file = "C:\\Users\\Yevhen\\Documents\\Courses\\Data Mining\\prediction.csv", row.names=FALSE)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement