Advertisement
Guest User

Untitled

a guest
Feb 21st, 2017
57
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 2.56 KB | None | 0 0
  1. # ------------------------------------------------------------------
  2. # |PROGRAM NAME: R basic data manipulation
  3. # |DATE: 2/20/17
  4. # |CREATED BY: MATT BOGARD
  5. # |PROJECT FILE:
  6. # |----------------------------------------------------------------
  7. # | PURPOSE: BASIC DATA MANAGEMENT AND STATS IN R
  8. # |----------------------------------------------------------------
  9.  
  10. # create some toy data
  11.  
  12. GARST <- c(150,140,145,137,141,145,149,153,157,161)
  13. PIO <- c(160,150,146,138,142,146,150,154,158,162)
  14. MYC <- c(137,148,151,139,143,120,115,136,130,129)
  15. DEK <- c(150,149,145,140,144,148,152,156,160,164)
  16. PLOT <- c(1,2,3,4,5,6,7,8,9,10)
  17. BT <- c('Y','Y','N','N','N','N','Y','N','Y','Y')
  18. RR <- c('Y','N','Y','N','N','N','N','Y','Y','N')
  19.  
  20. yield_data <- data.frame(GARST,PIO,MYC,DEK,PLOT,BT,RR)
  21.  
  22. #---------------------------
  23. # subsetting data
  24. #---------------------------
  25.  
  26. # subset data via variable selection
  27.  
  28. my_hybrids <- yield_data[ c("GARST", "PIO")]
  29.  
  30. print(my_hybrids)
  31.  
  32. # subset based on variable values
  33. high_yields <- yield_data [ yield_data$GARST==150 & yield_data$PIO==160,]
  34.  
  35. print(high_yields)
  36.  
  37. stacked_traits <-yield_data[ yield_data$BT =="Y" & yield_data$RR =="Y",]
  38. stacked_traits
  39.  
  40. #--------------------------------------
  41. # creating and adding new variables
  42. #--------------------------------------
  43.  
  44. yield_data$d_grst_pio <- yield_data$GARST - yield_data$PIO
  45.  
  46. #----------------------------------
  47. # conditional processing
  48. #----------------------------------
  49.  
  50. yield_data$GMO <- ifelse(yield_data$BT == 'Y' & yield_data$RR == 'Y','Stacked Trait',
  51. ifelse(yield_data$RR == "Y" , 'Single Trait ',
  52. ifelse(yield_data$BT =="Y",'Single Trait ', 'Non-GMO ')))
  53.  
  54. #-----------------------------------------
  55. # stacking and merging data
  56. #-----------------------------------------
  57.  
  58. # create two data sets to stack
  59.  
  60. top <- yield_data [ yield_data$PLOT <= 5,]
  61. bottom <- yield_data [ yield_data$PLOT > 5,]
  62.  
  63. stack <- rbind(top,bottom)
  64.  
  65. # create two separate data sources to join
  66. my_hybrids <- yield_data[ c("GARST", "PIO")]
  67.  
  68. hybrid <- yield_data[c("GARST","PLOT")]
  69. traits <- yield_data[c("GMO","PLOT")]
  70.  
  71. # join this data on PLOT as a key
  72. hybrid_traits <-merge(hybrid,traits,by=c("PLOT"))
  73.  
  74. #-------------------------------------
  75. # sorting data
  76. #------------------------------------
  77.  
  78. # sort in descending order by prefacing with (-)
  79. hybrid_traits <- hybrid_traits[order(-hybrid_traits$PLOT),]
  80.  
  81. # sort ascending by trait and by descending GARST yield_data
  82.  
  83. hybrid_traits <- hybrid_traits[order(hybrid_traits$GMO,-hybrid_traits$GARST),]
  84.  
  85. R basic data manipulation.txt
  86. Displaying R basic data manipulation.txt.
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement