Advertisement
limedog

asn8

Mar 18th, 2019
146
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 1.88 KB | None | 0 0
  1. ---
  2. title: "Assignment 8"
  3. output: html_document
  4. author: "Ian Ho"
  5. ---
  6.  
  7. ```{r setup, include=FALSE}
  8. knitr::opts_chunk$set(echo = TRUE)
  9. ```
  10.  
  11. ```{r}
  # Course outline page that the chunks below scrape.
  course_url <- "https://www.sfu.ca/outlines.html?2019/spring/stat/240/d100"
  # One character element per line of HTML. warn = FALSE keeps readLines()
  # from emitting an "incomplete final line" warning into the knitted report
  # when the response does not end with a newline.
  course_page <- readLines(course_url, warn = FALSE)
  14. ```
  15.  
  16. Question 1
  17. ==========
  18.  
  19. a
  20. ---------
  21.  
  22. ```{r}
  # Extract the text of every line of the page that opens an <h3> element.
  heading_index <- grep("<h3", course_page, fixed = TRUE)
  heading <- course_page[heading_index]
  # Strip each tag on its own. A greedy "<.*>" would run from the first "<" to
  # the last ">" on the line and delete any text sitting between two tags.
  heading <- gsub("<[^>]*>", "", heading)
  # Collapse whitespace runs to one space and trim the ends, so indentation is
  # dropped but the spaces between words are kept.
  heading <- trimws(gsub("[[:space:]]+", " ", heading))
  heading
  29. ```
  30.  
  31. b
  32. ---------
  33.  
  34. ```{r}
  # Extract the text of the line(s) carrying an <h1 id=...> element.
  course_num_index <- grep("<h1 id", course_page, fixed = TRUE)
  course_num <- course_page[course_num_index]
  # Remove every HTML tag, keeping only the text between them.
  course_num <- gsub("<[^>]*>", "", course_num)
  # Normalise whitespace: runs become a single space and the ends are trimmed.
  # Deleting only runs of two or more characters would leave a lone leading
  # tab/space in place and glue together words separated by a wider gap.
  course_num <- trimws(gsub("[[:space:]]+", " ", course_num))
  course_num
  40. ```
  41.  
  42. c
  43. --------
  44.  
  45. ```{r}
  # The title block runs from the first <h2 id=...> line up to the
  # <h3 id="class-number"> heading that follows it.
  start_index <- grep("<h2 id", course_page, fixed = TRUE)[1]
  end_index <- grep("<h3 id=\"class-number\"", course_page, fixed = TRUE)
  # Take the first end marker at or after the start. Both values are NA when
  # the corresponding marker is missing, which would otherwise make
  # start_index:end_index fail with an unhelpful message.
  end_index <- end_index[end_index >= start_index][1]
  if (is.na(start_index) || is.na(end_index)) {
    stop("could not locate the course title block in the page", call. = FALSE)
  }

  # Join with a space so text wrapped across source lines is not fused.
  course_name <- paste(course_page[start_index:end_index], collapse = " ")
  # Drop everything from the first <h3 onwards, then the remaining tags.
  course_name <- gsub("<h3.*", "", course_name)
  course_name <- gsub("<[^>]*>", "", course_name)
  # Collapse whitespace runs to one space and trim the ends.
  course_name <- trimws(gsub("[[:space:]]+", " ", course_name))
  course_name
  54. ```
  55.  
  56. d
  57. -----------
  58.  
  59. ```{r}
  # The instructor block runs from the "Instructor:" <h4> label to the
  # <ul class="prereq-line"> element that follows it.
  start_index <- grep("<h4>Instructor:</h4>", course_page, fixed = TRUE)[1]
  end_index <- grep("<ul class=\"prereq-line\"", course_page, fixed = TRUE)
  # Take the first end marker at or after the start. Both values are NA when
  # the corresponding marker is missing, which would otherwise make
  # start_index:end_index fail with an unhelpful message.
  end_index <- end_index[end_index >= start_index][1]
  if (is.na(start_index) || is.na(end_index)) {
    stop("could not locate the instructor block in the page", call. = FALSE)
  }

  # Join with a space so text wrapped across source lines is not fused.
  name <- paste(course_page[start_index:end_index], collapse = " ")

  # Keep only what precedes the first <br, then drop everything up to and
  # including the closing /h4> of the "Instructor:" label.
  name <- gsub("<br.*", "", name)
  name <- gsub("<.*/h4>", "", name)
  # Remove any remaining tags and normalise whitespace.
  name <- gsub("<[^>]*>", "", name)
  name <- trimws(gsub("[[:space:]]+", " ", name))
  name
  69. ```
  70.  
  71. e
  72. ------------
  73.  
  74. ```{r}
  # The class time/location block runs from <li class="course-times"> to the
  # <li class="exam-times"> item that follows it.
  start_index <- grep("<li class=\"course-times\">", course_page, fixed = TRUE)[1]
  end_index <- grep("<li class=\"exam-times\">", course_page, fixed = TRUE)
  # Take the first end marker at or after the start. Both values are NA when
  # the corresponding marker is missing, which would otherwise make
  # start_index:end_index fail with an unhelpful message.
  end_index <- end_index[end_index >= start_index][1]
  if (is.na(start_index) || is.na(end_index)) {
    stop("could not locate the course times block in the page", call. = FALSE)
  }

  # Join with a space so text on separate source lines (e.g. the time on one
  # line and the room on the next) is not fused.
  time_loc <- paste(course_page[start_index:end_index], collapse = " ")

  # Keep only what precedes the first </li, then drop everything up to and
  # including the closing /h4> of the item's label.
  time_loc <- gsub("</li.*", "", time_loc)
  time_loc <- gsub("<.*/h4>", "", time_loc)
  # Remove any remaining tags and normalise whitespace.
  time_loc <- gsub("<[^>]*>", "", time_loc)
  time_loc <- trimws(gsub("[[:space:]]+", " ", time_loc))
  time_loc
  85. ```
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement