Advertisement
Guest User

Text Mining Twitter

a guest
Mar 25th, 2015
416
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
R 1.77 KB | None | 0 0
  1. ## Acceso a la Twitter API
  2. # for this method you need the following objects from the
  3. # "keys and access token" tab in your developers account
  4.  
  5. key <-"3omnRf2j6bp9AscKkf0VMlqsk"
  6. secret <- "V22lCy4eWZNf7tp853Cjlxcpnpsot24EwnH0txxFilWx9EmloV"
  7. secrettk <- "H0xTlxFuxZ2Qae9S2nKJYwWjl5CTvEcj2HHsCY5N1fWj1"
  8. mytoken <- "301911069-Jfw1ZWsOr7scILP7Zjt7xTU5Dpb7cM0wdqEPb8V1"
  9.  
  10. #packages
  11. library("twitteR")
  12. library("httr")
  13.  
  14. # keep this order of arguments
  15. setup_twitter_oauth(key, secret, mytoken, secrettk)
  16.  
  17. ### Let’s start with the Twitter scraping!
  18. library("twitteR")
  19.  
  20. # we are now scraping x tweets for Udemy
  21. udemytweets = searchTwitter("#Udemy", n=100, lang="en")
  22.  
  23. library("tm")
  24.  
  25. udemylist <- sapply(udemytweets, function(x) x$getText())
  26.  
  27. # initiating a function
  28.  
  29. udemycorpus <- Corpus(VectorSource(udemylist))
  30.  
  31. ## Transformation
  32. # putting text to lower case
  33. udemycorpus <- tm_map(udemycorpus, content_transformer(tolower))
  34. # remove puntuación
  35. udemycorpus <- tm_map(udemycorpus, removePunctuation)
  36. # remove stopwords (meaningless words)
  37. udemycorpus <- tm_map(udemycorpus, function(x)removeWords(x,stopwords()))
  38.  
  39. # keep a copy of corpus to use later as a dictionary for stem completion
  40. #udemycorpuscopy <- udemycorpus
  41.  
  42. # stem words
  43. #udemycorpus <- tm_map(udemycorpus, stemDocument)
  44.  
  45. # stem completion
  46. #udemycorpus <- tm_map(udemycorpus, stemCompletion, dictionary = udemycorpuscopy)
  47.  
  48. # quitar espacios en blanco
  49. udemycorpus <- tm_map(udemycorpus, stripWhitespace)
  50.  
  51. # to trasform to plain text which wordcloud can use
  52. udemycorpus <- tm_map(udemycorpus, PlainTextDocument)
  53.  
  54. library("wordcloud")
  55.  
  56. palette <- brewer.pal(5,"Paired")
  57. wordcloud(udemycorpus, min.freq=3, scale=c(4,1),
  58.           random.color=F, max.word=45, random.order=F, colors=palette, rot.per=.5)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement