Advertisement
Guest User

Untitled

a guest
Nov 18th, 2018
91
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
R 0.44 KB | None | 0 0
  # Streaming word count: watches the "source/" folder for text files, counts
  # how often each word appears, and exposes the frequent words through
  # `reactiveCount`.
  library(sparklyr)
  library(ggplot2)
  library(dplyr)

  # Open a connection to a local Spark instance.
  sc <- spark_connect(master = "local")

  # Make sure the folder the stream reads from exists. The dir.exists() guard
  # keeps re-runs quiet: a bare dir.create() warns when the folder is already
  # there.
  if (!dir.exists("source")) {
    dir.create("source")
  }

  # Pipeline, step by step:
  #   1. read text from "source/" as a stream
  #   2. tokenize the "line" column into "tokens"
  #   3. remove stop words from "tokens", producing "words"
  #   4. explode() the "words" column and keep only that column
  #   5. drop empty strings
  #   6. count occurrences per word
  #   7. order by descending count and keep words with a count above 100
  #   8. hand the result to reactiveSpark()
  # NOTE(review): reactiveSpark() is presumably meant to be consumed from a
  # Shiny app; shiny is not attached in this script -- confirm against caller.
  reactiveCount <- stream_read_text(sc, "source/") %>%
    ft_tokenizer("line", "tokens") %>%
    ft_stop_words_remover("tokens", "words") %>%
    transmute(words = explode(words)) %>%
    filter(nchar(words) > 0) %>%
    group_by(words) %>%
    summarize(n = n()) %>%
    arrange(desc(n)) %>%
    filter(n > 100) %>%
    reactiveSpark()
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement