Advertisement
Guest User

Odsluchania w miesiacu

a guest
May 11th, 2019
75
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Scala 0.81 KB | None | 0 0
  // Listens per month: joins every row of samples.txt with its date record from dates.txt
  // (inner join on date_id) and prints how many samples fall in each month.

  val spark = org.apache.spark.sql.SparkSession.builder
    .master("local")
    .appName("Spark CSV Reader")
    .getOrCreate()

  /** Loads a comma-separated file and assigns the given names to its columns.
    *
    * No schema is supplied and schema inference is not enabled, so every column is read as a
    * string. `csv(path)` selects Spark's built-in CSV source on its own, which is why no
    * explicit `format(...)` call is needed.
    *
    * @param path    location of the file to read
    * @param columns names for the columns, in file order; the count must match the file
    * @return the file contents as a DataFrame with the requested column names
    */
  def readCsv(path: String, columns: String*): org.apache.spark.sql.DataFrame =
    spark.read
      .option("sep", ",")
      .csv(path)
      .toDF(columns: _*)

  val samples = readCsv("samples.txt", "user_id", "song_id", "date_id")
  // Not used by the report below; kept so the value stays available to any later code.
  val songs = readCsv("tracks1.txt", "track_id", "song_id", "artist", "title", "nowe_id")
  val dates = readCsv("dates.txt", "date_id", "day", "month", "year")

  // One row per month with the number of matching samples in a column named "count".
  val listensPerMonth = samples
    .select("date_id")
    .join(dates, "date_id")
    .groupBy("month")
    .count()

  // `month` is a string column, so sorting on it directly orders "10" before "2".
  // Sort by its integer value instead; the raw string is a tie-breaker that keeps the
  // order deterministic.
  // NOTE(review): assumes month values are numeric text - confirm against dates.txt.
  listensPerMonth
    .orderBy(listensPerMonth("month").cast("int"), listensPerMonth("month"))
    .select("month", "count")
    .show(false)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement