Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
// Prints the single artist with the most rows in samples.txt, resolved through
// the song_id -> artist mapping in tracks1.txt.
//
// Method chains end each line with a trailing dot so that every chain stays one
// statement even when the script is pasted line by line into a REPL.

// Explicit import so the script does not rely on the shell pre-importing
// org.apache.spark.sql.functions._.
import org.apache.spark.sql.functions.desc

// Reuses an existing session if one is already running; otherwise starts one
// with master "local".
val spark = org.apache.spark.sql.SparkSession.builder().
  master("local").
  appName("Spark CSV Reader").
  getOrCreate()

// Both inputs are comma-separated files read without a header option; columns
// are named purely by position via toDF.
// NOTE(review): toDF needs exactly as many names as the file has columns --
// confirm against the actual data files.
// `.csv(...)` selects the CSV source itself, so no separate `format(...)` call
// is needed.
val samples = spark.read.
  option("sep", ",").
  csv("samples.txt").
  toDF("user_id", "song_id", "date_id")

val songs = spark.read.
  option("sep", ",").
  csv("tracks1.txt").
  toDF("track_id", "song_id", "artist", "title", "nowe_id")

// Only song_id is needed from samples: join on it, count joined rows per
// artist, sort by that count descending and show the top row untruncated.
samples.
  select("song_id").
  join(songs, "song_id").
  groupBy("artist").
  count().
  orderBy(desc("count")).
  select("artist", "count").
  show(1, truncate = false)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement