Advertisement
Guest User

Untitled

a guest
Aug 21st, 2017
76
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 0.61 KB | None | 0 0
  1. val df = CSV.load(args(0)) // CSV.load is not defined in this snippet; presumably it returns a Spark DataFrame — TODO confirm
  2. val sumSteps = df.sum("steps") // NOTE(review): relies on df exposing sum(column); a Spark DataFrame has no such method (aggregate with agg(sum(...)) instead) — confirm the type of df
  3.  
  4. import sqlContext.implicits._
  5. import org.apache.spark.sql.functions._
  6.  
  7. val df = sc.parallelize(Array(10,2,3,4)).toDF("steps") // four Ints turned into a DataFrame with a single column named "steps"
  8. df.select(col("steps")).rdd.map(_.getInt(0)).fold(0)(_ + _) // typed getInt instead of an unchecked cast; fold(0) returns 0 for an empty DataFrame where reduce would throw
  9.  
  10. // res1: Int = 19   (10 + 2 + 3 + 4)
  11.  
  12. import org.apache.spark.sql.functions._
  13.  
  14. val df = CSV.load(args(0)) // CSV.load is not defined in this snippet; presumably it returns a Spark DataFrame — TODO confirm
  15. val sumSteps = df.agg(sum("steps")).first.get(0) // aggregates "steps", takes the first row of the result and reads column 0 through the untyped get accessor
  16.  
  17. val sumSteps: Long = df.agg(coalesce(sum("steps"), lit(0)).cast("long")).first.getLong(0) // sum over zero rows (or only null values) is SQL NULL; coalesce it to 0 so getLong never reads a null cell
  18.  
  19. val sums = df.agg(sum("col1").as("sum_col1"), sum("col2").as("sum_col2"), ...).first // several sums in one agg call, each aliased via as(...); the "..." is a placeholder for further aggregate columns and must be replaced before this compiles
  20.  
  21. df.groupBy().sum() // no grouping columns and no columns passed to sum(); NOTE(review): presumably yields one row holding the sum of every numeric column — confirm against the Spark API docs
  22.  
  23. df.groupBy("steps").sum().show() // Scala spelling: camelCase groupBy and a double-quoted column name (the single-quoted form is PySpark syntax); groups rows by "steps" and prints the per-group sums
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement