Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
// Options for Spark's JDBC data source, reading a PostgreSQL table.
// DB_HOST, DB_PORT, DATABASE, DB_TABLE, DB_USER and DB_PASSWORD are defined
// outside this snippet.
val opts = Map(
  "url"             -> s"jdbc:postgresql://$DB_HOST:$DB_PORT/$DATABASE",
  "driver"          -> "org.postgresql.Driver",
  "dbtable"         -> DB_TABLE,
  "user"            -> DB_USER,
  "password"        -> DB_PASSWORD,
  // Partitioned read: the [lowerBound, upperBound] range of `id` is split into
  // numPartitions strides. Per the Spark JDBC docs the bounds only decide the
  // stride; they do not filter rows.
  "partitionColumn" -> "id",
  "lowerBound"      -> "1",
  "upperBound"      -> "96509080",
  // NOTE(review): 10000 partitions means 10000 separate range queries of
  // roughly 9.6k ids each; confirm this is intended and that the database can
  // sustain the resulting connection load.
  "numPartitions"   -> "10000"
)

val reportsDf = sparkSession.read.format("jdbc").options(opts).load()
reportsDf.createOrReplaceTempView("custom_reports")

// Distinct file ids, kept as a distributed Dataset. repartition/cache are
// Dataset operations that return a new Dataset, so they have to be chained
// here (before collect) and the result has to be bound to a name; calling them
// on the collected Array does not compile.
// NOTE(review): `.as[String]` needs the session's implicits in scope
// (presumably imported outside this snippet).
val reportIdDs = reportsDf
  .select("fileId")
  .distinct()
  .as[String]
  .repartition(100)
  .cache()

// Driver-side copy of the ids; `reportId` stays an Array[String] as before.
// collect() is also the action that materialises the cache above.
val reportId = reportIdDs.collect()
// ....
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement