Advertisement
Guest User

Untitled

a guest
Mar 23rd, 2017
72
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 0.83 KB | None | 0 0
  // Bulk-loads a small sample data set into HBase by writing HFiles from Spark and
  // then handing them to LoadIncrementalHFiles.
  //
  // Expects `sc`, `conf`, `pathToHFile` and `hTable` to be defined by the surrounding
  // session/file; they are not declared in this snippet.

  // Sample rows: (row key, account id, account name).
  val rddToSave = sc.parallelize(Seq(("1111123", "456456", "Name1"), ("22222234", "8987987", "Name2")))

  // Column qualifiers for the account id and account name cells.
  val columnName = ("ACCT_ID", "ACCT_NAME")
  // Candidate column families; only the first one is written to below.
  val columnFamily = ("CF", "PP")

  // Build one (row key, KeyValue) pair per column of every input row.
  //
  // HFile writers expect cells in ascending row/family/qualifier order, so the rows
  // are sorted by key before any HBase objects are created, and each row's cells are
  // emitted in qualifier order.
  // NOTE(review): String ordering matches HBase's byte ordering for ASCII keys and
  // qualifiers; confirm if non-ASCII values are possible.
  val rdd = rddToSave
    .sortBy { case (rowKey, _, _) => rowKey }
    .flatMap { case (rowKey, acctId, acctName) =>
      // Bytes.toBytes always encodes as UTF-8; String.getBytes() would depend on the
      // JVM's default charset and could differ between driver and executors.
      val row = Bytes.toBytes(rowKey)
      val family = Bytes.toBytes(columnFamily._1)

      // Previously only the account id cell was written and the account name was
      // silently dropped; both columns are emitted now.
      val cells = Seq(
        columnName._1 -> acctId,
        columnName._2 -> acctName
      ).sortBy { case (qualifier, _) => qualifier }

      cells.map { case (qualifier, value) =>
        val kv = new KeyValue(row, family, Bytes.toBytes(qualifier), Bytes.toBytes(value))
        (new ImmutableBytesWritable(row), kv)
      }
    }

  // Write the sorted cells out as HFiles under pathToHFile.
  rdd.saveAsNewAPIHadoopFile(
    pathToHFile,
    classOf[ImmutableBytesWritable],
    classOf[KeyValue],
    classOf[HFileOutputFormat],
    conf)

  // Move the generated HFiles into the target table.
  val loadFfiles = new LoadIncrementalHFiles(conf)
  loadFfiles.doBulkLoad(new Path(pathToHFile), hTable)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement