Guest User

Untitled

a guest
Jan 16th, 2019
92
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 1.04 KB | None | 0 0
  -- Sums NUM_PURCHASES per cid over rows whose dt lies in ['20161001', '20181001']
  -- (both ends inclusive), keeping only cids that also have a row with dt = '20181001'.
  -- NOTE(review): the dt literals look like yyyyMMdd strings - confirm the column's type/format.
  WITH purchases_in_window AS (
      SELECT
          cid,
          NUM_PURCHASES
      FROM MyTable
      WHERE dt >= '20161001'
        AND dt <= '20181001'
  ),
  customers_on_end_date AS (
      SELECT cid
      FROM MyTable
      WHERE dt = '20181001'
  )
  SELECT
      p.cid AS ID,
      SUM(p.NUM_PURCHASES) AS total_p
  FROM purchases_in_window p
  LEFT SEMI JOIN customers_on_end_date e
      ON (e.cid = p.cid)
  GROUP BY p.cid;
  6.  
  -- Hive session settings (join strategy, bucketing, execution engine, memory).
  -- NOTE(review): a SET only applies to statements run after it in the same session,
  -- so these must be executed before the query they are meant to tune.

  -- Variable substitution depth
  SET hive.variable.substitute.depth=150;

  -- Join strategy: automatic map-join conversion and skew-join handling
  SET hive.auto.convert.join=true;
  SET hive.optimize.skewjoin.compiletime=true;
  SET hive.optimize.skewjoin=true;

  -- Bucketing and bucket map joins
  -- NOTE(review): hive.enforce.bucketing appears to have been removed in Hive 2.x - confirm
  -- it is still meaningful on the target version.
  SET hive.enforce.bucketing=true;
  SET hive.input.format=org.apache.hadoop.hive.ql.io.BucketizedHiveInputFormat;
  SET hive.optimize.bucketmapjoin=true;
  SET hive.optimize.bucketmapjoin.sortedmerge=true;

  -- Execution: parallel stages, vectorization, cost-based optimizer
  SET hive.exec.parallel=true;
  SET hive.vectorized.execution.enabled=true;
  SET hive.vectorized.execution.reduce.enabled=true;
  SET hive.vectorized.execution.reduce.groupby.enabled=true;
  SET hive.cbo.enable=true;

  -- Task JVM options and container memory
  -- NOTE(review): mapred.child.java.opts is the legacy property name. The newer equivalents
  -- are mapreduce.map.java.opts / mapreduce.reduce.java.opts - confirm which one the cluster honours.
  -- NOTE(review): the 4G heap is well below the 9216 MB container size - confirm this is intended.
  SET mapred.child.java.opts=-Xmx4G -XX:+UseConcMarkSweepGC -XX:-UseGCOverheadLimit;
  SET mapreduce.map.memory.mb=9216;
  SET mapreduce.reduce.memory.mb=9216;
Add Comment
Please, Sign In to add comment