Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- SQL(gen_par_ins.sql):
- select concat('beeline -u "jdbc:hive2://bigdataplatform-uat.nam.nsroot.net:10000/',decode(unhex(hex(59)), 'US-ASCII'),
- 'principal=hive/bigdataplatform-uat.nam.nsroot.net',decode(unhex(hex(64)), 'US-ASCII'),'CTIP.NAM.NSROOT.NET',decode(unhex(hex(59)), 'US-ASCII'),
- 'ssl=true" --outputformat=csv2 --verbose=false --fastConnect=true --silent=true -e "set hive.exec.dynamic.partition.mode=nonstrict',decode(unhex(hex(59)), 'US-ASCII'),
- 'set hive.merge.mapfiles=true',decode(unhex(hex(59)), 'US-ASCII'),
- 'set hive.merge.mapredfiles=true',decode(unhex(hex(59)), 'US-ASCII'),
- 'set hive.merge.smallfiles.avgsize=67108864',decode(unhex(hex(59)), 'US-ASCII'),
- 'set mapred.max.split.size=67108864',decode(unhex(hex(59)), 'US-ASCII'),
- 'set mapred.min.split.size=67108864; set hive.exec.parallel=true; set hive.execution.engine=mr;',
- 'insert overwrite table gfocnnsd_standardization.eq_single_order_detail_sf2 partition(p_year,p_month,p_day,pfilter) select * from gfocnnsd_standardization.eq_single_order_detail_sf_tmp where pfilter = \'',pfilter,
- '\' sort by trd_date, src_sys,sys_order_id" >logs/insp.eq_single_order_detail_sf2.',row_number() over(),'.log
- ')
- from (
- select distinct pfilter from gfocnnsd_standardization.eq_single_order_detail_sf_tmp ) ccc;
- Command:
- beeline -u 'jdbc:hive2://bigdataplatform-uat.nam.nsroot.net:10000/;principal=hive/bigdataplatform-uat.nam.nsroot.net@CTIP.NAM.NSROOT.NET;ssl=true' \
- --outputformat=csv2 --verbose=false --silent=true -f gen_par_ins.sql>par_ins.sh
- Result:
- beeline -u "jdbc:hive2://bigdataplatform-uat.nam.nsroot.net:10000/;principal=hive/bigdataplatform-uat.nam.nsroot.net@CTIP.NAM.NSROOT.NET;ssl=true" --fastConnect=true -e "set hive.exec.dynamic.partition.mode=nonstrict; set hive.merge.mapfiles=true; set hive.merge.mapredfiles=true; set hive.merge.smallfiles.avgsize=67108864; set mapred.max.split.size=67108864; set mapred.min.split.size=67108864; set hive.exec.parallel=true; set hive.execution.engine=mr;insert overwrite table gfocnnsd_standardization.eq_single_order_detail_sf2 partition(p_year,p_month,p_day,pfilter) select * from gfocnnsd_standardization.eq_single_order_detail_sf_tmp where pfilter = 'TRD_DATE-20180920.SRC_SYS+099.TICKER_SYMBOL-NOTLIKE.REG_NMS_LINK_TYPE+NULL.OCEAN_PRODUCT_ID+099.PRODUCT_CAT_CD+099.EVENT_TYPE_CD+ALL' sort by trd_date, src_sys,sys_order_id">logs/insp.eq_single_order_detail_sf2.1.log
- beeline -u "jdbc:hive2://bigdataplatform-uat.nam.nsroot.net:10000/;principal=hive/bigdataplatform-uat.nam.nsroot.net@CTIP.NAM.NSROOT.NET;ssl=true" --fastConnect=true -e "set hive.exec.dynamic.partition.mode=nonstrict; set hive.merge.mapfiles=true; set hive.merge.mapredfiles=true; set hive.merge.smallfiles.avgsize=67108864; set mapred.max.split.size=67108864; set mapred.min.split.size=67108864; set hive.exec.parallel=true; set hive.execution.engine=mr;insert overwrite table gfocnnsd_standardization.eq_single_order_detail_sf2 partition(p_year,p_month,p_day,pfilter) select * from gfocnnsd_standardization.eq_single_order_detail_sf_tmp where pfilter = 'TRD_DATE+20180920.SRC_SYS+UK.TICKER_SYMBOL+NOTLIKE.REG_NMS_LINK_TYPE+NULL.OCEAN_PRODUCT_ID+099.PRODUCT_CAT_CD+NULL.EVENT_TYPE_CD+NEW_REQ' sort by trd_date, src_sys,sys_order_id" >logs/insp.eq_single_order_detail_sf2.2.log
- ...
- beeline -u "jdbc:hive2://bigdataplatform-uat.nam.nsroot.net:10000/;principal=hive/bigdataplatform-uat.nam.nsroot.net@CTIP.NAM.NSROOT.NET;ssl=true" --fastConnect=true -e "set hive.exec.dynamic.partition.mode=nonstrict; set hive.merge.mapfiles=true; set hive.merge.mapredfiles=true; set hive.merge.smallfiles.avgsize=67108864; set mapred.max.split.size=67108864; set mapred.min.split.size=67108864; set hive.exec.parallel=true; set hive.execution.engine=mr;insert overwrite table gfocnnsd_standardization.eq_single_order_detail_sf2 partition(p_year,p_month,p_day,pfilter) select * from gfocnnsd_standardization.eq_single_order_detail_sf_tmp where pfilter = 'TRD_DATE+20180920.SRC_SYS+UK.TICKER_SYMBOL+NOTLIKE.REG_NMS_LINK_TYPE+NULL.OCEAN_PRODUCT_ID+099.PRODUCT_CAT_CD+NULL.EVENT_TYPE_CD+NEW_CONF' sort by trd_date, src_sys,sys_order_id" >logs/insp.eq_single_order_detail_sf2.3.log
- Now you can execute it.
- FAIL=0
- echo "starting"
- (
- beeline -u "jdbc:hive2://bigdataplatform-uat.nam.nsroot.net:10000/;principal=hive/bigdataplatform-uat.nam.nsroot.net@CTIP.NAM.NSROOT.NET;ssl=true" --fastConnect=true -e "set hive.exec.dynamic.partition.mode=nonstrict; set hive.merge.mapfiles=true; set hive.merge.mapredfiles=true; set hive.merge.smallfiles.avgsize=67108864; set mapred.max.split.size=67108864; set mapred.min.split.size=67108864; set hive.exec.parallel=true; set hive.execution.engine=mr;insert overwrite table gfocnnsd_standardization.eq_single_order_detail_sf2 partition(p_year,p_month,p_day,pfilter) select * from gfocnnsd_standardization.eq_single_order_detail_sf_tmp where pfilter = 'TRD_DATE-20180920.SRC_SYS+099.TICKER_SYMBOL-NOTLIKE.REG_NMS_LINK_TYPE+NULL.OCEAN_PRODUCT_ID+099.PRODUCT_CAT_CD+099.EVENT_TYPE_CD+ALL' sort by trd_date, src_sys,sys_order_id">logs/insp.eq_single_order_detail_sf2.1.log
- beeline -u "jdbc:hive2://bigdataplatform-uat.nam.nsroot.net:10000/;principal=hive/bigdataplatform-uat.nam.nsroot.net@CTIP.NAM.NSROOT.NET;ssl=true" --fastConnect=true -e "set hive.exec.dynamic.partition.mode=nonstrict; set hive.merge.mapfiles=true; set hive.merge.mapredfiles=true; set hive.merge.smallfiles.avgsize=67108864; set mapred.max.split.size=67108864; set mapred.min.split.size=67108864; set hive.exec.parallel=true; set hive.execution.engine=mr;insert overwrite table gfocnnsd_standardization.eq_single_order_detail_sf2 partition(p_year,p_month,p_day,pfilter) select * from gfocnnsd_standardization.eq_single_order_detail_sf_tmp where pfilter = 'TRD_DATE+20180920.SRC_SYS+UK.TICKER_SYMBOL+NOTLIKE.REG_NMS_LINK_TYPE+NULL.OCEAN_PRODUCT_ID+099.PRODUCT_CAT_CD+NULL.EVENT_TYPE_CD+NEW_REQ' sort by trd_date, src_sys,sys_order_id" >logs/insp.eq_single_order_detail_sf2.2.log
- beeline -u "jdbc:hive2://bigdataplatform-uat.nam.nsroot.net:10000/;principal=hive/bigdataplatform-uat.nam.nsroot.net@CTIP.NAM.NSROOT.NET;ssl=true" --fastConnect=true -e "set hive.exec.dynamic.partition.mode=nonstrict; set hive.merge.mapfiles=true; set hive.merge.mapredfiles=true; set hive.merge.smallfiles.avgsize=67108864; set mapred.max.split.size=67108864; set mapred.min.split.size=67108864; set hive.exec.parallel=true; set hive.execution.engine=mr;insert overwrite table gfocnnsd_standardization.eq_single_order_detail_sf2 partition(p_year,p_month,p_day,pfilter) select * from gfocnnsd_standardization.eq_single_order_detail_sf_tmp where pfilter = 'TRD_DATE+20180920.SRC_SYS+UK.TICKER_SYMBOL+NOTLIKE.REG_NMS_LINK_TYPE+NULL.OCEAN_PRODUCT_ID+099.PRODUCT_CAT_CD+NULL.EVENT_TYPE_CD+NEW_CONF' sort by trd_date, src_sys,sys_order_id" >logs/insp.eq_single_order_detail_sf2.3.log
- )&
- . . .
- (
- beeline -u "jdbc:hive2://bigdataplatform-uat.nam.nsroot.net:10000/;principal=hive/bigdataplatform-uat.nam.nsroot.net@CTIP.NAM.NSROOT.NET;ssl=true" --fastConnect=true -e "set hive.exec.dynamic.partition.mode=nonstrict; set hive.merge.mapfiles=true; set hive.merge.mapredfiles=true; set hive.merge.smallfiles.avgsize=67108864; set mapred.max.split.size=67108864; set mapred.min.split.size=67108864; set hive.exec.parallel=true; set hive.execution.engine=mr;insert overwrite table gfocnnsd_standardization.eq_single_order_detail_sf2 partition(p_year,p_month,p_day,pfilter) select * from gfocnnsd_standardization.eq_single_order_detail_sf_tmp where pfilter = 'TRD_DATE-20180920.SRC_SYS+099.TICKER_SYMBOL-NOTLIKE.REG_NMS_LINK_TYPE+NULL.OCEAN_PRODUCT_ID+099.PRODUCT_CAT_CD+099.EVENT_TYPE_CD+ALL' sort by trd_date, src_sys,sys_order_id">logs/insp.eq_single_order_detail_sf2.1.log
- beeline -u "jdbc:hive2://bigdataplatform-uat.nam.nsroot.net:10000/;principal=hive/bigdataplatform-uat.nam.nsroot.net@CTIP.NAM.NSROOT.NET;ssl=true" --fastConnect=true -e "set hive.exec.dynamic.partition.mode=nonstrict; set hive.merge.mapfiles=true; set hive.merge.mapredfiles=true; set hive.merge.smallfiles.avgsize=67108864; set mapred.max.split.size=67108864; set mapred.min.split.size=67108864; set hive.exec.parallel=true; set hive.execution.engine=mr;insert overwrite table gfocnnsd_standardization.eq_single_order_detail_sf2 partition(p_year,p_month,p_day,pfilter) select * from gfocnnsd_standardization.eq_single_order_detail_sf_tmp where pfilter = 'TRD_DATE+20180920.SRC_SYS+UK.TICKER_SYMBOL+NOTLIKE.REG_NMS_LINK_TYPE+NULL.OCEAN_PRODUCT_ID+099.PRODUCT_CAT_CD+NULL.EVENT_TYPE_CD+NEW_REQ' sort by trd_date, src_sys,sys_order_id" >logs/insp.eq_single_order_detail_sf2.2.log
- beeline -u "jdbc:hive2://bigdataplatform-uat.nam.nsroot.net:10000/;principal=hive/bigdataplatform-uat.nam.nsroot.net@CTIP.NAM.NSROOT.NET;ssl=true" --fastConnect=true -e "set hive.exec.dynamic.partition.mode=nonstrict; set hive.merge.mapfiles=true; set hive.merge.mapredfiles=true; set hive.merge.smallfiles.avgsize=67108864; set mapred.max.split.size=67108864; set mapred.min.split.size=67108864; set hive.exec.parallel=true; set hive.execution.engine=mr;insert overwrite table gfocnnsd_standardization.eq_single_order_detail_sf2 partition(p_year,p_month,p_day,pfilter) select * from gfocnnsd_standardization.eq_single_order_detail_sf_tmp where pfilter = 'TRD_DATE+20180920.SRC_SYS+UK.TICKER_SYMBOL+NOTLIKE.REG_NMS_LINK_TYPE+NULL.OCEAN_PRODUCT_ID+099.PRODUCT_CAT_CD+NULL.EVENT_TYPE_CD+NEW_CONF' sort by trd_date, src_sys,sys_order_id" >logs/insp.eq_single_order_detail_sf2.3.log
- )&
- for job in `jobs -p`
- do
- echo $job
- wait $job || let "FAIL+=1"
- done
- echo $FAIL
- if [ "$FAIL" == "0" ];
- then
- echo "Part Load DONE"
- else
- echo "FAIL! ($FAIL)"
- fi
- Result for 50Gb/ 53 part table:
- Part Load DONE
- real 100m16.758s
- user 18m23.229s
- sys 2m3.298s
Add Comment
Please, Sign In to add comment