Guest User

Untitled

a guest
Sep 8th, 2018
114
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 1.71 KB | None | 0 0
  1. sqoop-import-all-tables --connect "jdbc:mysql://quickstart.cloudera:3306/retail_db" \
  2. --username retail_dba \
  3. --password cloudera \
  4. --warehouse-dir "/user/hive/warehouse/retail_stage.db" \
  5. --comrpes \
  6. --compression-codec snappy \
  7. --as-avrodatafile \
  8. -m 1
  9.  
  10.  
  11. hadoop fs -get /user/hive/warehouse/retail_stage.db/orders/part-m-00000.avro
  12.  
  13. avro-tools getschema part-m-00000.avro > orders.avsc
  14. hadoop fs -mkdir /user/hive/schemas
  15. hadoop fs -mkdir /user/hive/schemas/order
  16. hadoop fs -copyFromLocal orders.avsc /user/hive/schemas/order
  17.  
  18. create table orders_sqoop
  19. stored as avro
  20. location "/user/hive/warehouse/retail_stage.db/orders"
  21. TBLPROPERTIES("avro.schema.url"="/user/hive/schemas/order/orders.avsc")
  22.  
  23.  
  24.  
  25. select order_id,to_date(from_unixtime(cast(order_date/1000 as int))) order_format_date from orders_sqoop s where s.order_date in (select q.order_date from (select order_date,count(order_id) order_count from orders_sqoop group by order_date order by order_count desc limit 1) q);
  26.  
  27. create table orders_avro
  28. (order_id int,
  29. order_date date,
  30. order_customer_id int,
  31. order_status string)
  32. partitioned by(order_month string)
  33. stored as avro;
  34.  
  35. insert overwrite table orders_avro partition(order_month)
  36. select order_id,to_date(from_unixtime(cast(order_date/1000 as int))),order_customer_id,order_status,
  37. substr(from_unixtime(cast(order_date/1000 as int)),1,7) as order_month from default.orders_sqoop;
  38.  
  39.  
  40. select * from orders_avro where order_date in (select order_date from (select order_id,order_date,count(order_id) order_count from orders_avro group by order_date order by order_count desc limit 1) q)
  41.  
  42.  
  43. hadoop fs -get orsers.avsc
  44. gedit orders.avsc
  45.  
  46. {
  47. "name":"order_zone",
  48. "type":["null","int"],
  49. "default":"null,
  50. "columnName":"order_zone",
  51. "sqlType":"4"
  52. }
Add Comment
Please, Sign In to add comment