Guest User

Untitled

a guest
Apr 13th, 2018
114
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 2.63 KB | None | 0 0
  1. # Basic sqoop commands: import retail_db.categories as pipe-delimited text, one record per line
  2. sqoop import --connect jdbc:mysql://quickstart.cloudera:3306/retail_db \
  3. --username root \
  4. -P \
  5. --table categories \
  6. --target-dir /user/cloudera/categories_pipe \
  7. --lines-terminated-by "\n" \
  8. --fields-terminated-by "|"
  9.  
  10. sqoop import --connect jdbc:mysql://quickstart.cloudera:3306/retail_db \
  11. --username root \
  12. -P \
  13. --table categories \
  14. --target-dir /user/cloudera/categories_pipe \
  15. --fields-terminated-by "|"  # field separator only; NOTE: reuses the target dir of the example above, so remove that directory before running
  16.  
  17. # Custom delimiters: '|' separates fields and '§' ends each record
  18. sqoop import --connect jdbc:mysql://quickstart.cloudera:3306/retail_db \
  19. --table categories \
  20. --username root \
  21. -P \
  22. --lines-terminated-by '§' \
  23. --fields-terminated-by '|' \
  24. --target-dir /user/cloudera/categories_new_sep
  25.  
  26. # Setting number of mappers to 2
  27. # Never put the password on the command line with --password; always use -P to be prompted for it
  28. sqoop import --connect jdbc:mysql://quickstart:3306/retail_db \
  29. --username root \
  30. -P \
  31. --table categories \
  32. --target-dir /user/cloudera/categories_pipe_2m \
  33. --fields-terminated-by '|' \
  34. -m 2
  35.  
  36. # Setting number of mappers to 1 (--num-mappers is the long form of -m)
  37. sqoop import --connect jdbc:mysql://quickstart:3306/retail_db \
  38. --username root \
  39. -P \
  40. --table categories \
  41. --target-dir /user/cloudera/categories_pipe_1m \
  42. --fields-terminated-by '|' \
  43. --num-mappers 1
  44.  
  45. # Import the categories table as Parquet files under the warehouse directory
  46. sqoop import --connect jdbc:mysql://quickstart:3306/retail_db \
  47. --table categories \
  48. --as-parquetfile \
  49. --fields-terminated-by "|" \
  50. --warehouse-dir /user/cloudera/parquets \
  51. --username root \
  52. -P
  53.  
  54. sqoop import --connect jdbc:mysql://quickstart:3306/retail_db \
  55. --table products \
  56. --columns "product_id,product_name,product_price" \
  57. --as-textfile \
  58. --fields-terminated-by "|" \
  59. --target-dir /user/cloudera/parquets/custom_columns \
  60. --username root \
  61. -P  # imports only the three listed columns of products as pipe-delimited text
  62.  
  63. sqoop import --connect jdbc:mysql://quickstart:3306/retail_db \
  64. --username root \
  65. -P \
  66. --query 'select a.*, b.* from products as a left join categories as b on a.product_category_id = b.category_id where $CONDITIONS' \
  67. --target-dir /user/cloudera/parquets/innerjoin \
  68. --split-by product_id \
  69. --as-textfile \
  70. --fields-terminated-by "|"  # free-form query import; the single quotes pass $CONDITIONS to Sqoop unexpanded
  71.  
  72. sqoop import --connect jdbc:mysql://quickstart:3306/retail_db \
  73. --username root \
  74. -P \
  75. --table products \
  76. --where '`product_id` < 100' \
  77. --target-dir /user/cloudera/parquets/filtered_data \
  78. --fields-terminated-by '|' \
  79. --as-textfile  # imports only rows matching --where; single quotes keep the backticks and '<' literal for the shell
  80.  
  81. sqoop import --connect jdbc:mysql://quickstart:3306/demo \
  82. --table names \
  83. --username root \
  84. -P \
  85. --null-non-string '0' \
  86. --null-string 'Unknown' \
  87. --fields-terminated-by "|" \
  88. --target-dir /user/cloudera/parquets/null_data2 \
  89. -m 1 --as-textfile  # single mapper; NULLs are written as "Unknown" (string columns) or "0" (non-string columns)
Add Comment
Please, Sign In to add comment