web_returns.sql 2.2 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071
  set hive.exec.dynamic.partition.mode=nonstrict;
  set hive.exec.max.dynamic.partitions=4096;
  set hive.exec.max.dynamic.partitions.pernode=4096;
  set hive.enforce.bucketing=true;
  set mapred.job.reduce.input.buffer.percent=0.0;

  -- The session settings above prepare the dynamic-partition load in this script:
  --   * nonstrict mode lets every partition key in an insert be dynamic
  --   * at most 4096 dynamic partitions may be created overall and per node
  --   * bucketing enforcement is switched on for inserts
  --   * the reduce-side input buffer percentage is set to 0.0
  --
  -- Work inside the target database, creating it on first use.
  -- ${DB} is a variable substituted before the script runs.
  create database if not exists ${DB};
  use ${DB};
  -- Rebuild web_returns from scratch: any existing table is dropped first.
  drop table if exists web_returns;

  -- Column order matches the select list of the insert statement that loads
  -- this table. The table is partitioned by the string column wr_returned_date
  -- and its storage format comes from the ${FILE} variable.
  -- NOTE(review): the amount-like columns (wr_return_amt through wr_net_loss)
  -- are float - presumably currency values, for which decimal would be exact.
  -- TODO confirm before changing the schema.
  create table web_returns (
      wr_returned_date_sk       int,
      wr_returned_time_sk       int,
      wr_item_sk                int,
      wr_refunded_customer_sk   int,
      wr_refunded_cdemo_sk      int,
      wr_refunded_hdemo_sk      int,
      wr_refunded_addr_sk       int,
      wr_returning_customer_sk  int,
      wr_returning_cdemo_sk     int,
      wr_returning_hdemo_sk     int,
      wr_returning_addr_sk      int,
      wr_web_page_sk            int,
      wr_reason_sk              int,
      wr_order_number           int,
      wr_return_quantity        int,
      wr_return_amt             float,
      wr_return_tax             float,
      wr_return_amt_inc_tax     float,
      wr_fee                    float,
      wr_return_ship_cost       float,
      wr_refunded_cash          float,
      wr_reversed_charge        float,
      wr_account_credit         float,
      wr_net_loss               float
  )
  partitioned by (wr_returned_date string)
  stored as ${FILE};
  -- Load web_returns from ${SOURCE}.web_returns with dynamic partitioning.
  -- The final select column (wr_returned_date) supplies the partition value,
  -- taken from date_dim.d_date via the returned-date surrogate key.
  -- The outer join keeps returns that have no matching date_dim row - their
  -- d_date is null, so they are not dropped from the load.
  insert overwrite table web_returns partition (wr_returned_date)
  select
      ret.wr_returned_date_sk,
      ret.wr_returned_time_sk,
      ret.wr_item_sk,
      ret.wr_refunded_customer_sk,
      ret.wr_refunded_cdemo_sk,
      ret.wr_refunded_hdemo_sk,
      ret.wr_refunded_addr_sk,
      ret.wr_returning_customer_sk,
      ret.wr_returning_cdemo_sk,
      ret.wr_returning_hdemo_sk,
      ret.wr_returning_addr_sk,
      ret.wr_web_page_sk,
      ret.wr_reason_sk,
      ret.wr_order_number,
      ret.wr_return_quantity,
      ret.wr_return_amt,
      ret.wr_return_tax,
      ret.wr_return_amt_inc_tax,
      ret.wr_fee,
      ret.wr_return_ship_cost,
      ret.wr_refunded_cash,
      ret.wr_reversed_charge,
      ret.wr_account_credit,
      ret.wr_net_loss,
      cal.d_date as wr_returned_date
  from ${SOURCE}.web_returns ret
  left outer join ${SOURCE}.date_dim cal
      on ret.wr_returned_date_sk = cal.d_date_sk;