store_sales.sql 2.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869
  1. set hive.enforce.bucketing=true;
  2. set hive.exec.dynamic.partition.mode=nonstrict;
  3. set hive.exec.max.dynamic.partitions=4096;
  4. set hive.exec.max.dynamic.partitions.pernode=4096;
  5. set mapred.job.reduce.input.buffer.percent=0.0;
  6. create database if not exists ${DB};
  7. use ${DB};
  8. drop table if exists store_sales;
  9. create table store_sales
  10. (
  11. ss_sold_date_sk int,
  12. ss_sold_time_sk int,
  13. ss_item_sk int,
  14. ss_customer_sk int,
  15. ss_cdemo_sk int,
  16. ss_hdemo_sk int,
  17. ss_addr_sk int,
  18. ss_store_sk int,
  19. ss_promo_sk int,
  20. ss_ticket_number int,
  21. ss_quantity int,
  22. ss_wholesale_cost float,
  23. ss_list_price float,
  24. ss_sales_price float,
  25. ss_ext_discount_amt float,
  26. ss_ext_sales_price float,
  27. ss_ext_wholesale_cost float,
  28. ss_ext_list_price float,
  29. ss_ext_tax float,
  30. ss_coupon_amt float,
  31. ss_net_paid float,
  32. ss_net_paid_inc_tax float,
  33. ss_net_profit float
  34. )
  35. partitioned by (ss_sold_date string)
  36. stored as ${FILE};
  37. insert overwrite table store_sales partition (ss_sold_date)
  38. select
  39. ss.ss_sold_date_sk,
  40. ss.ss_sold_time_sk,
  41. ss.ss_item_sk,
  42. ss.ss_customer_sk,
  43. ss.ss_cdemo_sk,
  44. ss.ss_hdemo_sk,
  45. ss.ss_addr_sk,
  46. ss.ss_store_sk,
  47. ss.ss_promo_sk,
  48. ss.ss_ticket_number,
  49. ss.ss_quantity,
  50. ss.ss_wholesale_cost,
  51. ss.ss_list_price,
  52. ss.ss_sales_price,
  53. ss.ss_ext_discount_amt,
  54. ss.ss_ext_sales_price,
  55. ss.ss_ext_wholesale_cost,
  56. ss.ss_ext_list_price,
  57. ss.ss_ext_tax,
  58. ss.ss_coupon_amt,
  59. ss.ss_net_paid,
  60. ss.ss_net_paid_inc_tax,
  61. ss.ss_net_profit,
  62. dd.d_date as ss_sold_date
  63. from ${SOURCE}.store_sales ss
  64. left outer join ${SOURCE}.date_dim dd
  65. on (ss.ss_sold_date_sk = dd.d_date_sk);