-- Reproduction script (HiveQL): multi-insert with dynamic partitioning into a
-- partitioned, bucketed, transactional ORC table, followed by the EXPLAIN
-- output captured from the original Hive CLI session.
--
-- The statements were originally pasted as a CLI transcript. The prompt and
-- continuation markers have been removed so the file runs as a script, and the
-- captured output is kept verbatim as line comments at the end.
--
-- Prerequisite: the source table tpcds_text_1000.store_sales must already exist.
-- NOTE(review): the captured plan names the target as
-- tpcds_bin_partitioned_acid_1000.store_sales, so presumably that was the
-- current database when the session ran - confirm before re-running.
-- NOTE(review): no ACID session settings (hive.support.concurrency,
-- hive.txn.manager) appear in the session - presumably configured on the
-- server side, confirm.

-- Target table. Column types are kept exactly as in the session (including
-- double for the amount columns) so that the captured plan below still matches.
CREATE TABLE store_sales (
    ss_sold_time_sk        BIGINT,
    ss_item_sk             BIGINT,
    ss_customer_sk         BIGINT,
    ss_cdemo_sk            BIGINT,
    ss_hdemo_sk            BIGINT,
    ss_addr_sk             BIGINT,
    ss_store_sk            BIGINT,
    ss_promo_sk            BIGINT,
    ss_ticket_number       BIGINT,
    ss_quantity            INT,
    ss_wholesale_cost      DOUBLE,
    ss_list_price          DOUBLE,
    ss_sales_price         DOUBLE,
    ss_ext_discount_amt    DOUBLE,
    ss_ext_sales_price     DOUBLE,
    ss_ext_wholesale_cost  DOUBLE,
    ss_ext_list_price      DOUBLE,
    ss_ext_tax             DOUBLE,
    ss_coupon_amt          DOUBLE,
    ss_net_paid            DOUBLE,
    ss_net_paid_inc_tax    DOUBLE,
    ss_net_profit          DOUBLE
)
PARTITIONED BY (ss_sold_date_sk BIGINT)
CLUSTERED BY (ss_ticket_number) INTO 2 BUCKETS
STORED AS ORC
TBLPROPERTIES (
    'transactional' = 'true',
    'transactional_properties' = 'default'
);

-- Session settings used for the capture: dynamic partitioning in nonstrict
-- mode with raised partition limits, sorted dynamic partition optimization
-- switched on, and the non-user-level EXPLAIN format.
SET hive.exec.max.dynamic.partitions.pernode=10000;
SET hive.exec.max.dynamic.partitions=100000;
SET hive.exec.dynamic.partition=true;
SET hive.exec.dynamic.partition.mode=nonstrict;
SET hive.optimize.sort.dynamic.partition=true;
SET hive.explain.user=false;

-- Single scan of the source feeding two inserts into the same target table.
-- The first insert takes rows whose partition key is not null, the second
-- takes rows whose partition key is null. Both select the same 22 data
-- columns followed by the dynamic partition column ss_sold_date_sk.
EXPLAIN
FROM tpcds_text_1000.store_sales ss
INSERT INTO TABLE store_sales PARTITION (ss_sold_date_sk)
    SELECT
        ss.ss_sold_time_sk,
        ss.ss_item_sk,
        ss.ss_customer_sk,
        ss.ss_cdemo_sk,
        ss.ss_hdemo_sk,
        ss.ss_addr_sk,
        ss.ss_store_sk,
        ss.ss_promo_sk,
        ss.ss_ticket_number,
        ss.ss_quantity,
        ss.ss_wholesale_cost,
        ss.ss_list_price,
        ss.ss_sales_price,
        ss.ss_ext_discount_amt,
        ss.ss_ext_sales_price,
        ss.ss_ext_wholesale_cost,
        ss.ss_ext_list_price,
        ss.ss_ext_tax,
        ss.ss_coupon_amt,
        ss.ss_net_paid,
        ss.ss_net_paid_inc_tax,
        ss.ss_net_profit,
        ss.ss_sold_date_sk
    WHERE ss.ss_sold_date_sk IS NOT NULL
INSERT INTO TABLE store_sales PARTITION (ss_sold_date_sk)
    SELECT
        ss.ss_sold_time_sk,
        ss.ss_item_sk,
        ss.ss_customer_sk,
        ss.ss_cdemo_sk,
        ss.ss_hdemo_sk,
        ss.ss_addr_sk,
        ss.ss_store_sk,
        ss.ss_promo_sk,
        ss.ss_ticket_number,
        ss.ss_quantity,
        ss.ss_wholesale_cost,
        ss.ss_list_price,
        ss.ss_sales_price,
        ss.ss_ext_discount_amt,
        ss.ss_ext_sales_price,
        ss.ss_ext_wholesale_cost,
        ss.ss_ext_list_price,
        ss.ss_ext_tax,
        ss.ss_coupon_amt,
        ss.ss_net_paid,
        ss.ss_net_paid_inc_tax,
        ss.ss_net_profit,
        ss.ss_sold_date_sk
    WHERE ss.ss_sold_date_sk IS NULL
;

-- ---------------------------------------------------------------------------
-- Captured output of the EXPLAIN above (verbatim text, line breaks and
-- indentation restored).
--
-- What the capture shows: the "is not null" branch shuffles on the key
-- (_col22, '_bucket_number') with sort order ++ and partitions by _col22,
-- while the "is null" branch has an empty sort order, partitions by _col8,
-- and Reducer 3 emits a constant null for the partition column.
-- NOTE(review): presumably this asymmetry between the two branches is what
-- the capture was meant to illustrate - confirm with the original author.
-- ---------------------------------------------------------------------------
-- OK
-- STAGE DEPENDENCIES:
--   Stage-2 is a root stage
--   Stage-3 depends on stages: Stage-2
--   Stage-0 depends on stages: Stage-3
--   Stage-4 depends on stages: Stage-0
--   Stage-1 depends on stages: Stage-3
--   Stage-5 depends on stages: Stage-1
--
-- STAGE PLANS:
--   Stage: Stage-2
--     Tez
--       DagId: hive_20170703065604_6c0a9bf5-dbd0-403c-87cb-f13253e459ed:1
--       Edges:
--         Reducer 2 <- Map 1 (SIMPLE_EDGE)
--         Reducer 3 <- Map 1 (SIMPLE_EDGE)
--       DagName:
--       Vertices:
--         Map 1
--             Map Operator Tree:
--                 TableScan
--                   alias: ss
--                   Statistics: Num rows: 2326249836 Data size: 418724970496 Basic stats: COMPLETE Column stats: NONE
--                   Filter Operator
--                     predicate: ss_sold_date_sk is not null (type: boolean)
--                     Statistics: Num rows: 2326249836 Data size: 418724970496 Basic stats: COMPLETE Column stats: NONE
--                     Select Operator
--                       expressions: ss_sold_time_sk (type: bigint), ss_item_sk (type: bigint), ss_customer_sk (type: bigint), ss_cdemo_sk (type: bigint), ss_hdemo_sk (type: bigint), ss_addr_sk (type: bigint), ss_store_sk (type: bigint), ss_promo_sk (type: bigint), ss_ticket_number (type: bigint), ss_quantity (type: int), ss_wholesale_cost (type: double), ss_list_price (type: double), ss_sales_price (type: double), ss_ext_discount_amt (type: double), ss_ext_sales_price (type: double), ss_ext_wholesale_cost (type: double), ss_ext_list_price (type: double), ss_ext_tax (type: double), ss_coupon_amt (type: double), ss_net_paid (type: double), ss_net_paid_inc_tax (type: double), ss_net_profit (type: double), ss_sold_date_sk (type: bigint)
--                       outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col17, _col18, _col19, _col20, _col21, _col22
--                       Statistics: Num rows: 2326249836 Data size: 418724970496 Basic stats: COMPLETE Column stats: NONE
--                       Reduce Output Operator
--                         key expressions: _col22 (type: bigint), '_bucket_number' (type: string)
--                         sort order: ++
--                         Map-reduce partition columns: _col22 (type: bigint)
--                         Statistics: Num rows: 2326249836 Data size: 418724970496 Basic stats: COMPLETE Column stats: NONE
--                         value expressions: _col0 (type: bigint), _col1 (type: bigint), _col2 (type: bigint), _col3 (type: bigint), _col4 (type: bigint), _col5 (type: bigint), _col6 (type: bigint), _col7 (type: bigint), _col8 (type: bigint), _col9 (type: int), _col10 (type: double), _col11 (type: double), _col12 (type: double), _col13 (type: double), _col14 (type: double), _col15 (type: double), _col16 (type: double), _col17 (type: double), _col18 (type: double), _col19 (type: double), _col20 (type: double), _col21 (type: double)
--                   Filter Operator
--                     predicate: ss_sold_date_sk is null (type: boolean)
--                     Statistics: Num rows: 1163124918 Data size: 209362485248 Basic stats: COMPLETE Column stats: NONE
--                     Select Operator
--                       expressions: ss_sold_time_sk (type: bigint), ss_item_sk (type: bigint), ss_wholesale_cost (type: double), ss_list_price (type: double), ss_sales_price (type: double), ss_ext_discount_amt (type: double), ss_ext_sales_price (type: double), ss_ext_wholesale_cost (type: double), ss_ext_list_price (type: double), ss_ext_tax (type: double), ss_coupon_amt (type: double), ss_net_paid (type: double), ss_customer_sk (type: bigint), ss_net_paid_inc_tax (type: double), ss_net_profit (type: double), ss_cdemo_sk (type: bigint), ss_hdemo_sk (type: bigint), ss_addr_sk (type: bigint), ss_store_sk (type: bigint), ss_promo_sk (type: bigint), ss_ticket_number (type: bigint), ss_quantity (type: int)
--                       outputColumnNames: _col0, _col1, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col17, _col18, _col19, _col2, _col20, _col21, _col3, _col4, _col5, _col6, _col7, _col8, _col9
--                       Statistics: Num rows: 1163124918 Data size: 209362485248 Basic stats: COMPLETE Column stats: NONE
--                       Reduce Output Operator
--                         sort order:
--                         Map-reduce partition columns: _col8 (type: bigint)
--                         Statistics: Num rows: 1163124918 Data size: 209362485248 Basic stats: COMPLETE Column stats: NONE
--                         value expressions: _col0 (type: bigint), _col1 (type: bigint), _col2 (type: bigint), _col3 (type: bigint), _col4 (type: bigint), _col5 (type: bigint), _col6 (type: bigint), _col7 (type: bigint), _col8 (type: bigint), _col9 (type: int), _col10 (type: double), _col11 (type: double), _col12 (type: double), _col13 (type: double), _col14 (type: double), _col15 (type: double), _col16 (type: double), _col17 (type: double), _col18 (type: double), _col19 (type: double), _col20 (type: double), _col21 (type: double)
--             Execution mode: llap
--             LLAP IO: no inputs
--         Reducer 2
--             Execution mode: vectorized, llap
--             Reduce Operator Tree:
--               Select Operator
--                 expressions: VALUE._col0 (type: bigint), VALUE._col1 (type: bigint), VALUE._col2 (type: bigint), VALUE._col3 (type: bigint), VALUE._col4 (type: bigint), VALUE._col5 (type: bigint), VALUE._col6 (type: bigint), VALUE._col7 (type: bigint), VALUE._col8 (type: bigint), VALUE._col9 (type: int), VALUE._col10 (type: double), VALUE._col11 (type: double), VALUE._col12 (type: double), VALUE._col13 (type: double), VALUE._col14 (type: double), VALUE._col15 (type: double), VALUE._col16 (type: double), VALUE._col17 (type: double), VALUE._col18 (type: double), VALUE._col19 (type: double), VALUE._col20 (type: double), VALUE._col21 (type: double), KEY._col22 (type: bigint), KEY.'_bucket_number' (type: string)
--                 outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col17, _col18, _col19, _col20, _col21, _col22, '_bucket_number'
--                 Statistics: Num rows: 2326249836 Data size: 418724970496 Basic stats: COMPLETE Column stats: NONE
--                 File Output Operator
--                   compressed: false
--                   Statistics: Num rows: 2326249836 Data size: 418724970496 Basic stats: COMPLETE Column stats: NONE
--                   table:
--                       input format: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat
--                       output format: org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat
--                       serde: org.apache.hadoop.hive.ql.io.orc.OrcSerde
--                       name: tpcds_bin_partitioned_acid_1000.store_sales
--         Reducer 3
--             Execution mode: vectorized, llap
--             Reduce Operator Tree:
--               Select Operator
--                 expressions: VALUE._col0 (type: bigint), VALUE._col1 (type: bigint), VALUE._col2 (type: bigint), VALUE._col3 (type: bigint), VALUE._col4 (type: bigint), VALUE._col5 (type: bigint), VALUE._col6 (type: bigint), VALUE._col7 (type: bigint), VALUE._col8 (type: bigint), VALUE._col9 (type: int), VALUE._col10 (type: double), VALUE._col11 (type: double), VALUE._col12 (type: double), VALUE._col13 (type: double), VALUE._col14 (type: double), VALUE._col15 (type: double), VALUE._col16 (type: double), VALUE._col17 (type: double), VALUE._col18 (type: double), VALUE._col19 (type: double), VALUE._col20 (type: double), VALUE._col21 (type: double), null (type: bigint)
--                 outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col17, _col18, _col19, _col20, _col21, _col22
--                 Statistics: Num rows: 1163124918 Data size: 209362485248 Basic stats: COMPLETE Column stats: NONE
--                 File Output Operator
--                   compressed: false
--                   Statistics: Num rows: 1163124918 Data size: 209362485248 Basic stats: COMPLETE Column stats: NONE
--                   table:
--                       input format: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat
--                       output format: org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat
--                       serde: org.apache.hadoop.hive.ql.io.orc.OrcSerde
--                       name: tpcds_bin_partitioned_acid_1000.store_sales
--
--   Stage: Stage-3
--     Dependency Collection
--
--   Stage: Stage-0
--     Move Operator
--       tables:
--           partition:
--             ss_sold_date_sk
--           replace: false
--           table:
--               input format: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat
--               output format: org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat
--               serde: org.apache.hadoop.hive.ql.io.orc.OrcSerde
--               name: tpcds_bin_partitioned_acid_1000.store_sales
--
--   Stage: Stage-4
--     Stats-Aggr Operator
--
--   Stage: Stage-1
--     Move Operator
--       tables:
--           partition:
--             ss_sold_date_sk
--           replace: false
--           table:
--               input format: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat
--               output format: org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat
--               serde: org.apache.hadoop.hive.ql.io.orc.OrcSerde
--               name: tpcds_bin_partitioned_acid_1000.store_sales
--
--   Stage: Stage-5
--     Stats-Aggr Operator