explain vectorization detail MERGE INTO tpcds_1000_iceberg_mor_v4.store_sales_delete_1 t USING tpcds_1000_update.ssv s ON (t.ss_item_sk = s.ss_item_sk AND t.ss_customer_sk=s.ss_customer_sk AND t.ss_sold_date_sk = "2451181" AND ((Floor((s.ss_item_sk) / 1000) * 1000) BETWEEN 1000 AND 2000) AND s.ss_ext_discount_amt < 0.0) WHEN matched AND t.ss_ext_discount_amt IS NULL THEN UPDATE SET ss_ext_discount_amt = 0.0 WHEN NOT matched THEN INSERT (ss_sold_time_sk, ss_item_sk, ss_customer_sk, ss_cdemo_sk, ss_hdemo_sk, ss_addr_sk, ss_store_sk, ss_promo_sk, ss_ticket_number, ss_quantity, ss_wholesale_cost, ss_list_price, ss_sales_price, ss_ext_discount_amt, ss_ext_sales_price, ss_ext_wholesale_cost, ss_ext_list_price, ss_ext_tax, ss_coupon_amt, ss_net_paid, ss_net_paid_inc_tax, ss_net_profit, ss_sold_date_sk) VALUES (s.ss_sold_time_sk, s.ss_item_sk, s.ss_customer_sk, s.ss_cdemo_sk, s.ss_hdemo_sk, s.ss_addr_sk, s.ss_store_sk, s.ss_promo_sk, s.ss_ticket_number, s.ss_quantity, s.ss_wholesale_cost, s.ss_list_price, s.ss_sales_price, s.ss_ext_discount_amt, s.ss_ext_sales_price, s.ss_ext_wholesale_cost, s.ss_ext_list_price, s.ss_ext_tax, s.ss_coupon_amt, s.ss_net_paid, s.ss_net_paid_inc_tax, s.ss_net_profit, "2451181") INFO : Starting task [Stage-8:EXPLAIN] in serial mode INFO : Completed executing command(queryId=hive_20230130052219_cf1bf75e-b27b-4993-91af-16bea8cc4c7f); Time taken: 0.023 seconds INFO : OK Explain PLAN VECTORIZATION: enabled: true enabledConditionsMet: [hive.vectorized.execution.enabled IS true] STAGE DEPENDENCIES: Stage-4 is a root stage Stage-5 depends on stages: Stage-4 Stage-0 depends on stages: Stage-5 Stage-6 depends on stages: Stage-0 Stage-3 depends on stages: Stage-5 Stage-7 depends on stages: Stage-3 STAGE PLANS: Stage: Stage-4 Tez DagId: hive_20230130052219_cf1bf75e-b27b-4993-91af-16bea8cc4c7f:55 Edges: Reducer 2 <- Map 1 (CUSTOM_SIMPLE_EDGE), Map 5 (CUSTOM_SIMPLE_EDGE) Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Reducer 4 <- Reducer 2 (SIMPLE_EDGE) DagName: hive_20230130052219_cf1bf75e-b27b-4993-91af-16bea8cc4c7f:55 Vertices: Map 1 Map Operator Tree: TableScan alias: s Statistics: Num rows: 18864648 Data size: 26059576152 Basic stats: COMPLETE Column stats: COMPLETE TableScan Vectorization: native: true vectorizationSchemaColumns: [0:ss_sold_date_sk:int, 1:ss_sold_time_sk:int, 2:ss_item_sk:int, 3:ss_customer_sk:int, 4:ss_cdemo_sk:int, 5:ss_hdemo_sk:int, 6:ss_addr_sk:int, 7:ss_store_sk:int, 8:ss_promo_sk:int, 9:ss_ticket_number:int, 10:ss_quantity:int, 11:ss_wholesale_cost:decimal(7,2), 12:ss_list_price:decimal(7,2), 13:ss_sales_price:decimal(7,2), 14:ss_ext_discount_amt:decimal(19,2), 15:ss_ext_sales_price:decimal(18,2), 16:ss_ext_wholesale_cost:decimal(18,2), 17:ss_ext_list_price:decimal(18,2), 18:ss_ext_tax:decimal(13,4), 19:ss_coupon_amt:decimal(7,2), 20:ss_net_paid:decimal(19,2), 21:ss_net_paid_inc_tax:decimal(26,4), 22:ss_net_profit:decimal(20,2), 23:ROW__ID:struct, 24:ROW__IS__DELETED:boolean] Select Operator expressions: ss_sold_time_sk (type: int), ss_item_sk (type: int), ss_customer_sk (type: int), ss_cdemo_sk (type: int), ss_hdemo_sk (type: int), ss_addr_sk (type: int), ss_store_sk (type: int), ss_promo_sk (type: int), ss_ticket_number (type: int), ss_quantity (type: int), ss_wholesale_cost (type: decimal(7,2)), ss_list_price (type: decimal(7,2)), ss_sales_price (type: decimal(7,2)), ss_ext_discount_amt (type: decimal(19,2)), ss_ext_sales_price (type: decimal(18,2)), ss_ext_wholesale_cost (type: decimal(18,2)), ss_ext_list_price (type: decimal(18,2)), ss_ext_tax (type: decimal(13,4)), ss_coupon_amt (type: decimal(7,2)), ss_net_paid (type: decimal(19,2)), ss_net_paid_inc_tax (type: decimal(26,4)), ss_net_profit (type: decimal(20,2)), (1000L <= (floor((UDFToDouble(ss_item_sk) / 1000.0D)) * 1000L)) (type: boolean), ((floor((UDFToDouble(ss_item_sk) / 1000.0D)) * 1000L) <= 2000L) (type: boolean), (ss_ext_discount_amt < 0) (type: boolean) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col17, _col18, _col19, _col20, _col21, _col22, _col23, _col24 Select Vectorization: className: VectorSelectOperator native: true projectedOutputColumnNums: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 29, 34, 35] selectExpressions: LongScalarLessEqualLongColumn(val 1000, col 28:bigint)(children: LongColMultiplyLongScalar(col 27:bigint, val 1000)(children: FuncFloorDoubleToLong(col 26:double)(children: DoubleColDivideDoubleScalar(col 25:double, val 1000.0)(children: CastLongToDouble(col 2:int) -> 25:double) -> 26:double) -> 27:bigint) -> 28:bigint) -> 29:boolean, LongColLessEqualLongScalar(col 33:bigint, val 2000)(children: LongColMultiplyLongScalar(col 32:bigint, val 1000)(children: FuncFloorDoubleToLong(col 31:double)(children: DoubleColDivideDoubleScalar(col 30:double, val 1000.0)(children: CastLongToDouble(col 2:int) -> 30:double) -> 31:double) -> 32:bigint) -> 33:bigint) -> 34:boolean, DecimalColLessDecimalScalar(col 14:decimal(19,2), val 0) -> 35:boolean Statistics: Num rows: 18864648 Data size: 26285951928 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: int), _col2 (type: int) null sort order: aa sort order: ++ Map-reduce partition columns: _col1 (type: int), _col2 (type: int) Reduce Sink Vectorization: className: VectorReduceSinkMultiKeyOperator keyColumns: 2:int, 3:int native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumns: 1:int, 4:int, 5:int, 6:int, 7:int, 8:int, 9:int, 10:int, 11:decimal(7,2), 12:decimal(7,2), 13:decimal(7,2), 14:decimal(19,2), 15:decimal(18,2), 16:decimal(18,2), 17:decimal(18,2), 18:decimal(13,4), 19:decimal(7,2), 20:decimal(19,2), 21:decimal(26,4), 22:decimal(20,2), 29:boolean, 34:boolean, 35:boolean Statistics: Num rows: 18864648 Data size: 26285951928 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: int), _col6 (type: int), _col7 (type: int), _col8 (type: int), _col9 (type: int), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)), _col12 (type: decimal(7,2)), _col13 (type: decimal(19,2)), _col14 (type: decimal(18,2)), _col15 (type: decimal(18,2)), _col16 (type: decimal(18,2)), _col17 (type: decimal(13,4)), _col18 (type: decimal(7,2)), _col19 (type: decimal(19,2)), _col20 (type: decimal(26,4)), _col21 (type: decimal(20,2)), _col22 (type: boolean), _col23 (type: boolean), _col24 (type: boolean) Execution mode: vectorized, llap LLAP IO: all inputs (cache only) Map Vectorization: enabled: true enabledConditionsMet: hive.vectorized.use.vectorized.input.format IS true inputFormatFeatureSupport: [] featureSupportInUse: [] inputFileFormats: org.apache.hadoop.hive.ql.io.parquet.MapredParquetInputFormat allNative: true usesVectorUDFAdaptor: false vectorized: true rowBatchContext: dataColumnCount: 23 includeColumns: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22] dataColumns: ss_sold_date_sk:int, ss_sold_time_sk:int, ss_item_sk:int, ss_customer_sk:int, ss_cdemo_sk:int, ss_hdemo_sk:int, ss_addr_sk:int, ss_store_sk:int, ss_promo_sk:int, ss_ticket_number:int, ss_quantity:int, ss_wholesale_cost:decimal(7,2), ss_list_price:decimal(7,2), ss_sales_price:decimal(7,2), ss_ext_discount_amt:decimal(19,2), ss_ext_sales_price:decimal(18,2), ss_ext_wholesale_cost:decimal(18,2), ss_ext_list_price:decimal(18,2), ss_ext_tax:decimal(13,4), ss_coupon_amt:decimal(7,2), ss_net_paid:decimal(19,2), ss_net_paid_inc_tax:decimal(26,4), ss_net_profit:decimal(20,2) partitionColumnCount: 0 scratchColumnTypeNames: [double, double, bigint, bigint, bigint, double, double, bigint, bigint, bigint, bigint] Map 5 Map Operator Tree: TableScan alias: store_sales_delete_1 filterExpr: ((ss_sold_date_sk = 2451181) and ss_item_sk is not null and ss_customer_sk is not null) (type: boolean) Statistics: (RUNTIME) Num rows: 18864648 Data size: 24939064656 Basic stats: COMPLETE Column stats: NONE Filter Operator predicate: ((ss_sold_date_sk = 2451181) and ss_item_sk is not null and ss_customer_sk is not null) (type: boolean) Statistics: (RUNTIME) Num rows: 18864648 Data size: 24939064656 Basic stats: COMPLETE Column stats: NONE Select Operator expressions: PARTITION__SPEC__ID (type: int), PARTITION__HASH (type: bigint), FILE__PATH (type: string), ROW__POSITION (type: bigint), ss_sold_time_sk (type: int), ss_cdemo_sk (type: int), ss_hdemo_sk (type: int), ss_addr_sk (type: int), ss_store_sk (type: int), ss_promo_sk (type: int), ss_ticket_number (type: bigint), ss_quantity (type: int), ss_wholesale_cost (type: decimal(7,2)), ss_list_price (type: decimal(7,2)), ss_sales_price (type: decimal(7,2)), ss_ext_discount_amt (type: decimal(7,2)), ss_ext_sales_price (type: decimal(7,2)), ss_ext_wholesale_cost (type: decimal(7,2)), ss_ext_list_price (type: decimal(7,2)), ss_ext_tax (type: decimal(7,2)), ss_coupon_amt (type: decimal(7,2)), ss_net_paid (type: decimal(7,2)), ss_net_paid_inc_tax (type: decimal(7,2)), ss_net_profit (type: decimal(7,2)), 2451181 (type: int), ss_sold_time_sk (type: int), ss_item_sk (type: int), ss_customer_sk (type: int), ss_cdemo_sk (type: int), ss_hdemo_sk (type: int), ss_addr_sk (type: int), ss_store_sk (type: int), ss_promo_sk (type: int), ss_ticket_number (type: bigint), ss_quantity (type: int), ss_wholesale_cost (type: decimal(7,2)), ss_list_price (type: decimal(7,2)), ss_sales_price (type: decimal(7,2)), ss_ext_discount_amt (type: decimal(7,2)), ss_ext_sales_price (type: decimal(7,2)), ss_ext_wholesale_cost (type: decimal(7,2)), ss_ext_list_price (type: decimal(7,2)), ss_ext_tax (type: decimal(7,2)), ss_coupon_amt (type: decimal(7,2)), ss_net_paid (type: decimal(7,2)), ss_net_paid_inc_tax (type: decimal(7,2)), ss_net_profit (type: decimal(7,2)), 2451181 (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col17, _col18, _col19, _col20, _col21, _col22, _col23, _col24, _col25, _col26, _col27, _col28, _col29, _col30, _col31, _col32, _col33, _col34, _col35, _col36, _col37, _col38, _col39, _col40, _col41, _col42, _col43, _col44, _col45, _col46, _col47, _col48, _col49 Statistics: (RUNTIME) Num rows: 18864648 Data size: 24939064656 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator key expressions: _col28 (type: int), _col29 (type: int) null sort order: aa sort order: ++ Map-reduce partition columns: _col28 (type: int), _col29 (type: int) Statistics: (RUNTIME) Num rows: 18864648 Data size: 24939064656 Basic stats: COMPLETE Column stats: NONE value expressions: _col0 (type: int), _col1 (type: bigint), _col2 (type: string), _col3 (type: bigint), _col4 (type: int), _col7 (type: int), _col8 (type: int), _col9 (type: int), _col10 (type: int), _col11 (type: int), _col12 (type: bigint), _col13 (type: int), _col14 (type: decimal(7,2)), _col15 (type: decimal(7,2)), _col16 (type: decimal(7,2)), _col17 (type: decimal(7,2)), _col18 (type: decimal(7,2)), _col19 (type: decimal(7,2)), _col20 (type: decimal(7,2)), _col21 (type: decimal(7,2)), _col22 (type: decimal(7,2)), _col23 (type: decimal(7,2)), _col24 (type: decimal(7,2)), _col25 (type: decimal(7,2)), _col26 (type: int), _col27 (type: int), _col30 (type: int), _col31 (type: int), _col32 (type: int), _col33 (type: int), _col34 (type: int), _col35 (type: bigint), _col36 (type: int), _col37 (type: decimal(7,2)), _col38 (type: decimal(7,2)), _col39 (type: decimal(7,2)), _col40 (type: decimal(7,2)), _col41 (type: decimal(7,2)), _col42 (type: decimal(7,2)), _col43 (type: decimal(7,2)), _col44 (type: decimal(7,2)), _col45 (type: decimal(7,2)), _col46 (type: decimal(7,2)), _col47 (type: decimal(7,2)), _col48 (type: decimal(7,2)), _col49 (type: int) Execution mode: llap LLAP IO: no inputs Map Vectorization: enabled: true enabledConditionsMet: hive.vectorized.use.vectorized.input.format IS true inputFileFormats: org.apache.iceberg.mr.hive.HiveIcebergInputFormat notVectorizedReason: Select expression for SELECT operator: Virtual column PARTITION__SPEC__ID is not supported vectorized: false Reducer 2 Execution mode: llap Reduce Vectorization: enabled: true enableConditionsMet: hive.vectorized.execution.reduce.enabled IS true, hive.execution.engine tez IN [tez] IS true notVectorizedReason: exception: java.lang.RuntimeException: Full Outer Small Table Key Mapping duplicate column 0 in ordered column map {0=(value column: 30, type info: int), 1=(value column: 31, type info: int)} when adding value column 53, type into int stack trace: org.apache.hadoop.hive.ql.exec.vector.VectorColumnOrderedMap.add(VectorColumnOrderedMap.java:102), org.apache.hadoop.hive.ql.exec.vector.VectorColumnSourceMapping.add(VectorColumnSourceMapping.java:41), org.apache.hadoop.hive.ql.optimizer.physical.Vectorizer.canSpecializeMapJoin(Vectorizer.java:3865), org.apache.hadoop.hive.ql.optimizer.physical.Vectorizer.validateAndVectorizeOperator(Vectorizer.java:5246), org.apache.hadoop.hive.ql.optimizer.physical.Vectorizer.doProcessChild(Vectorizer.java:988), org.apache.hadoop.hive.ql.optimizer.physical.Vectorizer.doProcessChildren(Vectorizer.java:874), org.apache.hadoop.hive.ql.optimizer.physical.Vectorizer.validateAndVectorizeOperatorTree(Vectorizer.java:841), org.apache.hadoop.hive.ql.optimizer.physical.Vectorizer.access$2400(Vectorizer.java:251), org.apache.hadoop.hive.ql.optimizer.physical.Vectorizer$VectorizationDispatcher.validateAndVectorizeReduceOperators(Vectorizer.java:2298), org.apache.hadoop.hive.ql.optimizer.physical.Vectorizer$VectorizationDispatcher.validateAndVectorizeReduceOperators(Vectorizer.java:2246), org.apache.hadoop.hive.ql.optimizer.physical.Vectorizer$VectorizationDispatcher.validateAndVectorizeReduceWork(Vectorizer.java:2224), org.apache.hadoop.hive.ql.optimizer.physical.Vectorizer$VectorizationDispatcher.convertReduceWork(Vectorizer.java:2206), org.apache.hadoop.hive.ql.optimizer.physical.Vectorizer$VectorizationDispatcher.dispatch(Vectorizer.java:1038), org.apache.hadoop.hive.ql.lib.TaskGraphWalker.dispatch(TaskGraphWalker.java:111), org.apache.hadoop.hive.ql.lib.TaskGraphWalker.walk(TaskGraphWalker.java:180), ... vectorized: false Reduce Operator Tree: Map Join Operator condition map: Left Outer Join 0 to 1 filter predicates: 0 {VALUE._col20} {VALUE._col21} {VALUE._col22} 1 keys: 0 KEY.reducesinkkey0 (type: int), KEY.reducesinkkey1 (type: int) 1 KEY.reducesinkkey0 (type: int), KEY.reducesinkkey1 (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col17, _col18, _col19, _col20, _col21, _col25, _col26, _col27, _col28, _col29, _col30, _col31, _col32, _col33, _col34, _col35, _col36, _col37, _col38, _col39, _col40, _col41, _col42, _col43, _col44, _col45, _col46, _col47, _col48, _col49, _col50, _col51, _col52, _col53, _col54, _col55, _col56, _col57, _col58, _col59, _col60, _col61, _col62, _col63, _col64, _col65, _col66, _col67, _col68, _col69, _col70, _col71, _col72, _col73, _col74 input vertices: 1 Map 5 Statistics: Num rows: 20751113 Data size: 28914547747 Basic stats: COMPLETE Column stats: NONE DynamicPartitionHashJoin: true Select Operator expressions: _col62 (type: decimal(7,2)), _col19 (type: decimal(19,2)), _col55 (type: int), _col61 (type: int), _col21 (type: decimal(20,2)), _col25 (type: int), _col7 (type: int), _col3 (type: int), _col51 (type: int), _col10 (type: decimal(7,2)), _col30 (type: int), _col37 (type: bigint), _col42 (type: decimal(7,2)), _col71 (type: decimal(7,2)), _col60 (type: bigint), _col6 (type: int), _col72 (type: decimal(7,2)), _col2 (type: int), _col33 (type: int), _col11 (type: decimal(7,2)), _col29 (type: int), _col56 (type: int), _col48 (type: decimal(7,2)), _col17 (type: decimal(13,4)), _col43 (type: decimal(7,2)), _col14 (type: decimal(18,2)), _col67 (type: decimal(7,2)), _col1 (type: int), _col69 (type: decimal(7,2)), _col20 (type: decimal(26,4)), _col35 (type: int), _col44 (type: decimal(7,2)), _col8 (type: int), _col57 (type: int), _col53 (type: int), _col45 (type: decimal(7,2)), _col63 (type: decimal(7,2)), _col47 (type: decimal(7,2)), _col46 (type: decimal(7,2)), _col58 (type: int), _col4 (type: int), _col70 (type: decimal(7,2)), _col49 (type: decimal(7,2)), _col5 (type: int), _col27 (type: string), _col40 (type: decimal(7,2)), _col13 (type: decimal(19,2)), _col26 (type: bigint), _col12 (type: decimal(7,2)), _col34 (type: int), _col38 (type: int), _col32 (type: int), _col66 (type: decimal(7,2)), _col65 (type: decimal(7,2)), _col16 (type: decimal(18,2)), _col74 (type: int), _col15 (type: decimal(18,2)), _col18 (type: decimal(7,2)), _col9 (type: int), _col52 (type: int), _col36 (type: int), _col64 (type: decimal(7,2)), _col31 (type: int), _col0 (type: int), _col28 (type: bigint), _col73 (type: decimal(7,2)), _col39 (type: decimal(7,2)), _col50 (type: decimal(7,2)), _col54 (type: int), _col59 (type: int), _col68 (type: decimal(7,2)), _col41 (type: decimal(7,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col17, _col18, _col19, _col20, _col21, _col22, _col23, _col24, _col25, _col26, _col27, _col28, _col29, _col30, _col31, _col32, _col33, _col34, _col35, _col36, _col37, _col38, _col39, _col40, _col41, _col42, _col43, _col44, _col45, _col46, _col47, _col48, _col49, _col50, _col51, _col52, _col53, _col54, _col55, _col56, _col57, _col58, _col59, _col60, _col61, _col62, _col63, _col64, _col65, _col66, _col67, _col68, _col69, _col70, _col71 Statistics: Num rows: 20751113 Data size: 28914547747 Basic stats: COMPLETE Column stats: NONE Filter Operator predicate: ((_col34 = _col27) and (_col68 = _col17) and (_col55 = 2451181) and (floor((_col27 / 1000)) * 1000) BETWEEN 1000 AND 2000 and (_col46 < 0) and _col53 is null) (type: boolean) Statistics: Num rows: 48034 Data size: 66930452 Basic stats: COMPLETE Column stats: NONE Select Operator expressions: _col5 (type: int), _col47 (type: bigint), _col44 (type: string), _col64 (type: bigint), _col20 (type: int), _col10 (type: int), _col62 (type: int), _col51 (type: int), _col18 (type: int), _col49 (type: int), _col30 (type: int), _col60 (type: int), _col11 (type: bigint), _col50 (type: int), _col66 (type: decimal(7,2)), _col45 (type: decimal(7,2)), _col71 (type: decimal(7,2)), _col12 (type: decimal(7,2)), _col24 (type: decimal(7,2)), _col31 (type: decimal(7,2)), _col35 (type: decimal(7,2)), _col38 (type: decimal(7,2)), _col37 (type: decimal(7,2)), _col22 (type: decimal(7,2)), _col42 (type: decimal(7,2)), _col67 (type: decimal(7,2)), _col8 (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col17, _col18, _col19, _col20, _col21, _col22, _col23, _col24, _col25, _col26 Statistics: Num rows: 48034 Data size: 66930452 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator key expressions: _col0 (type: int), _col1 (type: bigint), _col2 (type: string), _col3 (type: bigint) null sort order: zzzz sort order: ++++ Statistics: Num rows: 48034 Data size: 66930452 Basic stats: COMPLETE Column stats: NONE value expressions: _col4 (type: int), _col5 (type: int), _col6 (type: int), _col7 (type: int), _col8 (type: int), _col9 (type: int), _col10 (type: int), _col11 (type: int), _col12 (type: bigint), _col13 (type: int), _col14 (type: decimal(7,2)), _col15 (type: decimal(7,2)), _col16 (type: decimal(7,2)), _col17 (type: decimal(7,2)), _col18 (type: decimal(7,2)), _col19 (type: decimal(7,2)), _col20 (type: decimal(7,2)), _col21 (type: decimal(7,2)), _col22 (type: decimal(7,2)), _col23 (type: decimal(7,2)), _col24 (type: decimal(7,2)), _col25 (type: decimal(7,2)), _col26 (type: int) Filter Operator predicate: ((_col34 = _col27) and (_col68 = _col17) and (_col55 = 2451181) and (floor((_col27 / 1000)) * 1000) BETWEEN 1000 AND 2000 and (_col46 < 0) and _col53 is null) (type: boolean) Statistics: Num rows: 48034 Data size: 66930452 Basic stats: COMPLETE Column stats: NONE Select Operator expressions: _col59 (type: int), _col34 (type: int), _col68 (type: int), _col2 (type: int), _col21 (type: int), _col33 (type: int), _col39 (type: int), _col69 (type: int), _col14 (type: bigint), _col3 (type: int), _col0 (type: decimal(7,2)), _col36 (type: decimal(7,2)), _col61 (type: decimal(7,2)), 0 (type: decimal(7,2)), _col52 (type: decimal(7,2)), _col26 (type: decimal(7,2)), _col70 (type: decimal(7,2)), _col28 (type: decimal(7,2)), _col41 (type: decimal(7,2)), _col13 (type: decimal(7,2)), _col16 (type: decimal(7,2)), _col65 (type: decimal(7,2)), 2451181 (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col17, _col18, _col19, _col20, _col21, _col22 Statistics: Num rows: 48034 Data size: 66930452 Basic stats: COMPLETE Column stats: NONE File Output Operator compressed: false Statistics: Num rows: 48034 Data size: 66930452 Basic stats: COMPLETE Column stats: NONE table: input format: org.apache.iceberg.mr.hive.HiveIcebergInputFormat output format: org.apache.iceberg.mr.hive.HiveIcebergOutputFormat serde: org.apache.iceberg.mr.hive.HiveIcebergSerDe name: tpcds_1000_iceberg_mor_v4.store_sales_delete_1 Filter Operator predicate: (_col34 is null and _col68 is null and _col55 is null) (type: boolean) Statistics: Num rows: 2593889 Data size: 3614318294 Basic stats: COMPLETE Column stats: NONE Select Operator expressions: _col63 (type: int), _col27 (type: int), _col17 (type: int), _col7 (type: int), _col40 (type: int), _col43 (type: int), _col15 (type: int), _col6 (type: int), UDFToLong(_col32) (type: bigint), _col58 (type: int), _col9 (type: decimal(7,2)), _col19 (type: decimal(7,2)), _col48 (type: decimal(7,2)), CAST( _col46 AS decimal(7,2)) (type: decimal(7,2)), CAST( _col25 AS decimal(7,2)) (type: decimal(7,2)), CAST( _col56 AS decimal(7,2)) (type: decimal(7,2)), CAST( _col54 AS decimal(7,2)) (type: decimal(7,2)), CAST( _col23 AS decimal(7,2)) (type: decimal(7,2)), _col57 (type: decimal(7,2)), CAST( _col1 AS decimal(7,2)) (type: decimal(7,2)), CAST( _col29 AS decimal(7,2)) (type: decimal(7,2)), CAST( _col4 AS decimal(7,2)) (type: decimal(7,2)), 2451181 (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col17, _col18, _col19, _col20, _col21, _col22 Statistics: Num rows: 2593889 Data size: 3614318294 Basic stats: COMPLETE Column stats: NONE File Output Operator compressed: false Statistics: Num rows: 2593889 Data size: 3614318294 Basic stats: COMPLETE Column stats: NONE table: input format: org.apache.iceberg.mr.hive.HiveIcebergInputFormat output format: org.apache.iceberg.mr.hive.HiveIcebergOutputFormat serde: org.apache.iceberg.mr.hive.HiveIcebergSerDe name: tpcds_1000_iceberg_mor_v4.store_sales_delete_1 Filter Operator predicate: ((_col34 = _col27) and (_col68 = _col17) and (_col55 = 2451181) and (floor((_col27 / 1000)) * 1000) BETWEEN 1000 AND 2000 and (_col46 < 0)) (type: boolean) Statistics: Num rows: 96069 Data size: 133862298 Basic stats: COMPLETE Column stats: NONE Select Operator expressions: _col5 (type: int), _col44 (type: string), _col47 (type: bigint), _col64 (type: bigint) outputColumnNames: _col5, _col44, _col47, _col64 Statistics: Num rows: 96069 Data size: 133862298 Basic stats: COMPLETE Column stats: NONE Group By Operator aggregations: count() keys: _col5 (type: int), _col47 (type: bigint), _col44 (type: string), _col64 (type: bigint) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4 Statistics: Num rows: 96069 Data size: 133862298 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator key expressions: _col0 (type: int), _col1 (type: bigint), _col2 (type: string), _col3 (type: bigint) null sort order: aaaa sort order: ++++ Map-reduce partition columns: _col0 (type: int), _col1 (type: bigint), _col2 (type: string), _col3 (type: bigint) Statistics: Num rows: 96069 Data size: 133862298 Basic stats: COMPLETE Column stats: NONE value expressions: _col4 (type: bigint) Reducer 3 Execution mode: vectorized, llap Reduce Vectorization: enabled: true enableConditionsMet: hive.vectorized.execution.reduce.enabled IS true, hive.execution.engine tez IN [tez] IS true reduceColumnNullOrder: zzzz reduceColumnSortOrder: ++++ allNative: false usesVectorUDFAdaptor: false vectorized: true rowBatchContext: dataColumnCount: 27 dataColumns: KEY.reducesinkkey0:int, KEY.reducesinkkey1:bigint, KEY.reducesinkkey2:string, KEY.reducesinkkey3:bigint, VALUE._col0:int, VALUE._col1:int, VALUE._col2:int, VALUE._col3:int, VALUE._col4:int, VALUE._col5:int, VALUE._col6:int, VALUE._col7:int, VALUE._col8:bigint, VALUE._col9:int, VALUE._col10:decimal(7,2)/DECIMAL_64, VALUE._col11:decimal(7,2)/DECIMAL_64, VALUE._col12:decimal(7,2)/DECIMAL_64, VALUE._col13:decimal(7,2)/DECIMAL_64, VALUE._col14:decimal(7,2)/DECIMAL_64, VALUE._col15:decimal(7,2)/DECIMAL_64, VALUE._col16:decimal(7,2)/DECIMAL_64, VALUE._col17:decimal(7,2)/DECIMAL_64, VALUE._col18:decimal(7,2)/DECIMAL_64, VALUE._col19:decimal(7,2)/DECIMAL_64, VALUE._col20:decimal(7,2)/DECIMAL_64, VALUE._col21:decimal(7,2)/DECIMAL_64, VALUE._col22:int partitionColumnCount: 0 scratchColumnTypeNames: [] Reduce Operator Tree: Select Operator expressions: KEY.reducesinkkey0 (type: int), KEY.reducesinkkey1 (type: bigint), KEY.reducesinkkey2 (type: string), KEY.reducesinkkey3 (type: bigint), VALUE._col0 (type: int), VALUE._col1 (type: int), VALUE._col2 (type: int), VALUE._col3 (type: int), VALUE._col4 (type: int), VALUE._col5 (type: int), VALUE._col6 (type: int), VALUE._col7 (type: int), VALUE._col8 (type: bigint), VALUE._col9 (type: int), VALUE._col10 (type: decimal(7,2)), VALUE._col11 (type: decimal(7,2)), VALUE._col12 (type: decimal(7,2)), VALUE._col13 (type: decimal(7,2)), VALUE._col14 (type: decimal(7,2)), VALUE._col15 (type: decimal(7,2)), VALUE._col16 (type: decimal(7,2)), VALUE._col17 (type: decimal(7,2)), VALUE._col18 (type: decimal(7,2)), VALUE._col19 (type: decimal(7,2)), VALUE._col20 (type: decimal(7,2)), VALUE._col21 (type: decimal(7,2)), VALUE._col22 (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col17, _col18, _col19, _col20, _col21, _col22, _col23, _col24, _col25, _col26 Select Vectorization: className: VectorSelectOperator native: true projectedOutputColumnNums: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26] Statistics: Num rows: 48034 Data size: 66930452 Basic stats: COMPLETE Column stats: NONE File Output Operator compressed: false File Sink Vectorization: className: VectorFileSinkOperator native: false Statistics: Num rows: 48034 Data size: 66930452 Basic stats: COMPLETE Column stats: NONE table: input format: org.apache.iceberg.mr.hive.HiveIcebergInputFormat output format: org.apache.iceberg.mr.hive.HiveIcebergOutputFormat serde: org.apache.iceberg.mr.hive.HiveIcebergSerDe name: tpcds_1000_iceberg_mor_v4.store_sales_delete_1 Reducer 4 Execution mode: vectorized, llap Reduce Vectorization: enabled: true enableConditionsMet: hive.vectorized.execution.reduce.enabled IS true, hive.execution.engine tez IN [tez] IS true reduceColumnNullOrder: aaaa reduceColumnSortOrder: ++++ allNative: false usesVectorUDFAdaptor: true vectorized: true rowBatchContext: dataColumnCount: 5 dataColumns: KEY._col0:int, KEY._col1:bigint, KEY._col2:string, KEY._col3:bigint, VALUE._col0:bigint partitionColumnCount: 0 scratchColumnTypeNames: [] Reduce Operator Tree: Group By Operator aggregations: count(VALUE._col0) Group By Vectorization: aggregators: VectorUDAFCountMerge(col 4:bigint) -> bigint className: VectorGroupByOperator groupByMode: MERGEPARTIAL keyExpressions: col 0:int, col 1:bigint, col 2:string, col 3:bigint native: false vectorProcessingMode: MERGE_PARTIAL projectedOutputColumnNums: [0] keys: KEY._col0 (type: int), KEY._col1 (type: bigint), KEY._col2 (type: string), KEY._col3 (type: bigint) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4 Statistics: Num rows: 48034 Data size: 66930452 Basic stats: COMPLETE Column stats: NONE Filter Operator Filter Vectorization: className: VectorFilterOperator native: true predicateExpression: FilterLongColGreaterLongScalar(col 4:bigint, val 1) predicate: (_col4 > 1L) (type: boolean) Statistics: Num rows: 16011 Data size: 22309686 Basic stats: COMPLETE Column stats: NONE Select Operator expressions: cardinality_violation(_col0,_col1,_col2,_col3) (type: int) outputColumnNames: _col0 Select Vectorization: className: VectorSelectOperator native: true projectedOutputColumnNums: [5] selectExpressions: VectorUDFAdaptor(cardinality_violation(_col0,_col1,_col2,_col3)) -> 5:int Statistics: Num rows: 16011 Data size: 22309686 Basic stats: COMPLETE Column stats: NONE File Output Operator compressed: false File Sink Vectorization: className: VectorFileSinkOperator native: false Statistics: Num rows: 16011 Data size: 22309686 Basic stats: COMPLETE Column stats: NONE table: input format: org.apache.hadoop.mapred.TextInputFormat output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe name: tpcds_1000_iceberg_mor_v4.merge_tmp_table Stage: Stage-5 Dependency Collection Stage: Stage-0 Move Operator tables: replace: false table: input format: org.apache.iceberg.mr.hive.HiveIcebergInputFormat output format: org.apache.iceberg.mr.hive.HiveIcebergOutputFormat serde: org.apache.iceberg.mr.hive.HiveIcebergSerDe name: tpcds_1000_iceberg_mor_v4.store_sales_delete_1 Stage: Stage-6 Stats Work Basic Stats Work: Stage: Stage-3 Move Operator tables: replace: false table: input format: org.apache.hadoop.mapred.TextInputFormat output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe name: tpcds_1000_iceberg_mor_v4.merge_tmp_table Stage: Stage-7 Stats Work Basic Stats Work: 311 rows selected (0.57 seconds)