diff --git ql/src/test/results/clientpositive/autoColumnStats_2.q.out ql/src/test/results/clientpositive/autoColumnStats_2.q.out index b209ff0..b1161b5 100644 --- ql/src/test/results/clientpositive/autoColumnStats_2.q.out +++ ql/src/test/results/clientpositive/autoColumnStats_2.q.out @@ -129,7 +129,7 @@ data_type string min max num_nulls 0 -distinct_count 309 +distinct_count 316 avg_col_len 2.812 max_col_len 3 num_trues @@ -148,7 +148,7 @@ data_type string min max num_nulls 0 -distinct_count 309 +distinct_count 316 avg_col_len 2.812 max_col_len 3 num_trues @@ -253,7 +253,7 @@ data_type string min max num_nulls 0 -distinct_count 309 +distinct_count 316 avg_col_len 2.812 max_col_len 3 num_trues @@ -272,7 +272,7 @@ data_type string min max num_nulls 0 -distinct_count 309 +distinct_count 307 avg_col_len 6.812 max_col_len 7 num_trues @@ -301,7 +301,7 @@ data_type string min max num_nulls 10 -distinct_count 309 +distinct_count 316 avg_col_len 2.812 max_col_len 3 num_trues @@ -320,7 +320,7 @@ data_type string min max num_nulls 10 -distinct_count 309 +distinct_count 307 avg_col_len 6.812 max_col_len 7 num_trues @@ -349,7 +349,7 @@ data_type string min max num_nulls 20 -distinct_count 309 +distinct_count 316 avg_col_len 2.812 max_col_len 3 num_trues @@ -368,7 +368,7 @@ data_type string min max num_nulls 10 -distinct_count 319 +distinct_count 316 avg_col_len 8.0 max_col_len 8 num_trues diff --git ql/src/test/results/clientpositive/autoColumnStats_9.q.out ql/src/test/results/clientpositive/autoColumnStats_9.q.out index 0dfcf04..3466936 100644 --- ql/src/test/results/clientpositive/autoColumnStats_9.q.out +++ ql/src/test/results/clientpositive/autoColumnStats_9.q.out @@ -251,7 +251,7 @@ data_type int min 0 max 498 num_nulls 0 -distinct_count 309 +distinct_count 303 avg_col_len max_col_len num_trues @@ -270,7 +270,7 @@ data_type string min max num_nulls 0 -distinct_count 309 +distinct_count 307 avg_col_len 6.834630350194552 max_col_len 7 num_trues diff --git 
ql/src/test/results/clientpositive/bitvector.q.out ql/src/test/results/clientpositive/bitvector.q.out index 1e0284f..e310ebe 100644 --- ql/src/test/results/clientpositive/bitvector.q.out +++ ql/src/test/results/clientpositive/bitvector.q.out @@ -9,7 +9,7 @@ data_type string min max num_nulls 0 -distinct_count 309 +distinct_count 316 avg_col_len 2.812 max_col_len 3 num_trues diff --git ql/src/test/results/clientpositive/compute_stats_date.q.out ql/src/test/results/clientpositive/compute_stats_date.q.out index 796b3d3..89c2128 100644 --- ql/src/test/results/clientpositive/compute_stats_date.q.out +++ ql/src/test/results/clientpositive/compute_stats_date.q.out @@ -43,7 +43,7 @@ POSTHOOK: query: select compute_stats(fl_date, 'hll') from tab_date POSTHOOK: type: QUERY POSTHOOK: Input: default@tab_date #### A masked pattern was here #### -{"columntype":"Date","min":"2000-11-20","max":"2010-10-29","countnulls":0,"numdistinctvalues":19,"ndvbitvector":HLL�ê����!���]����������������Y���T��P��R������W��� �ĈN������������} +{"columntype":"Date","min":"2000-11-20","max":"2010-10-29","countnulls":0,"numdistinctvalues":19,"ndvbitvector":HLL�Ǫ����!���]����������������Y���T���P��R������W��� �ĈN������������} PREHOOK: query: explain analyze table tab_date compute statistics for columns fl_date PREHOOK: type: QUERY diff --git ql/src/test/results/clientpositive/confirm_initial_tbl_stats.q.out ql/src/test/results/clientpositive/confirm_initial_tbl_stats.q.out index a900194..846b600 100644 --- ql/src/test/results/clientpositive/confirm_initial_tbl_stats.q.out +++ ql/src/test/results/clientpositive/confirm_initial_tbl_stats.q.out @@ -19,7 +19,7 @@ data_type string min max num_nulls 0 -distinct_count 309 +distinct_count 316 avg_col_len 2.812 max_col_len 3 num_trues @@ -105,7 +105,7 @@ data_type string min max num_nulls 0 -distinct_count 309 +distinct_count 307 avg_col_len 6.812 max_col_len 7 num_trues @@ -134,7 +134,7 @@ data_type string min max num_nulls 0 -distinct_count 430 
+distinct_count 431 avg_col_len 6.802 max_col_len 7 num_trues @@ -163,7 +163,7 @@ data_type string min max num_nulls 0 -distinct_count 309 +distinct_count 307 avg_col_len 6.812 max_col_len 7 num_trues @@ -199,7 +199,7 @@ data_type string min max num_nulls 0 -distinct_count 309 +distinct_count 316 avg_col_len 2.812 max_col_len 3 num_trues diff --git ql/src/test/results/clientpositive/cross_join_merge.q.out ql/src/test/results/clientpositive/cross_join_merge.q.out index 7241dfe..f4956de 100644 --- ql/src/test/results/clientpositive/cross_join_merge.q.out +++ ql/src/test/results/clientpositive/cross_join_merge.q.out @@ -233,7 +233,7 @@ STAGE PLANS: Processor Tree: ListSink -Warning: Shuffle Join JOIN[11][tables = [$hdt$_0, $hdt$_1]] in Stage 'Stage-1:MAPRED' is a cross product +Warning: Shuffle Join JOIN[14][tables = [$hdt$_0, $hdt$_1, $hdt$_2]] in Stage 'Stage-2:MAPRED' is a cross product PREHOOK: query: explain select src1.key from src src1 join src src2 on 5 = src2.key join src src3 on src1.key=src3.key PREHOOK: type: QUERY @@ -250,7 +250,7 @@ STAGE PLANS: Map Reduce Map Operator Tree: TableScan - alias: src3 + alias: src1 Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Filter Operator predicate: key is not null (type: boolean) @@ -260,29 +260,34 @@ STAGE PLANS: outputColumnNames: _col0 Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator - sort order: + key expressions: _col0 (type: string) + sort order: + + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - value expressions: _col0 (type: string) TableScan - alias: src2 + alias: src3 Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Filter Operator - predicate: (5.0 = UDFToDouble(key)) (type: boolean) - Statistics: Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE + predicate: key is not 
null (type: boolean) + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Select Operator - Statistics: Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE + expressions: key (type: string) + outputColumnNames: _col0 + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator - sort order: - Statistics: Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE + key expressions: _col0 (type: string) + sort order: + + Map-reduce partition columns: _col0 (type: string) + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Reduce Operator Tree: Join Operator condition map: Inner Join 0 to 1 keys: - 0 - 1 + 0 _col0 (type: string) + 1 _col0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 125000 Data size: 2781000 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE File Output Operator compressed: false table: @@ -295,45 +300,36 @@ STAGE PLANS: Map Operator Tree: TableScan Reduce Output Operator - key expressions: _col0 (type: string) - sort order: + - Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 125000 Data size: 2781000 Basic stats: COMPLETE Column stats: NONE + sort order: + Statistics: Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE + value expressions: _col0 (type: string) TableScan - alias: src1 + alias: src2 Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Filter Operator - predicate: key is not null (type: boolean) - Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + predicate: (5.0 = UDFToDouble(key)) (type: boolean) + Statistics: Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE Select Operator - expressions: key (type: string) - outputColumnNames: _col0 - Statistics: Num rows: 500 Data size: 
5312 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator - key expressions: _col0 (type: string) - sort order: + - Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + sort order: + Statistics: Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE Reduce Operator Tree: Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col0 (type: string) - 1 _col0 (type: string) - outputColumnNames: _col2 - Statistics: Num rows: 137500 Data size: 3059100 Basic stats: COMPLETE Column stats: NONE - Select Operator - expressions: _col2 (type: string) - outputColumnNames: _col0 - Statistics: Num rows: 137500 Data size: 3059100 Basic stats: COMPLETE Column stats: NONE - File Output Operator - compressed: false - Statistics: Num rows: 137500 Data size: 3059100 Basic stats: COMPLETE Column stats: NONE - table: - input format: org.apache.hadoop.mapred.SequenceFileInputFormat - output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat - serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + 0 + 1 + outputColumnNames: _col0 + Statistics: Num rows: 137500 Data size: 3059050 Basic stats: COMPLETE Column stats: NONE + File Output Operator + compressed: false + Statistics: Num rows: 137500 Data size: 3059050 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.mapred.SequenceFileInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe Stage: Stage-0 Fetch Operator diff --git ql/src/test/results/clientpositive/describe_table.q.out ql/src/test/results/clientpositive/describe_table.q.out index 8f7d0f6..5657eb1 100644 --- ql/src/test/results/clientpositive/describe_table.q.out +++ ql/src/test/results/clientpositive/describe_table.q.out @@ -205,7 +205,7 @@ 
data_type string min max num_nulls 0 -distinct_count 309 +distinct_count 316 avg_col_len 2.812 max_col_len 3 num_trues @@ -302,7 +302,7 @@ data_type string min max num_nulls 0 -distinct_count 309 +distinct_count 316 avg_col_len 2.812 max_col_len 3 num_trues diff --git ql/src/test/results/clientpositive/encrypted/encryption_move_tbl.q.out ql/src/test/results/clientpositive/encrypted/encryption_move_tbl.q.out index 4eee575..5d7e2cb 100644 --- ql/src/test/results/clientpositive/encrypted/encryption_move_tbl.q.out +++ ql/src/test/results/clientpositive/encrypted/encryption_move_tbl.q.out @@ -66,7 +66,7 @@ data_type int min 0 max 498 num_nulls 0 -distinct_count 309 +distinct_count 303 avg_col_len max_col_len num_trues @@ -85,7 +85,7 @@ data_type string min max num_nulls 0 -distinct_count 309 +distinct_count 307 avg_col_len 6.812 max_col_len 7 num_trues @@ -117,7 +117,7 @@ data_type int min 0 max 498 num_nulls 0 -distinct_count 309 +distinct_count 303 avg_col_len max_col_len num_trues @@ -136,7 +136,7 @@ data_type string min max num_nulls 0 -distinct_count 309 +distinct_count 307 avg_col_len 6.812 max_col_len 7 num_trues diff --git ql/src/test/results/clientpositive/hll.q.out ql/src/test/results/clientpositive/hll.q.out index 3b90b56..0c80e7e 100644 --- ql/src/test/results/clientpositive/hll.q.out +++ ql/src/test/results/clientpositive/hll.q.out @@ -182,7 +182,7 @@ data_type int min 0 max 498 num_nulls 0 -distinct_count 309 +distinct_count 303 avg_col_len max_col_len num_trues @@ -236,7 +236,7 @@ data_type double min 0.0 max 498.0 num_nulls 0 -distinct_count 309 +distinct_count 316 avg_col_len max_col_len num_trues @@ -290,7 +290,7 @@ data_type decimal(10,0) min 0 max 498 num_nulls 0 -distinct_count 309 +distinct_count 316 avg_col_len max_col_len num_trues diff --git ql/src/test/results/clientpositive/llap/acid_no_buckets.q.out ql/src/test/results/clientpositive/llap/acid_no_buckets.q.out index 9b83fad..a0cfbb4 100644 --- 
ql/src/test/results/clientpositive/llap/acid_no_buckets.q.out +++ ql/src/test/results/clientpositive/llap/acid_no_buckets.q.out @@ -302,15 +302,15 @@ STAGE PLANS: Statistics: Num rows: 2015 Data size: 916825 Basic stats: COMPLETE Column stats: PARTIAL Filter Operator predicate: (key) IN ('1001', '213', '43') (type: boolean) - Statistics: Num rows: 20 Data size: 9100 Basic stats: COMPLETE Column stats: PARTIAL + Statistics: Num rows: 19 Data size: 8645 Basic stats: COMPLETE Column stats: PARTIAL Select Operator expressions: ROW__ID (type: struct), ds (type: string), hr (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 20 Data size: 8880 Basic stats: COMPLETE Column stats: PARTIAL + Statistics: Num rows: 19 Data size: 8436 Basic stats: COMPLETE Column stats: PARTIAL Reduce Output Operator key expressions: _col0 (type: struct) sort order: + - Statistics: Num rows: 20 Data size: 8880 Basic stats: COMPLETE Column stats: PARTIAL + Statistics: Num rows: 19 Data size: 8436 Basic stats: COMPLETE Column stats: PARTIAL value expressions: _col1 (type: string), _col2 (type: string) Execution mode: llap LLAP IO: may be used (ACID table) @@ -320,10 +320,10 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: struct), VALUE._col0 (type: string), VALUE._col1 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 20 Data size: 8880 Basic stats: COMPLETE Column stats: PARTIAL + Statistics: Num rows: 19 Data size: 8436 Basic stats: COMPLETE Column stats: PARTIAL File Output Operator compressed: false - Statistics: Num rows: 20 Data size: 8880 Basic stats: COMPLETE Column stats: PARTIAL + Statistics: Num rows: 19 Data size: 8436 Basic stats: COMPLETE Column stats: PARTIAL table: input format: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat output format: org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat @@ -800,16 +800,16 @@ STAGE PLANS: Statistics: Num rows: 2015 Data size: 916825 Basic stats: COMPLETE Column stats: 
PARTIAL Filter Operator predicate: (key) IN ('1001', '213', '43') (type: boolean) - Statistics: Num rows: 20 Data size: 9100 Basic stats: COMPLETE Column stats: PARTIAL + Statistics: Num rows: 19 Data size: 8645 Basic stats: COMPLETE Column stats: PARTIAL Select Operator expressions: ROW__ID (type: struct), ds (type: string), hr (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 20 Data size: 8880 Basic stats: COMPLETE Column stats: PARTIAL + Statistics: Num rows: 19 Data size: 8436 Basic stats: COMPLETE Column stats: PARTIAL Reduce Output Operator key expressions: _col0 (type: struct) sort order: + Map-reduce partition columns: UDFToInteger(_col0) (type: int) - Statistics: Num rows: 20 Data size: 8880 Basic stats: COMPLETE Column stats: PARTIAL + Statistics: Num rows: 19 Data size: 8436 Basic stats: COMPLETE Column stats: PARTIAL value expressions: _col1 (type: string), _col2 (type: string) Execution mode: llap LLAP IO: may be used (ACID table) @@ -819,10 +819,10 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: struct), VALUE._col0 (type: string), VALUE._col1 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 20 Data size: 8880 Basic stats: COMPLETE Column stats: PARTIAL + Statistics: Num rows: 19 Data size: 8436 Basic stats: COMPLETE Column stats: PARTIAL File Output Operator compressed: false - Statistics: Num rows: 20 Data size: 8880 Basic stats: COMPLETE Column stats: PARTIAL + Statistics: Num rows: 19 Data size: 8436 Basic stats: COMPLETE Column stats: PARTIAL table: input format: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat output format: org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat diff --git ql/src/test/results/clientpositive/llap/autoColumnStats_2.q.out ql/src/test/results/clientpositive/llap/autoColumnStats_2.q.out index 0cc0c05..1bf1dff 100644 --- ql/src/test/results/clientpositive/llap/autoColumnStats_2.q.out +++ 
ql/src/test/results/clientpositive/llap/autoColumnStats_2.q.out @@ -127,7 +127,7 @@ data_type string min max num_nulls 0 -distinct_count 309 +distinct_count 316 avg_col_len 2.812 max_col_len 3 num_trues @@ -146,7 +146,7 @@ data_type string min max num_nulls 0 -distinct_count 309 +distinct_count 316 avg_col_len 2.812 max_col_len 3 num_trues @@ -251,7 +251,7 @@ data_type string min max num_nulls 0 -distinct_count 309 +distinct_count 316 avg_col_len 2.812 max_col_len 3 num_trues @@ -270,7 +270,7 @@ data_type string min max num_nulls 0 -distinct_count 309 +distinct_count 307 avg_col_len 6.812 max_col_len 7 num_trues @@ -299,7 +299,7 @@ data_type string min max num_nulls 10 -distinct_count 309 +distinct_count 316 avg_col_len 2.812 max_col_len 3 num_trues @@ -318,7 +318,7 @@ data_type string min max num_nulls 10 -distinct_count 309 +distinct_count 307 avg_col_len 6.812 max_col_len 7 num_trues @@ -347,7 +347,7 @@ data_type string min max num_nulls 20 -distinct_count 309 +distinct_count 316 avg_col_len 2.812 max_col_len 3 num_trues @@ -366,7 +366,7 @@ data_type string min max num_nulls 10 -distinct_count 319 +distinct_count 316 avg_col_len 8.0 max_col_len 8 num_trues diff --git ql/src/test/results/clientpositive/llap/auto_join1.q.out ql/src/test/results/clientpositive/llap/auto_join1.q.out index bbe63e2..aff06aa 100644 --- ql/src/test/results/clientpositive/llap/auto_join1.q.out +++ ql/src/test/results/clientpositive/llap/auto_join1.q.out @@ -68,14 +68,14 @@ STAGE PLANS: outputColumnNames: _col0, _col2 input vertices: 0 Map 1 - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: UDFToInteger(_col0) (type: int), _col2 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 809 Data size: 76855 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 75145 Basic stats: COMPLETE 
Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 809 Data size: 76855 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 75145 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.TextInputFormat output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat diff --git ql/src/test/results/clientpositive/llap/auto_join21.q.out ql/src/test/results/clientpositive/llap/auto_join21.q.out index 4956af4..e79e3a9 100644 --- ql/src/test/results/clientpositive/llap/auto_join21.q.out +++ ql/src/test/results/clientpositive/llap/auto_join21.q.out @@ -75,25 +75,25 @@ STAGE PLANS: 1 key (type: string) 2 key (type: string) outputColumnNames: _col0, _col1, _col5, _col6, _col10, _col11 - Statistics: Num rows: 434 Data size: 231756 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 415 Data size: 221610 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string), _col1 (type: string), _col5 (type: string), _col6 (type: string), _col10 (type: string), _col11 (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 434 Data size: 231756 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 415 Data size: 221610 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string) sort order: ++++++ - Statistics: Num rows: 434 Data size: 231756 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 415 Data size: 221610 Basic stats: COMPLETE Column stats: COMPLETE Reducer 3 Execution mode: llap Reduce Operator Tree: Select Operator expressions: KEY.reducesinkkey0 (type: string), KEY.reducesinkkey1 (type: string), KEY.reducesinkkey2 (type: string), KEY.reducesinkkey3 (type: string), KEY.reducesinkkey4 
(type: string), KEY.reducesinkkey5 (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 434 Data size: 231756 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 415 Data size: 221610 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 434 Data size: 231756 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 415 Data size: 221610 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat diff --git ql/src/test/results/clientpositive/llap/auto_join29.q.out ql/src/test/results/clientpositive/llap/auto_join29.q.out index 3fb3184..c8fd93f 100644 --- ql/src/test/results/clientpositive/llap/auto_join29.q.out +++ ql/src/test/results/clientpositive/llap/auto_join29.q.out @@ -75,25 +75,25 @@ STAGE PLANS: 1 key (type: string) 2 key (type: string) outputColumnNames: _col0, _col1, _col5, _col6, _col10, _col11 - Statistics: Num rows: 434 Data size: 231756 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 415 Data size: 221610 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string), _col1 (type: string), _col5 (type: string), _col6 (type: string), _col10 (type: string), _col11 (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 434 Data size: 231756 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 415 Data size: 221610 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string) sort order: ++++++ - Statistics: Num rows: 434 Data size: 231756 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 415 Data size: 221610 Basic stats: 
COMPLETE Column stats: COMPLETE Reducer 3 Execution mode: llap Reduce Operator Tree: Select Operator expressions: KEY.reducesinkkey0 (type: string), KEY.reducesinkkey1 (type: string), KEY.reducesinkkey2 (type: string), KEY.reducesinkkey3 (type: string), KEY.reducesinkkey4 (type: string), KEY.reducesinkkey5 (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 434 Data size: 231756 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 415 Data size: 221610 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 434 Data size: 231756 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 415 Data size: 221610 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -693,25 +693,25 @@ STAGE PLANS: 1 key (type: string) 2 key (type: string) outputColumnNames: _col0, _col1, _col5, _col6, _col10, _col11 - Statistics: Num rows: 143 Data size: 76362 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 137 Data size: 73158 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string), _col1 (type: string), _col5 (type: string), _col6 (type: string), _col10 (type: string), _col11 (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 143 Data size: 76362 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 137 Data size: 73158 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string) sort order: ++++++ - Statistics: Num rows: 143 Data size: 76362 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 137 Data size: 73158 Basic stats: COMPLETE 
Column stats: COMPLETE Reducer 3 Execution mode: llap Reduce Operator Tree: Select Operator expressions: KEY.reducesinkkey0 (type: string), KEY.reducesinkkey1 (type: string), KEY.reducesinkkey2 (type: string), KEY.reducesinkkey3 (type: string), KEY.reducesinkkey4 (type: string), KEY.reducesinkkey5 (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 143 Data size: 76362 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 137 Data size: 73158 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 143 Data size: 76362 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 137 Data size: 73158 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -1311,25 +1311,25 @@ STAGE PLANS: 1 key (type: string) 2 key (type: string) outputColumnNames: _col0, _col1, _col5, _col6, _col10, _col11 - Statistics: Num rows: 432 Data size: 230688 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 415 Data size: 221610 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string), _col1 (type: string), _col5 (type: string), _col6 (type: string), _col10 (type: string), _col11 (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 432 Data size: 230688 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 415 Data size: 221610 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string) sort order: ++++++ - Statistics: Num rows: 432 Data size: 230688 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 415 Data size: 221610 Basic stats: COMPLETE Column 
stats: COMPLETE Reducer 3 Execution mode: llap Reduce Operator Tree: Select Operator expressions: KEY.reducesinkkey0 (type: string), KEY.reducesinkkey1 (type: string), KEY.reducesinkkey2 (type: string), KEY.reducesinkkey3 (type: string), KEY.reducesinkkey4 (type: string), KEY.reducesinkkey5 (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 432 Data size: 230688 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 415 Data size: 221610 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 432 Data size: 230688 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 415 Data size: 221610 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -1938,25 +1938,25 @@ STAGE PLANS: 1 key (type: string) 2 key (type: string) outputColumnNames: _col0, _col1, _col5, _col6, _col10, _col11 - Statistics: Num rows: 434 Data size: 231756 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 415 Data size: 221610 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string), _col1 (type: string), _col5 (type: string), _col6 (type: string), _col10 (type: string), _col11 (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 434 Data size: 231756 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 415 Data size: 221610 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string) sort order: ++++++ - Statistics: Num rows: 434 Data size: 231756 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 415 Data size: 221610 Basic stats: COMPLETE Column 
stats: COMPLETE Reducer 3 Execution mode: llap Reduce Operator Tree: Select Operator expressions: KEY.reducesinkkey0 (type: string), KEY.reducesinkkey1 (type: string), KEY.reducesinkkey2 (type: string), KEY.reducesinkkey3 (type: string), KEY.reducesinkkey4 (type: string), KEY.reducesinkkey5 (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 434 Data size: 231756 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 415 Data size: 221610 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 434 Data size: 231756 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 415 Data size: 221610 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -2567,25 +2567,25 @@ STAGE PLANS: 1 key (type: string) 2 key (type: string) outputColumnNames: _col0, _col1, _col5, _col6, _col10, _col11 - Statistics: Num rows: 143 Data size: 76362 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 135 Data size: 72090 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string), _col1 (type: string), _col5 (type: string), _col6 (type: string), _col10 (type: string), _col11 (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 143 Data size: 76362 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 135 Data size: 72090 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string) sort order: ++++++ - Statistics: Num rows: 143 Data size: 76362 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 135 Data size: 72090 Basic stats: COMPLETE Column stats: 
COMPLETE Reducer 3 Execution mode: llap Reduce Operator Tree: Select Operator expressions: KEY.reducesinkkey0 (type: string), KEY.reducesinkkey1 (type: string), KEY.reducesinkkey2 (type: string), KEY.reducesinkkey3 (type: string), KEY.reducesinkkey4 (type: string), KEY.reducesinkkey5 (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 143 Data size: 76362 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 135 Data size: 72090 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 143 Data size: 76362 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 135 Data size: 72090 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -2685,25 +2685,25 @@ STAGE PLANS: 1 key (type: string) 2 key (type: string) outputColumnNames: _col0, _col1, _col5, _col6, _col10, _col11 - Statistics: Num rows: 143 Data size: 76362 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 136 Data size: 72624 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string), _col1 (type: string), _col5 (type: string), _col6 (type: string), _col10 (type: string), _col11 (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 143 Data size: 76362 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 136 Data size: 72624 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string) sort order: ++++++ - Statistics: Num rows: 143 Data size: 76362 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 136 Data size: 72624 Basic stats: COMPLETE Column stats: COMPLETE 
Reducer 3 Execution mode: llap Reduce Operator Tree: Select Operator expressions: KEY.reducesinkkey0 (type: string), KEY.reducesinkkey1 (type: string), KEY.reducesinkkey2 (type: string), KEY.reducesinkkey3 (type: string), KEY.reducesinkkey4 (type: string), KEY.reducesinkkey5 (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 143 Data size: 76362 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 136 Data size: 72624 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 143 Data size: 76362 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 136 Data size: 72624 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -3263,15 +3263,15 @@ STAGE PLANS: input vertices: 1 Map 3 2 Map 4 - Statistics: Num rows: 143 Data size: 76362 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 136 Data size: 72624 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string), _col1 (type: string), _col5 (type: string), _col6 (type: string), _col10 (type: string), _col11 (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 143 Data size: 76362 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 136 Data size: 72624 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string) sort order: ++++++ - Statistics: Num rows: 143 Data size: 76362 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 136 Data size: 72624 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: llap LLAP IO: no inputs Map 3 @@ -3312,10 +3312,10 @@ STAGE PLANS: 
Select Operator expressions: KEY.reducesinkkey0 (type: string), KEY.reducesinkkey1 (type: string), KEY.reducesinkkey2 (type: string), KEY.reducesinkkey3 (type: string), KEY.reducesinkkey4 (type: string), KEY.reducesinkkey5 (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 143 Data size: 76362 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 136 Data size: 72624 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 143 Data size: 76362 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 136 Data size: 72624 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -3394,15 +3394,15 @@ STAGE PLANS: input vertices: 0 Map 1 2 Map 4 - Statistics: Num rows: 431 Data size: 230154 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 414 Data size: 221076 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string), _col1 (type: string), _col5 (type: string), _col6 (type: string), _col10 (type: string), _col11 (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 431 Data size: 230154 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 414 Data size: 221076 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string) sort order: ++++++ - Statistics: Num rows: 431 Data size: 230154 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 414 Data size: 221076 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: llap LLAP IO: no inputs Map 4 @@ -3427,10 +3427,10 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 
(type: string), KEY.reducesinkkey1 (type: string), KEY.reducesinkkey2 (type: string), KEY.reducesinkkey3 (type: string), KEY.reducesinkkey4 (type: string), KEY.reducesinkkey5 (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 431 Data size: 230154 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 414 Data size: 221076 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 431 Data size: 230154 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 414 Data size: 221076 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -3511,15 +3511,15 @@ STAGE PLANS: input vertices: 1 Map 3 2 Map 4 - Statistics: Num rows: 143 Data size: 76362 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 135 Data size: 72090 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string), _col1 (type: string), _col5 (type: string), _col6 (type: string), _col10 (type: string), _col11 (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 143 Data size: 76362 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 135 Data size: 72090 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string) sort order: ++++++ - Statistics: Num rows: 143 Data size: 76362 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 135 Data size: 72090 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: llap LLAP IO: no inputs Map 3 @@ -3560,10 +3560,10 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: string), KEY.reducesinkkey1 (type: string), 
KEY.reducesinkkey2 (type: string), KEY.reducesinkkey3 (type: string), KEY.reducesinkkey4 (type: string), KEY.reducesinkkey5 (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 143 Data size: 76362 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 135 Data size: 72090 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 143 Data size: 76362 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 135 Data size: 72090 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat diff --git ql/src/test/results/clientpositive/llap/auto_join30.q.out ql/src/test/results/clientpositive/llap/auto_join30.q.out index e5f5fda..271f806 100644 --- ql/src/test/results/clientpositive/llap/auto_join30.q.out +++ ql/src/test/results/clientpositive/llap/auto_join30.q.out @@ -67,7 +67,7 @@ STAGE PLANS: outputColumnNames: _col2, _col3 input vertices: 0 Map 1 - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(hash(_col2,_col3)) mode: hash @@ -167,7 +167,7 @@ STAGE PLANS: outputColumnNames: _col2, _col3 input vertices: 1 Map 3 - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(hash(_col2,_col3)) mode: hash @@ -300,7 +300,7 @@ STAGE PLANS: outputColumnNames: _col2, _col3 input vertices: 0 Map 1 - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: 
sum(hash(_col2,_col3)) mode: hash @@ -431,7 +431,7 @@ STAGE PLANS: input vertices: 0 Map 1 2 Map 4 - Statistics: Num rows: 1309 Data size: 233002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1251 Data size: 222678 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(hash(_col2,_col3)) mode: hash @@ -605,7 +605,7 @@ STAGE PLANS: 1 _col0 (type: string) 2 _col0 (type: string) outputColumnNames: _col2, _col3 - Statistics: Num rows: 1309 Data size: 233002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1251 Data size: 222678 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(hash(_col2,_col3)) mode: hash @@ -758,7 +758,7 @@ STAGE PLANS: 1 _col0 (type: string) 2 _col0 (type: string) outputColumnNames: _col2, _col3 - Statistics: Num rows: 1309 Data size: 233002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1251 Data size: 222678 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(hash(_col2,_col3)) mode: hash @@ -911,7 +911,7 @@ STAGE PLANS: 1 _col0 (type: string) 2 _col0 (type: string) outputColumnNames: _col2, _col3 - Statistics: Num rows: 1309 Data size: 233002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1251 Data size: 222678 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(hash(_col2,_col3)) mode: hash @@ -1064,7 +1064,7 @@ STAGE PLANS: 1 _col0 (type: string) 2 _col0 (type: string) outputColumnNames: _col2, _col3 - Statistics: Num rows: 1309 Data size: 233002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1251 Data size: 222678 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(hash(_col2,_col3)) mode: hash diff --git ql/src/test/results/clientpositive/llap/bucket_map_join_tez1.q.out ql/src/test/results/clientpositive/llap/bucket_map_join_tez1.q.out index 808f4de..f94f719 100644 --- 
ql/src/test/results/clientpositive/llap/bucket_map_join_tez1.q.out +++ ql/src/test/results/clientpositive/llap/bucket_map_join_tez1.q.out @@ -235,25 +235,25 @@ STAGE PLANS: 0 _col0 (type: int) 1 _col0 (type: int) outputColumnNames: _col0, _col1, _col3 - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 74214 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: int), _col1 (type: string), _col3 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 74214 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int), _col1 (type: string), _col2 (type: string) sort order: +++ - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 74214 Basic stats: COMPLETE Column stats: COMPLETE Reducer 3 Execution mode: llap Reduce Operator Tree: Select Operator expressions: KEY.reducesinkkey0 (type: int), KEY.reducesinkkey1 (type: string), KEY.reducesinkkey2 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 74214 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 74214 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -823,15 +823,15 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col3 input vertices: 0 Map 1 - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + 
Statistics: Num rows: 399 Data size: 74214 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: int), _col1 (type: string), _col3 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 74214 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int), _col1 (type: string), _col2 (type: string) sort order: +++ - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 74214 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: llap LLAP IO: no inputs Reducer 3 @@ -840,10 +840,10 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: int), KEY.reducesinkkey1 (type: string), KEY.reducesinkkey2 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 74214 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 74214 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -1436,7 +1436,7 @@ STAGE PLANS: keys: 0 _col0 (type: int) 1 _col0 (type: int) - Statistics: Num rows: 195 Data size: 1560 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 199 Data size: 1592 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash @@ -1565,7 +1565,7 @@ STAGE PLANS: 1 _col0 (type: int) input vertices: 1 Map 4 - Statistics: Num rows: 195 Data size: 1560 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 199 
Data size: 1592 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash @@ -1696,7 +1696,7 @@ STAGE PLANS: keys: 0 _col0 (type: int) 1 _col0 (type: int) - Statistics: Num rows: 632 Data size: 5056 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 658 Data size: 5264 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash @@ -1731,16 +1731,16 @@ STAGE PLANS: 0 _col0 (type: int) 1 _col0 (type: int) outputColumnNames: _col1 - Statistics: Num rows: 391 Data size: 1564 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 1596 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: int) outputColumnNames: _col0 - Statistics: Num rows: 391 Data size: 1564 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 1596 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort order: + Map-reduce partition columns: _col0 (type: int) - Statistics: Num rows: 391 Data size: 1564 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 1596 Basic stats: COMPLETE Column stats: COMPLETE Stage: Stage-0 Fetch Operator @@ -1838,11 +1838,11 @@ STAGE PLANS: outputColumnNames: _col1 input vertices: 1 Map 4 - Statistics: Num rows: 391 Data size: 1564 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 1596 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: int) outputColumnNames: _col0 - Statistics: Num rows: 391 Data size: 1564 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 1596 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -1851,7 +1851,7 @@ STAGE PLANS: 1 _col0 (type: int) input vertices: 0 Map 1 - Statistics: Num rows: 632 Data size: 5056 Basic stats: COMPLETE Column 
stats: COMPLETE + Statistics: Num rows: 658 Data size: 5264 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash @@ -2007,7 +2007,7 @@ STAGE PLANS: keys: 0 _col0 (type: int) 1 _col0 (type: int) - Statistics: Num rows: 632 Data size: 5056 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 658 Data size: 5264 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash @@ -2042,16 +2042,16 @@ STAGE PLANS: 0 _col0 (type: int) 1 _col0 (type: int) outputColumnNames: _col1 - Statistics: Num rows: 391 Data size: 1564 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 1596 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: int) outputColumnNames: _col0 - Statistics: Num rows: 391 Data size: 1564 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 1596 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort order: + Map-reduce partition columns: _col0 (type: int) - Statistics: Num rows: 391 Data size: 1564 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 1596 Basic stats: COMPLETE Column stats: COMPLETE Stage: Stage-0 Fetch Operator @@ -2149,11 +2149,11 @@ STAGE PLANS: outputColumnNames: _col1 input vertices: 1 Map 4 - Statistics: Num rows: 391 Data size: 1564 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 1596 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: int) outputColumnNames: _col0 - Statistics: Num rows: 391 Data size: 1564 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 1596 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -2162,7 +2162,7 @@ STAGE PLANS: 1 _col0 (type: int) input vertices: 0 Map 1 - Statistics: Num rows: 632 
Data size: 5056 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 658 Data size: 5264 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash @@ -2566,11 +2566,11 @@ STAGE PLANS: 0 _col0 (type: int) 1 _col0 (type: int) outputColumnNames: _col1, _col2 - Statistics: Num rows: 391 Data size: 37145 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 37905 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: int), substr(_col2, 5) (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 391 Data size: 37145 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 37905 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col1) keys: _col0 (type: int) @@ -2708,11 +2708,11 @@ STAGE PLANS: outputColumnNames: _col1, _col2 input vertices: 0 Map 2 - Statistics: Num rows: 391 Data size: 37145 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 37905 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: int), substr(_col2, 5) (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 391 Data size: 37145 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 37905 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col1) keys: _col0 (type: int) @@ -2866,14 +2866,14 @@ STAGE PLANS: 0 _col0 (type: int) 1 _col1 (type: int) outputColumnNames: _col1, _col2, _col3 - Statistics: Num rows: 247 Data size: 25441 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 252 Data size: 25956 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col3 (type: int), _col2 (type: double), _col1 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 247 Data size: 25441 Basic stats: COMPLETE Column stats: COMPLETE + 
Statistics: Num rows: 252 Data size: 25956 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 247 Data size: 25441 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 252 Data size: 25956 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -2949,14 +2949,14 @@ STAGE PLANS: outputColumnNames: _col1, _col2, _col3 input vertices: 1 Reducer 3 - Statistics: Num rows: 247 Data size: 25441 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 252 Data size: 25956 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col3 (type: int), _col2 (type: double), _col1 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 247 Data size: 25441 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 252 Data size: 25956 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 247 Data size: 25441 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 252 Data size: 25956 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -3139,14 +3139,14 @@ STAGE PLANS: 1 _col0 (type: int) 2 _col0 (type: int) outputColumnNames: _col0, _col1, _col4 - Statistics: Num rows: 619 Data size: 115134 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 631 Data size: 117366 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: int), _col1 (type: string), _col4 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 619 Data size: 115134 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 631 Data size: 117366 Basic stats: COMPLETE Column 
stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 619 Data size: 115134 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 631 Data size: 117366 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -3202,14 +3202,14 @@ STAGE PLANS: input vertices: 1 Map 2 2 Map 3 - Statistics: Num rows: 619 Data size: 115134 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 631 Data size: 117366 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: int), _col1 (type: string), _col4 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 619 Data size: 115134 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 631 Data size: 117366 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 619 Data size: 115134 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 631 Data size: 117366 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -3304,12 +3304,12 @@ STAGE PLANS: outputColumnNames: _col0, _col1 input vertices: 1 Map 3 - Statistics: Num rows: 391 Data size: 37145 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 37905 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort order: + Map-reduce partition columns: _col0 (type: int) - Statistics: Num rows: 391 Data size: 37145 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 37905 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: string) Execution mode: llap LLAP IO: no inputs @@ -3362,14 +3362,14 @@ STAGE PLANS: 0 
_col0 (type: int) 1 _col0 (type: int) outputColumnNames: _col0, _col1, _col3 - Statistics: Num rows: 618 Data size: 114948 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 631 Data size: 117366 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: int), _col1 (type: string), _col3 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 618 Data size: 114948 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 631 Data size: 117366 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 618 Data size: 114948 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 631 Data size: 117366 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -3422,7 +3422,7 @@ STAGE PLANS: outputColumnNames: _col0, _col1 input vertices: 1 Map 2 - Statistics: Num rows: 391 Data size: 37145 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 37905 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -3432,14 +3432,14 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col3 input vertices: 1 Map 3 - Statistics: Num rows: 618 Data size: 114948 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 631 Data size: 117366 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: int), _col1 (type: string), _col3 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 618 Data size: 114948 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 631 Data size: 117366 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 618 Data size: 114948 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num 
rows: 631 Data size: 117366 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -3586,14 +3586,14 @@ STAGE PLANS: 0 _col0 (type: int) 1 _col0 (type: int) outputColumnNames: _col0, _col1, _col3 - Statistics: Num rows: 195 Data size: 20085 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 199 Data size: 20497 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: int), _col1 (type: double), _col3 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 195 Data size: 20085 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 199 Data size: 20497 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 195 Data size: 20085 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 199 Data size: 20497 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -3675,14 +3675,14 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col3 input vertices: 0 Reducer 2 - Statistics: Num rows: 195 Data size: 20085 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 199 Data size: 20497 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: int), _col1 (type: double), _col3 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 195 Data size: 20085 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 199 Data size: 20497 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 195 Data size: 20085 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 199 Data size: 20497 Basic stats: COMPLETE Column stats: COMPLETE 
table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -3799,14 +3799,14 @@ STAGE PLANS: 0 _col0 (type: int) 1 _col0 (type: int) outputColumnNames: _col0, _col1, _col3 - Statistics: Num rows: 247 Data size: 25441 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 252 Data size: 25956 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: int), _col1 (type: double), _col3 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 247 Data size: 25441 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 252 Data size: 25956 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 247 Data size: 25441 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 252 Data size: 25956 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -3882,14 +3882,14 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col3 input vertices: 0 Reducer 2 - Statistics: Num rows: 247 Data size: 25441 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 252 Data size: 25956 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: int), _col1 (type: double), _col3 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 247 Data size: 25441 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 252 Data size: 25956 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 247 Data size: 25441 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 252 Data size: 25956 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat 
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -3987,10 +3987,10 @@ STAGE PLANS: 0 _col1 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 394 Data size: 73284 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 394 Data size: 73284 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -4071,10 +4071,10 @@ STAGE PLANS: 0 _col1 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 394 Data size: 73284 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 394 Data size: 73284 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -4293,7 +4293,7 @@ STAGE PLANS: #### A masked pattern was here #### Edges: Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 4 (SIMPLE_EDGE) - Reducer 3 <- Map 1 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) + Reducer 3 <- Map 5 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) #### A masked pattern was here #### Vertices: Map 1 @@ -4309,11 +4309,18 @@ STAGE PLANS: outputColumnNames: _col0, _col1 Statistics: Num rows: 500 Data size: 47500 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: int) + key expressions: _col1 (type: string) sort order: + - Map-reduce partition 
columns: _col0 (type: int) + Map-reduce partition columns: _col1 (type: string) Statistics: Num rows: 500 Data size: 47500 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: string) + value expressions: _col0 (type: int) + Execution mode: llap + LLAP IO: no inputs + Map 4 + Map Operator Tree: + TableScan + alias: b + Statistics: Num rows: 500 Data size: 47500 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: value is not null (type: boolean) Statistics: Num rows: 500 Data size: 47500 Basic stats: COMPLETE Column stats: COMPLETE @@ -4329,7 +4336,7 @@ STAGE PLANS: value expressions: _col0 (type: int) Execution mode: llap LLAP IO: no inputs - Map 4 + Map 5 Map Operator Tree: TableScan alias: c @@ -4355,16 +4362,16 @@ STAGE PLANS: condition map: Inner Join 0 to 1 keys: - 0 _col0 (type: int) - 1 _col0 (type: int) - outputColumnNames: _col0, _col1 - Statistics: Num rows: 809 Data size: 76855 Basic stats: COMPLETE Column stats: COMPLETE + 0 _col1 (type: string) + 1 _col1 (type: string) + outputColumnNames: _col0, _col2 + Statistics: Num rows: 814 Data size: 6512 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col1 (type: string) + key expressions: _col0 (type: int) sort order: + - Map-reduce partition columns: _col1 (type: string) - Statistics: Num rows: 809 Data size: 76855 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col0 (type: int) + Map-reduce partition columns: _col0 (type: int) + Statistics: Num rows: 814 Data size: 6512 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col2 (type: int) Reducer 3 Execution mode: llap Reduce Operator Tree: @@ -4372,17 +4379,17 @@ STAGE PLANS: condition map: Inner Join 0 to 1 keys: - 0 _col1 (type: string) - 1 _col1 (type: string) - outputColumnNames: _col0, _col3 - Statistics: Num rows: 1309 Data size: 10472 Basic stats: COMPLETE Column stats: COMPLETE + 0 _col0 (type: int) + 1 _col0 (type: int) + 
outputColumnNames: _col0, _col2 + Statistics: Num rows: 1343 Data size: 10744 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: _col0 (type: int), _col3 (type: int) + expressions: _col0 (type: int), _col2 (type: int) outputColumnNames: _col0, _col1 - Statistics: Num rows: 1309 Data size: 10472 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1343 Data size: 10744 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 1309 Data size: 10472 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1343 Data size: 10744 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -4407,8 +4414,8 @@ STAGE PLANS: Tez #### A masked pattern was here #### Edges: - Map 1 <- Map 3 (CUSTOM_EDGE) Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 4 (SIMPLE_EDGE) + Reducer 3 <- Map 5 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) #### A masked pattern was here #### Vertices: Map 1 @@ -4423,41 +4430,12 @@ STAGE PLANS: expressions: key (type: int), value (type: string) outputColumnNames: _col0, _col1 Statistics: Num rows: 500 Data size: 47500 Basic stats: COMPLETE Column stats: COMPLETE - Map Join Operator - condition map: - Inner Join 0 to 1 - keys: - 0 _col0 (type: int) - 1 _col0 (type: int) - outputColumnNames: _col0, _col1 - input vertices: - 1 Map 3 - Statistics: Num rows: 809 Data size: 76855 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator - key expressions: _col1 (type: string) - sort order: + - Map-reduce partition columns: _col1 (type: string) - Statistics: Num rows: 809 Data size: 76855 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col0 (type: int) - Execution mode: llap - LLAP IO: no inputs - Map 3 - Map Operator Tree: - TableScan - alias: c - Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE 
Column stats: COMPLETE - Filter Operator - predicate: key is not null (type: boolean) - Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator - expressions: key (type: int) - outputColumnNames: _col0 - Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: int) + key expressions: _col1 (type: string) sort order: + - Map-reduce partition columns: _col0 (type: int) - Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE + Map-reduce partition columns: _col1 (type: string) + Statistics: Num rows: 500 Data size: 47500 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col0 (type: int) Execution mode: llap LLAP IO: no inputs Map 4 @@ -4480,6 +4458,25 @@ STAGE PLANS: value expressions: _col0 (type: int) Execution mode: llap LLAP IO: no inputs + Map 5 + Map Operator Tree: + TableScan + alias: c + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE + Filter Operator + predicate: key is not null (type: boolean) + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE + Select Operator + expressions: key (type: int) + outputColumnNames: _col0 + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE + Reduce Output Operator + key expressions: _col0 (type: int) + sort order: + + Map-reduce partition columns: _col0 (type: int) + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE + Execution mode: llap + LLAP IO: no inputs Reducer 2 Execution mode: llap Reduce Operator Tree: @@ -4489,15 +4486,32 @@ STAGE PLANS: keys: 0 _col1 (type: string) 1 _col1 (type: string) - outputColumnNames: _col0, _col3 - Statistics: Num rows: 1309 Data size: 10472 Basic stats: COMPLETE Column stats: COMPLETE + outputColumnNames: _col0, _col2 + Statistics: Num rows: 814 Data size: 6512 
Basic stats: COMPLETE Column stats: COMPLETE + Reduce Output Operator + key expressions: _col0 (type: int) + sort order: + + Map-reduce partition columns: _col0 (type: int) + Statistics: Num rows: 814 Data size: 6512 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col2 (type: int) + Reducer 3 + Execution mode: llap + Reduce Operator Tree: + Merge Join Operator + condition map: + Inner Join 0 to 1 + keys: + 0 _col0 (type: int) + 1 _col0 (type: int) + outputColumnNames: _col0, _col2 + Statistics: Num rows: 1343 Data size: 10744 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: _col0 (type: int), _col3 (type: int) + expressions: _col0 (type: int), _col2 (type: int) outputColumnNames: _col0, _col1 - Statistics: Num rows: 1309 Data size: 10472 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1343 Data size: 10744 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 1309 Data size: 10472 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1343 Data size: 10744 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -4594,14 +4608,14 @@ STAGE PLANS: 0 _col0 (type: int), _col2 (type: string) 1 _col0 (type: int), _col2 (type: string) outputColumnNames: _col0, _col1, _col4 - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 74214 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: int), _col1 (type: string), _col4 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 74214 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: 
Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 74214 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -4698,14 +4712,14 @@ STAGE PLANS: 0 _col0 (type: int), _col2 (type: string) 1 _col0 (type: int), _col2 (type: string) outputColumnNames: _col0, _col1, _col4 - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 74214 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: int), _col1 (type: string), _col4 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 74214 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 399 Data size: 74214 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -4783,14 +4797,14 @@ STAGE PLANS: 0 _col0 (type: int), _col1 (type: string) 1 _col0 (type: int), _col1 (type: string) outputColumnNames: _col0, _col1, _col3 - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 394 Data size: 73284 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: int), _col1 (type: string), _col3 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 394 Data size: 73284 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator 
compressed: false - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 394 Data size: 73284 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -5358,14 +5372,14 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col3 input vertices: 0 Map 1 - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 394 Data size: 73284 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: int), _col1 (type: string), _col3 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 394 Data size: 73284 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 394 Data size: 73284 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -5979,14 +5993,14 @@ STAGE PLANS: 0 _col0 (type: int), _col1 (type: string) 1 _col0 (type: int), _col1 (type: string) outputColumnNames: _col0, _col1, _col3 - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 394 Data size: 73284 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: int), _col1 (type: string), _col3 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 394 Data size: 73284 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num 
rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 394 Data size: 73284 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -6554,14 +6568,14 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col3 input vertices: 0 Map 1 - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 394 Data size: 73284 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: int), _col1 (type: string), _col3 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 394 Data size: 73284 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 394 Data size: 73284 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat diff --git ql/src/test/results/clientpositive/llap/bucket_map_join_tez2.q.out ql/src/test/results/clientpositive/llap/bucket_map_join_tez2.q.out index b84edde..528106d 100644 --- ql/src/test/results/clientpositive/llap/bucket_map_join_tez2.q.out +++ ql/src/test/results/clientpositive/llap/bucket_map_join_tez2.q.out @@ -178,7 +178,7 @@ STAGE PLANS: #### A masked pattern was here #### Edges: Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 4 (SIMPLE_EDGE) - Reducer 3 <- Map 1 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) + Reducer 3 <- Map 5 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) #### A masked pattern was here #### Vertices: Map 1 @@ -194,11 +194,18 @@ STAGE PLANS: outputColumnNames: _col0, _col1 Statistics: Num rows: 500 Data size: 47500 Basic stats: 
COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: int) + key expressions: _col1 (type: string) sort order: + - Map-reduce partition columns: _col0 (type: int) + Map-reduce partition columns: _col1 (type: string) Statistics: Num rows: 500 Data size: 47500 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: string) + value expressions: _col0 (type: int) + Execution mode: llap + LLAP IO: no inputs + Map 4 + Map Operator Tree: + TableScan + alias: b + Statistics: Num rows: 500 Data size: 47500 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: value is not null (type: boolean) Statistics: Num rows: 500 Data size: 47500 Basic stats: COMPLETE Column stats: COMPLETE @@ -214,7 +221,7 @@ STAGE PLANS: value expressions: _col0 (type: int) Execution mode: llap LLAP IO: no inputs - Map 4 + Map 5 Map Operator Tree: TableScan alias: c @@ -240,16 +247,16 @@ STAGE PLANS: condition map: Inner Join 0 to 1 keys: - 0 _col0 (type: int) - 1 _col0 (type: int) - outputColumnNames: _col0, _col1 - Statistics: Num rows: 809 Data size: 76855 Basic stats: COMPLETE Column stats: COMPLETE + 0 _col1 (type: string) + 1 _col1 (type: string) + outputColumnNames: _col0, _col2 + Statistics: Num rows: 814 Data size: 6512 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col1 (type: string) + key expressions: _col0 (type: int) sort order: + - Map-reduce partition columns: _col1 (type: string) - Statistics: Num rows: 809 Data size: 76855 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col0 (type: int) + Map-reduce partition columns: _col0 (type: int) + Statistics: Num rows: 814 Data size: 6512 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col2 (type: int) Reducer 3 Execution mode: llap Reduce Operator Tree: @@ -257,17 +264,17 @@ STAGE PLANS: condition map: Inner Join 0 to 1 keys: - 0 _col1 (type: string) - 1 _col1 (type: string) - 
outputColumnNames: _col0, _col3 - Statistics: Num rows: 1309 Data size: 10472 Basic stats: COMPLETE Column stats: COMPLETE + 0 _col0 (type: int) + 1 _col0 (type: int) + outputColumnNames: _col0, _col2 + Statistics: Num rows: 1343 Data size: 10744 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: _col0 (type: int), _col3 (type: int) + expressions: _col0 (type: int), _col2 (type: int) outputColumnNames: _col0, _col1 - Statistics: Num rows: 1309 Data size: 10472 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1343 Data size: 10744 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 1309 Data size: 10472 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1343 Data size: 10744 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -292,8 +299,8 @@ STAGE PLANS: Tez #### A masked pattern was here #### Edges: - Map 1 <- Map 3 (CUSTOM_EDGE) Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 4 (SIMPLE_EDGE) + Reducer 3 <- Map 5 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) #### A masked pattern was here #### Vertices: Map 1 @@ -308,41 +315,12 @@ STAGE PLANS: expressions: key (type: int), value (type: string) outputColumnNames: _col0, _col1 Statistics: Num rows: 500 Data size: 47500 Basic stats: COMPLETE Column stats: COMPLETE - Map Join Operator - condition map: - Inner Join 0 to 1 - keys: - 0 _col0 (type: int) - 1 _col0 (type: int) - outputColumnNames: _col0, _col1 - input vertices: - 1 Map 3 - Statistics: Num rows: 809 Data size: 76855 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator - key expressions: _col1 (type: string) - sort order: + - Map-reduce partition columns: _col1 (type: string) - Statistics: Num rows: 809 Data size: 76855 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col0 (type: int) - 
Execution mode: llap - LLAP IO: no inputs - Map 3 - Map Operator Tree: - TableScan - alias: c - Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator - predicate: key is not null (type: boolean) - Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator - expressions: key (type: int) - outputColumnNames: _col0 - Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: int) + key expressions: _col1 (type: string) sort order: + - Map-reduce partition columns: _col0 (type: int) - Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE + Map-reduce partition columns: _col1 (type: string) + Statistics: Num rows: 500 Data size: 47500 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col0 (type: int) Execution mode: llap LLAP IO: no inputs Map 4 @@ -365,6 +343,25 @@ STAGE PLANS: value expressions: _col0 (type: int) Execution mode: llap LLAP IO: no inputs + Map 5 + Map Operator Tree: + TableScan + alias: c + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE + Filter Operator + predicate: key is not null (type: boolean) + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE + Select Operator + expressions: key (type: int) + outputColumnNames: _col0 + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE + Reduce Output Operator + key expressions: _col0 (type: int) + sort order: + + Map-reduce partition columns: _col0 (type: int) + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE + Execution mode: llap + LLAP IO: no inputs Reducer 2 Execution mode: llap Reduce Operator Tree: @@ -374,15 +371,32 @@ STAGE PLANS: keys: 0 _col1 (type: string) 1 _col1 (type: string) - outputColumnNames: _col0, _col3 - Statistics: 
Num rows: 1309 Data size: 10472 Basic stats: COMPLETE Column stats: COMPLETE + outputColumnNames: _col0, _col2 + Statistics: Num rows: 814 Data size: 6512 Basic stats: COMPLETE Column stats: COMPLETE + Reduce Output Operator + key expressions: _col0 (type: int) + sort order: + + Map-reduce partition columns: _col0 (type: int) + Statistics: Num rows: 814 Data size: 6512 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col2 (type: int) + Reducer 3 + Execution mode: llap + Reduce Operator Tree: + Merge Join Operator + condition map: + Inner Join 0 to 1 + keys: + 0 _col0 (type: int) + 1 _col0 (type: int) + outputColumnNames: _col0, _col2 + Statistics: Num rows: 1343 Data size: 10744 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: _col0 (type: int), _col3 (type: int) + expressions: _col0 (type: int), _col2 (type: int) outputColumnNames: _col0, _col1 - Statistics: Num rows: 1309 Data size: 10472 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1343 Data size: 10744 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 1309 Data size: 10472 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1343 Data size: 10744 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -496,14 +510,14 @@ STAGE PLANS: 0 UDFToDouble(_col0) (type: double) 1 UDFToDouble(_col0) (type: double) outputColumnNames: _col0, _col1, _col3 - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 382 Data size: 71052 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: int), _col1 (type: string), _col3 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + 
Statistics: Num rows: 382 Data size: 71052 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 382 Data size: 71052 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -585,14 +599,14 @@ STAGE PLANS: 0 UDFToDouble(_col0) (type: double) 1 UDFToDouble(_col0) (type: double) outputColumnNames: _col0, _col1, _col3 - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 382 Data size: 71052 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: int), _col1 (type: string), _col3 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 382 Data size: 71052 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 391 Data size: 72726 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 382 Data size: 71052 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -670,10 +684,10 @@ STAGE PLANS: 0 _col0 (type: int) 1 _col0 (type: int) outputColumnNames: _col0, _col1 - Statistics: Num rows: 267 Data size: 2136 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 272 Data size: 2176 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 267 Data size: 2136 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 272 Data size: 2176 Basic stats: COMPLETE Column stats: COMPLETE table: input format: 
org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -724,10 +738,10 @@ STAGE PLANS: outputColumnNames: _col0, _col1 input vertices: 1 Map 2 - Statistics: Num rows: 267 Data size: 2136 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 272 Data size: 2176 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 267 Data size: 2136 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 272 Data size: 2176 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -826,10 +840,10 @@ STAGE PLANS: 0 _col0 (type: int) 1 _col0 (type: int) outputColumnNames: _col0, _col1 - Statistics: Num rows: 267 Data size: 2136 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 272 Data size: 2176 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 267 Data size: 2136 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 272 Data size: 2176 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -880,10 +894,10 @@ STAGE PLANS: outputColumnNames: _col0, _col1 input vertices: 1 Map 2 - Statistics: Num rows: 267 Data size: 2136 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 272 Data size: 2176 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 267 Data size: 2136 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 272 Data size: 2176 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: 
org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -982,10 +996,10 @@ STAGE PLANS: 0 _col0 (type: int) 1 _col0 (type: int) outputColumnNames: _col0, _col1 - Statistics: Num rows: 267 Data size: 2136 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 272 Data size: 2176 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 267 Data size: 2136 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 272 Data size: 2176 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -1055,10 +1069,10 @@ STAGE PLANS: outputColumnNames: _col0, _col1 input vertices: 0 Map 1 - Statistics: Num rows: 267 Data size: 2136 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 272 Data size: 2176 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 267 Data size: 2136 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 272 Data size: 2176 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -1565,7 +1579,7 @@ STAGE PLANS: keys: 0 _col0 (type: int), _col1 (type: string) 1 _col0 (type: int), _col1 (type: string) - Statistics: Num rows: 195 Data size: 1560 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 197 Data size: 1576 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash @@ -1675,7 +1689,7 @@ STAGE PLANS: 1 _col0 (type: int), _col1 (type: string) input vertices: 1 Map 4 - Statistics: Num rows: 195 Data size: 1560 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 197 Data size: 1576 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: 
count() mode: hash diff --git ql/src/test/results/clientpositive/llap/correlationoptimizer1.q.out ql/src/test/results/clientpositive/llap/correlationoptimizer1.q.out index b138a2d..ed5a7a5 100644 --- ql/src/test/results/clientpositive/llap/correlationoptimizer1.q.out +++ ql/src/test/results/clientpositive/llap/correlationoptimizer1.q.out @@ -72,7 +72,7 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 40 Data size: 3440 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 3354 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string) @@ -220,7 +220,7 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 40 Data size: 3440 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 3354 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string) @@ -360,7 +360,7 @@ STAGE PLANS: outputColumnNames: _col0 input vertices: 0 Map 1 - Statistics: Num rows: 40 Data size: 3440 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 3354 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string) @@ -515,18 +515,18 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 20 Data size: 1720 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 19 Data size: 1634 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string) mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 10 Data size: 940 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9 Data size: 846 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + 
Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 10 Data size: 940 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9 Data size: 846 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Reducer 3 Execution mode: llap @@ -536,11 +536,11 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 10 Data size: 940 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9 Data size: 846 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: hash(_col0) (type: int), hash(_col1) (type: int) outputColumnNames: _col0, _col1 - Statistics: Num rows: 10 Data size: 940 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9 Data size: 846 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col0), sum(_col1) mode: hash @@ -668,18 +668,18 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 20 Data size: 1720 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 19 Data size: 1634 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string) mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 10 Data size: 940 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9 Data size: 846 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 10 Data size: 940 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9 Data size: 846 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Reducer 3 Execution mode: llap @@ -689,11 +689,11 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: 
Num rows: 10 Data size: 940 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9 Data size: 846 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: hash(_col0) (type: int), hash(_col1) (type: int) outputColumnNames: _col0, _col1 - Statistics: Num rows: 10 Data size: 940 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9 Data size: 846 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col0), sum(_col1) mode: hash @@ -810,7 +810,7 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 40 Data size: 3440 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 3354 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string) @@ -952,7 +952,7 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 40 Data size: 3440 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 3354 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string) @@ -1094,7 +1094,7 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col1 - Statistics: Num rows: 40 Data size: 3480 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 3393 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col1 (type: string) @@ -1236,7 +1236,7 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col1 - Statistics: Num rows: 40 Data size: 3480 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 3393 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col1 (type: string) @@ -1375,18 +1375,18 @@ STAGE PLANS: 0 _col0 (type: string), _col1 (type: string) 1 _col0 (type: 
string), _col1 (type: string) outputColumnNames: _col0, _col3 - Statistics: Num rows: 40 Data size: 7080 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6903 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string), _col3 (type: string) mode: hash outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 20 Data size: 3700 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 19 Data size: 3515 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string) sort order: ++ Map-reduce partition columns: _col0 (type: string), _col1 (type: string) - Statistics: Num rows: 20 Data size: 3700 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 19 Data size: 3515 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: bigint) Reducer 3 Execution mode: llap @@ -1396,10 +1396,10 @@ STAGE PLANS: keys: KEY._col0 (type: string), KEY._col1 (type: string) mode: mergepartial outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 20 Data size: 3700 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 19 Data size: 3515 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 20 Data size: 3700 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 19 Data size: 3515 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -1506,18 +1506,18 @@ STAGE PLANS: 0 _col0 (type: string), _col1 (type: string) 1 _col0 (type: string), _col1 (type: string) outputColumnNames: _col0, _col3 - Statistics: Num rows: 40 Data size: 7080 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6903 Basic stats: COMPLETE Column stats: COMPLETE Group 
By Operator aggregations: count() keys: _col0 (type: string), _col3 (type: string) mode: hash outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 20 Data size: 3700 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 19 Data size: 3515 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string) sort order: ++ Map-reduce partition columns: _col0 (type: string), _col1 (type: string) - Statistics: Num rows: 20 Data size: 3700 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 19 Data size: 3515 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: bigint) Reducer 3 Execution mode: llap @@ -1527,10 +1527,10 @@ STAGE PLANS: keys: KEY._col0 (type: string), KEY._col1 (type: string) mode: mergepartial outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 20 Data size: 3700 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 19 Data size: 3515 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 20 Data size: 3700 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 19 Data size: 3515 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -1924,7 +1924,7 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 500 Data size: 3526 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 500 Data size: 3440 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string) @@ -2066,7 +2066,7 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 500 Data size: 3526 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 500 Data size: 
3440 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string) @@ -2208,7 +2208,7 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 525 Data size: 3526 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 525 Data size: 3440 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string) @@ -2350,7 +2350,7 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 525 Data size: 3526 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 525 Data size: 3440 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string) @@ -2499,18 +2499,18 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string), _col1 (type: string) mode: hash outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 20 Data size: 3660 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 19 Data size: 3477 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string) sort order: ++ Map-reduce partition columns: _col0 (type: string), _col1 (type: string) - Statistics: Num rows: 20 Data size: 3660 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 19 Data size: 3477 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: bigint) Reducer 3 Execution mode: llap @@ -2520,11 +2520,11 @@ STAGE PLANS: keys: KEY._col0 (type: string), KEY._col1 (type: string) mode: mergepartial outputColumnNames: _col0, _col1, _col2 - 
Statistics: Num rows: 20 Data size: 3660 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 19 Data size: 3477 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: hash(_col0) (type: int), hash(_col1) (type: int), hash(_col2) (type: int) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 20 Data size: 3660 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 19 Data size: 3477 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col0), sum(_col1), sum(_col2) mode: hash @@ -2648,18 +2648,18 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string), _col1 (type: string) mode: hash outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 20 Data size: 3660 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 19 Data size: 3477 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string) sort order: ++ Map-reduce partition columns: _col0 (type: string), _col1 (type: string) - Statistics: Num rows: 20 Data size: 3660 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 19 Data size: 3477 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: bigint) Reducer 3 Execution mode: llap @@ -2669,11 +2669,11 @@ STAGE PLANS: keys: KEY._col0 (type: string), KEY._col1 (type: string) mode: mergepartial outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 20 Data size: 3660 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 19 Data size: 3477 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: hash(_col0) (type: int), hash(_col1) (type: 
int), hash(_col2) (type: int) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 20 Data size: 3660 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 19 Data size: 3477 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col0), sum(_col1), sum(_col2) mode: hash @@ -2796,7 +2796,7 @@ STAGE PLANS: 0 _col0 (type: string), _col1 (type: string) 1 _col0 (type: string), _col1 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 40 Data size: 3440 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 3354 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string) @@ -2944,7 +2944,7 @@ STAGE PLANS: 0 _col0 (type: string), _col1 (type: string) 1 _col0 (type: string), _col1 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 40 Data size: 3440 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 3354 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string) diff --git ql/src/test/results/clientpositive/llap/correlationoptimizer2.q.out ql/src/test/results/clientpositive/llap/correlationoptimizer2.q.out index 64248e7..0a39763 100644 --- ql/src/test/results/clientpositive/llap/correlationoptimizer2.q.out +++ ql/src/test/results/clientpositive/llap/correlationoptimizer2.q.out @@ -1804,16 +1804,16 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col1, _col2 - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: string), _col2 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: 
COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: string) Reducer 3 Execution mode: llap @@ -1825,11 +1825,11 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 30 Data size: 8070 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 29 Data size: 7801 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: hash(_col0) (type: int), hash(_col1) (type: int), hash(_col2) (type: int), hash(_col3) (type: int) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 30 Data size: 8070 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 29 Data size: 7801 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col0), sum(_col1), sum(_col2), sum(_col3) mode: hash @@ -1985,16 +1985,16 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col1, _col2 - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: string), _col2 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE 
value expressions: _col1 (type: string) Reducer 3 Execution mode: llap @@ -2006,11 +2006,11 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 30 Data size: 8070 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 29 Data size: 7801 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: hash(_col0) (type: int), hash(_col1) (type: int), hash(_col2) (type: int), hash(_col3) (type: int) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 30 Data size: 8070 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 29 Data size: 7801 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col0), sum(_col1), sum(_col2), sum(_col3) mode: hash diff --git ql/src/test/results/clientpositive/llap/correlationoptimizer3.q.out ql/src/test/results/clientpositive/llap/correlationoptimizer3.q.out index 0d3c3bc..005af0e 100644 --- ql/src/test/results/clientpositive/llap/correlationoptimizer3.q.out +++ ql/src/test/results/clientpositive/llap/correlationoptimizer3.q.out @@ -101,16 +101,16 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col1, _col2 - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: string), _col2 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: 
COMPLETE value expressions: _col1 (type: string) Reducer 3 Execution mode: llap @@ -122,11 +122,11 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1, _col3 - Statistics: Num rows: 40 Data size: 7320 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 7137 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: hash(_col0) (type: int), hash(_col3) (type: int), hash(_col1) (type: int) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 40 Data size: 7320 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 7137 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col0), sum(_col1), sum(_col2) mode: hash @@ -161,7 +161,7 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col1 - Statistics: Num rows: 40 Data size: 3440 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 3354 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col1 (type: string) @@ -318,16 +318,16 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col1, _col2 - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: string), _col2 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE value 
expressions: _col1 (type: string) Reducer 3 Execution mode: llap @@ -339,11 +339,11 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1, _col3 - Statistics: Num rows: 40 Data size: 7320 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 7137 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: hash(_col0) (type: int), hash(_col3) (type: int), hash(_col1) (type: int) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 40 Data size: 7320 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 7137 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col0), sum(_col1), sum(_col2) mode: hash @@ -378,7 +378,7 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col1 - Statistics: Num rows: 40 Data size: 3440 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 3354 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col1 (type: string) @@ -482,11 +482,11 @@ STAGE PLANS: outputColumnNames: _col1, _col2 input vertices: 1 Map 3 - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: string), _col2 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -496,11 +496,11 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col3 input vertices: 1 Reducer 5 - Statistics: Num rows: 40 Data size: 7320 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 7137 Basic stats: COMPLETE Column stats: COMPLETE Select Operator 
expressions: hash(_col0) (type: int), hash(_col3) (type: int), hash(_col1) (type: int) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 40 Data size: 7320 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 7137 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col0), sum(_col1), sum(_col2) mode: hash @@ -553,7 +553,7 @@ STAGE PLANS: outputColumnNames: _col1 input vertices: 1 Map 6 - Statistics: Num rows: 40 Data size: 3440 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 3354 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col1 (type: string) @@ -746,16 +746,16 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col1, _col2 - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: string), _col2 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: string) Reducer 3 Execution mode: llap @@ -767,11 +767,11 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col1, _col2, _col3 - Statistics: Num rows: 40 Data size: 7320 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 7137 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: hash(_col2) (type: int), 
hash(_col3) (type: int), hash(_col1) (type: int) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 40 Data size: 7320 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 7137 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col0), sum(_col1), sum(_col2) mode: hash @@ -806,7 +806,7 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col1 - Statistics: Num rows: 40 Data size: 3440 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 3354 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col1 (type: string) @@ -963,16 +963,16 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col1, _col2 - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: string), _col2 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: string) Reducer 3 Execution mode: llap @@ -984,11 +984,11 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col1, _col2, _col3 - Statistics: Num rows: 40 Data size: 7320 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 7137 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: hash(_col2) (type: int), hash(_col3) (type: 
int), hash(_col1) (type: int) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 40 Data size: 7320 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 7137 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col0), sum(_col1), sum(_col2) mode: hash @@ -1023,7 +1023,7 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col1 - Statistics: Num rows: 40 Data size: 3440 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 3354 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col1 (type: string) @@ -1127,11 +1127,11 @@ STAGE PLANS: outputColumnNames: _col1, _col2 input vertices: 1 Map 3 - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: string), _col2 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -1141,11 +1141,11 @@ STAGE PLANS: outputColumnNames: _col1, _col2, _col3 input vertices: 1 Reducer 5 - Statistics: Num rows: 40 Data size: 7320 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 7137 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: hash(_col2) (type: int), hash(_col3) (type: int), hash(_col1) (type: int) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 40 Data size: 7320 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 7137 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col0), sum(_col1), sum(_col2) mode: hash @@ -1198,7 +1198,7 @@ STAGE PLANS: 
outputColumnNames: _col1 input vertices: 1 Map 6 - Statistics: Num rows: 40 Data size: 3440 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 3354 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col1 (type: string) diff --git ql/src/test/results/clientpositive/llap/correlationoptimizer6.q.out ql/src/test/results/clientpositive/llap/correlationoptimizer6.q.out index d94dda2..6742bb7 100644 --- ql/src/test/results/clientpositive/llap/correlationoptimizer6.q.out +++ ql/src/test/results/clientpositive/llap/correlationoptimizer6.q.out @@ -172,18 +172,18 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 809 Data size: 70383 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 68817 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string) mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Reducer 8 Execution mode: llap @@ -193,12 +193,12 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - 
Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Stage: Stage-0 @@ -416,18 +416,18 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 809 Data size: 70383 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 68817 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string) mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Reducer 8 Execution mode: llap @@ -437,12 +437,12 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Stage: Stage-0 @@ -593,18 +593,18 @@ STAGE PLANS: outputColumnNames: _col0 input vertices: 1 Map 6 - Statistics: Num rows: 809 Data size: 70383 Basic stats: COMPLETE 
Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 68817 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string) mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Execution mode: llap LLAP IO: no inputs @@ -650,7 +650,7 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -788,10 +788,10 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 20 Data size: 3620 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 19 Data size: 3439 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 20 Data size: 3620 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 19 Data size: 3439 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -929,10 +929,10 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 20 Data size: 3620 Basic stats: COMPLETE Column stats: COMPLETE + 
Statistics: Num rows: 19 Data size: 3439 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 20 Data size: 3620 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 19 Data size: 3439 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -1105,18 +1105,18 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 809 Data size: 70383 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 68817 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string) mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Reducer 5 Execution mode: llap @@ -1126,12 +1126,12 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: 
COMPLETE value expressions: _col1 (type: bigint) Stage: Stage-0 @@ -1286,18 +1286,18 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 809 Data size: 70383 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 68817 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string) mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Reducer 5 Execution mode: llap @@ -1307,12 +1307,12 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Stage: Stage-0 @@ -1864,14 +1864,14 @@ STAGE PLANS: 1 _col0 (type: string) 2 _col0 (type: string) outputColumnNames: _col1, _col2, _col3 - Statistics: Num rows: 40 Data size: 7240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 7059 Basic stats: COMPLETE Column stats: COMPLETE Select Operator 
expressions: _col1 (type: string), _col2 (type: string), _col3 (type: bigint) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 40 Data size: 7240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 7059 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 40 Data size: 7240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 7059 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -1886,18 +1886,18 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 809 Data size: 70383 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 68817 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string) mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Reducer 5 Execution mode: llap @@ -1907,12 +1907,12 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce 
partition columns: _col0 (type: string) - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Stage: Stage-0 @@ -2082,14 +2082,14 @@ STAGE PLANS: 1 _col0 (type: string) 2 _col0 (type: string) outputColumnNames: _col1, _col2, _col3 - Statistics: Num rows: 40 Data size: 7240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 7059 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: string), _col2 (type: string), _col3 (type: bigint) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 40 Data size: 7240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 7059 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 40 Data size: 7240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 7059 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -2104,18 +2104,18 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 809 Data size: 70383 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 68817 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string) mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 309 Data size: 29355 Basic 
stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Reducer 5 Execution mode: llap @@ -2125,12 +2125,12 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Stage: Stage-0 @@ -2298,18 +2298,18 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 809 Data size: 70383 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 68817 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string) mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Reducer 3 Execution mode: llap @@ -2319,12 +2319,12 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: 
COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Reducer 4 Execution mode: llap @@ -2338,14 +2338,14 @@ STAGE PLANS: 1 _col0 (type: string) 2 _col0 (type: string) outputColumnNames: _col0, _col1, _col3 - Statistics: Num rows: 40 Data size: 7240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 7059 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col3 (type: string), _col0 (type: string), _col1 (type: bigint) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 40 Data size: 7240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 7059 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 40 Data size: 7240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 7059 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -2516,18 +2516,18 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 809 Data size: 70383 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 68817 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string) mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 
Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Reducer 3 Execution mode: llap @@ -2537,12 +2537,12 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Reducer 4 Execution mode: llap @@ -2556,14 +2556,14 @@ STAGE PLANS: 1 _col0 (type: string) 2 _col0 (type: string) outputColumnNames: _col0, _col1, _col3 - Statistics: Num rows: 40 Data size: 7240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 7059 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col3 (type: string), _col0 (type: string), _col1 (type: bigint) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 40 Data size: 7240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 7059 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 40 Data size: 7240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 7059 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output 
format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -3327,18 +3327,18 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string), _col1 (type: string) mode: hash outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 404 Data size: 75144 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 395 Data size: 73470 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string) sort order: ++ Map-reduce partition columns: _col0 (type: string), _col1 (type: string) - Statistics: Num rows: 404 Data size: 75144 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 395 Data size: 73470 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: bigint) Reducer 9 Execution mode: llap @@ -3348,12 +3348,12 @@ STAGE PLANS: keys: KEY._col0 (type: string), KEY._col1 (type: string) mode: mergepartial outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 404 Data size: 75144 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 395 Data size: 73470 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 404 Data size: 75144 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 395 Data size: 73470 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: string), _col2 (type: bigint) Stage: Stage-0 @@ -3572,18 +3572,18 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 809 Data size: 144002 Basic stats: 
COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string), _col1 (type: string) mode: hash outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 404 Data size: 75144 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 395 Data size: 73470 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string) sort order: ++ Map-reduce partition columns: _col0 (type: string), _col1 (type: string) - Statistics: Num rows: 404 Data size: 75144 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 395 Data size: 73470 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: bigint) Reducer 8 Execution mode: llap @@ -3593,12 +3593,12 @@ STAGE PLANS: keys: KEY._col0 (type: string), KEY._col1 (type: string) mode: mergepartial outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 404 Data size: 75144 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 395 Data size: 73470 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 404 Data size: 75144 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 395 Data size: 73470 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: string), _col2 (type: bigint) Stage: Stage-0 @@ -3749,18 +3749,18 @@ STAGE PLANS: outputColumnNames: _col0, _col1 input vertices: 1 Map 6 - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string), _col1 (type: string) mode: hash outputColumnNames: _col0, _col1, _col2 - 
Statistics: Num rows: 404 Data size: 75144 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 395 Data size: 73470 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string) sort order: ++ Map-reduce partition columns: _col0 (type: string), _col1 (type: string) - Statistics: Num rows: 404 Data size: 75144 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 395 Data size: 73470 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: bigint) Execution mode: llap LLAP IO: no inputs @@ -3806,7 +3806,7 @@ STAGE PLANS: keys: KEY._col0 (type: string), KEY._col1 (type: string) mode: mergepartial outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 404 Data size: 75144 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 395 Data size: 73470 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 diff --git ql/src/test/results/clientpositive/llap/cross_join.q.out ql/src/test/results/clientpositive/llap/cross_join.q.out index 6bde893..f5666a8 100644 --- ql/src/test/results/clientpositive/llap/cross_join.q.out +++ ql/src/test/results/clientpositive/llap/cross_join.q.out @@ -200,10 +200,10 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 809 Data size: 70383 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 68817 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 809 Data size: 70383 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 68817 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -390,10 +390,10 @@ STAGE PLANS: outputColumnNames: _col0 input vertices: 1 Map 2 
- Statistics: Num rows: 809 Data size: 70383 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 68817 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 809 Data size: 70383 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 68817 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat diff --git ql/src/test/results/clientpositive/llap/dynamic_semijoin_reduction.q.out ql/src/test/results/clientpositive/llap/dynamic_semijoin_reduction.q.out index 3d711c3..dff86d7 100644 --- ql/src/test/results/clientpositive/llap/dynamic_semijoin_reduction.q.out +++ ql/src/test/results/clientpositive/llap/dynamic_semijoin_reduction.q.out @@ -452,12 +452,12 @@ STAGE PLANS: keys: _col0 (type: string) mode: hash outputColumnNames: _col0 - Statistics: Num rows: 309 Data size: 26883 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 27492 Basic stats: COMPLETE Column stats: COMPLETE Dynamic Partitioning Event Operator Target column: ds (string) Target Input: srcpart_small Partition key expr: ds - Statistics: Num rows: 309 Data size: 26883 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 27492 Basic stats: COMPLETE Column stats: COMPLETE Target Vertex: Map 4 Execution mode: llap LLAP IO: all inputs @@ -723,7 +723,7 @@ STAGE PLANS: outputColumnNames: _col0 Statistics: Num rows: 2000 Data size: 174000 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator - aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=309) + aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=316) mode: hash outputColumnNames: _col0, _col1, _col2 Statistics: Num rows: 1 Data size: 552 Basic stats: COMPLETE Column stats: COMPLETE @@ -826,7 +826,7 @@ 
STAGE PLANS: Execution mode: llap Reduce Operator Tree: Group By Operator - aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, expectedEntries=309) + aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, expectedEntries=316) mode: final outputColumnNames: _col0, _col1, _col2 Statistics: Num rows: 1 Data size: 552 Basic stats: COMPLETE Column stats: COMPLETE diff --git ql/src/test/results/clientpositive/llap/dynamic_semijoin_reduction_sw.q.out ql/src/test/results/clientpositive/llap/dynamic_semijoin_reduction_sw.q.out index d6103a8..880ba53 100644 --- ql/src/test/results/clientpositive/llap/dynamic_semijoin_reduction_sw.q.out +++ ql/src/test/results/clientpositive/llap/dynamic_semijoin_reduction_sw.q.out @@ -231,7 +231,7 @@ STAGE PLANS: outputColumnNames: _col0 Statistics: Num rows: 1000 Data size: 87000 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator - aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=309) + aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=316) mode: hash outputColumnNames: _col0, _col1, _col2 Statistics: Num rows: 1 Data size: 552 Basic stats: COMPLETE Column stats: COMPLETE @@ -284,7 +284,7 @@ STAGE PLANS: outputColumnNames: _col0 Statistics: Num rows: 1000 Data size: 87000 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator - aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=309) + aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=316) mode: hash outputColumnNames: _col0, _col1, _col2 Statistics: Num rows: 1 Data size: 552 Basic stats: COMPLETE Column stats: COMPLETE @@ -369,7 +369,7 @@ STAGE PLANS: Execution mode: llap Reduce Operator Tree: Group By Operator - aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, expectedEntries=309) + aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, expectedEntries=316) mode: final 
outputColumnNames: _col0, _col1, _col2 Statistics: Num rows: 1 Data size: 552 Basic stats: COMPLETE Column stats: COMPLETE @@ -430,7 +430,7 @@ STAGE PLANS: Execution mode: llap Reduce Operator Tree: Group By Operator - aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, expectedEntries=309) + aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, expectedEntries=316) mode: final outputColumnNames: _col0, _col1, _col2 Statistics: Num rows: 1 Data size: 552 Basic stats: COMPLETE Column stats: COMPLETE diff --git ql/src/test/results/clientpositive/llap/explainanalyze_2.q.out ql/src/test/results/clientpositive/llap/explainanalyze_2.q.out index 7db3b13..d671d0e 100644 --- ql/src/test/results/clientpositive/llap/explainanalyze_2.q.out +++ ql/src/test/results/clientpositive/llap/explainanalyze_2.q.out @@ -41,134 +41,129 @@ POSTHOOK: type: QUERY Plan optimized by CBO. Vertex dependency in root stage -Map 1 <- Union 2 (CONTAINS) +Map 12 <- Union 10 (CONTAINS) Map 13 <- Union 14 (CONTAINS) Map 16 <- Union 14 (CONTAINS) -Map 8 <- Union 2 (CONTAINS) -Reducer 10 <- Map 9 (SIMPLE_EDGE), Reducer 15 (SIMPLE_EDGE) -Reducer 11 <- Map 17 (SIMPLE_EDGE), Reducer 10 (SIMPLE_EDGE), Union 6 (CONTAINS) +Map 9 <- Union 10 (CONTAINS) +Reducer 11 <- Union 10 (SIMPLE_EDGE) Reducer 15 <- Union 14 (SIMPLE_EDGE) -Reducer 3 <- Union 2 (SIMPLE_EDGE) -Reducer 4 <- Map 9 (SIMPLE_EDGE), Reducer 3 (SIMPLE_EDGE) -Reducer 5 <- Map 12 (SIMPLE_EDGE), Reducer 4 (SIMPLE_EDGE), Union 6 (CONTAINS) -Reducer 7 <- Union 6 (SIMPLE_EDGE) +Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 8 (SIMPLE_EDGE) +Reducer 3 <- Reducer 11 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE), Union 4 (CONTAINS) +Reducer 5 <- Union 4 (SIMPLE_EDGE) +Reducer 6 <- Map 1 (SIMPLE_EDGE), Map 8 (SIMPLE_EDGE) +Reducer 7 <- Reducer 15 (SIMPLE_EDGE), Reducer 6 (SIMPLE_EDGE), Union 4 (CONTAINS) Stage-0 Fetch Operator limit:-1 Stage-1 - Reducer 7 llap + Reducer 5 llap File Output Operator [FS_56] - Group By Operator 
[GBY_54] (rows=32/15 width=177) + Group By Operator [GBY_54] (rows=48/15 width=177) Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 - <-Union 6 [SIMPLE_EDGE] - <-Reducer 11 [CONTAINS] llap + <-Union 4 [SIMPLE_EDGE] + <-Reducer 3 [CONTAINS] llap Reduce Output Operator [RS_53] PartitionCols:_col0, _col1 - Select Operator [SEL_49] (rows=67/61 width=177) + Select Operator [SEL_24] (rows=66/61 width=177) Output:["_col0","_col1"] - Merge Join Operator [MERGEJOIN_82] (rows=67/61 width=177) - Conds:RS_46._col2=RS_47._col0(Inner),Output:["_col1","_col2"] - <-Map 17 [SIMPLE_EDGE] llap - SHUFFLE [RS_47] - PartitionCols:_col0 - Select Operator [SEL_42] (rows=500/500 width=87) - Output:["_col0"] - Filter Operator [FIL_78] (rows=500/500 width=87) - predicate:key is not null - TableScan [TS_40] (rows=500/500 width=87) - default@src,y,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] - <-Reducer 10 [SIMPLE_EDGE] llap - SHUFFLE [RS_46] + Merge Join Operator [MERGEJOIN_79] (rows=66/61 width=177) + Conds:RS_21._col2=RS_22._col1(Inner),Output:["_col1","_col4"] + <-Reducer 11 [SIMPLE_EDGE] llap + SHUFFLE [RS_22] + PartitionCols:_col1 + Select Operator [SEL_17] (rows=525/319 width=178) + Output:["_col1"] + Group By Operator [GBY_16] (rows=525/319 width=178) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 10 [SIMPLE_EDGE] + <-Map 12 [CONTAINS] llap + Reduce Output Operator [RS_15] + PartitionCols:_col1, _col0 + Select Operator [SEL_11] (rows=500/500 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_72] (rows=500/500 width=178) + predicate:value is not null + TableScan [TS_9] (rows=500/500 width=178) + Output:["key","value"] + <-Map 9 [CONTAINS] llap + Reduce Output Operator [RS_15] + PartitionCols:_col1, _col0 + Select Operator [SEL_8] (rows=25/25 width=175) + Output:["_col0","_col1"] + Filter Operator [FIL_71] (rows=25/25 width=175) + predicate:value is not null + TableScan [TS_6] (rows=25/25 width=175) + Output:["key","value"] + <-Reducer 2 [SIMPLE_EDGE] llap + 
SHUFFLE [RS_21] PartitionCols:_col2 - Merge Join Operator [MERGEJOIN_81] (rows=42/52 width=177) - Conds:RS_43._col1=RS_44._col1(Inner),Output:["_col1","_col2"] - <-Map 9 [SIMPLE_EDGE] llap - SHUFFLE [RS_44] - PartitionCols:_col1 - Select Operator [SEL_14] (rows=25/25 width=175) + Merge Join Operator [MERGEJOIN_77] (rows=39/37 width=175) + Conds:RS_18._col0=RS_19._col0(Inner),Output:["_col1","_col2"] + <-Map 1 [SIMPLE_EDGE] llap + SHUFFLE [RS_18] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=500/500 width=87) + Output:["_col0"] + Filter Operator [FIL_69] (rows=500/500 width=87) + predicate:key is not null + TableScan [TS_0] (rows=500/500 width=87) + default@src,y,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] + <-Map 8 [SIMPLE_EDGE] llap + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=25/25 width=175) Output:["_col0","_col1"] - Filter Operator [FIL_73] (rows=25/25 width=175) + Filter Operator [FIL_70] (rows=25/25 width=175) predicate:(key is not null and value is not null) - TableScan [TS_12] (rows=25/25 width=175) + TableScan [TS_3] (rows=25/25 width=175) default@src1,x,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] - <-Reducer 15 [SIMPLE_EDGE] llap - SHUFFLE [RS_43] - PartitionCols:_col1 - Select Operator [SEL_36] (rows=525/319 width=178) - Output:["_col1"] - Group By Operator [GBY_35] (rows=525/319 width=178) - Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 - <-Union 14 [SIMPLE_EDGE] - <-Map 13 [CONTAINS] llap - Reduce Output Operator [RS_34] - PartitionCols:_col1, _col0 - Select Operator [SEL_27] (rows=25/25 width=175) - Output:["_col0","_col1"] - Filter Operator [FIL_75] (rows=25/25 width=175) - predicate:value is not null - TableScan [TS_25] (rows=25/25 width=175) - Output:["key","value"] - <-Map 16 [CONTAINS] llap - Reduce Output Operator [RS_34] - PartitionCols:_col1, _col0 - Select Operator [SEL_30] (rows=500/500 width=178) - Output:["_col0","_col1"] - Filter Operator [FIL_76] (rows=500/500 width=178) - predicate:value is not 
null - TableScan [TS_28] (rows=500/500 width=178) - Output:["key","value"] - <-Reducer 5 [CONTAINS] llap + <-Reducer 7 [CONTAINS] llap Reduce Output Operator [RS_53] PartitionCols:_col0, _col1 - Select Operator [SEL_24] (rows=67/61 width=177) + Select Operator [SEL_49] (rows=66/61 width=177) Output:["_col0","_col1"] - Merge Join Operator [MERGEJOIN_80] (rows=67/61 width=177) - Conds:RS_21._col2=RS_22._col0(Inner),Output:["_col1","_col2"] - <-Map 12 [SIMPLE_EDGE] llap - SHUFFLE [RS_22] - PartitionCols:_col0 - Select Operator [SEL_17] (rows=500/500 width=87) - Output:["_col0"] - Filter Operator [FIL_74] (rows=500/500 width=87) - predicate:key is not null - TableScan [TS_15] (rows=500/500 width=87) - default@src,y,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] - <-Reducer 4 [SIMPLE_EDGE] llap - SHUFFLE [RS_21] + Merge Join Operator [MERGEJOIN_80] (rows=66/61 width=177) + Conds:RS_46._col2=RS_47._col1(Inner),Output:["_col1","_col4"] + <-Reducer 15 [SIMPLE_EDGE] llap + SHUFFLE [RS_47] + PartitionCols:_col1 + Select Operator [SEL_42] (rows=525/319 width=178) + Output:["_col1"] + Group By Operator [GBY_41] (rows=525/319 width=178) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 14 [SIMPLE_EDGE] + <-Map 13 [CONTAINS] llap + Reduce Output Operator [RS_40] + PartitionCols:_col1, _col0 + Select Operator [SEL_33] (rows=25/25 width=175) + Output:["_col0","_col1"] + Filter Operator [FIL_75] (rows=25/25 width=175) + predicate:value is not null + TableScan [TS_31] (rows=25/25 width=175) + Output:["key","value"] + <-Map 16 [CONTAINS] llap + Reduce Output Operator [RS_40] + PartitionCols:_col1, _col0 + Select Operator [SEL_36] (rows=500/500 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_76] (rows=500/500 width=178) + predicate:value is not null + TableScan [TS_34] (rows=500/500 width=178) + Output:["key","value"] + <-Reducer 6 [SIMPLE_EDGE] llap + SHUFFLE [RS_46] PartitionCols:_col2 - Merge Join Operator [MERGEJOIN_79] (rows=42/52 width=177) - 
Conds:RS_18._col1=RS_19._col1(Inner),Output:["_col1","_col2"] - <-Map 9 [SIMPLE_EDGE] llap - SHUFFLE [RS_19] - PartitionCols:_col1 - Please refer to the previous Select Operator [SEL_14] - <-Reducer 3 [SIMPLE_EDGE] llap - SHUFFLE [RS_18] - PartitionCols:_col1 - Select Operator [SEL_11] (rows=525/319 width=178) - Output:["_col1"] - Group By Operator [GBY_10] (rows=525/319 width=178) - Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 - <-Union 2 [SIMPLE_EDGE] - <-Map 1 [CONTAINS] llap - Reduce Output Operator [RS_9] - PartitionCols:_col1, _col0 - Select Operator [SEL_2] (rows=25/25 width=175) - Output:["_col0","_col1"] - Filter Operator [FIL_71] (rows=25/25 width=175) - predicate:value is not null - TableScan [TS_0] (rows=25/25 width=175) - Output:["key","value"] - <-Map 8 [CONTAINS] llap - Reduce Output Operator [RS_9] - PartitionCols:_col1, _col0 - Select Operator [SEL_5] (rows=500/500 width=178) - Output:["_col0","_col1"] - Filter Operator [FIL_72] (rows=500/500 width=178) - predicate:value is not null - TableScan [TS_3] (rows=500/500 width=178) - Output:["key","value"] + Merge Join Operator [MERGEJOIN_78] (rows=39/37 width=175) + Conds:RS_43._col0=RS_44._col0(Inner),Output:["_col1","_col2"] + <-Map 1 [SIMPLE_EDGE] llap + SHUFFLE [RS_43] + PartitionCols:_col0 + Please refer to the previous Select Operator [SEL_2] + <-Map 8 [SIMPLE_EDGE] llap + SHUFFLE [RS_44] + PartitionCols:_col0 + Please refer to the previous Select Operator [SEL_5] PREHOOK: query: SELECT x.key, y.value FROM src1 x JOIN src y ON (x.key = y.key) @@ -229,249 +224,244 @@ POSTHOOK: type: QUERY Plan optimized by CBO. 
Vertex dependency in root stage -Map 1 <- Union 2 (CONTAINS) -Map 10 <- Union 2 (CONTAINS) +Map 13 <- Union 14 (CONTAINS) +Map 16 <- Union 14 (CONTAINS) Map 17 <- Union 18 (CONTAINS) Map 22 <- Union 18 (CONTAINS) Map 23 <- Union 20 (CONTAINS) -Map 25 <- Union 26 (CONTAINS) -Map 32 <- Union 26 (CONTAINS) -Map 33 <- Union 28 (CONTAINS) -Map 34 <- Union 30 (CONTAINS) -Reducer 12 <- Map 11 (SIMPLE_EDGE), Reducer 21 (SIMPLE_EDGE) -Reducer 13 <- Map 24 (SIMPLE_EDGE), Reducer 12 (SIMPLE_EDGE), Union 6 (CONTAINS) -Reducer 14 <- Map 11 (SIMPLE_EDGE), Reducer 31 (SIMPLE_EDGE) -Reducer 15 <- Map 16 (SIMPLE_EDGE), Reducer 14 (SIMPLE_EDGE), Union 8 (CONTAINS) +Map 24 <- Union 25 (CONTAINS) +Map 31 <- Union 25 (CONTAINS) +Map 32 <- Union 27 (CONTAINS) +Map 33 <- Union 29 (CONTAINS) +Reducer 10 <- Map 1 (SIMPLE_EDGE), Map 12 (SIMPLE_EDGE) +Reducer 11 <- Reducer 10 (SIMPLE_EDGE), Reducer 30 (SIMPLE_EDGE), Union 6 (CONTAINS) +Reducer 15 <- Union 14 (SIMPLE_EDGE) Reducer 19 <- Union 18 (SIMPLE_EDGE), Union 20 (CONTAINS) +Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 12 (SIMPLE_EDGE) Reducer 21 <- Union 20 (SIMPLE_EDGE) -Reducer 27 <- Union 26 (SIMPLE_EDGE), Union 28 (CONTAINS) -Reducer 29 <- Union 28 (SIMPLE_EDGE), Union 30 (CONTAINS) -Reducer 3 <- Union 2 (SIMPLE_EDGE) -Reducer 31 <- Union 30 (SIMPLE_EDGE) -Reducer 4 <- Map 11 (SIMPLE_EDGE), Reducer 3 (SIMPLE_EDGE) -Reducer 5 <- Map 16 (SIMPLE_EDGE), Reducer 4 (SIMPLE_EDGE), Union 6 (CONTAINS) -Reducer 7 <- Union 6 (SIMPLE_EDGE), Union 8 (CONTAINS) -Reducer 9 <- Union 8 (SIMPLE_EDGE) +Reducer 26 <- Union 25 (SIMPLE_EDGE), Union 27 (CONTAINS) +Reducer 28 <- Union 27 (SIMPLE_EDGE), Union 29 (CONTAINS) +Reducer 3 <- Reducer 15 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE), Union 4 (CONTAINS) +Reducer 30 <- Union 29 (SIMPLE_EDGE) +Reducer 5 <- Union 4 (SIMPLE_EDGE), Union 6 (CONTAINS) +Reducer 7 <- Union 6 (SIMPLE_EDGE) +Reducer 8 <- Map 1 (SIMPLE_EDGE), Map 12 (SIMPLE_EDGE) +Reducer 9 <- Reducer 21 (SIMPLE_EDGE), Reducer 8 (SIMPLE_EDGE), Union 4 
(CONTAINS) Stage-0 Fetch Operator limit:-1 Stage-1 - Reducer 9 llap + Reducer 7 llap File Output Operator [FS_114] - Group By Operator [GBY_112] (rows=398/15 width=177) + Group By Operator [GBY_112] (rows=384/15 width=177) Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 - <-Union 8 [SIMPLE_EDGE] - <-Reducer 15 [CONTAINS] llap + <-Union 6 [SIMPLE_EDGE] + <-Reducer 11 [CONTAINS] llap Reduce Output Operator [RS_111] PartitionCols:_col0, _col1 - Select Operator [SEL_107] (rows=199/61 width=177) + Select Operator [SEL_107] (rows=193/61 width=177) Output:["_col0","_col1"] - Merge Join Operator [MERGEJOIN_162] (rows=199/61 width=177) - Conds:RS_104._col2=RS_105._col0(Inner),Output:["_col2","_col5"] - <-Map 16 [SIMPLE_EDGE] llap - SHUFFLE [RS_105] - PartitionCols:_col0 - Select Operator [SEL_17] (rows=500/500 width=178) - Output:["_col0","_col1"] - Filter Operator [FIL_145] (rows=500/500 width=178) - predicate:key is not null - TableScan [TS_15] (rows=500/500 width=178) - default@src,y,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] - <-Reducer 14 [SIMPLE_EDGE] llap + Merge Join Operator [MERGEJOIN_156] (rows=193/61 width=177) + Conds:RS_104._col3=RS_105._col1(Inner),Output:["_col1","_col2"] + <-Reducer 10 [SIMPLE_EDGE] llap SHUFFLE [RS_104] - PartitionCols:_col2 - Merge Join Operator [MERGEJOIN_161] (rows=123/52 width=86) - Conds:RS_101._col1=RS_102._col1(Inner),Output:["_col2"] - <-Map 11 [SIMPLE_EDGE] llap + PartitionCols:_col3 + Merge Join Operator [MERGEJOIN_153] (rows=39/37 width=266) + Conds:RS_101._col0=RS_102._col0(Inner),Output:["_col1","_col2","_col3"] + <-Map 1 [SIMPLE_EDGE] llap + SHUFFLE [RS_101] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=500/500 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_136] (rows=500/500 width=178) + predicate:key is not null + TableScan [TS_0] (rows=500/500 width=178) + default@src,y,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] + <-Map 12 [SIMPLE_EDGE] llap SHUFFLE [RS_102] - PartitionCols:_col1 - 
Select Operator [SEL_14] (rows=25/25 width=175) + PartitionCols:_col0 + Select Operator [SEL_5] (rows=25/25 width=175) Output:["_col0","_col1"] - Filter Operator [FIL_144] (rows=25/25 width=175) + Filter Operator [FIL_137] (rows=25/25 width=175) predicate:(key is not null and value is not null) - TableScan [TS_12] (rows=25/25 width=175) + TableScan [TS_3] (rows=25/25 width=175) default@src1,x,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] - <-Reducer 31 [SIMPLE_EDGE] llap - SHUFFLE [RS_101] - PartitionCols:_col1 - Select Operator [SEL_94] (rows=1525/319 width=178) - Output:["_col1"] - Group By Operator [GBY_93] (rows=1525/319 width=178) - Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 - <-Union 30 [SIMPLE_EDGE] - <-Map 34 [CONTAINS] llap - Reduce Output Operator [RS_92] - PartitionCols:_col1, _col0 - Select Operator [SEL_88] (rows=500/500 width=178) - Output:["_col0","_col1"] - Filter Operator [FIL_154] (rows=500/500 width=178) - predicate:value is not null - TableScan [TS_86] (rows=500/500 width=178) - Output:["key","value"] - <-Reducer 29 [CONTAINS] llap - Reduce Output Operator [RS_92] - PartitionCols:_col1, _col0 - Select Operator [SEL_85] (rows=1025/319 width=178) - Output:["_col0","_col1"] - Group By Operator [GBY_84] (rows=1025/319 width=178) - Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 - <-Union 28 [SIMPLE_EDGE] - <-Map 33 [CONTAINS] llap - Reduce Output Operator [RS_83] - PartitionCols:_col1, _col0 - Select Operator [SEL_79] (rows=500/500 width=178) - Output:["_col0","_col1"] - Filter Operator [FIL_153] (rows=500/500 width=178) - predicate:value is not null - TableScan [TS_77] (rows=500/500 width=178) - Output:["key","value"] - <-Reducer 27 [CONTAINS] llap - Reduce Output Operator [RS_83] - PartitionCols:_col1, _col0 - Select Operator [SEL_76] (rows=525/319 width=178) - Output:["_col0","_col1"] - Group By Operator [GBY_75] (rows=525/319 width=178) - Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 - <-Union 26 [SIMPLE_EDGE] - <-Map 25 
[CONTAINS] llap - Reduce Output Operator [RS_74] - PartitionCols:_col1, _col0 - Select Operator [SEL_67] (rows=25/25 width=175) - Output:["_col0","_col1"] - Filter Operator [FIL_151] (rows=25/25 width=175) - predicate:value is not null - TableScan [TS_65] (rows=25/25 width=175) - Output:["key","value"] - <-Map 32 [CONTAINS] llap - Reduce Output Operator [RS_74] - PartitionCols:_col1, _col0 - Select Operator [SEL_70] (rows=500/500 width=178) - Output:["_col0","_col1"] - Filter Operator [FIL_152] (rows=500/500 width=178) - predicate:value is not null - TableScan [TS_68] (rows=500/500 width=178) - Output:["key","value"] - <-Reducer 7 [CONTAINS] llap + <-Reducer 30 [SIMPLE_EDGE] llap + SHUFFLE [RS_105] + PartitionCols:_col1 + Select Operator [SEL_100] (rows=1525/319 width=178) + Output:["_col1"] + Group By Operator [GBY_99] (rows=1525/319 width=178) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 29 [SIMPLE_EDGE] + <-Map 33 [CONTAINS] llap + Reduce Output Operator [RS_98] + PartitionCols:_col1, _col0 + Select Operator [SEL_94] (rows=500/500 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_150] (rows=500/500 width=178) + predicate:value is not null + TableScan [TS_92] (rows=500/500 width=178) + Output:["key","value"] + <-Reducer 28 [CONTAINS] llap + Reduce Output Operator [RS_98] + PartitionCols:_col1, _col0 + Select Operator [SEL_91] (rows=1025/319 width=178) + Output:["_col0","_col1"] + Group By Operator [GBY_90] (rows=1025/319 width=178) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 27 [SIMPLE_EDGE] + <-Map 32 [CONTAINS] llap + Reduce Output Operator [RS_89] + PartitionCols:_col1, _col0 + Select Operator [SEL_85] (rows=500/500 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_149] (rows=500/500 width=178) + predicate:value is not null + TableScan [TS_83] (rows=500/500 width=178) + Output:["key","value"] + <-Reducer 26 [CONTAINS] llap + Reduce Output Operator [RS_89] + PartitionCols:_col1, _col0 + Select Operator 
[SEL_82] (rows=525/319 width=178) + Output:["_col0","_col1"] + Group By Operator [GBY_81] (rows=525/319 width=178) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 25 [SIMPLE_EDGE] + <-Map 24 [CONTAINS] llap + Reduce Output Operator [RS_80] + PartitionCols:_col1, _col0 + Select Operator [SEL_73] (rows=25/25 width=175) + Output:["_col0","_col1"] + Filter Operator [FIL_147] (rows=25/25 width=175) + predicate:value is not null + TableScan [TS_71] (rows=25/25 width=175) + Output:["key","value"] + <-Map 31 [CONTAINS] llap + Reduce Output Operator [RS_80] + PartitionCols:_col1, _col0 + Select Operator [SEL_76] (rows=500/500 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_148] (rows=500/500 width=178) + predicate:value is not null + TableScan [TS_74] (rows=500/500 width=178) + Output:["key","value"] + <-Reducer 5 [CONTAINS] llap Reduce Output Operator [RS_111] PartitionCols:_col0, _col1 - Group By Operator [GBY_63] (rows=199/15 width=177) + Group By Operator [GBY_63] (rows=196/15 width=177) Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 - <-Union 6 [SIMPLE_EDGE] - <-Reducer 13 [CONTAINS] llap - Reduce Output Operator [RS_62] - PartitionCols:_col0, _col1 - Select Operator [SEL_58] (rows=132/61 width=177) - Output:["_col0","_col1"] - Merge Join Operator [MERGEJOIN_160] (rows=132/61 width=177) - Conds:RS_55._col2=RS_56._col0(Inner),Output:["_col2","_col5"] - <-Map 24 [SIMPLE_EDGE] llap - SHUFFLE [RS_56] - PartitionCols:_col0 - Select Operator [SEL_51] (rows=500/500 width=178) - Output:["_col0","_col1"] - Filter Operator [FIL_150] (rows=500/500 width=178) - predicate:key is not null - TableScan [TS_49] (rows=500/500 width=178) - default@src,y,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] - <-Reducer 12 [SIMPLE_EDGE] llap - SHUFFLE [RS_55] - PartitionCols:_col2 - Merge Join Operator [MERGEJOIN_159] (rows=82/52 width=86) - Conds:RS_52._col1=RS_53._col1(Inner),Output:["_col2"] - <-Map 11 [SIMPLE_EDGE] llap - SHUFFLE [RS_53] - PartitionCols:_col1 
- Please refer to the previous Select Operator [SEL_14] - <-Reducer 21 [SIMPLE_EDGE] llap - SHUFFLE [RS_52] - PartitionCols:_col1 - Select Operator [SEL_45] (rows=1025/319 width=178) - Output:["_col1"] - Group By Operator [GBY_44] (rows=1025/319 width=178) - Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 - <-Union 20 [SIMPLE_EDGE] - <-Map 23 [CONTAINS] llap - Reduce Output Operator [RS_43] - PartitionCols:_col1, _col0 - Select Operator [SEL_39] (rows=500/500 width=178) - Output:["_col0","_col1"] - Filter Operator [FIL_148] (rows=500/500 width=178) - predicate:value is not null - TableScan [TS_37] (rows=500/500 width=178) - Output:["key","value"] - <-Reducer 19 [CONTAINS] llap - Reduce Output Operator [RS_43] - PartitionCols:_col1, _col0 - Select Operator [SEL_36] (rows=525/319 width=178) - Output:["_col0","_col1"] - Group By Operator [GBY_35] (rows=525/319 width=178) - Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 - <-Union 18 [SIMPLE_EDGE] - <-Map 17 [CONTAINS] llap - Reduce Output Operator [RS_34] - PartitionCols:_col1, _col0 - Select Operator [SEL_27] (rows=25/25 width=175) - Output:["_col0","_col1"] - Filter Operator [FIL_146] (rows=25/25 width=175) - predicate:value is not null - TableScan [TS_25] (rows=25/25 width=175) - Output:["key","value"] - <-Map 22 [CONTAINS] llap - Reduce Output Operator [RS_34] - PartitionCols:_col1, _col0 - Select Operator [SEL_30] (rows=500/500 width=178) - Output:["_col0","_col1"] - Filter Operator [FIL_147] (rows=500/500 width=178) - predicate:value is not null - TableScan [TS_28] (rows=500/500 width=178) - Output:["key","value"] - <-Reducer 5 [CONTAINS] llap + <-Union 4 [SIMPLE_EDGE] + <-Reducer 3 [CONTAINS] llap Reduce Output Operator [RS_62] PartitionCols:_col0, _col1 - Select Operator [SEL_24] (rows=67/61 width=177) + Select Operator [SEL_24] (rows=66/61 width=177) Output:["_col0","_col1"] - Merge Join Operator [MERGEJOIN_158] (rows=67/61 width=177) - Conds:RS_21._col2=RS_22._col0(Inner),Output:["_col2","_col5"] - 
<-Map 16 [SIMPLE_EDGE] llap + Merge Join Operator [MERGEJOIN_154] (rows=66/61 width=177) + Conds:RS_21._col3=RS_22._col1(Inner),Output:["_col1","_col2"] + <-Reducer 15 [SIMPLE_EDGE] llap SHUFFLE [RS_22] - PartitionCols:_col0 - Please refer to the previous Select Operator [SEL_17] - <-Reducer 4 [SIMPLE_EDGE] llap + PartitionCols:_col1 + Select Operator [SEL_17] (rows=525/319 width=178) + Output:["_col1"] + Group By Operator [GBY_16] (rows=525/319 width=178) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 14 [SIMPLE_EDGE] + <-Map 13 [CONTAINS] llap + Reduce Output Operator [RS_15] + PartitionCols:_col1, _col0 + Select Operator [SEL_8] (rows=25/25 width=175) + Output:["_col0","_col1"] + Filter Operator [FIL_138] (rows=25/25 width=175) + predicate:value is not null + TableScan [TS_6] (rows=25/25 width=175) + Output:["key","value"] + <-Map 16 [CONTAINS] llap + Reduce Output Operator [RS_15] + PartitionCols:_col1, _col0 + Select Operator [SEL_11] (rows=500/500 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_139] (rows=500/500 width=178) + predicate:value is not null + TableScan [TS_9] (rows=500/500 width=178) + Output:["key","value"] + <-Reducer 2 [SIMPLE_EDGE] llap SHUFFLE [RS_21] - PartitionCols:_col2 - Merge Join Operator [MERGEJOIN_157] (rows=42/52 width=86) - Conds:RS_18._col1=RS_19._col1(Inner),Output:["_col2"] - <-Map 11 [SIMPLE_EDGE] llap - SHUFFLE [RS_19] - PartitionCols:_col1 - Please refer to the previous Select Operator [SEL_14] - <-Reducer 3 [SIMPLE_EDGE] llap + PartitionCols:_col3 + Merge Join Operator [MERGEJOIN_151] (rows=39/37 width=266) + Conds:RS_18._col0=RS_19._col0(Inner),Output:["_col1","_col2","_col3"] + <-Map 1 [SIMPLE_EDGE] llap SHUFFLE [RS_18] - PartitionCols:_col1 - Select Operator [SEL_11] (rows=525/319 width=178) - Output:["_col1"] - Group By Operator [GBY_10] (rows=525/319 width=178) - Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 - <-Union 2 [SIMPLE_EDGE] - <-Map 1 [CONTAINS] llap - Reduce Output Operator 
[RS_9] - PartitionCols:_col1, _col0 - Select Operator [SEL_2] (rows=25/25 width=175) - Output:["_col0","_col1"] - Filter Operator [FIL_142] (rows=25/25 width=175) - predicate:value is not null - TableScan [TS_0] (rows=25/25 width=175) - Output:["key","value"] - <-Map 10 [CONTAINS] llap - Reduce Output Operator [RS_9] - PartitionCols:_col1, _col0 - Select Operator [SEL_5] (rows=500/500 width=178) - Output:["_col0","_col1"] - Filter Operator [FIL_143] (rows=500/500 width=178) - predicate:value is not null - TableScan [TS_3] (rows=500/500 width=178) - Output:["key","value"] + PartitionCols:_col0 + Please refer to the previous Select Operator [SEL_2] + <-Map 12 [SIMPLE_EDGE] llap + SHUFFLE [RS_19] + PartitionCols:_col0 + Please refer to the previous Select Operator [SEL_5] + <-Reducer 9 [CONTAINS] llap + Reduce Output Operator [RS_62] + PartitionCols:_col0, _col1 + Select Operator [SEL_58] (rows=130/61 width=177) + Output:["_col0","_col1"] + Merge Join Operator [MERGEJOIN_155] (rows=130/61 width=177) + Conds:RS_55._col3=RS_56._col1(Inner),Output:["_col1","_col2"] + <-Reducer 21 [SIMPLE_EDGE] llap + SHUFFLE [RS_56] + PartitionCols:_col1 + Select Operator [SEL_51] (rows=1025/319 width=178) + Output:["_col1"] + Group By Operator [GBY_50] (rows=1025/319 width=178) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 20 [SIMPLE_EDGE] + <-Map 23 [CONTAINS] llap + Reduce Output Operator [RS_49] + PartitionCols:_col1, _col0 + Select Operator [SEL_45] (rows=500/500 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_144] (rows=500/500 width=178) + predicate:value is not null + TableScan [TS_43] (rows=500/500 width=178) + Output:["key","value"] + <-Reducer 19 [CONTAINS] llap + Reduce Output Operator [RS_49] + PartitionCols:_col1, _col0 + Select Operator [SEL_42] (rows=525/319 width=178) + Output:["_col0","_col1"] + Group By Operator [GBY_41] (rows=525/319 width=178) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 18 [SIMPLE_EDGE] + <-Map 17 
[CONTAINS] llap + Reduce Output Operator [RS_40] + PartitionCols:_col1, _col0 + Select Operator [SEL_33] (rows=25/25 width=175) + Output:["_col0","_col1"] + Filter Operator [FIL_142] (rows=25/25 width=175) + predicate:value is not null + TableScan [TS_31] (rows=25/25 width=175) + Output:["key","value"] + <-Map 22 [CONTAINS] llap + Reduce Output Operator [RS_40] + PartitionCols:_col1, _col0 + Select Operator [SEL_36] (rows=500/500 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_143] (rows=500/500 width=178) + predicate:value is not null + TableScan [TS_34] (rows=500/500 width=178) + Output:["key","value"] + <-Reducer 8 [SIMPLE_EDGE] llap + SHUFFLE [RS_55] + PartitionCols:_col3 + Merge Join Operator [MERGEJOIN_152] (rows=39/37 width=266) + Conds:RS_52._col0=RS_53._col0(Inner),Output:["_col1","_col2","_col3"] + <-Map 1 [SIMPLE_EDGE] llap + SHUFFLE [RS_52] + PartitionCols:_col0 + Please refer to the previous Select Operator [SEL_2] + <-Map 12 [SIMPLE_EDGE] llap + SHUFFLE [RS_53] + PartitionCols:_col0 + Please refer to the previous Select Operator [SEL_5] PREHOOK: query: CREATE TABLE srcbucket_mapjoin(key int, value string) partitioned by (ds string) CLUSTERED BY (key) INTO 2 BUCKETS STORED AS TEXTFILE PREHOOK: type: CREATETABLE @@ -629,20 +619,20 @@ Stage-0 Stage-1 Map 1 llap File Output Operator [FS_10] - Merge Join Operator [MERGEJOIN_15] (rows=253/480 width=190) + Merge Join Operator [MERGEJOIN_15] (rows=382/480 width=95) Conds:SEL_2._col0=SEL_5._col0(Inner),Output:["_col0","_col1"] - <-Select Operator [SEL_5] (rows=230/242 width=14) + <-Select Operator [SEL_5] (rows=242/242 width=4) Output:["_col0"] - Filter Operator [FIL_14] (rows=230/242 width=14) + Filter Operator [FIL_14] (rows=242/242 width=4) predicate:key is not null - TableScan [TS_3] (rows=242/242 width=14) - default@tab,s3,Tbl:COMPLETE,Col:NONE,Output:["key"] - <-Select Operator [SEL_2] (rows=230/242 width=190) + TableScan [TS_3] (rows=242/242 width=4) + 
default@tab,s3,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] + <-Select Operator [SEL_2] (rows=242/242 width=95) Output:["_col0","_col1"] - Filter Operator [FIL_13] (rows=230/242 width=190) + Filter Operator [FIL_13] (rows=242/242 width=95) predicate:key is not null - TableScan [TS_0] (rows=242/242 width=190) - default@tab,s1,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + TableScan [TS_0] (rows=242/242 width=95) + default@tab,s1,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] PREHOOK: query: select s1.key as key, s1.value as value from tab s1 join tab s3 on s1.key=s3.key join tab s2 on s1.value=s2.value PREHOOK: type: QUERY @@ -671,36 +661,34 @@ Stage-0 Stage-1 Reducer 2 llap File Output Operator [FS_16] - Select Operator [SEL_15] (rows=278/1166 width=3) - Output:["_col0","_col1"] - Merge Join Operator [MERGEJOIN_27] (rows=278/1166 width=3) - Conds:RS_12._col2=RS_13._col1(Inner),Output:["_col1","_col2"] - <-Map 1 [SIMPLE_EDGE] llap - SHUFFLE [RS_12] - PartitionCols:_col2 - Merge Join Operator [MERGEJOIN_25] (rows=253/480 width=3) - Conds:SEL_2._col0=SEL_5._col0(Inner),Output:["_col1","_col2"] - <-Select Operator [SEL_5] (rows=218/242 width=179) - Output:["_col0","_col1"] - Filter Operator [FIL_23] (rows=218/242 width=179) - predicate:(key is not null and value is not null) - TableScan [TS_3] (rows=242/242 width=179) - default@tab,s1,Tbl:COMPLETE,Col:NONE,Output:["key","value"] - <-Select Operator [SEL_2] (rows=230/242 width=3) - Output:["_col0"] - Filter Operator [FIL_22] (rows=230/242 width=3) - predicate:key is not null - TableScan [TS_0] (rows=242/242 width=3) - default@tab,s3,Tbl:COMPLETE,Col:NONE,Output:["key"] - <-Map 4 [SIMPLE_EDGE] llap - SHUFFLE [RS_13] - PartitionCols:_col1 - Select Operator [SEL_8] (rows=230/242 width=175) - Output:["_col1"] - Filter Operator [FIL_24] (rows=230/242 width=175) - predicate:value is not null - TableScan [TS_6] (rows=242/242 width=175) - default@tab,s2,Tbl:COMPLETE,Col:NONE,Output:["value"] + Merge Join Operator [MERGEJOIN_27] 
(rows=604/1166 width=95) + Conds:RS_12._col1=RS_13._col1(Inner),Output:["_col0","_col1"] + <-Map 1 [SIMPLE_EDGE] llap + SHUFFLE [RS_12] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_25] (rows=382/480 width=95) + Conds:SEL_2._col0=SEL_5._col0(Inner),Output:["_col0","_col1"] + <-Select Operator [SEL_5] (rows=242/242 width=4) + Output:["_col0"] + Filter Operator [FIL_23] (rows=242/242 width=4) + predicate:key is not null + TableScan [TS_3] (rows=242/242 width=4) + default@tab,s3,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] + <-Select Operator [SEL_2] (rows=242/242 width=95) + Output:["_col0","_col1"] + Filter Operator [FIL_22] (rows=242/242 width=95) + predicate:(key is not null and value is not null) + TableScan [TS_0] (rows=242/242 width=95) + default@tab,s1,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] + <-Map 4 [SIMPLE_EDGE] llap + SHUFFLE [RS_13] + PartitionCols:_col1 + Select Operator [SEL_8] (rows=242/242 width=91) + Output:["_col1"] + Filter Operator [FIL_24] (rows=242/242 width=91) + predicate:value is not null + TableScan [TS_6] (rows=242/242 width=91) + default@tab,s2,Tbl:COMPLETE,Col:COMPLETE,Output:["value"] PREHOOK: query: select s1.key as key, s1.value as value from tab s1 join tab2 s3 on s1.key=s3.key PREHOOK: type: QUERY @@ -730,20 +718,20 @@ Stage-0 Stage-1 Map 1 llap File Output Operator [FS_10] - Merge Join Operator [MERGEJOIN_15] (rows=253/480 width=190) + Merge Join Operator [MERGEJOIN_15] (rows=382/480 width=95) Conds:SEL_2._col0=SEL_5._col0(Inner),Output:["_col0","_col1"] - <-Select Operator [SEL_5] (rows=230/242 width=14) + <-Select Operator [SEL_5] (rows=242/242 width=4) Output:["_col0"] - Filter Operator [FIL_14] (rows=230/242 width=14) + Filter Operator [FIL_14] (rows=242/242 width=4) predicate:key is not null - TableScan [TS_3] (rows=242/242 width=14) - default@tab2,s3,Tbl:COMPLETE,Col:NONE,Output:["key"] - <-Select Operator [SEL_2] (rows=230/242 width=190) + TableScan [TS_3] (rows=242/242 width=4) + 
default@tab2,s3,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] + <-Select Operator [SEL_2] (rows=242/242 width=95) Output:["_col0","_col1"] - Filter Operator [FIL_13] (rows=230/242 width=190) + Filter Operator [FIL_13] (rows=242/242 width=95) predicate:key is not null - TableScan [TS_0] (rows=242/242 width=190) - default@tab,s1,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + TableScan [TS_0] (rows=242/242 width=95) + default@tab,s1,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] PREHOOK: query: select s1.key as key, s1.value as value from tab s1 join tab2 s3 on s1.key=s3.key join tab2 s2 on s1.value=s2.value PREHOOK: type: QUERY @@ -776,36 +764,34 @@ Stage-0 Stage-1 Reducer 2 llap File Output Operator [FS_16] - Select Operator [SEL_15] (rows=278/1166 width=3) - Output:["_col0","_col1"] - Merge Join Operator [MERGEJOIN_27] (rows=278/1166 width=3) - Conds:RS_12._col2=RS_13._col1(Inner),Output:["_col1","_col2"] - <-Map 1 [SIMPLE_EDGE] llap - SHUFFLE [RS_12] - PartitionCols:_col2 - Merge Join Operator [MERGEJOIN_25] (rows=253/480 width=3) - Conds:SEL_2._col0=SEL_5._col0(Inner),Output:["_col1","_col2"] - <-Select Operator [SEL_5] (rows=218/242 width=179) - Output:["_col0","_col1"] - Filter Operator [FIL_23] (rows=218/242 width=179) - predicate:(key is not null and value is not null) - TableScan [TS_3] (rows=242/242 width=179) - default@tab,s1,Tbl:COMPLETE,Col:NONE,Output:["key","value"] - <-Select Operator [SEL_2] (rows=230/242 width=3) - Output:["_col0"] - Filter Operator [FIL_22] (rows=230/242 width=3) - predicate:key is not null - TableScan [TS_0] (rows=242/242 width=3) - default@tab2,s3,Tbl:COMPLETE,Col:NONE,Output:["key"] - <-Map 4 [SIMPLE_EDGE] llap - SHUFFLE [RS_13] - PartitionCols:_col1 - Select Operator [SEL_8] (rows=230/242 width=175) - Output:["_col1"] - Filter Operator [FIL_24] (rows=230/242 width=175) - predicate:value is not null - TableScan [TS_6] (rows=242/242 width=175) - default@tab2,s2,Tbl:COMPLETE,Col:NONE,Output:["value"] + Merge Join Operator 
[MERGEJOIN_27] (rows=604/1166 width=95) + Conds:RS_12._col1=RS_13._col1(Inner),Output:["_col0","_col1"] + <-Map 1 [SIMPLE_EDGE] llap + SHUFFLE [RS_12] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_25] (rows=382/480 width=95) + Conds:SEL_2._col0=SEL_5._col0(Inner),Output:["_col0","_col1"] + <-Select Operator [SEL_5] (rows=242/242 width=4) + Output:["_col0"] + Filter Operator [FIL_23] (rows=242/242 width=4) + predicate:key is not null + TableScan [TS_3] (rows=242/242 width=4) + default@tab2,s3,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] + <-Select Operator [SEL_2] (rows=242/242 width=95) + Output:["_col0","_col1"] + Filter Operator [FIL_22] (rows=242/242 width=95) + predicate:(key is not null and value is not null) + TableScan [TS_0] (rows=242/242 width=95) + default@tab,s1,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] + <-Map 4 [SIMPLE_EDGE] llap + SHUFFLE [RS_13] + PartitionCols:_col1 + Select Operator [SEL_8] (rows=242/242 width=91) + Output:["_col1"] + Filter Operator [FIL_24] (rows=242/242 width=91) + predicate:value is not null + TableScan [TS_6] (rows=242/242 width=91) + default@tab2,s2,Tbl:COMPLETE,Col:COMPLETE,Output:["value"] PREHOOK: query: select count(*) from (select s1.key as key, s1.value as value from tab s1 join tab s3 on s1.key=s3.key UNION ALL @@ -857,43 +843,43 @@ Stage-0 Output:["_col0"],aggregations:["count()"] <-Reducer 3 [CUSTOM_SIMPLE_EDGE] llap PARTITION_ONLY_SHUFFLE [RS_22] - Merge Join Operator [MERGEJOIN_38] (rows=531/1646 width=3) + Merge Join Operator [MERGEJOIN_38] (rows=1029/1646 width=8) Conds:Union 2._col0=RS_19._col0(Inner) <-Map 7 [SIMPLE_EDGE] llap SHUFFLE [RS_19] PartitionCols:_col0 - Select Operator [SEL_17] (rows=475/500 width=3) + Select Operator [SEL_17] (rows=500/500 width=4) Output:["_col0"] - Filter Operator [FIL_35] (rows=475/500 width=3) + Filter Operator [FIL_35] (rows=500/500 width=4) predicate:key is not null - TableScan [TS_15] (rows=500/500 width=3) - default@tab_part,b,Tbl:COMPLETE,Col:NONE,Output:["key"] 
+ TableScan [TS_15] (rows=500/500 width=4) + default@tab_part,b,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] <-Union 2 [SIMPLE_EDGE] <-Map 1 [CONTAINS] llap Reduce Output Operator [RS_18] PartitionCols:_col0 - Merge Join Operator [MERGEJOIN_36] (rows=253/480 width=3) + Merge Join Operator [MERGEJOIN_36] (rows=382/480 width=4) Conds:SEL_2._col0=SEL_5._col0(Inner),Output:["_col0"] - <-Select Operator [SEL_5] (rows=230/242 width=3) + <-Select Operator [SEL_5] (rows=242/242 width=4) Output:["_col0"] - Filter Operator [FIL_33] (rows=230/242 width=3) + Filter Operator [FIL_33] (rows=242/242 width=4) predicate:key is not null - TableScan [TS_3] (rows=242/242 width=3) - default@tab,s3,Tbl:COMPLETE,Col:NONE,Output:["key"] - <-Select Operator [SEL_2] (rows=230/242 width=3) + TableScan [TS_3] (rows=242/242 width=4) + default@tab,s3,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] + <-Select Operator [SEL_2] (rows=242/242 width=4) Output:["_col0"] - Filter Operator [FIL_32] (rows=230/242 width=3) + Filter Operator [FIL_32] (rows=242/242 width=4) predicate:key is not null - TableScan [TS_0] (rows=242/242 width=3) + TableScan [TS_0] (rows=242/242 width=4) Output:["key"] <-Map 6 [CONTAINS] llap Reduce Output Operator [RS_18] PartitionCols:_col0 - Select Operator [SEL_12] (rows=230/242 width=3) + Select Operator [SEL_12] (rows=242/242 width=4) Output:["_col0"] - Filter Operator [FIL_34] (rows=230/242 width=3) + Filter Operator [FIL_34] (rows=242/242 width=4) predicate:key is not null - TableScan [TS_10] (rows=242/242 width=3) + TableScan [TS_10] (rows=242/242 width=4) Output:["key"] PREHOOK: query: select count(*) from (select s1.key as key, s1.value as value from tab s1 join tab s3 on s1.key=s3.key join tab s2 on s1.value=s2.value @@ -946,60 +932,58 @@ Stage-0 Output:["_col0"],aggregations:["count()"] <-Reducer 4 [CUSTOM_SIMPLE_EDGE] llap PARTITION_ONLY_SHUFFLE [RS_28] - Merge Join Operator [MERGEJOIN_50] (rows=558/3768 width=3) + Merge Join Operator [MERGEJOIN_50] (rows=1396/3768 width=8) 
Conds:Union 3._col0=RS_25._col0(Inner) <-Map 9 [SIMPLE_EDGE] llap SHUFFLE [RS_25] PartitionCols:_col0 - Select Operator [SEL_23] (rows=475/500 width=3) + Select Operator [SEL_23] (rows=500/500 width=4) Output:["_col0"] - Filter Operator [FIL_46] (rows=475/500 width=3) + Filter Operator [FIL_46] (rows=500/500 width=4) predicate:key is not null - TableScan [TS_21] (rows=500/500 width=3) - default@tab_part,b,Tbl:COMPLETE,Col:NONE,Output:["key"] + TableScan [TS_21] (rows=500/500 width=4) + default@tab_part,b,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] <-Union 3 [SIMPLE_EDGE] <-Map 8 [CONTAINS] llap Reduce Output Operator [RS_24] PartitionCols:_col0 - Select Operator [SEL_18] (rows=230/242 width=3) + Select Operator [SEL_18] (rows=242/242 width=4) Output:["_col0"] - Filter Operator [FIL_45] (rows=230/242 width=3) + Filter Operator [FIL_45] (rows=242/242 width=4) predicate:key is not null - TableScan [TS_16] (rows=242/242 width=3) + TableScan [TS_16] (rows=242/242 width=4) Output:["key"] <-Reducer 2 [CONTAINS] llap Reduce Output Operator [RS_24] PartitionCols:_col0 - Select Operator [SEL_15] (rows=278/1166 width=3) - Output:["_col0"] - Merge Join Operator [MERGEJOIN_49] (rows=278/1166 width=3) - Conds:RS_12._col2=RS_13._col1(Inner),Output:["_col1"] - <-Map 1 [SIMPLE_EDGE] llap - SHUFFLE [RS_12] - PartitionCols:_col2 - Merge Join Operator [MERGEJOIN_47] (rows=253/480 width=3) - Conds:SEL_2._col0=SEL_5._col0(Inner),Output:["_col1","_col2"] - <-Select Operator [SEL_5] (rows=218/242 width=179) - Output:["_col0","_col1"] - Filter Operator [FIL_43] (rows=218/242 width=179) - predicate:(key is not null and value is not null) - TableScan [TS_3] (rows=242/242 width=179) - default@tab,s1,Tbl:COMPLETE,Col:NONE,Output:["key","value"] - <-Select Operator [SEL_2] (rows=230/242 width=3) - Output:["_col0"] - Filter Operator [FIL_42] (rows=230/242 width=3) - predicate:key is not null - TableScan [TS_0] (rows=242/242 width=3) - default@tab,s3,Tbl:COMPLETE,Col:NONE,Output:["key"] - <-Map 7 
[SIMPLE_EDGE] llap - SHUFFLE [RS_13] - PartitionCols:_col1 - Select Operator [SEL_8] (rows=230/242 width=175) - Output:["_col1"] - Filter Operator [FIL_44] (rows=230/242 width=175) - predicate:value is not null - TableScan [TS_6] (rows=242/242 width=175) - default@tab,s2,Tbl:COMPLETE,Col:NONE,Output:["value"] + Merge Join Operator [MERGEJOIN_49] (rows=604/1166 width=4) + Conds:RS_12._col1=RS_13._col1(Inner),Output:["_col0"] + <-Map 1 [SIMPLE_EDGE] llap + SHUFFLE [RS_12] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_47] (rows=382/480 width=95) + Conds:SEL_2._col0=SEL_5._col0(Inner),Output:["_col0","_col1"] + <-Select Operator [SEL_5] (rows=242/242 width=4) + Output:["_col0"] + Filter Operator [FIL_43] (rows=242/242 width=4) + predicate:key is not null + TableScan [TS_3] (rows=242/242 width=4) + default@tab,s3,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] + <-Select Operator [SEL_2] (rows=242/242 width=95) + Output:["_col0","_col1"] + Filter Operator [FIL_42] (rows=242/242 width=95) + predicate:(key is not null and value is not null) + TableScan [TS_0] (rows=242/242 width=95) + default@tab,s1,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] + <-Map 7 [SIMPLE_EDGE] llap + SHUFFLE [RS_13] + PartitionCols:_col1 + Select Operator [SEL_8] (rows=242/242 width=91) + Output:["_col1"] + Filter Operator [FIL_44] (rows=242/242 width=91) + predicate:value is not null + TableScan [TS_6] (rows=242/242 width=91) + default@tab,s2,Tbl:COMPLETE,Col:COMPLETE,Output:["value"] PREHOOK: query: CREATE TABLE a(key STRING, value STRING) STORED AS TEXTFILE PREHOOK: type: CREATETABLE @@ -1112,21 +1096,21 @@ POSTHOOK: type: QUERY Plan optimized by CBO. 
Vertex dependency in root stage -Map 1 <- Union 2 (CONTAINS) -Map 13 <- Union 14 (CONTAINS) -Map 15 <- Union 14 (CONTAINS) -Map 16 <- Union 14 (CONTAINS) +Map 10 <- Union 11 (CONTAINS) +Map 12 <- Union 11 (CONTAINS) +Map 14 <- Union 15 (CONTAINS) +Map 16 <- Union 15 (CONTAINS) +Map 17 <- Union 15 (CONTAINS) Map 19 <- Union 20 (CONTAINS) Map 21 <- Union 20 (CONTAINS) Map 22 <- Union 20 (CONTAINS) Map 23 <- Union 20 (CONTAINS) -Map 6 <- Union 2 (CONTAINS) -Reducer 11 <- Map 10 (SIMPLE_EDGE), Union 14 (SIMPLE_EDGE) -Reducer 12 <- Map 17 (SIMPLE_EDGE), Reducer 11 (SIMPLE_EDGE), Union 5 (CONTAINS) -Reducer 3 <- Map 7 (SIMPLE_EDGE), Union 2 (SIMPLE_EDGE) -Reducer 4 <- Map 10 (SIMPLE_EDGE), Reducer 3 (SIMPLE_EDGE), Union 5 (CONTAINS) +Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 7 (SIMPLE_EDGE) +Reducer 3 <- Reducer 2 (SIMPLE_EDGE), Union 11 (SIMPLE_EDGE), Union 4 (CONTAINS) +Reducer 5 <- Map 1 (SIMPLE_EDGE), Map 13 (SIMPLE_EDGE) +Reducer 6 <- Reducer 5 (SIMPLE_EDGE), Union 15 (SIMPLE_EDGE), Union 4 (CONTAINS) Reducer 8 <- Map 18 (SIMPLE_EDGE), Map 7 (SIMPLE_EDGE) -Reducer 9 <- Reducer 8 (SIMPLE_EDGE), Union 20 (SIMPLE_EDGE), Union 5 (CONTAINS) +Reducer 9 <- Reducer 8 (SIMPLE_EDGE), Union 20 (SIMPLE_EDGE), Union 4 (CONTAINS) Stage-5 Stats Work{} @@ -1136,147 +1120,147 @@ Stage-5 Stage-4 Dependency Collection{} Stage-3 - Union 5 - <-Reducer 12 [CONTAINS] llap + Union 4 + <-Reducer 3 [CONTAINS] llap File Output Operator [FS_75] table:{"name:":"default.a"} - Select Operator [SEL_44] (rows=2682/5421 width=178) + Select Operator [SEL_20] (rows=66/170 width=177) Output:["_col0","_col1"] - Merge Join Operator [MERGEJOIN_122] (rows=2682/5421 width=178) - Conds:RS_41._col1=RS_42._col0(Inner),Output:["_col1","_col4"] - <-Map 17 [SIMPLE_EDGE] llap - SHUFFLE [RS_42] - PartitionCols:_col0 - Select Operator [SEL_37] (rows=500/500 width=178) - Output:["_col0","_col1"] - Filter Operator [FIL_112] (rows=500/500 width=178) - predicate:key is not null - TableScan [TS_35] (rows=500/500 width=178) - 
default@src,y,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] - <-Reducer 11 [SIMPLE_EDGE] llap - SHUFFLE [RS_41] - PartitionCols:_col1 - Merge Join Operator [MERGEJOIN_121] (rows=1658/2097 width=87) - Conds:Union 14._col0=RS_39._col1(Inner),Output:["_col1"] - <-Map 10 [SIMPLE_EDGE] llap - SHUFFLE [RS_39] - PartitionCols:_col1 - Select Operator [SEL_34] (rows=500/500 width=178) + Merge Join Operator [MERGEJOIN_119] (rows=66/170 width=177) + Conds:RS_17._col3=Union 11._col0(Inner),Output:["_col1","_col2"] + <-Reducer 2 [SIMPLE_EDGE] llap + SHUFFLE [RS_17] + PartitionCols:_col3 + Merge Join Operator [MERGEJOIN_116] (rows=39/37 width=266) + Conds:RS_14._col0=RS_15._col0(Inner),Output:["_col1","_col2","_col3"] + <-Map 1 [SIMPLE_EDGE] llap + SHUFFLE [RS_14] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=500/500 width=178) Output:["_col0","_col1"] - Filter Operator [FIL_111] (rows=500/500 width=178) - predicate:(key is not null and value is not null) - TableScan [TS_11] (rows=500/500 width=178) + Filter Operator [FIL_101] (rows=500/500 width=178) + predicate:key is not null + TableScan [TS_0] (rows=500/500 width=178) default@src,y,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] - <-Union 14 [SIMPLE_EDGE] - <-Map 13 [CONTAINS] llap - Reduce Output Operator [RS_38] - PartitionCols:_col0 - Select Operator [SEL_23] (rows=25/25 width=89) - Output:["_col0"] - Filter Operator [FIL_108] (rows=25/25 width=89) - predicate:value is not null - TableScan [TS_21] (rows=25/25 width=89) - Output:["value"] - <-Map 15 [CONTAINS] llap - Reduce Output Operator [RS_38] - PartitionCols:_col0 - Select Operator [SEL_26] (rows=500/500 width=91) - Output:["_col0"] - Filter Operator [FIL_109] (rows=500/500 width=91) - predicate:value is not null - TableScan [TS_24] (rows=500/500 width=91) - Output:["value"] - <-Map 16 [CONTAINS] llap - Reduce Output Operator [RS_38] - PartitionCols:_col0 - Select Operator [SEL_30] (rows=500/500 width=91) - Output:["_col0"] - Filter Operator [FIL_110] 
(rows=500/500 width=91) - predicate:value is not null - TableScan [TS_28] (rows=500/500 width=91) - Output:["value"] + <-Map 7 [SIMPLE_EDGE] llap + SHUFFLE [RS_15] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=25/25 width=175) + Output:["_col0","_col1"] + Filter Operator [FIL_102] (rows=25/25 width=175) + predicate:(key is not null and value is not null) + TableScan [TS_3] (rows=25/25 width=175) + default@src1,x,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] + <-Union 11 [SIMPLE_EDGE] + <-Map 10 [CONTAINS] llap + Reduce Output Operator [RS_18] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=25/25 width=89) + Output:["_col0"] + Filter Operator [FIL_103] (rows=25/25 width=89) + predicate:value is not null + TableScan [TS_6] (rows=25/25 width=89) + Output:["value"] + <-Map 12 [CONTAINS] llap + Reduce Output Operator [RS_18] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=500/500 width=91) + Output:["_col0"] + Filter Operator [FIL_104] (rows=500/500 width=91) + predicate:value is not null + TableScan [TS_9] (rows=500/500 width=91) + Output:["value"] File Output Operator [FS_77] table:{"name:":"default.b"} - Please refer to the previous Select Operator [SEL_44] + Please refer to the previous Select Operator [SEL_20] File Output Operator [FS_79] table:{"name:":"default.c"} - Please refer to the previous Select Operator [SEL_44] - <-Reducer 4 [CONTAINS] llap + Please refer to the previous Select Operator [SEL_20] + <-Reducer 6 [CONTAINS] llap File Output Operator [FS_75] table:{"name:":"default.a"} - Select Operator [SEL_20] (rows=67/170 width=177) + Select Operator [SEL_44] (rows=2640/5421 width=178) Output:["_col0","_col1"] - Merge Join Operator [MERGEJOIN_120] (rows=67/170 width=177) - Conds:RS_17._col1=RS_18._col0(Inner),Output:["_col1","_col4"] - <-Map 10 [SIMPLE_EDGE] llap - SHUFFLE [RS_18] - PartitionCols:_col0 - Select Operator [SEL_13] (rows=500/500 width=178) - Output:["_col0","_col1"] - Filter Operator [FIL_107] (rows=500/500 width=178) - 
predicate:key is not null - Please refer to the previous TableScan [TS_11] - <-Reducer 3 [SIMPLE_EDGE] llap - SHUFFLE [RS_17] + Merge Join Operator [MERGEJOIN_120] (rows=2640/5421 width=178) + Conds:RS_41._col1=Union 15._col0(Inner),Output:["_col0","_col3"] + <-Reducer 5 [SIMPLE_EDGE] llap + SHUFFLE [RS_41] PartitionCols:_col1 - Merge Join Operator [MERGEJOIN_119] (rows=42/108 width=86) - Conds:Union 2._col0=RS_15._col1(Inner),Output:["_col1"] - <-Map 7 [SIMPLE_EDGE] llap - SHUFFLE [RS_15] - PartitionCols:_col1 - Select Operator [SEL_10] (rows=25/25 width=175) + Merge Join Operator [MERGEJOIN_117] (rows=791/1028 width=269) + Conds:RS_38._col0=RS_39._col0(Inner),Output:["_col0","_col1","_col3"] + <-Map 1 [SIMPLE_EDGE] llap + SHUFFLE [RS_38] + PartitionCols:_col0 + Select Operator [SEL_23] (rows=500/500 width=178) Output:["_col0","_col1"] - Filter Operator [FIL_106] (rows=25/25 width=175) + Filter Operator [FIL_105] (rows=500/500 width=178) predicate:(key is not null and value is not null) - TableScan [TS_8] (rows=25/25 width=175) - default@src1,x,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] - <-Union 2 [SIMPLE_EDGE] - <-Map 1 [CONTAINS] llap - Reduce Output Operator [RS_14] - PartitionCols:_col0 - Select Operator [SEL_2] (rows=25/25 width=89) - Output:["_col0"] - Filter Operator [FIL_104] (rows=25/25 width=89) - predicate:value is not null - TableScan [TS_0] (rows=25/25 width=89) - Output:["value"] - <-Map 6 [CONTAINS] llap - Reduce Output Operator [RS_14] - PartitionCols:_col0 - Select Operator [SEL_5] (rows=500/500 width=91) - Output:["_col0"] - Filter Operator [FIL_105] (rows=500/500 width=91) - predicate:value is not null - TableScan [TS_3] (rows=500/500 width=91) - Output:["value"] + Please refer to the previous TableScan [TS_0] + <-Map 13 [SIMPLE_EDGE] llap + SHUFFLE [RS_39] + PartitionCols:_col0 + Select Operator [SEL_26] (rows=500/500 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_106] (rows=500/500 width=178) + predicate:key is not null + 
TableScan [TS_24] (rows=500/500 width=178) + default@src,y,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] + <-Union 15 [SIMPLE_EDGE] + <-Map 14 [CONTAINS] llap + Reduce Output Operator [RS_42] + PartitionCols:_col0 + Select Operator [SEL_29] (rows=25/25 width=89) + Output:["_col0"] + Filter Operator [FIL_107] (rows=25/25 width=89) + predicate:value is not null + TableScan [TS_27] (rows=25/25 width=89) + Output:["value"] + <-Map 16 [CONTAINS] llap + Reduce Output Operator [RS_42] + PartitionCols:_col0 + Select Operator [SEL_32] (rows=500/500 width=91) + Output:["_col0"] + Filter Operator [FIL_108] (rows=500/500 width=91) + predicate:value is not null + TableScan [TS_30] (rows=500/500 width=91) + Output:["value"] + <-Map 17 [CONTAINS] llap + Reduce Output Operator [RS_42] + PartitionCols:_col0 + Select Operator [SEL_36] (rows=500/500 width=91) + Output:["_col0"] + Filter Operator [FIL_109] (rows=500/500 width=91) + predicate:value is not null + TableScan [TS_34] (rows=500/500 width=91) + Output:["value"] File Output Operator [FS_77] table:{"name:":"default.b"} - Please refer to the previous Select Operator [SEL_20] + Please refer to the previous Select Operator [SEL_44] File Output Operator [FS_79] table:{"name:":"default.c"} - Please refer to the previous Select Operator [SEL_20] + Please refer to the previous Select Operator [SEL_44] <-Reducer 9 [CONTAINS] llap File Output Operator [FS_75] table:{"name:":"default.a"} - Select Operator [SEL_72] (rows=192/820 width=175) + Select Operator [SEL_72] (rows=193/820 width=175) Output:["_col0","_col1"] - Merge Join Operator [MERGEJOIN_124] (rows=192/820 width=175) + Merge Join Operator [MERGEJOIN_121] (rows=193/820 width=175) Conds:RS_69._col1=Union 20._col0(Inner),Output:["_col0","_col3"] <-Reducer 8 [SIMPLE_EDGE] llap SHUFFLE [RS_69] PartitionCols:_col1 - Merge Join Operator [MERGEJOIN_123] (rows=39/115 width=264) + Merge Join Operator [MERGEJOIN_118] (rows=39/115 width=264) 
Conds:RS_66._col0=RS_67._col0(Inner),Output:["_col0","_col1","_col3"] <-Map 7 [SIMPLE_EDGE] llap SHUFFLE [RS_66] PartitionCols:_col0 - Please refer to the previous Select Operator [SEL_10] + Please refer to the previous Select Operator [SEL_5] <-Map 18 [SIMPLE_EDGE] llap SHUFFLE [RS_67] PartitionCols:_col0 Select Operator [SEL_51] (rows=25/25 width=175) Output:["_col0","_col1"] - Filter Operator [FIL_114] (rows=25/25 width=175) + Filter Operator [FIL_111] (rows=25/25 width=175) predicate:key is not null TableScan [TS_49] (rows=25/25 width=175) default@src1,y,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] @@ -1286,7 +1270,7 @@ Stage-5 PartitionCols:_col0 Select Operator [SEL_54] (rows=25/25 width=89) Output:["_col0"] - Filter Operator [FIL_115] (rows=25/25 width=89) + Filter Operator [FIL_112] (rows=25/25 width=89) predicate:value is not null TableScan [TS_52] (rows=25/25 width=89) Output:["value"] @@ -1295,7 +1279,7 @@ Stage-5 PartitionCols:_col0 Select Operator [SEL_57] (rows=500/500 width=91) Output:["_col0"] - Filter Operator [FIL_116] (rows=500/500 width=91) + Filter Operator [FIL_113] (rows=500/500 width=91) predicate:value is not null TableScan [TS_55] (rows=500/500 width=91) Output:["value"] @@ -1304,7 +1288,7 @@ Stage-5 PartitionCols:_col0 Select Operator [SEL_61] (rows=500/500 width=91) Output:["_col0"] - Filter Operator [FIL_117] (rows=500/500 width=91) + Filter Operator [FIL_114] (rows=500/500 width=91) predicate:value is not null TableScan [TS_59] (rows=500/500 width=91) Output:["value"] @@ -1313,7 +1297,7 @@ Stage-5 PartitionCols:_col0 Select Operator [SEL_64] (rows=500/500 width=91) Output:["_col0"] - Filter Operator [FIL_118] (rows=500/500 width=91) + Filter Operator [FIL_115] (rows=500/500 width=91) predicate:value is not null TableScan [TS_62] (rows=500/500 width=91) Output:["value"] @@ -1411,29 +1395,29 @@ POSTHOOK: type: QUERY Plan optimized by CBO. 
Vertex dependency in root stage -Map 1 <- Union 2 (CONTAINS) -Map 10 <- Union 2 (CONTAINS) -Map 17 <- Union 18 (CONTAINS) -Map 22 <- Union 18 (CONTAINS) -Map 23 <- Union 20 (CONTAINS) +Map 13 <- Union 14 (CONTAINS) +Map 16 <- Union 14 (CONTAINS) +Map 18 <- Union 19 (CONTAINS) +Map 23 <- Union 19 (CONTAINS) +Map 24 <- Union 21 (CONTAINS) Map 26 <- Union 27 (CONTAINS) Map 33 <- Union 27 (CONTAINS) Map 34 <- Union 29 (CONTAINS) Map 35 <- Union 31 (CONTAINS) -Reducer 12 <- Map 11 (SIMPLE_EDGE), Map 25 (SIMPLE_EDGE) -Reducer 13 <- Reducer 12 (SIMPLE_EDGE), Reducer 32 (SIMPLE_EDGE), Union 8 (CONTAINS) -Reducer 15 <- Map 14 (SIMPLE_EDGE), Reducer 21 (SIMPLE_EDGE) -Reducer 16 <- Map 24 (SIMPLE_EDGE), Reducer 15 (SIMPLE_EDGE), Union 6 (CONTAINS) -Reducer 19 <- Union 18 (SIMPLE_EDGE), Union 20 (CONTAINS) -Reducer 21 <- Union 20 (SIMPLE_EDGE) +Reducer 11 <- Map 10 (SIMPLE_EDGE), Map 25 (SIMPLE_EDGE) +Reducer 12 <- Reducer 11 (SIMPLE_EDGE), Reducer 32 (SIMPLE_EDGE), Union 6 (CONTAINS) +Reducer 15 <- Union 14 (SIMPLE_EDGE) +Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 10 (SIMPLE_EDGE) +Reducer 20 <- Union 19 (SIMPLE_EDGE), Union 21 (CONTAINS) +Reducer 22 <- Union 21 (SIMPLE_EDGE) Reducer 28 <- Union 27 (SIMPLE_EDGE), Union 29 (CONTAINS) -Reducer 3 <- Union 2 (SIMPLE_EDGE) +Reducer 3 <- Reducer 15 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE), Union 4 (CONTAINS) Reducer 30 <- Union 29 (SIMPLE_EDGE), Union 31 (CONTAINS) Reducer 32 <- Union 31 (SIMPLE_EDGE) -Reducer 4 <- Map 11 (SIMPLE_EDGE), Reducer 3 (SIMPLE_EDGE) -Reducer 5 <- Map 14 (SIMPLE_EDGE), Reducer 4 (SIMPLE_EDGE), Union 6 (CONTAINS) -Reducer 7 <- Union 6 (SIMPLE_EDGE), Union 8 (CONTAINS) -Reducer 9 <- Union 8 (SIMPLE_EDGE) +Reducer 5 <- Union 4 (SIMPLE_EDGE), Union 6 (CONTAINS) +Reducer 7 <- Union 6 (SIMPLE_EDGE) +Reducer 8 <- Map 1 (SIMPLE_EDGE), Map 17 (SIMPLE_EDGE) +Reducer 9 <- Reducer 22 (SIMPLE_EDGE), Reducer 8 (SIMPLE_EDGE), Union 4 (CONTAINS) Stage-5 Stats Work{} @@ -1443,39 +1427,39 @@ Stage-5 Stage-4 Dependency 
Collection{} Stage-3 - Reducer 9 llap + Reducer 7 llap File Output Operator [FS_115] table:{"name:":"default.a"} - Group By Operator [GBY_112] (rows=2941/319 width=178) + Group By Operator [GBY_112] (rows=2899/319 width=178) Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 - <-Union 8 [SIMPLE_EDGE] - <-Reducer 13 [CONTAINS] llap + <-Union 6 [SIMPLE_EDGE] + <-Reducer 12 [CONTAINS] llap Reduce Output Operator [RS_111] PartitionCols:_col0, _col1 - Select Operator [SEL_107] (rows=192/304 width=175) + Select Operator [SEL_107] (rows=193/304 width=175) Output:["_col0","_col1"] - Merge Join Operator [MERGEJOIN_164] (rows=192/304 width=175) + Merge Join Operator [MERGEJOIN_161] (rows=193/304 width=175) Conds:RS_104._col1=RS_105._col1(Inner),Output:["_col0","_col3"] - <-Reducer 12 [SIMPLE_EDGE] llap + <-Reducer 11 [SIMPLE_EDGE] llap SHUFFLE [RS_104] PartitionCols:_col1 - Merge Join Operator [MERGEJOIN_163] (rows=39/115 width=264) + Merge Join Operator [MERGEJOIN_158] (rows=39/115 width=264) Conds:RS_101._col0=RS_102._col0(Inner),Output:["_col0","_col1","_col3"] - <-Map 11 [SIMPLE_EDGE] llap + <-Map 10 [SIMPLE_EDGE] llap SHUFFLE [RS_101] PartitionCols:_col0 - Select Operator [SEL_14] (rows=25/25 width=175) + Select Operator [SEL_5] (rows=25/25 width=175) Output:["_col0","_col1"] - Filter Operator [FIL_146] (rows=25/25 width=175) + Filter Operator [FIL_142] (rows=25/25 width=175) predicate:(key is not null and value is not null) - TableScan [TS_12] (rows=25/25 width=175) + TableScan [TS_3] (rows=25/25 width=175) default@src1,x,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] <-Map 25 [SIMPLE_EDGE] llap SHUFFLE [RS_102] PartitionCols:_col0 Select Operator [SEL_70] (rows=25/25 width=175) Output:["_col0","_col1"] - Filter Operator [FIL_154] (rows=25/25 width=175) + Filter Operator [FIL_151] (rows=25/25 width=175) predicate:key is not null TableScan [TS_68] (rows=25/25 width=175) default@src1,y,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] @@ -1492,7 +1476,7 @@ Stage-5 
PartitionCols:_col1, _col0 Select Operator [SEL_94] (rows=500/500 width=178) Output:["_col0","_col1"] - Filter Operator [FIL_158] (rows=500/500 width=178) + Filter Operator [FIL_155] (rows=500/500 width=178) predicate:value is not null TableScan [TS_92] (rows=500/500 width=178) Output:["key","value"] @@ -1509,7 +1493,7 @@ Stage-5 PartitionCols:_col1, _col0 Select Operator [SEL_85] (rows=500/500 width=178) Output:["_col0","_col1"] - Filter Operator [FIL_157] (rows=500/500 width=178) + Filter Operator [FIL_154] (rows=500/500 width=178) predicate:value is not null TableScan [TS_83] (rows=500/500 width=178) Output:["key","value"] @@ -1526,7 +1510,7 @@ Stage-5 PartitionCols:_col1, _col0 Select Operator [SEL_73] (rows=25/25 width=175) Output:["_col0","_col1"] - Filter Operator [FIL_155] (rows=25/25 width=175) + Filter Operator [FIL_152] (rows=25/25 width=175) predicate:value is not null TableScan [TS_71] (rows=25/25 width=175) Output:["key","value"] @@ -1535,139 +1519,139 @@ Stage-5 PartitionCols:_col1, _col0 Select Operator [SEL_76] (rows=500/500 width=178) Output:["_col0","_col1"] - Filter Operator [FIL_156] (rows=500/500 width=178) + Filter Operator [FIL_153] (rows=500/500 width=178) predicate:value is not null TableScan [TS_74] (rows=500/500 width=178) Output:["key","value"] - <-Reducer 7 [CONTAINS] llap + <-Reducer 5 [CONTAINS] llap Reduce Output Operator [RS_111] PartitionCols:_col0, _col1 - Group By Operator [GBY_63] (rows=2749/309 width=178) + Group By Operator [GBY_63] (rows=2706/309 width=178) Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 - <-Union 6 [SIMPLE_EDGE] - <-Reducer 16 [CONTAINS] llap + <-Union 4 [SIMPLE_EDGE] + <-Reducer 3 [CONTAINS] llap Reduce Output Operator [RS_62] PartitionCols:_col0, _col1 - Select Operator [SEL_58] (rows=2682/1056 width=178) + Select Operator [SEL_24] (rows=66/61 width=177) Output:["_col0","_col1"] - Merge Join Operator [MERGEJOIN_162] (rows=2682/1056 width=178) - 
Conds:RS_55._col2=RS_56._col0(Inner),Output:["_col2","_col5"] - <-Map 24 [SIMPLE_EDGE] llap - SHUFFLE [RS_56] - PartitionCols:_col0 - Select Operator [SEL_51] (rows=500/500 width=178) - Output:["_col0","_col1"] - Filter Operator [FIL_152] (rows=500/500 width=178) - predicate:key is not null - TableScan [TS_49] (rows=500/500 width=178) - default@src,y,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] + Merge Join Operator [MERGEJOIN_159] (rows=66/61 width=177) + Conds:RS_21._col3=RS_22._col1(Inner),Output:["_col1","_col2"] <-Reducer 15 [SIMPLE_EDGE] llap - SHUFFLE [RS_55] - PartitionCols:_col2 - Merge Join Operator [MERGEJOIN_161] (rows=1658/512 width=87) - Conds:RS_52._col1=RS_53._col1(Inner),Output:["_col2"] - <-Map 14 [SIMPLE_EDGE] llap - SHUFFLE [RS_53] - PartitionCols:_col1 - Select Operator [SEL_48] (rows=500/500 width=178) + SHUFFLE [RS_22] + PartitionCols:_col1 + Select Operator [SEL_17] (rows=525/319 width=178) + Output:["_col1"] + Group By Operator [GBY_16] (rows=525/319 width=178) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 14 [SIMPLE_EDGE] + <-Map 13 [CONTAINS] llap + Reduce Output Operator [RS_15] + PartitionCols:_col1, _col0 + Select Operator [SEL_8] (rows=25/25 width=175) + Output:["_col0","_col1"] + Filter Operator [FIL_143] (rows=25/25 width=175) + predicate:value is not null + TableScan [TS_6] (rows=25/25 width=175) + Output:["key","value"] + <-Map 16 [CONTAINS] llap + Reduce Output Operator [RS_15] + PartitionCols:_col1, _col0 + Select Operator [SEL_11] (rows=500/500 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_144] (rows=500/500 width=178) + predicate:value is not null + TableScan [TS_9] (rows=500/500 width=178) + Output:["key","value"] + <-Reducer 2 [SIMPLE_EDGE] llap + SHUFFLE [RS_21] + PartitionCols:_col3 + Merge Join Operator [MERGEJOIN_156] (rows=39/37 width=266) + Conds:RS_18._col0=RS_19._col0(Inner),Output:["_col1","_col2","_col3"] + <-Map 1 [SIMPLE_EDGE] llap + SHUFFLE [RS_18] + PartitionCols:_col0 + 
Select Operator [SEL_2] (rows=500/500 width=178) Output:["_col0","_col1"] - Filter Operator [FIL_151] (rows=500/500 width=178) - predicate:(key is not null and value is not null) - TableScan [TS_15] (rows=500/500 width=178) + Filter Operator [FIL_141] (rows=500/500 width=178) + predicate:key is not null + TableScan [TS_0] (rows=500/500 width=178) default@src,y,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] - <-Reducer 21 [SIMPLE_EDGE] llap - SHUFFLE [RS_52] - PartitionCols:_col1 - Select Operator [SEL_45] (rows=1025/319 width=178) - Output:["_col1"] - Group By Operator [GBY_44] (rows=1025/319 width=178) - Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 - <-Union 20 [SIMPLE_EDGE] - <-Map 23 [CONTAINS] llap - Reduce Output Operator [RS_43] - PartitionCols:_col1, _col0 - Select Operator [SEL_39] (rows=500/500 width=178) - Output:["_col0","_col1"] - Filter Operator [FIL_150] (rows=500/500 width=178) - predicate:value is not null - TableScan [TS_37] (rows=500/500 width=178) - Output:["key","value"] - <-Reducer 19 [CONTAINS] llap - Reduce Output Operator [RS_43] - PartitionCols:_col1, _col0 - Select Operator [SEL_36] (rows=525/319 width=178) - Output:["_col0","_col1"] - Group By Operator [GBY_35] (rows=525/319 width=178) - Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 - <-Union 18 [SIMPLE_EDGE] - <-Map 17 [CONTAINS] llap - Reduce Output Operator [RS_34] - PartitionCols:_col1, _col0 - Select Operator [SEL_27] (rows=25/25 width=175) - Output:["_col0","_col1"] - Filter Operator [FIL_148] (rows=25/25 width=175) - predicate:value is not null - TableScan [TS_25] (rows=25/25 width=175) - Output:["key","value"] - <-Map 22 [CONTAINS] llap - Reduce Output Operator [RS_34] - PartitionCols:_col1, _col0 - Select Operator [SEL_30] (rows=500/500 width=178) - Output:["_col0","_col1"] - Filter Operator [FIL_149] (rows=500/500 width=178) - predicate:value is not null - TableScan [TS_28] (rows=500/500 width=178) - Output:["key","value"] - <-Reducer 5 [CONTAINS] llap + <-Map 10 
[SIMPLE_EDGE] llap + SHUFFLE [RS_19] + PartitionCols:_col0 + Please refer to the previous Select Operator [SEL_5] + <-Reducer 9 [CONTAINS] llap Reduce Output Operator [RS_62] PartitionCols:_col0, _col1 - Select Operator [SEL_24] (rows=67/61 width=177) + Select Operator [SEL_58] (rows=2640/1056 width=178) Output:["_col0","_col1"] - Merge Join Operator [MERGEJOIN_160] (rows=67/61 width=177) - Conds:RS_21._col2=RS_22._col0(Inner),Output:["_col2","_col5"] - <-Map 14 [SIMPLE_EDGE] llap - SHUFFLE [RS_22] - PartitionCols:_col0 - Select Operator [SEL_17] (rows=500/500 width=178) - Output:["_col0","_col1"] - Filter Operator [FIL_147] (rows=500/500 width=178) - predicate:key is not null - Please refer to the previous TableScan [TS_15] - <-Reducer 4 [SIMPLE_EDGE] llap - SHUFFLE [RS_21] - PartitionCols:_col2 - Merge Join Operator [MERGEJOIN_159] (rows=42/52 width=86) - Conds:RS_18._col1=RS_19._col1(Inner),Output:["_col2"] - <-Map 11 [SIMPLE_EDGE] llap - SHUFFLE [RS_19] - PartitionCols:_col1 - Please refer to the previous Select Operator [SEL_14] - <-Reducer 3 [SIMPLE_EDGE] llap - SHUFFLE [RS_18] - PartitionCols:_col1 - Select Operator [SEL_11] (rows=525/319 width=178) - Output:["_col1"] - Group By Operator [GBY_10] (rows=525/319 width=178) - Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 - <-Union 2 [SIMPLE_EDGE] - <-Map 1 [CONTAINS] llap - Reduce Output Operator [RS_9] - PartitionCols:_col1, _col0 - Select Operator [SEL_2] (rows=25/25 width=175) - Output:["_col0","_col1"] - Filter Operator [FIL_144] (rows=25/25 width=175) - predicate:value is not null - TableScan [TS_0] (rows=25/25 width=175) - Output:["key","value"] - <-Map 10 [CONTAINS] llap - Reduce Output Operator [RS_9] - PartitionCols:_col1, _col0 - Select Operator [SEL_5] (rows=500/500 width=178) - Output:["_col0","_col1"] - Filter Operator [FIL_145] (rows=500/500 width=178) - predicate:value is not null - TableScan [TS_3] (rows=500/500 width=178) - Output:["key","value"] + Merge Join Operator [MERGEJOIN_160] 
(rows=2640/1056 width=178) + Conds:RS_55._col1=RS_56._col1(Inner),Output:["_col0","_col3"] + <-Reducer 22 [SIMPLE_EDGE] llap + SHUFFLE [RS_56] + PartitionCols:_col1 + Select Operator [SEL_51] (rows=1025/319 width=178) + Output:["_col1"] + Group By Operator [GBY_50] (rows=1025/319 width=178) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 21 [SIMPLE_EDGE] + <-Map 24 [CONTAINS] llap + Reduce Output Operator [RS_49] + PartitionCols:_col1, _col0 + Select Operator [SEL_45] (rows=500/500 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_149] (rows=500/500 width=178) + predicate:value is not null + TableScan [TS_43] (rows=500/500 width=178) + Output:["key","value"] + <-Reducer 20 [CONTAINS] llap + Reduce Output Operator [RS_49] + PartitionCols:_col1, _col0 + Select Operator [SEL_42] (rows=525/319 width=178) + Output:["_col0","_col1"] + Group By Operator [GBY_41] (rows=525/319 width=178) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 19 [SIMPLE_EDGE] + <-Map 18 [CONTAINS] llap + Reduce Output Operator [RS_40] + PartitionCols:_col1, _col0 + Select Operator [SEL_33] (rows=25/25 width=175) + Output:["_col0","_col1"] + Filter Operator [FIL_147] (rows=25/25 width=175) + predicate:value is not null + TableScan [TS_31] (rows=25/25 width=175) + Output:["key","value"] + <-Map 23 [CONTAINS] llap + Reduce Output Operator [RS_40] + PartitionCols:_col1, _col0 + Select Operator [SEL_36] (rows=500/500 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_148] (rows=500/500 width=178) + predicate:value is not null + TableScan [TS_34] (rows=500/500 width=178) + Output:["key","value"] + <-Reducer 8 [SIMPLE_EDGE] llap + SHUFFLE [RS_55] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_157] (rows=791/1028 width=269) + Conds:RS_52._col0=RS_53._col0(Inner),Output:["_col0","_col1","_col3"] + <-Map 1 [SIMPLE_EDGE] llap + SHUFFLE [RS_52] + PartitionCols:_col0 + Select Operator [SEL_27] (rows=500/500 width=178) + Output:["_col0","_col1"] + 
Filter Operator [FIL_145] (rows=500/500 width=178) + predicate:(key is not null and value is not null) + Please refer to the previous TableScan [TS_0] + <-Map 17 [SIMPLE_EDGE] llap + SHUFFLE [RS_53] + PartitionCols:_col0 + Select Operator [SEL_30] (rows=500/500 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_146] (rows=500/500 width=178) + predicate:key is not null + TableScan [TS_28] (rows=500/500 width=178) + default@src,y,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] File Output Operator [FS_117] table:{"name:":"default.b"} Please refer to the previous Group By Operator [GBY_112] @@ -1754,9 +1738,9 @@ Stage-4 Reducer 5 llap File Output Operator [FS_18] table:{"name:":"default.dest1"} - Select Operator [SEL_16] (rows=309/310 width=272) + Select Operator [SEL_16] (rows=316/310 width=272) Output:["_col0","_col1"] - Group By Operator [GBY_15] (rows=309/310 width=96) + Group By Operator [GBY_15] (rows=316/310 width=96) Output:["_col0","_col1"],aggregations:["count(DISTINCT KEY._col1:0._col0)"],keys:KEY._col0 <-Reducer 4 [SIMPLE_EDGE] llap SHUFFLE [RS_14] @@ -1832,9 +1816,9 @@ Stage-0 Stage-1 Reducer 2 llap File Output Operator [FS_8] - Select Operator [SEL_7] (rows=261/4122 width=260) + Select Operator [SEL_7] (rows=250/4122 width=260) Output:["_col0","_col1","_col2"] - Merge Join Operator [MERGEJOIN_9] (rows=261/4122 width=260) + Merge Join Operator [MERGEJOIN_9] (rows=250/4122 width=260) Conds:RS_3.key=RS_3.key(Unique),RS_3.key=RS_3.key(Unique),RS_3.key=RS_3.key(Unique),Output:["_col0","_col5","_col10"] <-Map 1 [SIMPLE_EDGE] llap SHUFFLE [RS_3] @@ -1928,9 +1912,9 @@ Stage-4 Reducer 4 llap File Output Operator [FS_16] table:{"name:":"default.dest1"} - Select Operator [SEL_14] (rows=309/310 width=272) + Select Operator [SEL_14] (rows=316/310 width=272) Output:["_col0","_col1"] - Group By Operator [GBY_13] (rows=309/310 width=96) + Group By Operator [GBY_13] (rows=316/310 width=96) Output:["_col0","_col1"],aggregations:["count(DISTINCT 
KEY._col1:0._col0)"],keys:KEY._col0 <-Union 3 [SIMPLE_EDGE] <-Map 6 [CONTAINS] llap @@ -2046,9 +2030,9 @@ Stage-4 Reducer 4 llap File Output Operator [FS_14] table:{"name:":"default.dest1"} - Select Operator [SEL_12] (rows=309/310 width=272) + Select Operator [SEL_12] (rows=316/310 width=272) Output:["_col0","_col1"] - Group By Operator [GBY_11] (rows=309/310 width=96) + Group By Operator [GBY_11] (rows=316/310 width=96) Output:["_col0","_col1"],aggregations:["count(DISTINCT KEY._col1:0._col0)"],keys:KEY._col0 <-Union 3 [SIMPLE_EDGE] <-Map 6 [CONTAINS] llap diff --git ql/src/test/results/clientpositive/llap/explainuser_1.q.out ql/src/test/results/clientpositive/llap/explainuser_1.q.out index 5adf401..0788803 100644 --- ql/src/test/results/clientpositive/llap/explainuser_1.q.out +++ ql/src/test/results/clientpositive/llap/explainuser_1.q.out @@ -1683,9 +1683,9 @@ Stage-0 Stage-1 Reducer 2 llap File Output Operator [FS_19] - Select Operator [SEL_18] (rows=366 width=178) + Select Operator [SEL_18] (rows=365 width=178) Output:["_col0","_col1"] - Filter Operator [FIL_17] (rows=366 width=179) + Filter Operator [FIL_17] (rows=365 width=179) predicate:_col3 is null Merge Join Operator [MERGEJOIN_22] (rows=500 width=179) Conds:RS_14._col1=RS_15._col0(Left Outer),Output:["_col0","_col1","_col3"] @@ -1747,9 +1747,9 @@ Stage-0 Stage-1 Reducer 3 llap File Output Operator [FS_18] - Select Operator [SEL_17] (rows=183 width=178) + Select Operator [SEL_17] (rows=185 width=178) Output:["_col0","_col1"] - Filter Operator [FIL_16] (rows=183 width=179) + Filter Operator [FIL_16] (rows=185 width=179) predicate:_col4 is null Merge Join Operator [MERGEJOIN_21] (rows=250 width=179) Conds:RS_13._col0, _col1=RS_14._col0, _col1(Left Outer),Output:["_col0","_col1","_col4"] @@ -1822,7 +1822,7 @@ Stage-0 Stage-1 Reducer 2 llap File Output Operator [FS_12] - Merge Join Operator [MERGEJOIN_17] (rows=133 width=178) + Merge Join Operator [MERGEJOIN_17] (rows=131 width=178) Conds:RS_8._col0, 
_col1=RS_9._col0, _col1(Left Semi),Output:["_col0","_col1"] <-Map 1 [SIMPLE_EDGE] llap SHUFFLE [RS_8] @@ -1874,7 +1874,7 @@ Stage-0 Stage-1 Reducer 2 llap File Output Operator [FS_12] - Merge Join Operator [MERGEJOIN_17] (rows=133 width=178) + Merge Join Operator [MERGEJOIN_17] (rows=131 width=178) Conds:RS_8._col0, _col1=RS_9._col0, _col1(Left Semi),Output:["_col0","_col1"] <-Map 1 [SIMPLE_EDGE] llap SHUFFLE [RS_8] @@ -1916,7 +1916,7 @@ Stage-0 Stage-1 Reducer 2 llap File Output Operator [FS_12] - Merge Join Operator [MERGEJOIN_17] (rows=133 width=178) + Merge Join Operator [MERGEJOIN_17] (rows=131 width=178) Conds:RS_8._col0=RS_9._col0(Left Semi),Output:["_col0","_col1"] <-Map 1 [SIMPLE_EDGE] llap SHUFFLE [RS_8] @@ -2037,16 +2037,16 @@ Stage-0 <-Reducer 3 [SIMPLE_EDGE] llap SHUFFLE [RS_27] PartitionCols:_col2 - Filter Operator [FIL_37] (rows=66 width=186) + Filter Operator [FIL_37] (rows=65 width=186) predicate:_col2 is not null - Group By Operator [GBY_14] (rows=66 width=186) + Group By Operator [GBY_14] (rows=65 width=186) Output:["_col0","_col1","_col2"],aggregations:["count(VALUE._col0)"],keys:KEY._col0, KEY._col1 <-Reducer 2 [SIMPLE_EDGE] llap SHUFFLE [RS_13] PartitionCols:_col0, _col1 - Group By Operator [GBY_12] (rows=66 width=186) + Group By Operator [GBY_12] (rows=65 width=186) Output:["_col0","_col1","_col2"],aggregations:["count()"],keys:_col0, _col1 - Merge Join Operator [MERGEJOIN_43] (rows=133 width=178) + Merge Join Operator [MERGEJOIN_43] (rows=131 width=178) Conds:RS_8._col0=RS_9._col0(Left Semi),Output:["_col0","_col1"] <-Map 5 [SIMPLE_EDGE] llap SHUFFLE [RS_9] @@ -2646,7 +2646,7 @@ Stage-0 PartitionCols:_col0 Group By Operator [GBY_10] (rows=16 width=94) Output:["_col0","_col1"],aggregations:["count()"],keys:_col0 - Merge Join Operator [MERGEJOIN_24] (rows=40 width=86) + Merge Join Operator [MERGEJOIN_24] (rows=39 width=86) Conds:RS_6._col0=RS_7._col0(Inner),Output:["_col0"] <-Map 1 [SIMPLE_EDGE] llap SHUFFLE [RS_6] @@ -2707,7 +2707,7 @@ 
Stage-0 PartitionCols:_col0 Group By Operator [GBY_10] (rows=16 width=94) Output:["_col0","_col1"],aggregations:["count()"],keys:_col0 - Merge Join Operator [MERGEJOIN_24] (rows=40 width=86) + Merge Join Operator [MERGEJOIN_24] (rows=39 width=86) Conds:RS_6._col0=RS_7._col0(Inner),Output:["_col0"] <-Map 1 [SIMPLE_EDGE] llap SHUFFLE [RS_6] @@ -2768,7 +2768,7 @@ Stage-0 PartitionCols:_col0 Group By Operator [GBY_10] (rows=16 width=94) Output:["_col0","_col1"],aggregations:["count()"],keys:_col0 - Map Join Operator [MAPJOIN_24] (rows=40 width=86) + Map Join Operator [MAPJOIN_24] (rows=39 width=86) Conds:RS_6._col0=SEL_5._col0(Inner),Output:["_col0"] <-Map 1 [BROADCAST_EDGE] llap BROADCAST [RS_6] @@ -2817,16 +2817,16 @@ Stage-0 PARTITION_ONLY_SHUFFLE [RS_18] Group By Operator [GBY_17] (rows=1 width=16) Output:["_col0","_col1"],aggregations:["sum(_col0)","sum(_col1)"] - Select Operator [SEL_15] (rows=10 width=94) + Select Operator [SEL_15] (rows=9 width=94) Output:["_col0","_col1"] - Group By Operator [GBY_14] (rows=10 width=94) + Group By Operator [GBY_14] (rows=9 width=94) Output:["_col0","_col1"],aggregations:["count(VALUE._col0)"],keys:KEY._col0 <-Reducer 2 [SIMPLE_EDGE] llap SHUFFLE [RS_13] PartitionCols:_col0 - Group By Operator [GBY_12] (rows=10 width=94) + Group By Operator [GBY_12] (rows=9 width=94) Output:["_col0","_col1"],aggregations:["count()"],keys:_col0 - Merge Join Operator [MERGEJOIN_26] (rows=20 width=86) + Merge Join Operator [MERGEJOIN_26] (rows=19 width=86) Conds:RS_8._col0=RS_9._col0(Left Semi),Output:["_col0"] <-Map 1 [SIMPLE_EDGE] llap SHUFFLE [RS_8] @@ -5264,9 +5264,9 @@ Stage-3 Reducer 2 llap File Output Operator [FS_11] table:{"name:":"default.dest_j1"} - Select Operator [SEL_9] (rows=809 width=95) + Select Operator [SEL_9] (rows=791 width=95) Output:["_col0","_col1"] - Merge Join Operator [MERGEJOIN_16] (rows=809 width=178) + Merge Join Operator [MERGEJOIN_16] (rows=791 width=178) Conds:RS_6._col0=RS_7._col0(Inner),Output:["_col0","_col2"] 
<-Map 1 [SIMPLE_EDGE] llap SHUFFLE [RS_6] @@ -5503,7 +5503,7 @@ Stage-0 Stage-1 Reducer 2 llap File Output Operator [FS_10] - Merge Join Operator [MERGEJOIN_15] (rows=809 width=356) + Merge Join Operator [MERGEJOIN_15] (rows=791 width=356) Conds:RS_6._col0=RS_7._col0(Inner),Output:["_col0","_col1","_col2","_col3"] <-Map 1 [SIMPLE_EDGE] llap SHUFFLE [RS_6] diff --git ql/src/test/results/clientpositive/llap/explainuser_4.q.out ql/src/test/results/clientpositive/llap/explainuser_4.q.out index c4fdc18..d5f8cb7 100644 --- ql/src/test/results/clientpositive/llap/explainuser_4.q.out +++ ql/src/test/results/clientpositive/llap/explainuser_4.q.out @@ -26,11 +26,11 @@ Stage-0 Stage-1 Reducer 3 llap File Output Operator [FS_12] - Select Operator [SEL_11] (rows=2076 width=553) + Select Operator [SEL_11] (rows=2048 width=552) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23"] <-Reducer 2 [SIMPLE_EDGE] llap SHUFFLE [RS_10] - Merge Join Operator [MERGEJOIN_17] (rows=2076 width=553) + Merge Join Operator [MERGEJOIN_17] (rows=2048 width=552) Conds:RS_6._col2=RS_7._col2(Inner),Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23"] <-Map 1 [SIMPLE_EDGE] llap SHUFFLE [RS_6] @@ -111,7 +111,7 @@ Stage-0 PARTITION_ONLY_SHUFFLE [RS_11] Group By Operator [GBY_10] (rows=1 width=8) Output:["_col0"],aggregations:["count()"] - Merge Join Operator [MERGEJOIN_19] (rows=2076 width=8) + Merge Join Operator [MERGEJOIN_19] (rows=2048 width=8) Conds:RS_6._col0=RS_7._col0(Inner) <-Map 1 [SIMPLE_EDGE] llap SHUFFLE [RS_6] @@ -180,18 +180,18 @@ Stage-0 Stage-1 Reducer 4 llap File Output Operator [FS_16] - Select Operator [SEL_15] (rows=623 width=11) + Select Operator [SEL_15] (rows=631 
width=11) Output:["_col0","_col1"] <-Reducer 3 [SIMPLE_EDGE] llap SHUFFLE [RS_14] - Group By Operator [GBY_12] (rows=623 width=11) + Group By Operator [GBY_12] (rows=631 width=11) Output:["_col0","_col1"],aggregations:["count(VALUE._col0)"],keys:KEY._col0 <-Reducer 2 [SIMPLE_EDGE] llap SHUFFLE [RS_11] PartitionCols:_col0 - Group By Operator [GBY_10] (rows=623 width=11) + Group By Operator [GBY_10] (rows=631 width=11) Output:["_col0","_col1"],aggregations:["count()"],keys:_col0 - Merge Join Operator [MERGEJOIN_21] (rows=2076 width=3) + Merge Join Operator [MERGEJOIN_21] (rows=2048 width=3) Conds:RS_6._col1=RS_7._col0(Inner),Output:["_col0"] <-Map 1 [SIMPLE_EDGE] llap SHUFFLE [RS_6] diff --git ql/src/test/results/clientpositive/llap/groupby1.q.out ql/src/test/results/clientpositive/llap/groupby1.q.out index d58a9fd..d60895d 100644 --- ql/src/test/results/clientpositive/llap/groupby1.q.out +++ ql/src/test/results/clientpositive/llap/groupby1.q.out @@ -67,14 +67,14 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: final outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: UDFToInteger(_col0) (type: int), _col1 (type: double) outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 3708 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 3792 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 309 Data size: 3708 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 3792 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.TextInputFormat output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat diff --git ql/src/test/results/clientpositive/llap/groupby2.q.out 
ql/src/test/results/clientpositive/llap/groupby2.q.out index 5ab6235..2967727 100644 --- ql/src/test/results/clientpositive/llap/groupby2.q.out +++ ql/src/test/results/clientpositive/llap/groupby2.q.out @@ -68,14 +68,14 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: final outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 309 Data size: 61800 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 63200 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string), UDFToInteger(_col1) (type: int), concat(_col0, _col2) (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 309 Data size: 114948 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 117552 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 309 Data size: 114948 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 117552 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.TextInputFormat output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat diff --git ql/src/test/results/clientpositive/llap/groupby_resolution.q.out ql/src/test/results/clientpositive/llap/groupby_resolution.q.out index d3b85f8..d026bd9 100644 --- ql/src/test/results/clientpositive/llap/groupby_resolution.q.out +++ ql/src/test/results/clientpositive/llap/groupby_resolution.q.out @@ -38,10 +38,10 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: complete outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column 
stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -93,10 +93,10 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: complete outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -164,10 +164,10 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: final outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -235,10 +235,10 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: final outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE table: input format: 
org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat diff --git ql/src/test/results/clientpositive/llap/hybridgrace_hashjoin_1.q.out ql/src/test/results/clientpositive/llap/hybridgrace_hashjoin_1.q.out index 02dc49d..8a6d5b6 100644 --- ql/src/test/results/clientpositive/llap/hybridgrace_hashjoin_1.q.out +++ ql/src/test/results/clientpositive/llap/hybridgrace_hashjoin_1.q.out @@ -56,7 +56,7 @@ STAGE PLANS: 1 _col0 (type: int) input vertices: 1 Map 3 - Statistics: Num rows: 25044 Data size: 200352 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 24737 Data size: 197896 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash @@ -177,7 +177,7 @@ STAGE PLANS: 1 _col0 (type: int) input vertices: 1 Map 3 - Statistics: Num rows: 25044 Data size: 200352 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 24737 Data size: 197896 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash @@ -296,7 +296,7 @@ STAGE PLANS: 1 _col0 (type: int) input vertices: 1 Map 3 - Statistics: Num rows: 18694 Data size: 149552 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 18464 Data size: 147712 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash @@ -413,7 +413,7 @@ STAGE PLANS: 1 _col0 (type: int) input vertices: 1 Map 3 - Statistics: Num rows: 18694 Data size: 149552 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 18464 Data size: 147712 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash @@ -527,7 +527,7 @@ STAGE PLANS: 1 _col0 (type: int) input vertices: 1 Map 3 - Statistics: Num rows: 25044 Data size: 200352 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 24737 Data size: 197896 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: 
count() mode: hash @@ -638,7 +638,7 @@ STAGE PLANS: 1 _col0 (type: int) input vertices: 1 Map 3 - Statistics: Num rows: 25044 Data size: 200352 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 24737 Data size: 197896 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash diff --git ql/src/test/results/clientpositive/llap/join1.q.out ql/src/test/results/clientpositive/llap/join1.q.out index 661f55c..566d45d 100644 --- ql/src/test/results/clientpositive/llap/join1.q.out +++ ql/src/test/results/clientpositive/llap/join1.q.out @@ -77,14 +77,14 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col2 - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: UDFToInteger(_col0) (type: int), _col2 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 809 Data size: 76855 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 75145 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 809 Data size: 76855 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 75145 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.TextInputFormat output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat diff --git ql/src/test/results/clientpositive/llap/join32_lessSize.q.out ql/src/test/results/clientpositive/llap/join32_lessSize.q.out index 140f87e..df4b752 100644 --- ql/src/test/results/clientpositive/llap/join32_lessSize.q.out +++ ql/src/test/results/clientpositive/llap/join32_lessSize.q.out @@ -66,13 +66,13 @@ STAGE PLANS: input vertices: 1 Map 3 Position of Big Table: 0 - Statistics: Num rows: 40 Data size: 10640 Basic stats: COMPLETE Column stats: 
COMPLETE + Statistics: Num rows: 39 Data size: 10374 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col3 (type: string) null sort order: a sort order: + Map-reduce partition columns: _col3 (type: string) - Statistics: Num rows: 40 Data size: 10640 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 10374 Basic stats: COMPLETE Column stats: COMPLETE tag: 0 value expressions: _col1 (type: string), _col2 (type: string) auto parallelism: true @@ -294,17 +294,17 @@ STAGE PLANS: 1 _col0 (type: string) outputColumnNames: _col1, _col2, _col4 Position of Big Table: 1 - Statistics: Num rows: 64 Data size: 17152 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 63 Data size: 16884 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col2 (type: string), _col4 (type: string), _col1 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 64 Data size: 17152 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 63 Data size: 16884 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false GlobalTableId: 1 #### A masked pattern was here #### NumFilesPerFileSink: 1 - Statistics: Num rows: 64 Data size: 17152 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 63 Data size: 16884 Basic stats: COMPLETE Column stats: COMPLETE #### A masked pattern was here #### table: input format: org.apache.hadoop.mapred.TextInputFormat @@ -509,8 +509,7 @@ STAGE PLANS: Tez #### A masked pattern was here #### Edges: - Map 1 <- Map 4 (BROADCAST_EDGE) - Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 5 (SIMPLE_EDGE) + Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 4 (SIMPLE_EDGE), Map 5 (SIMPLE_EDGE) Reducer 3 <- Map 6 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) #### A masked pattern was here #### Vertices: @@ -528,27 +527,15 @@ STAGE PLANS: expressions: key (type: string), value (type: string) outputColumnNames: _col0, _col1 Statistics: 
Num rows: 25 Data size: 4375 Basic stats: COMPLETE Column stats: COMPLETE - Map Join Operator - condition map: - Inner Join 0 to 1 - Estimated key counts: Map 4 => 25 - keys: - 0 _col0 (type: string) - 1 _col0 (type: string) - outputColumnNames: _col0, _col1, _col3 - input vertices: - 1 Map 4 - Position of Big Table: 0 - Statistics: Num rows: 39 Data size: 10296 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator - key expressions: _col1 (type: string) - null sort order: a - sort order: + - Map-reduce partition columns: _col1 (type: string) - Statistics: Num rows: 39 Data size: 10296 Basic stats: COMPLETE Column stats: COMPLETE - tag: 0 - value expressions: _col0 (type: string), _col3 (type: string) - auto parallelism: true + Reduce Output Operator + key expressions: _col0 (type: string) + null sort order: a + sort order: + + Map-reduce partition columns: _col0 (type: string) + Statistics: Num rows: 25 Data size: 4375 Basic stats: COMPLETE Column stats: COMPLETE + tag: 0 + value expressions: _col1 (type: string) + auto parallelism: true Execution mode: llap LLAP IO: no inputs Path -> Alias: @@ -681,24 +668,25 @@ STAGE PLANS: Map 5 Map Operator Tree: TableScan - alias: w - Statistics: Num rows: 500 Data size: 45500 Basic stats: COMPLETE Column stats: COMPLETE + alias: y + Statistics: Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE GatherStats: false Filter Operator isSamplingPred: false - predicate: value is not null (type: boolean) - Statistics: Num rows: 500 Data size: 45500 Basic stats: COMPLETE Column stats: COMPLETE + predicate: key is not null (type: boolean) + Statistics: Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: value (type: string) - outputColumnNames: _col0 - Statistics: Num rows: 500 Data size: 45500 Basic stats: COMPLETE Column stats: COMPLETE + expressions: key (type: string), value (type: string) + outputColumnNames: _col0, _col1 + Statistics: 
Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) null sort order: a sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 500 Data size: 45500 Basic stats: COMPLETE Column stats: COMPLETE - tag: 1 + Statistics: Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE + tag: 2 + value expressions: _col1 (type: string) auto parallelism: true Execution mode: llap LLAP IO: no inputs @@ -752,29 +740,28 @@ STAGE PLANS: name: default.src name: default.src Truncated Path -> Alias: - /src [w] + /src [y] Map 6 Map Operator Tree: TableScan - alias: y - Statistics: Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE + alias: w + Statistics: Num rows: 500 Data size: 45500 Basic stats: COMPLETE Column stats: COMPLETE GatherStats: false Filter Operator isSamplingPred: false - predicate: key is not null (type: boolean) - Statistics: Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE + predicate: value is not null (type: boolean) + Statistics: Num rows: 500 Data size: 45500 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: key (type: string), value (type: string) - outputColumnNames: _col0, _col1 - Statistics: Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE + expressions: value (type: string) + outputColumnNames: _col0 + Statistics: Num rows: 500 Data size: 45500 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) null sort order: a sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 500 Data size: 45500 Basic stats: COMPLETE Column stats: COMPLETE tag: 1 - value expressions: _col1 (type: string) auto parallelism: true Execution mode: llap LLAP IO: no inputs @@ 
-828,7 +815,7 @@ STAGE PLANS: name: default.src name: default.src Truncated Path -> Alias: - /src [y] + /src [w] Reducer 2 Execution mode: llap Needs Tagging: false @@ -836,20 +823,22 @@ STAGE PLANS: Merge Join Operator condition map: Inner Join 0 to 1 + Inner Join 0 to 2 keys: - 0 _col1 (type: string) + 0 _col0 (type: string) 1 _col0 (type: string) - outputColumnNames: _col0, _col3 - Position of Big Table: 1 - Statistics: Num rows: 63 Data size: 11025 Basic stats: COMPLETE Column stats: COMPLETE + 2 _col0 (type: string) + outputColumnNames: _col0, _col1, _col3, _col5 + Position of Big Table: 2 + Statistics: Num rows: 61 Data size: 21655 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: string) + key expressions: _col1 (type: string) null sort order: a sort order: + - Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 63 Data size: 11025 Basic stats: COMPLETE Column stats: COMPLETE + Map-reduce partition columns: _col1 (type: string) + Statistics: Num rows: 61 Data size: 21655 Basic stats: COMPLETE Column stats: COMPLETE tag: 0 - value expressions: _col3 (type: string) + value expressions: _col0 (type: string), _col3 (type: string), _col5 (type: string) auto parallelism: true Reducer 3 Execution mode: llap @@ -859,21 +848,21 @@ STAGE PLANS: condition map: Inner Join 0 to 1 keys: - 0 _col0 (type: string) + 0 _col1 (type: string) 1 _col0 (type: string) - outputColumnNames: _col0, _col3, _col6 + outputColumnNames: _col0, _col3, _col5 Position of Big Table: 0 - Statistics: Num rows: 101 Data size: 26866 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 99 Data size: 26334 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: _col0 (type: string), _col3 (type: string), _col6 (type: string) + expressions: _col0 (type: string), _col3 (type: string), _col5 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 101 Data size: 26866 Basic 
stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 99 Data size: 26334 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false GlobalTableId: 1 #### A masked pattern was here #### NumFilesPerFileSink: 1 - Statistics: Num rows: 101 Data size: 26866 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 99 Data size: 26334 Basic stats: COMPLETE Column stats: COMPLETE #### A masked pattern was here #### table: input format: org.apache.hadoop.mapred.TextInputFormat @@ -1180,17 +1169,17 @@ STAGE PLANS: input vertices: 1 Map 4 Position of Big Table: 0 - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: string), _col2 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: string) null sort order: a sort order: + Map-reduce partition columns: _col1 (type: string) - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE tag: 1 value expressions: _col0 (type: string) auto parallelism: true @@ -1335,17 +1324,17 @@ STAGE PLANS: 1 _col1 (type: string) outputColumnNames: _col0, _col3, _col4 Position of Big Table: 0 - Statistics: Num rows: 64 Data size: 17024 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 63 Data size: 16758 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col3 (type: string), _col0 (type: string), _col4 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 64 Data size: 17024 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num 
rows: 63 Data size: 16758 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false GlobalTableId: 1 #### A masked pattern was here #### NumFilesPerFileSink: 1 - Statistics: Num rows: 64 Data size: 17024 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 63 Data size: 16758 Basic stats: COMPLETE Column stats: COMPLETE #### A masked pattern was here #### table: input format: org.apache.hadoop.mapred.TextInputFormat @@ -1788,17 +1777,17 @@ STAGE PLANS: 1 _col1 (type: string) outputColumnNames: _col0, _col3, _col4 Position of Big Table: 1 - Statistics: Num rows: 64 Data size: 17024 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 63 Data size: 16758 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col3 (type: string), _col0 (type: string), _col4 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 64 Data size: 17024 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 63 Data size: 16758 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false GlobalTableId: 1 #### A masked pattern was here #### NumFilesPerFileSink: 1 - Statistics: Num rows: 64 Data size: 17024 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 63 Data size: 16758 Basic stats: COMPLETE Column stats: COMPLETE #### A masked pattern was here #### table: input format: org.apache.hadoop.mapred.TextInputFormat @@ -1837,17 +1826,17 @@ STAGE PLANS: 1 _col0 (type: string) outputColumnNames: _col1, _col2 Position of Big Table: 1 - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: string), _col2 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic 
stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: string) null sort order: a sort order: + Map-reduce partition columns: _col1 (type: string) - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE tag: 1 value expressions: _col0 (type: string) auto parallelism: true @@ -2083,16 +2072,16 @@ STAGE PLANS: outputColumnNames: _col1, _col2 input vertices: 1 Map 4 - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: string), _col2 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: string) sort order: + Map-reduce partition columns: _col1 (type: string) - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: string) Execution mode: llap LLAP IO: no inputs @@ -2126,14 +2115,14 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col1 (type: string) outputColumnNames: _col0, _col3, _col4 - Statistics: Num rows: 64 Data size: 17024 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 63 Data size: 16758 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col3 (type: string), _col0 (type: string), _col4 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 64 Data size: 17024 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 63 Data size: 16758 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator 
compressed: false - Statistics: Num rows: 64 Data size: 17024 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 63 Data size: 16758 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.TextInputFormat output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat @@ -2340,16 +2329,16 @@ STAGE PLANS: outputColumnNames: _col1, _col2 input vertices: 1 Map 4 - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: string), _col2 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: string) sort order: + Map-reduce partition columns: _col1 (type: string) - Statistics: Num rows: 40 Data size: 7000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6825 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: string) Execution mode: llap LLAP IO: no inputs @@ -2383,14 +2372,14 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col1 (type: string) outputColumnNames: _col0, _col3, _col4 - Statistics: Num rows: 64 Data size: 17024 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 63 Data size: 16758 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col3 (type: string), _col0 (type: string), _col4 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 64 Data size: 17024 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 63 Data size: 16758 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 64 Data size: 17024 Basic stats: COMPLETE Column stats: 
COMPLETE + Statistics: Num rows: 63 Data size: 16758 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.TextInputFormat output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat diff --git ql/src/test/results/clientpositive/llap/join_max_hashtable.q.out ql/src/test/results/clientpositive/llap/join_max_hashtable.q.out index ef1a6f3..cb090c2 100644 --- ql/src/test/results/clientpositive/llap/join_max_hashtable.q.out +++ ql/src/test/results/clientpositive/llap/join_max_hashtable.q.out @@ -39,10 +39,10 @@ STAGE PLANS: outputColumnNames: _col0, _col1 input vertices: 1 Map 2 - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -116,10 +116,10 @@ STAGE PLANS: outputColumnNames: _col0, _col1 input vertices: 1 Map 2 - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -223,11 +223,11 @@ STAGE PLANS: outputColumnNames: _col0, _col1 input vertices: 1 Map 3 - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + 
Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE HybridGraceHashJoin: true File Output Operator compressed: false - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -309,11 +309,11 @@ STAGE PLANS: outputColumnNames: _col0, _col1 input vertices: 1 Map 3 - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE HybridGraceHashJoin: true File Output Operator compressed: false - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -396,11 +396,11 @@ STAGE PLANS: outputColumnNames: _col0, _col1 input vertices: 1 Map 3 - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE HybridGraceHashJoin: true File Output Operator compressed: false - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -482,11 +482,11 @@ STAGE PLANS: outputColumnNames: _col0, _col1 input vertices: 1 Map 3 - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + 
Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE HybridGraceHashJoin: true File Output Operator compressed: false - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -539,10 +539,10 @@ STAGE PLANS: outputColumnNames: _col0, _col1 input vertices: 1 Map 2 - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -616,10 +616,10 @@ STAGE PLANS: outputColumnNames: _col0, _col1 input vertices: 1 Map 2 - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat diff --git ql/src/test/results/clientpositive/llap/limit_join_transpose.q.out ql/src/test/results/clientpositive/llap/limit_join_transpose.q.out index 4dd7432..ebaac18 100644 --- ql/src/test/results/clientpositive/llap/limit_join_transpose.q.out 
+++ ql/src/test/results/clientpositive/llap/limit_join_transpose.q.out @@ -66,7 +66,7 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 809 Data size: 288004 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 281596 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 1 Statistics: Num rows: 1 Data size: 356 Basic stats: COMPLETE Column stats: COMPLETE @@ -167,7 +167,7 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 809 Data size: 288004 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 281596 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 1 Statistics: Num rows: 1 Data size: 356 Basic stats: COMPLETE Column stats: COMPLETE @@ -954,7 +954,7 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 809 Data size: 288004 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 281596 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 1 Offset of rows: 1 @@ -1056,7 +1056,7 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 809 Data size: 288004 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 281596 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 1 Offset of rows: 1 diff --git ql/src/test/results/clientpositive/llap/limit_pushdown.q.out ql/src/test/results/clientpositive/llap/limit_pushdown.q.out index b067e45..a4040bd 100644 --- ql/src/test/results/clientpositive/llap/limit_pushdown.q.out +++ ql/src/test/results/clientpositive/llap/limit_pushdown.q.out @@ -395,12 +395,12 @@ STAGE PLANS: keys: cdouble (type: double) mode: hash outputColumnNames: _col0 - 
Statistics: Num rows: 5570 Data size: 33272 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5528 Data size: 33024 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: double) sort order: + Map-reduce partition columns: _col0 (type: double) - Statistics: Num rows: 5570 Data size: 33272 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5528 Data size: 33024 Basic stats: COMPLETE Column stats: COMPLETE TopN Hash Memory Usage: 0.3 Execution mode: llap LLAP IO: all inputs @@ -411,7 +411,7 @@ STAGE PLANS: keys: KEY._col0 (type: double) mode: mergepartial outputColumnNames: _col0 - Statistics: Num rows: 5570 Data size: 33272 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5528 Data size: 33024 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 20 Statistics: Num rows: 20 Data size: 128 Basic stats: COMPLETE Column stats: COMPLETE @@ -1070,7 +1070,7 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: complete outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 30591 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 307 Data size: 30393 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 20 Statistics: Num rows: 20 Data size: 1980 Basic stats: COMPLETE Column stats: COMPLETE diff --git ql/src/test/results/clientpositive/llap/limit_pushdown3.q.out ql/src/test/results/clientpositive/llap/limit_pushdown3.q.out index 470cffe..8f4fb0d 100644 --- ql/src/test/results/clientpositive/llap/limit_pushdown3.q.out +++ ql/src/test/results/clientpositive/llap/limit_pushdown3.q.out @@ -424,12 +424,12 @@ STAGE PLANS: keys: cdouble (type: double) mode: hash outputColumnNames: _col0 - Statistics: Num rows: 5570 Data size: 33272 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5528 Data size: 33024 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: 
double) sort order: + Map-reduce partition columns: _col0 (type: double) - Statistics: Num rows: 5570 Data size: 33272 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5528 Data size: 33024 Basic stats: COMPLETE Column stats: COMPLETE TopN Hash Memory Usage: 0.3 Execution mode: llap LLAP IO: all inputs @@ -440,11 +440,11 @@ STAGE PLANS: keys: KEY._col0 (type: double) mode: mergepartial outputColumnNames: _col0 - Statistics: Num rows: 5570 Data size: 33272 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5528 Data size: 33024 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: double) sort order: + - Statistics: Num rows: 5570 Data size: 33272 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5528 Data size: 33024 Basic stats: COMPLETE Column stats: COMPLETE TopN Hash Memory Usage: 0.3 Reducer 3 Execution mode: llap @@ -452,7 +452,7 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: double) outputColumnNames: _col0 - Statistics: Num rows: 5570 Data size: 33272 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5528 Data size: 33024 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 20 Statistics: Num rows: 20 Data size: 128 Basic stats: COMPLETE Column stats: COMPLETE @@ -1009,11 +1009,11 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: complete outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 30591 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 307 Data size: 30393 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + - Statistics: Num rows: 309 Data size: 30591 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 307 Data size: 30393 Basic stats: COMPLETE Column stats: COMPLETE TopN Hash Memory Usage: 0.3 value expressions: _col1 (type: double) Reducer 3 @@ -1022,7 +1022,7 @@ 
STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: string), VALUE._col0 (type: double) outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 30591 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 307 Data size: 30393 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 20 Statistics: Num rows: 20 Data size: 1980 Basic stats: COMPLETE Column stats: COMPLETE diff --git ql/src/test/results/clientpositive/llap/llap_vector_nohybridgrace.q.out ql/src/test/results/clientpositive/llap/llap_vector_nohybridgrace.q.out index 2c13d5d..b361b1e 100644 --- ql/src/test/results/clientpositive/llap/llap_vector_nohybridgrace.q.out +++ ql/src/test/results/clientpositive/llap/llap_vector_nohybridgrace.q.out @@ -65,7 +65,7 @@ STAGE PLANS: nativeConditionsMet: hive.mapjoin.optimized.hashtable IS true, hive.vectorized.execution.mapjoin.native.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, One MapJoin Condition IS true, No nullsafe IS true, Small table vectorizes IS true, Fast Hash Table and No Hybrid Hash Join IS true input vertices: 1 Map 3 - Statistics: Num rows: 25044 Data size: 200352 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 24737 Data size: 197896 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() Group By Vectorization: @@ -244,7 +244,7 @@ STAGE PLANS: nativeConditionsMet: hive.mapjoin.optimized.hashtable IS true, hive.vectorized.execution.mapjoin.native.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, One MapJoin Condition IS true, No nullsafe IS true, Small table vectorizes IS true, Fast Hash Table and No Hybrid Hash Join IS true input vertices: 1 Map 3 - Statistics: Num rows: 25044 Data size: 200352 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 24737 Data size: 197896 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() Group By Vectorization: diff --git 
ql/src/test/results/clientpositive/llap/mapjoin_mapjoin.q.out ql/src/test/results/clientpositive/llap/mapjoin_mapjoin.q.out index c4361de..5c68ff2 100644 --- ql/src/test/results/clientpositive/llap/mapjoin_mapjoin.q.out +++ ql/src/test/results/clientpositive/llap/mapjoin_mapjoin.q.out @@ -572,9 +572,9 @@ STAGE PLANS: condition map: Inner Join 0 to 1 keys: - 0 _col1 (type: string) + 0 _col0 (type: string) 1 _col0 (type: string) - outputColumnNames: _col0, _col2 + outputColumnNames: _col1, _col2 input vertices: 1 Map 3 Statistics: Num rows: 2200 Data size: 23372 Basic stats: COMPLETE Column stats: NONE @@ -582,7 +582,7 @@ STAGE PLANS: condition map: Inner Join 0 to 1 keys: - 0 _col0 (type: string) + 0 _col1 (type: string) 1 _col0 (type: string) outputColumnNames: _col2 input vertices: @@ -605,13 +605,13 @@ STAGE PLANS: Map 3 Map Operator Tree: TableScan - alias: src + alias: src1 Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Filter Operator - predicate: value is not null (type: boolean) + predicate: key is not null (type: boolean) Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Select Operator - expressions: value (type: string) + expressions: key (type: string) outputColumnNames: _col0 Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator @@ -624,13 +624,13 @@ STAGE PLANS: Map 4 Map Operator Tree: TableScan - alias: src1 + alias: src Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Filter Operator - predicate: key is not null (type: boolean) + predicate: value is not null (type: boolean) Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Select Operator - expressions: key (type: string) + expressions: value (type: string) outputColumnNames: _col0 Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator diff --git 
ql/src/test/results/clientpositive/llap/mergejoin.q.out ql/src/test/results/clientpositive/llap/mergejoin.q.out index cec7c7e..05338c3 100644 --- ql/src/test/results/clientpositive/llap/mergejoin.q.out +++ ql/src/test/results/clientpositive/llap/mergejoin.q.out @@ -170,10 +170,10 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 40 Data size: 14120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 13767 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 40 Data size: 14120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 13767 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -410,7 +410,7 @@ STAGE PLANS: TableScan alias: a filterExpr: key is not null (type: boolean) - Statistics: Num rows: 242 Data size: 23672 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE TableScan Vectorization: native: true vectorizationSchemaColumns: [0:key:int, 1:value:string, 2:ds:string, 3:ROW__ID:struct] @@ -420,7 +420,7 @@ STAGE PLANS: native: true predicateExpression: SelectColumnIsNotNull(col 0:int) predicate: key is not null (type: boolean) - Statistics: Num rows: 230 Data size: 22498 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: key (type: int) outputColumnNames: _col0 @@ -428,7 +428,7 @@ STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: [0] - Statistics: Num rows: 230 Data size: 22498 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Reduce 
Output Operator key expressions: _col0 (type: int) sort order: + @@ -439,7 +439,7 @@ STAGE PLANS: native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumnNums: [] - Statistics: Num rows: 230 Data size: 22498 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: all inputs Map Vectorization: @@ -463,7 +463,7 @@ STAGE PLANS: TableScan alias: b filterExpr: key is not null (type: boolean) - Statistics: Num rows: 500 Data size: 48904 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE TableScan Vectorization: native: true vectorizationSchemaColumns: [0:key:int, 1:value:string, 2:ds:string, 3:ROW__ID:struct] @@ -473,7 +473,7 @@ STAGE PLANS: native: true predicateExpression: SelectColumnIsNotNull(col 0:int) predicate: key is not null (type: boolean) - Statistics: Num rows: 475 Data size: 46458 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: key (type: int) outputColumnNames: _col0 @@ -481,7 +481,7 @@ STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: [0] - Statistics: Num rows: 475 Data size: 46458 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort order: + @@ -492,7 +492,7 @@ STAGE PLANS: native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, 
BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumnNums: [] - Statistics: Num rows: 475 Data size: 46458 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: all inputs Map Vectorization: @@ -520,15 +520,15 @@ STAGE PLANS: keys: 0 _col0 (type: int) 1 _col0 (type: int) - Statistics: Num rows: 522 Data size: 51103 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 399 Data size: 3192 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator sort order: - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint) Reducer 3 Execution mode: vectorized, llap @@ -557,13 +557,13 @@ STAGE PLANS: projectedOutputColumnNums: [0] mode: mergepartial outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false File Sink Vectorization: className: VectorFileSinkOperator native: false - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -1592,7 +1592,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: a - Statistics: Num rows: 242 Data size: 23672 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 
Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE TableScan Vectorization: native: true vectorizationSchemaColumns: [0:key:int, 1:value:string, 2:ds:string, 3:ROW__ID:struct] @@ -1603,7 +1603,7 @@ STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: [0] - Statistics: Num rows: 242 Data size: 23672 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort order: + @@ -1614,7 +1614,7 @@ STAGE PLANS: native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumnNums: [] - Statistics: Num rows: 242 Data size: 23672 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: all inputs Map Vectorization: @@ -1637,7 +1637,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: b - Statistics: Num rows: 500 Data size: 48904 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE TableScan Vectorization: native: true vectorizationSchemaColumns: [0:key:int, 1:value:string, 2:ds:string, 3:ROW__ID:struct] @@ -1648,7 +1648,7 @@ STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: [0] - Statistics: Num rows: 500 Data size: 48904 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort order: + @@ -1659,7 +1659,7 @@ STAGE PLANS: native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN 
[tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumnNums: [] - Statistics: Num rows: 500 Data size: 48904 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: all inputs Map Vectorization: @@ -1687,15 +1687,15 @@ STAGE PLANS: keys: 0 _col0 (type: int) 1 _col0 (type: int) - Statistics: Num rows: 550 Data size: 53794 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 399 Data size: 3192 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator sort order: - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint) Reducer 3 Execution mode: vectorized, llap @@ -1724,13 +1724,13 @@ STAGE PLANS: projectedOutputColumnNums: [0] mode: mergepartial outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false File Sink Vectorization: className: VectorFileSinkOperator native: false - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -1788,7 +1788,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: a - Statistics: Num rows: 242 Data size: 
23672 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE TableScan Vectorization: native: true vectorizationSchemaColumns: [0:key:int, 1:value:string, 2:ds:string, 3:ROW__ID:struct] @@ -1799,7 +1799,7 @@ STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: [0] - Statistics: Num rows: 242 Data size: 23672 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort order: + @@ -1810,7 +1810,7 @@ STAGE PLANS: native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumnNums: [] - Statistics: Num rows: 242 Data size: 23672 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: all inputs Map Vectorization: @@ -1833,7 +1833,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: b - Statistics: Num rows: 500 Data size: 48904 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE TableScan Vectorization: native: true vectorizationSchemaColumns: [0:key:int, 1:value:string, 2:ds:string, 3:ROW__ID:struct] @@ -1844,7 +1844,7 @@ STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: [0] - Statistics: Num rows: 500 Data size: 48904 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort order: + @@ -1855,7 +1855,7 @@ STAGE PLANS: native: true nativeConditionsMet: 
hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumnNums: [] - Statistics: Num rows: 500 Data size: 48904 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: all inputs Map Vectorization: @@ -1883,15 +1883,15 @@ STAGE PLANS: keys: 0 _col0 (type: int) 1 _col0 (type: int) - Statistics: Num rows: 550 Data size: 53794 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 4000 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator sort order: - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint) Reducer 3 Execution mode: vectorized, llap @@ -1920,13 +1920,13 @@ STAGE PLANS: projectedOutputColumnNums: [0] mode: mergepartial outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false File Sink Vectorization: className: VectorFileSinkOperator native: false - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -1984,7 +1984,7 @@ 
STAGE PLANS: Map Operator Tree: TableScan alias: a - Statistics: Num rows: 242 Data size: 23672 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE TableScan Vectorization: native: true vectorizationSchemaColumns: [0:key:int, 1:value:string, 2:ds:string, 3:ROW__ID:struct] @@ -1995,7 +1995,7 @@ STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: [0] - Statistics: Num rows: 242 Data size: 23672 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort order: + @@ -2006,7 +2006,7 @@ STAGE PLANS: native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumnNums: [] - Statistics: Num rows: 242 Data size: 23672 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: all inputs Map Vectorization: @@ -2029,7 +2029,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: b - Statistics: Num rows: 500 Data size: 48904 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE TableScan Vectorization: native: true vectorizationSchemaColumns: [0:key:int, 1:value:string, 2:ds:string, 3:ROW__ID:struct] @@ -2040,7 +2040,7 @@ STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: [0] - Statistics: Num rows: 500 Data size: 48904 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort 
order: + @@ -2051,7 +2051,7 @@ STAGE PLANS: native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumnNums: [] - Statistics: Num rows: 500 Data size: 48904 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: all inputs Map Vectorization: @@ -2079,15 +2079,15 @@ STAGE PLANS: keys: 0 _col0 (type: int) 1 _col0 (type: int) - Statistics: Num rows: 550 Data size: 53794 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 742 Data size: 5936 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator sort order: - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint) Reducer 3 Execution mode: vectorized, llap @@ -2116,13 +2116,13 @@ STAGE PLANS: projectedOutputColumnNums: [0] mode: mergepartial outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false File Sink Vectorization: className: VectorFileSinkOperator native: false - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: 
org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -2170,11 +2170,13 @@ STAGE PLANS: Tez #### A masked pattern was here #### Edges: - Map 1 <- Reducer 6 (BROADCAST_EDGE) - Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 5 (SIMPLE_EDGE) - Reducer 3 <- Map 7 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) + Map 1 <- Reducer 7 (BROADCAST_EDGE) + Map 8 <- Reducer 5 (BROADCAST_EDGE) + Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 6 (SIMPLE_EDGE) + Reducer 3 <- Map 8 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) Reducer 4 <- Reducer 3 (CUSTOM_SIMPLE_EDGE) - Reducer 6 <- Map 5 (CUSTOM_SIMPLE_EDGE) + Reducer 5 <- Reducer 2 (CUSTOM_SIMPLE_EDGE) + Reducer 7 <- Map 6 (CUSTOM_SIMPLE_EDGE) #### A masked pattern was here #### Vertices: Map 1 @@ -2182,7 +2184,7 @@ STAGE PLANS: TableScan alias: a filterExpr: (key is not null and value is not null and (value BETWEEN DynamicValue(RS_10_c_value_min) AND DynamicValue(RS_10_c_value_max) and in_bloom_filter(value, DynamicValue(RS_10_c_value_bloom_filter)))) (type: boolean) - Statistics: Num rows: 242 Data size: 43428 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 22990 Basic stats: COMPLETE Column stats: COMPLETE TableScan Vectorization: native: true vectorizationSchemaColumns: [0:key:int, 1:value:string, 2:ds:string, 3:ROW__ID:struct] @@ -2192,7 +2194,7 @@ STAGE PLANS: native: true predicateExpression: FilterExprAndExpr(children: SelectColumnIsNotNull(col 0:int), SelectColumnIsNotNull(col 1:string), FilterExprAndExpr(children: FilterStringColumnBetweenDynamicValue(col 1:string, left NULL, right NULL), VectorInBloomFilterColDynamicValue)) predicate: ((value BETWEEN DynamicValue(RS_10_c_value_min) AND DynamicValue(RS_10_c_value_max) and in_bloom_filter(value, DynamicValue(RS_10_c_value_bloom_filter))) and key is not null and value is not null) (type: boolean) - Statistics: Num rows: 218 Data size: 39121 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 22990 Basic stats: COMPLETE Column stats: 
COMPLETE Select Operator expressions: key (type: int), value (type: string) outputColumnNames: _col0, _col1 @@ -2200,7 +2202,7 @@ STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: [0, 1] - Statistics: Num rows: 218 Data size: 39121 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 22990 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: string) sort order: + @@ -2211,7 +2213,7 @@ STAGE PLANS: native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumnNums: [0] - Statistics: Num rows: 218 Data size: 39121 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 22990 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: int) Execution mode: vectorized, llap LLAP IO: all inputs @@ -2231,7 +2233,7 @@ STAGE PLANS: partitionColumnCount: 1 partitionColumns: ds:string scratchColumnTypeNames: [] - Map 5 + Map 6 Map Operator Tree: TableScan alias: c @@ -2314,12 +2316,12 @@ STAGE PLANS: dataColumns: key:string, value:string partitionColumnCount: 0 scratchColumnTypeNames: [] - Map 7 + Map 8 Map Operator Tree: TableScan alias: b - filterExpr: key is not null (type: boolean) - Statistics: Num rows: 500 Data size: 1904 Basic stats: COMPLETE Column stats: NONE + filterExpr: (key is not null and (key BETWEEN DynamicValue(RS_12_a_key_min) AND DynamicValue(RS_12_a_key_max) and in_bloom_filter(key, DynamicValue(RS_12_a_key_bloom_filter)))) (type: boolean) + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE TableScan Vectorization: native: true vectorizationSchemaColumns: [0:key:int, 1:value:string, 2:ds:string, 3:ROW__ID:struct] @@ -2327,9 +2329,9 @@ STAGE PLANS: Filter 
Vectorization: className: VectorFilterOperator native: true - predicateExpression: SelectColumnIsNotNull(col 0:int) - predicate: key is not null (type: boolean) - Statistics: Num rows: 475 Data size: 1808 Basic stats: COMPLETE Column stats: NONE + predicateExpression: FilterExprAndExpr(children: SelectColumnIsNotNull(col 0:int), FilterExprAndExpr(children: FilterLongColumnBetweenDynamicValue(col 0:int, left 0, right 0), VectorInBloomFilterColDynamicValue)) + predicate: ((key BETWEEN DynamicValue(RS_12_a_key_min) AND DynamicValue(RS_12_a_key_max) and in_bloom_filter(key, DynamicValue(RS_12_a_key_bloom_filter))) and key is not null) (type: boolean) + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: key (type: int) outputColumnNames: _col0 @@ -2337,7 +2339,7 @@ STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: [0] - Statistics: Num rows: 475 Data size: 1808 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort order: + @@ -2348,7 +2350,7 @@ STAGE PLANS: native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumnNums: [] - Statistics: Num rows: 475 Data size: 1808 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: all inputs Map Vectorization: @@ -2377,12 +2379,25 @@ STAGE PLANS: 0 _col1 (type: string) 1 _col0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 239 Data size: 43033 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 39 Data size: 156 Basic stats: COMPLETE 
Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort order: + Map-reduce partition columns: _col0 (type: int) - Statistics: Num rows: 239 Data size: 43033 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 39 Data size: 156 Basic stats: COMPLETE Column stats: COMPLETE + Select Operator + expressions: _col0 (type: int) + outputColumnNames: _col0 + Statistics: Num rows: 39 Data size: 156 Basic stats: COMPLETE Column stats: COMPLETE + Group By Operator + aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=25) + mode: hash + outputColumnNames: _col0, _col1, _col2 + Statistics: Num rows: 1 Data size: 12 Basic stats: COMPLETE Column stats: COMPLETE + Reduce Output Operator + sort order: + Statistics: Num rows: 1 Data size: 12 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col0 (type: int), _col1 (type: int), _col2 (type: binary) Reducer 3 Execution mode: llap Reduce Operator Tree: @@ -2392,15 +2407,15 @@ STAGE PLANS: keys: 0 _col0 (type: int) 1 _col0 (type: int) - Statistics: Num rows: 522 Data size: 1988 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 64 Data size: 512 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator sort order: - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint) Reducer 4 Execution mode: vectorized, llap @@ -2429,18 +2444,56 @@ STAGE PLANS: projectedOutputColumnNums: [0] mode: mergepartial outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: 
COMPLETE Column stats: COMPLETE File Output Operator compressed: false File Sink Vectorization: className: VectorFileSinkOperator native: false - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe - Reducer 6 + Reducer 5 + Execution mode: vectorized, llap + Reduce Vectorization: + enabled: true + enableConditionsMet: hive.vectorized.execution.reduce.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true + reduceColumnNullOrder: + reduceColumnSortOrder: + allNative: false + usesVectorUDFAdaptor: false + vectorized: true + rowBatchContext: + dataColumnCount: 3 + dataColumns: VALUE._col0:int, VALUE._col1:int, VALUE._col2:binary + partitionColumnCount: 0 + scratchColumnTypeNames: [] + Reduce Operator Tree: + Group By Operator + aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, expectedEntries=25) + Group By Vectorization: + aggregators: VectorUDAFMinLong(col 0:int) -> int, VectorUDAFMaxLong(col 1:int) -> int, VectorUDAFBloomFilterMerge(col 2:binary) -> binary + className: VectorGroupByOperator + groupByMode: FINAL + native: false + vectorProcessingMode: STREAMING + projectedOutputColumnNums: [0, 1, 2] + mode: final + outputColumnNames: _col0, _col1, _col2 + Statistics: Num rows: 1 Data size: 12 Basic stats: COMPLETE Column stats: COMPLETE + Reduce Output Operator + sort order: + Reduce Sink Vectorization: + className: VectorReduceSinkEmptyKeyOperator + keyColumnNums: [] + native: true + nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for 
values IS true + valueColumnNums: [0, 1, 2] + Statistics: Num rows: 1 Data size: 12 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col0 (type: int), _col1 (type: int), _col2 (type: binary) + Reducer 7 Execution mode: vectorized, llap Reduce Vectorization: enabled: true @@ -2530,7 +2583,7 @@ STAGE PLANS: TableScan alias: a filterExpr: value is not null (type: boolean) - Statistics: Num rows: 242 Data size: 65252 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 22022 Basic stats: COMPLETE Column stats: COMPLETE TableScan Vectorization: native: true vectorizationSchemaColumns: [0:key:int, 1:value:string, 2:ds:string, 3:ROW__ID:struct] @@ -2540,7 +2593,7 @@ STAGE PLANS: native: true predicateExpression: SelectColumnIsNotNull(col 1:string) predicate: value is not null (type: boolean) - Statistics: Num rows: 230 Data size: 62016 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 22022 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: value (type: string) outputColumnNames: _col1 @@ -2548,7 +2601,7 @@ STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: [1] - Statistics: Num rows: 230 Data size: 62016 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 22022 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: string) sort order: + @@ -2559,7 +2612,7 @@ STAGE PLANS: native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumnNums: [] - Statistics: Num rows: 230 Data size: 62016 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 22022 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: all 
inputs Map Vectorization: @@ -2583,7 +2636,7 @@ STAGE PLANS: TableScan alias: b filterExpr: value is not null (type: boolean) - Statistics: Num rows: 500 Data size: 134584 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 45500 Basic stats: COMPLETE Column stats: COMPLETE TableScan Vectorization: native: true vectorizationSchemaColumns: [0:key:int, 1:value:string, 2:ds:string, 3:ROW__ID:struct] @@ -2593,7 +2646,7 @@ STAGE PLANS: native: true predicateExpression: SelectColumnIsNotNull(col 1:string) predicate: value is not null (type: boolean) - Statistics: Num rows: 475 Data size: 127854 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 45500 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: value (type: string) outputColumnNames: _col1 @@ -2601,7 +2654,7 @@ STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: [1] - Statistics: Num rows: 475 Data size: 127854 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 45500 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: string) sort order: + @@ -2612,7 +2665,7 @@ STAGE PLANS: native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumnNums: [] - Statistics: Num rows: 475 Data size: 127854 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 45500 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: all inputs Map Vectorization: @@ -2640,15 +2693,15 @@ STAGE PLANS: keys: 0 _col1 (type: string) 1 _col1 (type: string) - Statistics: Num rows: 522 Data size: 140639 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 394 Data size: 3152 Basic stats: 
COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator sort order: - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint) Reducer 3 Execution mode: vectorized, llap @@ -2677,13 +2730,13 @@ STAGE PLANS: projectedOutputColumnNums: [0] mode: mergepartial outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false File Sink Vectorization: className: VectorFileSinkOperator native: false - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -2746,7 +2799,7 @@ STAGE PLANS: TableScan alias: s1 filterExpr: key is not null (type: boolean) - Statistics: Num rows: 242 Data size: 924 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE TableScan Vectorization: native: true vectorizationSchemaColumns: [0:key:int, 1:value:string, 2:ds:string, 3:ROW__ID:struct] @@ -2756,7 +2809,7 @@ STAGE PLANS: native: true predicateExpression: SelectColumnIsNotNull(col 0:int) predicate: key is not null (type: boolean) - Statistics: Num rows: 230 Data size: 878 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: key 
(type: int) outputColumnNames: _col0 @@ -2764,7 +2817,7 @@ STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: [0] - Statistics: Num rows: 230 Data size: 878 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort order: + @@ -2775,7 +2828,7 @@ STAGE PLANS: native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumnNums: [] - Statistics: Num rows: 230 Data size: 878 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: all inputs Map Vectorization: @@ -2799,7 +2852,7 @@ STAGE PLANS: TableScan alias: s3 filterExpr: key is not null (type: boolean) - Statistics: Num rows: 242 Data size: 924 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE TableScan Vectorization: native: true vectorizationSchemaColumns: [0:key:int, 1:value:string, 2:ds:string, 3:ROW__ID:struct] @@ -2809,7 +2862,7 @@ STAGE PLANS: native: true predicateExpression: SelectColumnIsNotNull(col 0:int) predicate: key is not null (type: boolean) - Statistics: Num rows: 230 Data size: 878 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: key (type: int) outputColumnNames: _col0 @@ -2817,7 +2870,7 @@ STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: [0] - Statistics: Num rows: 230 Data size: 878 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE 
Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort order: + @@ -2828,7 +2881,7 @@ STAGE PLANS: native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumnNums: [] - Statistics: Num rows: 230 Data size: 878 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: all inputs Map Vectorization: @@ -2852,7 +2905,7 @@ STAGE PLANS: TableScan alias: s2 filterExpr: key is not null (type: boolean) - Statistics: Num rows: 242 Data size: 924 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE TableScan Vectorization: native: true vectorizationSchemaColumns: [0:key:int, 1:value:string, 2:ds:string, 3:ROW__ID:struct] @@ -2862,7 +2915,7 @@ STAGE PLANS: native: true predicateExpression: SelectColumnIsNotNull(col 0:int) predicate: key is not null (type: boolean) - Statistics: Num rows: 230 Data size: 878 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: key (type: int) outputColumnNames: _col0 @@ -2870,7 +2923,7 @@ STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: [0] - Statistics: Num rows: 230 Data size: 878 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort order: + @@ -2881,7 +2934,7 @@ STAGE PLANS: native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No 
DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumnNums: [] - Statistics: Num rows: 483 Data size: 1843 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 624 Data size: 2496 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: all inputs Map Vectorization: @@ -2905,7 +2958,7 @@ STAGE PLANS: TableScan alias: b filterExpr: key is not null (type: boolean) - Statistics: Num rows: 500 Data size: 1904 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE TableScan Vectorization: native: true vectorizationSchemaColumns: [0:key:int, 1:value:string, 2:ds:string, 3:ROW__ID:struct] @@ -2915,7 +2968,7 @@ STAGE PLANS: native: true predicateExpression: SelectColumnIsNotNull(col 0:int) predicate: key is not null (type: boolean) - Statistics: Num rows: 475 Data size: 1808 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: key (type: int) outputColumnNames: _col0 @@ -2923,7 +2976,7 @@ STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: [0] - Statistics: Num rows: 475 Data size: 1808 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort order: + @@ -2934,7 +2987,7 @@ STAGE PLANS: native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumnNums: [] - Statistics: Num rows: 475 Data size: 1808 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: 
COMPLETE Execution mode: vectorized, llap LLAP IO: all inputs Map Vectorization: @@ -2963,12 +3016,12 @@ STAGE PLANS: 0 _col0 (type: int) 1 _col0 (type: int) outputColumnNames: _col0 - Statistics: Num rows: 253 Data size: 965 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 382 Data size: 1528 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort order: + Map-reduce partition columns: _col0 (type: int) - Statistics: Num rows: 483 Data size: 1843 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 624 Data size: 2496 Basic stats: COMPLETE Column stats: COMPLETE Reducer 4 Execution mode: llap Reduce Operator Tree: @@ -2978,15 +3031,15 @@ STAGE PLANS: keys: 0 _col0 (type: int) 1 _col0 (type: int) - Statistics: Num rows: 531 Data size: 2027 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1029 Data size: 8232 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator sort order: - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint) Reducer 5 Execution mode: vectorized, llap @@ -3015,13 +3068,13 @@ STAGE PLANS: projectedOutputColumnNums: [0] mode: mergepartial outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false File Sink Vectorization: className: VectorFileSinkOperator native: false - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic 
stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -3063,7 +3116,7 @@ STAGE PLANS: TableScan alias: a filterExpr: value is not null (type: boolean) - Statistics: Num rows: 242 Data size: 65252 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 22022 Basic stats: COMPLETE Column stats: COMPLETE TableScan Vectorization: native: true vectorizationSchemaColumns: [0:key:int, 1:value:string, 2:ds:string, 3:ROW__ID:struct] @@ -3073,7 +3126,7 @@ STAGE PLANS: native: true predicateExpression: SelectColumnIsNotNull(col 1:string) predicate: value is not null (type: boolean) - Statistics: Num rows: 230 Data size: 62016 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 22022 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: value (type: string) outputColumnNames: _col1 @@ -3081,7 +3134,7 @@ STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: [1] - Statistics: Num rows: 230 Data size: 62016 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 22022 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: string) sort order: + @@ -3092,7 +3145,7 @@ STAGE PLANS: native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumnNums: [] - Statistics: Num rows: 230 Data size: 62016 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 22022 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: all inputs Map Vectorization: @@ -3116,7 +3169,7 @@ STAGE PLANS: TableScan alias: b filterExpr: value is not null 
(type: boolean) - Statistics: Num rows: 500 Data size: 134584 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 45500 Basic stats: COMPLETE Column stats: COMPLETE TableScan Vectorization: native: true vectorizationSchemaColumns: [0:key:int, 1:value:string, 2:ds:string, 3:ROW__ID:struct] @@ -3126,7 +3179,7 @@ STAGE PLANS: native: true predicateExpression: SelectColumnIsNotNull(col 1:string) predicate: value is not null (type: boolean) - Statistics: Num rows: 475 Data size: 127854 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 45500 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: value (type: string) outputColumnNames: _col1 @@ -3134,7 +3187,7 @@ STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: [1] - Statistics: Num rows: 475 Data size: 127854 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 45500 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: string) sort order: + @@ -3145,7 +3198,7 @@ STAGE PLANS: native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumnNums: [] - Statistics: Num rows: 475 Data size: 127854 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 45500 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: all inputs Map Vectorization: @@ -3173,15 +3226,15 @@ STAGE PLANS: keys: 0 _col1 (type: string) 1 _col1 (type: string) - Statistics: Num rows: 522 Data size: 140639 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 394 Data size: 3152 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash outputColumnNames: _col0 - 
Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator sort order: - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint) Reducer 3 Execution mode: vectorized, llap @@ -3210,13 +3263,13 @@ STAGE PLANS: projectedOutputColumnNums: [0] mode: mergepartial outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false File Sink Vectorization: className: VectorFileSinkOperator native: false - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -3262,11 +3315,13 @@ STAGE PLANS: Tez #### A masked pattern was here #### Edges: - Map 1 <- Reducer 6 (BROADCAST_EDGE) - Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 5 (SIMPLE_EDGE) - Reducer 3 <- Map 7 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) + Map 1 <- Reducer 7 (BROADCAST_EDGE) + Map 8 <- Reducer 5 (BROADCAST_EDGE) + Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 6 (SIMPLE_EDGE) + Reducer 3 <- Map 8 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) Reducer 4 <- Reducer 3 (CUSTOM_SIMPLE_EDGE) - Reducer 6 <- Map 5 (CUSTOM_SIMPLE_EDGE) + Reducer 5 <- Reducer 2 (CUSTOM_SIMPLE_EDGE) + Reducer 7 <- Map 6 (CUSTOM_SIMPLE_EDGE) #### A masked pattern was here #### Vertices: Map 1 @@ -3274,7 +3329,7 @@ STAGE PLANS: TableScan alias: a filterExpr: (key is not null and value is not null and (value BETWEEN DynamicValue(RS_10_c_value_min) AND DynamicValue(RS_10_c_value_max) and 
in_bloom_filter(value, DynamicValue(RS_10_c_value_bloom_filter)))) (type: boolean) - Statistics: Num rows: 242 Data size: 43428 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 22990 Basic stats: COMPLETE Column stats: COMPLETE TableScan Vectorization: native: true vectorizationSchemaColumns: [0:key:int, 1:value:string, 2:ds:string, 3:ROW__ID:struct] @@ -3284,7 +3339,7 @@ STAGE PLANS: native: true predicateExpression: FilterExprAndExpr(children: SelectColumnIsNotNull(col 0:int), SelectColumnIsNotNull(col 1:string), FilterExprAndExpr(children: FilterStringColumnBetweenDynamicValue(col 1:string, left NULL, right NULL), VectorInBloomFilterColDynamicValue)) predicate: ((value BETWEEN DynamicValue(RS_10_c_value_min) AND DynamicValue(RS_10_c_value_max) and in_bloom_filter(value, DynamicValue(RS_10_c_value_bloom_filter))) and key is not null and value is not null) (type: boolean) - Statistics: Num rows: 218 Data size: 39121 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 22990 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: key (type: int), value (type: string) outputColumnNames: _col0, _col1 @@ -3292,7 +3347,7 @@ STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: [0, 1] - Statistics: Num rows: 218 Data size: 39121 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 22990 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: string) sort order: + @@ -3303,7 +3358,7 @@ STAGE PLANS: native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumnNums: [0] - Statistics: Num rows: 218 Data size: 39121 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data 
size: 22990 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: int) Execution mode: vectorized, llap LLAP IO: all inputs @@ -3323,7 +3378,7 @@ STAGE PLANS: partitionColumnCount: 1 partitionColumns: ds:string scratchColumnTypeNames: [] - Map 5 + Map 6 Map Operator Tree: TableScan alias: c @@ -3406,12 +3461,12 @@ STAGE PLANS: dataColumns: key:string, value:string partitionColumnCount: 0 scratchColumnTypeNames: [] - Map 7 + Map 8 Map Operator Tree: TableScan alias: b - filterExpr: key is not null (type: boolean) - Statistics: Num rows: 500 Data size: 1904 Basic stats: COMPLETE Column stats: NONE + filterExpr: (key is not null and (key BETWEEN DynamicValue(RS_12_a_key_min) AND DynamicValue(RS_12_a_key_max) and in_bloom_filter(key, DynamicValue(RS_12_a_key_bloom_filter)))) (type: boolean) + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE TableScan Vectorization: native: true vectorizationSchemaColumns: [0:key:int, 1:value:string, 2:ds:string, 3:ROW__ID:struct] @@ -3419,9 +3474,9 @@ STAGE PLANS: Filter Vectorization: className: VectorFilterOperator native: true - predicateExpression: SelectColumnIsNotNull(col 0:int) - predicate: key is not null (type: boolean) - Statistics: Num rows: 475 Data size: 1808 Basic stats: COMPLETE Column stats: NONE + predicateExpression: FilterExprAndExpr(children: SelectColumnIsNotNull(col 0:int), FilterExprAndExpr(children: FilterLongColumnBetweenDynamicValue(col 0:int, left 0, right 0), VectorInBloomFilterColDynamicValue)) + predicate: ((key BETWEEN DynamicValue(RS_12_a_key_min) AND DynamicValue(RS_12_a_key_max) and in_bloom_filter(key, DynamicValue(RS_12_a_key_bloom_filter))) and key is not null) (type: boolean) + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: key (type: int) outputColumnNames: _col0 @@ -3429,7 +3484,7 @@ STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: 
[0] - Statistics: Num rows: 475 Data size: 1808 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort order: + @@ -3440,7 +3495,7 @@ STAGE PLANS: native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumnNums: [] - Statistics: Num rows: 475 Data size: 1808 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: all inputs Map Vectorization: @@ -3469,12 +3524,25 @@ STAGE PLANS: 0 _col1 (type: string) 1 _col0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 239 Data size: 43033 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 39 Data size: 156 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort order: + Map-reduce partition columns: _col0 (type: int) - Statistics: Num rows: 239 Data size: 43033 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 39 Data size: 156 Basic stats: COMPLETE Column stats: COMPLETE + Select Operator + expressions: _col0 (type: int) + outputColumnNames: _col0 + Statistics: Num rows: 39 Data size: 156 Basic stats: COMPLETE Column stats: COMPLETE + Group By Operator + aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=25) + mode: hash + outputColumnNames: _col0, _col1, _col2 + Statistics: Num rows: 1 Data size: 12 Basic stats: COMPLETE Column stats: COMPLETE + Reduce Output Operator + sort order: + Statistics: Num rows: 1 Data size: 12 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col0 (type: int), _col1 (type: int), _col2 (type: binary) 
Reducer 3 Execution mode: llap Reduce Operator Tree: @@ -3484,15 +3552,15 @@ STAGE PLANS: keys: 0 _col0 (type: int) 1 _col0 (type: int) - Statistics: Num rows: 522 Data size: 1988 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 64 Data size: 512 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator sort order: - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint) Reducer 4 Execution mode: vectorized, llap @@ -3521,18 +3589,56 @@ STAGE PLANS: projectedOutputColumnNums: [0] mode: mergepartial outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false File Sink Vectorization: className: VectorFileSinkOperator native: false - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe - Reducer 6 + Reducer 5 + Execution mode: vectorized, llap + Reduce Vectorization: + enabled: true + enableConditionsMet: hive.vectorized.execution.reduce.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true + reduceColumnNullOrder: + reduceColumnSortOrder: + allNative: false + usesVectorUDFAdaptor: false + vectorized: true + rowBatchContext: + dataColumnCount: 3 + dataColumns: VALUE._col0:int, 
VALUE._col1:int, VALUE._col2:binary + partitionColumnCount: 0 + scratchColumnTypeNames: [] + Reduce Operator Tree: + Group By Operator + aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, expectedEntries=25) + Group By Vectorization: + aggregators: VectorUDAFMinLong(col 0:int) -> int, VectorUDAFMaxLong(col 1:int) -> int, VectorUDAFBloomFilterMerge(col 2:binary) -> binary + className: VectorGroupByOperator + groupByMode: FINAL + native: false + vectorProcessingMode: STREAMING + projectedOutputColumnNums: [0, 1, 2] + mode: final + outputColumnNames: _col0, _col1, _col2 + Statistics: Num rows: 1 Data size: 12 Basic stats: COMPLETE Column stats: COMPLETE + Reduce Output Operator + sort order: + Reduce Sink Vectorization: + className: VectorReduceSinkEmptyKeyOperator + keyColumnNums: [] + native: true + nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true + valueColumnNums: [0, 1, 2] + Statistics: Num rows: 1 Data size: 12 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col0 (type: int), _col1 (type: int), _col2 (type: binary) + Reducer 7 Execution mode: vectorized, llap Reduce Vectorization: enabled: true @@ -3630,7 +3736,7 @@ STAGE PLANS: TableScan alias: s1 filterExpr: key is not null (type: boolean) - Statistics: Num rows: 242 Data size: 924 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE TableScan Vectorization: native: true vectorizationSchemaColumns: [0:key:int, 1:value:string, 2:ds:string, 3:ROW__ID:struct] @@ -3640,7 +3746,7 @@ STAGE PLANS: native: true predicateExpression: SelectColumnIsNotNull(col 0:int) predicate: key is not null (type: boolean) - Statistics: Num rows: 230 Data size: 878 Basic stats: COMPLETE Column stats: NONE + 
Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: key (type: int) outputColumnNames: _col0 @@ -3648,7 +3754,7 @@ STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: [0] - Statistics: Num rows: 230 Data size: 878 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort order: + @@ -3659,7 +3765,7 @@ STAGE PLANS: native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumnNums: [] - Statistics: Num rows: 230 Data size: 878 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: all inputs Map Vectorization: @@ -3683,7 +3789,7 @@ STAGE PLANS: TableScan alias: s3 filterExpr: key is not null (type: boolean) - Statistics: Num rows: 242 Data size: 924 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE TableScan Vectorization: native: true vectorizationSchemaColumns: [0:key:int, 1:value:string, 2:ds:string, 3:ROW__ID:struct] @@ -3693,7 +3799,7 @@ STAGE PLANS: native: true predicateExpression: SelectColumnIsNotNull(col 0:int) predicate: key is not null (type: boolean) - Statistics: Num rows: 230 Data size: 878 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: key (type: int) outputColumnNames: _col0 @@ -3701,7 +3807,7 @@ STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: [0] - Statistics: Num rows: 230 
Data size: 878 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort order: + @@ -3712,7 +3818,7 @@ STAGE PLANS: native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumnNums: [] - Statistics: Num rows: 230 Data size: 878 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: all inputs Map Vectorization: @@ -3736,7 +3842,7 @@ STAGE PLANS: TableScan alias: s2 filterExpr: key is not null (type: boolean) - Statistics: Num rows: 242 Data size: 924 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE TableScan Vectorization: native: true vectorizationSchemaColumns: [0:key:int, 1:value:string, 2:ds:string, 3:ROW__ID:struct] @@ -3746,7 +3852,7 @@ STAGE PLANS: native: true predicateExpression: SelectColumnIsNotNull(col 0:int) predicate: key is not null (type: boolean) - Statistics: Num rows: 230 Data size: 878 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: key (type: int) outputColumnNames: _col0 @@ -3754,7 +3860,7 @@ STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: [0] - Statistics: Num rows: 230 Data size: 878 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort order: + @@ -3765,7 +3871,7 @@ STAGE PLANS: native: true nativeConditionsMet: 
hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumnNums: [] - Statistics: Num rows: 483 Data size: 1843 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 624 Data size: 2496 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: all inputs Map Vectorization: @@ -3789,7 +3895,7 @@ STAGE PLANS: TableScan alias: b filterExpr: key is not null (type: boolean) - Statistics: Num rows: 500 Data size: 1904 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE TableScan Vectorization: native: true vectorizationSchemaColumns: [0:key:int, 1:value:string, 2:ds:string, 3:ROW__ID:struct] @@ -3799,7 +3905,7 @@ STAGE PLANS: native: true predicateExpression: SelectColumnIsNotNull(col 0:int) predicate: key is not null (type: boolean) - Statistics: Num rows: 475 Data size: 1808 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: key (type: int) outputColumnNames: _col0 @@ -3807,7 +3913,7 @@ STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: [0] - Statistics: Num rows: 475 Data size: 1808 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort order: + @@ -3818,7 +3924,7 @@ STAGE PLANS: native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumnNums: [] - Statistics: Num rows: 475 Data 
size: 1808 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: all inputs Map Vectorization: @@ -3847,12 +3953,12 @@ STAGE PLANS: 0 _col0 (type: int) 1 _col0 (type: int) outputColumnNames: _col0 - Statistics: Num rows: 253 Data size: 965 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 382 Data size: 1528 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort order: + Map-reduce partition columns: _col0 (type: int) - Statistics: Num rows: 483 Data size: 1843 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 624 Data size: 2496 Basic stats: COMPLETE Column stats: COMPLETE Reducer 4 Execution mode: llap Reduce Operator Tree: @@ -3862,15 +3968,15 @@ STAGE PLANS: keys: 0 _col0 (type: int) 1 _col0 (type: int) - Statistics: Num rows: 531 Data size: 2027 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1029 Data size: 8232 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator sort order: - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint) Reducer 5 Execution mode: vectorized, llap @@ -3899,13 +4005,13 @@ STAGE PLANS: projectedOutputColumnNums: [0] mode: mergepartial outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false File Sink Vectorization: className: VectorFileSinkOperator native: 
false - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -3961,7 +4067,7 @@ STAGE PLANS: TableScan alias: t1 filterExpr: key is not null (type: boolean) - Statistics: Num rows: 242 Data size: 66176 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 22990 Basic stats: COMPLETE Column stats: COMPLETE TableScan Vectorization: native: true vectorizationSchemaColumns: [0:key:int, 1:value:string, 2:ds:string, 3:ROW__ID:struct] @@ -3971,7 +4077,7 @@ STAGE PLANS: native: true predicateExpression: SelectColumnIsNotNull(col 0:int) predicate: key is not null (type: boolean) - Statistics: Num rows: 230 Data size: 62894 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 22990 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: key (type: int), value (type: string) outputColumnNames: _col0, _col1 @@ -3979,7 +4085,7 @@ STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: [0, 1] - Statistics: Num rows: 230 Data size: 62894 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 22990 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int), _col1 (type: string) sort order: ++ @@ -3989,7 +4095,7 @@ STAGE PLANS: native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumnNums: [] - Statistics: Num rows: 230 Data size: 62894 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 22990 Basic stats: COMPLETE Column 
stats: COMPLETE Execution mode: vectorized, llap LLAP IO: all inputs Map Vectorization: @@ -4013,7 +4119,7 @@ STAGE PLANS: TableScan alias: t2 filterExpr: key is not null (type: boolean) - Statistics: Num rows: 500 Data size: 136488 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 47500 Basic stats: COMPLETE Column stats: COMPLETE TableScan Vectorization: native: true vectorizationSchemaColumns: [0:key:int, 1:value:string, 2:ds:string, 3:ROW__ID:struct] @@ -4023,7 +4129,7 @@ STAGE PLANS: native: true predicateExpression: SelectColumnIsNotNull(col 0:int) predicate: key is not null (type: boolean) - Statistics: Num rows: 475 Data size: 129663 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 47500 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: key (type: int), value (type: string) outputColumnNames: _col0, _col1 @@ -4031,7 +4137,7 @@ STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: [0, 1] - Statistics: Num rows: 475 Data size: 129663 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 47500 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int), _col1 (type: string) sort order: ++ @@ -4041,7 +4147,7 @@ STAGE PLANS: native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumnNums: [] - Statistics: Num rows: 475 Data size: 129663 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 47500 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: all inputs Map Vectorization: @@ -4083,7 +4189,7 @@ STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: [0] - Statistics: Num 
rows: 230 Data size: 62894 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort order: + @@ -4094,7 +4200,7 @@ STAGE PLANS: native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumnNums: [] - Statistics: Num rows: 230 Data size: 62894 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Reducer 3 Execution mode: llap Reduce Operator Tree: @@ -4104,15 +4210,15 @@ STAGE PLANS: keys: 0 _col0 (type: int) 1 _col0 (type: int) - Statistics: Num rows: 522 Data size: 142629 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 399 Data size: 3192 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator sort order: - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint) Reducer 4 Execution mode: vectorized, llap @@ -4141,13 +4247,13 @@ STAGE PLANS: projectedOutputColumnNums: [0] mode: mergepartial outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false File Sink Vectorization: className: VectorFileSinkOperator native: false - Statistics: Num rows: 1 Data size: 8 Basic stats: 
COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -4175,7 +4281,7 @@ STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: [0] - Statistics: Num rows: 475 Data size: 129663 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort order: + @@ -4186,7 +4292,7 @@ STAGE PLANS: native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumnNums: [] - Statistics: Num rows: 475 Data size: 129663 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Stage: Stage-0 Fetch Operator diff --git ql/src/test/results/clientpositive/llap/mrr.q.out ql/src/test/results/clientpositive/llap/mrr.q.out index bfa26e4..0737c6e 100644 --- ql/src/test/results/clientpositive/llap/mrr.q.out +++ ql/src/test/results/clientpositive/llap/mrr.q.out @@ -457,17 +457,17 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col1, _col2 - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator keys: _col1 (type: string), _col2 (type: string) mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 404 Data size: 71912 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 395 Data size: 70310 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator 
key expressions: _col0 (type: string), _col1 (type: string) sort order: ++ Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 404 Data size: 71912 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 395 Data size: 70310 Basic stats: COMPLETE Column stats: COMPLETE Reducer 3 Execution mode: llap Reduce Operator Tree: @@ -475,27 +475,27 @@ STAGE PLANS: keys: KEY._col0 (type: string), KEY._col1 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 404 Data size: 71912 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 395 Data size: 70310 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count(_col1) keys: _col0 (type: string) mode: complete outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: bigint), _col0 (type: string) sort order: ++ - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE Reducer 4 Execution mode: llap Reduce Operator Tree: Select Operator expressions: KEY.reducesinkkey1 (type: string), KEY.reducesinkkey0 (type: bigint) outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -882,17 
+882,17 @@ STAGE PLANS: outputColumnNames: _col1, _col2 input vertices: 0 Map 1 - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator keys: _col1 (type: string), _col2 (type: string) mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 404 Data size: 71912 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 395 Data size: 70310 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string) sort order: ++ Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 404 Data size: 71912 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 395 Data size: 70310 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: llap LLAP IO: no inputs Reducer 3 @@ -902,27 +902,27 @@ STAGE PLANS: keys: KEY._col0 (type: string), KEY._col1 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 404 Data size: 71912 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 395 Data size: 70310 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count(_col1) keys: _col0 (type: string) mode: complete outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: bigint), _col0 (type: string) sort order: ++ - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE Reducer 4 Execution mode: llap Reduce Operator Tree: Select Operator expressions: KEY.reducesinkkey1 (type: string), KEY.reducesinkkey0 (type: bigint) 
outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -1360,15 +1360,15 @@ STAGE PLANS: 1 _col0 (type: string) 2 _col0 (type: string) outputColumnNames: _col0, _col1, _col3, _col4, _col5 - Statistics: Num rows: 54 Data size: 10692 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 51 Data size: 10098 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string), _col3 (type: bigint), _col1 (type: bigint), _col4 (type: string), _col5 (type: bigint) outputColumnNames: _col0, _col1, _col3, _col4, _col5 - Statistics: Num rows: 54 Data size: 15390 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 51 Data size: 14535 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + - Statistics: Num rows: 54 Data size: 15390 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 51 Data size: 14535 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint), _col3 (type: bigint), _col4 (type: string), _col5 (type: bigint) Reducer 4 Execution mode: llap @@ -1376,10 +1376,10 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: string), VALUE._col0 (type: bigint), KEY.reducesinkkey0 (type: string), VALUE._col1 (type: bigint), VALUE._col2 (type: string), VALUE._col3 (type: bigint) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 54 Data size: 15390 
Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 51 Data size: 14535 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 54 Data size: 15390 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 51 Data size: 14535 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat diff --git ql/src/test/results/clientpositive/llap/multiMapJoin2.q.out ql/src/test/results/clientpositive/llap/multiMapJoin2.q.out index 88951c3..ee5e15e 100644 --- ql/src/test/results/clientpositive/llap/multiMapJoin2.q.out +++ ql/src/test/results/clientpositive/llap/multiMapJoin2.q.out @@ -47,11 +47,11 @@ STAGE PLANS: outputColumnNames: _col0 input vertices: 1 Map 4 - Statistics: Num rows: 40 Data size: 3480 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 3393 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + - Statistics: Num rows: 80 Data size: 6960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 78 Data size: 6786 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: llap LLAP IO: no inputs Map 4 @@ -94,11 +94,11 @@ STAGE PLANS: outputColumnNames: _col0 input vertices: 1 Map 6 - Statistics: Num rows: 40 Data size: 3480 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 3393 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + - Statistics: Num rows: 80 Data size: 6960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 78 Data size: 6786 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: llap LLAP IO: no inputs Map 6 @@ -126,10 +126,10 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: string) 
outputColumnNames: _col0 - Statistics: Num rows: 80 Data size: 6960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 78 Data size: 6786 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 80 Data size: 6960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 78 Data size: 6786 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -350,21 +350,21 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 40 Data size: 3480 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 3393 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + - Statistics: Num rows: 80 Data size: 6960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 78 Data size: 6786 Basic stats: COMPLETE Column stats: COMPLETE Reducer 4 Execution mode: llap Reduce Operator Tree: Select Operator expressions: KEY.reducesinkkey0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 80 Data size: 6960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 78 Data size: 6786 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 80 Data size: 6960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 78 Data size: 6786 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -379,11 +379,11 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 40 Data size: 3480 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 
3393 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + - Statistics: Num rows: 80 Data size: 6960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 78 Data size: 6786 Basic stats: COMPLETE Column stats: COMPLETE Union 3 Vertex: Union 3 @@ -556,11 +556,11 @@ STAGE PLANS: outputColumnNames: _col0 input vertices: 1 Map 6 - Statistics: Num rows: 40 Data size: 3480 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 3393 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + - Statistics: Num rows: 52 Data size: 4512 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 51 Data size: 4425 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: llap LLAP IO: no inputs Map 6 @@ -593,17 +593,17 @@ STAGE PLANS: Reduce Output Operator key expressions: _col0 (type: string) sort order: + - Statistics: Num rows: 52 Data size: 4512 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 51 Data size: 4425 Basic stats: COMPLETE Column stats: COMPLETE Reducer 4 Execution mode: llap Reduce Operator Tree: Select Operator expressions: KEY.reducesinkkey0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 52 Data size: 4524 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 51 Data size: 4437 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 52 Data size: 4524 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 51 Data size: 4437 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -750,7 +750,7 @@ STAGE PLANS: outputColumnNames: _col0 input vertices: 1 Map 5 - Statistics: Num rows: 40 Data size: 3480 Basic stats: COMPLETE Column 
stats: COMPLETE + Statistics: Num rows: 39 Data size: 3393 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator keys: _col0 (type: string) mode: hash @@ -808,7 +808,7 @@ STAGE PLANS: outputColumnNames: _col0 input vertices: 1 Map 5 - Statistics: Num rows: 40 Data size: 3480 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 3393 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator keys: _col0 (type: string) mode: hash @@ -990,7 +990,7 @@ STAGE PLANS: outputColumnNames: _col0 input vertices: 1 Map 5 - Statistics: Num rows: 40 Data size: 3480 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 3393 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator keys: _col0 (type: string) mode: hash @@ -1048,7 +1048,7 @@ STAGE PLANS: outputColumnNames: _col0 input vertices: 1 Map 5 - Statistics: Num rows: 40 Data size: 3480 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 3393 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator keys: _col0 (type: string) mode: hash @@ -1230,7 +1230,7 @@ STAGE PLANS: outputColumnNames: _col0 input vertices: 1 Map 5 - Statistics: Num rows: 40 Data size: 3480 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 3393 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator keys: _col0 (type: string) mode: hash @@ -1454,7 +1454,7 @@ STAGE PLANS: outputColumnNames: _col0 input vertices: 1 Map 5 - Statistics: Num rows: 40 Data size: 3480 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 3393 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator keys: _col0 (type: string) mode: hash @@ -1857,17 +1857,17 @@ STAGE PLANS: outputColumnNames: _col0 input vertices: 1 Map 5 - Statistics: Num rows: 809 Data size: 70383 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 68817 Basic stats: COMPLETE Column stats: 
COMPLETE Group By Operator keys: _col0 (type: string) mode: hash outputColumnNames: _col0 - Statistics: Num rows: 309 Data size: 26883 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 27492 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 309 Data size: 26883 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 27492 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: llap LLAP IO: no inputs Map 5 @@ -1896,17 +1896,17 @@ STAGE PLANS: outputColumnNames: _col0 input vertices: 1 Map 7 - Statistics: Num rows: 809 Data size: 70383 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 68817 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator keys: _col0 (type: string) mode: hash outputColumnNames: _col0 - Statistics: Num rows: 309 Data size: 26883 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 27492 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 309 Data size: 26883 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 27492 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: llap LLAP IO: no inputs Map 6 diff --git ql/src/test/results/clientpositive/llap/offset_limit_ppd_optimizer.q.out ql/src/test/results/clientpositive/llap/offset_limit_ppd_optimizer.q.out index b6bc569..6d25176 100644 --- ql/src/test/results/clientpositive/llap/offset_limit_ppd_optimizer.q.out +++ ql/src/test/results/clientpositive/llap/offset_limit_ppd_optimizer.q.out @@ -399,12 +399,12 @@ STAGE PLANS: keys: cdouble (type: double) mode: hash outputColumnNames: _col0 - Statistics: Num rows: 5570 Data size: 33272 Basic 
stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5528 Data size: 33024 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: double) sort order: + Map-reduce partition columns: _col0 (type: double) - Statistics: Num rows: 5570 Data size: 33272 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5528 Data size: 33024 Basic stats: COMPLETE Column stats: COMPLETE TopN Hash Memory Usage: 0.3 Execution mode: llap LLAP IO: all inputs @@ -415,7 +415,7 @@ STAGE PLANS: keys: KEY._col0 (type: double) mode: mergepartial outputColumnNames: _col0 - Statistics: Num rows: 5570 Data size: 33272 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5528 Data size: 33024 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 20 Offset of rows: 10 @@ -933,7 +933,7 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: complete outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 30591 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 307 Data size: 30393 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 20 Offset of rows: 10 @@ -1335,7 +1335,7 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: complete outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 20 Offset of rows: 10 @@ -1379,7 +1379,7 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: complete outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 20 Offset of rows: 20 diff --git ql/src/test/results/clientpositive/llap/partialdhj.q.out ql/src/test/results/clientpositive/llap/partialdhj.q.out index 4e62c4f..14298ae 
100644 --- ql/src/test/results/clientpositive/llap/partialdhj.q.out +++ ql/src/test/results/clientpositive/llap/partialdhj.q.out @@ -143,11 +143,11 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2 input vertices: 0 Reducer 3 - Statistics: Num rows: 25 Data size: 6675 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 26 Data size: 6942 Basic stats: COMPLETE Column stats: COMPLETE HybridGraceHashJoin: true File Output Operator compressed: false - Statistics: Num rows: 25 Data size: 6675 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 26 Data size: 6942 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -336,11 +336,11 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2 input vertices: 1 Reducer 5 - Statistics: Num rows: 25 Data size: 6675 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 26 Data size: 6942 Basic stats: COMPLETE Column stats: COMPLETE HybridGraceHashJoin: true File Output Operator compressed: false - Statistics: Num rows: 25 Data size: 6675 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 26 Data size: 6942 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat diff --git ql/src/test/results/clientpositive/llap/reduce_deduplicate_extended.q.out ql/src/test/results/clientpositive/llap/reduce_deduplicate_extended.q.out index b4ac5a6..ab8da2b 100644 --- ql/src/test/results/clientpositive/llap/reduce_deduplicate_extended.q.out +++ ql/src/test/results/clientpositive/llap/reduce_deduplicate_extended.q.out @@ -42,10 +42,10 @@ STAGE PLANS: keys: _col0 (type: string) mode: complete outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + 
Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -313,18 +313,18 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40 Data size: 7120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6942 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col0) keys: _col0 (type: string), _col1 (type: string) mode: hash outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 20 Data size: 3720 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 19 Data size: 3534 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string) sort order: ++ Map-reduce partition columns: _col0 (type: string), _col1 (type: string) - Statistics: Num rows: 20 Data size: 3720 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 19 Data size: 3534 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: double) Reducer 3 Execution mode: llap @@ -334,14 +334,14 @@ STAGE PLANS: keys: KEY._col0 (type: string), KEY._col1 (type: string) mode: mergepartial outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 20 Data size: 3720 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 19 Data size: 3534 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string), _col2 (type: double) outputColumnNames: _col0, _col1 - Statistics: Num rows: 20 Data size: 1900 Basic stats: COMPLETE Column stats: COMPLETE + 
Statistics: Num rows: 19 Data size: 1805 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 20 Data size: 1900 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 19 Data size: 1805 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -419,21 +419,21 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40 Data size: 7120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6942 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string) sort order: ++ - Statistics: Num rows: 40 Data size: 7120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6942 Basic stats: COMPLETE Column stats: COMPLETE Reducer 3 Execution mode: llap Reduce Operator Tree: Select Operator expressions: KEY.reducesinkkey0 (type: string), KEY.reducesinkkey1 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40 Data size: 7120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6942 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 40 Data size: 7120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6942 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -2596,10 +2596,10 @@ STAGE PLANS: keys: _col0 (type: string) mode: complete outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column 
stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -2779,10 +2779,10 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: complete outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -2860,12 +2860,12 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40 Data size: 7120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6942 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string) sort order: ++ Map-reduce partition columns: _col0 (type: string), _col1 (type: string) - Statistics: Num rows: 40 Data size: 7120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6942 Basic stats: COMPLETE Column stats: COMPLETE Reducer 3 Execution mode: llap Reduce Operator Tree: @@ -2874,14 +2874,14 @@ STAGE PLANS: keys: KEY._col0 (type: string), KEY._col1 (type: string) mode: complete outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 40 Data size: 7440 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 
7254 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string), _col2 (type: double) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40 Data size: 3800 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 3705 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 40 Data size: 3800 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 3705 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -2959,21 +2959,21 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40 Data size: 7120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6942 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string) sort order: ++ - Statistics: Num rows: 40 Data size: 7120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6942 Basic stats: COMPLETE Column stats: COMPLETE Reducer 3 Execution mode: llap Reduce Operator Tree: Select Operator expressions: KEY.reducesinkkey0 (type: string), KEY.reducesinkkey1 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40 Data size: 7120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6942 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 40 Data size: 7120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6942 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -3033,10 +3033,10 @@ STAGE 
PLANS: keys: _col0 (type: string) mode: complete outputColumnNames: _col0 - Statistics: Num rows: 309 Data size: 26883 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 27492 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 309 Data size: 26883 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 27492 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -3093,10 +3093,10 @@ STAGE PLANS: keys: _col0 (type: string) mode: complete outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 309 Data size: 29355 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30020 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat diff --git ql/src/test/results/clientpositive/llap/semijoin_hint.q.out ql/src/test/results/clientpositive/llap/semijoin_hint.q.out index cdfa733..5493633 100644 --- ql/src/test/results/clientpositive/llap/semijoin_hint.q.out +++ ql/src/test/results/clientpositive/llap/semijoin_hint.q.out @@ -222,7 +222,7 @@ STAGE PLANS: outputColumnNames: _col0 Statistics: Num rows: 1000 Data size: 87000 Basic stats: PARTIAL Column stats: PARTIAL Group By Operator - aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=309) + aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=20) mode: hash outputColumnNames: _col0, _col1, _col2 Statistics: Num rows: 1 Data size: 639 Basic stats: PARTIAL Column 
stats: PARTIAL @@ -272,7 +272,7 @@ STAGE PLANS: Execution mode: llap Reduce Operator Tree: Group By Operator - aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, expectedEntries=309) + aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, expectedEntries=20) mode: final outputColumnNames: _col0, _col1, _col2 Statistics: Num rows: 1 Data size: 639 Basic stats: PARTIAL Column stats: PARTIAL @@ -478,16 +478,16 @@ STAGE PLANS: 0 cstring (type: string) 1 value (type: string) outputColumnNames: str - Statistics: Num rows: 4056 Data size: 352872 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4110 Data size: 357570 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: str (type: string) sort order: + Map-reduce partition columns: str (type: string) - Statistics: Num rows: 4056 Data size: 352872 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4110 Data size: 357570 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: str (type: string) outputColumnNames: _col0 - Statistics: Num rows: 4056 Data size: 352872 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4110 Data size: 357570 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=5000) mode: hash @@ -506,9 +506,9 @@ STAGE PLANS: keys: 0 str (type: string) 1 key1 (type: string) - Statistics: Num rows: 4461 Data size: 388159 Basic stats: PARTIAL Column stats: NONE + Statistics: Num rows: 4521 Data size: 393327 Basic stats: PARTIAL Column stats: NONE Select Operator - Statistics: Num rows: 4461 Data size: 388159 Basic stats: PARTIAL Column stats: NONE + Statistics: Num rows: 4521 Data size: 393327 Basic stats: PARTIAL Column stats: NONE Group By Operator aggregations: count() mode: hash @@ -1476,16 +1476,16 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col1 (type: string) outputColumnNames: 
_col1 - Statistics: Num rows: 4056 Data size: 352872 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4110 Data size: 357570 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: string) sort order: + Map-reduce partition columns: _col1 (type: string) - Statistics: Num rows: 4056 Data size: 352872 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4110 Data size: 357570 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 4056 Data size: 352872 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4110 Data size: 357570 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=5000) mode: hash @@ -1504,7 +1504,7 @@ STAGE PLANS: keys: 0 _col1 (type: string) 1 _col0 (type: string) - Statistics: Num rows: 4461 Data size: 388159 Basic stats: PARTIAL Column stats: NONE + Statistics: Num rows: 4521 Data size: 393327 Basic stats: PARTIAL Column stats: NONE Group By Operator aggregations: count() mode: hash @@ -2190,7 +2190,7 @@ STAGE PLANS: outputColumnNames: _col0 Statistics: Num rows: 1000 Data size: 87000 Basic stats: PARTIAL Column stats: PARTIAL Group By Operator - aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=309) + aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=20) mode: hash outputColumnNames: _col0, _col1, _col2 Statistics: Num rows: 1 Data size: 639 Basic stats: PARTIAL Column stats: PARTIAL @@ -2238,7 +2238,7 @@ STAGE PLANS: Execution mode: llap Reduce Operator Tree: Group By Operator - aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, expectedEntries=309) + aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, expectedEntries=20) mode: final outputColumnNames: _col0, _col1, _col2 Statistics: Num 
rows: 1 Data size: 639 Basic stats: PARTIAL Column stats: PARTIAL diff --git ql/src/test/results/clientpositive/llap/skewjoin.q.out ql/src/test/results/clientpositive/llap/skewjoin.q.out index b102bca..f3bf63c 100644 --- ql/src/test/results/clientpositive/llap/skewjoin.q.out +++ ql/src/test/results/clientpositive/llap/skewjoin.q.out @@ -141,14 +141,14 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col2 - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: UDFToInteger(_col0) (type: int), _col2 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 809 Data size: 76855 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 75145 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 809 Data size: 76855 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 75145 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.TextInputFormat output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat @@ -655,7 +655,7 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col2, _col3 - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(hash(_col2)), sum(hash(_col3)) mode: hash @@ -782,7 +782,7 @@ STAGE PLANS: 0 _col0 (type: string), UDFToDouble(substring(_col1, 5)) (type: double) 1 _col0 (type: string), (substring(_col1, 5) + 1) (type: double) outputColumnNames: _col2, _col3 - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic 
stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(hash(_col2)), sum(hash(_col3)) mode: hash @@ -938,7 +938,7 @@ STAGE PLANS: 1 _col0 (type: string) 2 _col0 (type: string) outputColumnNames: _col0, _col3 - Statistics: Num rows: 143 Data size: 25454 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 135 Data size: 24030 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(hash(_col0)), sum(hash(_col3)) mode: hash diff --git ql/src/test/results/clientpositive/llap/subquery_exists.q.out ql/src/test/results/clientpositive/llap/subquery_exists.q.out index dfe4240..160c8b1 100644 --- ql/src/test/results/clientpositive/llap/subquery_exists.q.out +++ ql/src/test/results/clientpositive/llap/subquery_exists.q.out @@ -81,10 +81,10 @@ STAGE PLANS: 0 _col0 (type: string), _col1 (type: string) 1 _col0 (type: string), _col1 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 133 Data size: 23674 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 131 Data size: 23318 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 133 Data size: 23674 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 131 Data size: 23318 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -289,10 +289,10 @@ STAGE PLANS: 0 _col1 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 404 Data size: 71912 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 407 Data size: 72446 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 404 Data size: 71912 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 407 Data size: 72446 Basic stats: COMPLETE Column stats: COMPLETE table: 
input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat diff --git ql/src/test/results/clientpositive/llap/subquery_in.q.out ql/src/test/results/clientpositive/llap/subquery_in.q.out index 5dcdfdd..4724dfb 100644 --- ql/src/test/results/clientpositive/llap/subquery_in.q.out +++ ql/src/test/results/clientpositive/llap/subquery_in.q.out @@ -74,10 +74,10 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 133 Data size: 23674 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 131 Data size: 23318 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 133 Data size: 23674 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 131 Data size: 23318 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -195,10 +195,10 @@ STAGE PLANS: 0 _col0 (type: string), _col1 (type: string) 1 _col0 (type: string), _col1 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 133 Data size: 23674 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 131 Data size: 23318 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 133 Data size: 23674 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 131 Data size: 23318 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -684,10 +684,10 @@ STAGE PLANS: 0 _col0 (type: string), _col1 (type: string) 1 _col0 (type: string), _col1 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 133 Data size: 23674 Basic stats: COMPLETE Column 
stats: COMPLETE + Statistics: Num rows: 131 Data size: 23318 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 133 Data size: 23674 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 131 Data size: 23318 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -812,14 +812,14 @@ STAGE PLANS: 1 _col0 (type: string) outputColumnNames: _col0, _col1, _col3 residual filter predicates: {(_col1 <> _col3)} - Statistics: Num rows: 66 Data size: 17490 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 64 Data size: 16960 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string), _col1 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 66 Data size: 11748 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 64 Data size: 11392 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 66 Data size: 11748 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 64 Data size: 11392 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -992,12 +992,12 @@ STAGE PLANS: keys: _col0 (type: string), _col1 (type: string) mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 10609 Data size: 1888402 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 10918 Data size: 1943404 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string) sort order: ++ Map-reduce partition columns: _col0 (type: string), _col1 (type: string) - Statistics: Num rows: 10609 Data size: 1888402 Basic stats: COMPLETE Column 
stats: COMPLETE + Statistics: Num rows: 10918 Data size: 1943404 Basic stats: COMPLETE Column stats: COMPLETE Reducer 5 Execution mode: llap Reduce Operator Tree: @@ -3254,18 +3254,18 @@ STAGE PLANS: 0 _col1 (type: string) 1 _col0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 404 Data size: 35148 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 407 Data size: 35409 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string) mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 202 Data size: 19190 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 203 Data size: 19285 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 202 Data size: 19190 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 203 Data size: 19285 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Reducer 3 Execution mode: llap @@ -3275,15 +3275,15 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 202 Data size: 19190 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 203 Data size: 19285 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: _col1 is not null (type: boolean) - Statistics: Num rows: 202 Data size: 19190 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 203 Data size: 19285 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: bigint) sort order: + Map-reduce partition columns: _col1 (type: bigint) - Statistics: Num rows: 202 Data size: 19190 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 203 Data size: 19285 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: 
string) Reducer 4 Execution mode: llap @@ -3475,18 +3475,18 @@ STAGE PLANS: 0 _col0 (type: string), _col1 (type: string) 1 _col0 (type: string), _col1 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 404 Data size: 35148 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 395 Data size: 34365 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string) mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 202 Data size: 19190 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 197 Data size: 18715 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 202 Data size: 19190 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 197 Data size: 18715 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Reducer 3 Execution mode: llap @@ -3496,15 +3496,15 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 202 Data size: 19190 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 197 Data size: 18715 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: _col1 is not null (type: boolean) - Statistics: Num rows: 202 Data size: 19190 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 197 Data size: 18715 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: bigint) sort order: + Map-reduce partition columns: _col1 (type: bigint) - Statistics: Num rows: 202 Data size: 19190 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 197 Data size: 18715 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: string) Reducer 4 Execution mode: llap @@ -4006,10 +4006,10 @@ STAGE PLANS: 0 _col0 
(type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40 Data size: 7120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6942 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 40 Data size: 7120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6942 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat diff --git ql/src/test/results/clientpositive/llap/subquery_in_having.q.out ql/src/test/results/clientpositive/llap/subquery_in_having.q.out index 0ffbaae..5100ea8 100644 --- ql/src/test/results/clientpositive/llap/subquery_in_having.q.out +++ ql/src/test/results/clientpositive/llap/subquery_in_having.q.out @@ -620,18 +620,18 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 133 Data size: 23674 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 131 Data size: 23318 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string), _col1 (type: string) mode: hash outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 66 Data size: 12276 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 65 Data size: 12090 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string) sort order: ++ Map-reduce partition columns: _col0 (type: string), _col1 (type: string) - Statistics: Num rows: 66 Data size: 12276 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 65 Data size: 12090 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: bigint) Reducer 3 Execution mode: llap @@ -641,15 +641,15 @@ STAGE PLANS: keys: KEY._col0 
(type: string), KEY._col1 (type: string) mode: mergepartial outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 66 Data size: 12276 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 65 Data size: 12090 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: _col2 is not null (type: boolean) - Statistics: Num rows: 66 Data size: 12276 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 65 Data size: 12090 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col2 (type: bigint) sort order: + Map-reduce partition columns: _col2 (type: bigint) - Statistics: Num rows: 66 Data size: 12276 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 65 Data size: 12090 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: string), _col1 (type: string) Reducer 4 Execution mode: llap @@ -785,18 +785,18 @@ STAGE PLANS: outputColumnNames: _col0, _col1 input vertices: 1 Map 3 - Statistics: Num rows: 133 Data size: 23674 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 131 Data size: 23318 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string), _col1 (type: string) mode: hash outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 66 Data size: 12276 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 65 Data size: 12090 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string) sort order: ++ Map-reduce partition columns: _col0 (type: string), _col1 (type: string) - Statistics: Num rows: 66 Data size: 12276 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 65 Data size: 12090 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: bigint) Execution mode: llap LLAP IO: no inputs @@ -847,10 +847,10 @@ STAGE PLANS: keys: KEY._col0 (type: string), 
KEY._col1 (type: string) mode: mergepartial outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 66 Data size: 12276 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 65 Data size: 12090 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: _col2 is not null (type: boolean) - Statistics: Num rows: 66 Data size: 12276 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 65 Data size: 12090 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Left Semi Join 0 to 1 @@ -954,18 +954,18 @@ STAGE PLANS: outputColumnNames: _col0, _col1 input vertices: 1 Map 3 - Statistics: Num rows: 404 Data size: 71912 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 395 Data size: 70310 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string), _col1 (type: string) mode: hash outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 202 Data size: 37572 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 197 Data size: 36642 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string) sort order: ++ Map-reduce partition columns: _col0 (type: string), _col1 (type: string) - Statistics: Num rows: 202 Data size: 37572 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 197 Data size: 36642 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: bigint) Execution mode: llap LLAP IO: no inputs @@ -1023,10 +1023,10 @@ STAGE PLANS: keys: KEY._col0 (type: string), KEY._col1 (type: string) mode: mergepartial outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 202 Data size: 37572 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 197 Data size: 36642 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: _col2 is not null (type: boolean) - Statistics: Num rows: 202 
Data size: 37572 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 197 Data size: 36642 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Left Semi Join 0 to 1 diff --git ql/src/test/results/clientpositive/llap/subquery_multi.q.out ql/src/test/results/clientpositive/llap/subquery_multi.q.out index d0a78a2..7d97517 100644 --- ql/src/test/results/clientpositive/llap/subquery_multi.q.out +++ ql/src/test/results/clientpositive/llap/subquery_multi.q.out @@ -3221,18 +3221,18 @@ STAGE PLANS: 0 _col0 (type: string), _col1 (type: string) 1 _col0 (type: string), _col1 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 404 Data size: 71912 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 395 Data size: 70310 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string), _col1 (type: string) mode: hash outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 202 Data size: 37572 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 197 Data size: 36642 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string) sort order: ++ Map-reduce partition columns: _col0 (type: string), _col1 (type: string) - Statistics: Num rows: 202 Data size: 37572 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 197 Data size: 36642 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: bigint) Reducer 3 Execution mode: llap @@ -3242,15 +3242,15 @@ STAGE PLANS: keys: KEY._col0 (type: string), KEY._col1 (type: string) mode: mergepartial outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 202 Data size: 37572 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 197 Data size: 36642 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: _col2 is not null (type: boolean) - Statistics: Num rows: 
202 Data size: 37572 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 197 Data size: 36642 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col2 (type: bigint) sort order: + Map-reduce partition columns: _col2 (type: bigint) - Statistics: Num rows: 202 Data size: 37572 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 197 Data size: 36642 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: string), _col1 (type: string) Reducer 4 Execution mode: llap @@ -3280,7 +3280,7 @@ STAGE PLANS: 0 _col1 (type: string) 1 _col0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 134 Data size: 11658 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 135 Data size: 11745 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string) @@ -4115,10 +4115,10 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col1, _col2, _col4 - Statistics: Num rows: 500 Data size: 50040 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 500 Data size: 50028 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator sort order: - Statistics: Num rows: 500 Data size: 50040 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 500 Data size: 50028 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: string), _col2 (type: bigint), _col4 (type: boolean) Reducer 4 Execution mode: llap @@ -4130,12 +4130,12 @@ STAGE PLANS: 0 1 outputColumnNames: _col1, _col2, _col4, _col5 - Statistics: Num rows: 500 Data size: 52040 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 500 Data size: 52028 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ((_col4 is not null and (_col2 <> 0)) or _col1 is not null or _col5 is not null) (type: boolean) - Statistics: Num rows: 500 Data size: 52040 Basic stats: COMPLETE 
Column stats: COMPLETE + Statistics: Num rows: 500 Data size: 52028 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - Statistics: Num rows: 500 Data size: 52040 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 500 Data size: 52028 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash diff --git ql/src/test/results/clientpositive/llap/subquery_notin.q.out ql/src/test/results/clientpositive/llap/subquery_notin.q.out index 5da1258..b4dfc6b 100644 --- ql/src/test/results/clientpositive/llap/subquery_notin.q.out +++ ql/src/test/results/clientpositive/llap/subquery_notin.q.out @@ -104,10 +104,10 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col5 - Statistics: Num rows: 500 Data size: 97540 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 500 Data size: 97528 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ((_col2 = 0) or (_col5 is null and _col0 is not null and (_col3 >= _col2))) (type: boolean) - Statistics: Num rows: 500 Data size: 97540 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 500 Data size: 97528 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string), _col1 (type: string) outputColumnNames: _col0, _col1 @@ -1560,10 +1560,10 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1, _col2, _col4 - Statistics: Num rows: 166 Data size: 17366 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 166 Data size: 17358 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ((_col1 = 0) or (_col4 is null and _col0 is not null and (_col2 >= _col1))) (type: boolean) - Statistics: Num rows: 166 Data size: 17366 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 166 Data size: 17358 Basic stats: COMPLETE Column stats: COMPLETE Select Operator 
expressions: _col0 (type: string) outputColumnNames: _col0 @@ -3699,14 +3699,14 @@ STAGE PLANS: 0 _col1 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col5 - Statistics: Num rows: 500 Data size: 98620 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 500 Data size: 98584 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ((_col2 = 0) or (_col5 is null and _col1 is not null and (_col3 >= _col2))) (type: boolean) - Statistics: Num rows: 500 Data size: 98620 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 500 Data size: 98584 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 500 Data size: 98620 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 500 Data size: 98584 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string) @@ -3971,12 +3971,12 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1, _col3, _col4 - Statistics: Num rows: 500 Data size: 95480 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 500 Data size: 95336 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string) sort order: ++ Map-reduce partition columns: _col0 (type: string), _col1 (type: string) - Statistics: Num rows: 500 Data size: 95480 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 500 Data size: 95336 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: bigint), _col4 (type: bigint) Reducer 3 Execution mode: llap @@ -3988,14 +3988,14 @@ STAGE PLANS: 0 _col0 (type: string), _col1 (type: string) 1 _col1 (type: string), _col0 (type: string) outputColumnNames: _col0, _col1, _col3, _col4, _col7 - Statistics: Num rows: 500 Data size: 97100 Basic stats: COMPLETE 
Column stats: COMPLETE + Statistics: Num rows: 500 Data size: 96920 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (not CASE WHEN ((_col3 = 0)) THEN (false) WHEN (_col3 is null) THEN (false) WHEN (_col7 is not null) THEN (true) WHEN (_col1 is null) THEN (null) WHEN ((_col4 < _col3)) THEN (true) ELSE (false) END) (type: boolean) - Statistics: Num rows: 250 Data size: 48560 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 250 Data size: 48460 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 250 Data size: 48560 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 250 Data size: 48460 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string) @@ -4774,10 +4774,10 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col5 - Statistics: Num rows: 500 Data size: 97164 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 500 Data size: 97160 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ((_col2 = 0) or (_col5 is null and _col0 is not null and (_col3 >= _col2))) (type: boolean) - Statistics: Num rows: 500 Data size: 97164 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 500 Data size: 97160 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string), _col1 (type: string) outputColumnNames: _col0, _col1 @@ -7250,12 +7250,12 @@ STAGE PLANS: 0 _col1 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1, _col3, _col4 - Statistics: Num rows: 500 Data size: 91672 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 500 Data size: 91688 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string) sort order: ++ Map-reduce 
partition columns: _col0 (type: string), _col1 (type: string) - Statistics: Num rows: 500 Data size: 91672 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 500 Data size: 91688 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: bigint), _col4 (type: bigint) Reducer 3 Execution mode: llap @@ -7267,17 +7267,17 @@ STAGE PLANS: 0 _col0 (type: string), _col1 (type: string) 1 _col0 (type: string), _col1 (type: string) outputColumnNames: _col0, _col1, _col3, _col4, _col7 - Statistics: Num rows: 5833 Data size: 1149606 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5704 Data size: 1124080 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (not CASE WHEN ((_col3 = 0)) THEN (false) WHEN (_col3 is null) THEN (false) WHEN (_col7 is not null) THEN (true) WHEN (_col0 is null) THEN (null) WHEN ((_col4 < _col3)) THEN (true) ELSE (false) END) (type: boolean) - Statistics: Num rows: 2917 Data size: 574910 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2852 Data size: 562040 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string), _col1 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 2917 Data size: 519226 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2852 Data size: 507656 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 2917 Data size: 519226 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2852 Data size: 507656 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat diff --git ql/src/test/results/clientpositive/llap/subquery_scalar.q.out ql/src/test/results/clientpositive/llap/subquery_scalar.q.out index ab67a7d..5034758 100644 --- 
ql/src/test/results/clientpositive/llap/subquery_scalar.q.out +++ ql/src/test/results/clientpositive/llap/subquery_scalar.q.out @@ -5503,18 +5503,18 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 133 Data size: 23674 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 131 Data size: 23318 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string), _col1 (type: string) mode: hash outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 66 Data size: 12276 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 65 Data size: 12090 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string) sort order: ++ Map-reduce partition columns: _col0 (type: string), _col1 (type: string) - Statistics: Num rows: 66 Data size: 12276 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 65 Data size: 12090 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: bigint) Reducer 3 Execution mode: llap @@ -5524,10 +5524,10 @@ STAGE PLANS: keys: KEY._col0 (type: string), KEY._col1 (type: string) mode: mergepartial outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 66 Data size: 12276 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 65 Data size: 12090 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator sort order: - Statistics: Num rows: 66 Data size: 12276 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 65 Data size: 12090 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: string), _col1 (type: string), _col2 (type: bigint) Reducer 4 Execution mode: llap @@ -5540,14 +5540,14 @@ STAGE PLANS: 1 outputColumnNames: _col0, _col1, _col2, _col3 residual filter predicates: {(_col2 > _col3)} - Statistics: Num rows: 22 Data size: 4268 Basic 
stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 21 Data size: 4074 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string), _col1 (type: string), _col2 (type: bigint) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 22 Data size: 4092 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 21 Data size: 3906 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 22 Data size: 4092 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 21 Data size: 3906 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat diff --git ql/src/test/results/clientpositive/llap/subquery_select.q.out ql/src/test/results/clientpositive/llap/subquery_select.q.out index d417046..69d57ca 100644 --- ql/src/test/results/clientpositive/llap/subquery_select.q.out +++ ql/src/test/results/clientpositive/llap/subquery_select.q.out @@ -1869,10 +1869,10 @@ STAGE PLANS: 0 _col0 (type: string), _col1 (type: string) 1 _col0 (type: string), _col1 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 134 Data size: 23852 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 131 Data size: 23318 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 134 Data size: 23852 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 131 Data size: 23318 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -2035,10 +2035,10 @@ STAGE PLANS: 0 _col0 (type: string), _col1 (type: string) 1 _col0 (type: string), _col1 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 108 Data size: 19224 
Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 106 Data size: 18868 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 108 Data size: 19224 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 106 Data size: 18868 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -2053,11 +2053,11 @@ STAGE PLANS: 0 _col1 (type: string) 1 _col1 (type: string) outputColumnNames: _col1, _col2 - Statistics: Num rows: 134 Data size: 36850 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 135 Data size: 37125 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col2 (type: string), _col1 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 134 Data size: 36850 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 135 Data size: 37125 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator keys: _col0 (type: string), _col1 (type: string) mode: hash diff --git ql/src/test/results/clientpositive/llap/subquery_views.q.out ql/src/test/results/clientpositive/llap/subquery_views.q.out index af69569..637f9ce 100644 --- ql/src/test/results/clientpositive/llap/subquery_views.q.out +++ ql/src/test/results/clientpositive/llap/subquery_views.q.out @@ -260,12 +260,12 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col2, _col3, _col4 - Statistics: Num rows: 67 Data size: 12194 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 65 Data size: 11830 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col4 (type: string), _col2 (type: string) sort order: ++ Map-reduce partition columns: _col4 (type: string), _col2 (type: string) - Statistics: Num rows: 67 Data size: 12194 Basic stats: COMPLETE Column stats: 
COMPLETE + Statistics: Num rows: 65 Data size: 11830 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: boolean) Reducer 12 Execution mode: llap @@ -305,19 +305,19 @@ STAGE PLANS: 1 _col0 (type: string), _col1 (type: string) 2 _col4 (type: string), _col2 (type: string) outputColumnNames: _col0, _col1, _col4, _col5, _col9 - Statistics: Num rows: 87 Data size: 17226 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 81 Data size: 16038 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: CASE WHEN ((_col4 = 0)) THEN (true) WHEN (_col4 is null) THEN (true) WHEN (_col9 is not null) THEN (false) WHEN (_col0 is null) THEN (null) WHEN ((_col5 < _col4)) THEN (false) ELSE (true) END (type: boolean) - Statistics: Num rows: 43 Data size: 8514 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40 Data size: 7920 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string), _col1 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 43 Data size: 7654 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40 Data size: 7120 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 43 Data size: 7654 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40 Data size: 7120 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: string) Reducer 3 Execution mode: llap @@ -329,10 +329,10 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 43 Data size: 7654 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40 Data size: 7120 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 43 Data size: 7654 Basic stats: COMPLETE Column stats: 
COMPLETE + Statistics: Num rows: 40 Data size: 7120 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -380,12 +380,12 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col2, _col3, _col4 - Statistics: Num rows: 67 Data size: 12194 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 65 Data size: 11830 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col4 (type: string), _col2 (type: string) sort order: ++ Map-reduce partition columns: _col4 (type: string), _col2 (type: string) - Statistics: Num rows: 67 Data size: 12194 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 65 Data size: 11830 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: boolean) Reducer 7 Execution mode: llap @@ -399,24 +399,24 @@ STAGE PLANS: 1 _col0 (type: string), _col1 (type: string) 2 _col4 (type: string), _col2 (type: string) outputColumnNames: _col0, _col4, _col5, _col9 - Statistics: Num rows: 87 Data size: 9309 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 81 Data size: 8667 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: CASE WHEN ((_col4 = 0)) THEN (true) WHEN (_col4 is null) THEN (true) WHEN (_col9 is not null) THEN (false) WHEN (_col0 is null) THEN (null) WHEN ((_col5 < _col4)) THEN (false) ELSE (true) END (type: boolean) - Statistics: Num rows: 43 Data size: 4601 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40 Data size: 4280 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 43 Data size: 3741 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40 Data size: 3480 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator keys: _col0 
(type: string) mode: hash outputColumnNames: _col0 - Statistics: Num rows: 8 Data size: 696 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 7 Data size: 609 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 8 Data size: 696 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 7 Data size: 609 Basic stats: COMPLETE Column stats: COMPLETE Reducer 8 Execution mode: llap Reduce Operator Tree: diff --git ql/src/test/results/clientpositive/llap/tez_dynpart_hashjoin_1.q.out ql/src/test/results/clientpositive/llap/tez_dynpart_hashjoin_1.q.out index b63b25f..05ea133 100644 --- ql/src/test/results/clientpositive/llap/tez_dynpart_hashjoin_1.q.out +++ ql/src/test/results/clientpositive/llap/tez_dynpart_hashjoin_1.q.out @@ -77,11 +77,11 @@ STAGE PLANS: 0 _col2 (type: int) 1 _col2 (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col17, _col18, _col19, _col20, _col21, _col22, _col23 - Statistics: Num rows: 2076 Data size: 1148660 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2048 Data size: 1131300 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col2 (type: int) sort order: + - Statistics: Num rows: 2076 Data size: 1148660 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2048 Data size: 1131300 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: tinyint), _col1 (type: smallint), _col3 (type: bigint), _col4 (type: float), _col5 (type: double), _col6 (type: string), _col7 (type: string), _col8 (type: timestamp), _col9 (type: timestamp), _col10 (type: boolean), _col11 (type: boolean), _col12 (type: tinyint), _col13 (type: smallint), _col14 (type: int), _col15 (type: bigint), _col16 (type: 
float), _col17 (type: double), _col18 (type: string), _col19 (type: string), _col20 (type: timestamp), _col21 (type: timestamp), _col22 (type: boolean), _col23 (type: boolean) Reducer 3 Execution mode: llap @@ -89,10 +89,10 @@ STAGE PLANS: Select Operator expressions: VALUE._col0 (type: tinyint), VALUE._col1 (type: smallint), KEY.reducesinkkey0 (type: int), VALUE._col2 (type: bigint), VALUE._col3 (type: float), VALUE._col4 (type: double), VALUE._col5 (type: string), VALUE._col6 (type: string), VALUE._col7 (type: timestamp), VALUE._col8 (type: timestamp), VALUE._col9 (type: boolean), VALUE._col10 (type: boolean), VALUE._col11 (type: tinyint), VALUE._col12 (type: smallint), VALUE._col13 (type: int), VALUE._col14 (type: bigint), VALUE._col15 (type: float), VALUE._col16 (type: double), VALUE._col17 (type: string), VALUE._col18 (type: string), VALUE._col19 (type: timestamp), VALUE._col20 (type: timestamp), VALUE._col21 (type: boolean), VALUE._col22 (type: boolean) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col17, _col18, _col19, _col20, _col21, _col22, _col23 - Statistics: Num rows: 2076 Data size: 1148660 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2048 Data size: 1131300 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 2076 Data size: 1148660 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2048 Data size: 1131300 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -206,7 +206,7 @@ STAGE PLANS: keys: 0 _col0 (type: int) 1 _col0 (type: int) - Statistics: Num rows: 2076 Data size: 16608 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2048 Data size: 16384 Basic stats: COMPLETE Column stats: COMPLETE Group By 
Operator aggregations: count() mode: hash @@ -336,18 +336,18 @@ STAGE PLANS: 0 _col1 (type: int) 1 _col0 (type: int) outputColumnNames: _col0 - Statistics: Num rows: 2076 Data size: 6924 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2048 Data size: 6812 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: smallint) mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 623 Data size: 7064 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 631 Data size: 7148 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: smallint) sort order: + Map-reduce partition columns: _col0 (type: smallint) - Statistics: Num rows: 623 Data size: 7064 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 631 Data size: 7148 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Reducer 3 Execution mode: llap @@ -357,11 +357,11 @@ STAGE PLANS: keys: KEY._col0 (type: smallint) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 623 Data size: 7064 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 631 Data size: 7148 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: bigint) sort order: + - Statistics: Num rows: 623 Data size: 7064 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 631 Data size: 7148 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: smallint) Reducer 4 Execution mode: llap @@ -369,10 +369,10 @@ STAGE PLANS: Select Operator expressions: VALUE._col0 (type: smallint), KEY.reducesinkkey0 (type: bigint) outputColumnNames: _col0, _col1 - Statistics: Num rows: 623 Data size: 7064 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 631 Data size: 7148 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - 
Statistics: Num rows: 623 Data size: 7064 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 631 Data size: 7148 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat diff --git ql/src/test/results/clientpositive/llap/tez_dynpart_hashjoin_2.q.out ql/src/test/results/clientpositive/llap/tez_dynpart_hashjoin_2.q.out index 642bda2..2b8a4ed 100644 --- ql/src/test/results/clientpositive/llap/tez_dynpart_hashjoin_2.q.out +++ ql/src/test/results/clientpositive/llap/tez_dynpart_hashjoin_2.q.out @@ -105,11 +105,11 @@ STAGE PLANS: 1 UDFToInteger(_col0) (type: int) 2 (UDFToInteger(_col0) + 0) (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11 - Statistics: Num rows: 1776 Data size: 312050 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1715 Data size: 293140 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: smallint), _col0 (type: tinyint), _col2 (type: int) sort order: +++ - Statistics: Num rows: 1776 Data size: 312050 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1715 Data size: 293140 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: bigint), _col4 (type: float), _col5 (type: double), _col6 (type: string), _col7 (type: string), _col8 (type: timestamp), _col9 (type: timestamp), _col10 (type: boolean), _col11 (type: boolean) Reducer 3 Execution mode: llap @@ -117,10 +117,10 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey1 (type: tinyint), KEY.reducesinkkey0 (type: smallint), KEY.reducesinkkey2 (type: int), VALUE._col0 (type: bigint), VALUE._col1 (type: float), VALUE._col2 (type: double), VALUE._col3 (type: string), VALUE._col4 (type: string), VALUE._col5 (type: timestamp), VALUE._col6 (type: timestamp), VALUE._col7 (type: 
boolean), VALUE._col8 (type: boolean) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11 - Statistics: Num rows: 1776 Data size: 312050 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1715 Data size: 293140 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 1776 Data size: 312050 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1715 Data size: 293140 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -296,11 +296,11 @@ STAGE PLANS: 1 UDFToInteger(_col0) (type: int) 2 (UDFToInteger(_col0) + 0) (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11 - Statistics: Num rows: 1776 Data size: 312050 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1715 Data size: 293140 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: smallint), _col0 (type: tinyint), _col2 (type: int) sort order: +++ - Statistics: Num rows: 1776 Data size: 312050 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1715 Data size: 293140 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: bigint), _col4 (type: float), _col5 (type: double), _col6 (type: string), _col7 (type: string), _col8 (type: timestamp), _col9 (type: timestamp), _col10 (type: boolean), _col11 (type: boolean) Reducer 3 Execution mode: llap @@ -308,10 +308,10 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey1 (type: tinyint), KEY.reducesinkkey0 (type: smallint), KEY.reducesinkkey2 (type: int), VALUE._col0 (type: bigint), VALUE._col1 (type: float), VALUE._col2 (type: double), VALUE._col3 (type: string), VALUE._col4 (type: string), VALUE._col5 (type: timestamp), 
VALUE._col6 (type: timestamp), VALUE._col7 (type: boolean), VALUE._col8 (type: boolean) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11 - Statistics: Num rows: 1776 Data size: 312050 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1715 Data size: 293140 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 1776 Data size: 312050 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1715 Data size: 293140 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -487,11 +487,11 @@ STAGE PLANS: 1 UDFToInteger(_col0) (type: int) 2 (UDFToInteger(_col0) + 0) (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11 - Statistics: Num rows: 1776 Data size: 312050 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1715 Data size: 293140 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: smallint), _col0 (type: tinyint), _col2 (type: int) sort order: +++ - Statistics: Num rows: 1776 Data size: 312050 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1715 Data size: 293140 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: bigint), _col4 (type: float), _col5 (type: double), _col6 (type: string), _col7 (type: string), _col8 (type: timestamp), _col9 (type: timestamp), _col10 (type: boolean), _col11 (type: boolean) Reducer 3 Execution mode: llap @@ -499,10 +499,10 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey1 (type: tinyint), KEY.reducesinkkey0 (type: smallint), KEY.reducesinkkey2 (type: int), VALUE._col0 (type: bigint), VALUE._col1 (type: float), VALUE._col2 (type: double), VALUE._col3 (type: string), VALUE._col4 (type: 
string), VALUE._col5 (type: timestamp), VALUE._col6 (type: timestamp), VALUE._col7 (type: boolean), VALUE._col8 (type: boolean) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11 - Statistics: Num rows: 1776 Data size: 312050 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1715 Data size: 293140 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 1776 Data size: 312050 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1715 Data size: 293140 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat diff --git ql/src/test/results/clientpositive/llap/tez_join_hash.q.out ql/src/test/results/clientpositive/llap/tez_join_hash.q.out index 32f8d67..76472ce 100644 --- ql/src/test/results/clientpositive/llap/tez_join_hash.q.out +++ ql/src/test/results/clientpositive/llap/tez_join_hash.q.out @@ -207,7 +207,7 @@ STAGE PLANS: key expressions: _col1 (type: string) sort order: + Map-reduce partition columns: _col1 (type: string) - Statistics: Num rows: 14944 Data size: 2660032 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 14658 Data size: 2609124 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: string) Execution mode: vectorized, llap LLAP IO: no inputs @@ -240,16 +240,16 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col1, _col2 - Statistics: Num rows: 12944 Data size: 2304032 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 12658 Data size: 2253124 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col2 (type: string), _col1 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 12944 Data size: 2304032 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: 
Num rows: 12658 Data size: 2253124 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: string) sort order: + Map-reduce partition columns: _col1 (type: string) - Statistics: Num rows: 14944 Data size: 2660032 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 14658 Data size: 2609124 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: string) Reducer 4 Execution mode: llap @@ -261,18 +261,18 @@ STAGE PLANS: 0 _col1 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 24181 Data size: 4304218 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 23872 Data size: 4249216 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string), _col1 (type: string) mode: hash outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 12090 Data size: 2248740 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 11936 Data size: 2220096 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string) sort order: ++ Map-reduce partition columns: _col0 (type: string), _col1 (type: string) - Statistics: Num rows: 12090 Data size: 2248740 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 11936 Data size: 2220096 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: bigint) Reducer 5 Execution mode: vectorized, llap @@ -282,14 +282,14 @@ STAGE PLANS: keys: KEY._col0 (type: string), KEY._col1 (type: string) mode: mergepartial outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 12090 Data size: 2248740 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 11936 Data size: 2220096 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string), _col2 (type: bigint) outputColumnNames: _col0, _col1 - Statistics: Num 
rows: 12090 Data size: 1148550 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 11936 Data size: 1133920 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 12090 Data size: 1148550 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 11936 Data size: 1133920 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat diff --git ql/src/test/results/clientpositive/llap/tez_join_tests.q.out ql/src/test/results/clientpositive/llap/tez_join_tests.q.out index 75879fb..e25d256 100644 --- ql/src/test/results/clientpositive/llap/tez_join_tests.q.out +++ ql/src/test/results/clientpositive/llap/tez_join_tests.q.out @@ -71,12 +71,12 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40 Data size: 7120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6942 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: string) sort order: + Map-reduce partition columns: _col1 (type: string) - Statistics: Num rows: 40 Data size: 7120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6942 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: string) Reducer 3 Execution mode: llap @@ -88,11 +88,11 @@ STAGE PLANS: 0 _col1 (type: string) 1 _col1 (type: string) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 500 Data size: 100570 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 500 Data size: 100392 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + - Statistics: Num rows: 500 Data size: 100570 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 500 Data 
size: 100392 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: string), _col2 (type: string), _col3 (type: string) Reducer 4 Execution mode: llap @@ -100,10 +100,10 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: string), VALUE._col0 (type: string), VALUE._col1 (type: string), VALUE._col2 (type: string) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 500 Data size: 100570 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 500 Data size: 100392 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 500 Data size: 100570 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 500 Data size: 100392 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat diff --git ql/src/test/results/clientpositive/llap/tez_joins_explain.q.out ql/src/test/results/clientpositive/llap/tez_joins_explain.q.out index 3790b37..8867c95 100644 --- ql/src/test/results/clientpositive/llap/tez_joins_explain.q.out +++ ql/src/test/results/clientpositive/llap/tez_joins_explain.q.out @@ -71,12 +71,12 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40 Data size: 7120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6942 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: string) sort order: + Map-reduce partition columns: _col1 (type: string) - Statistics: Num rows: 40 Data size: 7120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 6942 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: string) Reducer 3 Execution mode: llap @@ -88,11 +88,11 @@ STAGE PLANS: 0 _col1 (type: string) 1 _col1 (type: string) 
outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 500 Data size: 100570 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 500 Data size: 100392 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + - Statistics: Num rows: 500 Data size: 100570 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 500 Data size: 100392 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: string), _col2 (type: string), _col3 (type: string) Reducer 4 Execution mode: llap @@ -100,10 +100,10 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: string), VALUE._col0 (type: string), VALUE._col1 (type: string), VALUE._col2 (type: string) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 500 Data size: 100570 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 500 Data size: 100392 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 500 Data size: 100570 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 500 Data size: 100392 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat diff --git ql/src/test/results/clientpositive/llap/tez_smb_main.q.out ql/src/test/results/clientpositive/llap/tez_smb_main.q.out index f457814..e950d21 100644 --- ql/src/test/results/clientpositive/llap/tez_smb_main.q.out +++ ql/src/test/results/clientpositive/llap/tez_smb_main.q.out @@ -66,10 +66,10 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 40 Data size: 14120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 13767 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: 
false - Statistics: Num rows: 40 Data size: 14120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 39 Data size: 13767 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -263,33 +263,33 @@ STAGE PLANS: Map Operator Tree: TableScan alias: a - Statistics: Num rows: 242 Data size: 3490 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: key is not null (type: boolean) - Statistics: Num rows: 230 Data size: 3316 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: key (type: int) outputColumnNames: _col0 - Statistics: Num rows: 230 Data size: 3316 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort order: + Map-reduce partition columns: _col0 (type: int) - Statistics: Num rows: 230 Data size: 3316 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: llap LLAP IO: no inputs Map 2 Map Operator Tree: TableScan alias: b - Statistics: Num rows: 500 Data size: 7216 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: key is not null (type: boolean) - Statistics: Num rows: 475 Data size: 6855 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: key (type: int) outputColumnNames: _col0 - Statistics: Num rows: 475 Data size: 6855 Basic stats: COMPLETE Column stats: NONE + 
Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -298,15 +298,15 @@ STAGE PLANS: 1 _col0 (type: int) input vertices: 0 Map 1 - Statistics: Num rows: 522 Data size: 7540 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 399 Data size: 3192 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator sort order: - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint) Execution mode: llap LLAP IO: no inputs @@ -317,10 +317,10 @@ STAGE PLANS: aggregations: count(VALUE._col0) mode: mergepartial outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -374,33 +374,33 @@ STAGE PLANS: Map Operator Tree: TableScan alias: a - Statistics: Num rows: 242 Data size: 3490 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: key is not null (type: boolean) - Statistics: Num rows: 230 Data size: 3316 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column 
stats: COMPLETE Select Operator expressions: key (type: int) outputColumnNames: _col0 - Statistics: Num rows: 230 Data size: 3316 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort order: + Map-reduce partition columns: _col0 (type: int) - Statistics: Num rows: 230 Data size: 3316 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: llap LLAP IO: no inputs Map 2 Map Operator Tree: TableScan alias: b - Statistics: Num rows: 500 Data size: 7216 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: key is not null (type: boolean) - Statistics: Num rows: 475 Data size: 6855 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: key (type: int) outputColumnNames: _col0 - Statistics: Num rows: 475 Data size: 6855 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -409,15 +409,15 @@ STAGE PLANS: 1 _col0 (type: int) input vertices: 0 Map 1 - Statistics: Num rows: 522 Data size: 7540 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 399 Data size: 3192 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator sort order: - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: 
COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint) Execution mode: llap LLAP IO: no inputs @@ -428,10 +428,10 @@ STAGE PLANS: aggregations: count(VALUE._col0) mode: mergepartial outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -1674,14 +1674,14 @@ STAGE PLANS: Map Operator Tree: TableScan alias: s1 - Statistics: Num rows: 242 Data size: 924 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: key is not null (type: boolean) - Statistics: Num rows: 230 Data size: 878 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: key (type: int) outputColumnNames: _col0 - Statistics: Num rows: 230 Data size: 878 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -1691,7 +1691,7 @@ STAGE PLANS: outputColumnNames: _col0 input vertices: 1 Map 4 - Statistics: Num rows: 253 Data size: 965 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 382 Data size: 1528 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -1700,15 +1700,15 @@ STAGE PLANS: 1 _col0 (type: int) input vertices: 1 Map 6 - Statistics: Num rows: 531 Data size: 2027 Basic stats: COMPLETE Column stats: NONE + Statistics: Num 
rows: 1029 Data size: 8232 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator sort order: - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint) Execution mode: llap LLAP IO: no inputs @@ -1716,33 +1716,33 @@ STAGE PLANS: Map Operator Tree: TableScan alias: s3 - Statistics: Num rows: 242 Data size: 924 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: key is not null (type: boolean) - Statistics: Num rows: 230 Data size: 878 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: key (type: int) outputColumnNames: _col0 - Statistics: Num rows: 230 Data size: 878 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort order: + Map-reduce partition columns: _col0 (type: int) - Statistics: Num rows: 230 Data size: 878 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: llap LLAP IO: no inputs Map 5 Map Operator Tree: TableScan alias: s2 - Statistics: Num rows: 242 Data size: 924 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: key is not null (type: boolean) - Statistics: Num rows: 230 Data size: 878 Basic stats: COMPLETE Column stats: 
NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: key (type: int) outputColumnNames: _col0 - Statistics: Num rows: 230 Data size: 878 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -1751,15 +1751,15 @@ STAGE PLANS: 1 _col0 (type: int) input vertices: 1 Map 6 - Statistics: Num rows: 531 Data size: 2027 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1029 Data size: 8232 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator sort order: - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint) Execution mode: llap LLAP IO: no inputs @@ -1767,24 +1767,24 @@ STAGE PLANS: Map Operator Tree: TableScan alias: b - Statistics: Num rows: 500 Data size: 1904 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: key is not null (type: boolean) - Statistics: Num rows: 475 Data size: 1808 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: key (type: int) outputColumnNames: _col0 - Statistics: Num rows: 475 Data size: 1808 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort order: + Map-reduce partition columns: _col0 
(type: int) - Statistics: Num rows: 475 Data size: 1808 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) sort order: + Map-reduce partition columns: _col0 (type: int) - Statistics: Num rows: 475 Data size: 1808 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: llap LLAP IO: no inputs Reducer 3 @@ -1794,10 +1794,10 @@ STAGE PLANS: aggregations: count(VALUE._col0) mode: mergepartial outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -1838,7 +1838,8 @@ STAGE PLANS: Tez #### A masked pattern was here #### Edges: - Reducer 4 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE) + Reducer 2 <- Map 1 (SIMPLE_EDGE) + Reducer 4 <- Map 3 (SIMPLE_EDGE), Reducer 2 (CUSTOM_SIMPLE_EDGE) Reducer 5 <- Reducer 4 (CUSTOM_SIMPLE_EDGE) #### A masked pattern was here #### Vertices: @@ -1846,65 +1847,74 @@ STAGE PLANS: Map Operator Tree: TableScan alias: t1 - Statistics: Num rows: 242 Data size: 45994 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 22990 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: key is not null (type: boolean) - Statistics: Num rows: 230 Data size: 43713 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 22990 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: 
key (type: int), value (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 230 Data size: 43713 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 22990 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int), _col1 (type: string) sort order: ++ - Statistics: Num rows: 230 Data size: 43713 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 22990 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: llap LLAP IO: no inputs Map 3 Map Operator Tree: TableScan alias: t2 - Statistics: Num rows: 500 Data size: 94800 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 47500 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: key is not null (type: boolean) - Statistics: Num rows: 475 Data size: 90060 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 47500 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: key (type: int), value (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 475 Data size: 90060 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 47500 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int), _col1 (type: string) sort order: ++ - Statistics: Num rows: 475 Data size: 90060 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 500 Data size: 47500 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: llap LLAP IO: no inputs - Reducer 4 + Reducer 2 + Execution mode: llap Reduce Operator Tree: Select Operator expressions: KEY.reducesinkkey0 (type: int) outputColumnNames: _col0 - Statistics: Num rows: 230 Data size: 43713 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE + Reduce Output Operator + key expressions: _col0 (type: int) + sort 
order: + + Map-reduce partition columns: _col0 (type: int) + Statistics: Num rows: 242 Data size: 968 Basic stats: COMPLETE Column stats: COMPLETE + Reducer 4 Execution mode: llap Reduce Operator Tree: Select Operator expressions: KEY.reducesinkkey0 (type: int) outputColumnNames: _col0 - Statistics: Num rows: 475 Data size: 90060 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator + Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE + Map Join Operator condition map: Inner Join 0 to 1 keys: 0 _col0 (type: int) 1 _col0 (type: int) - Statistics: Num rows: 522 Data size: 99066 Basic stats: COMPLETE Column stats: NONE + input vertices: + 0 Reducer 2 + Statistics: Num rows: 399 Data size: 3192 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator sort order: - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint) Reducer 5 Execution mode: llap @@ -1913,10 +1923,10 @@ STAGE PLANS: aggregations: count(VALUE._col0) mode: mergepartial outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat diff --git ql/src/test/results/clientpositive/llap/tez_union.q.out 
ql/src/test/results/clientpositive/llap/tez_union.q.out index 9118403..f93922a 100644 --- ql/src/test/results/clientpositive/llap/tez_union.q.out +++ ql/src/test/results/clientpositive/llap/tez_union.q.out @@ -42,10 +42,10 @@ STAGE PLANS: outputColumnNames: _col0, _col1 input vertices: 1 Map 3 - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 1309 Data size: 233002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1291 Data size: 229798 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -82,7 +82,7 @@ STAGE PLANS: Statistics: Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 1309 Data size: 233002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1291 Data size: 229798 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -264,7 +264,7 @@ STAGE PLANS: keys: 0 _col0 (type: string) 1 _col0 (type: string) - Statistics: Num rows: 3236 Data size: 25888 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3164 Data size: 25312 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash @@ -400,10 +400,10 @@ STAGE PLANS: outputColumnNames: _col0, _col1 input vertices: 0 Map 1 - Statistics: Num rows: 1618 Data size: 281532 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1582 Data size: 275268 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 1618 Data size: 
281532 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1582 Data size: 275268 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -431,10 +431,10 @@ STAGE PLANS: outputColumnNames: _col0, _col1 input vertices: 0 Map 1 - Statistics: Num rows: 1618 Data size: 281532 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1582 Data size: 275268 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 1618 Data size: 281532 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1582 Data size: 275268 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -556,7 +556,7 @@ STAGE PLANS: outputColumnNames: _col0 input vertices: 1 Map 4 - Statistics: Num rows: 809 Data size: 70383 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 68817 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -569,15 +569,15 @@ STAGE PLANS: input vertices: 1 Map 9 2 Map 10 - Statistics: Num rows: 6354 Data size: 1658394 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5941 Data size: 1550601 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: string), _col0 (type: string), _col2 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 6354 Data size: 1658394 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5941 Data size: 1550601 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col2 (type: string) sort order: + - Statistics: Num rows: 6354 Data size: 1658394 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num 
rows: 5941 Data size: 1550601 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: string), _col1 (type: string) Execution mode: llap LLAP IO: no inputs @@ -650,7 +650,7 @@ STAGE PLANS: outputColumnNames: _col0 input vertices: 1 Map 6 - Statistics: Num rows: 809 Data size: 70383 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 68817 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -663,15 +663,15 @@ STAGE PLANS: input vertices: 1 Map 9 2 Map 10 - Statistics: Num rows: 6354 Data size: 1658394 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5941 Data size: 1550601 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: string), _col0 (type: string), _col2 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 6354 Data size: 1658394 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5941 Data size: 1550601 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col2 (type: string) sort order: + - Statistics: Num rows: 6354 Data size: 1658394 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5941 Data size: 1550601 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: string), _col1 (type: string) Execution mode: llap LLAP IO: no inputs @@ -715,7 +715,7 @@ STAGE PLANS: outputColumnNames: _col0 input vertices: 1 Map 8 - Statistics: Num rows: 809 Data size: 70383 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 68817 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -728,15 +728,15 @@ STAGE PLANS: input vertices: 1 Map 9 2 Map 10 - Statistics: Num rows: 6354 Data size: 1658394 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5941 Data size: 1550601 Basic stats: COMPLETE Column stats: COMPLETE Select 
Operator expressions: _col1 (type: string), _col0 (type: string), _col2 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 6354 Data size: 1658394 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5941 Data size: 1550601 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col2 (type: string) sort order: + - Statistics: Num rows: 6354 Data size: 1658394 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5941 Data size: 1550601 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: string), _col1 (type: string) Execution mode: llap LLAP IO: no inputs @@ -794,10 +794,10 @@ STAGE PLANS: Select Operator expressions: VALUE._col0 (type: string), VALUE._col1 (type: string), KEY.reducesinkkey0 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 6354 Data size: 1658394 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5941 Data size: 1550601 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 6354 Data size: 1658394 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5941 Data size: 1550601 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -996,10 +996,10 @@ STAGE PLANS: outputColumnNames: _col0 input vertices: 1 Map 3 - Statistics: Num rows: 809 Data size: 70383 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 68817 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 1618 Data size: 140766 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1582 Data size: 137634 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: 
org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -1046,10 +1046,10 @@ STAGE PLANS: outputColumnNames: _col0 input vertices: 1 Map 5 - Statistics: Num rows: 809 Data size: 70383 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 68817 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 1618 Data size: 140766 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1582 Data size: 137634 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -1186,10 +1186,10 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2, _col3 input vertices: 1 Map 4 - Statistics: Num rows: 1618 Data size: 576008 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1582 Data size: 563192 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 1618 Data size: 576008 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1582 Data size: 563192 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -1214,10 +1214,10 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2, _col3 input vertices: 1 Map 4 - Statistics: Num rows: 1618 Data size: 576008 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1582 Data size: 563192 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 1618 Data size: 576008 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1582 Data size: 563192 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: 
org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -1330,10 +1330,10 @@ STAGE PLANS: outputColumnNames: _col0, _col1 input vertices: 0 Union 2 - Statistics: Num rows: 1618 Data size: 281532 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1582 Data size: 275268 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 1618 Data size: 281532 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1582 Data size: 275268 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat diff --git ql/src/test/results/clientpositive/llap/tez_union2.q.out ql/src/test/results/clientpositive/llap/tez_union2.q.out index 1c8dd11..b379340 100644 --- ql/src/test/results/clientpositive/llap/tez_union2.q.out +++ ql/src/test/results/clientpositive/llap/tez_union2.q.out @@ -61,12 +61,12 @@ STAGE PLANS: keys: _col0 (type: string), _col1 (type: string) mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 404 Data size: 71912 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 408 Data size: 72624 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string) sort order: ++ Map-reduce partition columns: _col0 (type: string), _col1 (type: string) - Statistics: Num rows: 404 Data size: 71912 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 408 Data size: 72624 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: llap LLAP IO: no inputs Map 4 @@ -118,10 +118,10 @@ STAGE PLANS: keys: KEY._col0 (type: string), KEY._col1 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 404 Data size: 71912 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 408 Data size: 72624 Basic stats: COMPLETE Column stats: 
COMPLETE File Output Operator compressed: false - Statistics: Num rows: 404 Data size: 71912 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 408 Data size: 72624 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -142,21 +142,21 @@ STAGE PLANS: keys: _col0 (type: string) mode: complete outputColumnNames: _col0 - Statistics: Num rows: 309 Data size: 26883 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 27492 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string), _col0 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 53766 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 54984 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator keys: _col0 (type: string), _col1 (type: string) mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 404 Data size: 71912 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 408 Data size: 72624 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string) sort order: ++ Map-reduce partition columns: _col0 (type: string), _col1 (type: string) - Statistics: Num rows: 404 Data size: 71912 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 408 Data size: 72624 Basic stats: COMPLETE Column stats: COMPLETE Union 2 Vertex: Union 2 Union 5 diff --git ql/src/test/results/clientpositive/llap/tez_union_multiinsert.q.out ql/src/test/results/clientpositive/llap/tez_union_multiinsert.q.out index f9535c5..f1dfe0f 100644 --- ql/src/test/results/clientpositive/llap/tez_union_multiinsert.q.out +++ ql/src/test/results/clientpositive/llap/tez_union_multiinsert.q.out @@ -186,14 +186,14 @@ STAGE PLANS: keys: KEY._col0 (type: string) 
mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29664 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30336 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string), UDFToString(_col1) (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 84048 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 85952 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 309 Data size: 84048 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 85952 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.TextInputFormat output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat @@ -1061,14 +1061,14 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29664 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30336 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string), UDFToString(_col1) (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 84048 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 85952 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 309 Data size: 84048 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 85952 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.TextInputFormat output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat @@ -1966,14 +1966,14 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 29664 
Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 30336 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string), UDFToString(_col1) (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 309 Data size: 84048 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 85952 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 309 Data size: 84048 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 85952 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.TextInputFormat output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat diff --git ql/src/test/results/clientpositive/llap/tez_vector_dynpart_hashjoin_1.q.out ql/src/test/results/clientpositive/llap/tez_vector_dynpart_hashjoin_1.q.out index d0a5e62..049f46b 100644 --- ql/src/test/results/clientpositive/llap/tez_vector_dynpart_hashjoin_1.q.out +++ ql/src/test/results/clientpositive/llap/tez_vector_dynpart_hashjoin_1.q.out @@ -77,11 +77,11 @@ STAGE PLANS: 0 _col2 (type: int) 1 _col2 (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col17, _col18, _col19, _col20, _col21, _col22, _col23 - Statistics: Num rows: 2076 Data size: 1148660 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2048 Data size: 1131300 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col2 (type: int) sort order: + - Statistics: Num rows: 2076 Data size: 1148660 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2048 Data size: 1131300 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: tinyint), _col1 (type: smallint), _col3 (type: bigint), _col4 (type: float), _col5 (type: double), _col6 
(type: string), _col7 (type: string), _col8 (type: timestamp), _col9 (type: timestamp), _col10 (type: boolean), _col11 (type: boolean), _col12 (type: tinyint), _col13 (type: smallint), _col14 (type: int), _col15 (type: bigint), _col16 (type: float), _col17 (type: double), _col18 (type: string), _col19 (type: string), _col20 (type: timestamp), _col21 (type: timestamp), _col22 (type: boolean), _col23 (type: boolean) Reducer 3 Execution mode: llap @@ -89,10 +89,10 @@ STAGE PLANS: Select Operator expressions: VALUE._col0 (type: tinyint), VALUE._col1 (type: smallint), KEY.reducesinkkey0 (type: int), VALUE._col2 (type: bigint), VALUE._col3 (type: float), VALUE._col4 (type: double), VALUE._col5 (type: string), VALUE._col6 (type: string), VALUE._col7 (type: timestamp), VALUE._col8 (type: timestamp), VALUE._col9 (type: boolean), VALUE._col10 (type: boolean), VALUE._col11 (type: tinyint), VALUE._col12 (type: smallint), VALUE._col13 (type: int), VALUE._col14 (type: bigint), VALUE._col15 (type: float), VALUE._col16 (type: double), VALUE._col17 (type: string), VALUE._col18 (type: string), VALUE._col19 (type: timestamp), VALUE._col20 (type: timestamp), VALUE._col21 (type: boolean), VALUE._col22 (type: boolean) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col17, _col18, _col19, _col20, _col21, _col22, _col23 - Statistics: Num rows: 2076 Data size: 1148660 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2048 Data size: 1131300 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 2076 Data size: 1148660 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2048 Data size: 1131300 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -206,7 +206,7 @@ STAGE 
PLANS: keys: 0 _col0 (type: int) 1 _col0 (type: int) - Statistics: Num rows: 2076 Data size: 16608 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2048 Data size: 16384 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash @@ -336,18 +336,18 @@ STAGE PLANS: 0 _col1 (type: int) 1 _col0 (type: int) outputColumnNames: _col0 - Statistics: Num rows: 2076 Data size: 6924 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2048 Data size: 6812 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: smallint) mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 623 Data size: 7064 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 631 Data size: 7148 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: smallint) sort order: + Map-reduce partition columns: _col0 (type: smallint) - Statistics: Num rows: 623 Data size: 7064 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 631 Data size: 7148 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Reducer 3 Execution mode: llap @@ -357,11 +357,11 @@ STAGE PLANS: keys: KEY._col0 (type: smallint) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 623 Data size: 7064 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 631 Data size: 7148 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: bigint) sort order: + - Statistics: Num rows: 623 Data size: 7064 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 631 Data size: 7148 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: smallint) Reducer 4 Execution mode: llap @@ -369,10 +369,10 @@ STAGE PLANS: Select Operator expressions: VALUE._col0 (type: smallint), KEY.reducesinkkey0 (type: bigint) 
outputColumnNames: _col0, _col1 - Statistics: Num rows: 623 Data size: 7064 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 631 Data size: 7148 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 623 Data size: 7064 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 631 Data size: 7148 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat diff --git ql/src/test/results/clientpositive/llap/tez_vector_dynpart_hashjoin_2.q.out ql/src/test/results/clientpositive/llap/tez_vector_dynpart_hashjoin_2.q.out index 1ce7a3a..0f1883a 100644 --- ql/src/test/results/clientpositive/llap/tez_vector_dynpart_hashjoin_2.q.out +++ ql/src/test/results/clientpositive/llap/tez_vector_dynpart_hashjoin_2.q.out @@ -105,11 +105,11 @@ STAGE PLANS: 1 UDFToInteger(_col0) (type: int) 2 (UDFToInteger(_col0) + 0) (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11 - Statistics: Num rows: 1776 Data size: 312050 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1715 Data size: 293140 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: smallint), _col0 (type: tinyint), _col2 (type: int) sort order: +++ - Statistics: Num rows: 1776 Data size: 312050 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1715 Data size: 293140 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: bigint), _col4 (type: float), _col5 (type: double), _col6 (type: string), _col7 (type: string), _col8 (type: timestamp), _col9 (type: timestamp), _col10 (type: boolean), _col11 (type: boolean) Reducer 3 Execution mode: llap @@ -117,10 +117,10 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey1 (type: tinyint), KEY.reducesinkkey0 
(type: smallint), KEY.reducesinkkey2 (type: int), VALUE._col0 (type: bigint), VALUE._col1 (type: float), VALUE._col2 (type: double), VALUE._col3 (type: string), VALUE._col4 (type: string), VALUE._col5 (type: timestamp), VALUE._col6 (type: timestamp), VALUE._col7 (type: boolean), VALUE._col8 (type: boolean) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11 - Statistics: Num rows: 1776 Data size: 312050 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1715 Data size: 293140 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 1776 Data size: 312050 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1715 Data size: 293140 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -296,11 +296,11 @@ STAGE PLANS: 1 UDFToInteger(_col0) (type: int) 2 (UDFToInteger(_col0) + 0) (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11 - Statistics: Num rows: 1776 Data size: 312050 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1715 Data size: 293140 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: smallint), _col0 (type: tinyint), _col2 (type: int) sort order: +++ - Statistics: Num rows: 1776 Data size: 312050 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1715 Data size: 293140 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: bigint), _col4 (type: float), _col5 (type: double), _col6 (type: string), _col7 (type: string), _col8 (type: timestamp), _col9 (type: timestamp), _col10 (type: boolean), _col11 (type: boolean) Reducer 3 Execution mode: vectorized, llap @@ -308,10 +308,10 @@ STAGE PLANS: Select Operator expressions: 
KEY.reducesinkkey1 (type: tinyint), KEY.reducesinkkey0 (type: smallint), KEY.reducesinkkey2 (type: int), VALUE._col0 (type: bigint), VALUE._col1 (type: float), VALUE._col2 (type: double), VALUE._col3 (type: string), VALUE._col4 (type: string), VALUE._col5 (type: timestamp), VALUE._col6 (type: timestamp), VALUE._col7 (type: boolean), VALUE._col8 (type: boolean) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11 - Statistics: Num rows: 1776 Data size: 312050 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1715 Data size: 293140 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 1776 Data size: 312050 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1715 Data size: 293140 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -487,11 +487,11 @@ STAGE PLANS: 1 UDFToInteger(_col0) (type: int) 2 (UDFToInteger(_col0) + 0) (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11 - Statistics: Num rows: 1776 Data size: 312050 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1715 Data size: 293140 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: smallint), _col0 (type: tinyint), _col2 (type: int) sort order: +++ - Statistics: Num rows: 1776 Data size: 312050 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1715 Data size: 293140 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: bigint), _col4 (type: float), _col5 (type: double), _col6 (type: string), _col7 (type: string), _col8 (type: timestamp), _col9 (type: timestamp), _col10 (type: boolean), _col11 (type: boolean) Reducer 3 Execution mode: vectorized, llap @@ -499,10 
+499,10 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey1 (type: tinyint), KEY.reducesinkkey0 (type: smallint), KEY.reducesinkkey2 (type: int), VALUE._col0 (type: bigint), VALUE._col1 (type: float), VALUE._col2 (type: double), VALUE._col3 (type: string), VALUE._col4 (type: string), VALUE._col5 (type: timestamp), VALUE._col6 (type: timestamp), VALUE._col7 (type: boolean), VALUE._col8 (type: boolean) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11 - Statistics: Num rows: 1776 Data size: 312050 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1715 Data size: 293140 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 1776 Data size: 312050 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1715 Data size: 293140 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat diff --git ql/src/test/results/clientpositive/llap/unionDistinct_3.q.out ql/src/test/results/clientpositive/llap/unionDistinct_3.q.out index 96c2124..a3d7c74 100644 --- ql/src/test/results/clientpositive/llap/unionDistinct_3.q.out +++ ql/src/test/results/clientpositive/llap/unionDistinct_3.q.out @@ -1747,10 +1747,10 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 66 Data size: 35904 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 65 Data size: 35360 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 66 Data size: 35904 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 65 Data size: 35360 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: 
org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -1896,12 +1896,12 @@ STAGE PLANS: keys: _col0 (type: string) mode: hash outputColumnNames: _col0 - Statistics: Num rows: 309 Data size: 56856 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 58144 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 309 Data size: 56856 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 58144 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: llap LLAP IO: no inputs Map 10 @@ -1917,12 +1917,12 @@ STAGE PLANS: keys: _col0 (type: string) mode: hash outputColumnNames: _col0 - Statistics: Num rows: 309 Data size: 56856 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 58144 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 309 Data size: 56856 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 58144 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: llap LLAP IO: no inputs Map 11 @@ -1938,12 +1938,12 @@ STAGE PLANS: keys: _col0 (type: string) mode: hash outputColumnNames: _col0 - Statistics: Num rows: 309 Data size: 56856 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 58144 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 309 Data size: 56856 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 58144 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: llap LLAP IO: no inputs Map 12 @@ -1959,12 +1959,12 @@ STAGE PLANS: keys: 
_col0 (type: string) mode: hash outputColumnNames: _col0 - Statistics: Num rows: 160 Data size: 29440 Basic stats: COMPLETE Column stats: PARTIAL + Statistics: Num rows: 163 Data size: 29992 Basic stats: COMPLETE Column stats: PARTIAL Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 160 Data size: 29440 Basic stats: COMPLETE Column stats: PARTIAL + Statistics: Num rows: 163 Data size: 29992 Basic stats: COMPLETE Column stats: PARTIAL Execution mode: llap LLAP IO: no inputs Map 13 @@ -1980,12 +1980,12 @@ STAGE PLANS: keys: _col0 (type: string) mode: hash outputColumnNames: _col0 - Statistics: Num rows: 85 Data size: 15640 Basic stats: COMPLETE Column stats: PARTIAL + Statistics: Num rows: 87 Data size: 16008 Basic stats: COMPLETE Column stats: PARTIAL Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 85 Data size: 15640 Basic stats: COMPLETE Column stats: PARTIAL + Statistics: Num rows: 87 Data size: 16008 Basic stats: COMPLETE Column stats: PARTIAL Execution mode: llap LLAP IO: no inputs Reducer 3 @@ -1995,17 +1995,17 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0 - Statistics: Num rows: 309 Data size: 56856 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 58144 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator keys: _col0 (type: string) mode: hash outputColumnNames: _col0 - Statistics: Num rows: 309 Data size: 56856 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 58144 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 309 Data size: 56856 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: 
Num rows: 316 Data size: 58144 Basic stats: COMPLETE Column stats: COMPLETE Reducer 5 Execution mode: llap Reduce Operator Tree: @@ -2013,17 +2013,17 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0 - Statistics: Num rows: 309 Data size: 56856 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 316 Data size: 58144 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator keys: _col0 (type: string) mode: hash outputColumnNames: _col0 - Statistics: Num rows: 160 Data size: 29440 Basic stats: COMPLETE Column stats: PARTIAL + Statistics: Num rows: 163 Data size: 29992 Basic stats: COMPLETE Column stats: PARTIAL Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 160 Data size: 29440 Basic stats: COMPLETE Column stats: PARTIAL + Statistics: Num rows: 163 Data size: 29992 Basic stats: COMPLETE Column stats: PARTIAL Reducer 7 Execution mode: llap Reduce Operator Tree: @@ -2031,17 +2031,17 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0 - Statistics: Num rows: 160 Data size: 29440 Basic stats: COMPLETE Column stats: PARTIAL + Statistics: Num rows: 163 Data size: 29992 Basic stats: COMPLETE Column stats: PARTIAL Group By Operator keys: _col0 (type: string) mode: hash outputColumnNames: _col0 - Statistics: Num rows: 85 Data size: 15640 Basic stats: COMPLETE Column stats: PARTIAL + Statistics: Num rows: 87 Data size: 16008 Basic stats: COMPLETE Column stats: PARTIAL Reduce Output Operator key expressions: _col0 (type: string) sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 85 Data size: 15640 Basic stats: COMPLETE Column stats: PARTIAL + Statistics: Num rows: 87 Data size: 16008 Basic stats: COMPLETE Column stats: PARTIAL Reducer 9 Execution mode: llap Reduce Operator Tree: @@ -2049,16 +2049,16 @@ STAGE PLANS: keys: KEY._col0 (type: 
string) mode: mergepartial outputColumnNames: _col0 - Statistics: Num rows: 85 Data size: 15640 Basic stats: COMPLETE Column stats: PARTIAL + Statistics: Num rows: 87 Data size: 16008 Basic stats: COMPLETE Column stats: PARTIAL Group By Operator aggregations: count(1) keys: _col0 (type: string) mode: complete outputColumnNames: _col0, _col1 - Statistics: Num rows: 85 Data size: 16320 Basic stats: COMPLETE Column stats: PARTIAL + Statistics: Num rows: 87 Data size: 16704 Basic stats: COMPLETE Column stats: PARTIAL File Output Operator compressed: false - Statistics: Num rows: 85 Data size: 16320 Basic stats: COMPLETE Column stats: PARTIAL + Statistics: Num rows: 87 Data size: 16704 Basic stats: COMPLETE Column stats: PARTIAL table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat diff --git ql/src/test/results/clientpositive/llap/union_top_level.q.out ql/src/test/results/clientpositive/llap/union_top_level.q.out index 9635cad..2681c6a 100644 --- ql/src/test/results/clientpositive/llap/union_top_level.q.out +++ ql/src/test/results/clientpositive/llap/union_top_level.q.out @@ -274,15 +274,15 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col1, _col2 - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col2 (type: string), _col1 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column 
stats: COMPLETE TopN Hash Memory Usage: 0.1 value expressions: _col1 (type: string) Reducer 3 @@ -291,7 +291,7 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: string), VALUE._col0 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 10 Statistics: Num rows: 10 Data size: 1780 Basic stats: COMPLETE Column stats: COMPLETE @@ -312,15 +312,15 @@ STAGE PLANS: 0 _col0 (type: string) 1 _col0 (type: string) outputColumnNames: _col1, _col2 - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col2 (type: string), _col1 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) sort order: + - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE TopN Hash Memory Usage: 0.1 value expressions: _col1 (type: string) Reducer 6 @@ -329,7 +329,7 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: string), VALUE._col0 (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 809 Data size: 144002 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 791 Data size: 140798 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 10 Statistics: Num rows: 10 Data size: 1780 Basic stats: COMPLETE Column stats: COMPLETE diff --git ql/src/test/results/clientpositive/llap/vector_groupby_mapjoin.q.out 
ql/src/test/results/clientpositive/llap/vector_groupby_mapjoin.q.out index 82b6ba0..43a6ddd 100644 --- ql/src/test/results/clientpositive/llap/vector_groupby_mapjoin.q.out +++ ql/src/test/results/clientpositive/llap/vector_groupby_mapjoin.q.out @@ -155,10 +155,10 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2, _col3, _col5 input vertices: 1 Reducer 6 - Statistics: Num rows: 500 Data size: 98620 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 500 Data size: 98584 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ((_col2 = 0) or (_col5 is null and _col0 is not null and (_col3 >= _col2))) (type: boolean) - Statistics: Num rows: 500 Data size: 98620 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 500 Data size: 98584 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string), _col1 (type: string) outputColumnNames: _col0, _col1 diff --git ql/src/test/results/clientpositive/llap/vector_left_outer_join.q.out ql/src/test/results/clientpositive/llap/vector_left_outer_join.q.out index dc8f47e..b269f9b 100644 --- ql/src/test/results/clientpositive/llap/vector_left_outer_join.q.out +++ ql/src/test/results/clientpositive/llap/vector_left_outer_join.q.out @@ -51,7 +51,7 @@ STAGE PLANS: outputColumnNames: _col0 input vertices: 1 Map 3 - Statistics: Num rows: 25044 Data size: 87720 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 24737 Data size: 86492 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Left Outer Join 0 to 1 @@ -60,7 +60,7 @@ STAGE PLANS: 1 _col0 (type: tinyint) input vertices: 1 Map 4 - Statistics: Num rows: 2423154 Data size: 19385232 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2393450 Data size: 19147600 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash diff --git ql/src/test/results/clientpositive/llap/vectorization_short_regress.q.out 
ql/src/test/results/clientpositive/llap/vectorization_short_regress.q.out index 0027ab5..facf121 100644 --- ql/src/test/results/clientpositive/llap/vectorization_short_regress.q.out +++ ql/src/test/results/clientpositive/llap/vectorization_short_regress.q.out @@ -2202,7 +2202,7 @@ STAGE PLANS: keys: csmallint (type: smallint) mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 1141 Data size: 204228 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1156 Data size: 206912 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: smallint) sort order: + @@ -2211,7 +2211,7 @@ STAGE PLANS: className: VectorReduceSinkLongOperator native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true - Statistics: Num rows: 1141 Data size: 204228 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1156 Data size: 206912 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: struct), _col2 (type: bigint), _col3 (type: struct), _col4 (type: bigint) Execution mode: vectorized, llap LLAP IO: all inputs @@ -2246,7 +2246,7 @@ STAGE PLANS: keys: KEY._col0 (type: smallint) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 1141 Data size: 39924 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1156 Data size: 40448 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: smallint), (UDFToInteger(_col0) % -75) (type: int), _col1 (type: double), (-1.389 / CAST( _col0 AS decimal(5,0))) (type: decimal(10,9)), _col2 (type: bigint), (UDFToDouble((UDFToInteger(_col0) % -75)) / UDFToDouble(_col2)) (type: double), (- (UDFToInteger(_col0) % -75)) (type: int), _col3 (type: 
double), (- (- (UDFToInteger(_col0) % -75))) (type: int), _col4 (type: bigint), (_col4 - -89010) (type: bigint) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10 @@ -2255,7 +2255,7 @@ STAGE PLANS: native: true projectedOutputColumnNums: [0, 5, 1, 7, 2, 11, 12, 3, 8, 4, 13] selectExpressions: LongColModuloLongScalar(col 0:int, val -75)(children: col 0:smallint) -> 5:int, DecimalScalarDivideDecimalColumn(val -1.389, col 6:decimal(5,0))(children: CastLongToDecimal(col 0:smallint) -> 6:decimal(5,0)) -> 7:decimal(10,9), DoubleColDivideDoubleColumn(col 9:double, col 10:double)(children: CastLongToDouble(col 8:int)(children: LongColModuloLongScalar(col 0:int, val -75)(children: col 0:smallint) -> 8:int) -> 9:double, CastLongToDouble(col 2:bigint) -> 10:double) -> 11:double, LongColUnaryMinus(col 8:int)(children: LongColModuloLongScalar(col 0:int, val -75)(children: col 0:smallint) -> 8:int) -> 12:int, LongColUnaryMinus(col 13:int)(children: LongColUnaryMinus(col 8:int)(children: LongColModuloLongScalar(col 0:int, val -75)(children: col 0:smallint) -> 8:int) -> 13:int) -> 8:int, LongColSubtractLongScalar(col 4:bigint, val -89010) -> 13:bigint - Statistics: Num rows: 1141 Data size: 199664 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1156 Data size: 202288 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: smallint), _col1 (type: int), _col2 (type: double), _col3 (type: decimal(10,9)), _col4 (type: bigint), _col5 (type: double), _col6 (type: int), _col7 (type: double), _col8 (type: int), _col9 (type: bigint), _col10 (type: bigint) sort order: +++++++++++ @@ -2263,7 +2263,7 @@ STAGE PLANS: className: VectorReduceSinkObjectHashOperator native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS 
true, LazyBinarySerDe for values IS true - Statistics: Num rows: 1141 Data size: 199664 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1156 Data size: 202288 Basic stats: COMPLETE Column stats: COMPLETE TopN Hash Memory Usage: 0.1 Reducer 3 Execution mode: vectorized, llap @@ -2281,7 +2281,7 @@ STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10] - Statistics: Num rows: 1141 Data size: 199664 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1156 Data size: 202288 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 20 Limit Vectorization: @@ -2478,7 +2478,7 @@ STAGE PLANS: keys: cdouble (type: double) mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 1136 Data size: 306696 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1127 Data size: 304272 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: double) sort order: + @@ -2487,7 +2487,7 @@ STAGE PLANS: className: VectorReduceSinkMultiKeyOperator native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true - Statistics: Num rows: 1136 Data size: 306696 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1127 Data size: 304272 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: struct), _col2 (type: bigint), _col3 (type: double), _col4 (type: struct), _col5 (type: struct), _col6 (type: double) Execution mode: vectorized, llap LLAP IO: all inputs @@ -2522,7 +2522,7 @@ STAGE PLANS: keys: KEY._col0 (type: double) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 1136 Data size: 61320 
Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1127 Data size: 60840 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: double), _col1 (type: double), (2563.58 * _col1) (type: double), (- _col1) (type: double), _col2 (type: bigint), ((2563.58 * _col1) + -5638.15) (type: double), ((- _col1) * ((2563.58 * _col1) + -5638.15)) (type: double), _col3 (type: double), _col4 (type: double), (_col0 - (- _col1)) (type: double), _col5 (type: double), (_col0 + _col1) (type: double), (_col0 * 762.0) (type: double), _col6 (type: double), (-863.257 % (_col0 * 762.0)) (type: double) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14 @@ -2531,7 +2531,7 @@ STAGE PLANS: native: true projectedOutputColumnNums: [0, 1, 7, 8, 2, 10, 11, 3, 4, 12, 5, 9, 13, 6, 15] selectExpressions: DoubleScalarMultiplyDoubleColumn(val 2563.58, col 1:double) -> 7:double, DoubleColUnaryMinus(col 1:double) -> 8:double, DoubleColAddDoubleScalar(col 9:double, val -5638.15)(children: DoubleScalarMultiplyDoubleColumn(val 2563.58, col 1:double) -> 9:double) -> 10:double, DoubleColMultiplyDoubleColumn(col 9:double, col 12:double)(children: DoubleColUnaryMinus(col 1:double) -> 9:double, DoubleColAddDoubleScalar(col 11:double, val -5638.15)(children: DoubleScalarMultiplyDoubleColumn(val 2563.58, col 1:double) -> 11:double) -> 12:double) -> 11:double, DoubleColSubtractDoubleColumn(col 0:double, col 9:double)(children: DoubleColUnaryMinus(col 1:double) -> 9:double) -> 12:double, DoubleColAddDoubleColumn(col 0:double, col 1:double) -> 9:double, DoubleColMultiplyDoubleScalar(col 0:double, val 762.0) -> 13:double, DoubleScalarModuloDoubleColumn(val -863.257, col 14:double)(children: DoubleColMultiplyDoubleScalar(col 0:double, val 762.0) -> 14:double) -> 15:double - Statistics: Num rows: 1136 Data size: 143112 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1127 Data 
size: 141984 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: double) sort order: + @@ -2539,7 +2539,7 @@ STAGE PLANS: className: VectorReduceSinkObjectHashOperator native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true - Statistics: Num rows: 1136 Data size: 143112 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1127 Data size: 141984 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: double), _col2 (type: double), _col3 (type: double), _col4 (type: bigint), _col5 (type: double), _col6 (type: double), _col7 (type: double), _col8 (type: double), _col9 (type: double), _col10 (type: double), _col11 (type: double), _col12 (type: double), _col13 (type: double), _col14 (type: double) Reducer 3 Execution mode: vectorized, llap @@ -2557,13 +2557,13 @@ STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 13] - Statistics: Num rows: 1136 Data size: 143112 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1127 Data size: 141984 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false File Sink Vectorization: className: VectorFileSinkOperator native: false - Statistics: Num rows: 1136 Data size: 143112 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1127 Data size: 141984 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat diff --git ql/src/test/results/clientpositive/llap/vectorized_mapjoin.q.out ql/src/test/results/clientpositive/llap/vectorized_mapjoin.q.out index 0dff57a..6916b33 100644 --- 
ql/src/test/results/clientpositive/llap/vectorized_mapjoin.q.out +++ ql/src/test/results/clientpositive/llap/vectorized_mapjoin.q.out @@ -58,7 +58,7 @@ STAGE PLANS: outputColumnNames: _col0, _col1 input vertices: 1 Map 3 - Statistics: Num rows: 18694 Data size: 130960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 18464 Data size: 129120 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: int), _col1 (type: int), (_col0 + _col1) (type: int) outputColumnNames: _col0, _col1, _col2 @@ -67,7 +67,7 @@ STAGE PLANS: native: true projectedOutputColumnNums: [2, 2, 13] selectExpressions: LongColAddLongColumn(col 2:int, col 2:int) -> 13:int - Statistics: Num rows: 18694 Data size: 130960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 18464 Data size: 129120 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count(_col0), max(_col1), min(_col0), avg(_col2) Group By Vectorization: diff --git ql/src/test/results/clientpositive/llap/vectorized_nested_mapjoin.q.out ql/src/test/results/clientpositive/llap/vectorized_nested_mapjoin.q.out index 80e1cab..f876656 100644 --- ql/src/test/results/clientpositive/llap/vectorized_nested_mapjoin.q.out +++ ql/src/test/results/clientpositive/llap/vectorized_nested_mapjoin.q.out @@ -54,7 +54,7 @@ STAGE PLANS: outputColumnNames: _col1 input vertices: 1 Map 4 - Statistics: Num rows: 1284939 Data size: 10267240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1268540 Data size: 10136048 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col1) mode: hash diff --git ql/src/test/results/clientpositive/llap/vectorized_shufflejoin.q.out ql/src/test/results/clientpositive/llap/vectorized_shufflejoin.q.out index 72216d3..ba11284 100644 --- ql/src/test/results/clientpositive/llap/vectorized_shufflejoin.q.out +++ ql/src/test/results/clientpositive/llap/vectorized_shufflejoin.q.out @@ -118,11 +118,11 @@ 
STAGE PLANS: 0 _col0 (type: int) 1 _col0 (type: int) outputColumnNames: _col0, _col1 - Statistics: Num rows: 18694 Data size: 130960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 18464 Data size: 129120 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: int), _col1 (type: int), (_col0 + _col1) (type: int) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 18694 Data size: 130960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 18464 Data size: 129120 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count(_col0), max(_col1), min(_col0), avg(_col2) mode: hash diff --git ql/src/test/results/clientpositive/mapjoin_mapjoin.q.out ql/src/test/results/clientpositive/mapjoin_mapjoin.q.out index c2c514f..f78c32c 100644 --- ql/src/test/results/clientpositive/mapjoin_mapjoin.q.out +++ ql/src/test/results/clientpositive/mapjoin_mapjoin.q.out @@ -526,24 +526,24 @@ STAGE PLANS: Stage: Stage-9 Map Reduce Local Work Alias -> Map Local Tables: - $hdt$_1:src + $hdt$_1:src1 Fetch Operator limit: -1 Alias -> Map Local Operator Tree: - $hdt$_1:src + $hdt$_1:src1 TableScan - alias: src + alias: src1 Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Filter Operator - predicate: value is not null (type: boolean) + predicate: key is not null (type: boolean) Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Select Operator - expressions: value (type: string) + expressions: key (type: string) outputColumnNames: _col0 Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE HashTable Sink Operator keys: - 0 _col1 (type: string) + 0 _col0 (type: string) 1 _col0 (type: string) Stage: Stage-7 @@ -563,9 +563,9 @@ STAGE PLANS: condition map: Inner Join 0 to 1 keys: - 0 _col1 (type: string) + 0 _col0 (type: string) 1 _col0 (type: string) - outputColumnNames: _col0, _col2 + outputColumnNames: 
_col1, _col2 Statistics: Num rows: 2200 Data size: 23372 Basic stats: COMPLETE Column stats: NONE File Output Operator compressed: false @@ -579,24 +579,24 @@ STAGE PLANS: Stage: Stage-8 Map Reduce Local Work Alias -> Map Local Tables: - $hdt$_2:src1 + $hdt$_2:src Fetch Operator limit: -1 Alias -> Map Local Operator Tree: - $hdt$_2:src1 + $hdt$_2:src TableScan - alias: src1 + alias: src Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Filter Operator - predicate: key is not null (type: boolean) + predicate: value is not null (type: boolean) Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Select Operator - expressions: key (type: string) + expressions: value (type: string) outputColumnNames: _col0 Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE HashTable Sink Operator keys: - 0 _col0 (type: string) + 0 _col1 (type: string) 1 _col0 (type: string) Stage: Stage-3 @@ -607,7 +607,7 @@ STAGE PLANS: condition map: Inner Join 0 to 1 keys: - 0 _col0 (type: string) + 0 _col1 (type: string) 1 _col0 (type: string) outputColumnNames: _col2 Statistics: Num rows: 2420 Data size: 25709 Basic stats: COMPLETE Column stats: NONE diff --git ql/src/test/results/clientpositive/spark/bucket_map_join_tez1.q.out ql/src/test/results/clientpositive/spark/bucket_map_join_tez1.q.out index 461c7da..2c86b3a 100644 --- ql/src/test/results/clientpositive/spark/bucket_map_join_tez1.q.out +++ ql/src/test/results/clientpositive/spark/bucket_map_join_tez1.q.out @@ -4269,74 +4269,74 @@ STAGE PLANS: outputColumnNames: _col0, _col1 Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator - key expressions: _col0 (type: int) + key expressions: _col1 (type: string) sort order: + - Map-reduce partition columns: _col0 (type: int) + Map-reduce partition columns: _col1 (type: string) Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: 
NONE - value expressions: _col1 (type: string) + value expressions: _col0 (type: int) Map 4 Map Operator Tree: TableScan - alias: c + alias: b Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Filter Operator - predicate: key is not null (type: boolean) + predicate: value is not null (type: boolean) Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Select Operator - expressions: key (type: int) - outputColumnNames: _col0 + expressions: key (type: int), value (type: string) + outputColumnNames: _col0, _col1 Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator - key expressions: _col0 (type: int) + key expressions: _col1 (type: string) sort order: + - Map-reduce partition columns: _col0 (type: int) + Map-reduce partition columns: _col1 (type: string) Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + value expressions: _col0 (type: int) Map 5 Map Operator Tree: TableScan - alias: b + alias: c Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Filter Operator - predicate: value is not null (type: boolean) + predicate: key is not null (type: boolean) Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Select Operator - expressions: key (type: int), value (type: string) - outputColumnNames: _col0, _col1 + expressions: key (type: int) + outputColumnNames: _col0 Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator - key expressions: _col1 (type: string) + key expressions: _col0 (type: int) sort order: + - Map-reduce partition columns: _col1 (type: string) + Map-reduce partition columns: _col0 (type: int) Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - value expressions: _col0 (type: int) Reducer 2 Reduce Operator Tree: Join Operator condition map: Inner Join 0 to 1 keys: 
- 0 _col0 (type: int) - 1 _col0 (type: int) - outputColumnNames: _col0, _col1 + 0 _col1 (type: string) + 1 _col1 (type: string) + outputColumnNames: _col0, _col2 Statistics: Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator - key expressions: _col1 (type: string) + key expressions: _col0 (type: int) sort order: + - Map-reduce partition columns: _col1 (type: string) + Map-reduce partition columns: _col0 (type: int) Statistics: Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - value expressions: _col0 (type: int) + value expressions: _col2 (type: int) Reducer 3 Reduce Operator Tree: Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col1 (type: string) - 1 _col1 (type: string) - outputColumnNames: _col0, _col3 + 0 _col0 (type: int) + 1 _col0 (type: int) + outputColumnNames: _col0, _col2 Statistics: Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE Select Operator - expressions: _col0 (type: int), _col3 (type: int) + expressions: _col0 (type: int), _col2 (type: int) outputColumnNames: _col0, _col1 Statistics: Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE File Output Operator @@ -4382,74 +4382,74 @@ STAGE PLANS: outputColumnNames: _col0, _col1 Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator - key expressions: _col0 (type: int) + key expressions: _col1 (type: string) sort order: + - Map-reduce partition columns: _col0 (type: int) + Map-reduce partition columns: _col1 (type: string) Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - value expressions: _col1 (type: string) + value expressions: _col0 (type: int) Map 4 Map Operator Tree: TableScan - alias: c + alias: b Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Filter Operator - predicate: key is not null (type: boolean) + predicate: value is not null (type: boolean) 
Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Select Operator - expressions: key (type: int) - outputColumnNames: _col0 + expressions: key (type: int), value (type: string) + outputColumnNames: _col0, _col1 Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator - key expressions: _col0 (type: int) + key expressions: _col1 (type: string) sort order: + - Map-reduce partition columns: _col0 (type: int) + Map-reduce partition columns: _col1 (type: string) Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + value expressions: _col0 (type: int) Map 5 Map Operator Tree: TableScan - alias: b + alias: c Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Filter Operator - predicate: value is not null (type: boolean) + predicate: key is not null (type: boolean) Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Select Operator - expressions: key (type: int), value (type: string) - outputColumnNames: _col0, _col1 + expressions: key (type: int) + outputColumnNames: _col0 Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator - key expressions: _col1 (type: string) + key expressions: _col0 (type: int) sort order: + - Map-reduce partition columns: _col1 (type: string) + Map-reduce partition columns: _col0 (type: int) Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - value expressions: _col0 (type: int) Reducer 2 Reduce Operator Tree: Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col0 (type: int) - 1 _col0 (type: int) - outputColumnNames: _col0, _col1 + 0 _col1 (type: string) + 1 _col1 (type: string) + outputColumnNames: _col0, _col2 Statistics: Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator - key expressions: _col1 (type: string) + key expressions: _col0 
(type: int) sort order: + - Map-reduce partition columns: _col1 (type: string) + Map-reduce partition columns: _col0 (type: int) Statistics: Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - value expressions: _col0 (type: int) + value expressions: _col2 (type: int) Reducer 3 Reduce Operator Tree: Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col1 (type: string) - 1 _col1 (type: string) - outputColumnNames: _col0, _col3 + 0 _col0 (type: int) + 1 _col0 (type: int) + outputColumnNames: _col0, _col2 Statistics: Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE Select Operator - expressions: _col0 (type: int), _col3 (type: int) + expressions: _col0 (type: int), _col2 (type: int) outputColumnNames: _col0, _col1 Statistics: Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE File Output Operator diff --git ql/src/test/results/clientpositive/spark/bucket_map_join_tez2.q.out ql/src/test/results/clientpositive/spark/bucket_map_join_tez2.q.out index 3ce67e2..f26a318 100644 --- ql/src/test/results/clientpositive/spark/bucket_map_join_tez2.q.out +++ ql/src/test/results/clientpositive/spark/bucket_map_join_tez2.q.out @@ -193,74 +193,74 @@ STAGE PLANS: outputColumnNames: _col0, _col1 Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator - key expressions: _col0 (type: int) + key expressions: _col1 (type: string) sort order: + - Map-reduce partition columns: _col0 (type: int) + Map-reduce partition columns: _col1 (type: string) Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - value expressions: _col1 (type: string) + value expressions: _col0 (type: int) Map 4 Map Operator Tree: TableScan - alias: c + alias: b Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Filter Operator - predicate: key is not null (type: boolean) + predicate: value is not null (type: boolean) Statistics: Num rows: 
500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Select Operator - expressions: key (type: int) - outputColumnNames: _col0 + expressions: key (type: int), value (type: string) + outputColumnNames: _col0, _col1 Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator - key expressions: _col0 (type: int) + key expressions: _col1 (type: string) sort order: + - Map-reduce partition columns: _col0 (type: int) + Map-reduce partition columns: _col1 (type: string) Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + value expressions: _col0 (type: int) Map 5 Map Operator Tree: TableScan - alias: b + alias: c Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Filter Operator - predicate: value is not null (type: boolean) + predicate: key is not null (type: boolean) Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Select Operator - expressions: key (type: int), value (type: string) - outputColumnNames: _col0, _col1 + expressions: key (type: int) + outputColumnNames: _col0 Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator - key expressions: _col1 (type: string) + key expressions: _col0 (type: int) sort order: + - Map-reduce partition columns: _col1 (type: string) + Map-reduce partition columns: _col0 (type: int) Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - value expressions: _col0 (type: int) Reducer 2 Reduce Operator Tree: Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col0 (type: int) - 1 _col0 (type: int) - outputColumnNames: _col0, _col1 + 0 _col1 (type: string) + 1 _col1 (type: string) + outputColumnNames: _col0, _col2 Statistics: Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator - key expressions: _col1 (type: string) + key expressions: _col0 (type: int) sort order: 
+ - Map-reduce partition columns: _col1 (type: string) + Map-reduce partition columns: _col0 (type: int) Statistics: Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - value expressions: _col0 (type: int) + value expressions: _col2 (type: int) Reducer 3 Reduce Operator Tree: Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col1 (type: string) - 1 _col1 (type: string) - outputColumnNames: _col0, _col3 + 0 _col0 (type: int) + 1 _col0 (type: int) + outputColumnNames: _col0, _col2 Statistics: Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE Select Operator - expressions: _col0 (type: int), _col3 (type: int) + expressions: _col0 (type: int), _col2 (type: int) outputColumnNames: _col0, _col1 Statistics: Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE File Output Operator @@ -306,74 +306,74 @@ STAGE PLANS: outputColumnNames: _col0, _col1 Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator - key expressions: _col0 (type: int) + key expressions: _col1 (type: string) sort order: + - Map-reduce partition columns: _col0 (type: int) + Map-reduce partition columns: _col1 (type: string) Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - value expressions: _col1 (type: string) + value expressions: _col0 (type: int) Map 4 Map Operator Tree: TableScan - alias: c + alias: b Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Filter Operator - predicate: key is not null (type: boolean) + predicate: value is not null (type: boolean) Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Select Operator - expressions: key (type: int) - outputColumnNames: _col0 + expressions: key (type: int), value (type: string) + outputColumnNames: _col0, _col1 Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator - key expressions: 
_col0 (type: int) + key expressions: _col1 (type: string) sort order: + - Map-reduce partition columns: _col0 (type: int) + Map-reduce partition columns: _col1 (type: string) Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + value expressions: _col0 (type: int) Map 5 Map Operator Tree: TableScan - alias: b + alias: c Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Filter Operator - predicate: value is not null (type: boolean) + predicate: key is not null (type: boolean) Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Select Operator - expressions: key (type: int), value (type: string) - outputColumnNames: _col0, _col1 + expressions: key (type: int) + outputColumnNames: _col0 Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator - key expressions: _col1 (type: string) + key expressions: _col0 (type: int) sort order: + - Map-reduce partition columns: _col1 (type: string) + Map-reduce partition columns: _col0 (type: int) Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - value expressions: _col0 (type: int) Reducer 2 Reduce Operator Tree: Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col0 (type: int) - 1 _col0 (type: int) - outputColumnNames: _col0, _col1 + 0 _col1 (type: string) + 1 _col1 (type: string) + outputColumnNames: _col0, _col2 Statistics: Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator - key expressions: _col1 (type: string) + key expressions: _col0 (type: int) sort order: + - Map-reduce partition columns: _col1 (type: string) + Map-reduce partition columns: _col0 (type: int) Statistics: Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - value expressions: _col0 (type: int) + value expressions: _col2 (type: int) Reducer 3 Reduce Operator Tree: Join Operator condition map: Inner Join 0 to 1 
keys: - 0 _col1 (type: string) - 1 _col1 (type: string) - outputColumnNames: _col0, _col3 + 0 _col0 (type: int) + 1 _col0 (type: int) + outputColumnNames: _col0, _col2 Statistics: Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE Select Operator - expressions: _col0 (type: int), _col3 (type: int) + expressions: _col0 (type: int), _col2 (type: int) outputColumnNames: _col0, _col1 Statistics: Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE File Output Operator diff --git ql/src/test/results/clientpositive/spark/join32_lessSize.q.out ql/src/test/results/clientpositive/spark/join32_lessSize.q.out index d3e648f..ba60639 100644 --- ql/src/test/results/clientpositive/spark/join32_lessSize.q.out +++ ql/src/test/results/clientpositive/spark/join32_lessSize.q.out @@ -478,26 +478,25 @@ JOIN src y ON (x.key = y.key) JOIN src1 z ON (x.key = z.key) POSTHOOK: type: QUERY STAGE DEPENDENCIES: - Stage-4 is a root stage - Stage-3 depends on stages: Stage-4 + Stage-3 is a root stage Stage-1 depends on stages: Stage-3 Stage-0 depends on stages: Stage-1 Stage-2 depends on stages: Stage-0 STAGE PLANS: - Stage: Stage-4 + Stage: Stage-3 Spark #### A masked pattern was here #### Vertices: - Map 2 + Map 1 Map Operator Tree: TableScan - alias: z + alias: x Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE GatherStats: false Filter Operator isSamplingPred: false - predicate: key is not null (type: boolean) + predicate: (key is not null and value is not null) (type: boolean) Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE Select Operator expressions: key (type: string), value (type: string) @@ -507,7 +506,8 @@ STAGE PLANS: keys: 0 _col0 (type: string) 1 _col0 (type: string) - Position of Big Table: 0 + 2 _col0 (type: string) + Position of Big Table: 2 Local Work: Map Reduce Local Work Path -> Alias: @@ -560,42 +560,27 @@ STAGE PLANS: name: default.src1 name: default.src1 Truncated Path -> 
Alias: - /src1 [$hdt$_3:z] - - Stage: Stage-3 - Spark -#### A masked pattern was here #### - Vertices: - Map 1 + /src1 [$hdt$_2:x] + Map 2 Map Operator Tree: TableScan - alias: x + alias: z Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE GatherStats: false Filter Operator isSamplingPred: false - predicate: (key is not null and value is not null) (type: boolean) + predicate: key is not null (type: boolean) Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE Select Operator expressions: key (type: string), value (type: string) outputColumnNames: _col0, _col1 Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - Map Join Operator - condition map: - Inner Join 0 to 1 + Spark HashTable Sink Operator keys: 0 _col0 (type: string) 1 _col0 (type: string) - outputColumnNames: _col0, _col1, _col3 - input vertices: - 1 Map 2 - Position of Big Table: 0 - Statistics: Num rows: 27 Data size: 210 Basic stats: COMPLETE Column stats: NONE - Spark HashTable Sink Operator - keys: - 0 _col1 (type: string) - 1 _col0 (type: string) - Position of Big Table: 1 + 2 _col0 (type: string) + Position of Big Table: 2 Local Work: Map Reduce Local Work Path -> Alias: @@ -648,24 +633,24 @@ STAGE PLANS: name: default.src1 name: default.src1 Truncated Path -> Alias: - /src1 [$hdt$_2:x] + /src1 [$hdt$_3:z] Map 4 Map Operator Tree: TableScan - alias: y + alias: w Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE GatherStats: false Filter Operator isSamplingPred: false - predicate: key is not null (type: boolean) + predicate: value is not null (type: boolean) Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Select Operator - expressions: key (type: string), value (type: string) - outputColumnNames: _col0, _col1 + expressions: value (type: string) + outputColumnNames: _col0 Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column 
stats: NONE Spark HashTable Sink Operator keys: - 0 _col0 (type: string) + 0 _col1 (type: string) 1 _col0 (type: string) Position of Big Table: 0 Local Work: @@ -720,7 +705,7 @@ STAGE PLANS: name: default.src name: default.src Truncated Path -> Alias: - /src [$hdt$_0:y] + /src [$hdt$_0:w] Stage: Stage-1 Spark @@ -729,49 +714,52 @@ STAGE PLANS: Map 3 Map Operator Tree: TableScan - alias: w + alias: y Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE GatherStats: false Filter Operator isSamplingPred: false - predicate: value is not null (type: boolean) + predicate: key is not null (type: boolean) Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Select Operator - expressions: value (type: string) - outputColumnNames: _col0 + expressions: key (type: string), value (type: string) + outputColumnNames: _col0, _col1 Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Map Join Operator condition map: Inner Join 0 to 1 + Inner Join 0 to 2 keys: - 0 _col1 (type: string) + 0 _col0 (type: string) 1 _col0 (type: string) - outputColumnNames: _col0, _col3 + 2 _col0 (type: string) + outputColumnNames: _col0, _col1, _col3, _col5 input vertices: 0 Map 1 - Position of Big Table: 1 - Statistics: Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE + 1 Map 2 + Position of Big Table: 2 + Statistics: Num rows: 1100 Data size: 11686 Basic stats: COMPLETE Column stats: NONE Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col0 (type: string) + 0 _col1 (type: string) 1 _col0 (type: string) - outputColumnNames: _col0, _col3, _col6 + outputColumnNames: _col0, _col3, _col5 input vertices: 1 Map 4 Position of Big Table: 0 - Statistics: Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1210 Data size: 12854 Basic stats: COMPLETE Column stats: NONE Select Operator - expressions: _col0 (type: string), _col3 (type: string), 
_col6 (type: string) + expressions: _col0 (type: string), _col3 (type: string), _col5 (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1210 Data size: 12854 Basic stats: COMPLETE Column stats: NONE File Output Operator compressed: false GlobalTableId: 1 #### A masked pattern was here #### NumFilesPerFileSink: 1 - Statistics: Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 1210 Data size: 12854 Basic stats: COMPLETE Column stats: NONE #### A masked pattern was here #### table: input format: org.apache.hadoop.mapred.TextInputFormat @@ -850,7 +838,7 @@ STAGE PLANS: name: default.src name: default.src Truncated Path -> Alias: - /src [$hdt$_1:w] + /src [$hdt$_1:y] Stage: Stage-0 Move Operator diff --git ql/src/test/results/clientpositive/spark/mapjoin_mapjoin.q.out ql/src/test/results/clientpositive/spark/mapjoin_mapjoin.q.out index 618c7e0..98a3446 100644 --- ql/src/test/results/clientpositive/spark/mapjoin_mapjoin.q.out +++ ql/src/test/results/clientpositive/spark/mapjoin_mapjoin.q.out @@ -552,18 +552,18 @@ STAGE PLANS: Map 5 Map Operator Tree: TableScan - alias: src1 + alias: src Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Filter Operator - predicate: key is not null (type: boolean) + predicate: value is not null (type: boolean) Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Select Operator - expressions: key (type: string) + expressions: value (type: string) outputColumnNames: _col0 Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Spark HashTable Sink Operator keys: - 0 _col0 (type: string) + 0 _col1 (type: string) 1 _col0 (type: string) Local Work: Map Reduce Local Work @@ -588,21 +588,21 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2 Statistics: Num rows: 2000 Data size: 21248 Basic stats: 
COMPLETE Column stats: NONE Reduce Output Operator - key expressions: _col1 (type: string) + key expressions: _col0 (type: string) sort order: + - Map-reduce partition columns: _col1 (type: string) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 2000 Data size: 21248 Basic stats: COMPLETE Column stats: NONE - value expressions: _col0 (type: string), _col2 (type: string) + value expressions: _col1 (type: string), _col2 (type: string) Map 4 Map Operator Tree: TableScan - alias: src + alias: src1 Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Filter Operator - predicate: value is not null (type: boolean) + predicate: key is not null (type: boolean) Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Select Operator - expressions: value (type: string) + expressions: key (type: string) outputColumnNames: _col0 Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator @@ -618,15 +618,15 @@ STAGE PLANS: condition map: Inner Join 0 to 1 keys: - 0 _col1 (type: string) + 0 _col0 (type: string) 1 _col0 (type: string) - outputColumnNames: _col0, _col2 + outputColumnNames: _col1, _col2 Statistics: Num rows: 2200 Data size: 23372 Basic stats: COMPLETE Column stats: NONE Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col0 (type: string) + 0 _col1 (type: string) 1 _col0 (type: string) outputColumnNames: _col2 input vertices: diff --git ql/src/test/results/clientpositive/spark/spark_explainuser_1.q.out ql/src/test/results/clientpositive/spark/spark_explainuser_1.q.out index 6a4bea1..64badf1 100644 --- ql/src/test/results/clientpositive/spark/spark_explainuser_1.q.out +++ ql/src/test/results/clientpositive/spark/spark_explainuser_1.q.out @@ -1693,9 +1693,9 @@ Stage-0 Stage-1 Reducer 2 File Output Operator [FS_19] - Select Operator [SEL_18] (rows=366 width=178) + Select Operator [SEL_18] (rows=365 width=178) 
Output:["_col0","_col1"] - Filter Operator [FIL_17] (rows=366 width=179) + Filter Operator [FIL_17] (rows=365 width=179) predicate:_col3 is null Join Operator [JOIN_16] (rows=500 width=179) Output:["_col0","_col1","_col3"],condition map:[{"":"{\"type\":\"Left Outer\",\"left\":0,\"right\":1}"}],keys:{"0":"_col1","1":"_col0"} @@ -1758,9 +1758,9 @@ Stage-0 Stage-1 Reducer 3 File Output Operator [FS_18] - Select Operator [SEL_17] (rows=183 width=178) + Select Operator [SEL_17] (rows=185 width=178) Output:["_col0","_col1"] - Filter Operator [FIL_16] (rows=183 width=179) + Filter Operator [FIL_16] (rows=185 width=179) predicate:_col4 is null Join Operator [JOIN_15] (rows=250 width=179) Output:["_col0","_col1","_col4"],condition map:[{"":"{\"type\":\"Left Outer\",\"left\":0,\"right\":1}"}],keys:{"0":"_col0, _col1","1":"_col0, _col1"} @@ -1834,7 +1834,7 @@ Stage-0 Stage-1 Reducer 2 File Output Operator [FS_12] - Join Operator [JOIN_10] (rows=133 width=178) + Join Operator [JOIN_10] (rows=131 width=178) Output:["_col0","_col1"],condition map:[{"":"{\"type\":\"Left Semi\",\"left\":0,\"right\":1}"}],keys:{"0":"_col0, _col1","1":"_col0, _col1"} <-Map 1 [PARTITION-LEVEL SORT] PARTITION-LEVEL SORT [RS_8] @@ -1886,7 +1886,7 @@ Stage-0 Stage-1 Reducer 2 File Output Operator [FS_12] - Join Operator [JOIN_10] (rows=133 width=178) + Join Operator [JOIN_10] (rows=131 width=178) Output:["_col0","_col1"],condition map:[{"":"{\"type\":\"Left Semi\",\"left\":0,\"right\":1}"}],keys:{"0":"_col0, _col1","1":"_col0, _col1"} <-Map 1 [PARTITION-LEVEL SORT] PARTITION-LEVEL SORT [RS_8] @@ -1928,7 +1928,7 @@ Stage-0 Stage-1 Reducer 2 File Output Operator [FS_12] - Join Operator [JOIN_10] (rows=133 width=178) + Join Operator [JOIN_10] (rows=131 width=178) Output:["_col0","_col1"],condition map:[{"":"{\"type\":\"Left Semi\",\"left\":0,\"right\":1}"}],keys:{"0":"_col0","1":"_col0"} <-Map 1 [PARTITION-LEVEL SORT] PARTITION-LEVEL SORT [RS_8] @@ -2049,16 +2049,16 @@ Stage-0 <-Reducer 3 [PARTITION-LEVEL 
SORT] PARTITION-LEVEL SORT [RS_27] PartitionCols:_col2 - Filter Operator [FIL_15] (rows=66 width=186) + Filter Operator [FIL_15] (rows=65 width=186) predicate:_col2 is not null - Group By Operator [GBY_14] (rows=66 width=186) + Group By Operator [GBY_14] (rows=65 width=186) Output:["_col0","_col1","_col2"],aggregations:["count(VALUE._col0)"],keys:KEY._col0, KEY._col1 <-Reducer 2 [GROUP] GROUP [RS_13] PartitionCols:_col0, _col1 - Group By Operator [GBY_12] (rows=66 width=186) + Group By Operator [GBY_12] (rows=65 width=186) Output:["_col0","_col1","_col2"],aggregations:["count()"],keys:_col0, _col1 - Join Operator [JOIN_10] (rows=133 width=178) + Join Operator [JOIN_10] (rows=131 width=178) Output:["_col0","_col1"],condition map:[{"":"{\"type\":\"Left Semi\",\"left\":0,\"right\":1}"}],keys:{"0":"_col0","1":"_col0"} <-Map 1 [PARTITION-LEVEL SORT] PARTITION-LEVEL SORT [RS_8] @@ -2658,7 +2658,7 @@ Stage-0 PartitionCols:_col0 Group By Operator [GBY_10] (rows=16 width=94) Output:["_col0","_col1"],aggregations:["count()"],keys:_col0 - Join Operator [JOIN_8] (rows=40 width=86) + Join Operator [JOIN_8] (rows=39 width=86) Output:["_col0"],condition map:[{"":"{\"type\":\"Inner\",\"left\":0,\"right\":1}"}],keys:{"0":"_col0","1":"_col0"} <-Map 1 [PARTITION-LEVEL SORT] PARTITION-LEVEL SORT [RS_6] @@ -2719,7 +2719,7 @@ Stage-0 PartitionCols:_col0 Group By Operator [GBY_10] (rows=16 width=94) Output:["_col0","_col1"],aggregations:["count()"],keys:_col0 - Join Operator [JOIN_8] (rows=40 width=86) + Join Operator [JOIN_8] (rows=39 width=86) Output:["_col0"],condition map:[{"":"{\"type\":\"Inner\",\"left\":0,\"right\":1}"}],keys:{"0":"_col0","1":"_col0"} <-Map 1 [PARTITION-LEVEL SORT] PARTITION-LEVEL SORT [RS_6] @@ -2779,7 +2779,7 @@ Stage-0 PartitionCols:_col0 Group By Operator [GBY_10] (rows=16 width=94) Output:["_col0","_col1"],aggregations:["count()"],keys:_col0 - Map Join Operator [MAPJOIN_22] (rows=40 width=86) + Map Join Operator [MAPJOIN_22] (rows=39 width=86) 
Conds:SEL_5._col0=SEL_5._col0(Inner),Output:["_col0"] <-Select Operator [SEL_5] (rows=500 width=87) Output:["_col0"] @@ -2831,16 +2831,16 @@ Stage-0 GROUP [RS_18] Group By Operator [GBY_17] (rows=1 width=16) Output:["_col0","_col1"],aggregations:["sum(_col0)","sum(_col1)"] - Select Operator [SEL_15] (rows=10 width=94) + Select Operator [SEL_15] (rows=9 width=94) Output:["_col0","_col1"] - Group By Operator [GBY_14] (rows=10 width=94) + Group By Operator [GBY_14] (rows=9 width=94) Output:["_col0","_col1"],aggregations:["count(VALUE._col0)"],keys:KEY._col0 <-Reducer 2 [GROUP] GROUP [RS_13] PartitionCols:_col0 - Group By Operator [GBY_12] (rows=10 width=94) + Group By Operator [GBY_12] (rows=9 width=94) Output:["_col0","_col1"],aggregations:["count()"],keys:_col0 - Join Operator [JOIN_10] (rows=20 width=86) + Join Operator [JOIN_10] (rows=19 width=86) Output:["_col0"],condition map:[{"":"{\"type\":\"Left Semi\",\"left\":0,\"right\":1}"}],keys:{"0":"_col0","1":"_col0"} <-Map 1 [PARTITION-LEVEL SORT] PARTITION-LEVEL SORT [RS_8] @@ -5237,9 +5237,9 @@ Stage-2 Reducer 2 File Output Operator [FS_11] table:{"name:":"default.dest_j1"} - Select Operator [SEL_9] (rows=809 width=95) + Select Operator [SEL_9] (rows=791 width=95) Output:["_col0","_col1"] - Join Operator [JOIN_8] (rows=809 width=178) + Join Operator [JOIN_8] (rows=791 width=178) Output:["_col0","_col2"],condition map:[{"":"{\"type\":\"Inner\",\"left\":0,\"right\":1}"}],keys:{"0":"_col0","1":"_col0"} <-Map 1 [PARTITION-LEVEL SORT] PARTITION-LEVEL SORT [RS_6] @@ -5263,7 +5263,7 @@ Stage-2 Map 4 File Output Operator [FS_11] table:{"name:":"default.dest_j1"} - Select Operator [SEL_9] (rows=809 width=95) + Select Operator [SEL_9] (rows=791 width=95) Output:["_col0","_col1"] Map Join Operator [MAPJOIN_16] Conds:TS_14.reducesinkkey0=TS_14.reducesinkkey0(Inner),Output:["_col0","_col2"] @@ -5518,7 +5518,7 @@ Stage-0 Stage-1 Reducer 2 File Output Operator [FS_10] - Join Operator [JOIN_8] (rows=809 width=356) + Join Operator 
[JOIN_8] (rows=791 width=356) Output:["_col0","_col1","_col2","_col3"],condition map:[{"":"{\"type\":\"Inner\",\"left\":0,\"right\":1}"}],keys:{"0":"_col0","1":"_col0"} <-Map 1 [PARTITION-LEVEL SORT] PARTITION-LEVEL SORT [RS_6] diff --git ql/src/test/results/clientpositive/tez/explainanalyze_1.q.out ql/src/test/results/clientpositive/tez/explainanalyze_1.q.out index bc980b6..95f8990 100644 --- ql/src/test/results/clientpositive/tez/explainanalyze_1.q.out +++ ql/src/test/results/clientpositive/tez/explainanalyze_1.q.out @@ -240,7 +240,7 @@ Stage-0 Stage-1 Reducer 2 File Output Operator [FS_5] - Group By Operator [GBY_3] (rows=309/309 width=95) + Group By Operator [GBY_3] (rows=316/309 width=95) Output:["_col0","_col1"],aggregations:["count(KEY._col0)"],keys:KEY._col0 <-Map 1 [SIMPLE_EDGE] SHUFFLE [RS_2] @@ -287,7 +287,7 @@ Stage-0 Output:["_col0"],aggregations:["count()"] <-Reducer 2 [CUSTOM_SIMPLE_EDGE] PARTITION_ONLY_SHUFFLE [RS_10] - Merge Join Operator [MERGEJOIN_18] (rows=267/0 width=8) + Merge Join Operator [MERGEJOIN_18] (rows=262/0 width=8) Conds:RS_6._col0=RS_7._col0(Inner) <-Map 1 [SIMPLE_EDGE] SHUFFLE [RS_6] @@ -336,7 +336,7 @@ Stage-0 Output:["_col0"],aggregations:["count()"] <-Reducer 2 [CUSTOM_SIMPLE_EDGE] PARTITION_ONLY_SHUFFLE [RS_10] - Merge Join Operator [MERGEJOIN_18] (rows=267/1019 width=8) + Merge Join Operator [MERGEJOIN_18] (rows=262/1019 width=8) Conds:RS_6._col0=RS_7._col0(Inner) <-Map 1 [SIMPLE_EDGE] SHUFFLE [RS_6] @@ -440,9 +440,9 @@ Stage-0 Stage-1 Reducer 2 File Output Operator [FS_10] - Select Operator [SEL_9] (rows=809/1028 width=178) + Select Operator [SEL_9] (rows=791/1028 width=178) Output:["_col0","_col1"] - Merge Join Operator [MERGEJOIN_15] (rows=809/1028 width=178) + Merge Join Operator [MERGEJOIN_15] (rows=791/1028 width=178) Conds:RS_6._col0=RS_7._col0(Inner),Output:["_col0","_col2"] <-Map 1 [SIMPLE_EDGE] SHUFFLE [RS_6] @@ -502,9 +502,9 @@ Stage-0 Stage-1 Reducer 2 File Output Operator [FS_9] - Transform Operator [SCR_8] 
(rows=809/1028 width=178) + Transform Operator [SCR_8] (rows=791/1028 width=178) command:cat - Merge Join Operator [MERGEJOIN_14] (rows=809/1028 width=178) + Merge Join Operator [MERGEJOIN_14] (rows=791/1028 width=178) Conds:RS_3.key=RS_5.key(Inner),Output:["_col0","_col1"] <-Map 1 [SIMPLE_EDGE] SHUFFLE [RS_3] diff --git ql/src/test/results/clientpositive/tez/explainanalyze_4.q.out ql/src/test/results/clientpositive/tez/explainanalyze_4.q.out index 9c678ac..1e02610 100644 --- ql/src/test/results/clientpositive/tez/explainanalyze_4.q.out +++ ql/src/test/results/clientpositive/tez/explainanalyze_4.q.out @@ -44,11 +44,11 @@ Stage-0 Stage-1 Reducer 3 File Output Operator [FS_12] - Select Operator [SEL_11] (rows=2076/10 width=553) + Select Operator [SEL_11] (rows=2048/10 width=552) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23"] <-Reducer 2 [SIMPLE_EDGE] SHUFFLE [RS_10] - Merge Join Operator [MERGEJOIN_17] (rows=2076/10 width=553) + Merge Join Operator [MERGEJOIN_17] (rows=2048/10 width=552) Conds:RS_6._col2=RS_7._col2(Inner),Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23"] <-Map 1 [SIMPLE_EDGE] SHUFFLE [RS_6] @@ -143,7 +143,7 @@ Stage-0 Output:["_col0"],aggregations:["count()"] <-Reducer 2 [CUSTOM_SIMPLE_EDGE] PARTITION_ONLY_SHUFFLE [RS_10] - Merge Join Operator [MERGEJOIN_18] (rows=2076/10 width=8) + Merge Join Operator [MERGEJOIN_18] (rows=2048/10 width=8) Conds:RS_6._col0=RS_7._col0(Inner) <-Map 1 [SIMPLE_EDGE] SHUFFLE [RS_6] @@ -232,16 +232,16 @@ Stage-0 Stage-1 Reducer 4 File Output Operator [FS_15] - Select Operator [SEL_14] (rows=623/5 width=11) + Select Operator [SEL_14] (rows=631/5 width=11) Output:["_col0","_col1"] <-Reducer 3 
[SIMPLE_EDGE] SHUFFLE [RS_13] - Group By Operator [GBY_11] (rows=623/5 width=11) + Group By Operator [GBY_11] (rows=631/5 width=11) Output:["_col0","_col1"],aggregations:["count()"],keys:KEY._col0 <-Reducer 2 [SIMPLE_EDGE] SHUFFLE [RS_10] PartitionCols:_col0 - Merge Join Operator [MERGEJOIN_20] (rows=2076/10 width=3) + Merge Join Operator [MERGEJOIN_20] (rows=2048/10 width=3) Conds:RS_6._col1=RS_7._col0(Inner),Output:["_col0"] <-Map 1 [SIMPLE_EDGE] SHUFFLE [RS_6] diff --git ql/src/test/results/clientpositive/tez/explainanalyze_5.q.out ql/src/test/results/clientpositive/tez/explainanalyze_5.q.out index 3558712..2e36ed2 100644 --- ql/src/test/results/clientpositive/tez/explainanalyze_5.q.out +++ ql/src/test/results/clientpositive/tez/explainanalyze_5.q.out @@ -114,9 +114,9 @@ Stage-3 <-Reducer 4 [CUSTOM_SIMPLE_EDGE] File Output Operator [FS_19] table:{"name:":"default.src_multi2"} - Select Operator [SEL_18] (rows=849/508 width=178) + Select Operator [SEL_18] (rows=830/508 width=178) Output:["_col0","_col1"] - Merge Join Operator [MERGEJOIN_26] (rows=849/508 width=178) + Merge Join Operator [MERGEJOIN_26] (rows=830/508 width=178) Conds:RS_15._col0=RS_16._col0(Inner),Output:["_col0","_col3"] <-Map 7 [SIMPLE_EDGE] SHUFFLE [RS_16] @@ -154,7 +154,7 @@ Stage-3 TableScan [TS_3] (rows=25/25 width=175) Output:["key","value"] PARTITION_ONLY_SHUFFLE [RS_2] - Select Operator [SEL_1] (rows=849/508 width=178) + Select Operator [SEL_1] (rows=830/508 width=178) Output:["key","value"] Please refer to the previous Select Operator [SEL_18] diff --git ql/src/test/results/clientpositive/tez/hybridgrace_hashjoin_1.q.out ql/src/test/results/clientpositive/tez/hybridgrace_hashjoin_1.q.out index a709920..535c124 100644 --- ql/src/test/results/clientpositive/tez/hybridgrace_hashjoin_1.q.out +++ ql/src/test/results/clientpositive/tez/hybridgrace_hashjoin_1.q.out @@ -56,7 +56,7 @@ STAGE PLANS: 1 _col0 (type: int) input vertices: 1 Map 3 - Statistics: Num rows: 25044 Data size: 200352 Basic 
stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 24737 Data size: 197896 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash @@ -172,7 +172,7 @@ STAGE PLANS: 1 _col0 (type: int) input vertices: 1 Map 3 - Statistics: Num rows: 25044 Data size: 200352 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 24737 Data size: 197896 Basic stats: COMPLETE Column stats: COMPLETE HybridGraceHashJoin: true Group By Operator aggregations: count() @@ -287,7 +287,7 @@ STAGE PLANS: 1 _col0 (type: int) input vertices: 1 Map 3 - Statistics: Num rows: 18694 Data size: 149552 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 18464 Data size: 147712 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash @@ -399,7 +399,7 @@ STAGE PLANS: 1 _col0 (type: int) input vertices: 1 Map 3 - Statistics: Num rows: 18694 Data size: 149552 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 18464 Data size: 147712 Basic stats: COMPLETE Column stats: COMPLETE HybridGraceHashJoin: true Group By Operator aggregations: count() @@ -509,7 +509,7 @@ STAGE PLANS: 1 _col0 (type: int) input vertices: 1 Map 3 - Statistics: Num rows: 25044 Data size: 200352 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 24737 Data size: 197896 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash @@ -615,7 +615,7 @@ STAGE PLANS: 1 _col0 (type: int) input vertices: 1 Map 3 - Statistics: Num rows: 25044 Data size: 200352 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 24737 Data size: 197896 Basic stats: COMPLETE Column stats: COMPLETE HybridGraceHashJoin: true Group By Operator aggregations: count() diff --git ql/src/test/results/clientpositive/tez/hybridgrace_hashjoin_2.q.out ql/src/test/results/clientpositive/tez/hybridgrace_hashjoin_2.q.out index 0b71be9..2a12203 100644 --- 
ql/src/test/results/clientpositive/tez/hybridgrace_hashjoin_2.q.out +++ ql/src/test/results/clientpositive/tez/hybridgrace_hashjoin_2.q.out @@ -71,7 +71,7 @@ STAGE PLANS: input vertices: 0 Map 1 2 Map 4 - Statistics: Num rows: 261 Data size: 2088 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 250 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash @@ -195,7 +195,7 @@ STAGE PLANS: input vertices: 0 Map 1 2 Map 4 - Statistics: Num rows: 261 Data size: 2088 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 250 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE HybridGraceHashJoin: true Group By Operator aggregations: count() @@ -334,7 +334,7 @@ STAGE PLANS: 0 Map 1 2 Map 4 3 Map 5 - Statistics: Num rows: 1694 Data size: 13552 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1584 Data size: 12672 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash @@ -478,7 +478,7 @@ STAGE PLANS: 0 Map 1 2 Map 4 3 Map 5 - Statistics: Num rows: 1694 Data size: 13552 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1584 Data size: 12672 Basic stats: COMPLETE Column stats: COMPLETE HybridGraceHashJoin: true Group By Operator aggregations: count() @@ -651,7 +651,7 @@ STAGE PLANS: input vertices: 0 Map 1 2 Map 6 - Statistics: Num rows: 261 Data size: 2088 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 250 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash @@ -706,7 +706,7 @@ STAGE PLANS: input vertices: 0 Map 7 2 Map 10 - Statistics: Num rows: 261 Data size: 2088 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 265 Data size: 2120 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash @@ -886,7 +886,7 @@ STAGE PLANS: input vertices: 0 Map 1 2 Map 6 - 
Statistics: Num rows: 261 Data size: 2088 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 250 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE HybridGraceHashJoin: true Group By Operator aggregations: count() @@ -942,7 +942,7 @@ STAGE PLANS: input vertices: 0 Map 7 2 Map 10 - Statistics: Num rows: 261 Data size: 2088 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 265 Data size: 2120 Basic stats: COMPLETE Column stats: COMPLETE HybridGraceHashJoin: true Group By Operator aggregations: count() @@ -1120,7 +1120,7 @@ STAGE PLANS: input vertices: 0 Map 1 2 Map 4 - Statistics: Num rows: 20 Data size: 1780 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 19 Data size: 1691 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -1132,7 +1132,7 @@ STAGE PLANS: input vertices: 1 Map 5 2 Map 6 - Statistics: Num rows: 204 Data size: 1632 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 196 Data size: 1568 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() mode: hash @@ -1304,7 +1304,7 @@ STAGE PLANS: input vertices: 0 Map 1 2 Map 4 - Statistics: Num rows: 20 Data size: 1780 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 19 Data size: 1691 Basic stats: COMPLETE Column stats: COMPLETE HybridGraceHashJoin: true Map Join Operator condition map: @@ -1317,7 +1317,7 @@ STAGE PLANS: input vertices: 1 Map 5 2 Map 6 - Statistics: Num rows: 204 Data size: 1632 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 196 Data size: 1568 Basic stats: COMPLETE Column stats: COMPLETE HybridGraceHashJoin: true Group By Operator aggregations: count() diff --git ql/src/test/results/clientpositive/tez/vectorization_limit.q.out ql/src/test/results/clientpositive/tez/vectorization_limit.q.out index 99544bb..3cb57a3 100644 --- ql/src/test/results/clientpositive/tez/vectorization_limit.q.out +++ 
ql/src/test/results/clientpositive/tez/vectorization_limit.q.out @@ -790,7 +790,7 @@ STAGE PLANS: keys: cdouble (type: double) mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 4159 Data size: 58120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4127 Data size: 57672 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: double) sort order: + @@ -801,7 +801,7 @@ STAGE PLANS: native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumnNums: [1] - Statistics: Num rows: 4159 Data size: 58120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4127 Data size: 57672 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Execution mode: vectorized Map Vectorization: @@ -848,7 +848,7 @@ STAGE PLANS: keys: KEY._col0 (type: double) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 4159 Data size: 58120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4127 Data size: 57672 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: bigint), _col0 (type: double) sort order: ++ @@ -858,7 +858,7 @@ STAGE PLANS: native: true nativeConditionsMet: hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine tez IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true valueColumnNums: [] - Statistics: Num rows: 4159 Data size: 58120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4127 Data size: 57672 Basic stats: COMPLETE Column stats: COMPLETE TopN Hash Memory Usage: 0.3 Reducer 3 Execution mode: vectorized @@ -883,7 +883,7 @@ 
STAGE PLANS: className: VectorSelectOperator native: true projectedOutputColumnNums: [1, 0] - Statistics: Num rows: 4159 Data size: 58120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4127 Data size: 57672 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 20 Limit Vectorization: diff --git standalone-metastore/src/main/java/org/apache/hadoop/hive/common/ndv/NumDistinctValueEstimatorFactory.java standalone-metastore/src/main/java/org/apache/hadoop/hive/common/ndv/NumDistinctValueEstimatorFactory.java index 4e4dfb7..b630fa3 100644 --- standalone-metastore/src/main/java/org/apache/hadoop/hive/common/ndv/NumDistinctValueEstimatorFactory.java +++ standalone-metastore/src/main/java/org/apache/hadoop/hive/common/ndv/NumDistinctValueEstimatorFactory.java @@ -25,6 +25,7 @@ import org.apache.hadoop.hive.common.ndv.fm.FMSketch; import org.apache.hadoop.hive.common.ndv.fm.FMSketchUtils; import org.apache.hadoop.hive.common.ndv.hll.HyperLogLog; +import org.apache.hadoop.hive.common.ndv.hll.HyperLogLogUtils; public class NumDistinctValueEstimatorFactory { @@ -44,7 +45,7 @@ public static NumDistinctValueEstimator getNumDistinctValueEstimator(byte[] buf) if (isFMSketch(buf)) { return FMSketchUtils.deserializeFM(buf); } else { - return HyperLogLog.builder().build().deserialize(buf); + return HyperLogLogUtils.deserializeHLL(buf); } } catch (IOException e) { throw new RuntimeException(e); @@ -56,7 +57,7 @@ public static NumDistinctValueEstimator getEmptyNumDistinctValueEstimator( if (n instanceof FMSketch) { return new FMSketch(((FMSketch) n).getNumBitVectors()); } else { - return HyperLogLog.builder().build(); + return HyperLogLog.builder().setSizeOptimized().build(); } } @@ -65,7 +66,7 @@ public static NumDistinctValueEstimator getEmptyNumDistinctValueEstimator(String if ("fm".equals(func.toLowerCase())) { return new FMSketch(numBitVectors); } else if ("hll".equals(func.toLowerCase())) { - return HyperLogLog.builder().build(); + return 
HyperLogLog.builder().setSizeOptimized().build(); } else { throw new RuntimeException("Can not recognize " + func); } diff --git standalone-metastore/src/main/java/org/apache/hadoop/hive/common/ndv/hll/HLLDenseRegister.java standalone-metastore/src/main/java/org/apache/hadoop/hive/common/ndv/hll/HLLDenseRegister.java index 12897fc..422bfbe 100644 --- standalone-metastore/src/main/java/org/apache/hadoop/hive/common/ndv/hll/HLLDenseRegister.java +++ standalone-metastore/src/main/java/org/apache/hadoop/hive/common/ndv/hll/HLLDenseRegister.java @@ -62,6 +62,31 @@ public boolean add(long hashcode) { return set(registerIdx, (byte) lr); } + // this is a lossy invert of the function above, which produces a hashcode + // which collides with the current winner of the register (we lose all higher + // bits, but we get all bits useful for lesser p-bit options) + + // +-------------|-------------+ + // |xxxx100000000|1000000000000| (lr=9 + idx=1024) + // +-------------|-------------+ + // \ + // +---------------|-----------+ + // |xxxx10000000010|00000000000| (lr=2 + idx=0) + // +---------------|-----------+ + + // This shows the relevant bits of the original hash value + // and how the conversion is moving bits from the index value + // over to the leading zero computation + + public void extractLowBitsTo(HLLRegister dest) { + for (int idx = 0; idx < register.length; idx++) { + byte lr = register[idx]; // this can be a max of 65, never > 127 + if (lr != 0) { + dest.add((1L << (p + lr - 1)) | idx); // 1L: the shift distance can exceed 31, where an int shift wraps + } + } + } + public boolean set(int idx, byte value) { boolean updated = false; if (idx < register.length && value > register[idx]) { diff --git standalone-metastore/src/main/java/org/apache/hadoop/hive/common/ndv/hll/HLLSparseRegister.java standalone-metastore/src/main/java/org/apache/hadoop/hive/common/ndv/hll/HLLSparseRegister.java index 82085dd..deaca9d 100644 --- standalone-metastore/src/main/java/org/apache/hadoop/hive/common/ndv/hll/HLLSparseRegister.java +++ 
standalone-metastore/src/main/java/org/apache/hadoop/hive/common/ndv/hll/HLLSparseRegister.java @@ -19,6 +19,7 @@ package org.apache.hadoop.hive.common.ndv.hll; import java.util.Map; +import java.util.Map.Entry; import java.util.TreeMap; public class HLLSparseRegister implements HLLRegister { @@ -199,6 +200,18 @@ public boolean set(int key, byte value) { return sparseMap; } + // this is effectively the same as the dense register impl. + public void extractLowBitsTo(HLLRegister dest) { + for (Entry<Integer, Byte> entry : sparseMap.entrySet()) { + int idx = entry.getKey(); + byte lr = entry.getValue(); // this can be a max of 65, never > 127 + if (lr != 0) { + // should be a no-op for sparse + dest.add((1L << (p + lr - 1)) | idx); // 1L: the shift distance can exceed 31, where an int shift wraps + } + } + } + public int getP() { return p; } diff --git standalone-metastore/src/main/java/org/apache/hadoop/hive/common/ndv/hll/HyperLogLog.java standalone-metastore/src/main/java/org/apache/hadoop/hive/common/ndv/hll/HyperLogLog.java index 8bdb47b..b5455a0 100644 --- standalone-metastore/src/main/java/org/apache/hadoop/hive/common/ndv/hll/HyperLogLog.java +++ standalone-metastore/src/main/java/org/apache/hadoop/hive/common/ndv/hll/HyperLogLog.java @@ -163,6 +163,13 @@ public HyperLogLogBuilder setNumRegisterIndexBits(int b) { return this; } + public HyperLogLogBuilder setSizeOptimized() { + // allowing this to be increased via config breaks the merge impl + // p=10 = ~1kb per vector or smaller + this.numRegisterIndexBits = 10; + return this; + } + public HyperLogLogBuilder setEncoding(EncodingType enc) { this.encoding = enc; return this; @@ -440,12 +447,23 @@ public void setHLLDenseRegister(byte[] reg) { * @throws IllegalArgumentException */ public void merge(HyperLogLog hll) { - if (p != hll.p || chosenHashBits != hll.chosenHashBits) { + if (chosenHashBits != hll.chosenHashBits) { throw new IllegalArgumentException( "HyperLogLog cannot be merged as either p or hashbits are different. 
Current: " + toString() + " Provided: " + hll.toString()); } + if (p > hll.p) { + throw new IllegalArgumentException( + "HyperLogLog cannot merge a smaller p into a larger one : " + + toString() + " Provided: " + hll.toString()); + } + + if (p != hll.p) { + // invariant: p < hll.p (p > hll.p was rejected above), so squash hll down to p + hll = hll.squash(p); + } + EncodingType otherEncoding = hll.getEncoding(); if (encoding.equals(EncodingType.SPARSE) && otherEncoding.equals(EncodingType.SPARSE)) { @@ -473,6 +491,36 @@ public void merge(HyperLogLog hll) { } /** + * Reduces the accuracy of the HLL provided to a smaller size + * @param p0 + * - new p size for the new HyperLogLog (smaller or no change) + * @return reduced (or same) HyperLogLog instance + */ + public HyperLogLog squash(final int p0) { + if (p0 > p) { + throw new IllegalArgumentException( + "HyperLogLog cannot be squashed to be bigger. Current: " + + toString() + " Provided: " + p0); + } + + if (p0 == p) { + return this; + } + + final HyperLogLog hll = new HyperLogLogBuilder() + .setNumRegisterIndexBits(p0).setEncoding(EncodingType.DENSE) + .enableNoBias(noBias).build(); + final HLLDenseRegister result = hll.denseRegister; + + if (encoding == EncodingType.SPARSE) { + sparseRegister.extractLowBitsTo(result); + } else if (encoding == EncodingType.DENSE) { + denseRegister.extractLowBitsTo(result); + } + return hll; + } + + /** * Converts sparse to dense hll register * @param sparseRegister * - sparse register to be converted @@ -585,14 +633,7 @@ public void reset() { @Override public NumDistinctValueEstimator deserialize(byte[] buf) { - InputStream is = new ByteArrayInputStream(buf); - try { - HyperLogLog result = HyperLogLogUtils.deserializeHLL(is); - is.close(); - return result; - } catch (IOException e) { - throw new RuntimeException(e); - } + return HyperLogLogUtils.deserializeHLL(buf); } @Override diff --git standalone-metastore/src/main/java/org/apache/hadoop/hive/common/ndv/hll/HyperLogLogUtils.java 
standalone-metastore/src/main/java/org/apache/hadoop/hive/common/ndv/hll/HyperLogLogUtils.java index 4e6510b..6fd1c02 100644 --- standalone-metastore/src/main/java/org/apache/hadoop/hive/common/ndv/hll/HyperLogLogUtils.java +++ standalone-metastore/src/main/java/org/apache/hadoop/hive/common/ndv/hll/HyperLogLogUtils.java @@ -18,6 +18,7 @@ package org.apache.hadoop.hive.common.ndv.hll; +import java.io.ByteArrayInputStream; import java.io.EOFException; import java.io.IOException; import java.io.InputStream; @@ -126,7 +127,7 @@ public static void serializeHLL(OutputStream out, HyperLogLog hll) throws IOExce } /** - * Refer serializeHLL() for format of serialization. This funtions + * Refer serializeHLL() for format of serialization. This function * deserializes the serialized hyperloglogs * @param in * - input stream @@ -198,6 +199,22 @@ public static HyperLogLog deserializeHLL(InputStream in) throws IOException { return result; } + /** + * This function deserializes the serialized hyperloglogs from a byte array + * @param buf - to deserialize + * @return HyperLogLog + */ + public static HyperLogLog deserializeHLL(final byte[] buf) { + // TODO: use faster non-sync inputstream + // try-with-resources closes the stream even when deserialization fails + try (InputStream is = new ByteArrayInputStream(buf)) { + return deserializeHLL(is); + } catch (IOException e) { + // surface I/O failures unchecked, with the cause preserved + throw new RuntimeException(e); + } + } + private static void bitpackHLLRegister(OutputStream out, byte[] register, int bitWidth) throws IOException { int bitsLeft = 8; diff --git standalone-metastore/src/test/java/org/apache/hadoop/hive/common/ndv/hll/TestHyperLogLog.java standalone-metastore/src/test/java/org/apache/hadoop/hive/common/ndv/hll/TestHyperLogLog.java index b0eaad8..56ed407 100644 --- standalone-metastore/src/test/java/org/apache/hadoop/hive/common/ndv/hll/TestHyperLogLog.java +++ standalone-metastore/src/test/java/org/apache/hadoop/hive/common/ndv/hll/TestHyperLogLog.java @@ -34,14 +34,18 @@ public void testHLLDenseMerge() { 
HyperLogLog hll3 = HyperLogLog.builder().setEncoding(EncodingType.DENSE).build(); HyperLogLog hll4 = HyperLogLog.builder().setNumRegisterIndexBits(16) .setEncoding(EncodingType.DENSE).build(); + HyperLogLog hll5 = HyperLogLog.builder().setNumRegisterIndexBits(12) + .setEncoding(EncodingType.DENSE).build(); int size = 1000; for (int i = 0; i < size; i++) { hll.addLong(i); hll2.addLong(size + i); hll3.addLong(2 * size + i); + hll4.addLong(3 * size + i); } double threshold = size > 40000 ? longRangeTolerance : shortRangeTolerance; double delta = threshold * size / 100; + double delta4 = threshold * (4*size) / 100; assertEquals((double) size, (double) hll.count(), delta); assertEquals((double) size, (double) hll2.count(), delta); @@ -60,8 +64,13 @@ public void testHLLDenseMerge() { assertEquals((double) 3 * size, (double) hll.count(), delta); assertEquals(EncodingType.DENSE, hll.getEncoding()); - // invalid merge -- register set size doesn't match + // valid merge -- register set size gets bigger (also 4k items hll.merge(hll4); + assertEquals((double) 4 * size, (double) hll.count(), delta4); + assertEquals(EncodingType.DENSE, hll.getEncoding()); + + // invalid merge -- smaller register merge to bigger + hll.merge(hll5); } @Test(expected = IllegalArgumentException.class) @@ -71,14 +80,18 @@ public void testHLLSparseMerge() { HyperLogLog hll3 = HyperLogLog.builder().setEncoding(EncodingType.SPARSE).build(); HyperLogLog hll4 = HyperLogLog.builder().setNumRegisterIndexBits(16) .setEncoding(EncodingType.SPARSE).build(); + HyperLogLog hll5 = HyperLogLog.builder().setNumRegisterIndexBits(12) + .setEncoding(EncodingType.SPARSE).build(); int size = 500; for (int i = 0; i < size; i++) { hll.addLong(i); hll2.addLong(size + i); hll3.addLong(2 * size + i); + hll4.addLong(3 * size + i); } double threshold = size > 40000 ? 
longRangeTolerance : shortRangeTolerance; double delta = threshold * size / 100; + double delta4 = threshold * (4*size) / 100; assertEquals((double) size, (double) hll.count(), delta); assertEquals((double) size, (double) hll2.count(), delta); @@ -97,8 +110,13 @@ public void testHLLSparseMerge() { assertEquals((double) 3 * size, (double) hll.count(), delta); assertEquals(EncodingType.SPARSE, hll.getEncoding()); - // invalid merge -- register set size doesn't match + // valid merge -- register set size gets bigger & dense automatically hll.merge(hll4); + assertEquals((double) 4 * size, (double) hll.count(), delta4); + assertEquals(EncodingType.DENSE, hll.getEncoding()); + + // invalid merge -- smaller register merge to bigger + hll.merge(hll5); } @Test(expected = IllegalArgumentException.class) @@ -108,11 +126,14 @@ public void testHLLSparseDenseMerge() { HyperLogLog hll3 = HyperLogLog.builder().setEncoding(EncodingType.DENSE).build(); HyperLogLog hll4 = HyperLogLog.builder().setNumRegisterIndexBits(16) .setEncoding(EncodingType.DENSE).build(); + HyperLogLog hll5 = HyperLogLog.builder().setNumRegisterIndexBits(12) + .setEncoding(EncodingType.DENSE).build(); int size = 1000; for (int i = 0; i < size; i++) { hll.addLong(i); hll2.addLong(size + i); hll3.addLong(2 * size + i); + hll4.addLong(3 * size + i); } double threshold = size > 40000 ? 
longRangeTolerance : shortRangeTolerance; double delta = threshold * size / 100; @@ -134,8 +155,13 @@ public void testHLLSparseDenseMerge() { assertEquals((double) 3 * size, (double) hll.count(), delta); assertEquals(EncodingType.DENSE, hll.getEncoding()); - // invalid merge -- register set size doesn't match - hll.merge(hll4); + // merge should convert hll2 to DENSE + hll2.merge(hll4); + assertEquals((double) 2 * size, (double) hll2.count(), delta); + assertEquals(EncodingType.DENSE, hll2.getEncoding()); + + // invalid merge -- smaller register merge to bigger + hll.merge(hll5); } @Test(expected = IllegalArgumentException.class) @@ -145,11 +171,14 @@ public void testHLLDenseSparseMerge() { HyperLogLog hll3 = HyperLogLog.builder().setEncoding(EncodingType.SPARSE).build(); HyperLogLog hll4 = HyperLogLog.builder().setNumRegisterIndexBits(16) .setEncoding(EncodingType.SPARSE).build(); + HyperLogLog hll5 = HyperLogLog.builder().setNumRegisterIndexBits(12) + .setEncoding(EncodingType.SPARSE).build(); int size = 1000; for (int i = 0; i < size; i++) { hll.addLong(i); hll2.addLong(size + i); hll3.addLong(2 * size + i); + hll4.addLong(3 * size + i); } double threshold = size > 40000 ? 
longRangeTolerance : shortRangeTolerance; double delta = threshold * size / 100; @@ -171,8 +200,14 @@ public void testHLLDenseSparseMerge() { assertEquals((double) 3 * size, (double) hll.count(), delta); assertEquals(EncodingType.DENSE, hll.getEncoding()); - // invalid merge -- register set size doesn't match - hll.merge(hll4); + // merge should convert hll3 to DENSE + hll3.merge(hll4); + assertEquals((double) 2 * size, (double) hll3.count(), delta); + assertEquals(EncodingType.DENSE, hll3.getEncoding()); + + // invalid merge -- smaller register merge to bigger + hll.merge(hll5); + } @Test(expected = IllegalArgumentException.class) @@ -182,11 +217,14 @@ public void testHLLSparseOverflowMerge() { HyperLogLog hll3 = HyperLogLog.builder().setEncoding(EncodingType.SPARSE).build(); HyperLogLog hll4 = HyperLogLog.builder().setNumRegisterIndexBits(16) .setEncoding(EncodingType.SPARSE).build(); + HyperLogLog hll5 = HyperLogLog.builder().setNumRegisterIndexBits(12) + .setEncoding(EncodingType.SPARSE).build(); int size = 1000; for (int i = 0; i < size; i++) { hll.addLong(i); hll2.addLong(size + i); hll3.addLong(2 * size + i); + hll4.addLong(3 * size + i); } double threshold = size > 40000 ? 
longRangeTolerance : shortRangeTolerance; double delta = threshold * size / 100; @@ -208,8 +246,13 @@ public void testHLLSparseOverflowMerge() { assertEquals((double) 3 * size, (double) hll.count(), delta); assertEquals(EncodingType.DENSE, hll.getEncoding()); - // invalid merge -- register set size doesn't match - hll.merge(hll4); + // merge should convert hll2 to DENSE + hll2.merge(hll4); + assertEquals((double) 2 * size, (double) hll2.count(), delta); + assertEquals(EncodingType.DENSE, hll2.getEncoding()); + + // invalid merge -- smaller register merge to bigger + hll.merge(hll5); } @Test @@ -224,4 +267,69 @@ public void testHLLSparseMoreRegisterBits() { double delta = threshold * size / 100; assertEquals((double) size, (double) hll.count(), delta); } + + @Test + public void testHLLSquash() { + + int[] sizes = new int[] { 500, 1000, 2300, 4096}; + int minBits = 9; + for (final int size : sizes) { + + HyperLogLog hlls[] = new HyperLogLog[16]; + for (int k = minBits; k < hlls.length; k++) { + final HyperLogLog hll = HyperLogLog.builder() + .setEncoding(EncodingType.DENSE).setNumRegisterIndexBits(k).build(); + for (int i = 0; i < size; i++) { + hll.addLong(i); + } + hlls[k] = hll; + } + + for (int k = minBits; k < hlls.length; k++) { + for (int j = k + 1; j < hlls.length; j++) { + final HyperLogLog large = hlls[j]; + final HyperLogLog small = hlls[k]; + final HyperLogLog mush = large + .squash(small.getNumRegisterIndexBits()); + assertEquals(small.count(), mush.count(), 0); + double delta = Math.ceil(small.getStandardError()*size); + assertEquals((double) size, (double) mush.count(), delta); + } + } + } + } + + @Test + public void testHLLDenseDenseSquash() { + HyperLogLog p14HLL = HyperLogLog.builder().setEncoding(EncodingType.DENSE).setNumRegisterIndexBits(14).build(); + HyperLogLog p10HLL = HyperLogLog.builder().setEncoding(EncodingType.DENSE).setNumRegisterIndexBits(10).build(); + int size = 1_000_000; + for (int i = 0; i < size; i++) { + p14HLL.addLong(i); + } + 
+ for (int i = 0; i < 10_000; i++) { + p10HLL.addLong(i); + } + + p14HLL.squash(p10HLL.getNumRegisterIndexBits()); + assertEquals((double) size, p14HLL.count(), longRangeTolerance * size / 100.0); + } + + @Test + public void testHLLSparseDenseSquash() { + HyperLogLog p14HLL = HyperLogLog.builder().setEncoding(EncodingType.SPARSE).setNumRegisterIndexBits(14).build(); + HyperLogLog p10HLL = HyperLogLog.builder().setEncoding(EncodingType.DENSE).setNumRegisterIndexBits(10).build(); + int size = 2000; + for (int i = 0; i < size; i++) { + p14HLL.addLong(i); + } + + for (int i = 0; i < 10_000; i++) { + p10HLL.addLong(i); + } + + p14HLL.squash(p10HLL.getNumRegisterIndexBits()); + assertEquals((double) size, p14HLL.count(), longRangeTolerance * size / 100.0); + } } diff --git standalone-metastore/src/test/java/org/apache/hadoop/hive/common/ndv/hll/TestHyperLogLogMerge.java standalone-metastore/src/test/java/org/apache/hadoop/hive/common/ndv/hll/TestHyperLogLogMerge.java new file mode 100644 index 0000000..2007c6f --- /dev/null +++ standalone-metastore/src/test/java/org/apache/hadoop/hive/common/ndv/hll/TestHyperLogLogMerge.java @@ -0,0 +1,147 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ +package org.apache.hadoop.hive.common.ndv.hll; + +import static org.junit.Assert.assertEquals; + +import java.util.Arrays; +import java.util.Collection; + +import org.junit.Test; +import org.junit.runner.RunWith; +import org.junit.runners.Parameterized; + +@RunWith(Parameterized.class) +public class TestHyperLogLogMerge { + // 5% tolerance for estimated count + private float longRangeTolerance = 5.0f; + private float shortRangeTolerance = 2.0f; + + int size; + + @Parameterized.Parameters + public static Collection data() { + return Arrays.asList(new Object[][] { + { 1_000 }, { 10_000 }, { 100_000 }, { 1_000_000 }, { 10_000_000 } + // { 100_000_000 }, { 1_000_000_000 } 1B passed but is super slow + }); + } + + public TestHyperLogLogMerge(int size) { + this.size = size; + } + + @Test + public void testHLLMergeDisjoint() { + HyperLogLog hll1 = HyperLogLog.builder().setNumRegisterIndexBits(16).build(); + for (int i = 0; i < size; i++) { + hll1.addLong(i); + } + HyperLogLog hll2 = HyperLogLog.builder().setNumRegisterIndexBits(16).build(); + for (int i = size; i < 2 * size; i++) { + hll2.addLong(i); + } + hll1.merge(hll2); + double threshold = size > 40000 ? longRangeTolerance : shortRangeTolerance; + double delta = threshold * size / 100; + long expected = 2 * size; + long actual = hll1.count(); + assertEquals(expected, actual, delta); + } + + @Test + public void testHLLMerge25PercentOverlap() { + HyperLogLog hll1 = HyperLogLog.builder().setNumRegisterIndexBits(16).build(); + for (int i = 0; i < size; i++) { + hll1.addLong(i); + } + HyperLogLog hll2 = HyperLogLog.builder().setNumRegisterIndexBits(16).build(); + int start = (int) (0.75 * size); + int end = (int) (size * 1.75); + for (int i = start; i < end; i++) { + hll2.addLong(i); + } + hll1.merge(hll2); + double threshold = size > 40000 ? 
longRangeTolerance : shortRangeTolerance; + double delta = threshold * size / 100; + long expected = (long) (1.75 * size); + long actual = hll1.count(); + assertEquals(expected, actual, delta); + } + + @Test + public void testHLLMerge50PercentOverlap() { + HyperLogLog hll1 = HyperLogLog.builder().setNumRegisterIndexBits(16).build(); + for (int i = 0; i < size; i++) { + hll1.addLong(i); + } + HyperLogLog hll2 = HyperLogLog.builder().setNumRegisterIndexBits(16).build(); + int start = (int) (0.5 * size); + int end = (int) (size * 1.5); + for (int i = start; i < end; i++) { + hll2.addLong(i); + } + hll1.merge(hll2); + double threshold = size > 40000 ? longRangeTolerance : shortRangeTolerance; + double delta = threshold * size / 100; + long expected = (long) (1.5 * size); + long actual = hll1.count(); + assertEquals(expected, actual, delta); + } + + + @Test + public void testHLLMerge75PercentOverlap() { + HyperLogLog hll1 = HyperLogLog.builder().setNumRegisterIndexBits(16).build(); + for (int i = 0; i < size; i++) { + hll1.addLong(i); + } + HyperLogLog hll2 = HyperLogLog.builder().setNumRegisterIndexBits(16).build(); + int start = (int) (0.25 * size); + int end = (int) (size * 1.25); + for (int i = start; i < end; i++) { + hll2.addLong(i); + } + hll1.merge(hll2); + double threshold = size > 40000 ? longRangeTolerance : shortRangeTolerance; + double delta = threshold * size / 100; + long expected = (long) (1.25 * size); + long actual = hll1.count(); + assertEquals(expected, actual, delta); + } + + + @Test + public void testHLLMerge100PercentOverlap() { + HyperLogLog hll1 = HyperLogLog.builder().setNumRegisterIndexBits(16).build(); + for (int i = 0; i < size; i++) { + hll1.addLong(i); + } + HyperLogLog hll2 = HyperLogLog.builder().setNumRegisterIndexBits(16).build(); + for (int i = 0; i < size; i++) { + hll2.addLong(i); + } + hll1.merge(hll2); + double threshold = size > 40000 ? 
longRangeTolerance : shortRangeTolerance; + double delta = threshold * size / 100; + long expected = size; + long actual = hll1.count(); + assertEquals(expected, actual, delta); + } + +}