Description
-- Reproduction script (HiveQL).

-- Two bucketed, sorted tables with 2 buckets each:
-- smb_input1 is clustered and sorted on key, smb_input2 on value.
CREATE TABLE smb_input1(key int, value int)
    CLUSTERED BY (key) SORTED BY (key) INTO 2 BUCKETS;
CREATE TABLE smb_input2(key int, value int)
    CLUSTERED BY (value) SORTED BY (value) INTO 2 BUCKETS;

-- Load both local data files into each of the two tables.
LOAD DATA LOCAL INPATH '../../data/files/in1.txt' INTO TABLE smb_input1;
LOAD DATA LOCAL INPATH '../../data/files/in2.txt' INTO TABLE smb_input1;
LOAD DATA LOCAL INPATH '../../data/files/in1.txt' INTO TABLE smb_input2;
LOAD DATA LOCAL INPATH '../../data/files/in2.txt' INTO TABLE smb_input2;

-- Session settings for the failing run: bucket map join and its sorted-merge
-- variant are switched on, the bucketized input format is selected, and
-- hive.outerjoin.supports.filters is switched off.
SET hive.optimize.bucketmapjoin = true;
SET hive.optimize.bucketmapjoin.sortedmerge = true;
SET hive.input.format = org.apache.hadoop.hive.ql.io.BucketizedHiveInputFormat;
SET hive.outerjoin.supports.filters = false;

-- Failing query: a self LEFT OUTER JOIN whose ON clause contains only
-- single-side filter predicates (no condition compares a column of a with a
-- column of b). The joined rows are folded into a single checksum.
-- NOTE(review): myinput1 is not created by the statements above; presumably it
-- is defined in setup that is not part of this excerpt -- confirm.
SELECT sum(hash(a.key,a.value,b.key,b.value))
FROM myinput1 a
LEFT OUTER JOIN myinput1 b
    ON a.key > 40
    AND a.value > 50
    AND a.key = a.value
    AND b.key > 40
    AND b.value > 50
    AND b.key = b.value;
Expected result: 3078400. Actual result: 4937935.
Attachments
Attachments
Issue Links
- relates to: HIVE-1534 "Join filters do not work correctly with outer joins" (Closed)