-- blob: 7c38238cbe852c28b0832020ee3c03e884aba012 (repository-viewer header residue; not part of the script)
-- Strict bucketing checks are switched off before data files are loaded
-- directly into the bucketed tables created below.
set hive.strict.checks.bucketing=false;

-- Unpartitioned join input: clustered on key into 2 buckets, fed from two local files.
CREATE TABLE srcbucket_mapjoin_n10 (
  key   INT,
  value STRING
)
CLUSTERED BY (key) INTO 2 BUCKETS
STORED AS TEXTFILE;
LOAD DATA LOCAL INPATH '../../data/files/bmj/000000_0' INTO TABLE srcbucket_mapjoin_n10;
LOAD DATA LOCAL INPATH '../../data/files/bmj/000001_0' INTO TABLE srcbucket_mapjoin_n10;

-- Partitioned join input: clustered on key into 3 buckets; three local files
-- are loaded into the single partition ds='2008-04-08'.
CREATE TABLE srcbucket_mapjoin_part_n10 (
  key   INT,
  value STRING
)
PARTITIONED BY (ds STRING)
CLUSTERED BY (key) INTO 3 BUCKETS
STORED AS TEXTFILE;
LOAD DATA LOCAL INPATH '../../data/files/bmj/000000_0' INTO TABLE srcbucket_mapjoin_part_n10 PARTITION (ds='2008-04-08');
LOAD DATA LOCAL INPATH '../../data/files/bmj/000001_0' INTO TABLE srcbucket_mapjoin_part_n10 PARTITION (ds='2008-04-08');
LOAD DATA LOCAL INPATH '../../data/files/bmj/000002_0' INTO TABLE srcbucket_mapjoin_part_n10 PARTITION (ds='2008-04-08');

-- Plan with CBO disabled and the bucket map join optimization enabled.
set hive.cbo.enable=false;
set hive.optimize.bucketmapjoin = true;

-- Destination table for the joined rows; all three columns are strings.
CREATE TABLE bucketmapjoin_tmp_result_n4 (
  key    STRING,
  value1 STRING,
  value2 STRING
);

-- Only the plan is requested (EXPLAIN EXTENDED); the insert itself is not run here.
-- The hint names alias b (the 3-bucket partitioned table) as the map-join side.
-- NOTE(review): the two inputs have 2 and 3 buckets respectively; presumably this
-- is meant as a case where bucket map join should NOT be chosen -- confirm
-- against the expected plan output.
EXPLAIN EXTENDED
INSERT OVERWRITE TABLE bucketmapjoin_tmp_result_n4
SELECT /*+mapjoin(b)*/
  a.key,
  a.value,
  b.value
FROM srcbucket_mapjoin_n10 a
JOIN srcbucket_mapjoin_part_n10 b
  ON a.key = b.key
WHERE b.ds = "2008-04-08";