blob: 1039efcf268f1e38546a8414055c9f586b7c318e [file] [log] [blame]
--! qt:dataset:srcpart
set hive.mapred.mode=nonstrict;
set hive.exec.dynamic.partition=true;
set hive.input.format=org.apache.hadoop.hive.ql.io.HiveInputFormat;
set hive.merge.mapfiles=false;
set hive.merge.mapredfiles=false;
set mapred.input.dir.recursive=true;
-- list bucketing DML: multiple skewed columns. 2 stages
-- SORT_QUERY_RESULTS
-- create a skewed table
create table list_bucketing_dynamic_part_n1 (key String, value String)
partitioned by (ds String, hr String)
skewed by (key, value) on (('484','val_484'),('51','val_14'),('103','val_103'))
stored as DIRECTORIES;
-- list bucketing DML
explain extended
insert overwrite table list_bucketing_dynamic_part_n1 partition (ds='2008-04-08', hr) select key, value, hr from srcpart where ds='2008-04-08';
insert overwrite table list_bucketing_dynamic_part_n1 partition (ds='2008-04-08', hr) select key, value, hr from srcpart where ds='2008-04-08';
-- check DML result
desc formatted list_bucketing_dynamic_part_n1 partition (ds='2008-04-08', hr='11');
desc formatted list_bucketing_dynamic_part_n1 partition (ds='2008-04-08', hr='12');
select count(1) from srcpart where ds='2008-04-08';
select count(1) from list_bucketing_dynamic_part_n1 where ds='2008-04-08';
select key, value from srcpart where ds='2008-04-08' and key = "103" and value ="val_103";
set hive.optimize.listbucketing=true;
explain extended
select key, value, ds, hr from list_bucketing_dynamic_part_n1 where ds='2008-04-08' and key = "103" and value ="val_103";
select key, value, ds, hr from list_bucketing_dynamic_part_n1 where ds='2008-04-08' and key = "103" and value ="val_103";
-- clean up resources
drop table list_bucketing_dynamic_part_n1;