| --! qt:dataset:src |
| -- Session settings for the reduce-deduplication scenarios in this script. |
| -- Read inputs through the plain HiveInputFormat. |
| set hive.input.format=org.apache.hadoop.hive.ql.io.HiveInputFormat; |
| -- Cap the number of reducers at one. |
| set hive.exec.reducers.max = 1; |
| -- NOTE(review): presumably lets the optimizer treat the TRANSFORM scripts used |
| -- later in this script as trusted; confirm against the Hive configuration docs. |
| set hive.exec.script.trust = true; |
| -- Turn reduce deduplication on and drop its minimum-reducer threshold to 1, |
| -- presumably so it still applies under the single-reducer cap set above. |
| set hive.optimize.reducededuplication = true; |
| set hive.optimize.reducededuplication.min.reducer = 1; |
| |
| |
| -- Target table, clustered by key into two buckets. |
| CREATE TABLE bucket5_1 ( |
|     key string, |
|     value string |
| ) |
| CLUSTERED BY (key) INTO 2 BUCKETS; |
| |
| -- Print the extended plan for loading src into the bucketed table. |
| EXPLAIN EXTENDED |
| INSERT OVERWRITE TABLE bucket5_1 |
| SELECT * |
| FROM src |
| CLUSTER BY key; |
| |
| -- Execute the same load. |
| INSERT OVERWRITE TABLE bucket5_1 |
| SELECT * |
| FROM src |
| CLUSTER BY key; |
| |
| -- Hash sums over the loaded table and over src, emitted one after the other |
| -- so the two result rows can be compared. |
| SELECT |
|     sum(hash(key)), |
|     sum(hash(value)) |
| FROM bucket5_1; |
| |
| SELECT |
|     sum(hash(key)), |
|     sum(hash(value)) |
| FROM src; |
| |
| |
| -- Destination table: seven columns, partitioned by ds. |
| CREATE TABLE complex_tbl_1 ( |
|     aid string, |
|     bid string, |
|     t int, |
|     ctime string, |
|     etime bigint, |
|     l string, |
|     et string |
| ) |
| PARTITIONED BY (ds string); |
| |
| -- Source table: two string columns, partitioned by ds. |
| CREATE TABLE complex_tbl_2 ( |
|     aet string, |
|     aes string |
| ) |
| PARTITIONED BY (ds string); |
| |
| -- Plan only (nothing is loaded): two nested 'cat' TRANSFORM stages feeding one |
| -- partition of complex_tbl_1; the inner stage is clustered by bid. |
| EXPLAIN EXTENDED |
| INSERT OVERWRITE TABLE complex_tbl_1 PARTITION (ds = '2010-03-29') |
| SELECT s2.* |
| FROM ( |
|     SELECT TRANSFORM (aid, bid, t, ctime, etime, l, et) |
|         USING 'cat' |
|         AS (aid string, bid string, t int, ctime string, etime bigint, l string, et string) |
|     FROM ( |
|         SELECT TRANSFORM (aet, aes) |
|             USING 'cat' |
|             AS (aid string, bid string, t int, ctime string, etime bigint, l string, et string) |
|         FROM complex_tbl_2 |
|         WHERE ds = '2010-03-29' |
|         CLUSTER BY bid |
|     ) s |
| ) s2; |
| |
| |
| |
| |
| |