| PREHOOK: query: drop table if exists t1_staging |
| PREHOOK: type: DROPTABLE |
| POSTHOOK: query: drop table if exists t1_staging |
| POSTHOOK: type: DROPTABLE |
| PREHOOK: query: create table t1_staging( |
| a string, |
| b int, |
| c int, |
| d string) |
| partitioned by (e string) |
| clustered by(a) |
| sorted by(a desc) |
| into 256 buckets stored as textfile |
| PREHOOK: type: CREATETABLE |
| PREHOOK: Output: database:default |
| PREHOOK: Output: default@t1_staging |
| POSTHOOK: query: create table t1_staging( |
| a string, |
| b int, |
| c int, |
| d string) |
| partitioned by (e string) |
| clustered by(a) |
| sorted by(a desc) |
| into 256 buckets stored as textfile |
| POSTHOOK: type: CREATETABLE |
| POSTHOOK: Output: database:default |
| POSTHOOK: Output: default@t1_staging |
| PREHOOK: query: load data local inpath '../../data/files/sortdp/000000_0' overwrite into table t1_staging partition (e='epart') |
| PREHOOK: type: LOAD |
| #### A masked pattern was here #### |
| PREHOOK: Output: default@t1_staging |
| POSTHOOK: query: load data local inpath '../../data/files/sortdp/000000_0' overwrite into table t1_staging partition (e='epart') |
| POSTHOOK: type: LOAD |
| #### A masked pattern was here #### |
| POSTHOOK: Output: default@t1_staging |
| POSTHOOK: Output: default@t1_staging@e=epart |
| PREHOOK: query: drop table t1_n147 |
| PREHOOK: type: DROPTABLE |
| POSTHOOK: query: drop table t1_n147 |
| POSTHOOK: type: DROPTABLE |
| PREHOOK: query: create table t1_n147( |
| a string, |
| b int, |
| c int, |
| d string) |
| partitioned by (e string) |
| clustered by(a) |
| sorted by(a desc) into 10 buckets stored as textfile |
| PREHOOK: type: CREATETABLE |
| PREHOOK: Output: database:default |
| PREHOOK: Output: default@t1_n147 |
| POSTHOOK: query: create table t1_n147( |
| a string, |
| b int, |
| c int, |
| d string) |
| partitioned by (e string) |
| clustered by(a) |
| sorted by(a desc) into 10 buckets stored as textfile |
| POSTHOOK: type: CREATETABLE |
| POSTHOOK: Output: database:default |
| POSTHOOK: Output: default@t1_n147 |
| PREHOOK: query: insert overwrite table t1_n147 partition(e) select a,b,c,d,'epart' from t1_staging |
| PREHOOK: type: QUERY |
| PREHOOK: Input: default@t1_staging |
| PREHOOK: Input: default@t1_staging@e=epart |
| PREHOOK: Output: default@t1_n147 |
| POSTHOOK: query: insert overwrite table t1_n147 partition(e) select a,b,c,d,'epart' from t1_staging |
| POSTHOOK: type: QUERY |
| POSTHOOK: Input: default@t1_staging |
| POSTHOOK: Input: default@t1_staging@e=epart |
| POSTHOOK: Output: default@t1_n147 |
| POSTHOOK: Output: default@t1_n147@e=epart |
| POSTHOOK: Lineage: t1_n147 PARTITION(e=epart).a SIMPLE [(t1_staging)t1_staging.FieldSchema(name:a, type:string, comment:null), ] |
| POSTHOOK: Lineage: t1_n147 PARTITION(e=epart).b SIMPLE [(t1_staging)t1_staging.FieldSchema(name:b, type:int, comment:null), ] |
| POSTHOOK: Lineage: t1_n147 PARTITION(e=epart).c SIMPLE [(t1_staging)t1_staging.FieldSchema(name:c, type:int, comment:null), ] |
| POSTHOOK: Lineage: t1_n147 PARTITION(e=epart).d SIMPLE [(t1_staging)t1_staging.FieldSchema(name:d, type:string, comment:null), ] |
| PREHOOK: query: select 'bucket_0' |
| PREHOOK: type: QUERY |
| PREHOOK: Input: _dummy_database@_dummy_table |
| #### A masked pattern was here #### |
| POSTHOOK: query: select 'bucket_0' |
| POSTHOOK: type: QUERY |
| POSTHOOK: Input: _dummy_database@_dummy_table |
| #### A masked pattern was here #### |
| bucket_0 |
| fff06c6e0fd675ebeff09350e6b7a3900115f72341fd353e5e185e8983d10534002015-01-21 |
| PREHOOK: query: select 'bucket_2' |
| PREHOOK: type: QUERY |
| PREHOOK: Input: _dummy_database@_dummy_table |
| #### A masked pattern was here #### |
| POSTHOOK: query: select 'bucket_2' |
| POSTHOOK: type: QUERY |
| POSTHOOK: Input: _dummy_database@_dummy_table |
| #### A masked pattern was here #### |
| bucket_2 |
| ffff67aef705abda0b89d899e408c28ef230fd0bb2cb0bb23b057e946ba9ca91\N\N2015-01-21 |
| fff3474e56ee23c0df629b538268a438d74da36208bdb114bda2da4253f0b4c9\N\N2015-01-21 |
| PREHOOK: query: select 'bucket_4' |
| PREHOOK: type: QUERY |
| PREHOOK: Input: _dummy_database@_dummy_table |
| #### A masked pattern was here #### |
| POSTHOOK: query: select 'bucket_4' |
| POSTHOOK: type: QUERY |
| POSTHOOK: Input: _dummy_database@_dummy_table |
| #### A masked pattern was here #### |
| bucket_4 |
| fffcb494aa56beb88fddb83cc3b0296d417d3ab7782be76c8c12d33e3f3d6a3c\N\N2015-01-21 |
| fffad1074d813e6db5c23302a9170fe472c2968844499c90445cbc8559d64fe1082015-01-21 |
| fff03007f38c32085bb4c9389270b965d371168032845555b663b7d4653ec8ee\N\N2015-01-21 |
| ffefa017a261a0b3e94c2386e0c47a015e2095e5d56b0f4fca2033d9755c9e45012015-01-21 |
| PREHOOK: query: select 'bucket_6' |
| PREHOOK: type: QUERY |
| PREHOOK: Input: _dummy_database@_dummy_table |
| #### A masked pattern was here #### |
| POSTHOOK: query: select 'bucket_6' |
| POSTHOOK: type: QUERY |
| POSTHOOK: Input: _dummy_database@_dummy_table |
| #### A masked pattern was here #### |
| bucket_6 |
| fffee943d640a7714d09f9bd50dba08a9d0ebdd146655e4642c293a4396cb385\N\N2015-01-21 |
| fffc0450ec9b28bae495dffc87a37cc3eea6d2d067ccea8b333185d28847ae2a\N\N2015-01-21 |
| PREHOOK: query: select 'bucket_8' |
| PREHOOK: type: QUERY |
| PREHOOK: Input: _dummy_database@_dummy_table |
| #### A masked pattern was here #### |
| POSTHOOK: query: select 'bucket_8' |
| POSTHOOK: type: QUERY |
| POSTHOOK: Input: _dummy_database@_dummy_table |
| #### A masked pattern was here #### |
| bucket_8 |
| fffcf74695669d1f444936243869f3586418c6d61d3abb5cc9acb67a3ad7bd2f002015-01-21 |
| fffbe3c110c390ec20218e5ad4a026ff515668ed55488b717319b556daa962a1002015-01-21 |
| fffb1b226efc3cfaac8d73647ce4fa4e82413d67265fb55366ac3a4996518738012015-01-21 |
| fff56191e39b15f0e2f04984c70152fb1bde2ecba52ff5a73b4c28bf4d58c017002015-01-21 |
| fff4166378aa9d94cd4f8a9cd543375890a61b4f09a57dbfb31a66b33b3e3fd9\N\N2015-01-21 |
| PREHOOK: query: drop table t1_n147 |
| PREHOOK: type: DROPTABLE |
| PREHOOK: Input: default@t1_n147 |
| PREHOOK: Output: default@t1_n147 |
| POSTHOOK: query: drop table t1_n147 |
| POSTHOOK: type: DROPTABLE |
| POSTHOOK: Input: default@t1_n147 |
| POSTHOOK: Output: default@t1_n147 |
| PREHOOK: query: create table t1_n147( |
| a string, |
| b int, |
| c int, |
| d string) |
| partitioned by (e string) |
| clustered by(a) |
| sorted by(a desc) into 10 buckets stored as textfile |
| PREHOOK: type: CREATETABLE |
| PREHOOK: Output: database:default |
| PREHOOK: Output: default@t1_n147 |
| POSTHOOK: query: create table t1_n147( |
| a string, |
| b int, |
| c int, |
| d string) |
| partitioned by (e string) |
| clustered by(a) |
| sorted by(a desc) into 10 buckets stored as textfile |
| POSTHOOK: type: CREATETABLE |
| POSTHOOK: Output: database:default |
| POSTHOOK: Output: default@t1_n147 |
| PREHOOK: query: insert overwrite table t1_n147 partition(e) select a,b,c,d,'epart' from t1_staging |
| PREHOOK: type: QUERY |
| PREHOOK: Input: default@t1_staging |
| PREHOOK: Input: default@t1_staging@e=epart |
| PREHOOK: Output: default@t1_n147 |
| POSTHOOK: query: insert overwrite table t1_n147 partition(e) select a,b,c,d,'epart' from t1_staging |
| POSTHOOK: type: QUERY |
| POSTHOOK: Input: default@t1_staging |
| POSTHOOK: Input: default@t1_staging@e=epart |
| POSTHOOK: Output: default@t1_n147 |
| POSTHOOK: Output: default@t1_n147@e=epart |
| POSTHOOK: Lineage: t1_n147 PARTITION(e=epart).a SIMPLE [(t1_staging)t1_staging.FieldSchema(name:a, type:string, comment:null), ] |
| POSTHOOK: Lineage: t1_n147 PARTITION(e=epart).b SIMPLE [(t1_staging)t1_staging.FieldSchema(name:b, type:int, comment:null), ] |
| POSTHOOK: Lineage: t1_n147 PARTITION(e=epart).c SIMPLE [(t1_staging)t1_staging.FieldSchema(name:c, type:int, comment:null), ] |
| POSTHOOK: Lineage: t1_n147 PARTITION(e=epart).d SIMPLE [(t1_staging)t1_staging.FieldSchema(name:d, type:string, comment:null), ] |
| PREHOOK: query: select 'bucket_0' |
| PREHOOK: type: QUERY |
| PREHOOK: Input: _dummy_database@_dummy_table |
| #### A masked pattern was here #### |
| POSTHOOK: query: select 'bucket_0' |
| POSTHOOK: type: QUERY |
| POSTHOOK: Input: _dummy_database@_dummy_table |
| #### A masked pattern was here #### |
| bucket_0 |
| fff06c6e0fd675ebeff09350e6b7a3900115f72341fd353e5e185e8983d10534002015-01-21 |
| PREHOOK: query: select 'bucket_2' |
| PREHOOK: type: QUERY |
| PREHOOK: Input: _dummy_database@_dummy_table |
| #### A masked pattern was here #### |
| POSTHOOK: query: select 'bucket_2' |
| POSTHOOK: type: QUERY |
| POSTHOOK: Input: _dummy_database@_dummy_table |
| #### A masked pattern was here #### |
| bucket_2 |
| ffff67aef705abda0b89d899e408c28ef230fd0bb2cb0bb23b057e946ba9ca91\N\N2015-01-21 |
| fff3474e56ee23c0df629b538268a438d74da36208bdb114bda2da4253f0b4c9\N\N2015-01-21 |
| PREHOOK: query: select 'bucket_4' |
| PREHOOK: type: QUERY |
| PREHOOK: Input: _dummy_database@_dummy_table |
| #### A masked pattern was here #### |
| POSTHOOK: query: select 'bucket_4' |
| POSTHOOK: type: QUERY |
| POSTHOOK: Input: _dummy_database@_dummy_table |
| #### A masked pattern was here #### |
| bucket_4 |
| fffcb494aa56beb88fddb83cc3b0296d417d3ab7782be76c8c12d33e3f3d6a3c\N\N2015-01-21 |
| fffad1074d813e6db5c23302a9170fe472c2968844499c90445cbc8559d64fe1082015-01-21 |
| fff03007f38c32085bb4c9389270b965d371168032845555b663b7d4653ec8ee\N\N2015-01-21 |
| ffefa017a261a0b3e94c2386e0c47a015e2095e5d56b0f4fca2033d9755c9e45012015-01-21 |
| PREHOOK: query: select 'bucket_6' |
| PREHOOK: type: QUERY |
| PREHOOK: Input: _dummy_database@_dummy_table |
| #### A masked pattern was here #### |
| POSTHOOK: query: select 'bucket_6' |
| POSTHOOK: type: QUERY |
| POSTHOOK: Input: _dummy_database@_dummy_table |
| #### A masked pattern was here #### |
| bucket_6 |
| fffee943d640a7714d09f9bd50dba08a9d0ebdd146655e4642c293a4396cb385\N\N2015-01-21 |
| fffc0450ec9b28bae495dffc87a37cc3eea6d2d067ccea8b333185d28847ae2a\N\N2015-01-21 |
| PREHOOK: query: select 'bucket_8' |
| PREHOOK: type: QUERY |
| PREHOOK: Input: _dummy_database@_dummy_table |
| #### A masked pattern was here #### |
| POSTHOOK: query: select 'bucket_8' |
| POSTHOOK: type: QUERY |
| POSTHOOK: Input: _dummy_database@_dummy_table |
| #### A masked pattern was here #### |
| bucket_8 |
| fffcf74695669d1f444936243869f3586418c6d61d3abb5cc9acb67a3ad7bd2f002015-01-21 |
| fffbe3c110c390ec20218e5ad4a026ff515668ed55488b717319b556daa962a1002015-01-21 |
| fffb1b226efc3cfaac8d73647ce4fa4e82413d67265fb55366ac3a4996518738012015-01-21 |
| fff56191e39b15f0e2f04984c70152fb1bde2ecba52ff5a73b4c28bf4d58c017002015-01-21 |
| fff4166378aa9d94cd4f8a9cd543375890a61b4f09a57dbfb31a66b33b3e3fd9\N\N2015-01-21 |
| PREHOOK: query: CREATE TABLE dynpart_sort_opt_bucketing_test (ca_address_sk int, ca_address_id string, ca_street_number string, ca_street_name string, |
| ca_street_type string, ca_suite_number string, ca_city string, ca_county string, ca_state string, |
| ca_zip string, ca_country string, ca_gmt_offset decimal(5,2)) |
| PARTITIONED BY (ca_location_type string) |
| CLUSTERED BY (ca_state) INTO 50 BUCKETS STORED AS ORC TBLPROPERTIES('transactional'='true') |
| PREHOOK: type: CREATETABLE |
| PREHOOK: Output: database:default |
| PREHOOK: Output: default@dynpart_sort_opt_bucketing_test |
| POSTHOOK: query: CREATE TABLE dynpart_sort_opt_bucketing_test (ca_address_sk int, ca_address_id string, ca_street_number string, ca_street_name string, |
| ca_street_type string, ca_suite_number string, ca_city string, ca_county string, ca_state string, |
| ca_zip string, ca_country string, ca_gmt_offset decimal(5,2)) |
| PARTITIONED BY (ca_location_type string) |
| CLUSTERED BY (ca_state) INTO 50 BUCKETS STORED AS ORC TBLPROPERTIES('transactional'='true') |
| POSTHOOK: type: CREATETABLE |
| POSTHOOK: Output: database:default |
| POSTHOOK: Output: default@dynpart_sort_opt_bucketing_test |
| PREHOOK: query: explain INSERT INTO TABLE dynpart_sort_opt_bucketing_test PARTITION (ca_location_type) VALUES (5555, 'AAAAAAAADLFBAAAA', '126', |
| 'Highland Park', 'Court', 'Suite E', 'San Jose', 'King George County', 'VA', '28003', 'United States', |
| '-5', 'single family') |
| PREHOOK: type: QUERY |
| PREHOOK: Input: _dummy_database@_dummy_table |
| PREHOOK: Output: default@dynpart_sort_opt_bucketing_test |
| POSTHOOK: query: explain INSERT INTO TABLE dynpart_sort_opt_bucketing_test PARTITION (ca_location_type) VALUES (5555, 'AAAAAAAADLFBAAAA', '126', |
| 'Highland Park', 'Court', 'Suite E', 'San Jose', 'King George County', 'VA', '28003', 'United States', |
| '-5', 'single family') |
| POSTHOOK: type: QUERY |
| POSTHOOK: Input: _dummy_database@_dummy_table |
| POSTHOOK: Output: default@dynpart_sort_opt_bucketing_test |
| STAGE DEPENDENCIES: |
| Stage-1 is a root stage |
| Stage-2 depends on stages: Stage-1 |
| Stage-0 depends on stages: Stage-2 |
| |
| STAGE PLANS: |
| Stage: Stage-1 |
| Tez |
| #### A masked pattern was here #### |
| Edges: |
| Reducer 2 <- Map 1 (SIMPLE_EDGE) |
| #### A masked pattern was here #### |
| Vertices: |
| Map 1 |
| Map Operator Tree: |
| TableScan |
| alias: _dummy_table |
| Row Limit Per Split: 1 |
| Statistics: Num rows: 1 Data size: 10 Basic stats: COMPLETE Column stats: COMPLETE |
| Select Operator |
| expressions: array(const struct(5555,'AAAAAAAADLFBAAAA','126','Highland Park','Court','Suite E','San Jose','King George County','VA','28003','United States','-5','single family')) (type: array<struct<col1:int,col2:string,col3:string,col4:string,col5:string,col6:string,col7:string,col8:string,col9:string,col10:string,col11:string,col12:string,col13:string>>) |
| outputColumnNames: _col0 |
| Statistics: Num rows: 1 Data size: 48 Basic stats: COMPLETE Column stats: COMPLETE |
| UDTF Operator |
| Statistics: Num rows: 1 Data size: 48 Basic stats: COMPLETE Column stats: COMPLETE |
| function name: inline |
| Select Operator |
| expressions: col1 (type: int), col2 (type: string), col3 (type: string), col4 (type: string), col5 (type: string), col6 (type: string), col7 (type: string), col8 (type: string), col9 (type: string), col10 (type: string), col11 (type: string), CAST( col12 AS decimal(5,2)) (type: decimal(5,2)), col13 (type: string) |
| outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12 |
| Statistics: Num rows: 1 Data size: 112 Basic stats: COMPLETE Column stats: COMPLETE |
| Reduce Output Operator |
| key expressions: _col12 (type: string), _bucket_number (type: string), _col8 (type: string) |
| null sort order: aaa |
| sort order: +++ |
| Map-reduce partition columns: _col12 (type: string) |
| Statistics: Num rows: 1 Data size: 112 Basic stats: COMPLETE Column stats: COMPLETE |
| value expressions: _col0 (type: int), _col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string), _col6 (type: string), _col7 (type: string), _col9 (type: string), _col10 (type: string), _col11 (type: decimal(5,2)) |
| Execution mode: llap |
| LLAP IO: no inputs |
| Reducer 2 |
| Execution mode: llap |
| Reduce Operator Tree: |
| Select Operator |
| expressions: VALUE._col0 (type: int), VALUE._col1 (type: string), VALUE._col2 (type: string), VALUE._col3 (type: string), VALUE._col4 (type: string), VALUE._col5 (type: string), VALUE._col6 (type: string), VALUE._col7 (type: string), KEY._col8 (type: string), VALUE._col9 (type: string), VALUE._col10 (type: string), VALUE._col11 (type: decimal(5,2)), KEY._col12 (type: string), KEY._bucket_number (type: string) |
| outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _bucket_number |
| File Output Operator |
| compressed: false |
| Dp Sort State: PARTITION_BUCKET_SORTED |
| Statistics: Num rows: 1 Data size: 112 Basic stats: COMPLETE Column stats: COMPLETE |
| table: |
| input format: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat |
| output format: org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat |
| serde: org.apache.hadoop.hive.ql.io.orc.OrcSerde |
| name: default.dynpart_sort_opt_bucketing_test |
| Write Type: INSERT |
| |
| Stage: Stage-2 |
| Dependency Collection |
| |
| Stage: Stage-0 |
| Move Operator |
| tables: |
| partition: |
| ca_location_type |
| replace: false |
| table: |
| input format: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat |
| output format: org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat |
| serde: org.apache.hadoop.hive.ql.io.orc.OrcSerde |
| name: default.dynpart_sort_opt_bucketing_test |
| Write Type: INSERT |
| |
| PREHOOK: query: INSERT INTO TABLE dynpart_sort_opt_bucketing_test PARTITION (ca_location_type) VALUES (5555, 'AAAAAAAADLFBAAAA', '126', |
| 'Highland Park', 'Court', 'Suite E', 'San Jose', 'King George County', 'VA', '28003', 'United States', |
| '-5', 'single family') |
| PREHOOK: type: QUERY |
| PREHOOK: Input: _dummy_database@_dummy_table |
| PREHOOK: Output: default@dynpart_sort_opt_bucketing_test |
| POSTHOOK: query: INSERT INTO TABLE dynpart_sort_opt_bucketing_test PARTITION (ca_location_type) VALUES (5555, 'AAAAAAAADLFBAAAA', '126', |
| 'Highland Park', 'Court', 'Suite E', 'San Jose', 'King George County', 'VA', '28003', 'United States', |
| '-5', 'single family') |
| POSTHOOK: type: QUERY |
| POSTHOOK: Input: _dummy_database@_dummy_table |
| POSTHOOK: Output: default@dynpart_sort_opt_bucketing_test |
| POSTHOOK: Output: default@dynpart_sort_opt_bucketing_test@ca_location_type=single family |
| POSTHOOK: Lineage: dynpart_sort_opt_bucketing_test PARTITION(ca_location_type=single family).ca_address_id SCRIPT [] |
| POSTHOOK: Lineage: dynpart_sort_opt_bucketing_test PARTITION(ca_location_type=single family).ca_address_sk SCRIPT [] |
| POSTHOOK: Lineage: dynpart_sort_opt_bucketing_test PARTITION(ca_location_type=single family).ca_city SCRIPT [] |
| POSTHOOK: Lineage: dynpart_sort_opt_bucketing_test PARTITION(ca_location_type=single family).ca_country SCRIPT [] |
| POSTHOOK: Lineage: dynpart_sort_opt_bucketing_test PARTITION(ca_location_type=single family).ca_county SCRIPT [] |
| POSTHOOK: Lineage: dynpart_sort_opt_bucketing_test PARTITION(ca_location_type=single family).ca_gmt_offset SCRIPT [] |
| POSTHOOK: Lineage: dynpart_sort_opt_bucketing_test PARTITION(ca_location_type=single family).ca_state SCRIPT [] |
| POSTHOOK: Lineage: dynpart_sort_opt_bucketing_test PARTITION(ca_location_type=single family).ca_street_name SCRIPT [] |
| POSTHOOK: Lineage: dynpart_sort_opt_bucketing_test PARTITION(ca_location_type=single family).ca_street_number SCRIPT [] |
| POSTHOOK: Lineage: dynpart_sort_opt_bucketing_test PARTITION(ca_location_type=single family).ca_street_type SCRIPT [] |
| POSTHOOK: Lineage: dynpart_sort_opt_bucketing_test PARTITION(ca_location_type=single family).ca_suite_number SCRIPT [] |
| POSTHOOK: Lineage: dynpart_sort_opt_bucketing_test PARTITION(ca_location_type=single family).ca_zip SCRIPT [] |
| PREHOOK: query: select * from dynpart_sort_opt_bucketing_test |
| PREHOOK: type: QUERY |
| PREHOOK: Input: default@dynpart_sort_opt_bucketing_test |
| PREHOOK: Input: default@dynpart_sort_opt_bucketing_test@ca_location_type=single family |
| #### A masked pattern was here #### |
| POSTHOOK: query: select * from dynpart_sort_opt_bucketing_test |
| POSTHOOK: type: QUERY |
| POSTHOOK: Input: default@dynpart_sort_opt_bucketing_test |
| POSTHOOK: Input: default@dynpart_sort_opt_bucketing_test@ca_location_type=single family |
| #### A masked pattern was here #### |
| 5555 AAAAAAAADLFBAAAA 126 Highland Park Court Suite E San Jose King George County VA 28003 United States -5.00 single family |
| PREHOOK: query: explain INSERT INTO TABLE dynpart_sort_opt_bucketing_test PARTITION (ca_location_type) VALUES (5555, 'AAAAAAAADLFBAAAA', '126', |
| 'Highland Park', 'Court', 'Suite E', 'San Jose', 'King George County', 'VA', '28003', 'United States', |
| '-5', 'single family') |
| PREHOOK: type: QUERY |
| PREHOOK: Input: _dummy_database@_dummy_table |
| PREHOOK: Output: default@dynpart_sort_opt_bucketing_test |
| POSTHOOK: query: explain INSERT INTO TABLE dynpart_sort_opt_bucketing_test PARTITION (ca_location_type) VALUES (5555, 'AAAAAAAADLFBAAAA', '126', |
| 'Highland Park', 'Court', 'Suite E', 'San Jose', 'King George County', 'VA', '28003', 'United States', |
| '-5', 'single family') |
| POSTHOOK: type: QUERY |
| POSTHOOK: Input: _dummy_database@_dummy_table |
| POSTHOOK: Output: default@dynpart_sort_opt_bucketing_test |
| STAGE DEPENDENCIES: |
| Stage-1 is a root stage |
| Stage-2 depends on stages: Stage-1 |
| Stage-0 depends on stages: Stage-2 |
| Stage-3 depends on stages: Stage-0 |
| |
| STAGE PLANS: |
| Stage: Stage-1 |
| Tez |
| #### A masked pattern was here #### |
| Edges: |
| Reducer 2 <- Map 1 (SIMPLE_EDGE) |
| Reducer 3 <- Map 1 (SIMPLE_EDGE) |
| #### A masked pattern was here #### |
| Vertices: |
| Map 1 |
| Map Operator Tree: |
| TableScan |
| alias: _dummy_table |
| Row Limit Per Split: 1 |
| Statistics: Num rows: 1 Data size: 10 Basic stats: COMPLETE Column stats: COMPLETE |
| Select Operator |
| expressions: array(const struct(5555,'AAAAAAAADLFBAAAA','126','Highland Park','Court','Suite E','San Jose','King George County','VA','28003','United States','-5','single family')) (type: array<struct<col1:int,col2:string,col3:string,col4:string,col5:string,col6:string,col7:string,col8:string,col9:string,col10:string,col11:string,col12:string,col13:string>>) |
| outputColumnNames: _col0 |
| Statistics: Num rows: 1 Data size: 48 Basic stats: COMPLETE Column stats: COMPLETE |
| UDTF Operator |
| Statistics: Num rows: 1 Data size: 48 Basic stats: COMPLETE Column stats: COMPLETE |
| function name: inline |
| Select Operator |
| expressions: col1 (type: int), col2 (type: string), col3 (type: string), col4 (type: string), col5 (type: string), col6 (type: string), col7 (type: string), col8 (type: string), col9 (type: string), col10 (type: string), col11 (type: string), CAST( col12 AS decimal(5,2)) (type: decimal(5,2)), col13 (type: string) |
| outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12 |
| Statistics: Num rows: 1 Data size: 112 Basic stats: COMPLETE Column stats: COMPLETE |
| Select Operator |
| expressions: _col0 (type: int), _col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string), _col6 (type: string), _col7 (type: string), _col8 (type: string), _col9 (type: string), _col10 (type: string), _col11 (type: decimal(5,2)), _col12 (type: string) |
| outputColumnNames: ca_address_sk, ca_address_id, ca_street_number, ca_street_name, ca_street_type, ca_suite_number, ca_city, ca_county, ca_state, ca_zip, ca_country, ca_gmt_offset, ca_location_type |
| Statistics: Num rows: 1 Data size: 112 Basic stats: COMPLETE Column stats: COMPLETE |
| Group By Operator |
| aggregations: min(ca_address_sk), max(ca_address_sk), count(1), count(ca_address_sk), compute_bit_vector(ca_address_sk, 'hll'), max(length(ca_address_id)), avg(COALESCE(length(ca_address_id),0)), count(ca_address_id), compute_bit_vector(ca_address_id, 'hll'), max(length(ca_street_number)), avg(COALESCE(length(ca_street_number),0)), count(ca_street_number), compute_bit_vector(ca_street_number, 'hll'), max(length(ca_street_name)), avg(COALESCE(length(ca_street_name),0)), count(ca_street_name), compute_bit_vector(ca_street_name, 'hll'), max(length(ca_street_type)), avg(COALESCE(length(ca_street_type),0)), count(ca_street_type), compute_bit_vector(ca_street_type, 'hll'), max(length(ca_suite_number)), avg(COALESCE(length(ca_suite_number),0)), count(ca_suite_number), compute_bit_vector(ca_suite_number, 'hll'), max(length(ca_city)), avg(COALESCE(length(ca_city),0)), count(ca_city), compute_bit_vector(ca_city, 'hll'), max(length(ca_county)), avg(COALESCE(length(ca_county),0)), count(ca_county), compute_bit_vector(ca_county, 'hll'), max(length(ca_state)), avg(COALESCE(length(ca_state),0)), count(ca_state), compute_bit_vector(ca_state, 'hll'), max(length(ca_zip)), avg(COALESCE(length(ca_zip),0)), count(ca_zip), compute_bit_vector(ca_zip, 'hll'), max(length(ca_country)), avg(COALESCE(length(ca_country),0)), count(ca_country), compute_bit_vector(ca_country, 'hll'), min(ca_gmt_offset), max(ca_gmt_offset), count(ca_gmt_offset), compute_bit_vector(ca_gmt_offset, 'hll') |
| keys: ca_location_type (type: string) |
| minReductionHashAggr: 0.0 |
| mode: hash |
| outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col17, _col18, _col19, _col20, _col21, _col22, _col23, _col24, _col25, _col26, _col27, _col28, _col29, _col30, _col31, _col32, _col33, _col34, _col35, _col36, _col37, _col38, _col39, _col40, _col41, _col42, _col43, _col44, _col45, _col46, _col47, _col48, _col49 |
| Statistics: Num rows: 1 Data size: 3048 Basic stats: COMPLETE Column stats: COMPLETE |
| Reduce Output Operator |
| key expressions: _col0 (type: string) |
| null sort order: z |
| sort order: + |
| Map-reduce partition columns: _col0 (type: string) |
| Statistics: Num rows: 1 Data size: 3048 Basic stats: COMPLETE Column stats: COMPLETE |
| value expressions: _col1 (type: int), _col2 (type: int), _col3 (type: bigint), _col4 (type: bigint), _col5 (type: binary), _col6 (type: int), _col7 (type: struct<count:bigint,sum:double,input:int>), _col8 (type: bigint), _col9 (type: binary), _col10 (type: int), _col11 (type: struct<count:bigint,sum:double,input:int>), _col12 (type: bigint), _col13 (type: binary), _col14 (type: int), _col15 (type: struct<count:bigint,sum:double,input:int>), _col16 (type: bigint), _col17 (type: binary), _col18 (type: int), _col19 (type: struct<count:bigint,sum:double,input:int>), _col20 (type: bigint), _col21 (type: binary), _col22 (type: int), _col23 (type: struct<count:bigint,sum:double,input:int>), _col24 (type: bigint), _col25 (type: binary), _col26 (type: int), _col27 (type: struct<count:bigint,sum:double,input:int>), _col28 (type: bigint), _col29 (type: binary), _col30 (type: int), _col31 (type: struct<count:bigint,sum:double,input:int>), _col32 (type: bigint), _col33 (type: binary), _col34 (type: int), _col35 (type: struct<count:bigint,sum:double,input:int>), _col36 (type: bigint), _col37 (type: binary), _col38 (type: int), _col39 (type: struct<count:bigint,sum:double,input:int>), _col40 (type: bigint), _col41 (type: binary), _col42 (type: int), _col43 (type: struct<count:bigint,sum:double,input:int>), _col44 (type: bigint), _col45 (type: binary), _col46 (type: decimal(5,2)), _col47 (type: decimal(5,2)), _col48 (type: bigint), _col49 (type: binary) |
| Reduce Output Operator |
| key expressions: _col12 (type: string), _bucket_number (type: string), _col8 (type: string) |
| null sort order: aaa |
| sort order: +++ |
| Map-reduce partition columns: _col12 (type: string) |
| Statistics: Num rows: 1 Data size: 112 Basic stats: COMPLETE Column stats: COMPLETE |
| value expressions: _col0 (type: int), _col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string), _col6 (type: string), _col7 (type: string), _col9 (type: string), _col10 (type: string), _col11 (type: decimal(5,2)) |
| Execution mode: llap |
| LLAP IO: no inputs |
| Reducer 2 |
| Execution mode: llap |
| Reduce Operator Tree: |
| Group By Operator |
| aggregations: min(VALUE._col0), max(VALUE._col1), count(VALUE._col2), count(VALUE._col3), compute_bit_vector(VALUE._col4), max(VALUE._col5), avg(VALUE._col6), count(VALUE._col7), compute_bit_vector(VALUE._col8), max(VALUE._col9), avg(VALUE._col10), count(VALUE._col11), compute_bit_vector(VALUE._col12), max(VALUE._col13), avg(VALUE._col14), count(VALUE._col15), compute_bit_vector(VALUE._col16), max(VALUE._col17), avg(VALUE._col18), count(VALUE._col19), compute_bit_vector(VALUE._col20), max(VALUE._col21), avg(VALUE._col22), count(VALUE._col23), compute_bit_vector(VALUE._col24), max(VALUE._col25), avg(VALUE._col26), count(VALUE._col27), compute_bit_vector(VALUE._col28), max(VALUE._col29), avg(VALUE._col30), count(VALUE._col31), compute_bit_vector(VALUE._col32), max(VALUE._col33), avg(VALUE._col34), count(VALUE._col35), compute_bit_vector(VALUE._col36), max(VALUE._col37), avg(VALUE._col38), count(VALUE._col39), compute_bit_vector(VALUE._col40), max(VALUE._col41), avg(VALUE._col42), count(VALUE._col43), compute_bit_vector(VALUE._col44), min(VALUE._col45), max(VALUE._col46), count(VALUE._col47), compute_bit_vector(VALUE._col48) |
| keys: KEY._col0 (type: string) |
| mode: mergepartial |
| outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col17, _col18, _col19, _col20, _col21, _col22, _col23, _col24, _col25, _col26, _col27, _col28, _col29, _col30, _col31, _col32, _col33, _col34, _col35, _col36, _col37, _col38, _col39, _col40, _col41, _col42, _col43, _col44, _col45, _col46, _col47, _col48, _col49 |
| Statistics: Num rows: 1 Data size: 2368 Basic stats: COMPLETE Column stats: COMPLETE |
| Select Operator |
| expressions: 'LONG' (type: string), UDFToLong(_col1) (type: bigint), UDFToLong(_col2) (type: bigint), (_col3 - _col4) (type: bigint), COALESCE(ndv_compute_bit_vector(_col5),0) (type: bigint), _col5 (type: binary), 'STRING' (type: string), UDFToLong(COALESCE(_col6,0)) (type: bigint), COALESCE(_col7,0) (type: double), (_col3 - _col8) (type: bigint), COALESCE(ndv_compute_bit_vector(_col9),0) (type: bigint), _col9 (type: binary), 'STRING' (type: string), UDFToLong(COALESCE(_col10,0)) (type: bigint), COALESCE(_col11,0) (type: double), (_col3 - _col12) (type: bigint), COALESCE(ndv_compute_bit_vector(_col13),0) (type: bigint), _col13 (type: binary), 'STRING' (type: string), UDFToLong(COALESCE(_col14,0)) (type: bigint), COALESCE(_col15,0) (type: double), (_col3 - _col16) (type: bigint), COALESCE(ndv_compute_bit_vector(_col17),0) (type: bigint), _col17 (type: binary), 'STRING' (type: string), UDFToLong(COALESCE(_col18,0)) (type: bigint), COALESCE(_col19,0) (type: double), (_col3 - _col20) (type: bigint), COALESCE(ndv_compute_bit_vector(_col21),0) (type: bigint), _col21 (type: binary), 'STRING' (type: string), UDFToLong(COALESCE(_col22,0)) (type: bigint), COALESCE(_col23,0) (type: double), (_col3 - _col24) (type: bigint), COALESCE(ndv_compute_bit_vector(_col25),0) (type: bigint), _col25 (type: binary), 'STRING' (type: string), UDFToLong(COALESCE(_col26,0)) (type: bigint), COALESCE(_col27,0) (type: double), (_col3 - _col28) (type: bigint), COALESCE(ndv_compute_bit_vector(_col29),0) (type: bigint), _col29 (type: binary), 'STRING' (type: string), UDFToLong(COALESCE(_col30,0)) (type: bigint), COALESCE(_col31,0) (type: double), (_col3 - _col32) (type: bigint), COALESCE(ndv_compute_bit_vector(_col33),0) (type: bigint), _col33 (type: binary), 'STRING' (type: string), UDFToLong(COALESCE(_col34,0)) (type: bigint), COALESCE(_col35,0) (type: double), (_col3 - _col36) (type: bigint), COALESCE(ndv_compute_bit_vector(_col37),0) (type: bigint), _col37 (type: binary), 'STRING' (type: string), UDFToLong(COALESCE(_col38,0)) (type: bigint), COALESCE(_col39,0) (type: double), (_col3 - _col40) (type: bigint), COALESCE(ndv_compute_bit_vector(_col41),0) (type: bigint), _col41 (type: binary), 'STRING' (type: string), UDFToLong(COALESCE(_col42,0)) (type: bigint), COALESCE(_col43,0) (type: double), (_col3 - _col44) (type: bigint), COALESCE(ndv_compute_bit_vector(_col45),0) (type: bigint), _col45 (type: binary), 'DECIMAL' (type: string), _col46 (type: decimal(5,2)), _col47 (type: decimal(5,2)), (_col3 - _col48) (type: bigint), COALESCE(ndv_compute_bit_vector(_col49),0) (type: bigint), _col49 (type: binary), _col0 (type: string) |
| outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col17, _col18, _col19, _col20, _col21, _col22, _col23, _col24, _col25, _col26, _col27, _col28, _col29, _col30, _col31, _col32, _col33, _col34, _col35, _col36, _col37, _col38, _col39, _col40, _col41, _col42, _col43, _col44, _col45, _col46, _col47, _col48, _col49, _col50, _col51, _col52, _col53, _col54, _col55, _col56, _col57, _col58, _col59, _col60, _col61, _col62, _col63, _col64, _col65, _col66, _col67, _col68, _col69, _col70, _col71, _col72 |
| Statistics: Num rows: 1 Data size: 3583 Basic stats: COMPLETE Column stats: COMPLETE |
| File Output Operator |
| compressed: false |
| Statistics: Num rows: 1 Data size: 3583 Basic stats: COMPLETE Column stats: COMPLETE |
| table: |
| input format: org.apache.hadoop.mapred.SequenceFileInputFormat |
| output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat |
| serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe |
| Reducer 3 |
| Execution mode: llap |
| Reduce Operator Tree: |
| Select Operator |
| expressions: VALUE._col0 (type: int), VALUE._col1 (type: string), VALUE._col2 (type: string), VALUE._col3 (type: string), VALUE._col4 (type: string), VALUE._col5 (type: string), VALUE._col6 (type: string), VALUE._col7 (type: string), KEY._col8 (type: string), VALUE._col9 (type: string), VALUE._col10 (type: string), VALUE._col11 (type: decimal(5,2)), KEY._col12 (type: string), KEY._bucket_number (type: string) |
| outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _bucket_number |
| File Output Operator |
| compressed: false |
| Dp Sort State: PARTITION_BUCKET_SORTED |
| Statistics: Num rows: 1 Data size: 112 Basic stats: COMPLETE Column stats: COMPLETE |
| table: |
| input format: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat |
| output format: org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat |
| serde: org.apache.hadoop.hive.ql.io.orc.OrcSerde |
| name: default.dynpart_sort_opt_bucketing_test |
| Write Type: INSERT |
| |
| Stage: Stage-2 |
| Dependency Collection |
| |
| Stage: Stage-0 |
| Move Operator |
| tables: |
| partition: |
| ca_location_type |
| replace: false |
| table: |
| input format: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat |
| output format: org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat |
| serde: org.apache.hadoop.hive.ql.io.orc.OrcSerde |
| name: default.dynpart_sort_opt_bucketing_test |
| Write Type: INSERT |
| |
| Stage: Stage-3 |
| Stats Work |
| Basic Stats Work: |
| Column Stats Desc: |
| Columns: ca_address_sk, ca_address_id, ca_street_number, ca_street_name, ca_street_type, ca_suite_number, ca_city, ca_county, ca_state, ca_zip, ca_country, ca_gmt_offset |
| Column Types: int, string, string, string, string, string, string, string, string, string, string, decimal(5,2) |
| Table: default.dynpart_sort_opt_bucketing_test |
| |
| PREHOOK: query: INSERT INTO TABLE dynpart_sort_opt_bucketing_test PARTITION (ca_location_type) VALUES (5555, 'AAAAAAAADLFBAAAA', '126', |
| 'Highland Park', 'Court', 'Suite E', 'San Jose', 'King George County', 'VA', '28003', 'United States', |
| '-5', 'single family') |
| PREHOOK: type: QUERY |
| PREHOOK: Input: _dummy_database@_dummy_table |
| PREHOOK: Output: default@dynpart_sort_opt_bucketing_test |
| POSTHOOK: query: INSERT INTO TABLE dynpart_sort_opt_bucketing_test PARTITION (ca_location_type) VALUES (5555, 'AAAAAAAADLFBAAAA', '126', |
| 'Highland Park', 'Court', 'Suite E', 'San Jose', 'King George County', 'VA', '28003', 'United States', |
| '-5', 'single family') |
| POSTHOOK: type: QUERY |
| POSTHOOK: Input: _dummy_database@_dummy_table |
| POSTHOOK: Output: default@dynpart_sort_opt_bucketing_test |
| POSTHOOK: Output: default@dynpart_sort_opt_bucketing_test@ca_location_type=single family |
| POSTHOOK: Lineage: dynpart_sort_opt_bucketing_test PARTITION(ca_location_type=single family).ca_address_id SCRIPT [] |
| POSTHOOK: Lineage: dynpart_sort_opt_bucketing_test PARTITION(ca_location_type=single family).ca_address_sk SCRIPT [] |
| POSTHOOK: Lineage: dynpart_sort_opt_bucketing_test PARTITION(ca_location_type=single family).ca_city SCRIPT [] |
| POSTHOOK: Lineage: dynpart_sort_opt_bucketing_test PARTITION(ca_location_type=single family).ca_country SCRIPT [] |
| POSTHOOK: Lineage: dynpart_sort_opt_bucketing_test PARTITION(ca_location_type=single family).ca_county SCRIPT [] |
| POSTHOOK: Lineage: dynpart_sort_opt_bucketing_test PARTITION(ca_location_type=single family).ca_gmt_offset SCRIPT [] |
| POSTHOOK: Lineage: dynpart_sort_opt_bucketing_test PARTITION(ca_location_type=single family).ca_state SCRIPT [] |
| POSTHOOK: Lineage: dynpart_sort_opt_bucketing_test PARTITION(ca_location_type=single family).ca_street_name SCRIPT [] |
| POSTHOOK: Lineage: dynpart_sort_opt_bucketing_test PARTITION(ca_location_type=single family).ca_street_number SCRIPT [] |
| POSTHOOK: Lineage: dynpart_sort_opt_bucketing_test PARTITION(ca_location_type=single family).ca_street_type SCRIPT [] |
| POSTHOOK: Lineage: dynpart_sort_opt_bucketing_test PARTITION(ca_location_type=single family).ca_suite_number SCRIPT [] |
| POSTHOOK: Lineage: dynpart_sort_opt_bucketing_test PARTITION(ca_location_type=single family).ca_zip SCRIPT [] |
| PREHOOK: query: select * from dynpart_sort_opt_bucketing_test |
| PREHOOK: type: QUERY |
| PREHOOK: Input: default@dynpart_sort_opt_bucketing_test |
| PREHOOK: Input: default@dynpart_sort_opt_bucketing_test@ca_location_type=single family |
| #### A masked pattern was here #### |
| POSTHOOK: query: select * from dynpart_sort_opt_bucketing_test |
| POSTHOOK: type: QUERY |
| POSTHOOK: Input: default@dynpart_sort_opt_bucketing_test |
| POSTHOOK: Input: default@dynpart_sort_opt_bucketing_test@ca_location_type=single family |
| #### A masked pattern was here #### |
| 5555 AAAAAAAADLFBAAAA 126 Highland Park Court Suite E San Jose King George County VA 28003 United States -5.00 single family |
| 5555 AAAAAAAADLFBAAAA 126 Highland Park Court Suite E San Jose King George County VA 28003 United States -5.00 single family |
| PREHOOK: query: DROP TABLE dynpart_sort_opt_bucketing_test |
| PREHOOK: type: DROPTABLE |
| PREHOOK: Input: default@dynpart_sort_opt_bucketing_test |
| PREHOOK: Output: default@dynpart_sort_opt_bucketing_test |
| POSTHOOK: query: DROP TABLE dynpart_sort_opt_bucketing_test |
| POSTHOOK: type: DROPTABLE |
| POSTHOOK: Input: default@dynpart_sort_opt_bucketing_test |
| POSTHOOK: Output: default@dynpart_sort_opt_bucketing_test |
| PREHOOK: query: drop table if exists t1_staging |
| PREHOOK: type: DROPTABLE |
| PREHOOK: Input: default@t1_staging |
| PREHOOK: Output: default@t1_staging |
| POSTHOOK: query: drop table if exists t1_staging |
| POSTHOOK: type: DROPTABLE |
| POSTHOOK: Input: default@t1_staging |
| POSTHOOK: Output: default@t1_staging |
| PREHOOK: query: create table t1_staging( |
| a string, |
| b int, |
| c int, |
| d string) |
| partitioned by (e decimal(18,0)) |
| clustered by(a) |
| into 256 buckets STORED AS TEXTFILE |
| PREHOOK: type: CREATETABLE |
| PREHOOK: Output: database:default |
| PREHOOK: Output: default@t1_staging |
| POSTHOOK: query: create table t1_staging( |
| a string, |
| b int, |
| c int, |
| d string) |
| partitioned by (e decimal(18,0)) |
| clustered by(a) |
| into 256 buckets STORED AS TEXTFILE |
| POSTHOOK: type: CREATETABLE |
| POSTHOOK: Output: database:default |
| POSTHOOK: Output: default@t1_staging |
| PREHOOK: query: load data local inpath '../../data/files/sortdp/000000_0' overwrite into table t1_staging partition (e=100) |
| PREHOOK: type: LOAD |
| #### A masked pattern was here #### |
| PREHOOK: Output: default@t1_staging |
| POSTHOOK: query: load data local inpath '../../data/files/sortdp/000000_0' overwrite into table t1_staging partition (e=100) |
| POSTHOOK: type: LOAD |
| #### A masked pattern was here #### |
| POSTHOOK: Output: default@t1_staging |
| POSTHOOK: Output: default@t1_staging@e=100 |
| PREHOOK: query: drop table t1_n147 |
| PREHOOK: type: DROPTABLE |
| PREHOOK: Input: default@t1_n147 |
| PREHOOK: Output: default@t1_n147 |
| POSTHOOK: query: drop table t1_n147 |
| POSTHOOK: type: DROPTABLE |
| POSTHOOK: Input: default@t1_n147 |
| POSTHOOK: Output: default@t1_n147 |
| PREHOOK: query: create table t1_n147( |
| a string, |
| b decimal(6,0), |
| c int, |
| d string) |
| partitioned by (e decimal(3,0)) |
| clustered by(a,b) |
| into 10 buckets STORED AS ORC TBLPROPERTIES ('transactional'='true') |
| PREHOOK: type: CREATETABLE |
| PREHOOK: Output: database:default |
| PREHOOK: Output: default@t1_n147 |
| POSTHOOK: query: create table t1_n147( |
| a string, |
| b decimal(6,0), |
| c int, |
| d string) |
| partitioned by (e decimal(3,0)) |
| clustered by(a,b) |
| into 10 buckets STORED AS ORC TBLPROPERTIES ('transactional'='true') |
| POSTHOOK: type: CREATETABLE |
| POSTHOOK: Output: database:default |
| POSTHOOK: Output: default@t1_n147 |
| PREHOOK: query: explain insert overwrite table t1_n147 partition(e) select a,b,c,d,e from t1_staging |
| PREHOOK: type: QUERY |
| PREHOOK: Input: default@t1_staging |
| PREHOOK: Input: default@t1_staging@e=100 |
| PREHOOK: Output: default@t1_n147 |
| POSTHOOK: query: explain insert overwrite table t1_n147 partition(e) select a,b,c,d,e from t1_staging |
| POSTHOOK: type: QUERY |
| POSTHOOK: Input: default@t1_staging |
| POSTHOOK: Input: default@t1_staging@e=100 |
| POSTHOOK: Output: default@t1_n147 |
| STAGE DEPENDENCIES: |
| Stage-1 is a root stage |
| Stage-2 depends on stages: Stage-1 |
| Stage-0 depends on stages: Stage-2 |
| |
| STAGE PLANS: |
| Stage: Stage-1 |
| Tez |
| #### A masked pattern was here #### |
| Edges: |
| Reducer 2 <- Map 1 (SIMPLE_EDGE) |
| #### A masked pattern was here #### |
| Vertices: |
| Map 1 |
| Map Operator Tree: |
| TableScan |
| alias: t1_staging |
| Statistics: Num rows: 51 Data size: 23008 Basic stats: PARTIAL Column stats: PARTIAL |
| Select Operator |
| expressions: a (type: string), CAST( b AS decimal(6,0)) (type: decimal(6,0)), c (type: int), d (type: string), CAST( e AS decimal(3,0)) (type: decimal(3,0)) |
| outputColumnNames: _col0, _col1, _col2, _col3, _col4 |
| Statistics: Num rows: 51 Data size: 23008 Basic stats: PARTIAL Column stats: PARTIAL |
| Reduce Output Operator |
| key expressions: _col4 (type: decimal(3,0)), _bucket_number (type: string), _col0 (type: string), _col1 (type: decimal(6,0)) |
| null sort order: aaaa |
| sort order: ++++ |
| Map-reduce partition columns: _col4 (type: decimal(3,0)) |
| Statistics: Num rows: 51 Data size: 23008 Basic stats: PARTIAL Column stats: PARTIAL |
| value expressions: _col2 (type: int), _col3 (type: string) |
| Execution mode: llap |
| LLAP IO: all inputs |
| Reducer 2 |
| Execution mode: llap |
| Reduce Operator Tree: |
| Select Operator |
| expressions: KEY._col0 (type: string), KEY._col1 (type: decimal(6,0)), VALUE._col2 (type: int), VALUE._col3 (type: string), KEY._col4 (type: decimal(3,0)), KEY._bucket_number (type: string) |
| outputColumnNames: _col0, _col1, _col2, _col3, _col4, _bucket_number |
| File Output Operator |
| compressed: false |
| Dp Sort State: PARTITION_BUCKET_SORTED |
| Statistics: Num rows: 51 Data size: 23008 Basic stats: PARTIAL Column stats: PARTIAL |
| table: |
| input format: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat |
| output format: org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat |
| serde: org.apache.hadoop.hive.ql.io.orc.OrcSerde |
| name: default.t1_n147 |
| Write Type: INSERT |
| |
| Stage: Stage-2 |
| Dependency Collection |
| |
| Stage: Stage-0 |
| Move Operator |
| tables: |
| partition: |
| e |
| replace: false |
| table: |
| input format: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat |
| output format: org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat |
| serde: org.apache.hadoop.hive.ql.io.orc.OrcSerde |
| name: default.t1_n147 |
| Write Type: INSERT |
| |
| PREHOOK: query: insert overwrite table t1_n147 partition(e) select a,b,c,d,e from t1_staging |
| PREHOOK: type: QUERY |
| PREHOOK: Input: default@t1_staging |
| PREHOOK: Input: default@t1_staging@e=100 |
| PREHOOK: Output: default@t1_n147 |
| POSTHOOK: query: insert overwrite table t1_n147 partition(e) select a,b,c,d,e from t1_staging |
| POSTHOOK: type: QUERY |
| POSTHOOK: Input: default@t1_staging |
| POSTHOOK: Input: default@t1_staging@e=100 |
| POSTHOOK: Output: default@t1_n147 |
| POSTHOOK: Output: default@t1_n147@e=100 |
| POSTHOOK: Lineage: t1_n147 PARTITION(e=100).a SIMPLE [(t1_staging)t1_staging.FieldSchema(name:a, type:string, comment:null), ] |
| POSTHOOK: Lineage: t1_n147 PARTITION(e=100).b EXPRESSION [(t1_staging)t1_staging.FieldSchema(name:b, type:int, comment:null), ] |
| POSTHOOK: Lineage: t1_n147 PARTITION(e=100).c SIMPLE [(t1_staging)t1_staging.FieldSchema(name:c, type:int, comment:null), ] |
| POSTHOOK: Lineage: t1_n147 PARTITION(e=100).d SIMPLE [(t1_staging)t1_staging.FieldSchema(name:d, type:string, comment:null), ] |
| Warning: Shuffle Join MERGEJOIN[17][tables = [$hdt$_0, $hdt$_1]] in Stage 'Reducer 3' is a cross product |
| PREHOOK: query: with q1 as (select count(*) as cnt from t1_staging), |
| q2 as (select count(*) as cnt from t1_n147) |
| select q1.cnt = q2.cnt from q1 join q2 |
| PREHOOK: type: QUERY |
| PREHOOK: Input: default@t1_n147 |
| PREHOOK: Input: default@t1_n147@e=100 |
| PREHOOK: Input: default@t1_staging |
| PREHOOK: Input: default@t1_staging@e=100 |
| #### A masked pattern was here #### |
| POSTHOOK: query: with q1 as (select count(*) as cnt from t1_staging), |
| q2 as (select count(*) as cnt from t1_n147) |
| select q1.cnt = q2.cnt from q1 join q2 |
| POSTHOOK: type: QUERY |
| POSTHOOK: Input: default@t1_n147 |
| POSTHOOK: Input: default@t1_n147@e=100 |
| POSTHOOK: Input: default@t1_staging |
| POSTHOOK: Input: default@t1_staging@e=100 |
| #### A masked pattern was here #### |
| true |
| PREHOOK: query: drop table t1_staging |
| PREHOOK: type: DROPTABLE |
| PREHOOK: Input: default@t1_staging |
| PREHOOK: Output: default@t1_staging |
| POSTHOOK: query: drop table t1_staging |
| POSTHOOK: type: DROPTABLE |
| POSTHOOK: Input: default@t1_staging |
| POSTHOOK: Output: default@t1_staging |
| PREHOOK: query: drop table t1_n147 |
| PREHOOK: type: DROPTABLE |
| PREHOOK: Input: default@t1_n147 |
| PREHOOK: Output: default@t1_n147 |
| POSTHOOK: query: drop table t1_n147 |
| POSTHOOK: type: DROPTABLE |
| POSTHOOK: Input: default@t1_n147 |
| POSTHOOK: Output: default@t1_n147 |