blob: 6768c57da4979081dd31c521c36be9c383bcba18 [file] [log] [blame]
PREHOOK: query: create table vsmb_bucket_1(key int, value string)
CLUSTERED BY (key)
SORTED BY (key) INTO 1 BUCKETS
STORED AS ORC
PREHOOK: type: CREATETABLE
PREHOOK: Output: database:default
PREHOOK: Output: default@vsmb_bucket_1
POSTHOOK: query: create table vsmb_bucket_1(key int, value string)
CLUSTERED BY (key)
SORTED BY (key) INTO 1 BUCKETS
STORED AS ORC
POSTHOOK: type: CREATETABLE
POSTHOOK: Output: database:default
POSTHOOK: Output: default@vsmb_bucket_1
PREHOOK: query: create table vsmb_bucket_2(key int, value string)
CLUSTERED BY (key)
SORTED BY (key) INTO 1 BUCKETS
STORED AS ORC
PREHOOK: type: CREATETABLE
PREHOOK: Output: database:default
PREHOOK: Output: default@vsmb_bucket_2
POSTHOOK: query: create table vsmb_bucket_2(key int, value string)
CLUSTERED BY (key)
SORTED BY (key) INTO 1 BUCKETS
STORED AS ORC
POSTHOOK: type: CREATETABLE
POSTHOOK: Output: database:default
POSTHOOK: Output: default@vsmb_bucket_2
PREHOOK: query: create table vsmb_bucket_RC(key int, value string)
CLUSTERED BY (key)
SORTED BY (key) INTO 1 BUCKETS
STORED AS RCFILE
PREHOOK: type: CREATETABLE
PREHOOK: Output: database:default
PREHOOK: Output: default@vsmb_bucket_RC
POSTHOOK: query: create table vsmb_bucket_RC(key int, value string)
CLUSTERED BY (key)
SORTED BY (key) INTO 1 BUCKETS
STORED AS RCFILE
POSTHOOK: type: CREATETABLE
POSTHOOK: Output: database:default
POSTHOOK: Output: default@vsmb_bucket_RC
PREHOOK: query: create table vsmb_bucket_TXT(key int, value string)
CLUSTERED BY (key)
SORTED BY (key) INTO 1 BUCKETS
STORED AS TEXTFILE
PREHOOK: type: CREATETABLE
PREHOOK: Output: database:default
PREHOOK: Output: default@vsmb_bucket_TXT
POSTHOOK: query: create table vsmb_bucket_TXT(key int, value string)
CLUSTERED BY (key)
SORTED BY (key) INTO 1 BUCKETS
STORED AS TEXTFILE
POSTHOOK: type: CREATETABLE
POSTHOOK: Output: database:default
POSTHOOK: Output: default@vsmb_bucket_TXT
PREHOOK: query: insert into table vsmb_bucket_1 select cint, cstring1 from alltypesorc limit 2
PREHOOK: type: QUERY
PREHOOK: Input: default@alltypesorc
PREHOOK: Output: default@vsmb_bucket_1
POSTHOOK: query: insert into table vsmb_bucket_1 select cint, cstring1 from alltypesorc limit 2
POSTHOOK: type: QUERY
POSTHOOK: Input: default@alltypesorc
POSTHOOK: Output: default@vsmb_bucket_1
POSTHOOK: Lineage: vsmb_bucket_1.key SIMPLE [(alltypesorc)alltypesorc.FieldSchema(name:cint, type:int, comment:null), ]
POSTHOOK: Lineage: vsmb_bucket_1.value SIMPLE [(alltypesorc)alltypesorc.FieldSchema(name:cstring1, type:string, comment:null), ]
PREHOOK: query: insert into table vsmb_bucket_2 select cint, cstring1 from alltypesorc limit 2
PREHOOK: type: QUERY
PREHOOK: Input: default@alltypesorc
PREHOOK: Output: default@vsmb_bucket_2
POSTHOOK: query: insert into table vsmb_bucket_2 select cint, cstring1 from alltypesorc limit 2
POSTHOOK: type: QUERY
POSTHOOK: Input: default@alltypesorc
POSTHOOK: Output: default@vsmb_bucket_2
POSTHOOK: Lineage: vsmb_bucket_2.key SIMPLE [(alltypesorc)alltypesorc.FieldSchema(name:cint, type:int, comment:null), ]
POSTHOOK: Lineage: vsmb_bucket_2.value SIMPLE [(alltypesorc)alltypesorc.FieldSchema(name:cstring1, type:string, comment:null), ]
PREHOOK: query: insert into table vsmb_bucket_RC select cint, cstring1 from alltypesorc limit 2
PREHOOK: type: QUERY
PREHOOK: Input: default@alltypesorc
PREHOOK: Output: default@vsmb_bucket_rc
POSTHOOK: query: insert into table vsmb_bucket_RC select cint, cstring1 from alltypesorc limit 2
POSTHOOK: type: QUERY
POSTHOOK: Input: default@alltypesorc
POSTHOOK: Output: default@vsmb_bucket_rc
POSTHOOK: Lineage: vsmb_bucket_rc.key SIMPLE [(alltypesorc)alltypesorc.FieldSchema(name:cint, type:int, comment:null), ]
POSTHOOK: Lineage: vsmb_bucket_rc.value SIMPLE [(alltypesorc)alltypesorc.FieldSchema(name:cstring1, type:string, comment:null), ]
PREHOOK: query: insert into table vsmb_bucket_TXT select cint, cstring1 from alltypesorc limit 2
PREHOOK: type: QUERY
PREHOOK: Input: default@alltypesorc
PREHOOK: Output: default@vsmb_bucket_txt
POSTHOOK: query: insert into table vsmb_bucket_TXT select cint, cstring1 from alltypesorc limit 2
POSTHOOK: type: QUERY
POSTHOOK: Input: default@alltypesorc
POSTHOOK: Output: default@vsmb_bucket_txt
POSTHOOK: Lineage: vsmb_bucket_txt.key SIMPLE [(alltypesorc)alltypesorc.FieldSchema(name:cint, type:int, comment:null), ]
POSTHOOK: Lineage: vsmb_bucket_txt.value SIMPLE [(alltypesorc)alltypesorc.FieldSchema(name:cstring1, type:string, comment:null), ]
PREHOOK: query: explain vectorization expression
select /*+MAPJOIN(a)*/ * from vsmb_bucket_1 a join vsmb_bucket_2 b on a.key = b.key
PREHOOK: type: QUERY
POSTHOOK: query: explain vectorization expression
select /*+MAPJOIN(a)*/ * from vsmb_bucket_1 a join vsmb_bucket_2 b on a.key = b.key
POSTHOOK: type: QUERY
PLAN VECTORIZATION:
enabled: true
enabledConditionsMet: [hive.vectorized.execution.enabled IS true]
STAGE DEPENDENCIES:
Stage-1 is a root stage
Stage-0 depends on stages: Stage-1
STAGE PLANS:
Stage: Stage-1
Map Reduce
Map Operator Tree:
TableScan
alias: b
Statistics: Num rows: 2 Data size: 208 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: key is not null (type: boolean)
Statistics: Num rows: 2 Data size: 208 Basic stats: COMPLETE Column stats: NONE
Sorted Merge Bucket Map Join Operator
condition map:
Inner Join 0 to 1
keys:
0 key (type: int)
1 key (type: int)
outputColumnNames: _col0, _col1, _col5, _col6
Select Operator
expressions: _col0 (type: int), _col1 (type: string), _col5 (type: int), _col6 (type: string)
outputColumnNames: _col0, _col1, _col2, _col3
File Output Operator
compressed: false
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
Map Vectorization:
enabled: true
enabledConditionsMet: hive.vectorized.use.vectorized.input.format IS true
inputFileFormats: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat
notVectorizedReason: MAPJOIN operator: FilterMaps not supported for Vector Pass-Thru SMB MapJoin
vectorized: false
Stage: Stage-0
Fetch Operator
limit: -1
Processor Tree:
ListSink
PREHOOK: query: select /*+MAPJOIN(a)*/ * from vsmb_bucket_1 a join vsmb_bucket_2 b on a.key = b.key
PREHOOK: type: QUERY
PREHOOK: Input: default@vsmb_bucket_1
PREHOOK: Input: default@vsmb_bucket_2
#### A masked pattern was here ####
POSTHOOK: query: select /*+MAPJOIN(a)*/ * from vsmb_bucket_1 a join vsmb_bucket_2 b on a.key = b.key
POSTHOOK: type: QUERY
POSTHOOK: Input: default@vsmb_bucket_1
POSTHOOK: Input: default@vsmb_bucket_2
#### A masked pattern was here ####
528534767 cvLH6Eat2yFsyy7p 528534767 cvLH6Eat2yFsyy7p
528534767 cvLH6Eat2yFsyy7p 528534767 cvLH6Eat2yFsyy7p
528534767 cvLH6Eat2yFsyy7p 528534767 cvLH6Eat2yFsyy7p
528534767 cvLH6Eat2yFsyy7p 528534767 cvLH6Eat2yFsyy7p
PREHOOK: query: explain vectorization expression
select /*+MAPJOIN(b)*/ * from vsmb_bucket_1 a join vsmb_bucket_RC b on a.key = b.key
PREHOOK: type: QUERY
POSTHOOK: query: explain vectorization expression
select /*+MAPJOIN(b)*/ * from vsmb_bucket_1 a join vsmb_bucket_RC b on a.key = b.key
POSTHOOK: type: QUERY
PLAN VECTORIZATION:
enabled: true
enabledConditionsMet: [hive.vectorized.execution.enabled IS true]
STAGE DEPENDENCIES:
Stage-1 is a root stage
Stage-0 depends on stages: Stage-1
STAGE PLANS:
Stage: Stage-1
Map Reduce
Map Operator Tree:
TableScan
alias: a
Statistics: Num rows: 2 Data size: 208 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: key is not null (type: boolean)
Statistics: Num rows: 2 Data size: 208 Basic stats: COMPLETE Column stats: NONE
Sorted Merge Bucket Map Join Operator
condition map:
Inner Join 0 to 1
keys:
0 key (type: int)
1 key (type: int)
outputColumnNames: _col0, _col1, _col5, _col6
Select Operator
expressions: _col0 (type: int), _col1 (type: string), _col5 (type: int), _col6 (type: string)
outputColumnNames: _col0, _col1, _col2, _col3
File Output Operator
compressed: false
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
Map Vectorization:
enabled: true
enabledConditionsMet: hive.vectorized.use.vectorized.input.format IS true
inputFileFormats: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat
notVectorizedReason: MAPJOIN operator: FilterMaps not supported for Vector Pass-Thru SMB MapJoin
vectorized: false
Stage: Stage-0
Fetch Operator
limit: -1
Processor Tree:
ListSink
PREHOOK: query: select /*+MAPJOIN(b)*/ * from vsmb_bucket_1 a join vsmb_bucket_RC b on a.key = b.key
PREHOOK: type: QUERY
PREHOOK: Input: default@vsmb_bucket_1
PREHOOK: Input: default@vsmb_bucket_rc
#### A masked pattern was here ####
POSTHOOK: query: select /*+MAPJOIN(b)*/ * from vsmb_bucket_1 a join vsmb_bucket_RC b on a.key = b.key
POSTHOOK: type: QUERY
POSTHOOK: Input: default@vsmb_bucket_1
POSTHOOK: Input: default@vsmb_bucket_rc
#### A masked pattern was here ####
528534767 cvLH6Eat2yFsyy7p 528534767 cvLH6Eat2yFsyy7p
528534767 cvLH6Eat2yFsyy7p 528534767 cvLH6Eat2yFsyy7p
528534767 cvLH6Eat2yFsyy7p 528534767 cvLH6Eat2yFsyy7p
528534767 cvLH6Eat2yFsyy7p 528534767 cvLH6Eat2yFsyy7p
PREHOOK: query: explain vectorization expression
select /*+MAPJOIN(b)*/ * from vsmb_bucket_1 a join vsmb_bucket_TXT b on a.key = b.key
PREHOOK: type: QUERY
POSTHOOK: query: explain vectorization expression
select /*+MAPJOIN(b)*/ * from vsmb_bucket_1 a join vsmb_bucket_TXT b on a.key = b.key
POSTHOOK: type: QUERY
PLAN VECTORIZATION:
enabled: true
enabledConditionsMet: [hive.vectorized.execution.enabled IS true]
STAGE DEPENDENCIES:
Stage-1 is a root stage
Stage-0 depends on stages: Stage-1
STAGE PLANS:
Stage: Stage-1
Map Reduce
Map Operator Tree:
TableScan
alias: a
Statistics: Num rows: 2 Data size: 208 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: key is not null (type: boolean)
Statistics: Num rows: 2 Data size: 208 Basic stats: COMPLETE Column stats: NONE
Sorted Merge Bucket Map Join Operator
condition map:
Inner Join 0 to 1
keys:
0 key (type: int)
1 key (type: int)
outputColumnNames: _col0, _col1, _col5, _col6
Select Operator
expressions: _col0 (type: int), _col1 (type: string), _col5 (type: int), _col6 (type: string)
outputColumnNames: _col0, _col1, _col2, _col3
File Output Operator
compressed: false
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
Map Vectorization:
enabled: true
enabledConditionsMet: hive.vectorized.use.vectorized.input.format IS true
inputFileFormats: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat
notVectorizedReason: MAPJOIN operator: FilterMaps not supported for Vector Pass-Thru SMB MapJoin
vectorized: false
Stage: Stage-0
Fetch Operator
limit: -1
Processor Tree:
ListSink
PREHOOK: query: select /*+MAPJOIN(b)*/ * from vsmb_bucket_1 a join vsmb_bucket_TXT b on a.key = b.key
PREHOOK: type: QUERY
PREHOOK: Input: default@vsmb_bucket_1
PREHOOK: Input: default@vsmb_bucket_txt
#### A masked pattern was here ####
POSTHOOK: query: select /*+MAPJOIN(b)*/ * from vsmb_bucket_1 a join vsmb_bucket_TXT b on a.key = b.key
POSTHOOK: type: QUERY
POSTHOOK: Input: default@vsmb_bucket_1
POSTHOOK: Input: default@vsmb_bucket_txt
#### A masked pattern was here ####
528534767 cvLH6Eat2yFsyy7p 528534767 cvLH6Eat2yFsyy7p
528534767 cvLH6Eat2yFsyy7p 528534767 cvLH6Eat2yFsyy7p
528534767 cvLH6Eat2yFsyy7p 528534767 cvLH6Eat2yFsyy7p
528534767 cvLH6Eat2yFsyy7p 528534767 cvLH6Eat2yFsyy7p