blob: ac86f5e3e78435bef6693965cf6c742585d305af [file] [log] [blame]
PREHOOK: query: CREATE TABLE tmp_n2(c1 INT, c2 INT, c3 STRING, c4 STRING)
PREHOOK: type: CREATETABLE
PREHOOK: Output: database:default
PREHOOK: Output: default@tmp_n2
POSTHOOK: query: CREATE TABLE tmp_n2(c1 INT, c2 INT, c3 STRING, c4 STRING)
POSTHOOK: type: CREATETABLE
POSTHOOK: Output: database:default
POSTHOOK: Output: default@tmp_n2
PREHOOK: query: INSERT OVERWRITE TABLE tmp_n2
SELECT x.key, y.key, x.value, y.value FROM src x JOIN src y ON (x.key = y.key)
PREHOOK: type: QUERY
PREHOOK: Input: default@src
PREHOOK: Output: default@tmp_n2
POSTHOOK: query: INSERT OVERWRITE TABLE tmp_n2
SELECT x.key, y.key, x.value, y.value FROM src x JOIN src y ON (x.key = y.key)
POSTHOOK: type: QUERY
POSTHOOK: Input: default@src
POSTHOOK: Output: default@tmp_n2
POSTHOOK: Lineage: tmp_n2.c1 EXPRESSION [(src)x.FieldSchema(name:key, type:string, comment:default), ]
POSTHOOK: Lineage: tmp_n2.c2 EXPRESSION [(src)y.FieldSchema(name:key, type:string, comment:default), ]
POSTHOOK: Lineage: tmp_n2.c3 SIMPLE [(src)x.FieldSchema(name:value, type:string, comment:default), ]
POSTHOOK: Lineage: tmp_n2.c4 SIMPLE [(src)y.FieldSchema(name:value, type:string, comment:default), ]
PREHOOK: query: EXPLAIN
SELECT xx.key, yy.key, xx.cnt, yy.cnt
FROM
(SELECT x.c1 AS key, count(1) AS cnt FROM tmp_n2 x WHERE x.c1 < 120 GROUP BY x.c1) xx
JOIN
(SELECT x1.c2 AS key, count(1) AS cnt FROM tmp_n2 x1 WHERE x1.c2 > 100 GROUP BY x1.c2) yy
ON (xx.key = yy.key)
PREHOOK: type: QUERY
PREHOOK: Input: default@tmp_n2
#### A masked pattern was here ####
POSTHOOK: query: EXPLAIN
SELECT xx.key, yy.key, xx.cnt, yy.cnt
FROM
(SELECT x.c1 AS key, count(1) AS cnt FROM tmp_n2 x WHERE x.c1 < 120 GROUP BY x.c1) xx
JOIN
(SELECT x1.c2 AS key, count(1) AS cnt FROM tmp_n2 x1 WHERE x1.c2 > 100 GROUP BY x1.c2) yy
ON (xx.key = yy.key)
POSTHOOK: type: QUERY
POSTHOOK: Input: default@tmp_n2
#### A masked pattern was here ####
STAGE DEPENDENCIES:
Stage-1 is a root stage
Stage-0 depends on stages: Stage-1
STAGE PLANS:
Stage: Stage-1
Tez
#### A masked pattern was here ####
Edges:
Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE)
#### A masked pattern was here ####
Vertices:
Map 1
Map Operator Tree:
TableScan
alias: x
filterExpr: ((c1 < 120) and (c1 > 100)) (type: boolean)
Statistics: Num rows: 1028 Data size: 4112 Basic stats: COMPLETE Column stats: COMPLETE
Filter Operator
predicate: ((c1 < 120) and (c1 > 100)) (type: boolean)
Statistics: Num rows: 198 Data size: 792 Basic stats: COMPLETE Column stats: COMPLETE
Group By Operator
aggregations: count()
keys: c1 (type: int)
minReductionHashAggr: 0.70202017
mode: hash
outputColumnNames: _col0, _col1
Statistics: Num rows: 59 Data size: 708 Basic stats: COMPLETE Column stats: COMPLETE
Reduce Output Operator
key expressions: _col0 (type: int)
null sort order: z
sort order: +
Map-reduce partition columns: _col0 (type: int)
Statistics: Num rows: 59 Data size: 708 Basic stats: COMPLETE Column stats: COMPLETE
value expressions: _col1 (type: bigint)
Execution mode: vectorized, llap
LLAP IO: all inputs
Map 3
Map Operator Tree:
TableScan
alias: x1
filterExpr: ((c2 > 100) and (c2 < 120)) (type: boolean)
Statistics: Num rows: 1028 Data size: 4112 Basic stats: COMPLETE Column stats: COMPLETE
Filter Operator
predicate: ((c2 > 100) and (c2 < 120)) (type: boolean)
Statistics: Num rows: 198 Data size: 792 Basic stats: COMPLETE Column stats: COMPLETE
Group By Operator
aggregations: count()
keys: c2 (type: int)
minReductionHashAggr: 0.70202017
mode: hash
outputColumnNames: _col0, _col1
Statistics: Num rows: 59 Data size: 708 Basic stats: COMPLETE Column stats: COMPLETE
Reduce Output Operator
key expressions: _col0 (type: int)
null sort order: z
sort order: +
Map-reduce partition columns: _col0 (type: int)
Statistics: Num rows: 59 Data size: 708 Basic stats: COMPLETE Column stats: COMPLETE
value expressions: _col1 (type: bigint)
Execution mode: vectorized, llap
LLAP IO: all inputs
Reducer 2
Reduce Operator Tree:
Group By Operator
aggregations: count(VALUE._col0)
keys: KEY._col0 (type: int)
mode: mergepartial
outputColumnNames: _col0, _col1
Statistics: Num rows: 59 Data size: 708 Basic stats: COMPLETE Column stats: COMPLETE
Dummy Store
Execution mode: llap
Reduce Operator Tree:
Group By Operator
aggregations: count(VALUE._col0)
keys: KEY._col0 (type: int)
mode: mergepartial
outputColumnNames: _col0, _col1
Statistics: Num rows: 59 Data size: 708 Basic stats: COMPLETE Column stats: COMPLETE
Merge Join Operator
condition map:
Inner Join 0 to 1
keys:
0 _col0 (type: int)
1 _col0 (type: int)
outputColumnNames: _col0, _col1, _col2, _col3
Statistics: Num rows: 59 Data size: 1416 Basic stats: COMPLETE Column stats: COMPLETE
Select Operator
expressions: _col0 (type: int), _col2 (type: int), _col1 (type: bigint), _col3 (type: bigint)
outputColumnNames: _col0, _col1, _col2, _col3
Statistics: Num rows: 59 Data size: 1416 Basic stats: COMPLETE Column stats: COMPLETE
File Output Operator
compressed: false
Statistics: Num rows: 59 Data size: 1416 Basic stats: COMPLETE Column stats: COMPLETE
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
Stage: Stage-0
Fetch Operator
limit: -1
Processor Tree:
ListSink
PREHOOK: query: SELECT xx.key, yy.key, xx.cnt, yy.cnt
FROM
(SELECT x.c1 AS key, count(1) AS cnt FROM tmp_n2 x WHERE x.c1 < 120 GROUP BY x.c1) xx
JOIN
(SELECT x1.c2 AS key, count(1) AS cnt FROM tmp_n2 x1 WHERE x1.c2 > 100 GROUP BY x1.c2) yy
ON (xx.key = yy.key)
PREHOOK: type: QUERY
PREHOOK: Input: default@tmp_n2
#### A masked pattern was here ####
POSTHOOK: query: SELECT xx.key, yy.key, xx.cnt, yy.cnt
FROM
(SELECT x.c1 AS key, count(1) AS cnt FROM tmp_n2 x WHERE x.c1 < 120 GROUP BY x.c1) xx
JOIN
(SELECT x1.c2 AS key, count(1) AS cnt FROM tmp_n2 x1 WHERE x1.c2 > 100 GROUP BY x1.c2) yy
ON (xx.key = yy.key)
POSTHOOK: type: QUERY
POSTHOOK: Input: default@tmp_n2
#### A masked pattern was here ####
103 103 4 4
104 104 4 4
105 105 1 1
111 111 1 1
113 113 4 4
114 114 1 1
116 116 1 1
118 118 4 4
119 119 9 9
PREHOOK: query: EXPLAIN
SELECT xx.key, yy.key, xx.cnt, yy.cnt
FROM
(SELECT x.c1 AS key, count(1) AS cnt FROM tmp_n2 x WHERE x.c1 < 120 GROUP BY x.c1) xx
JOIN
(SELECT x1.c2 AS key, count(1) AS cnt FROM tmp_n2 x1 WHERE x1.c2 > 100 GROUP BY x1.c2) yy
ON (xx.key = yy.key)
PREHOOK: type: QUERY
PREHOOK: Input: default@tmp_n2
#### A masked pattern was here ####
POSTHOOK: query: EXPLAIN
SELECT xx.key, yy.key, xx.cnt, yy.cnt
FROM
(SELECT x.c1 AS key, count(1) AS cnt FROM tmp_n2 x WHERE x.c1 < 120 GROUP BY x.c1) xx
JOIN
(SELECT x1.c2 AS key, count(1) AS cnt FROM tmp_n2 x1 WHERE x1.c2 > 100 GROUP BY x1.c2) yy
ON (xx.key = yy.key)
POSTHOOK: type: QUERY
POSTHOOK: Input: default@tmp_n2
#### A masked pattern was here ####
STAGE DEPENDENCIES:
Stage-1 is a root stage
Stage-0 depends on stages: Stage-1
STAGE PLANS:
Stage: Stage-1
Tez
#### A masked pattern was here ####
Edges:
Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE)
#### A masked pattern was here ####
Vertices:
Map 1
Map Operator Tree:
TableScan
alias: x
filterExpr: ((c1 < 120) and (c1 > 100)) (type: boolean)
Statistics: Num rows: 1028 Data size: 4112 Basic stats: COMPLETE Column stats: COMPLETE
Filter Operator
predicate: ((c1 < 120) and (c1 > 100)) (type: boolean)
Statistics: Num rows: 198 Data size: 792 Basic stats: COMPLETE Column stats: COMPLETE
Group By Operator
aggregations: count()
keys: c1 (type: int)
minReductionHashAggr: 0.70202017
mode: hash
outputColumnNames: _col0, _col1
Statistics: Num rows: 59 Data size: 708 Basic stats: COMPLETE Column stats: COMPLETE
Reduce Output Operator
key expressions: _col0 (type: int)
null sort order: z
sort order: +
Map-reduce partition columns: _col0 (type: int)
Statistics: Num rows: 59 Data size: 708 Basic stats: COMPLETE Column stats: COMPLETE
value expressions: _col1 (type: bigint)
Execution mode: vectorized, llap
LLAP IO: all inputs
Map 3
Map Operator Tree:
TableScan
alias: x1
filterExpr: ((c2 > 100) and (c2 < 120)) (type: boolean)
Statistics: Num rows: 1028 Data size: 4112 Basic stats: COMPLETE Column stats: COMPLETE
Filter Operator
predicate: ((c2 > 100) and (c2 < 120)) (type: boolean)
Statistics: Num rows: 198 Data size: 792 Basic stats: COMPLETE Column stats: COMPLETE
Group By Operator
aggregations: count()
keys: c2 (type: int)
minReductionHashAggr: 0.70202017
mode: hash
outputColumnNames: _col0, _col1
Statistics: Num rows: 59 Data size: 708 Basic stats: COMPLETE Column stats: COMPLETE
Reduce Output Operator
key expressions: _col0 (type: int)
null sort order: z
sort order: +
Map-reduce partition columns: _col0 (type: int)
Statistics: Num rows: 59 Data size: 708 Basic stats: COMPLETE Column stats: COMPLETE
value expressions: _col1 (type: bigint)
Execution mode: vectorized, llap
LLAP IO: all inputs
Reducer 2
Reduce Operator Tree:
Group By Operator
aggregations: count(VALUE._col0)
keys: KEY._col0 (type: int)
mode: mergepartial
outputColumnNames: _col0, _col1
Statistics: Num rows: 59 Data size: 708 Basic stats: COMPLETE Column stats: COMPLETE
Dummy Store
Execution mode: llap
Reduce Operator Tree:
Group By Operator
aggregations: count(VALUE._col0)
keys: KEY._col0 (type: int)
mode: mergepartial
outputColumnNames: _col0, _col1
Statistics: Num rows: 59 Data size: 708 Basic stats: COMPLETE Column stats: COMPLETE
Merge Join Operator
condition map:
Inner Join 0 to 1
keys:
0 _col0 (type: int)
1 _col0 (type: int)
outputColumnNames: _col0, _col1, _col2, _col3
Statistics: Num rows: 59 Data size: 1416 Basic stats: COMPLETE Column stats: COMPLETE
Select Operator
expressions: _col0 (type: int), _col2 (type: int), _col1 (type: bigint), _col3 (type: bigint)
outputColumnNames: _col0, _col1, _col2, _col3
Statistics: Num rows: 59 Data size: 1416 Basic stats: COMPLETE Column stats: COMPLETE
File Output Operator
compressed: false
Statistics: Num rows: 59 Data size: 1416 Basic stats: COMPLETE Column stats: COMPLETE
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
Stage: Stage-0
Fetch Operator
limit: -1
Processor Tree:
ListSink
PREHOOK: query: SELECT xx.key, yy.key, xx.cnt, yy.cnt
FROM
(SELECT x.c1 AS key, count(1) AS cnt FROM tmp_n2 x WHERE x.c1 < 120 GROUP BY x.c1) xx
JOIN
(SELECT x1.c2 AS key, count(1) AS cnt FROM tmp_n2 x1 WHERE x1.c2 > 100 GROUP BY x1.c2) yy
ON (xx.key = yy.key)
PREHOOK: type: QUERY
PREHOOK: Input: default@tmp_n2
#### A masked pattern was here ####
POSTHOOK: query: SELECT xx.key, yy.key, xx.cnt, yy.cnt
FROM
(SELECT x.c1 AS key, count(1) AS cnt FROM tmp_n2 x WHERE x.c1 < 120 GROUP BY x.c1) xx
JOIN
(SELECT x1.c2 AS key, count(1) AS cnt FROM tmp_n2 x1 WHERE x1.c2 > 100 GROUP BY x1.c2) yy
ON (xx.key = yy.key)
POSTHOOK: type: QUERY
POSTHOOK: Input: default@tmp_n2
#### A masked pattern was here ####
103 103 4 4
104 104 4 4
105 105 1 1
111 111 1 1
113 113 4 4
114 114 1 1
116 116 1 1
118 118 4 4
119 119 9 9
PREHOOK: query: EXPLAIN
SELECT xx.key1, xx.key2, yy.key1, yy.key2, xx.cnt, yy.cnt
FROM
(SELECT x.c1 AS key1, x.c3 AS key2, count(1) AS cnt FROM tmp_n2 x WHERE x.c1 < 120 GROUP BY x.c1, x.c3) xx
JOIN
(SELECT x1.c1 AS key1, x1.c3 AS key2, count(1) AS cnt FROM tmp_n2 x1 WHERE x1.c2 > 100 GROUP BY x1.c1, x1.c3) yy
ON (xx.key1 = yy.key1 AND xx.key2 == yy.key2)
PREHOOK: type: QUERY
PREHOOK: Input: default@tmp_n2
#### A masked pattern was here ####
POSTHOOK: query: EXPLAIN
SELECT xx.key1, xx.key2, yy.key1, yy.key2, xx.cnt, yy.cnt
FROM
(SELECT x.c1 AS key1, x.c3 AS key2, count(1) AS cnt FROM tmp_n2 x WHERE x.c1 < 120 GROUP BY x.c1, x.c3) xx
JOIN
(SELECT x1.c1 AS key1, x1.c3 AS key2, count(1) AS cnt FROM tmp_n2 x1 WHERE x1.c2 > 100 GROUP BY x1.c1, x1.c3) yy
ON (xx.key1 = yy.key1 AND xx.key2 == yy.key2)
POSTHOOK: type: QUERY
POSTHOOK: Input: default@tmp_n2
#### A masked pattern was here ####
STAGE DEPENDENCIES:
Stage-1 is a root stage
Stage-0 depends on stages: Stage-1
STAGE PLANS:
Stage: Stage-1
Tez
#### A masked pattern was here ####
Edges:
Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE)
#### A masked pattern was here ####
Vertices:
Map 1
Map Operator Tree:
TableScan
alias: x
filterExpr: ((c1 < 120) and c3 is not null) (type: boolean)
Statistics: Num rows: 1028 Data size: 97660 Basic stats: COMPLETE Column stats: COMPLETE
Filter Operator
predicate: ((c1 < 120) and c3 is not null) (type: boolean)
Statistics: Num rows: 248 Data size: 23560 Basic stats: COMPLETE Column stats: COMPLETE
Group By Operator
aggregations: count()
keys: c1 (type: int), c3 (type: string)
minReductionHashAggr: 0.0
mode: hash
outputColumnNames: _col0, _col1, _col2
Statistics: Num rows: 124 Data size: 12772 Basic stats: COMPLETE Column stats: COMPLETE
Reduce Output Operator
key expressions: _col0 (type: int), _col1 (type: string)
null sort order: zz
sort order: ++
Map-reduce partition columns: _col0 (type: int), _col1 (type: string)
Statistics: Num rows: 124 Data size: 12772 Basic stats: COMPLETE Column stats: COMPLETE
value expressions: _col2 (type: bigint)
Execution mode: vectorized, llap
LLAP IO: all inputs
Map 3
Map Operator Tree:
TableScan
alias: x1
filterExpr: ((c2 > 100) and (c1 < 120) and c3 is not null) (type: boolean)
Statistics: Num rows: 1028 Data size: 101772 Basic stats: COMPLETE Column stats: COMPLETE
Filter Operator
predicate: ((c2 > 100) and (c1 < 120) and c3 is not null) (type: boolean)
Statistics: Num rows: 198 Data size: 19602 Basic stats: COMPLETE Column stats: COMPLETE
Select Operator
expressions: c1 (type: int), c3 (type: string)
outputColumnNames: c1, c3
Statistics: Num rows: 198 Data size: 19602 Basic stats: COMPLETE Column stats: COMPLETE
Group By Operator
aggregations: count()
keys: c1 (type: int), c3 (type: string)
minReductionHashAggr: 0.0
mode: hash
outputColumnNames: _col0, _col1, _col2
Statistics: Num rows: 99 Data size: 10197 Basic stats: COMPLETE Column stats: COMPLETE
Reduce Output Operator
key expressions: _col0 (type: int), _col1 (type: string)
null sort order: zz
sort order: ++
Map-reduce partition columns: _col0 (type: int), _col1 (type: string)
Statistics: Num rows: 99 Data size: 10197 Basic stats: COMPLETE Column stats: COMPLETE
value expressions: _col2 (type: bigint)
Execution mode: vectorized, llap
LLAP IO: all inputs
Reducer 2
Reduce Operator Tree:
Group By Operator
aggregations: count(VALUE._col0)
keys: KEY._col0 (type: int), KEY._col1 (type: string)
mode: mergepartial
outputColumnNames: _col0, _col1, _col2
Statistics: Num rows: 99 Data size: 10197 Basic stats: COMPLETE Column stats: COMPLETE
Dummy Store
Execution mode: llap
Reduce Operator Tree:
Group By Operator
aggregations: count(VALUE._col0)
keys: KEY._col0 (type: int), KEY._col1 (type: string)
mode: mergepartial
outputColumnNames: _col0, _col1, _col2
Statistics: Num rows: 124 Data size: 12772 Basic stats: COMPLETE Column stats: COMPLETE
Merge Join Operator
condition map:
Inner Join 0 to 1
keys:
0 _col0 (type: int), _col1 (type: string)
1 _col0 (type: int), _col1 (type: string)
outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5
Statistics: Num rows: 99 Data size: 20394 Basic stats: COMPLETE Column stats: COMPLETE
Select Operator
expressions: _col0 (type: int), _col1 (type: string), _col3 (type: int), _col4 (type: string), _col2 (type: bigint), _col5 (type: bigint)
outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5
Statistics: Num rows: 99 Data size: 20394 Basic stats: COMPLETE Column stats: COMPLETE
File Output Operator
compressed: false
Statistics: Num rows: 99 Data size: 20394 Basic stats: COMPLETE Column stats: COMPLETE
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
Stage: Stage-0
Fetch Operator
limit: -1
Processor Tree:
ListSink
PREHOOK: query: SELECT xx.key1, xx.key2, yy.key1, yy.key2, xx.cnt, yy.cnt
FROM
(SELECT x.c1 AS key1, x.c3 AS key2, count(1) AS cnt FROM tmp_n2 x WHERE x.c1 < 120 GROUP BY x.c1, x.c3) xx
JOIN
(SELECT x1.c1 AS key1, x1.c3 AS key2, count(1) AS cnt FROM tmp_n2 x1 WHERE x1.c2 > 100 GROUP BY x1.c1, x1.c3) yy
ON (xx.key1 = yy.key1 AND xx.key2 == yy.key2)
PREHOOK: type: QUERY
PREHOOK: Input: default@tmp_n2
#### A masked pattern was here ####
POSTHOOK: query: SELECT xx.key1, xx.key2, yy.key1, yy.key2, xx.cnt, yy.cnt
FROM
(SELECT x.c1 AS key1, x.c3 AS key2, count(1) AS cnt FROM tmp_n2 x WHERE x.c1 < 120 GROUP BY x.c1, x.c3) xx
JOIN
(SELECT x1.c1 AS key1, x1.c3 AS key2, count(1) AS cnt FROM tmp_n2 x1 WHERE x1.c2 > 100 GROUP BY x1.c1, x1.c3) yy
ON (xx.key1 = yy.key1 AND xx.key2 == yy.key2)
POSTHOOK: type: QUERY
POSTHOOK: Input: default@tmp_n2
#### A masked pattern was here ####
103 val_103 103 val_103 4 4
104 val_104 104 val_104 4 4
105 val_105 105 val_105 1 1
111 val_111 111 val_111 1 1
113 val_113 113 val_113 4 4
114 val_114 114 val_114 1 1
116 val_116 116 val_116 1 1
118 val_118 118 val_118 4 4
119 val_119 119 val_119 9 9
PREHOOK: query: EXPLAIN
SELECT xx.key1, xx.key2, yy.key1, yy.key2, xx.cnt, yy.cnt
FROM
(SELECT x.c1 AS key1, x.c3 AS key2, count(1) AS cnt FROM tmp_n2 x WHERE x.c1 < 120 GROUP BY x.c1, x.c3) xx
JOIN
(SELECT x1.c1 AS key1, x1.c3 AS key2, count(1) AS cnt FROM tmp_n2 x1 WHERE x1.c2 > 100 GROUP BY x1.c1, x1.c3) yy
ON (xx.key1 = yy.key1 AND xx.key2 == yy.key2)
PREHOOK: type: QUERY
PREHOOK: Input: default@tmp_n2
#### A masked pattern was here ####
POSTHOOK: query: EXPLAIN
SELECT xx.key1, xx.key2, yy.key1, yy.key2, xx.cnt, yy.cnt
FROM
(SELECT x.c1 AS key1, x.c3 AS key2, count(1) AS cnt FROM tmp_n2 x WHERE x.c1 < 120 GROUP BY x.c1, x.c3) xx
JOIN
(SELECT x1.c1 AS key1, x1.c3 AS key2, count(1) AS cnt FROM tmp_n2 x1 WHERE x1.c2 > 100 GROUP BY x1.c1, x1.c3) yy
ON (xx.key1 = yy.key1 AND xx.key2 == yy.key2)
POSTHOOK: type: QUERY
POSTHOOK: Input: default@tmp_n2
#### A masked pattern was here ####
STAGE DEPENDENCIES:
Stage-1 is a root stage
Stage-0 depends on stages: Stage-1
STAGE PLANS:
Stage: Stage-1
Tez
#### A masked pattern was here ####
Edges:
Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE)
#### A masked pattern was here ####
Vertices:
Map 1
Map Operator Tree:
TableScan
alias: x
filterExpr: ((c1 < 120) and c3 is not null) (type: boolean)
Statistics: Num rows: 1028 Data size: 97660 Basic stats: COMPLETE Column stats: COMPLETE
Filter Operator
predicate: ((c1 < 120) and c3 is not null) (type: boolean)
Statistics: Num rows: 248 Data size: 23560 Basic stats: COMPLETE Column stats: COMPLETE
Group By Operator
aggregations: count()
keys: c1 (type: int), c3 (type: string)
minReductionHashAggr: 0.0
mode: hash
outputColumnNames: _col0, _col1, _col2
Statistics: Num rows: 124 Data size: 12772 Basic stats: COMPLETE Column stats: COMPLETE
Reduce Output Operator
key expressions: _col0 (type: int), _col1 (type: string)
null sort order: zz
sort order: ++
Map-reduce partition columns: _col0 (type: int), _col1 (type: string)
Statistics: Num rows: 124 Data size: 12772 Basic stats: COMPLETE Column stats: COMPLETE
value expressions: _col2 (type: bigint)
Execution mode: vectorized, llap
LLAP IO: all inputs
Map 3
Map Operator Tree:
TableScan
alias: x1
filterExpr: ((c2 > 100) and (c1 < 120) and c3 is not null) (type: boolean)
Statistics: Num rows: 1028 Data size: 101772 Basic stats: COMPLETE Column stats: COMPLETE
Filter Operator
predicate: ((c2 > 100) and (c1 < 120) and c3 is not null) (type: boolean)
Statistics: Num rows: 198 Data size: 19602 Basic stats: COMPLETE Column stats: COMPLETE
Select Operator
expressions: c1 (type: int), c3 (type: string)
outputColumnNames: c1, c3
Statistics: Num rows: 198 Data size: 19602 Basic stats: COMPLETE Column stats: COMPLETE
Group By Operator
aggregations: count()
keys: c1 (type: int), c3 (type: string)
minReductionHashAggr: 0.0
mode: hash
outputColumnNames: _col0, _col1, _col2
Statistics: Num rows: 99 Data size: 10197 Basic stats: COMPLETE Column stats: COMPLETE
Reduce Output Operator
key expressions: _col0 (type: int), _col1 (type: string)
null sort order: zz
sort order: ++
Map-reduce partition columns: _col0 (type: int), _col1 (type: string)
Statistics: Num rows: 99 Data size: 10197 Basic stats: COMPLETE Column stats: COMPLETE
value expressions: _col2 (type: bigint)
Execution mode: vectorized, llap
LLAP IO: all inputs
Reducer 2
Reduce Operator Tree:
Group By Operator
aggregations: count(VALUE._col0)
keys: KEY._col0 (type: int), KEY._col1 (type: string)
mode: mergepartial
outputColumnNames: _col0, _col1, _col2
Statistics: Num rows: 99 Data size: 10197 Basic stats: COMPLETE Column stats: COMPLETE
Dummy Store
Execution mode: llap
Reduce Operator Tree:
Group By Operator
aggregations: count(VALUE._col0)
keys: KEY._col0 (type: int), KEY._col1 (type: string)
mode: mergepartial
outputColumnNames: _col0, _col1, _col2
Statistics: Num rows: 124 Data size: 12772 Basic stats: COMPLETE Column stats: COMPLETE
Merge Join Operator
condition map:
Inner Join 0 to 1
keys:
0 _col0 (type: int), _col1 (type: string)
1 _col0 (type: int), _col1 (type: string)
outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5
Statistics: Num rows: 99 Data size: 20394 Basic stats: COMPLETE Column stats: COMPLETE
Select Operator
expressions: _col0 (type: int), _col1 (type: string), _col3 (type: int), _col4 (type: string), _col2 (type: bigint), _col5 (type: bigint)
outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5
Statistics: Num rows: 99 Data size: 20394 Basic stats: COMPLETE Column stats: COMPLETE
File Output Operator
compressed: false
Statistics: Num rows: 99 Data size: 20394 Basic stats: COMPLETE Column stats: COMPLETE
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
Stage: Stage-0
Fetch Operator
limit: -1
Processor Tree:
ListSink
PREHOOK: query: SELECT xx.key1, xx.key2, yy.key1, yy.key2, xx.cnt, yy.cnt
FROM
(SELECT x.c1 AS key1, x.c3 AS key2, count(1) AS cnt FROM tmp_n2 x WHERE x.c1 < 120 GROUP BY x.c1, x.c3) xx
JOIN
(SELECT x1.c1 AS key1, x1.c3 AS key2, count(1) AS cnt FROM tmp_n2 x1 WHERE x1.c2 > 100 GROUP BY x1.c1, x1.c3) yy
ON (xx.key1 = yy.key1 AND xx.key2 == yy.key2)
PREHOOK: type: QUERY
PREHOOK: Input: default@tmp_n2
#### A masked pattern was here ####
POSTHOOK: query: SELECT xx.key1, xx.key2, yy.key1, yy.key2, xx.cnt, yy.cnt
FROM
(SELECT x.c1 AS key1, x.c3 AS key2, count(1) AS cnt FROM tmp_n2 x WHERE x.c1 < 120 GROUP BY x.c1, x.c3) xx
JOIN
(SELECT x1.c1 AS key1, x1.c3 AS key2, count(1) AS cnt FROM tmp_n2 x1 WHERE x1.c2 > 100 GROUP BY x1.c1, x1.c3) yy
ON (xx.key1 = yy.key1 AND xx.key2 == yy.key2)
POSTHOOK: type: QUERY
POSTHOOK: Input: default@tmp_n2
#### A masked pattern was here ####
103 val_103 103 val_103 4 4
104 val_104 104 val_104 4 4
105 val_105 105 val_105 1 1
111 val_111 111 val_111 1 1
113 val_113 113 val_113 4 4
114 val_114 114 val_114 1 1
116 val_116 116 val_116 1 1
118 val_118 118 val_118 4 4
119 val_119 119 val_119 9 9