blob: cc49fd37ea9ef075d87e68ce99eb01339a0257a6 [file] [log] [blame]
PREHOOK: query: create table `masking_test_n5` as select cast(key as int) as key, value from src
PREHOOK: type: CREATETABLE_AS_SELECT
PREHOOK: Input: default@src
PREHOOK: Output: database:default
PREHOOK: Output: default@masking_test_n5
POSTHOOK: query: create table `masking_test_n5` as select cast(key as int) as key, value from src
POSTHOOK: type: CREATETABLE_AS_SELECT
POSTHOOK: Input: default@src
POSTHOOK: Output: database:default
POSTHOOK: Output: default@masking_test_n5
POSTHOOK: Lineage: masking_test_n5.key EXPRESSION [(src)src.FieldSchema(name:key, type:string, comment:default), ]
POSTHOOK: Lineage: masking_test_n5.value SIMPLE [(src)src.FieldSchema(name:value, type:string, comment:default), ]
PREHOOK: query: create view `v0` as select * from `masking_test_n5`
PREHOOK: type: CREATEVIEW
PREHOOK: Input: default@masking_test_n5
PREHOOK: Output: database:default
PREHOOK: Output: default@v0
POSTHOOK: query: create view `v0` as select * from `masking_test_n5`
POSTHOOK: type: CREATEVIEW
POSTHOOK: Input: default@masking_test_n5
POSTHOOK: Output: database:default
POSTHOOK: Output: default@v0
POSTHOOK: Lineage: v0.key SIMPLE [(masking_test_n5)masking_test_n5.FieldSchema(name:key, type:int, comment:null), ]
POSTHOOK: Lineage: v0.value SIMPLE [(masking_test_n5)masking_test_n5.FieldSchema(name:value, type:string, comment:null), ]
PREHOOK: query: explain
select * from `v0`
PREHOOK: type: QUERY
POSTHOOK: query: explain
select * from `v0`
POSTHOOK: type: QUERY
STAGE DEPENDENCIES:
Stage-1 is a root stage
Stage-0 depends on stages: Stage-1
STAGE PLANS:
Stage: Stage-1
Map Reduce
Map Operator Tree:
TableScan
alias: masking_test_n5
properties:
insideView TRUE
Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: (((key % 2) = 0) and (key < 10)) (type: boolean)
Statistics: Num rows: 83 Data size: 881 Basic stats: COMPLETE Column stats: NONE
Select Operator
expressions: key (type: int), reverse(value) (type: string)
outputColumnNames: _col0, _col1
Statistics: Num rows: 83 Data size: 881 Basic stats: COMPLETE Column stats: NONE
File Output Operator
compressed: false
Statistics: Num rows: 83 Data size: 881 Basic stats: COMPLETE Column stats: NONE
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
Execution mode: vectorized
Stage: Stage-0
Fetch Operator
limit: -1
Processor Tree:
ListSink
PREHOOK: query: select * from `v0`
PREHOOK: type: QUERY
PREHOOK: Input: default@masking_test_n5
PREHOOK: Input: default@v0
#### A masked pattern was here ####
POSTHOOK: query: select * from `v0`
POSTHOOK: type: QUERY
POSTHOOK: Input: default@masking_test_n5
POSTHOOK: Input: default@v0
#### A masked pattern was here ####
0 0_lav
4 4_lav
8 8_lav
0 0_lav
0 0_lav
2 2_lav
PREHOOK: query: create table `masking_test_subq_n1` as select cast(key as int) as key, value from src
PREHOOK: type: CREATETABLE_AS_SELECT
PREHOOK: Input: default@src
PREHOOK: Output: database:default
PREHOOK: Output: default@masking_test_subq_n1
POSTHOOK: query: create table `masking_test_subq_n1` as select cast(key as int) as key, value from src
POSTHOOK: type: CREATETABLE_AS_SELECT
POSTHOOK: Input: default@src
POSTHOOK: Output: database:default
POSTHOOK: Output: default@masking_test_subq_n1
POSTHOOK: Lineage: masking_test_subq_n1.key EXPRESSION [(src)src.FieldSchema(name:key, type:string, comment:default), ]
POSTHOOK: Lineage: masking_test_subq_n1.value SIMPLE [(src)src.FieldSchema(name:value, type:string, comment:default), ]
PREHOOK: query: create view `v1_n9` as select * from `masking_test_subq_n1`
PREHOOK: type: CREATEVIEW
PREHOOK: Input: default@masking_test_subq_n1
PREHOOK: Output: database:default
PREHOOK: Output: default@v1_n9
POSTHOOK: query: create view `v1_n9` as select * from `masking_test_subq_n1`
POSTHOOK: type: CREATEVIEW
POSTHOOK: Input: default@masking_test_subq_n1
POSTHOOK: Output: database:default
POSTHOOK: Output: default@v1_n9
POSTHOOK: Lineage: v1_n9.key SIMPLE [(masking_test_subq_n1)masking_test_subq_n1.FieldSchema(name:key, type:int, comment:null), ]
POSTHOOK: Lineage: v1_n9.value SIMPLE [(masking_test_subq_n1)masking_test_subq_n1.FieldSchema(name:value, type:string, comment:null), ]
PREHOOK: query: explain
select * from `v1_n9`
limit 20
PREHOOK: type: QUERY
POSTHOOK: query: explain
select * from `v1_n9`
limit 20
POSTHOOK: type: QUERY
STAGE DEPENDENCIES:
Stage-3 is a root stage
Stage-2 depends on stages: Stage-3
Stage-1 depends on stages: Stage-2
Stage-0 depends on stages: Stage-1
STAGE PLANS:
Stage: Stage-3
Map Reduce
Map Operator Tree:
TableScan
alias: masking_test_subq_n1
properties:
insideView TRUE
Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: key is not null (type: boolean)
Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE
Group By Operator
keys: key (type: int)
mode: hash
outputColumnNames: _col0
Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE
Reduce Output Operator
key expressions: _col0 (type: int)
sort order: +
Map-reduce partition columns: _col0 (type: int)
Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE
Execution mode: vectorized
Reduce Operator Tree:
Group By Operator
keys: KEY._col0 (type: int)
mode: mergepartial
outputColumnNames: _col0
Statistics: Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE
File Output Operator
compressed: false
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
serde: org.apache.hadoop.hive.serde2.lazybinary.LazyBinarySerDe
Stage: Stage-2
Map Reduce
Map Operator Tree:
TableScan
alias: src
Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: key is not null (type: boolean)
Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE
Select Operator
expressions: key (type: string)
outputColumnNames: _col0
Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE
Reduce Output Operator
key expressions: UDFToDouble(_col0) (type: double)
sort order: +
Map-reduce partition columns: UDFToDouble(_col0) (type: double)
Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE
value expressions: _col0 (type: string)
TableScan
Reduce Output Operator
key expressions: UDFToDouble(_col0) (type: double)
sort order: +
Map-reduce partition columns: UDFToDouble(_col0) (type: double)
Statistics: Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE
value expressions: _col0 (type: int)
Reduce Operator Tree:
Join Operator
condition map:
Inner Join 0 to 1
keys:
0 UDFToDouble(_col0) (type: double)
1 UDFToDouble(_col0) (type: double)
outputColumnNames: _col0, _col1
Statistics: Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE
Group By Operator
keys: _col0 (type: string), _col1 (type: int)
mode: hash
outputColumnNames: _col0, _col1
Statistics: Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE
File Output Operator
compressed: false
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
serde: org.apache.hadoop.hive.serde2.lazybinary.LazyBinarySerDe
Stage: Stage-1
Map Reduce
Map Operator Tree:
TableScan
alias: masking_test_subq_n1
properties:
insideView TRUE
Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: key is not null (type: boolean)
Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE
Select Operator
expressions: key (type: int), value (type: string)
outputColumnNames: _col0, _col1
Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE
Reduce Output Operator
key expressions: UDFToDouble(_col0) (type: double), _col0 (type: int)
sort order: ++
Map-reduce partition columns: UDFToDouble(_col0) (type: double), _col0 (type: int)
Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE
value expressions: _col1 (type: string)
TableScan
Reduce Output Operator
key expressions: UDFToDouble(_col0) (type: double), _col1 (type: int)
sort order: ++
Map-reduce partition columns: UDFToDouble(_col0) (type: double), _col1 (type: int)
Statistics: Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE
Reduce Operator Tree:
Join Operator
condition map:
Left Semi Join 0 to 1
keys:
0 UDFToDouble(_col0) (type: double), _col0 (type: int)
1 UDFToDouble(_col0) (type: double), _col1 (type: int)
outputColumnNames: _col0, _col1
Statistics: Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE
Limit
Number of rows: 20
Statistics: Num rows: 20 Data size: 200 Basic stats: COMPLETE Column stats: NONE
File Output Operator
compressed: false
Statistics: Num rows: 20 Data size: 200 Basic stats: COMPLETE Column stats: NONE
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
Stage: Stage-0
Fetch Operator
limit: 20
Processor Tree:
ListSink
PREHOOK: query: select * from `v1_n9`
limit 20
PREHOOK: type: QUERY
PREHOOK: Input: default@masking_test_subq_n1
PREHOOK: Input: default@src
PREHOOK: Input: default@v1_n9
#### A masked pattern was here ####
POSTHOOK: query: select * from `v1_n9`
limit 20
POSTHOOK: type: QUERY
POSTHOOK: Input: default@masking_test_subq_n1
POSTHOOK: Input: default@src
POSTHOOK: Input: default@v1_n9
#### A masked pattern was here ####
0 val_0
0 val_0
0 val_0
2 val_2
4 val_4
5 val_5
5 val_5
5 val_5
8 val_8
9 val_9
10 val_10
11 val_11
12 val_12
12 val_12
15 val_15
15 val_15
17 val_17
18 val_18
18 val_18
19 val_19
PREHOOK: query: create view `masking_test_view` as select key from `v0`
PREHOOK: type: CREATEVIEW
PREHOOK: Input: default@masking_test_n5
PREHOOK: Input: default@v0
PREHOOK: Output: database:default
PREHOOK: Output: default@masking_test_view
POSTHOOK: query: create view `masking_test_view` as select key from `v0`
POSTHOOK: type: CREATEVIEW
POSTHOOK: Input: default@masking_test_n5
POSTHOOK: Input: default@v0
POSTHOOK: Output: database:default
POSTHOOK: Output: default@masking_test_view
POSTHOOK: Lineage: masking_test_view.key SIMPLE [(masking_test_n5)masking_test_n5.FieldSchema(name:key, type:int, comment:null), ]
PREHOOK: query: explain
select key from `masking_test_view`
PREHOOK: type: QUERY
POSTHOOK: query: explain
select key from `masking_test_view`
POSTHOOK: type: QUERY
STAGE DEPENDENCIES:
Stage-1 is a root stage
Stage-0 depends on stages: Stage-1
STAGE PLANS:
Stage: Stage-1
Map Reduce
Map Operator Tree:
TableScan
alias: masking_test_n5
properties:
insideView TRUE
Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: (((key % 2) = 0) and (key < 10) and (key > 6)) (type: boolean)
Statistics: Num rows: 27 Data size: 286 Basic stats: COMPLETE Column stats: NONE
Select Operator
expressions: UDFToInteger((UDFToDouble(key) / 2.0D)) (type: int)
outputColumnNames: _col0
Statistics: Num rows: 27 Data size: 286 Basic stats: COMPLETE Column stats: NONE
File Output Operator
compressed: false
Statistics: Num rows: 27 Data size: 286 Basic stats: COMPLETE Column stats: NONE
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
Execution mode: vectorized
Stage: Stage-0
Fetch Operator
limit: -1
Processor Tree:
ListSink
PREHOOK: query: select key from `masking_test_view`
PREHOOK: type: QUERY
PREHOOK: Input: default@masking_test_n5
PREHOOK: Input: default@masking_test_view
PREHOOK: Input: default@v0
#### A masked pattern was here ####
POSTHOOK: query: select key from `masking_test_view`
POSTHOOK: type: QUERY
POSTHOOK: Input: default@masking_test_n5
POSTHOOK: Input: default@masking_test_view
POSTHOOK: Input: default@v0
#### A masked pattern was here ####
4
PREHOOK: query: explain
select `v0`.value from `v0` join `masking_test_view` on `v0`.key = `masking_test_view`.key
PREHOOK: type: QUERY
POSTHOOK: query: explain
select `v0`.value from `v0` join `masking_test_view` on `v0`.key = `masking_test_view`.key
POSTHOOK: type: QUERY
STAGE DEPENDENCIES:
Stage-1 is a root stage
Stage-0 depends on stages: Stage-1
STAGE PLANS:
Stage: Stage-1
Map Reduce
Map Operator Tree:
TableScan
alias: masking_test_n5
properties:
insideView TRUE
Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: (((key % 2) = 0) and (key < 10)) (type: boolean)
Statistics: Num rows: 83 Data size: 881 Basic stats: COMPLETE Column stats: NONE
Select Operator
expressions: key (type: int), reverse(value) (type: string)
outputColumnNames: _col0, _col1
Statistics: Num rows: 83 Data size: 881 Basic stats: COMPLETE Column stats: NONE
Reduce Output Operator
key expressions: _col0 (type: int)
sort order: +
Map-reduce partition columns: _col0 (type: int)
Statistics: Num rows: 83 Data size: 881 Basic stats: COMPLETE Column stats: NONE
value expressions: _col1 (type: string)
TableScan
alias: masking_test_n5
properties:
insideView TRUE
Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: (((UDFToInteger((UDFToDouble(key) / 2.0D)) % 2) = 0) and ((key % 2) = 0) and (UDFToInteger((UDFToDouble(key) / 2.0D)) < 10) and (key < 10) and (key > 6)) (type: boolean)
Statistics: Num rows: 4 Data size: 42 Basic stats: COMPLETE Column stats: NONE
Select Operator
expressions: UDFToInteger((UDFToDouble(key) / 2.0D)) (type: int)
outputColumnNames: _col0
Statistics: Num rows: 4 Data size: 42 Basic stats: COMPLETE Column stats: NONE
Reduce Output Operator
key expressions: _col0 (type: int)
sort order: +
Map-reduce partition columns: _col0 (type: int)
Statistics: Num rows: 4 Data size: 42 Basic stats: COMPLETE Column stats: NONE
Reduce Operator Tree:
Join Operator
condition map:
Inner Join 0 to 1
keys:
0 _col0 (type: int)
1 _col0 (type: int)
outputColumnNames: _col1
Statistics: Num rows: 91 Data size: 969 Basic stats: COMPLETE Column stats: NONE
Select Operator
expressions: _col1 (type: string)
outputColumnNames: _col0
Statistics: Num rows: 91 Data size: 969 Basic stats: COMPLETE Column stats: NONE
File Output Operator
compressed: false
Statistics: Num rows: 91 Data size: 969 Basic stats: COMPLETE Column stats: NONE
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
Stage: Stage-0
Fetch Operator
limit: -1
Processor Tree:
ListSink
PREHOOK: query: select `v0`.value from `v0` join `masking_test_view` on `v0`.key = `masking_test_view`.key
PREHOOK: type: QUERY
PREHOOK: Input: default@masking_test_n5
PREHOOK: Input: default@masking_test_view
PREHOOK: Input: default@v0
#### A masked pattern was here ####
POSTHOOK: query: select `v0`.value from `v0` join `masking_test_view` on `v0`.key = `masking_test_view`.key
POSTHOOK: type: QUERY
POSTHOOK: Input: default@masking_test_n5
POSTHOOK: Input: default@masking_test_view
POSTHOOK: Input: default@v0
#### A masked pattern was here ####
4_lav