blob: 01bb188b8b0bf30a0055045f76c3a7ac59185550 [file] [log] [blame]
PREHOOK: query: create table n_n0(key int)
PREHOOK: type: CREATETABLE
PREHOOK: Output: database:default
PREHOOK: Output: default@n_n0
POSTHOOK: query: create table n_n0(key int)
POSTHOOK: type: CREATETABLE
POSTHOOK: Output: database:default
POSTHOOK: Output: default@n_n0
PREHOOK: query: insert overwrite table n_n0 select null from src
PREHOOK: type: QUERY
PREHOOK: Input: default@src
PREHOOK: Output: default@n_n0
POSTHOOK: query: insert overwrite table n_n0 select null from src
POSTHOOK: type: QUERY
POSTHOOK: Input: default@src
POSTHOOK: Output: default@n_n0
POSTHOOK: Lineage: n_n0.key EXPRESSION []
PREHOOK: query: explain analyze table n_n0 compute statistics for columns
PREHOOK: type: ANALYZE_TABLE
PREHOOK: Input: default@n_n0
PREHOOK: Output: default@n_n0
#### A masked pattern was here ####
POSTHOOK: query: explain analyze table n_n0 compute statistics for columns
POSTHOOK: type: ANALYZE_TABLE
POSTHOOK: Input: default@n_n0
POSTHOOK: Output: default@n_n0
#### A masked pattern was here ####
STAGE DEPENDENCIES:
Stage-0 is a root stage
Stage-2 depends on stages: Stage-0
STAGE PLANS:
Stage: Stage-0
Tez
#### A masked pattern was here ####
Edges:
Reducer 2 <- Map 1 (CUSTOM_SIMPLE_EDGE)
#### A masked pattern was here ####
Vertices:
Map 1
Map Operator Tree:
TableScan
alias: n_n0
Statistics: Num rows: 500 Data size: 4 Basic stats: COMPLETE Column stats: COMPLETE
Select Operator
expressions: key (type: int)
outputColumnNames: key
Statistics: Num rows: 500 Data size: 4 Basic stats: COMPLETE Column stats: COMPLETE
Group By Operator
aggregations: min(key), max(key), count(1), count(key), compute_bit_vector(key, 'fm', 16)
minReductionHashAggr: 0.99
mode: hash
outputColumnNames: _col0, _col1, _col2, _col3, _col4
Statistics: Num rows: 1 Data size: 168 Basic stats: COMPLETE Column stats: COMPLETE
Reduce Output Operator
null sort order:
sort order:
Statistics: Num rows: 1 Data size: 168 Basic stats: COMPLETE Column stats: COMPLETE
value expressions: _col0 (type: int), _col1 (type: int), _col2 (type: bigint), _col3 (type: bigint), _col4 (type: binary)
Execution mode: llap
LLAP IO: all inputs
Reducer 2
Execution mode: llap
Reduce Operator Tree:
Group By Operator
aggregations: min(VALUE._col0), max(VALUE._col1), count(VALUE._col2), count(VALUE._col3), compute_bit_vector(VALUE._col4)
mode: mergepartial
outputColumnNames: _col0, _col1, _col2, _col3, _col4
Statistics: Num rows: 1 Data size: 168 Basic stats: COMPLETE Column stats: COMPLETE
Select Operator
expressions: 'LONG' (type: string), UDFToLong(_col0) (type: bigint), UDFToLong(_col1) (type: bigint), (_col2 - _col3) (type: bigint), COALESCE(ndv_compute_bit_vector(_col4),0) (type: bigint), _col4 (type: binary)
outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5
Statistics: Num rows: 1 Data size: 264 Basic stats: COMPLETE Column stats: COMPLETE
File Output Operator
compressed: false
Statistics: Num rows: 1 Data size: 264 Basic stats: COMPLETE Column stats: COMPLETE
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
Stage: Stage-2
Stats Work
Basic Stats Work:
Column Stats Desc:
Columns: key
Column Types: int
Table: default.n_n0
PREHOOK: query: analyze table n_n0 compute statistics for columns
PREHOOK: type: ANALYZE_TABLE
PREHOOK: Input: default@n_n0
PREHOOK: Output: default@n_n0
#### A masked pattern was here ####
POSTHOOK: query: analyze table n_n0 compute statistics for columns
POSTHOOK: type: ANALYZE_TABLE
POSTHOOK: Input: default@n_n0
POSTHOOK: Output: default@n_n0
#### A masked pattern was here ####
PREHOOK: query: desc formatted n_n0 key
PREHOOK: type: DESCTABLE
PREHOOK: Input: default@n_n0
POSTHOOK: query: desc formatted n_n0 key
POSTHOOK: type: DESCTABLE
POSTHOOK: Input: default@n_n0
col_name key
data_type int
min 0
max 0
num_nulls 500
distinct_count 1
avg_col_len
max_col_len
num_trues
num_falses
bit_vector FM
comment from deserializer
COLUMN_STATS_ACCURATE {\"BASIC_STATS\":\"true\",\"COLUMN_STATS\":{\"key\":\"true\"}}
PREHOOK: query: create table i_n1(key int)
PREHOOK: type: CREATETABLE
PREHOOK: Output: database:default
PREHOOK: Output: default@i_n1
POSTHOOK: query: create table i_n1(key int)
POSTHOOK: type: CREATETABLE
POSTHOOK: Output: database:default
POSTHOOK: Output: default@i_n1
PREHOOK: query: insert overwrite table i_n1 select key from src
PREHOOK: type: QUERY
PREHOOK: Input: default@src
PREHOOK: Output: default@i_n1
POSTHOOK: query: insert overwrite table i_n1 select key from src
POSTHOOK: type: QUERY
POSTHOOK: Input: default@src
POSTHOOK: Output: default@i_n1
POSTHOOK: Lineage: i_n1.key EXPRESSION [(src)src.FieldSchema(name:key, type:string, comment:default), ]
PREHOOK: query: explain analyze table i_n1 compute statistics for columns
PREHOOK: type: ANALYZE_TABLE
PREHOOK: Input: default@i_n1
PREHOOK: Output: default@i_n1
#### A masked pattern was here ####
POSTHOOK: query: explain analyze table i_n1 compute statistics for columns
POSTHOOK: type: ANALYZE_TABLE
POSTHOOK: Input: default@i_n1
POSTHOOK: Output: default@i_n1
#### A masked pattern was here ####
STAGE DEPENDENCIES:
Stage-0 is a root stage
Stage-2 depends on stages: Stage-0
STAGE PLANS:
Stage: Stage-0
Tez
#### A masked pattern was here ####
Edges:
Reducer 2 <- Map 1 (CUSTOM_SIMPLE_EDGE)
#### A masked pattern was here ####
Vertices:
Map 1
Map Operator Tree:
TableScan
alias: i_n1
Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE
Select Operator
expressions: key (type: int)
outputColumnNames: key
Statistics: Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE
Group By Operator
aggregations: min(key), max(key), count(1), count(key), compute_bit_vector(key, 'fm', 16)
minReductionHashAggr: 0.99
mode: hash
outputColumnNames: _col0, _col1, _col2, _col3, _col4
Statistics: Num rows: 1 Data size: 168 Basic stats: COMPLETE Column stats: COMPLETE
Reduce Output Operator
null sort order:
sort order:
Statistics: Num rows: 1 Data size: 168 Basic stats: COMPLETE Column stats: COMPLETE
value expressions: _col0 (type: int), _col1 (type: int), _col2 (type: bigint), _col3 (type: bigint), _col4 (type: binary)
Execution mode: llap
LLAP IO: all inputs
Reducer 2
Execution mode: llap
Reduce Operator Tree:
Group By Operator
aggregations: min(VALUE._col0), max(VALUE._col1), count(VALUE._col2), count(VALUE._col3), compute_bit_vector(VALUE._col4)
mode: mergepartial
outputColumnNames: _col0, _col1, _col2, _col3, _col4
Statistics: Num rows: 1 Data size: 168 Basic stats: COMPLETE Column stats: COMPLETE
Select Operator
expressions: 'LONG' (type: string), UDFToLong(_col0) (type: bigint), UDFToLong(_col1) (type: bigint), (_col2 - _col3) (type: bigint), COALESCE(ndv_compute_bit_vector(_col4),0) (type: bigint), _col4 (type: binary)
outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5
Statistics: Num rows: 1 Data size: 264 Basic stats: COMPLETE Column stats: COMPLETE
File Output Operator
compressed: false
Statistics: Num rows: 1 Data size: 264 Basic stats: COMPLETE Column stats: COMPLETE
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
Stage: Stage-2
Stats Work
Basic Stats Work:
Column Stats Desc:
Columns: key
Column Types: int
Table: default.i_n1
PREHOOK: query: analyze table i_n1 compute statistics for columns
PREHOOK: type: ANALYZE_TABLE
PREHOOK: Input: default@i_n1
PREHOOK: Output: default@i_n1
#### A masked pattern was here ####
POSTHOOK: query: analyze table i_n1 compute statistics for columns
POSTHOOK: type: ANALYZE_TABLE
POSTHOOK: Input: default@i_n1
POSTHOOK: Output: default@i_n1
#### A masked pattern was here ####
PREHOOK: query: desc formatted i_n1 key
PREHOOK: type: DESCTABLE
PREHOOK: Input: default@i_n1
POSTHOOK: query: desc formatted i_n1 key
POSTHOOK: type: DESCTABLE
POSTHOOK: Input: default@i_n1
col_name key
data_type int
min 0
max 498
num_nulls 0
distinct_count 196
avg_col_len
max_col_len
num_trues
num_falses
bit_vector FM
comment from deserializer
COLUMN_STATS_ACCURATE {\"BASIC_STATS\":\"true\",\"COLUMN_STATS\":{\"key\":\"true\"}}
PREHOOK: query: drop table i_n1
PREHOOK: type: DROPTABLE
PREHOOK: Input: default@i_n1
PREHOOK: Output: default@i_n1
POSTHOOK: query: drop table i_n1
POSTHOOK: type: DROPTABLE
POSTHOOK: Input: default@i_n1
POSTHOOK: Output: default@i_n1
PREHOOK: query: create table i_n1(key double)
PREHOOK: type: CREATETABLE
PREHOOK: Output: database:default
PREHOOK: Output: default@i_n1
POSTHOOK: query: create table i_n1(key double)
POSTHOOK: type: CREATETABLE
POSTHOOK: Output: database:default
POSTHOOK: Output: default@i_n1
PREHOOK: query: insert overwrite table i_n1 select key from src
PREHOOK: type: QUERY
PREHOOK: Input: default@src
PREHOOK: Output: default@i_n1
POSTHOOK: query: insert overwrite table i_n1 select key from src
POSTHOOK: type: QUERY
POSTHOOK: Input: default@src
POSTHOOK: Output: default@i_n1
POSTHOOK: Lineage: i_n1.key EXPRESSION [(src)src.FieldSchema(name:key, type:string, comment:default), ]
PREHOOK: query: analyze table i_n1 compute statistics for columns
PREHOOK: type: ANALYZE_TABLE
PREHOOK: Input: default@i_n1
PREHOOK: Output: default@i_n1
#### A masked pattern was here ####
POSTHOOK: query: analyze table i_n1 compute statistics for columns
POSTHOOK: type: ANALYZE_TABLE
POSTHOOK: Input: default@i_n1
POSTHOOK: Output: default@i_n1
#### A masked pattern was here ####
PREHOOK: query: desc formatted i_n1 key
PREHOOK: type: DESCTABLE
PREHOOK: Input: default@i_n1
POSTHOOK: query: desc formatted i_n1 key
POSTHOOK: type: DESCTABLE
POSTHOOK: Input: default@i_n1
col_name key
data_type double
min 0.0
max 498.0
num_nulls 0
distinct_count 234
avg_col_len
max_col_len
num_trues
num_falses
bit_vector FM
comment from deserializer
COLUMN_STATS_ACCURATE {\"BASIC_STATS\":\"true\",\"COLUMN_STATS\":{\"key\":\"true\"}}
PREHOOK: query: drop table i_n1
PREHOOK: type: DROPTABLE
PREHOOK: Input: default@i_n1
PREHOOK: Output: default@i_n1
POSTHOOK: query: drop table i_n1
POSTHOOK: type: DROPTABLE
POSTHOOK: Input: default@i_n1
POSTHOOK: Output: default@i_n1
PREHOOK: query: create table i_n1(key decimal)
PREHOOK: type: CREATETABLE
PREHOOK: Output: database:default
PREHOOK: Output: default@i_n1
POSTHOOK: query: create table i_n1(key decimal)
POSTHOOK: type: CREATETABLE
POSTHOOK: Output: database:default
POSTHOOK: Output: default@i_n1
PREHOOK: query: insert overwrite table i_n1 select key from src
PREHOOK: type: QUERY
PREHOOK: Input: default@src
PREHOOK: Output: default@i_n1
POSTHOOK: query: insert overwrite table i_n1 select key from src
POSTHOOK: type: QUERY
POSTHOOK: Input: default@src
POSTHOOK: Output: default@i_n1
POSTHOOK: Lineage: i_n1.key EXPRESSION [(src)src.FieldSchema(name:key, type:string, comment:default), ]
PREHOOK: query: analyze table i_n1 compute statistics for columns
PREHOOK: type: ANALYZE_TABLE
PREHOOK: Input: default@i_n1
PREHOOK: Output: default@i_n1
#### A masked pattern was here ####
POSTHOOK: query: analyze table i_n1 compute statistics for columns
POSTHOOK: type: ANALYZE_TABLE
POSTHOOK: Input: default@i_n1
POSTHOOK: Output: default@i_n1
#### A masked pattern was here ####
PREHOOK: query: desc formatted i_n1 key
PREHOOK: type: DESCTABLE
PREHOOK: Input: default@i_n1
POSTHOOK: query: desc formatted i_n1 key
POSTHOOK: type: DESCTABLE
POSTHOOK: Input: default@i_n1
col_name key
data_type decimal(10,0)
min 0
max 498
num_nulls 0
distinct_count 180
avg_col_len
max_col_len
num_trues
num_falses
bit_vector FM
comment from deserializer
COLUMN_STATS_ACCURATE {\"BASIC_STATS\":\"true\",\"COLUMN_STATS\":{\"key\":\"true\"}}
PREHOOK: query: drop table i_n1
PREHOOK: type: DROPTABLE
PREHOOK: Input: default@i_n1
PREHOOK: Output: default@i_n1
POSTHOOK: query: drop table i_n1
POSTHOOK: type: DROPTABLE
POSTHOOK: Input: default@i_n1
POSTHOOK: Output: default@i_n1
PREHOOK: query: create table i_n1(key date)
PREHOOK: type: CREATETABLE
PREHOOK: Output: database:default
PREHOOK: Output: default@i_n1
POSTHOOK: query: create table i_n1(key date)
POSTHOOK: type: CREATETABLE
POSTHOOK: Output: database:default
POSTHOOK: Output: default@i_n1
PREHOOK: query: insert into i_n1 values ('2012-08-17')
PREHOOK: type: QUERY
PREHOOK: Input: _dummy_database@_dummy_table
PREHOOK: Output: default@i_n1
POSTHOOK: query: insert into i_n1 values ('2012-08-17')
POSTHOOK: type: QUERY
POSTHOOK: Input: _dummy_database@_dummy_table
POSTHOOK: Output: default@i_n1
POSTHOOK: Lineage: i_n1.key SCRIPT []
PREHOOK: query: insert into i_n1 values ('2012-08-17')
PREHOOK: type: QUERY
PREHOOK: Input: _dummy_database@_dummy_table
PREHOOK: Output: default@i_n1
POSTHOOK: query: insert into i_n1 values ('2012-08-17')
POSTHOOK: type: QUERY
POSTHOOK: Input: _dummy_database@_dummy_table
POSTHOOK: Output: default@i_n1
POSTHOOK: Lineage: i_n1.key SCRIPT []
PREHOOK: query: insert into i_n1 values ('2013-08-17')
PREHOOK: type: QUERY
PREHOOK: Input: _dummy_database@_dummy_table
PREHOOK: Output: default@i_n1
POSTHOOK: query: insert into i_n1 values ('2013-08-17')
POSTHOOK: type: QUERY
POSTHOOK: Input: _dummy_database@_dummy_table
POSTHOOK: Output: default@i_n1
POSTHOOK: Lineage: i_n1.key SCRIPT []
PREHOOK: query: insert into i_n1 values ('2012-03-17')
PREHOOK: type: QUERY
PREHOOK: Input: _dummy_database@_dummy_table
PREHOOK: Output: default@i_n1
POSTHOOK: query: insert into i_n1 values ('2012-03-17')
POSTHOOK: type: QUERY
POSTHOOK: Input: _dummy_database@_dummy_table
POSTHOOK: Output: default@i_n1
POSTHOOK: Lineage: i_n1.key SCRIPT []
PREHOOK: query: insert into i_n1 values ('2012-05-17')
PREHOOK: type: QUERY
PREHOOK: Input: _dummy_database@_dummy_table
PREHOOK: Output: default@i_n1
POSTHOOK: query: insert into i_n1 values ('2012-05-17')
POSTHOOK: type: QUERY
POSTHOOK: Input: _dummy_database@_dummy_table
POSTHOOK: Output: default@i_n1
POSTHOOK: Lineage: i_n1.key SCRIPT []
PREHOOK: query: analyze table i_n1 compute statistics for columns
PREHOOK: type: ANALYZE_TABLE
PREHOOK: Input: default@i_n1
PREHOOK: Output: default@i_n1
#### A masked pattern was here ####
POSTHOOK: query: analyze table i_n1 compute statistics for columns
POSTHOOK: type: ANALYZE_TABLE
POSTHOOK: Input: default@i_n1
POSTHOOK: Output: default@i_n1
#### A masked pattern was here ####
PREHOOK: query: desc formatted i_n1 key
PREHOOK: type: DESCTABLE
PREHOOK: Input: default@i_n1
POSTHOOK: query: desc formatted i_n1 key
POSTHOOK: type: DESCTABLE
POSTHOOK: Input: default@i_n1
col_name key
data_type date
min 2012-03-17
max 2013-08-17
num_nulls 0
distinct_count 3
avg_col_len
max_col_len
num_trues
num_falses
bit_vector FM
comment from deserializer
COLUMN_STATS_ACCURATE {\"BASIC_STATS\":\"true\",\"COLUMN_STATS\":{\"key\":\"true\"}}