ql/src/test/results/clientpositive/llap/dynpart_sort_optimization_acid2.q.out - hive - Git at Google

 PREHOOK: query: CREATE TABLE non_acid(key string, value string)
 PARTITIONED BY(ds string, hr int)
 CLUSTERED BY(key) INTO 2 BUCKETS
 STORED AS ORC
 PREHOOK: type: CREATETABLE
 PREHOOK: Output: database:default
 PREHOOK: Output: default@non_acid
 POSTHOOK: query: CREATE TABLE non_acid(key string, value string)
 PARTITIONED BY(ds string, hr int)
 CLUSTERED BY(key) INTO 2 BUCKETS
 STORED AS ORC
 POSTHOOK: type: CREATETABLE
 POSTHOOK: Output: database:default
 POSTHOOK: Output: default@non_acid
 PREHOOK: query: explain
 insert into table non_acid partition(ds,hr) select * from srcpart sort by value
 PREHOOK: type: QUERY
 PREHOOK: Input: default@srcpart
 PREHOOK: Input: default@srcpart@ds=2008-04-08/hr=11
 PREHOOK: Input: default@srcpart@ds=2008-04-08/hr=12
 PREHOOK: Input: default@srcpart@ds=2008-04-09/hr=11
 PREHOOK: Input: default@srcpart@ds=2008-04-09/hr=12
 PREHOOK: Output: default@non_acid
 POSTHOOK: query: explain
 insert into table non_acid partition(ds,hr) select * from srcpart sort by value
 POSTHOOK: type: QUERY
 POSTHOOK: Input: default@srcpart
 POSTHOOK: Input: default@srcpart@ds=2008-04-08/hr=11
 POSTHOOK: Input: default@srcpart@ds=2008-04-08/hr=12
 POSTHOOK: Input: default@srcpart@ds=2008-04-09/hr=11
 POSTHOOK: Input: default@srcpart@ds=2008-04-09/hr=12
 POSTHOOK: Output: default@non_acid
 STAGE DEPENDENCIES:
   Stage-1 is a root stage
   Stage-2 depends on stages: Stage-1
   Stage-0 depends on stages: Stage-2
   Stage-3 depends on stages: Stage-0

 STAGE PLANS:
   Stage: Stage-1
     Tez
 #### A masked pattern was here ####
       Edges:
         Reducer 2 <- Map 1 (SIMPLE_EDGE)
         Reducer 3 <- Reducer 2 (SIMPLE_EDGE)
         Reducer 4 <- Reducer 2 (SIMPLE_EDGE)
 #### A masked pattern was here ####
       Vertices:
         Map 1
             Map Operator Tree:
                 TableScan
                   alias: srcpart
                   Statistics: Num rows: 2000 Data size: 1092000 Basic stats: COMPLETE Column stats: COMPLETE
                   Select Operator
                     expressions: key (type: string), value (type: string), ds (type: string), hr (type: string)
                     outputColumnNames: _col0, _col1, _col2, _col3
                     Statistics: Num rows: 2000 Data size: 1092000 Basic stats: COMPLETE Column stats: COMPLETE
                     Reduce Output Operator
                       key expressions: _col1 (type: string)
                       null sort order: z
                       sort order: +
                       Statistics: Num rows: 2000 Data size: 1092000 Basic stats: COMPLETE Column stats: COMPLETE
                       value expressions: _col0 (type: string), _col2 (type: string), _col3 (type: string)
             Execution mode: vectorized, llap
             LLAP IO: all inputs
         Reducer 2
             Execution mode: llap
             Reduce Operator Tree:
               Select Operator
                 expressions: VALUE._col0 (type: string), KEY.reducesinkkey0 (type: string), VALUE._col1 (type: string), UDFToInteger(VALUE._col2) (type: int)
                 outputColumnNames: _col0, _col1, _col2, _col3
                 Statistics: Num rows: 2000 Data size: 732000 Basic stats: COMPLETE Column stats: COMPLETE
                 Reduce Output Operator
                   key expressions: _col2 (type: string), _col3 (type: int), _bucket_number (type: string), _col1 (type: string)
                   null sort order: aaaa
                   sort order: ++++
                   Map-reduce partition columns: _col2 (type: string), _col3 (type: int)
                   Statistics: Num rows: 2000 Data size: 732000 Basic stats: COMPLETE Column stats: COMPLETE
                   value expressions: _col0 (type: string)
                 Select Operator
                   expressions: _col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: int)
                   outputColumnNames: key, value, ds, hr
                   Statistics: Num rows: 2000 Data size: 732000 Basic stats: COMPLETE Column stats: COMPLETE
                   Group By Operator
                     aggregations: max(length(key)), avg(COALESCE(length(key),0)), count(1), count(key), compute_bit_vector(key, 'hll'), max(length(value)), avg(COALESCE(length(value),0)), count(value), compute_bit_vector(value, 'hll')
                     keys: ds (type: string), hr (type: int)
                     minReductionHashAggr: 0.99
                     mode: hash
                     outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10
                     Statistics: Num rows: 4 Data size: 2640 Basic stats: COMPLETE Column stats: COMPLETE
                     Reduce Output Operator
                       key expressions: _col0 (type: string), _col1 (type: int)
                       null sort order: zz
                       sort order: ++
                       Map-reduce partition columns: _col0 (type: string), _col1 (type: int)
                       Statistics: Num rows: 4 Data size: 2640 Basic stats: COMPLETE Column stats: COMPLETE
                       value expressions: _col2 (type: int), _col3 (type: struct<count:bigint,sum:double,input:int>), _col4 (type: bigint), _col5 (type: bigint), _col6 (type: binary), _col7 (type: int), _col8 (type: struct<count:bigint,sum:double,input:int>), _col9 (type: bigint), _col10 (type: binary)
         Reducer 3
             Execution mode: vectorized, llap
             Reduce Operator Tree:
               Select Operator
                 expressions: VALUE._col0 (type: string), KEY._col1 (type: string), KEY._col2 (type: string), KEY._col3 (type: int), KEY._bucket_number (type: string)
                 outputColumnNames: _col0, _col1, _col2, _col3, _bucket_number
                 File Output Operator
                   compressed: false
                   Dp Sort State: PARTITION_BUCKET_SORTED
                   Statistics: Num rows: 2000 Data size: 732000 Basic stats: COMPLETE Column stats: COMPLETE
                   table:
                       input format: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat
                       output format: org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat
                       serde: org.apache.hadoop.hive.ql.io.orc.OrcSerde
                       name: default.non_acid
         Reducer 4
             Execution mode: llap
             Reduce Operator Tree:
               Group By Operator
                 aggregations: max(VALUE._col0), avg(VALUE._col1), count(VALUE._col2), count(VALUE._col3), compute_bit_vector(VALUE._col4), max(VALUE._col5), avg(VALUE._col6), count(VALUE._col7), compute_bit_vector(VALUE._col8)
                 keys: KEY._col0 (type: string), KEY._col1 (type: int)
                 mode: mergepartial
                 outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10
                 Statistics: Num rows: 4 Data size: 2096 Basic stats: COMPLETE Column stats: COMPLETE
                 Select Operator
                   expressions: 'STRING' (type: string), UDFToLong(COALESCE(_col2,0)) (type: bigint), COALESCE(_col3,0) (type: double), (_col4 - _col5) (type: bigint), COALESCE(ndv_compute_bit_vector(_col6),0) (type: bigint), _col6 (type: binary), 'STRING' (type: string), UDFToLong(COALESCE(_col7,0)) (type: bigint), COALESCE(_col8,0) (type: double), (_col4 - _col9) (type: bigint), COALESCE(ndv_compute_bit_vector(_col10),0) (type: bigint), _col10 (type: binary), _col0 (type: string), _col1 (type: int)
                   outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13
                   Statistics: Num rows: 4 Data size: 2880 Basic stats: COMPLETE Column stats: COMPLETE
                   File Output Operator
                     compressed: false
                     Statistics: Num rows: 4 Data size: 2880 Basic stats: COMPLETE Column stats: COMPLETE
                     table:
                         input format: org.apache.hadoop.mapred.SequenceFileInputFormat
                         output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
                         serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe

   Stage: Stage-2
     Dependency Collection

   Stage: Stage-0
     Move Operator
       tables:
           partition:
             ds
             hr
           replace: false
           table:
               input format: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat
               output format: org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat
               serde: org.apache.hadoop.hive.ql.io.orc.OrcSerde
               name: default.non_acid

   Stage: Stage-3
     Stats Work
       Basic Stats Work:
       Column Stats Desc:
           Columns: key, value
           Column Types: string, string
           Table: default.non_acid
	PREHOOK: query: CREATE TABLE non_acid(key string, value string)
	PARTITIONED BY(ds string, hr int)
	CLUSTERED BY(key) INTO 2 BUCKETS
	STORED AS ORC
	PREHOOK: type: CREATETABLE
	PREHOOK: Output: database:default
	PREHOOK: Output: default@non_acid
	POSTHOOK: query: CREATE TABLE non_acid(key string, value string)
	PARTITIONED BY(ds string, hr int)
	CLUSTERED BY(key) INTO 2 BUCKETS
	STORED AS ORC
	POSTHOOK: type: CREATETABLE
	POSTHOOK: Output: database:default
	POSTHOOK: Output: default@non_acid
	PREHOOK: query: explain
	insert into table non_acid partition(ds,hr) select * from srcpart sort by value
	PREHOOK: type: QUERY
	PREHOOK: Input: default@srcpart
	PREHOOK: Input: default@srcpart@ds=2008-04-08/hr=11
	PREHOOK: Input: default@srcpart@ds=2008-04-08/hr=12
	PREHOOK: Input: default@srcpart@ds=2008-04-09/hr=11
	PREHOOK: Input: default@srcpart@ds=2008-04-09/hr=12
	PREHOOK: Output: default@non_acid
	POSTHOOK: query: explain
	insert into table non_acid partition(ds,hr) select * from srcpart sort by value
	POSTHOOK: type: QUERY
	POSTHOOK: Input: default@srcpart
	POSTHOOK: Input: default@srcpart@ds=2008-04-08/hr=11
	POSTHOOK: Input: default@srcpart@ds=2008-04-08/hr=12
	POSTHOOK: Input: default@srcpart@ds=2008-04-09/hr=11
	POSTHOOK: Input: default@srcpart@ds=2008-04-09/hr=12
	POSTHOOK: Output: default@non_acid
	STAGE DEPENDENCIES:
	Stage-1 is a root stage
	Stage-2 depends on stages: Stage-1
	Stage-0 depends on stages: Stage-2
	Stage-3 depends on stages: Stage-0

	STAGE PLANS:
	Stage: Stage-1
	Tez
	#### A masked pattern was here ####
	Edges:
	Reducer 2 <- Map 1 (SIMPLE_EDGE)
	Reducer 3 <- Reducer 2 (SIMPLE_EDGE)
	Reducer 4 <- Reducer 2 (SIMPLE_EDGE)
	#### A masked pattern was here ####
	Vertices:
	Map 1
	Map Operator Tree:
	TableScan
	alias: srcpart
	Statistics: Num rows: 2000 Data size: 1092000 Basic stats: COMPLETE Column stats: COMPLETE
	Select Operator
	expressions: key (type: string), value (type: string), ds (type: string), hr (type: string)
	outputColumnNames: _col0, _col1, _col2, _col3
	Statistics: Num rows: 2000 Data size: 1092000 Basic stats: COMPLETE Column stats: COMPLETE
	Reduce Output Operator
	key expressions: _col1 (type: string)
	null sort order: z
	sort order: +
	Statistics: Num rows: 2000 Data size: 1092000 Basic stats: COMPLETE Column stats: COMPLETE
	value expressions: _col0 (type: string), _col2 (type: string), _col3 (type: string)
	Execution mode: vectorized, llap
	LLAP IO: all inputs
	Reducer 2
	Execution mode: llap
	Reduce Operator Tree:
	Select Operator
	expressions: VALUE._col0 (type: string), KEY.reducesinkkey0 (type: string), VALUE._col1 (type: string), UDFToInteger(VALUE._col2) (type: int)
	outputColumnNames: _col0, _col1, _col2, _col3
	Statistics: Num rows: 2000 Data size: 732000 Basic stats: COMPLETE Column stats: COMPLETE
	Reduce Output Operator
	key expressions: _col2 (type: string), _col3 (type: int), _bucket_number (type: string), _col1 (type: string)
	null sort order: aaaa
	sort order: ++++
	Map-reduce partition columns: _col2 (type: string), _col3 (type: int)
	Statistics: Num rows: 2000 Data size: 732000 Basic stats: COMPLETE Column stats: COMPLETE
	value expressions: _col0 (type: string)
	Select Operator
	expressions: _col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: int)
	outputColumnNames: key, value, ds, hr
	Statistics: Num rows: 2000 Data size: 732000 Basic stats: COMPLETE Column stats: COMPLETE
	Group By Operator
	aggregations: max(length(key)), avg(COALESCE(length(key),0)), count(1), count(key), compute_bit_vector(key, 'hll'), max(length(value)), avg(COALESCE(length(value),0)), count(value), compute_bit_vector(value, 'hll')
	keys: ds (type: string), hr (type: int)
	minReductionHashAggr: 0.99
	mode: hash
	outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10
	Statistics: Num rows: 4 Data size: 2640 Basic stats: COMPLETE Column stats: COMPLETE
	Reduce Output Operator
	key expressions: _col0 (type: string), _col1 (type: int)
	null sort order: zz
	sort order: ++
	Map-reduce partition columns: _col0 (type: string), _col1 (type: int)
	Statistics: Num rows: 4 Data size: 2640 Basic stats: COMPLETE Column stats: COMPLETE
	value expressions: _col2 (type: int), _col3 (type: struct<count:bigint,sum:double,input:int>), _col4 (type: bigint), _col5 (type: bigint), _col6 (type: binary), _col7 (type: int), _col8 (type: struct<count:bigint,sum:double,input:int>), _col9 (type: bigint), _col10 (type: binary)
	Reducer 3
	Execution mode: vectorized, llap
	Reduce Operator Tree:
	Select Operator
	expressions: VALUE._col0 (type: string), KEY._col1 (type: string), KEY._col2 (type: string), KEY._col3 (type: int), KEY._bucket_number (type: string)
	outputColumnNames: _col0, _col1, _col2, _col3, _bucket_number
	File Output Operator
	compressed: false
	Dp Sort State: PARTITION_BUCKET_SORTED
	Statistics: Num rows: 2000 Data size: 732000 Basic stats: COMPLETE Column stats: COMPLETE
	table:
	input format: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat
	output format: org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat
	serde: org.apache.hadoop.hive.ql.io.orc.OrcSerde
	name: default.non_acid
	Reducer 4
	Execution mode: llap
	Reduce Operator Tree:
	Group By Operator
	aggregations: max(VALUE._col0), avg(VALUE._col1), count(VALUE._col2), count(VALUE._col3), compute_bit_vector(VALUE._col4), max(VALUE._col5), avg(VALUE._col6), count(VALUE._col7), compute_bit_vector(VALUE._col8)
	keys: KEY._col0 (type: string), KEY._col1 (type: int)
	mode: mergepartial
	outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10
	Statistics: Num rows: 4 Data size: 2096 Basic stats: COMPLETE Column stats: COMPLETE
	Select Operator
	expressions: 'STRING' (type: string), UDFToLong(COALESCE(_col2,0)) (type: bigint), COALESCE(_col3,0) (type: double), (_col4 - _col5) (type: bigint), COALESCE(ndv_compute_bit_vector(_col6),0) (type: bigint), _col6 (type: binary), 'STRING' (type: string), UDFToLong(COALESCE(_col7,0)) (type: bigint), COALESCE(_col8,0) (type: double), (_col4 - _col9) (type: bigint), COALESCE(ndv_compute_bit_vector(_col10),0) (type: bigint), _col10 (type: binary), _col0 (type: string), _col1 (type: int)
	outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13
	Statistics: Num rows: 4 Data size: 2880 Basic stats: COMPLETE Column stats: COMPLETE
	File Output Operator
	compressed: false
	Statistics: Num rows: 4 Data size: 2880 Basic stats: COMPLETE Column stats: COMPLETE
	table:
	input format: org.apache.hadoop.mapred.SequenceFileInputFormat
	output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
	serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe

	Stage: Stage-2
	Dependency Collection

	Stage: Stage-0
	Move Operator
	tables:
	partition:
	ds
	hr
	replace: false
	table:
	input format: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat
	output format: org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat
	serde: org.apache.hadoop.hive.ql.io.orc.OrcSerde
	name: default.non_acid

	Stage: Stage-3
	Stats Work
	Basic Stats Work:
	Column Stats Desc:
	Columns: key, value
	Column Types: string, string
	Table: default.non_acid