-- ql/src/test/queries/clientpositive/vector_groupby_sort_8.q - hive - Git at Google

 -- Test script: counts the distinct keys of a bucketed, sorted, partitioned table with
 -- vectorized execution enabled, printing the EXPLAIN VECTORIZATION DETAIL plan first
 -- and then running the query itself.

 -- Turn on vectorized execution, including on the reduce side.
 SET hive.vectorized.execution.enabled=true;
 SET hive.vectorized.execution.reduce.enabled=true;
 -- Run in nonstrict mode.
 set hive.mapred.mode=nonstrict;
 -- Cap the number of reducers at 10.
 set hive.exec.reducers.max = 10;
 -- Enable the sorted-input group by setting that the query below is written against.
 set hive.map.groupby.sorted=true;

 -- NOTE(review): the marker comment below looks like a test-harness directive - keep its
 -- text unchanged (TODO confirm against the qtest framework).
 -- SORT_QUERY_RESULTS

 -- Test table: partitioned by ds, bucketed and sorted on key (2 buckets), stored as text.
 CREATE TABLE T1_n2(key STRING, val STRING) PARTITIONED BY (ds string)
 CLUSTERED BY (key) SORTED BY (key) INTO 2 BUCKETS STORED AS TEXTFILE;

 -- Seed the single partition from one local bucket file.
 LOAD DATA LOCAL INPATH '../../data/files/bucket_files/000000_0' INTO TABLE T1_n2  PARTITION (ds='1');

 -- Rewrite the partition from its own rows to make sure there are 2 files
 -- (the table is declared with 2 buckets).
 INSERT OVERWRITE TABLE T1_n2 PARTITION (ds='1') select key, val from T1_n2 where ds = '1';

 -- The plan is not converted to a map-side group by: although the sorting columns and
 -- grouping columns match, the user is issuing a distinct.
 -- However, after HIVE-4310, partial aggregation is performed on the mapper.
 -- The query appears twice on purpose: once under EXPLAIN to show the plan, once to run it.
 EXPLAIN VECTORIZATION DETAIL
 select count(distinct key) from T1_n2;
 select count(distinct key) from T1_n2;

 -- Clean up the test table.
 DROP TABLE T1_n2;
	-- NOTE(review): from here on the file repeats the same settings and statements that
	-- appear earlier in this file (only the indentation differs) - confirm whether the
	-- second run is intentional or a copy artifact.
	-- Purpose of this section: count the distinct keys of a bucketed, sorted, partitioned
	-- table with vectorized execution enabled, printing the plan before running the query.

	-- Turn on vectorized execution, including on the reduce side.
	SET hive.vectorized.execution.enabled=true;
	SET hive.vectorized.execution.reduce.enabled=true;
	-- Run in nonstrict mode.
	set hive.mapred.mode=nonstrict;
	-- Cap the number of reducers at 10.
	set hive.exec.reducers.max = 10;
	-- Enable the sorted-input group by setting that the query below is written against.
	set hive.map.groupby.sorted=true;

	-- NOTE(review): the marker comment below looks like a test-harness directive - keep its
	-- text unchanged (TODO confirm against the qtest framework).
	-- SORT_QUERY_RESULTS

	-- Test table: partitioned by ds, bucketed and sorted on key (2 buckets), stored as text.
	CREATE TABLE T1_n2(key STRING, val STRING) PARTITIONED BY (ds string)
	CLUSTERED BY (key) SORTED BY (key) INTO 2 BUCKETS STORED AS TEXTFILE;

	-- Seed the single partition from one local bucket file.
	LOAD DATA LOCAL INPATH '../../data/files/bucket_files/000000_0' INTO TABLE T1_n2 PARTITION (ds='1');

	-- Rewrite the partition from its own rows to make sure there are 2 files
	-- (the table is declared with 2 buckets).
	INSERT OVERWRITE TABLE T1_n2 PARTITION (ds='1') select key, val from T1_n2 where ds = '1';

	-- The plan is not converted to a map-side group by: although the sorting columns and
	-- grouping columns match, the user is issuing a distinct.
	-- However, after HIVE-4310, partial aggregation is performed on the mapper.
	-- The query appears twice on purpose: once under EXPLAIN to show the plan, once to run it.
	EXPLAIN VECTORIZATION DETAIL
	select count(distinct key) from T1_n2;
	select count(distinct key) from T1_n2;

	-- Clean up the test table.
	DROP TABLE T1_n2;