blob: 3df4815979a578d3a481d84511e01f6b8063763f [file] [log] [blame]
--! qt:dataset:srcbucket
--! qt:dataset:src
--! qt:dataset:alltypesparquet
--! qt:replace:/((rawData|total)Size\s+)[0-9]{2,}/$1__SOME_NUMBER__/
set hive.mapred.mode=nonstrict;
set hive.explain.user=false;
SET hive.vectorized.execution.enabled=true;
set hive.vectorized.execution.reduce.enabled=true;
set hive.fetch.task.conversion=none;
-- SORT_QUERY_RESULTS
-- Use ORDER BY clauses to generate 2 stages.
EXPLAIN VECTORIZATION EXPRESSION
SELECT MIN(ctinyint) as c1,
MAX(ctinyint),
COUNT(ctinyint),
COUNT(*)
FROM alltypesparquet
ORDER BY c1;
SELECT MIN(ctinyint) as c1,
MAX(ctinyint),
COUNT(ctinyint),
COUNT(*)
FROM alltypesparquet
ORDER BY c1;
EXPLAIN VECTORIZATION EXPRESSION
SELECT SUM(ctinyint) as c1
FROM alltypesparquet
ORDER BY c1;
SELECT SUM(ctinyint) as c1
FROM alltypesparquet
ORDER BY c1;
EXPLAIN VECTORIZATION
SELECT
avg(ctinyint) as c1,
variance(ctinyint),
var_pop(ctinyint),
var_samp(ctinyint),
std(ctinyint),
stddev(ctinyint),
stddev_pop(ctinyint),
stddev_samp(ctinyint)
FROM alltypesparquet
ORDER BY c1;
SELECT
avg(ctinyint) as c1,
variance(ctinyint),
var_pop(ctinyint),
var_samp(ctinyint),
std(ctinyint),
stddev(ctinyint),
stddev_pop(ctinyint),
stddev_samp(ctinyint)
FROM alltypesparquet
ORDER BY c1;
EXPLAIN VECTORIZATION EXPRESSION
SELECT MIN(cbigint) as c1,
MAX(cbigint),
COUNT(cbigint),
COUNT(*)
FROM alltypesparquet
ORDER BY c1;
SELECT MIN(cbigint) as c1,
MAX(cbigint),
COUNT(cbigint),
COUNT(*)
FROM alltypesparquet
ORDER BY c1;
EXPLAIN VECTORIZATION EXPRESSION
SELECT SUM(cbigint) as c1
FROM alltypesparquet
ORDER BY c1;
SELECT SUM(cbigint) as c1
FROM alltypesparquet
ORDER BY c1;
EXPLAIN VECTORIZATION
SELECT
avg(cbigint) as c1,
variance(cbigint),
var_pop(cbigint),
var_samp(cbigint),
std(cbigint),
stddev(cbigint),
stddev_pop(cbigint),
stddev_samp(cbigint)
FROM alltypesparquet
ORDER BY c1;
SELECT
avg(cbigint) as c1,
variance(cbigint),
var_pop(cbigint),
var_samp(cbigint),
std(cbigint),
stddev(cbigint),
stddev_pop(cbigint),
stddev_samp(cbigint)
FROM alltypesparquet
ORDER BY c1;
EXPLAIN VECTORIZATION EXPRESSION
SELECT MIN(cfloat) as c1,
MAX(cfloat),
COUNT(cfloat),
COUNT(*)
FROM alltypesparquet
ORDER BY c1;
SELECT MIN(cfloat) as c1,
MAX(cfloat),
COUNT(cfloat),
COUNT(*)
FROM alltypesparquet
ORDER BY c1;
EXPLAIN VECTORIZATION EXPRESSION
SELECT SUM(cfloat) as c1
FROM alltypesparquet
ORDER BY c1;
SELECT SUM(cfloat) as c1
FROM alltypesparquet
ORDER BY c1;
EXPLAIN VECTORIZATION
SELECT
avg(cfloat) as c1,
variance(cfloat),
var_pop(cfloat),
var_samp(cfloat),
std(cfloat),
stddev(cfloat),
stddev_pop(cfloat),
stddev_samp(cfloat)
FROM alltypesparquet
ORDER BY c1;
SELECT
avg(cfloat) as c1,
variance(cfloat),
var_pop(cfloat),
var_samp(cfloat),
std(cfloat),
stddev(cfloat),
stddev_pop(cfloat),
stddev_samp(cfloat)
FROM alltypesparquet
ORDER BY c1;
EXPLAIN VECTORIZATION EXPRESSION
SELECT AVG(cbigint),
(-(AVG(cbigint))),
(-6432 + AVG(cbigint)),
STDDEV_POP(cbigint),
(-((-6432 + AVG(cbigint)))),
((-((-6432 + AVG(cbigint)))) + (-6432 + AVG(cbigint))),
VAR_SAMP(cbigint),
(-((-6432 + AVG(cbigint)))),
(-6432 + (-((-6432 + AVG(cbigint))))),
(-((-6432 + AVG(cbigint)))),
((-((-6432 + AVG(cbigint)))) / (-((-6432 + AVG(cbigint))))),
COUNT(*),
SUM(cfloat),
(VAR_SAMP(cbigint) % STDDEV_POP(cbigint)),
(-(VAR_SAMP(cbigint))),
((-((-6432 + AVG(cbigint)))) * (-(AVG(cbigint)))),
MIN(ctinyint),
(-(MIN(ctinyint)))
FROM alltypesparquet
WHERE (((cstring2 LIKE '%b%')
OR ((79.553 != cint)
OR (cbigint < cdouble)))
OR ((ctinyint >= csmallint)
AND ((cboolean2 = 1)
AND (3569 = ctinyint))));
SELECT AVG(cbigint),
(-(AVG(cbigint))),
(-6432 + AVG(cbigint)),
STDDEV_POP(cbigint),
(-((-6432 + AVG(cbigint)))),
((-((-6432 + AVG(cbigint)))) + (-6432 + AVG(cbigint))),
VAR_SAMP(cbigint),
(-((-6432 + AVG(cbigint)))),
(-6432 + (-((-6432 + AVG(cbigint))))),
(-((-6432 + AVG(cbigint)))),
((-((-6432 + AVG(cbigint)))) / (-((-6432 + AVG(cbigint))))),
COUNT(*),
SUM(cfloat),
(VAR_SAMP(cbigint) % STDDEV_POP(cbigint)),
(-(VAR_SAMP(cbigint))),
((-((-6432 + AVG(cbigint)))) * (-(AVG(cbigint)))),
MIN(ctinyint),
(-(MIN(ctinyint)))
FROM alltypesparquet
WHERE (((cstring2 LIKE '%b%')
OR ((79.553 != cint)
OR (cbigint < cdouble)))
OR ((ctinyint >= csmallint)
AND ((cboolean2 = 1)
AND (3569 = ctinyint))));
EXPLAIN extended
select count(*) from alltypesparquet
where (((cstring1 LIKE 'a%') or ((cstring1 like 'b%') or (cstring1 like 'c%'))) or
((length(cstring1) < 50 ) and ((cstring1 like '%n') and (length(cstring1) > 0))));
select count(*) from alltypesparquet
where (((cstring1 LIKE 'a%') or ((cstring1 like 'b%') or (cstring1 like 'c%'))) or
((length(cstring1) < 50 ) and ((cstring1 like '%n') and (length(cstring1) > 0))));
set hive.vectorized.execution.enabled=true;
set hive.compute.query.using.stats=false;
select min(ctinyint), max(ctinyint), sum(ctinyint), avg(ctinyint) from alltypesparquet;
select min(csmallint), max(csmallint), sum(csmallint), avg(csmallint) from alltypesparquet;
select min(cint), max(cint), sum(cint), avg(cint) from alltypesparquet;
select min(cbigint), max(cbigint), sum(cbigint), avg(cbigint) from alltypesparquet;
select min(cdouble), max(cdouble), sum(cdouble), avg(cdouble) from alltypesparquet;
select distinct cstring1 from alltypesparquet;
select distinct cstring1, ctinyint from alltypesparquet;
select cstring1, max(cbigint) from alltypesparquet
group by cstring1
order by cstring1 desc;
set hive.vectorized.execution.reduce.enabled=true;
set hive.vectorized.execution.reduce.groupby.enabled=true;
select cstring1, cint, ctinyint from alltypesparquet
where cstring1 > 'religion';
select cstring1, cint, ctinyint from alltypesparquet where cstring1 <> 'religion';
select ctinyint, csmallint, cint, cbigint, cdouble, cdouble, cstring1 from alltypesparquet
where ctinyint > 0 and csmallint > 0 and cint > 0 and cbigint > 0 and
cfloat > 0.0 and cdouble > 0.0 and cstring1 > 'm';
set hive.optimize.point.lookup=false;
--test to make sure multi and/or expressions are being vectorized
explain extended select * from alltypesparquet where
(cint=49 and cfloat=3.5) or
(cint=47 and cfloat=2.09) or
(cint=45 and cfloat=3.02);
set hive.optimize.point.lookup=true;
set hive.optimize.point.lookup.min=1;
explain extended select * from alltypesparquet where
(cint=49 and cfloat=3.5) or
(cint=47 and cfloat=2.09) or
(cint=45 and cfloat=3.02);
explain extended select * from alltypesparquet where
(cint=49 or cfloat=3.5) and
(cint=47 or cfloat=2.09) and
(cint=45 or cfloat=3.02);
explain extended select count(*),cstring1 from alltypesparquet where cstring1='biology'
or cstring1='history'
or cstring1='topology' group by cstring1 order by cstring1;
drop table if exists cast_string_to_int_1;
drop table if exists cast_string_to_int_2;
create table cast_string_to_int_1 as select CAST(CAST(key as float) as string),value from srcbucket;
create table cast_string_to_int_2(i int,s string);
insert overwrite table cast_string_to_int_2 select * from cast_string_to_int_1;
--moving ALL_1 system test here
select all key from src;