-- blob: 9cca2f47f62424eadf3bd5eb02beaef8c780258c [file] [log] [blame]
-- Session setup shared by every query in this script.
-- Run in nonstrict mode.
set hive.mapred.mode = nonstrict;
-- Switch the query results cache off.
set hive.query.results.cache.enabled = false;
-- Switch hive.explain.user off.
set hive.explain.user = false;
-- Fixture 1: stage compressed_4line_file1.csv (a plain .csv file) in the testcase1
-- directory under the test tmp dir.
dfs ${system:test.dfs.mkdir} ${system:test.tmp.dir}/testcase1;
dfs -copyFromLocal ../../data/files/compressed_4line_file1.csv ${system:test.tmp.dir}/testcase1/;
-- testcase1, testcase2 and testcase3 are external OpenCSVSerde tables over that one
-- shared directory. They differ only in their header and footer skip counts.
-- testcase1: skip one header line and one footer line.
CREATE EXTERNAL TABLE `testcase1`(id int, name string) ROW FORMAT SERDE 'org.apache.hadoop.hive.serde2.OpenCSVSerde'
LOCATION '${system:test.tmp.dir}/testcase1'
TBLPROPERTIES ("skip.header.line.count"="1", "skip.footer.line.count"="1");
-- testcase2: skip one header line and no footer lines.
CREATE EXTERNAL TABLE `testcase2`(id int, name string) ROW FORMAT SERDE 'org.apache.hadoop.hive.serde2.OpenCSVSerde'
LOCATION '${system:test.tmp.dir}/testcase1'
TBLPROPERTIES ("skip.header.line.count"="1", "skip.footer.line.count"="0");
-- testcase3: skip no header lines and one footer line.
CREATE EXTERNAL TABLE `testcase3`(id int, name string) ROW FORMAT SERDE 'org.apache.hadoop.hive.serde2.OpenCSVSerde'
LOCATION '${system:test.tmp.dir}/testcase1'
TBLPROPERTIES ("skip.header.line.count"="0", "skip.footer.line.count"="1");
-- Pass 1: read testcase1-3 with hive.fetch.task.conversion = more.
-- Each table gets a full row dump plus a row count.
-- NOTE(review): presumably more lets the simple selects run as a fetch task while none
-- forces a regular job, so both read paths get covered - confirm against the Hive
-- configuration docs.
SET hive.fetch.task.conversion = more;
select * from testcase1;
select count(*) from testcase1;
select * from testcase2;
select count(*) from testcase2;
select * from testcase3;
select count(*) from testcase3;
-- Pass 2: the same six queries with hive.fetch.task.conversion = none.
SET hive.fetch.task.conversion = none;
select * from testcase1;
select count(*) from testcase1;
select * from testcase2;
select count(*) from testcase2;
select * from testcase3;
select count(*) from testcase3;
-- Fixture 2: stage the bzip2 file compressed_4line_file2.csv.bz2 three times, once in
-- each of the directories testcase2, testcase3 and testcase4 under the test tmp dir.
dfs ${system:test.dfs.mkdir} ${system:test.tmp.dir}/testcase2;
dfs ${system:test.dfs.mkdir} ${system:test.tmp.dir}/testcase3;
dfs ${system:test.dfs.mkdir} ${system:test.tmp.dir}/testcase4;
dfs -copyFromLocal ../../data/files/compressed_4line_file2.csv.bz2 ${system:test.tmp.dir}/testcase2/;
dfs -copyFromLocal ../../data/files/compressed_4line_file2.csv.bz2 ${system:test.tmp.dir}/testcase3/;
dfs -copyFromLocal ../../data/files/compressed_4line_file2.csv.bz2 ${system:test.tmp.dir}/testcase4/;
-- Unlike testcase1-3, which share one directory, each table below points at its own copy
-- of the file. Per the original note, the data is stored encoded in the cache, so
-- separate tables over separate locations are needed.
-- Table names and directory names are offset by two:
-- table testcase4 reads directory testcase2, testcase5 reads testcase3, testcase6 reads testcase4.
-- testcase4: skip one header line and one footer line.
CREATE EXTERNAL TABLE `testcase4`(id int, name string) ROW FORMAT SERDE 'org.apache.hadoop.hive.serde2.OpenCSVSerde'
LOCATION '${system:test.tmp.dir}/testcase2'
TBLPROPERTIES ("skip.header.line.count"="1", "skip.footer.line.count"="1");
-- testcase5: skip one header line and no footer lines.
CREATE EXTERNAL TABLE `testcase5`(id int, name string) ROW FORMAT SERDE 'org.apache.hadoop.hive.serde2.OpenCSVSerde'
LOCATION '${system:test.tmp.dir}/testcase3'
TBLPROPERTIES ("skip.header.line.count"="1", "skip.footer.line.count"="0");
-- testcase6: skip no header lines and one footer line.
CREATE EXTERNAL TABLE `testcase6`(id int, name string) ROW FORMAT SERDE 'org.apache.hadoop.hive.serde2.OpenCSVSerde'
LOCATION '${system:test.tmp.dir}/testcase4'
TBLPROPERTIES ("skip.header.line.count"="0", "skip.footer.line.count"="1");
-- Pass 1 over the bzip2 tables: hive.fetch.task.conversion = more.
-- Each of testcase4-6 gets a full row dump plus a row count.
SET hive.fetch.task.conversion = more;
select * from testcase4;
select count(*) from testcase4;
select * from testcase5;
select count(*) from testcase5;
select * from testcase6;
select count(*) from testcase6;
-- Pass 2 over the bzip2 tables: the same six queries with hive.fetch.task.conversion = none.
SET hive.fetch.task.conversion = none;
select * from testcase4;
select count(*) from testcase4;
select * from testcase5;
select count(*) from testcase5;
select * from testcase6;
select count(*) from testcase6;
-- Fixture 3: stage the gzip file test.csv.gz in the testcase_gz directory under the
-- test tmp dir.
dfs ${system:test.dfs.mkdir} ${system:test.tmp.dir}/testcase_gz;
dfs -copyFromLocal ../../data/files/test.csv.gz ${system:test.tmp.dir}/testcase_gz/;
-- testcase_gz differs from the tables above: it is created without the EXTERNAL keyword
-- and reads comma-delimited text rows instead of going through OpenCSVSerde.
-- It skips one header line and one footer line.
create table testcase_gz(age int, name string)
ROW FORMAT DELIMITED FIELDS TERMINATED BY ',' LINES TERMINATED BY '\n'
stored as textfile LOCATION '${system:test.tmp.dir}/testcase_gz'
TBLPROPERTIES ("skip.header.line.count"="1", "skip.footer.line.count"="1");
-- Pass 1 over the gzip table: row dump and row count with hive.fetch.task.conversion = more.
SET hive.fetch.task.conversion = more;
select * from testcase_gz;
select count(*) from testcase_gz;
-- Pass 2 over the gzip table: the same two queries with hive.fetch.task.conversion = none.
set hive.fetch.task.conversion=none;
select * from testcase_gz;
select count(*) from testcase_gz;
-- Clean up test data: recursively delete every directory this script staged under the
-- test tmp dir (testcase_gz plus testcase1 through testcase4).
-- Uses the rm -r form of the recursive delete because the older rmr spelling is
-- deprecated in the Hadoop filesystem shell.
dfs -rm -r ${system:test.tmp.dir}/testcase_gz;
dfs -rm -r ${system:test.tmp.dir}/testcase1/;
dfs -rm -r ${system:test.tmp.dir}/testcase2/;
dfs -rm -r ${system:test.tmp.dir}/testcase3/;
dfs -rm -r ${system:test.tmp.dir}/testcase4/;