DRILL-7405: Avoiding download of TPC-H data
closes #1874
diff --git a/contrib/data/tpch-sample-data/bin/pom.xml b/contrib/data/tpch-sample-data/bin/pom.xml
deleted file mode 100644
index 9afb8f1..0000000
--- a/contrib/data/tpch-sample-data/bin/pom.xml
+++ /dev/null
@@ -1,140 +0,0 @@
-<?xml version="1.0"?>
-<!--
-
- Licensed to the Apache Software Foundation (ASF) under one
- or more contributor license agreements. See the NOTICE file
- distributed with this work for additional information
- regarding copyright ownership. The ASF licenses this file
- to you under the Apache License, Version 2.0 (the
- "License"); you may not use this file except in compliance
- with the License. You may obtain a copy of the License at
-
- http://www.apache.org/licenses/LICENSE-2.0
-
- Unless required by applicable law or agreed to in writing, software
- distributed under the License is distributed on an "AS IS" BASIS,
- WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- See the License for the specific language governing permissions and
- limitations under the License.
-
--->
-<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
- xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
- <modelVersion>4.0.0</modelVersion>
- <parent>
- <artifactId>drill-contrib-data-parent</artifactId>
- <groupId>org.apache.drill.contrib.data</groupId>
- <version>0.8.0-SNAPSHOT</version>
- </parent>
-
- <artifactId>tpch-sample-data</artifactId>
- <name>contrib/data/tpch-sample-data</name>
- <packaging>jar</packaging>
-
- <dependencies>
- </dependencies>
- <build>
- <plugins>
- <plugin>
- <groupId>com.googlecode.maven-download-plugin</groupId>
- <artifactId>maven-download-plugin</artifactId>
- <version>1.1.0</version>
- <executions>
- <execution>
- <id>install-tgz</id>
- <phase>package</phase>
- <goals>
- <goal>wget</goal>
- </goals>
- <configuration>
- <url>http://apache-drill.s3.amazonaws.com/files/sf-0.01_tpc-h_parquet.tgz</url>
- <outputFileName>tpch.tgz</outputFileName>
- <unpack>true</unpack>
- <outputDirectory>${project.build.directory}</outputDirectory>
- </configuration>
- </execution>
- </executions>
- </plugin>
-
- <plugin>
- <groupId>org.codehaus.mojo</groupId>
- <artifactId>truezip-maven-plugin</artifactId>
- <version>1.0</version>
- <executions>
- <execution>
- <id>copy-out-files</id>
- <goals>
- <goal>copy</goal>
- </goals>
- <phase>package</phase>
- <configuration>
-<!-- <from>${project.build.directory}/tpch.tgz</from> -->
-<!-- <to>${project.build.directory}/data/</to> -->
- </configuration>
- </execution>
-
- <execution>
- <id>copy-out-fileset</id>
- <goals>
- <goal>copy</goal>
- </goals>
- <phase>package</phase>
- <configuration>
- <fileset>
- <directory>${project.build.directory}/tpch.tgz</directory>
- <outputDirectory>${project.build.directory}/data</outputDirectory>
- </fileset>
- </configuration>
- </execution>
-
-<!-- <execution> -->
-<!-- <id>copy-out-fileset</id> -->
-<!-- <goals> -->
-<!-- <goal>copy</goal> -->
-<!-- </goals> -->
-<!-- <phase>package</phase> -->
-<!-- <configuration> -->
-<!-- <fileset> -->
-<!-- <directory>${archive}</directory> -->
-<!-- <excludes> -->
-<!-- <exclude>**/pom.properties</exclude> -->
-<!-- </excludes> -->
-<!-- <outputDirectory>${project.build.directory}/copy-fileset</outputDirectory> -->
-<!-- </fileset> -->
-<!-- </configuration> -->
-<!-- </execution> -->
-
- <!-- <execution> -->
- <!-- <id>copy-into</id> -->
- <!-- <goals> -->
- <!-- <goal>copy</goal> -->
- <!-- </goals> -->
- <!-- <phase>package</phase> -->
- <!-- <configuration> -->
- <!-- <fileset> -->
- <!-- <directory>${basedir}</directory> -->
- <!-- <includes> -->
- <!-- <include>*</include> -->
- <!-- </includes> -->
- <!-- <outputDirectory>${archive}/copy-into</outputDirectory> -->
- <!-- </fileset> -->
- <!-- </configuration> -->
- <!-- </execution> -->
- </executions>
- </plugin>
- </plugins>
- </build>
- <pluginRepositories>
- <pluginRepository>
- <id>sonatype-public-repository</id>
- <url>https://oss.sonatype.org/content/groups/public</url>
- <snapshots>
- <enabled>true</enabled>
- </snapshots>
- <releases>
- <enabled>true</enabled>
- </releases>
- </pluginRepository>
- </pluginRepositories>
-
-</project>
diff --git a/contrib/data/tpch-sample-data/parquet/customer.parquet b/contrib/data/tpch-sample-data/parquet/customer.parquet
new file mode 100755
index 0000000..25c6553
--- /dev/null
+++ b/contrib/data/tpch-sample-data/parquet/customer.parquet
Binary files differ
diff --git a/contrib/data/tpch-sample-data/parquet/lineitem.parquet b/contrib/data/tpch-sample-data/parquet/lineitem.parquet
new file mode 100755
index 0000000..7af0a72
--- /dev/null
+++ b/contrib/data/tpch-sample-data/parquet/lineitem.parquet
Binary files differ
diff --git a/contrib/data/tpch-sample-data/parquet/nation.parquet b/contrib/data/tpch-sample-data/parquet/nation.parquet
new file mode 100755
index 0000000..29f2c22
--- /dev/null
+++ b/contrib/data/tpch-sample-data/parquet/nation.parquet
Binary files differ
diff --git a/contrib/data/tpch-sample-data/parquet/orders.parquet b/contrib/data/tpch-sample-data/parquet/orders.parquet
new file mode 100755
index 0000000..3c728ac
--- /dev/null
+++ b/contrib/data/tpch-sample-data/parquet/orders.parquet
Binary files differ
diff --git a/contrib/data/tpch-sample-data/parquet/part.parquet b/contrib/data/tpch-sample-data/parquet/part.parquet
new file mode 100755
index 0000000..e86fe08
--- /dev/null
+++ b/contrib/data/tpch-sample-data/parquet/part.parquet
Binary files differ
diff --git a/contrib/data/tpch-sample-data/parquet/partsupp.parquet b/contrib/data/tpch-sample-data/parquet/partsupp.parquet
new file mode 100755
index 0000000..3321245
--- /dev/null
+++ b/contrib/data/tpch-sample-data/parquet/partsupp.parquet
Binary files differ
diff --git a/contrib/data/tpch-sample-data/parquet/region.parquet b/contrib/data/tpch-sample-data/parquet/region.parquet
new file mode 100755
index 0000000..2994a58
--- /dev/null
+++ b/contrib/data/tpch-sample-data/parquet/region.parquet
Binary files differ
diff --git a/contrib/data/tpch-sample-data/parquet/supplier.parquet b/contrib/data/tpch-sample-data/parquet/supplier.parquet
new file mode 100755
index 0000000..00bc5c0
--- /dev/null
+++ b/contrib/data/tpch-sample-data/parquet/supplier.parquet
Binary files differ
diff --git a/contrib/data/tpch-sample-data/pom.xml b/contrib/data/tpch-sample-data/pom.xml
index 128c3e4..47286b7 100644
--- a/contrib/data/tpch-sample-data/pom.xml
+++ b/contrib/data/tpch-sample-data/pom.xml
@@ -18,7 +18,8 @@
limitations under the License.
-->
-<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
+<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+ xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
<modelVersion>4.0.0</modelVersion>
<parent>
<artifactId>drill-contrib-data-parent</artifactId>
@@ -35,21 +36,23 @@
<build>
<plugins>
<plugin>
- <groupId>com.googlecode.maven-download-plugin</groupId>
- <artifactId>download-maven-plugin</artifactId>
- <version>1.2.0</version>
+ <artifactId>maven-resources-plugin</artifactId>
<executions>
<execution>
- <id>install-tgz</id>
- <phase>prepare-package</phase>
+ <id>copy-tpch-data</id>
+ <phase>process-resources</phase>
<goals>
- <goal>wget</goal>
+ <goal>copy-resources</goal>
</goals>
<configuration>
- <url>http://apache-drill.s3.amazonaws.com/files/sf-0.01_tpc-h_parquet_typed.tgz</url>
- <outputFileName>tpch.tgz</outputFileName>
- <unpack>true</unpack>
- <outputDirectory>${project.build.directory}/classes/tpch</outputDirectory>
+ <!-- Copy the checked-in parquet files, unfiltered because they are binary, into classes/tpch. -->
+ <outputDirectory>${project.build.directory}/classes/tpch</outputDirectory>
+ <resources>
+ <resource>
+ <directory>parquet</directory>
+ <filtering>false</filtering>
+ </resource>
+ </resources>
</configuration>
</execution>
</executions>