This is an automated email from the ASF dual-hosted git repository. arina pushed a commit to branch master in repository https://gitbox.apache.org/repos/asf/drill.git
commit 849e2b67d6f86090c70184051c596f0b1c8f15de Author: Abhishek Girish <agir...@apache.org> AuthorDate: Wed Oct 16 20:24:27 2019 -0700 DRILL-7405: Avoiding download of TPC-H data closes #1874 --- contrib/data/tpch-sample-data/bin/pom.xml | 140 --------------------- .../data/tpch-sample-data/parquet/customer.parquet | Bin 0 -> 132891 bytes .../data/tpch-sample-data/parquet/lineitem.parquet | Bin 0 -> 2839887 bytes .../data/tpch-sample-data/parquet/nation.parquet | Bin 0 -> 1845 bytes .../data/tpch-sample-data/parquet/orders.parquet | Bin 0 -> 661050 bytes contrib/data/tpch-sample-data/parquet/part.parquet | Bin 0 -> 93889 bytes .../data/tpch-sample-data/parquet/partsupp.parquet | Bin 0 -> 449294 bytes .../data/tpch-sample-data/parquet/region.parquet | Bin 0 -> 617 bytes .../data/tpch-sample-data/parquet/supplier.parquet | Bin 0 -> 9699 bytes contrib/data/tpch-sample-data/pom.xml | 25 ++-- 10 files changed, 14 insertions(+), 151 deletions(-) diff --git a/contrib/data/tpch-sample-data/bin/pom.xml b/contrib/data/tpch-sample-data/bin/pom.xml deleted file mode 100644 index 9afb8f1..0000000 --- a/contrib/data/tpch-sample-data/bin/pom.xml +++ /dev/null @@ -1,140 +0,0 @@ -<?xml version="1.0"?> -<!-- - - Licensed to the Apache Software Foundation (ASF) under one - or more contributor license agreements. See the NOTICE file - distributed with this work for additional information - regarding copyright ownership. The ASF licenses this file - to you under the Apache License, Version 2.0 (the - "License"); you may not use this file except in compliance - with the License. You may obtain a copy of the License at - - http://www.apache.org/licenses/LICENSE-2.0 - - Unless required by applicable law or agreed to in writing, software - distributed under the License is distributed on an "AS IS" BASIS, - WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - See the License for the specific language governing permissions and - limitations under the License. 
- ---> -<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" - xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd"> - <modelVersion>4.0.0</modelVersion> - <parent> - <artifactId>drill-contrib-data-parent</artifactId> - <groupId>org.apache.drill.contrib.data</groupId> - <version>0.8.0-SNAPSHOT</version> - </parent> - - <artifactId>tpch-sample-data</artifactId> - <name>contrib/data/tpch-sample-data</name> - <packaging>jar</packaging> - - <dependencies> - </dependencies> - <build> - <plugins> - <plugin> - <groupId>com.googlecode.maven-download-plugin</groupId> - <artifactId>maven-download-plugin</artifactId> - <version>1.1.0</version> - <executions> - <execution> - <id>install-tgz</id> - <phase>package</phase> - <goals> - <goal>wget</goal> - </goals> - <configuration> - <url>http://apache-drill.s3.amazonaws.com/files/sf-0.01_tpc-h_parquet.tgz</url> - <outputFileName>tpch.tgz</outputFileName> - <unpack>true</unpack> - <outputDirectory>${project.build.directory}</outputDirectory> - </configuration> - </execution> - </executions> - </plugin> - - <plugin> - <groupId>org.codehaus.mojo</groupId> - <artifactId>truezip-maven-plugin</artifactId> - <version>1.0</version> - <executions> - <execution> - <id>copy-out-files</id> - <goals> - <goal>copy</goal> - </goals> - <phase>package</phase> - <configuration> -<!-- <from>${project.build.directory}/tpch.tgz</from> --> -<!-- <to>${project.build.directory}/data/</to> --> - </configuration> - </execution> - - <execution> - <id>copy-out-fileset</id> - <goals> - <goal>copy</goal> - </goals> - <phase>package</phase> - <configuration> - <fileset> - <directory>${project.build.directory}/tpch.tgz</directory> - <outputDirectory>${project.build.directory}/data</outputDirectory> - </fileset> - </configuration> - </execution> - -<!-- <execution> --> -<!-- <id>copy-out-fileset</id> --> -<!-- <goals> --> -<!-- <goal>copy</goal> --> -<!-- </goals> 
--> -<!-- <phase>package</phase> --> -<!-- <configuration> --> -<!-- <fileset> --> -<!-- <directory>${archive}</directory> --> -<!-- <excludes> --> -<!-- <exclude>**/pom.properties</exclude> --> -<!-- </excludes> --> -<!-- <outputDirectory>${project.build.directory}/copy-fileset</outputDirectory> --> -<!-- </fileset> --> -<!-- </configuration> --> -<!-- </execution> --> - - <!-- <execution> --> - <!-- <id>copy-into</id> --> - <!-- <goals> --> - <!-- <goal>copy</goal> --> - <!-- </goals> --> - <!-- <phase>package</phase> --> - <!-- <configuration> --> - <!-- <fileset> --> - <!-- <directory>${basedir}</directory> --> - <!-- <includes> --> - <!-- <include>*</include> --> - <!-- </includes> --> - <!-- <outputDirectory>${archive}/copy-into</outputDirectory> --> - <!-- </fileset> --> - <!-- </configuration> --> - <!-- </execution> --> - </executions> - </plugin> - </plugins> - </build> - <pluginRepositories> - <pluginRepository> - <id>sonatype-public-repository</id> - <url>https://oss.sonatype.org/content/groups/public</url> - <snapshots> - <enabled>true</enabled> - </snapshots> - <releases> - <enabled>true</enabled> - </releases> - </pluginRepository> - </pluginRepositories> - -</project> diff --git a/contrib/data/tpch-sample-data/parquet/customer.parquet b/contrib/data/tpch-sample-data/parquet/customer.parquet new file mode 100755 index 0000000..25c6553 Binary files /dev/null and b/contrib/data/tpch-sample-data/parquet/customer.parquet differ diff --git a/contrib/data/tpch-sample-data/parquet/lineitem.parquet b/contrib/data/tpch-sample-data/parquet/lineitem.parquet new file mode 100755 index 0000000..7af0a72 Binary files /dev/null and b/contrib/data/tpch-sample-data/parquet/lineitem.parquet differ diff --git a/contrib/data/tpch-sample-data/parquet/nation.parquet b/contrib/data/tpch-sample-data/parquet/nation.parquet new file mode 100755 index 0000000..29f2c22 Binary files /dev/null and b/contrib/data/tpch-sample-data/parquet/nation.parquet differ diff --git 
a/contrib/data/tpch-sample-data/parquet/orders.parquet b/contrib/data/tpch-sample-data/parquet/orders.parquet new file mode 100755 index 0000000..3c728ac Binary files /dev/null and b/contrib/data/tpch-sample-data/parquet/orders.parquet differ diff --git a/contrib/data/tpch-sample-data/parquet/part.parquet b/contrib/data/tpch-sample-data/parquet/part.parquet new file mode 100755 index 0000000..e86fe08 Binary files /dev/null and b/contrib/data/tpch-sample-data/parquet/part.parquet differ diff --git a/contrib/data/tpch-sample-data/parquet/partsupp.parquet b/contrib/data/tpch-sample-data/parquet/partsupp.parquet new file mode 100755 index 0000000..3321245 Binary files /dev/null and b/contrib/data/tpch-sample-data/parquet/partsupp.parquet differ diff --git a/contrib/data/tpch-sample-data/parquet/region.parquet b/contrib/data/tpch-sample-data/parquet/region.parquet new file mode 100755 index 0000000..2994a58 Binary files /dev/null and b/contrib/data/tpch-sample-data/parquet/region.parquet differ diff --git a/contrib/data/tpch-sample-data/parquet/supplier.parquet b/contrib/data/tpch-sample-data/parquet/supplier.parquet new file mode 100755 index 0000000..00bc5c0 Binary files /dev/null and b/contrib/data/tpch-sample-data/parquet/supplier.parquet differ diff --git a/contrib/data/tpch-sample-data/pom.xml b/contrib/data/tpch-sample-data/pom.xml index 128c3e4..47286b7 100644 --- a/contrib/data/tpch-sample-data/pom.xml +++ b/contrib/data/tpch-sample-data/pom.xml @@ -18,7 +18,8 @@ limitations under the License. 
 -->
-<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
+<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+  xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
   <modelVersion>4.0.0</modelVersion>
   <parent>
     <artifactId>drill-contrib-data-parent</artifactId>
@@ -35,21 +36,23 @@
   <build>
     <plugins>
       <plugin>
-        <groupId>com.googlecode.maven-download-plugin</groupId>
-        <artifactId>download-maven-plugin</artifactId>
-        <version>1.2.0</version>
+        <artifactId>maven-resources-plugin</artifactId>
         <executions>
           <execution>
-            <id>install-tgz</id>
-            <phase>prepare-package</phase>
+            <id>copy-tpch-data</id>
+            <phase>process-resources</phase>
             <goals>
-              <goal>wget</goal>
+              <goal>copy-resources</goal>
             </goals>
             <configuration>
-              <url>http://apache-drill.s3.amazonaws.com/files/sf-0.01_tpc-h_parquet_typed.tgz</url>
-              <outputFileName>tpch.tgz</outputFileName>
-              <unpack>true</unpack>
-              <outputDirectory>${project.build.directory}/classes/tpch</outputDirectory>
+              <outputDirectory>${basedir}/target/classes/tpch
+              </outputDirectory>
+              <resources>
+                <resource>
+                  <directory>parquet</directory>
+                  <filtering>false</filtering>
+                </resource>
+              </resources>
             </configuration>
           </execution>
         </executions>