blob: f5a24e462b74219d4683c9ef3e1dab85218b0bc8 [file] [log] [blame]
#!/usr/bin/env bash
#
# Licensed to the Apache Software Foundation (ASF) under one or more
# contributor license agreements. See the NOTICE file distributed with
# this work for additional information regarding copyright ownership.
# The ASF licenses this file to You under the Apache License, Version 2.0
# (the "License"); you may not use this file except in compliance with
# the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
# Set up environment and working directory
cd /apache-arrow
export ARROW_BUILD_TYPE=release
export ARROW_HOME=$(pwd)/dist
export PARQUET_HOME=$(pwd)/dist
CONDA_BASE=/home/ubuntu/miniconda
export LD_LIBRARY_PATH=$(pwd)/dist/lib:${CONDA_BASE}/lib:${LD_LIBRARY_PATH}
# Allow for --user Python installation inside Docker
export HOME=$(pwd)
# Clean up and get the dask master branch from github
rm -rf dask .local
export GIT_COMMITTER_NAME="Nobody"
export GIT_COMMITTER_EMAIL="nobody@nowhere.com"
git clone https://github.com/dask/dask.git
pushd dask
pip install --user -e .[complete]
# Verify integrity of the installed dask dataframe code
py.test dask/dataframe/tests/test_dataframe.py
popd
# Run the integration test
pushd arrow/python/testing
py.test dask_tests
popd
pushd dask/dask/dataframe/io
py.test tests/test_parquet.py
popd