| #!/usr/bin/env bash |
| # |
| # Licensed to the Apache Software Foundation (ASF) under one |
| # or more contributor license agreements. See the NOTICE file |
| # distributed with this work for additional information |
| # regarding copyright ownership. The ASF licenses this file |
| # to you under the Apache License, Version 2.0 (the |
| # "License"); you may not use this file except in compliance |
| # with the License. You may obtain a copy of the License at |
| # |
| # http://www.apache.org/licenses/LICENSE-2.0 |
| # |
| # Unless required by applicable law or agreed to in writing, |
| # software distributed under the License is distributed on an |
| # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
| # KIND, either express or implied. See the License for the |
| # specific language governing permissions and limitations |
| # under the License. |
| |
| set -e |
| |
| # check that optional pyarrow modules are available |
| # because pytest would just skip the dask tests |
| python -c "import pyarrow.orc" |
| python -c "import pyarrow.parquet" |
| |
| # check that dask.dataframe is correctly installed |
| python -c "import dask.dataframe" |
| |
| # TODO(kszucs): the following tests are also uses pyarrow |
| # pytest -sv --pyargs dask.bytes.tests.test_hdfs |
| # pytest -sv --pyargs dask.bytes.tests.test_local |
| |
| # The "skip_with_pyarrow_strings" marker is meant to skip automatically, but that doesn't work with --pyargs, so de-selecting manually |
| # - The 'test_categorize_info' test is failing because of change in StringArray's nbytes and |
| # an upstream fix (https://github.com/apache/arrow/issues/39028) |
| # - The 'test_describe_empty' test is flakey |
| # upstream issue: https://github.com/dask/dask/issues/10672 |
| # - The 'test_view' fails because we are not using the dev version of pandas |
| # where pd.Series.view is deprecated (https://pandas.pydata.org/docs/dev/reference/api/pandas.Series.view.html) |
| pytest -v --pyargs dask.dataframe.tests.test_dataframe -m "not skip_with_pyarrow_strings" \ |
| -k "not test_categorize_info and not test_describe_empty and not test_view" |
| pytest -v --pyargs dask.dataframe.io.tests.test_orc |
| pytest -v --pyargs dask.dataframe.io.tests.test_parquet \ |
| -m "not skip_with_pyarrow_strings and not xfail_with_pyarrow_strings" |
| # this file contains parquet tests that use S3 filesystem |
| pytest -v --pyargs dask.bytes.tests.test_s3 |