| # Licensed to the Apache Software Foundation (ASF) under one |
| # or more contributor license agreements. See the NOTICE file |
| # distributed with this work for additional information |
| # regarding copyright ownership. The ASF licenses this file |
| # to you under the Apache License, Version 2.0 (the |
| # "License"); you may not use this file except in compliance |
| # with the License. You may obtain a copy of the License at |
| # |
| # http://www.apache.org/licenses/LICENSE-2.0 |
| # |
| # Unless required by applicable law or agreed to in writing, |
| # software distributed under the License is distributed on an |
| # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
| # KIND, either express or implied. See the License for the |
| # specific language governing permissions and limitations |
| # under the License. |
| |
| name: Python |
| |
| on: |
| push: |
| branches: |
| - '**' |
| - '!dependabot/**' |
| tags: |
| - '**' |
| paths: |
| - '.dockerignore' |
| - '.github/workflows/python.yml' |
| - 'ci/**' |
| - 'cpp/**' |
| - 'compose.yaml' |
| - 'python/**' |
| pull_request: |
| paths: |
| - '.dockerignore' |
| - '.github/workflows/python.yml' |
| - 'ci/**' |
| - 'cpp/**' |
| - 'compose.yaml' |
| - 'python/**' |
| |
| concurrency: |
| group: ${{ github.repository }}-${{ github.head_ref || github.sha }}-${{ github.workflow }} |
| cancel-in-progress: true |
| |
| permissions: |
| contents: read |
| |
| env: |
| ARCHERY_DEBUG: 1 |
| DOCKER_VOLUME_PREFIX: ".docker/" |
| |
| jobs: |
| |
| docker: |
| name: ${{ matrix.title }} |
| runs-on: ubuntu-latest |
| if: ${{ !contains(github.event.pull_request.title, 'WIP') }} |
| timeout-minutes: 60 |
| strategy: |
| fail-fast: false |
| matrix: |
| name: |
| - conda-python-docs |
| - conda-python-3.11-nopandas |
| - conda-python-3.10-pandas-1.3.4 |
| - conda-python-3.13-pandas-latest |
| - conda-python-3.12-no-numpy |
| include: |
| - name: conda-python-docs |
| cache: conda-python-3.10 |
| image: conda-python-docs |
| title: AMD64 Conda Python 3.10 Sphinx & Numpydoc |
| python: "3.10" |
| - name: conda-python-3.11-nopandas |
| cache: conda-python-3.11 |
| image: conda-python |
| title: AMD64 Conda Python 3.11 Without Pandas |
| python: "3.11" |
| - name: conda-python-3.10-pandas-1.3.4 |
| cache: conda-python-3.10 |
| image: conda-python-pandas |
| title: AMD64 Conda Python 3.10 Pandas 1.3.4 |
| python: "3.10" |
| pandas: "1.3.4" |
| numpy: "1.21.2" |
| - name: conda-python-3.13-pandas-latest |
| cache: conda-python-3.13 |
| image: conda-python-pandas |
| title: AMD64 Conda Python 3.13 Pandas latest |
| python: "3.13" |
| pandas: latest |
| - name: conda-python-3.12-no-numpy |
| cache: conda-python-3.12 |
| image: conda-python-no-numpy |
| title: AMD64 Conda Python 3.12 without NumPy |
| python: "3.12" |
| env: |
| PYTHON: ${{ matrix.python || 3.10 }} |
| UBUNTU: ${{ matrix.ubuntu || 22.04 }} |
| PANDAS: ${{ matrix.pandas || 'latest' }} |
| NUMPY: ${{ matrix.numpy || 'latest' }} |
| steps: |
| - name: Checkout Arrow |
| uses: actions/checkout@v6 |
| with: |
| fetch-depth: 0 |
| submodules: recursive |
| - name: Cache Docker Volumes |
| uses: actions/cache@v5 |
| with: |
| path: .docker |
| key: ${{ matrix.cache }}-${{ hashFiles('cpp/**') }} |
| restore-keys: ${{ matrix.cache }}- |
| - name: Setup Python |
| uses: actions/setup-python@v6 |
| with: |
| python-version: 3.12 |
| - name: Setup Archery |
| run: pip install -e dev/archery[docker] |
| - name: Execute Docker Build |
| env: |
| ARCHERY_DOCKER_USER: ${{ secrets.DOCKERHUB_USER }} |
| ARCHERY_DOCKER_PASSWORD: ${{ secrets.DOCKERHUB_TOKEN }} |
| run: | |
| source ci/scripts/util_enable_core_dumps.sh |
| archery docker run ${{ matrix.image }} |
| - name: Docker Push |
| if: >- |
| success() && |
| github.event_name == 'push' && |
| github.repository == 'apache/arrow' && |
| github.ref_name == 'main' |
| env: |
| ARCHERY_DOCKER_USER: ${{ secrets.DOCKERHUB_USER }} |
| ARCHERY_DOCKER_PASSWORD: ${{ secrets.DOCKERHUB_TOKEN }} |
| continue-on-error: true |
| run: archery docker push ${{ matrix.image }} |
| |
| macos: |
| name: ${{ matrix.architecture }} macOS ${{ matrix.macos-version }} Python 3 |
| runs-on: macos-${{ matrix.macos-version }} |
| if: ${{ !contains(github.event.pull_request.title, 'WIP') }} |
| timeout-minutes: 60 |
| strategy: |
| fail-fast: false |
| matrix: |
| include: |
| - architecture: AMD64 |
| macos-version: "15-intel" |
| - architecture: ARM64 |
| macos-version: "14" |
| env: |
| ARROW_HOME: /tmp/local |
| ARROW_AZURE: ON |
| ARROW_DATASET: ON |
| ARROW_FLIGHT: ON |
| ARROW_GANDIVA: ON |
| ARROW_GCS: OFF |
| ARROW_HDFS: ON |
| ARROW_JEMALLOC: ON |
| ARROW_ORC: ON |
| ARROW_PARQUET: ON |
| PARQUET_REQUIRE_ENCRYPTION: ON |
| ARROW_PYTHON: ON |
| ARROW_S3: ON |
| ARROW_SUBSTRAIT: ON |
| ARROW_WITH_ZLIB: ON |
| ARROW_WITH_LZ4: ON |
| ARROW_WITH_BZ2: ON |
| ARROW_WITH_ZSTD: ON |
| ARROW_WITH_SNAPPY: ON |
| ARROW_WITH_BROTLI: ON |
| ARROW_BUILD_TESTS: OFF |
| PYARROW_TEST_LARGE_MEMORY: ON |
| # Current oldest supported version according to https://endoflife.date/macos |
| MACOSX_DEPLOYMENT_TARGET: 12.0 |
| steps: |
| - name: Checkout Arrow |
| uses: actions/checkout@v6 |
| with: |
| fetch-depth: 0 |
| submodules: recursive |
| - name: Setup Python |
| uses: actions/setup-python@v6 |
| with: |
| python-version: '3.11' |
| - name: Install Dependencies |
| shell: bash |
| run: | |
| # pkg-config formula is deprecated but it's still installed |
| # in GitHub Actions runner now. We can remove this once |
| # pkg-config formula is removed from GitHub Actions runner. |
| brew uninstall pkg-config || : |
| brew uninstall pkg-config@0.29.2 || : |
| brew bundle --file=cpp/Brewfile |
| |
| python -m pip install \ |
| -r python/requirements-build.txt \ |
| -r python/requirements-test.txt |
| - name: Install MinIO |
| run: | |
| $(brew --prefix bash)/bin/bash \ |
| ci/scripts/install_minio.sh latest /usr/local |
| - name: Setup ccache |
| shell: bash |
| run: ci/scripts/ccache_setup.sh |
| - name: ccache info |
| id: ccache-info |
| shell: bash |
| run: echo "cache-dir=$(ccache --get-config cache_dir)" >> $GITHUB_OUTPUT |
| - name: Cache ccache |
| uses: actions/cache@v5 |
| with: |
| path: ${{ steps.ccache-info.outputs.cache-dir }} |
| key: python-ccache-macos-${{ matrix.macos-version }}-${{ hashFiles('cpp/**', 'python/**') }} |
| restore-keys: python-ccache-macos-${{ matrix.macos-version }}- |
| - name: Build |
| shell: bash |
| run: | |
| if [ "${{ matrix.macos-version }}" = "15-intel" ]; then |
| # This is a workaround. |
| # |
| # Homebrew uses /usr/local as prefix. So packages |
| # installed by Homebrew also use /usr/local/include. We |
| # want to include headers for packages installed by |
| # Homebrew as system headers to ignore warnings in them. |
| # But "-isystem /usr/local/include" isn't used by CMake |
| # because /usr/local/include is marked as the default |
| # include path. So we disable -Werror to avoid build error |
| # by warnings from packages installed by Homebrew. |
| export BUILD_WARNING_LEVEL=PRODUCTION |
| fi |
| |
| python -m pip install wheel |
| ci/scripts/cpp_build.sh $(pwd) $(pwd)/build |
| ci/scripts/python_build.sh $(pwd) $(pwd)/build |
| - name: Test |
| shell: bash |
| run: ci/scripts/python_test.sh $(pwd) $(pwd)/build |
| |
| windows: |
| name: AMD64 Windows 2022 Python 3.13 |
| runs-on: windows-2022 |
| if: ${{ !contains(github.event.pull_request.title, 'WIP') }} |
| timeout-minutes: 60 |
| env: |
| PYTHON_CMD: "py -3.13" |
| steps: |
| - name: Disable Crash Dialogs |
| run: | |
| reg add ` |
| "HKCU\SOFTWARE\Microsoft\Windows\Windows Error Reporting" ` |
| /v DontShowUI ` |
| /t REG_DWORD ` |
| /d 1 ` |
| /f |
| - name: Checkout Arrow |
| uses: actions/checkout@v6 |
| with: |
| fetch-depth: 0 |
| submodules: recursive |
| - name: Setup Python |
| uses: actions/setup-python@v6 |
| with: |
| python-version: 3.13 |
| - name: Install ccache |
| shell: bash |
| run: | |
| ci/scripts/install_ccache.sh 4.6.3 /usr |
| - name: Setup ccache |
| shell: bash |
| run: | |
| ci/scripts/ccache_setup.sh |
| - name: Generate path variables |
| id: path-info |
| shell: bash |
| run: | |
| echo "CCACHE_DIR=$(ccache --get-config cache_dir)" >> $GITHUB_ENV |
| echo "usr-windows-dir="$(cygpath --absolute --windows /usr)"" >> $GITHUB_OUTPUT |
| - name: Cache ccache |
| uses: actions/cache@v5 |
| with: |
| path: ${{ env.CCACHE_DIR }} |
| key: python-ccache-windows-${{ env.CACHE_VERSION }}-${{ hashFiles('cpp/**') }} |
| restore-keys: python-ccache-windows-${{ env.CACHE_VERSION }}- |
| env: |
| # We can invalidate the current cache by updating this. |
| CACHE_VERSION: "2025-09-16.1" |
| - name: Build Arrow C++ and PyArrow |
| shell: cmd |
| run: | |
| call "ci\scripts\python_build.bat" %cd% "${{ steps.path-info.outputs.usr-windows-dir }}" |
| - name: Test PyArrow |
| shell: cmd |
| run: | |
| call "ci\scripts\python_test.bat" %cd% |