Skip to content

GH-44815: [C++][Parquet] Add an example to dump statistics read as arrow::ArrayStatistics #47470

GH-44815: [C++][Parquet] Add an example to dump statistics read as arrow::ArrayStatistics

GH-44815: [C++][Parquet] Add an example to dump statistics read as arrow::ArrayStatistics #47470

Workflow file for this run

# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.
name: Python
on:
push:
branches:
- '**'
- '!dependabot/**'
tags:
- '**'
paths:
- '.dockerignore'
- '.github/workflows/python.yml'
- 'ci/**'
- 'cpp/**'
- 'docker-compose.yml'
- 'python/**'
pull_request:
paths:
- '.dockerignore'
- '.github/workflows/python.yml'
- 'ci/**'
- 'cpp/**'
- 'docker-compose.yml'
- 'python/**'
concurrency:
group: ${{ github.repository }}-${{ github.head_ref || github.sha }}-${{ github.workflow }}
cancel-in-progress: true
permissions:
contents: read
env:
ARCHERY_DEBUG: 1
DOCKER_VOLUME_PREFIX: ".docker/"
jobs:
docker:
name: ${{ matrix.title }}
runs-on: ubuntu-latest
if: ${{ !contains(github.event.pull_request.title, 'WIP') }}
timeout-minutes: 60
strategy:
fail-fast: false
matrix:
name:
- conda-python-docs
- conda-python-3.10-nopandas
- conda-python-3.9-pandas-1.1.3
- conda-python-3.11-pandas-latest
- conda-python-3.11-no-numpy
include:
- name: conda-python-docs
cache: conda-python-3.10
image: conda-python-docs
title: AMD64 Conda Python 3.10 Sphinx & Numpydoc
python: "3.10"
- name: conda-python-3.10-nopandas
cache: conda-python-3.10
image: conda-python
title: AMD64 Conda Python 3.10 Without Pandas
python: "3.10"
- name: conda-python-3.9-pandas-1.1.3
cache: conda-python-3.9
image: conda-python-pandas
title: AMD64 Conda Python 3.9 Pandas 1.1.3
python: 3.9
pandas: "1.1.3"
numpy: 1.19.5
- name: conda-python-3.11-pandas-latest
cache: conda-python-3.11
image: conda-python-pandas
title: AMD64 Conda Python 3.11 Pandas latest
python: "3.11"
pandas: latest
- name: conda-python-3.11-no-numpy
cache: conda-python-3.11
image: conda-python-no-numpy
title: AMD64 Conda Python 3.11 without NumPy
python: "3.11"
env:
PYTHON: ${{ matrix.python || 3.9 }}
UBUNTU: ${{ matrix.ubuntu || 22.04 }}
PANDAS: ${{ matrix.pandas || 'latest' }}
NUMPY: ${{ matrix.numpy || 'latest' }}
steps:
- name: Checkout Arrow
uses: actions/checkout@3df4ab11eba7bda6032a0b82a6bb43b11571feac # v4.0.0
with:
fetch-depth: 0
submodules: recursive
- name: Cache Docker Volumes
uses: actions/cache@13aacd865c20de90d75de3b17ebe84f7a17d57d2 # v4.0.0
with:
path: .docker
key: ${{ matrix.cache }}-${{ hashFiles('cpp/**') }}
restore-keys: ${{ matrix.cache }}-
- name: Setup Python
uses: actions/setup-python@0b93645e9fea7318ecaed2b359559ac225c90a2b # v5.3.0
with:
python-version: 3.12
- name: Setup Archery
run: pip install -e dev/archery[docker]
- name: Execute Docker Build
env:
ARCHERY_DOCKER_USER: ${{ secrets.DOCKERHUB_USER }}
ARCHERY_DOCKER_PASSWORD: ${{ secrets.DOCKERHUB_TOKEN }}
run: |
source ci/scripts/util_enable_core_dumps.sh
archery docker run ${{ matrix.image }}
- name: Docker Push
if: >-
success() &&
github.event_name == 'push' &&
github.repository == 'apache/arrow' &&
github.ref_name == 'main'
env:
ARCHERY_DOCKER_USER: ${{ secrets.DOCKERHUB_USER }}
ARCHERY_DOCKER_PASSWORD: ${{ secrets.DOCKERHUB_TOKEN }}
continue-on-error: true
run: archery docker push ${{ matrix.image }}
macos:
name: ${{ matrix.architecture }} macOS ${{ matrix.macos-version }} Python 3
runs-on: macos-${{ matrix.macos-version }}
if: ${{ !contains(github.event.pull_request.title, 'WIP') }}
timeout-minutes: 60
strategy:
fail-fast: false
matrix:
include:
- architecture: AMD64
macos-version: "13"
- architecture: ARM64
macos-version: "14"
env:
ARROW_HOME: /tmp/local
ARROW_AZURE: ON
ARROW_DATASET: ON
ARROW_FLIGHT: ON
ARROW_GANDIVA: ON
ARROW_GCS: OFF
ARROW_HDFS: ON
ARROW_JEMALLOC: ON
ARROW_ORC: ON
ARROW_PARQUET: ON
PARQUET_REQUIRE_ENCRYPTION: ON
ARROW_PYTHON: ON
ARROW_S3: ON
ARROW_SUBSTRAIT: ON
ARROW_WITH_ZLIB: ON
ARROW_WITH_LZ4: ON
ARROW_WITH_BZ2: ON
ARROW_WITH_ZSTD: ON
ARROW_WITH_SNAPPY: ON
ARROW_WITH_BROTLI: ON
ARROW_BUILD_TESTS: OFF
PYARROW_TEST_LARGE_MEMORY: ON
# Current oldest supported version according to https://endoflife.date/macos
MACOSX_DEPLOYMENT_TARGET: 12.0
steps:
- name: Checkout Arrow
uses: actions/checkout@v4
with:
fetch-depth: 0
submodules: recursive
- name: Setup Python
uses: actions/[email protected]
with:
python-version: '3.11'
- name: Install Dependencies
shell: bash
run: |
# pkg-config formula is deprecated but it's still installed
# in GitHub Actions runner now. We can remove this once
# pkg-config formula is removed from GitHub Actions runner.
brew uninstall pkg-config || :
brew bundle --file=cpp/Brewfile
python -m pip install \
-r python/requirements-build.txt \
-r python/requirements-test.txt
- name: Install MinIO
run: |
$(brew --prefix bash)/bin/bash \
ci/scripts/install_minio.sh latest /usr/local
- name: Setup ccache
shell: bash
run: ci/scripts/ccache_setup.sh
- name: ccache info
id: ccache-info
shell: bash
run: echo "cache-dir=$(ccache --get-config cache_dir)" >> $GITHUB_OUTPUT
- name: Cache ccache
uses: actions/cache@v4
with:
path: ${{ steps.ccache-info.outputs.cache-dir }}
key: python-ccache-macos-${{ matrix.macos-version }}-${{ hashFiles('cpp/**', 'python/**') }}
restore-keys: python-ccache-macos-${{ matrix.macos-version }}-
- name: Build
shell: bash
run: |
python -m pip install wheel
ci/scripts/cpp_build.sh $(pwd) $(pwd)/build
ci/scripts/python_build.sh $(pwd) $(pwd)/build
- name: Test
shell: bash
run: ci/scripts/python_test.sh $(pwd) $(pwd)/build