Skip to content

Commit

Permalink
Arrow ~=18.1.0 (#76)
Browse files (browse the repository at this point in the history)
  • Loading branch information
marcin-krystianc authored Jan 9, 2025
1 parent 38709bd commit 6f3bd3a
Show file tree
Hide file tree
Showing 4 changed files with 12 additions and 7 deletions.
4 changes: 3 additions & 1 deletion .github/workflows/python.yml
Original file line number Diff line number Diff line change
Expand Up @@ -136,7 +136,7 @@ jobs:
run: python -m cibuildwheel --output-dir dist
# to supply options, put them in 'env', like:
env:
CIBW_REPAIR_WHEEL_COMMAND_LINUX: auditwheel repair --exclude libarrow.so.1700 --exclude libparquet.so.1700 -w {dest_dir} {wheel}
CIBW_REPAIR_WHEEL_COMMAND_LINUX: auditwheel repair --exclude libarrow.so.1801 --exclude libparquet.so.1801 -w {dest_dir} {wheel}
CIBW_ENVIRONMENT: VCPKG_TARGET_TRIPLET="${{ steps.vcpkg-info.outputs.triplet }}"
CIBW_BUILD_VERBOSITY: 1
# We use manylinux_2_28 for ABI compatibility with pyarrow
Expand Down Expand Up @@ -181,6 +181,7 @@ jobs:

- name: Test with pytest
run: |
pip install -r python/requirements.txt
# Keep in mind that if the local and remote versions are the same, the remote version will be installed
pip install PalletJack --pre --find-links ./dist --break-system-packages --only-binary=:all:
# So now ensure that the local version is installed
Expand Down Expand Up @@ -230,6 +231,7 @@ jobs:

- name: Run benchmarks
run: |
pip install -r python/requirements.txt
# Keep in mind that if the local and remote versions are the same, the remote version will be installed
pip install PalletJack --pre --find-links ./dist --break-system-packages --only-binary=:all:
# So now ensure that the local version is installed
Expand Down
7 changes: 4 additions & 3 deletions python/pyproject.toml
Original file line number Diff line number Diff line change
Expand Up @@ -2,15 +2,16 @@
requires = [
"setuptools>=55.0",
"Cython>=3",
"pyarrow~=17.0",
"numpy>=1.16.6",
"pyarrow~=18.1.0",
"thrift",
]

build-backend = "setuptools.build_meta"

[project]
name = "palletjack"
version = "2.3.1"
version = "2.4.0"
description = "Faster parquet metadata reading"
readme = "README.md"
requires-python = ">=3.9"
Expand All @@ -20,7 +21,7 @@ classifiers = [
"Operating System :: OS Independent",
]
dependencies = [
"pyarrow~=17.0",
"pyarrow~=18.1.0",
]

[tool.setuptools.packages.find]
Expand Down
4 changes: 1 addition & 3 deletions python/requirements.txt
Original file line number Diff line number Diff line change
@@ -1,3 +1 @@
setuptools>=55.0
Cython>=3
pyarrow~=16.0
numpy
4 changes: 4 additions & 0 deletions python/test/test_palletjack.py
Original file line number Diff line number Diff line change
Expand Up @@ -33,6 +33,10 @@ class TestPalletJack(unittest.TestCase):
def test_read_metadata_columns_rows(self):

def validate_reading(parquet_path, index_path, row_groups, column_indices):

# Passing an empty list to the read_row_groups method is an invalid operation since Arrow 18.0.
if (len(row_groups) == 0): return

# Reading using the original metadata
pr = pq.ParquetReader()
pr.open(parquet_path)
Expand Down

0 comments on commit 6f3bd3a

Please sign in to comment.