forked from pool/apache-arrow
Compare commits
31 Commits
| Author | SHA256 | Date | |
|---|---|---|---|
| 97d3f5b9bd | |||
| fe8beb41f1 | |||
| 95ae261a6d | |||
| 423747c6f1 | |||
| d7bbabe07b | |||
| f26a64d1c1 | |||
| a49d6aac12 | |||
| b8b054a93e | |||
| 26f7f2002b | |||
| 77cc1e4fa0 | |||
| 4a660bf2fd | |||
| 77a7a6c0ae | |||
| b3fe0e46bf | |||
| 7710aa0469 | |||
| 96176c78b0 | |||
| 9b0d645fe4 | |||
| 69d004fa1c | |||
| 2266545ad6 | |||
| 6abdc26711 | |||
| 274e24f951 | |||
| 2caac2258f | |||
| cebda09598 | |||
| 0389e42d45 | |||
| 9f1d8991ae | |||
| 1539a8cfb2 | |||
| 22a0ee3370 | |||
| 20345967c9 | |||
| 6f40ca4abe | |||
| 174a699a90 | |||
| 86cdaafbd4 | |||
| ada1664357 |
@@ -1,3 +0,0 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:423eb4c1d6dbbcb7ca429d548e94f8a99cd4603bc023de9c0578d1950ce0f21d
|
||||
size 21350177
|
||||
3
apache-arrow-21.0.0.tar.gz
Normal file
3
apache-arrow-21.0.0.tar.gz
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:e92401790fdba33bfb4b8aa522626d800ea7fda4b6f036aaf39849927d2cf88d
|
||||
size 17241418
|
||||
1140
apache-arrow.changes
1140
apache-arrow.changes
File diff suppressed because it is too large
Load Diff
@@ -1,7 +1,7 @@
|
||||
#
|
||||
# spec file for package apache-arrow
|
||||
#
|
||||
# Copyright (c) 2024 SUSE LLC
|
||||
# Copyright (c) 2025 SUSE LLC and contributors
|
||||
#
|
||||
# All modifications and additions to the file contributed by third parties
|
||||
# remain the property of their copyright owners, unless otherwise agreed
|
||||
@@ -16,19 +16,28 @@
|
||||
#
|
||||
|
||||
|
||||
%bcond_without tests
|
||||
%bcond_without flight
|
||||
|
||||
# Remove static build due to devel-static packages being required by the generated CMake Targets
|
||||
%bcond_with static
|
||||
%bcond_without tests
|
||||
# Required for runtime dispatch, not yet packaged
|
||||
%bcond_with xsimd
|
||||
|
||||
%define sonum 1600
|
||||
%if %{suse_version} <= 1500
|
||||
# requires __has_builtin with keywords
|
||||
%define gccver 13
|
||||
%endif
|
||||
|
||||
%define sonum 2100
|
||||
# See git submodule /testing pointing to the correct revision
|
||||
%define arrow_testing_commit 25d16511e8d42c2744a1d94d90169e3a36e92631
|
||||
%define arrow_testing_commit fbf6b703dc93d17d75fa3664c5aa2c7873ebaf06
|
||||
# See git submodule /cpp/submodules/parquet-testing pointing to the correct revision
|
||||
%define parquet_testing_commit 74278bc4a1122d74945969e6dec405abd1533ec3
|
||||
%define parquet_testing_commit 18d17540097fca7c40be3d42c167e6bfad90763c
|
||||
# See cpp/thirdparty/versions.txt, replace by BuildRequires: pkgconfig(mimalloc) as soon as gh#apache/arrow#42211 is resolved
|
||||
%define arrow_mimalloc_build_version v2.2.4
|
||||
Name: apache-arrow
|
||||
Version: 16.0.0
|
||||
Version: 21.0.0
|
||||
Release: 0
|
||||
Summary: A development platform for in-memory data
|
||||
License: Apache-2.0 AND BSD-3-Clause AND BSD-2-Clause AND MIT
|
||||
@@ -38,41 +47,50 @@ URL: https://arrow.apache.org/
|
||||
Source0: https://github.com/apache/arrow/archive/apache-arrow-%{version}.tar.gz
|
||||
Source1: https://github.com/apache/arrow-testing/archive/%{arrow_testing_commit}.tar.gz#/arrow-testing-%{version}.tar.gz
|
||||
Source2: https://github.com/apache/parquet-testing/archive/%{parquet_testing_commit}.tar.gz#/parquet-testing-%{version}.tar.gz
|
||||
Source3: https://github.com/microsoft/mimalloc/archive/%{arrow_mimalloc_build_version}.tar.gz#/mimalloc-%{arrow_mimalloc_build_version}.tar.gz
|
||||
# PATCH-FIX-OPENSUSE arrow-boost-system-1.89-boo1249599.patch gh#boostorg/system#132, boo#1249599
|
||||
Patch1: arrow-boost-system-1.89-boo1249599.patch
|
||||
BuildRequires: bison
|
||||
BuildRequires: cmake >= 3.16
|
||||
BuildRequires: cmake >= 3.25
|
||||
BuildRequires: fdupes
|
||||
BuildRequires: flex
|
||||
BuildRequires: gcc-c++
|
||||
BuildRequires: gcc%{?gccver}-c++
|
||||
BuildRequires: libboost_context-devel
|
||||
BuildRequires: libboost_date_time-devel
|
||||
BuildRequires: libboost_filesystem-devel
|
||||
BuildRequires: libboost_system-devel >= 1.64.0
|
||||
BuildRequires: libboost_headers-devel
|
||||
BuildRequires: libboost_process-devel
|
||||
%if 0%{?suse_version} < 1699
|
||||
BuildRequires: libboost_system-devel
|
||||
%endif
|
||||
%if %{with static}
|
||||
BuildRequires: libzstd-devel-static
|
||||
%endif
|
||||
BuildRequires: pkgconfig
|
||||
BuildRequires: python-rpm-macros
|
||||
BuildRequires: python3-base
|
||||
BuildRequires: cmake(Snappy) >= 1.1.7
|
||||
BuildRequires: (cmake(lz4) >= 1.10 or (pkgconfig(liblz4) >= 1.8.3 with pkgconfig(liblz4) < 1.10))
|
||||
BuildRequires: cmake(Snappy) >= 1.2.2
|
||||
BuildRequires: cmake(absl)
|
||||
BuildRequires: cmake(double-conversion) >= 3.1.5
|
||||
BuildRequires: cmake(re2)
|
||||
BuildRequires: pkgconfig(RapidJSON)
|
||||
BuildRequires: pkgconfig(bzip2) >= 1.0.8
|
||||
BuildRequires: pkgconfig(gflags) >= 2.2.0
|
||||
BuildRequires: pkgconfig(grpc++) >= 1.20.0
|
||||
BuildRequires: pkgconfig(libbrotlicommon) >= 1.0.7
|
||||
BuildRequires: pkgconfig(libbrotlidec) >= 1.0.7
|
||||
BuildRequires: pkgconfig(libbrotlienc) >= 1.0.7
|
||||
BuildRequires: pkgconfig(libcares) >= 1.15.0
|
||||
BuildRequires: pkgconfig(libglog) >= 0.3.5
|
||||
BuildRequires: pkgconfig(liblz4) >= 1.8.3
|
||||
BuildRequires: pkgconfig(gflags) >= 2.2.2
|
||||
BuildRequires: pkgconfig(grpc++) >= 1.46.3
|
||||
BuildRequires: pkgconfig(libbrotlicommon) >= 1.0.9
|
||||
BuildRequires: pkgconfig(libbrotlidec) >= 1.0.9
|
||||
BuildRequires: pkgconfig(libbrotlienc) >= 1.0.9
|
||||
BuildRequires: pkgconfig(libcares) >= 1.17.2
|
||||
BuildRequires: pkgconfig(libglog) >= 0.5.0
|
||||
BuildRequires: pkgconfig(libopenssl)
|
||||
BuildRequires: pkgconfig(liburiparser) >= 0.9.3
|
||||
BuildRequires: pkgconfig(libutf8proc)
|
||||
BuildRequires: pkgconfig(libzstd) >= 1.4.3
|
||||
BuildRequires: pkgconfig(protobuf) >= 3.7.1
|
||||
BuildRequires: pkgconfig(sqlite3) >= 3.45.2
|
||||
BuildRequires: pkgconfig(thrift) >= 0.11.0
|
||||
BuildRequires: pkgconfig(zlib) >= 1.2.11
|
||||
BuildRequires: pkgconfig(libutf8proc) >= 2.10.0
|
||||
BuildRequires: pkgconfig(libzstd) >= 1.5.7
|
||||
BuildRequires: pkgconfig(protobuf) >= 21.3
|
||||
BuildRequires: pkgconfig(sqlite3)
|
||||
BuildRequires: pkgconfig(thrift) >= 0.22.0
|
||||
BuildRequires: pkgconfig(zlib) >= 1.3.1
|
||||
%if %{with tests}
|
||||
BuildRequires: timezone
|
||||
BuildRequires: pkgconfig(gmock) >= 1.10
|
||||
@@ -115,6 +133,20 @@ communication.
|
||||
|
||||
This package provides the shared library for the Acero streaming execution engine
|
||||
|
||||
%package -n libarrow_compute%{sonum}
|
||||
Summary: Development platform for in-memory data - shared library
|
||||
Group: System/Libraries
|
||||
|
||||
%description -n libarrow_compute%{sonum}
|
||||
Apache Arrow is a cross-language development platform for in-memory
|
||||
data. It specifies a standardized language-independent columnar memory
|
||||
format for flat and hierarchical data, organized for efficient
|
||||
analytic operations on modern hardware. It also provides computational
|
||||
libraries and zero-copy streaming messaging and interprocess
|
||||
communication.
|
||||
|
||||
This package provides the shared library for the C++ Compute module
|
||||
|
||||
%package -n libarrow_flight%{sonum}
|
||||
Summary: Development platform for in-memory data - shared library
|
||||
Group: System/Libraries
|
||||
@@ -176,16 +208,22 @@ Summary: Development platform for in-memory data - development files
|
||||
Group: Development/Libraries/C and C++
|
||||
Requires: libarrow%{sonum} = %{version}
|
||||
Requires: libarrow_acero%{sonum} = %{version}
|
||||
Requires: libarrow_compute%{sonum} = %{version}
|
||||
Requires: libarrow_dataset%{sonum} = %{version}
|
||||
%if %{with flight}
|
||||
Requires: libarrow_flight%{sonum} = %{version}
|
||||
Requires: libarrow_flight_sql%{sonum} = %{version}
|
||||
%endif
|
||||
%if %{with static}
|
||||
Suggests: %{name}-devel-static = %{version}
|
||||
Suggests: %{name}-acero-devel-static = %{version}
|
||||
Suggests: %{name}-compute-devel-static = %{version}
|
||||
Suggests: %{name}-dataset-devel-static = %{version}
|
||||
%if %{with flight}
|
||||
Suggests: %{name}-flight-devel-static = %{version}
|
||||
Suggests: %{name}-flight-sql-devel-static = %{version}
|
||||
%endif
|
||||
%endif
|
||||
|
||||
%description devel
|
||||
Apache Arrow is a cross-language development platform for in-memory
|
||||
@@ -229,6 +267,21 @@ communication.
|
||||
|
||||
This package provides the static library for the Acero streaming execution engine
|
||||
|
||||
%package compute-devel-static
|
||||
Summary: Development platform for in-memory data - development files
|
||||
Group: Development/Libraries/C and C++
|
||||
Requires: %{name}-devel = %{version}
|
||||
|
||||
%description compute-devel-static
|
||||
Apache Arrow is a cross-language development platform for in-memory
|
||||
data. It specifies a standardized language-independent columnar memory
|
||||
format for flat and hierarchical data, organized for efficient
|
||||
analytic operations on modern hardware. It also provides computational
|
||||
libraries and zero-copy streaming messaging and interprocess
|
||||
communication.
|
||||
|
||||
This package provides the static library for the C++ Compute module
|
||||
|
||||
%package flight-devel-static
|
||||
Summary: Development platform for in-memory data - development files
|
||||
Group: Development/Libraries/C and C++
|
||||
@@ -324,13 +377,18 @@ This package provides utilities for working with the Parquet format.
|
||||
|
||||
%prep
|
||||
%setup -q -n arrow-apache-arrow-%{version} -a1 -a2
|
||||
%autopatch -p1
|
||||
%if 0%{?suse_version} >= 1699
|
||||
%patch -P1 -p1
|
||||
%endif
|
||||
# https://github.com/protocolbuffers/protobuf/issues/12292
|
||||
sed -i 's/find_package(Protobuf/find_package(Protobuf CONFIG/' cpp/cmake_modules/FindProtobufAlt.cmake
|
||||
|
||||
%build
|
||||
%{?gccver:export CXX=g++-%{gccver}}
|
||||
%{?gccver:export CC=gcc-%{gccver}}
|
||||
export CFLAGS="%{optflags} -ffat-lto-objects"
|
||||
export CXXFLAGS="%{optflags} -ffat-lto-objects"
|
||||
export ARROW_MIMALLOC_URL=%{SOURCE3}
|
||||
|
||||
pushd cpp
|
||||
%cmake \
|
||||
@@ -351,14 +409,15 @@ pushd cpp
|
||||
-DARROW_CSV:BOOL=ON \
|
||||
-DARROW_DATASET:BOOL=ON \
|
||||
-DARROW_FILESYSTEM:BOOL=ON \
|
||||
%if %{with flight}
|
||||
-DARROW_FLIGHT:BOOL=ON \
|
||||
-DARROW_FLIGHT_SQL:BOOL=ON \
|
||||
%endif
|
||||
-DARROW_GANDIVA:BOOL=OFF \
|
||||
-DARROW_SKYHOOK:BOOL=OFF \
|
||||
-DARROW_HDFS:BOOL=ON \
|
||||
-DARROW_HIVESERVER2:BOOL=OFF \
|
||||
-DARROW_IPC:BOOL=ON \
|
||||
-DARROW_JEMALLOC:BOOL=OFF \
|
||||
-DARROW_JSON:BOOL=ON \
|
||||
-DARROW_ORC:BOOL=OFF \
|
||||
-DARROW_PARQUET:BOOL=ON \
|
||||
@@ -387,16 +446,20 @@ pushd cpp
|
||||
popd
|
||||
%if %{with tests}
|
||||
rm %{buildroot}%{_libdir}/libarrow_testing.so*
|
||||
rm %{buildroot}%{_libdir}/libarrow_flight_testing.so*
|
||||
rm %{buildroot}%{_libdir}/pkgconfig/arrow-testing.pc
|
||||
rm -Rf %{buildroot}%{_libdir}/cmake/ArrowTesting
|
||||
rm -Rf %{buildroot}%{_includedir}/arrow/testing
|
||||
%if %{with flight}
|
||||
rm %{buildroot}%{_libdir}/libarrow_flight_testing.so*
|
||||
rm %{buildroot}%{_libdir}/pkgconfig/arrow-flight-testing.pc
|
||||
rm -Rf %{buildroot}%{_libdir}/cmake/ArrowFlightTesting
|
||||
%endif
|
||||
%if %{with static}
|
||||
rm %{buildroot}%{_libdir}/libarrow_testing.a
|
||||
%if %{with flight}
|
||||
rm %{buildroot}%{_libdir}/libarrow_flight_testing.a
|
||||
%endif
|
||||
rm -Rf %{buildroot}%{_libdir}/cmake/ArrowTesting
|
||||
rm -Rf %{buildroot}%{_libdir}/cmake/ArrowFlightTesting
|
||||
rm -Rf %{buildroot}%{_includedir}/arrow/testing
|
||||
%endif
|
||||
%endif
|
||||
rm -r %{buildroot}%{_datadir}/doc/arrow/
|
||||
%fdupes %{buildroot}%{_libdir}/cmake
|
||||
@@ -421,7 +484,7 @@ if [ -n "${GTEST_failing}" ]; then
|
||||
fi
|
||||
%ifarch s390x
|
||||
# bsc#1218592
|
||||
exclude_regex='--exclude-regex (arrow-dataset-file-parquet-test|parquet-internals-test|parquet-reader-test|parquet-arrow-test|parquet-arrow-internals-test|parquet-encryption-test|arquet-encryption-key-management-test)'
|
||||
exclude_regex='--exclude-regex (arrow-dataset-file-parquet-test|parquet-internals-test|parquet-reader-test|parquet-arrow-test|parquet-arrow-internals-test|parquet-encryption-test|parquet-encryption-key-management-test)'
|
||||
%endif
|
||||
%ctest --label-regex unittest $exclude_regex
|
||||
popd
|
||||
@@ -431,54 +494,67 @@ popd
|
||||
%postun -n libarrow%{sonum} -p /sbin/ldconfig
|
||||
%post -n libarrow_acero%{sonum} -p /sbin/ldconfig
|
||||
%postun -n libarrow_acero%{sonum} -p /sbin/ldconfig
|
||||
%post -n libarrow_compute%{sonum} -p /sbin/ldconfig
|
||||
%postun -n libarrow_compute%{sonum} -p /sbin/ldconfig
|
||||
%if %{with flight}
|
||||
%post -n libarrow_flight%{sonum} -p /sbin/ldconfig
|
||||
%postun -n libarrow_flight%{sonum} -p /sbin/ldconfig
|
||||
%post -n libarrow_flight_sql%{sonum} -p /sbin/ldconfig
|
||||
%postun -n libarrow_flight_sql%{sonum} -p /sbin/ldconfig
|
||||
%endif
|
||||
%post -n libarrow_dataset%{sonum} -p /sbin/ldconfig
|
||||
%postun -n libarrow_dataset%{sonum} -p /sbin/ldconfig
|
||||
%post -n libparquet%{sonum} -p /sbin/ldconfig
|
||||
%postun -n libparquet%{sonum} -p /sbin/ldconfig
|
||||
|
||||
%files
|
||||
%license LICENSE.txt NOTICE.txt header
|
||||
%license LICENSE.txt NOTICE.txt
|
||||
%{_bindir}/arrow-file-to-stream
|
||||
%{_bindir}/arrow-stream-to-file
|
||||
|
||||
%files -n libarrow%{sonum}
|
||||
%license LICENSE.txt NOTICE.txt header
|
||||
%license LICENSE.txt NOTICE.txt
|
||||
%{_libdir}/libarrow.so.*
|
||||
|
||||
%files -n libarrow_acero%{sonum}
|
||||
%license LICENSE.txt NOTICE.txt header
|
||||
%license LICENSE.txt NOTICE.txt
|
||||
%{_libdir}/libarrow_acero.so.*
|
||||
|
||||
%files -n libarrow_compute%{sonum}
|
||||
%license LICENSE.txt NOTICE.txt
|
||||
%{_libdir}/libarrow_compute.so.*
|
||||
|
||||
%if %{with flight}
|
||||
%files -n libarrow_flight%{sonum}
|
||||
%license LICENSE.txt NOTICE.txt header
|
||||
%license LICENSE.txt NOTICE.txt
|
||||
%{_libdir}/libarrow_flight.so.*
|
||||
|
||||
%files -n libarrow_flight_sql%{sonum}
|
||||
%license LICENSE.txt NOTICE.txt header
|
||||
%license LICENSE.txt NOTICE.txt
|
||||
%{_libdir}/libarrow_flight_sql.so.*
|
||||
%endif
|
||||
|
||||
%files -n libarrow_dataset%{sonum}
|
||||
%license LICENSE.txt NOTICE.txt header
|
||||
%license LICENSE.txt NOTICE.txt
|
||||
%{_libdir}/libarrow_dataset.so.*
|
||||
|
||||
%files -n libparquet%{sonum}
|
||||
%license LICENSE.txt NOTICE.txt header
|
||||
%license LICENSE.txt NOTICE.txt
|
||||
%{_libdir}/libparquet.so.*
|
||||
|
||||
%files devel
|
||||
%doc README.md
|
||||
%license LICENSE.txt NOTICE.txt header
|
||||
%license LICENSE.txt NOTICE.txt
|
||||
%{_includedir}/arrow/
|
||||
%{_libdir}/cmake/Arrow*
|
||||
%{_libdir}/libarrow.so
|
||||
%{_libdir}/libarrow_acero.so
|
||||
%{_libdir}/libarrow_compute.so
|
||||
%{_libdir}/libarrow_dataset.so
|
||||
%if %{with flight}
|
||||
%{_libdir}/libarrow_flight.so
|
||||
%{_libdir}/libarrow_flight_sql.so
|
||||
%endif
|
||||
%{_libdir}/pkgconfig/arrow*.pc
|
||||
%dir %{_datadir}/arrow
|
||||
%{_datadir}/arrow/gdb
|
||||
@@ -490,29 +566,35 @@ popd
|
||||
|
||||
%if %{with static}
|
||||
%files devel-static
|
||||
%license LICENSE.txt NOTICE.txt header
|
||||
%license LICENSE.txt NOTICE.txt
|
||||
%{_libdir}/libarrow.a
|
||||
|
||||
%files acero-devel-static
|
||||
%license LICENSE.txt NOTICE.txt header
|
||||
%license LICENSE.txt NOTICE.txt
|
||||
%{_libdir}/libarrow_acero.a
|
||||
|
||||
%files compute-devel-static
|
||||
%license LICENSE.txt NOTICE.txt
|
||||
%{_libdir}/libarrow_compute.a
|
||||
|
||||
%files dataset-devel-static
|
||||
%license LICENSE.txt NOTICE.txt header
|
||||
%license LICENSE.txt NOTICE.txt
|
||||
%{_libdir}/libarrow_dataset.a
|
||||
|
||||
%if %{with flight}
|
||||
%files flight-devel-static
|
||||
%license LICENSE.txt NOTICE.txt header
|
||||
%license LICENSE.txt NOTICE.txt
|
||||
%{_libdir}/libarrow_flight.a
|
||||
|
||||
%files flight-sql-devel-static
|
||||
%license LICENSE.txt NOTICE.txt header
|
||||
%license LICENSE.txt NOTICE.txt
|
||||
%{_libdir}/libarrow_flight_sql.a
|
||||
%endif
|
||||
%endif
|
||||
|
||||
%files -n apache-parquet-devel
|
||||
%doc README.md
|
||||
%license LICENSE.txt NOTICE.txt header
|
||||
%license LICENSE.txt NOTICE.txt
|
||||
%{_includedir}/parquet/
|
||||
%{_libdir}/cmake/Parquet
|
||||
%{_libdir}/libparquet.so
|
||||
@@ -520,13 +602,13 @@ popd
|
||||
|
||||
%if %{with static}
|
||||
%files -n apache-parquet-devel-static
|
||||
%license LICENSE.txt NOTICE.txt header
|
||||
%license LICENSE.txt NOTICE.txt
|
||||
%{_libdir}/libparquet.a
|
||||
%endif
|
||||
|
||||
%files -n apache-parquet-utils
|
||||
%doc README.md
|
||||
%license LICENSE.txt NOTICE.txt header
|
||||
%license LICENSE.txt NOTICE.txt
|
||||
%{_bindir}/parquet-*
|
||||
|
||||
%changelog
|
||||
|
||||
27
arrow-boost-system-1.89-boo1249599.patch
Normal file
27
arrow-boost-system-1.89-boo1249599.patch
Normal file
@@ -0,0 +1,27 @@
|
||||
We have to tell cmake that the openSUSE packager removed the boost::system target.
|
||||
The headers subpackage provides the necessary Boost.System header files.
|
||||
|
||||
diff -ur --no-dereference arrow-apache-arrow-21.0.0.orig/cpp/cmake_modules/ThirdpartyToolchain.cmake arrow-apache-arrow-21.0.0/cpp/cmake_modules/ThirdpartyToolchain.cmake
|
||||
--- arrow-apache-arrow-21.0.0.orig/cpp/cmake_modules/ThirdpartyToolchain.cmake 2025-07-11 09:44:45.000000000 +0200
|
||||
+++ arrow-apache-arrow-21.0.0/cpp/cmake_modules/ThirdpartyToolchain.cmake 2025-09-26 20:53:58.409119646 +0200
|
||||
@@ -1259,7 +1259,7 @@
|
||||
set(Boost_USE_STATIC_LIBS ON)
|
||||
endif()
|
||||
if(ARROW_BOOST_REQUIRE_LIBRARY)
|
||||
- set(ARROW_BOOST_COMPONENTS filesystem system)
|
||||
+ set(ARROW_BOOST_COMPONENTS filesystem)
|
||||
if(ARROW_FLIGHT_SQL_ODBC AND MSVC)
|
||||
list(APPEND ARROW_BOOST_COMPONENTS locale)
|
||||
endif()
|
||||
diff -ur --no-dereference arrow-apache-arrow-21.0.0.orig/cpp/src/arrow/io/CMakeLists.txt arrow-apache-arrow-21.0.0/cpp/src/arrow/io/CMakeLists.txt
|
||||
--- arrow-apache-arrow-21.0.0.orig/cpp/src/arrow/io/CMakeLists.txt 2025-07-11 09:44:45.000000000 +0200
|
||||
+++ arrow-apache-arrow-21.0.0/cpp/src/arrow/io/CMakeLists.txt 2025-09-26 20:53:51.229519926 +0200
|
||||
@@ -30,7 +30,7 @@
|
||||
EXTRA_LINK_LIBS
|
||||
arrow::hadoop
|
||||
Boost::filesystem
|
||||
- Boost::system)
|
||||
+ Boost::headers)
|
||||
endif()
|
||||
|
||||
add_arrow_test(memory_test PREFIX "arrow-io")
|
||||
@@ -1,3 +0,0 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:87fa36b469cac0a0c95596e7be39548ddf20c8f737a02ea559e30fbebd12c7d3
|
||||
size 3571960
|
||||
3
arrow-testing-21.0.0.tar.gz
Normal file
3
arrow-testing-21.0.0.tar.gz
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:3fa7b34468636ff1642c5c3fdf67d8f86ae4bff283c5185a6a986d623bab1d19
|
||||
size 3588150
|
||||
3
mimalloc-v2.2.4.tar.gz
Normal file
3
mimalloc-v2.2.4.tar.gz
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:754a98de5e2912fddbeaf24830f982b4540992f1bab4a0a8796ee118e0752bda
|
||||
size 1295861
|
||||
@@ -1,3 +0,0 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:ac6331205baec1b97e8115de22efaf84561483623e5792d58060e91e84304bce
|
||||
size 1037654
|
||||
3
parquet-testing-21.0.0.tar.gz
Normal file
3
parquet-testing-21.0.0.tar.gz
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:4496522640dc88635a8bf3c8e7572a5815549188fa00df132eef6e2a97ce0652
|
||||
size 1077258
|
||||
@@ -1,26 +0,0 @@
|
||||
Index: arrow-apache-arrow-16.0.0/python/pyarrow/tests/test_array.py
|
||||
===================================================================
|
||||
--- arrow-apache-arrow-16.0.0.orig/python/pyarrow/tests/test_array.py
|
||||
+++ arrow-apache-arrow-16.0.0/python/pyarrow/tests/test_array.py
|
||||
@@ -3323,7 +3323,7 @@ def test_numpy_array_protocol():
|
||||
result = np.asarray(arr)
|
||||
np.testing.assert_array_equal(result, expected)
|
||||
|
||||
- if Version(np.__version__) < Version("2.0"):
|
||||
+ if Version(np.__version__) < Version("2.0.0rc1"):
|
||||
# copy keyword is not strict and not passed down to __array__
|
||||
result = np.array(arr, copy=False)
|
||||
np.testing.assert_array_equal(result, expected)
|
||||
Index: arrow-apache-arrow-16.0.0/python/pyarrow/tests/test_table.py
|
||||
===================================================================
|
||||
--- arrow-apache-arrow-16.0.0.orig/python/pyarrow/tests/test_table.py
|
||||
+++ arrow-apache-arrow-16.0.0/python/pyarrow/tests/test_table.py
|
||||
@@ -3244,7 +3244,7 @@ def test_numpy_array_protocol(constructo
|
||||
table = constructor([[1, 2, 3], [4.0, 5.0, 6.0]], names=["a", "b"])
|
||||
expected = np.array([[1, 4], [2, 5], [3, 6]], dtype="float64")
|
||||
|
||||
- if Version(np.__version__) < Version("2.0"):
|
||||
+ if Version(np.__version__) < Version("2.0.0rc1"):
|
||||
# copy keyword is not strict and not passed down to __array__
|
||||
result = np.array(table, copy=False)
|
||||
np.testing.assert_array_equal(result, expected)
|
||||
@@ -1,3 +1,452 @@
|
||||
-------------------------------------------------------------------
|
||||
Thu Sep 25 10:25:07 UTC 2025 - Ben Greiner <code@bnavigator.de>
|
||||
|
||||
- Update to 21.0.0
|
||||
## Bug Fixes
|
||||
* GH-44366 - [Python][Acero] RecordBatch.filter on expression
|
||||
raises error if result set is empty (#46057)
|
||||
* GH-45292 - [Python] test_dtypes hypothesis test fails
|
||||
sporadically (#46029)
|
||||
* GH-46080 - [Python][Docs] Provide guidance for tzdata related
|
||||
issues if installing with pip (#46591)
|
||||
* GH-46121 - [Python] Add missing column_index argument to
|
||||
ArrowReaderProperties::read_dictionary's Cython binding
|
||||
(#46122)
|
||||
* GH-46174 - [Python] Failing tests in python minimal builds
|
||||
(#46175)
|
||||
* GH-46238 - [Release][Python] Use array to avoid empty argument
|
||||
in dev/release/post-11-python.sh (#46239)
|
||||
* GH-46343 - [CI][Python] Remove workaround for gdb packaging
|
||||
issue (#46848)
|
||||
* GH-46344 - [CI][Python] Skip doctest for s3.get_file_info to
|
||||
avoid bucket restrictions (#46345)
|
||||
* GH-46355 - [Python] Fix table.to_struct_array with an empty
|
||||
table (#46357)
|
||||
* GH-46481 - [C++][Python] Allow nullable schema in FlightInfo
|
||||
(#46489)
|
||||
* GH-46516 - [CI][Python] Force Cython>3.1.1 for docs builds
|
||||
(#46770)
|
||||
* GH-46606 - [Python] Do not require numpy when normalizing slice
|
||||
(#46732)
|
||||
* GH-46611 - [Python][C++] Allow building float16 arrays without
|
||||
numpy (#46618)
|
||||
* GH-46729 - [Python] Allow constructing InMemoryDataset from
|
||||
RecordBatchReader (#46731)
|
||||
* GH-46811 - [C++][Python] Fix crash on
|
||||
FileReaderImpl::GetRecordBatchReader (#46931)
|
||||
## New Features and Improvements
|
||||
* GH-26818 - [C++][Python] Preserve order when writing dataset
|
||||
multi-threaded (#44470)
|
||||
* GH-38914 - [Python] Add
|
||||
EncryptionConfiguration.uniform_encryption (#46347)
|
||||
* GH-39294 - [C++][Python] DLPack on Tensor class (#42118)
|
||||
* GH-40754 - [Python] Expose tls_ca_file_path to S3FileSystem
|
||||
(#45881)
|
||||
* GH-41496 - [Python][Azure][Docs] Turn on azure on debian-docs
|
||||
(#46892)
|
||||
* GH-41672 - [Python][Doc] Clarify docstring of
|
||||
FixedSizeListArray.values that it ignores the offset (#46144)
|
||||
* GH-42012 - [Python] Add Schema with_field or set_field method
|
||||
(#46348)
|
||||
* GH-43041 - [C++][Python] Read/write Parquet BYTE_ARRAY as
|
||||
Large/View types directly (#46532)
|
||||
* GH-43807 - [C++][Python] Add UUID extension type conversion
|
||||
support to/from Parquet (#45866)
|
||||
* GH-44500 - [Python][Parquet] Map Parquet logical types to Arrow
|
||||
extension types by default (#46772)
|
||||
* GH-44900 - [Python] Support explicit fsspec+{protocol} and
|
||||
hf:// filesystem URIs (#45089)
|
||||
* GH-45229 - [Python] Migrate from scipy.spmatrix to
|
||||
scipy.sparray (#46423)
|
||||
* GH-45229 - [Python] skip scipy.sparse roundtrip tests for
|
||||
float16 (#46413)
|
||||
* GH-45531 - [Python] Add the dim_names argument to
|
||||
from_numpy_ndarray (#46170)
|
||||
* GH-45619 - [Python] Use f-string instead of string.format
|
||||
(#45629)
|
||||
* GH-45653 - [Python] Scalar subclasses should implement Python
|
||||
protocols (#45818)
|
||||
* GH-45750 - [C++][Python][Parquet] Implement Content-Defined
|
||||
Chunking for the Parquet writer (#45360)
|
||||
* GH-45957 - [C++][Python] Expose allow_delayed_open on
|
||||
S3FileSystem (#46078)
|
||||
* GH-46019 - [Python] Raise TypeError on feather read_table if
|
||||
columns is not a Sequence (#46038)
|
||||
* GH-46054 - [Python][Packaging] Re-enable pandas on Windows
|
||||
free-threaded wheel (#46109)
|
||||
* GH-46058 - [Python] Run Python in AppVeyor outside of source
|
||||
directory (#46059)
|
||||
* GH-46130 - [Python] Remove use_legacy_format in favour of
|
||||
setting IpcWriteOptions (#46131)
|
||||
* GH-46198 - [Python] Remove deprecated PyExtensionType (#46199)
|
||||
* GH-46222 - [Python] Allow to specify footer metadata when
|
||||
opening IPC file for writing (#46354)
|
||||
* GH-46349 - [Python] Move parquet definitions to
|
||||
pyarrow/includes/libparquet.pxd (#46437)
|
||||
* GH-46373 - [Python] Exercise fallback case on tests for
|
||||
parquet.read_table in case dataset is not available (#46550)
|
||||
* GH-46544 - [CI][Dev][Python] Use pre-commit for autopep8
|
||||
(#46552)
|
||||
* GH-46545 - [CI][Dev][Python] Update pre-commit for cython-lint
|
||||
(#46580)
|
||||
* GH-46546 - [CI][Dev][Python] Use pre-commit for numpydoc
|
||||
(#46595)
|
||||
* GH-46572 - [Python] expose filter option to python for join
|
||||
(#46566)
|
||||
* GH-46633 - [Docs][C++][Python] Update CombineChunks
|
||||
documentation to specify that binary columns can be combined
|
||||
into multiple chunks (#46638)
|
||||
* GH-46652 - [Python][Docs] Update language for row_group_size
|
||||
parameter (#46653)
|
||||
* GH-46676 - [C++][Python][Parquet] Allow reading Parquet LIST
|
||||
data as LargeList directly (#46678)
|
||||
* GH-46683 - [C++][Python] Add utf8_zero_fill compute function
|
||||
for sign-aware zero padding (#46815)
|
||||
* GH-46771 - [Python][C++] Implement pa.arange function to
|
||||
generate array sequences (#46778)
|
||||
* GH-46833 - [Python] Expose ConfigureManagedIdentityCredential
|
||||
and ConfigureClientSecretCredential to AzureFileSystem on
|
||||
PyArrow (#46837)
|
||||
* GH-46959 - [Python][Packaging] Drop support for manylinux2014
|
||||
(#46965)
|
||||
|
||||
-------------------------------------------------------------------
|
||||
Fri Jun 13 18:22:38 UTC 2025 - Ben Greiner <code@bnavigator.de>
|
||||
|
||||
- Update to 20.0.0
|
||||
## Bug Fixes
|
||||
* GH-36628 - [Python][Parquet] Fail when instantiating internal
|
||||
Parquet metadata classes (#45549)
|
||||
* GH-37630 - [C++][Python][Dataset] Allow disabling fragment
|
||||
metadata caching (#45330)
|
||||
* GH-44188 - [Python] Fix pandas roundtrip with bytes column
|
||||
names (#44171)
|
||||
* GH-45129 - [Python][C++] Fix usage of deprecated C++
|
||||
functionality on pyarrow (#45189)
|
||||
* GH-45155 - [Python][CI] Fix path for scientific nightly windows
|
||||
wheel upload (#45222)
|
||||
* GH-45169 - [Python] Adapt to modified pytest ignore collect
|
||||
hook api (#45170)
|
||||
* GH-45380 - [Python] Expose RankQuantileOptions to Python
|
||||
(#45392)
|
||||
* GH-45530 - [Python][Packaging] Add pyarrow.libs dir to
|
||||
get_library_dirs (#45766)
|
||||
* GH-45582 - [Python] Preserve decimal32/64/256 metadata in
|
||||
Schema.metadata (#45583)
|
||||
* GH-45733 - [C++][Python] Add biased/unbiased toggle to skew and
|
||||
kurtosis functions (#45762)
|
||||
* GH-45739 - [C++][Python] Fix crash when calling
|
||||
hash_pivot_wider without options (#45740)
|
||||
* GH-45758 - [Python] Add AzureFileSystem documentation (#45759)
|
||||
* GH-45926 - [Python] Use pytest.approx for float values on
|
||||
unbiased skew and kurtosis tests (#45929)
|
||||
* GH-46041 - [Python][Packaging] Temporarily remove pandas from
|
||||
being installed on free-threaded Windows wheel tests (#46042)
|
||||
## New Features and Improvements
|
||||
* GH-14932 - [Python] Add python bindings for JSON streaming
|
||||
reader (#45084)
|
||||
* GH-35289 - [Python] Support large variable width types in numpy
|
||||
conversion (#36701)
|
||||
* GH-36412 - [Python][CI] Fix deprecation warnings in the pandas
|
||||
nightly build
|
||||
* GH-39010 - [Python] Introduce maps_as_pydicts parameter for
|
||||
to_pylist, to_pydict, as_py (#45471)
|
||||
* GH-41002 - [Python] Remove pins for pytest-cython and
|
||||
conda-docs pytest (#45240)
|
||||
* GH-41985 - [Python][Docs] Clarify docstring of
|
||||
pyarrow.compute.scalar() (#45668)
|
||||
* GH-43587 - [Python] Remove no longer used serialize/deserialize
|
||||
PyArrow C++ code (#45743)
|
||||
* GH-44421 - [Python] Add configuration for building & testing
|
||||
free-threaded wheels on Windows (#44804)
|
||||
* GH-44790 - [Python] Remove use_legacy_dataset from code base
|
||||
(#45742)
|
||||
* GH-45156 - [Python][Packaging] Refactor Python Windows wheel
|
||||
images to use newer base image (#45442)
|
||||
* GH-45237 - [Python] Raise minimum supported cython to >=3
|
||||
(#45238)
|
||||
* GH-45278 - [Python][Packaging] Updated delvewheel install
|
||||
command and updated flags used with delvewheel repair (#45323)
|
||||
* GH-45282 - [Python][Parquet] Remove unused readonly properties
|
||||
of ParquetWriter (#45281)
|
||||
* GH-45288 - [Python][Packaging][Docs] Update documentation for
|
||||
PyArrow nightly wheels (#45289)
|
||||
* GH-45358 - [C++][Python] Add MemoryPool method to print
|
||||
statistics (#45359)
|
||||
* GH-45433 - [Python] Remove Cython workarounds (#45437)
|
||||
* GH-45457 - [Python] Add pyarrow.ArrayStatistics (#45550)
|
||||
* GH-45482 - [CI][Python] Don’t use Ubuntu 20.04 for wheel test
|
||||
(#45483)
|
||||
* GH-45570 - [Python] Allow Decimal32/64Array.to_pandas (#45571)
|
||||
* GH-45676 - [C++][Python][Compute] Add skew and kurtosis
|
||||
functions (#45677)
|
||||
* GH-45680 - [C++][Python] Remove deprecated functions in 20.0
|
||||
* GH-45705 - [Python] Add support for SAS token in
|
||||
AzureFileSystem (#45706)
|
||||
* GH-45755 - [C++][Python][Compute] Add winsorize function
|
||||
(#45763)
|
||||
* GH-45848 - [C++][Python][R] Remove deprecated PARQUET_2_0
|
||||
(#45849)
|
||||
* GH-45920 - [Release][Python] Upload sdist and wheels to GitHub
|
||||
Releases not apache.jfrog.io (#45962)
|
||||
|
||||
-------------------------------------------------------------------
|
||||
Mon Feb 17 19:17:26 UTC 2025 - Ben Greiner <code@bnavigator.de>
|
||||
|
||||
- Update to 19.0.1
|
||||
## Bug Fixes
|
||||
* [Python][CI] Make download_tzdata_on_windows more robust and
|
||||
use tzdata package for tzinfo database on Windows for ORC
|
||||
(#45425)
|
||||
* [Python] Only enable the string dtype on pandas export for
|
||||
pandas>=2.3 (#45383) [Python] Fix version comparison in pandas
|
||||
compat for pandas 2.3 dev version (#45428)
|
||||
## Improvements
|
||||
* [CI][Python] Temporarily avoid newer boto3 version (#45311)
|
||||
[CI] Bump Minio version and unpin boto3 (#45320)
|
||||
- Release 19.0.0
|
||||
## New Features and Improvements
|
||||
* [Python] Add more FlightInfo / FlightEndpoint attributes
|
||||
(#43537)
|
||||
* [Python] Support Arrow PyCapsule stream objects in
|
||||
write_dataset (#43771)
|
||||
* [Python] Support pandas future default string dtype
|
||||
* [CI][Python] Use GitHub Packages for vcpkg cache (#44644)
|
||||
* [Python] Add Python wrapper for JsonExtensionType (#44070)
|
||||
* [Python][C++] Add version suffix to libarrow_python* libraries
|
||||
(#44702)
|
||||
* [Python] Add support for Decimal32 and Decimal64 types (#44882)
|
||||
* [C++][Python] Add Hyperbolic Trig functions (#44630)
|
||||
* [Python] Clean-up name / field_name handling in pandas compat
|
||||
(#44963)
|
||||
* [CI][Python][Packaging] Test 3.12 wheels on Ubuntu 24.04
|
||||
(#45042)
|
||||
* [CI][Packaging][Python] Simplify
|
||||
dev/tasks/python-wheels/github.linux.yml (#45077)
|
||||
* [Python] Honor the strings_to_categorical keyword in to_pandas
|
||||
for string view type (#45176)
|
||||
## Bug Fixes
|
||||
* [C++][Python] Fix ORC crash when file contains unknown timezone
|
||||
(#45051)
|
||||
* [Python] Converting month_day_nano_interval to numpy crashes
|
||||
* [Python] Allow from_buffers to work with StringView on Python
|
||||
(#44701)
|
||||
* [C++][Python] Fix Flight Timestamp precision, revert workaround
|
||||
from #43537 (#44681)
|
||||
* [Docs][Python] Add missing canonical extension types to PyArrow
|
||||
arrays and datatypes docs (#44880)
|
||||
* [Python] Trigger manual Garbage collection before checking
|
||||
allocated bytes for dlpack tests (#44793)
|
||||
* [Python][Packaging] Use delvewheel to repair Windows wheels
|
||||
(#35323)
|
||||
* [CI][Python] Fix and modernize AppVeyor build (#44999)
|
||||
* [Python][Docs] Update docstrings for metadata methods on Field
|
||||
and Schema classes (#45004)
|
||||
* [CI][Python] Fix test_memory failures (#45007)
|
||||
* [CI][Packaging][Python] Fix Docker push step for free-threaded
|
||||
wheel builds (#45040)
|
||||
* [Packaging][Python] Use ORC from vcpkg instead of bundled on
|
||||
Linux and macOS (#45046)
|
||||
- Release 18.1.0
|
||||
## Bug Fixes
|
||||
* [Release][Packaging][Python] Set PARQUET_TEST_DATA on
|
||||
verify-release-candidate-wheels.bat (#44462)
|
||||
## New Features and Improvements
|
||||
- Release 18.0.0
|
||||
## Bug Fixes
|
||||
* [Python][Packaging] Bump MACOSX_DEPLOYMENT_TARGET to 12 instead
|
||||
of 11 (#43137)
|
||||
* [Release][Packaging][Python] Add tzdata as conda env
|
||||
requirement to avoid ORC failure (#43233)
|
||||
* [Python] Give precedence to pycapsule interface in
|
||||
pa.schema(..) (#43486)
|
||||
* [Python] Sanitize Python reference handling in UDF
|
||||
implementation (#43557)
|
||||
* [Python] Allow tuple for rename columns (#43609)
|
||||
* [Packaging][Python] Fix vcpkg version detection in macOS wheel
|
||||
build jobs (#43615)
|
||||
* [Python] Fix compilation on Cython<3 (#43765)
|
||||
* [Python][CI] Correct PARQUET_TEST_DATA path in wheel tests
|
||||
(#43786)
|
||||
* [CI][Packaging][Python] Avoid uploading wheel to gemfury if
|
||||
version already exists (#43816)
|
||||
* [CI][Python] Skip test that requires PARQUET_TEST_DATA env on
|
||||
emscripten (#43906)
|
||||
* [Python] Fix threading issues with borrowed refs and pandas
|
||||
(#44047)
|
||||
* [Benchmarking][Python] Avoid uwsgi install failure on macOS
|
||||
(#44221)
|
||||
* [CI][Release][Python] Do not verify Python on Ubuntu 20.04
|
||||
(#44254)
|
||||
* [CI][Python] Remove ds requirement from test collection on
|
||||
test_dataset.py (#44370)
|
||||
## New Features and Improvements
|
||||
* [C++][Python] Native support for UUID (#37298)
|
||||
* [C++][Python] Bool8 Extension Type Implementation (#43488)
|
||||
* [Python] Make NumPy an optional runtime dependency (#41904)
|
||||
* [Python] Add StructType attribute to access all its fields
|
||||
(#43481)
|
||||
* [CI][Python] Use pipx to install GCS testbench (#43852)
|
||||
* [Python][CI][Packaging] Don’t upload sdist to scientific-python
|
||||
nightly channel (only wheels) (#43943)
|
||||
* [Python][CI][Packaging] Upload nightly wheels to main label of
|
||||
scientific-python-nightly-wheels channel (#43932)
|
||||
* [CI][Packaging][Python] Upload pyarrow nightly wheels to
|
||||
scientific python channel on Anaconda (#43862)
|
||||
* [C++][Python][Parquet] Support reading/writing key-value
|
||||
metadata from/to ColumnChunkMetaData (#41580)
|
||||
* [Python] Ensure (Chunked)Array/RecordBatch/Table methods don’t
|
||||
crash with non-CPU data
|
||||
* [Python] Let StructArray.from_array accept a type in addition
|
||||
to names or fields (#43047)
|
||||
* [Python] Test FlightStreamReader iterator (#42086)
|
||||
* [Python] Add bindings for CopyTo on RecordBatch and Array
|
||||
classes (#42223)
|
||||
* [Python] Use Py_IsFinalizing from pythoncapi_compat.h (#43767)
|
||||
* [Python] Add bindings for memory manager and device to Context
|
||||
class (#43392)
|
||||
* [C++][Python] Add Opaque canonical extension type (#43458)
|
||||
* [Python] Deprecate passing build flags to setup.py (#43515)
|
||||
* [Python][Packaging][CI] Drop Python 3.8 support (#43970)
|
||||
* [Python][CI] Add Python 3.13 conda test build (#44192)
|
||||
* [Python][CI][Packaging] Use released versions to build and test
|
||||
wheels on Python 3.13 (#44193)
|
||||
* [Python] Set up wheel building for Python 3.13 (#43539)
|
||||
* [Python] Remove usage of deprecated pkg_resources in setup.py
|
||||
(#43602)
|
||||
* [Python][CI] Add a Crossbow job with the free-threaded build
|
||||
(#43671)
|
||||
* [Python] Do not use borrowed references APIs (#43540)
|
||||
* [Python] Declare support for free-threading in Cython (#43606)
|
||||
* [Python][CI] Add a Crossbow job with a debug CPython
|
||||
interpreter (#43565)
|
||||
* [Python][Dataset] Python / Cython interface to C++
|
||||
arrow::dataset::Partitioning::Format (#43740)
|
||||
* [Python][CI] Simplify python/requirements-wheel-test.txt file
|
||||
(#43691)
|
||||
* [Python] RecordBatch fails gracefully on non-cpu devices
|
||||
(#43729)
|
||||
* [Python] ChunkedArray fails gracefully on non-cpu devices
|
||||
(#43795)
|
||||
* [Python][Packaging] Remove numpy dependency from pyarrow
|
||||
packaging (#44148)
|
||||
* [Python] Build macOS and manylinux wheels for free-threading
|
||||
(#43965)
|
||||
* [Python] Table fails gracefully on non-cpu devices (#43974)
|
||||
* [Python] Deprecate the no longer used serialize/deserialize
|
||||
Pyarrow C++ functions (#44064)
|
||||
* [CI][Python] Enable S3 testing on Windows wheel builds (#44093)
|
||||
* [CI][Python] Enable S3 tests on macOS CI (#44129)
|
||||
* [Packaging][Python] Use macOS 12 as deployment target to have
|
||||
macOS 12 pyarrow wheels (#44315)
|
||||
* [Packaging][Python] Disable interactive deb configuration in
|
||||
wheel-manylinux--cp313t- (#44362)
|
||||
- Drop pyarrow-pr433325-extradirs.patch
|
||||
|
||||
-------------------------------------------------------------------
|
||||
Thu Sep 26 23:24:22 UTC 2024 - Guang Yee <gyee@suse.com>
|
||||
|
||||
- Enable sle15_python_module_pythons.
|
||||
|
||||
-------------------------------------------------------------------
|
||||
Wed Aug 14 20:27:48 UTC 2024 - Ben Greiner <code@bnavigator.de>
|
||||
|
||||
- Update to 17.0.0
|
||||
## Bug Fixes
|
||||
* [C++][Python] Fix casting to extension type with fixed size
|
||||
list storage type (#42219)
|
||||
* [Python] Include metadata when creating pa.schema from
|
||||
PyCapsule (#41538)
|
||||
* [C++][Python] RecordBatch.filter() segfaults if passed a
|
||||
ChunkedArray (#40971)
|
||||
* [Python] pa.array: add check for byte-swapped numpy arrays
|
||||
inside python objects (#41549)
|
||||
* [Python] Fix read_table for encrypted parquet (#39438)
|
||||
* [Python] RunEndEncodedArray.from_arrays: bugfix for Array
|
||||
arguments (#40560) (#41093)
|
||||
* [C++][Python] Map child Array constructed from keys and items
|
||||
shouldn’t have offset (#40871)
|
||||
* [Python] `test_numpy_array_protocol` test failures with numpy
|
||||
2.0.0rc1
|
||||
* [Python] Fix StructArray.sort() for by=None (#41495)
|
||||
* [Python] Build with Python 3.13 (#42034)
|
||||
* [Python] remove special methods related to buffers in python
|
||||
<2.6 (#41492)
|
||||
* [Python] Fix reading column index with decimal values (#41503)
|
||||
* [Docs][Python] Remove duplicate contents (#41588)
|
||||
* [C++][Python] Add optional null_bitmap to MapArray::FromArrays
|
||||
(#41757)
|
||||
* [Python][Parquet] Implement to_dict method on SortingColumn
|
||||
(#41704)
|
||||
* [Python] CMake: ignore Parquet encryption option if Parquet
|
||||
itself is not enabled (fix Java integration build) (#41776)
|
||||
* [Python] Disallow direct pa.RecordBatchReader() construction to
|
||||
avoid segfaults (#41773)
|
||||
* [Python] Fix RecordBatchReader.cast to support casting to equal
|
||||
schema for all types (#42098)
|
||||
* [Python] Fix tests when using NumPy 2.0 on Windows (#42099)
|
||||
* [CI][Python] Use pip install -e instead of setup.py build_ext
|
||||
--inplace for installing pyarrow on verification script (#42007)
|
||||
* [CI][Python][C++] Fix utf8proc detection for wheel on Windows
|
||||
(#42022)
|
||||
* [Python][CI] Update expected output for numpy 2.0.0 (#42172)
|
||||
## New Features and Improvements
|
||||
* [Python] Replace pandas.util.testing.rands with vendored
|
||||
version (#42089)
|
||||
* [Python] begin moving static settings to pyproject.toml
|
||||
(#41041)
|
||||
* [Python] Implement PyCapsule interface for Device data in
|
||||
PyArrow (#40717)
|
||||
* [Python] Expand the Arrow PyCapsule Interface with C Device
|
||||
Data support (#40708)
|
||||
* [Python] Let RecordBatch.filter accept a boolean expression in
|
||||
addition to mask array (#43043)
|
||||
* [Python] Fix pickling of LocalFileSystem for cython 2 (#41459)
|
||||
* [Python] Expand the C Device Interface bindings to support
|
||||
import on CUDA device (#40385)
|
||||
* [Python] Allow passing a mapping of column names to
|
||||
rename_columns (#40645)
|
||||
* [Python][Packaging] Strip unnecessary symbols when building
|
||||
wheels (#42028)
|
||||
* [Python][Docs] Update PyArrow installation docs for conda
|
||||
package split (#41135)
|
||||
* [Python] Basic bindings for Device and MemoryManager classes
|
||||
(#41685)
|
||||
* [C++][Python] Expose recursive flatten for lists on
|
||||
list_flatten kernel function and pyarrow bindings (#41295)
|
||||
* [Python][Packaging] Ensure to build with released numpy 2.0
|
||||
(instead of RC) in the wheel building workflows (#42194)
|
||||
* [CI][Python] Add a job on ARM64 macOS (#41313)
|
||||
* [CI][Python] Reduce CI time on macOS (#41378)
|
||||
* [Python] Expose byte_width and bit_width of ExtensionType in
|
||||
terms of the storage type (#41413)
|
||||
* [Python] Update Python development guide about components being
|
||||
enabled by default based on Arrow C++ (#41705)
|
||||
* [Python] Building PyArrow: enable/disable python components by
|
||||
default based on availability in Arrow C++ (#41494)
|
||||
* [C++][Python] Extends the add_key_value to parquet::arrow and
|
||||
PyArrow (#41633)
|
||||
* [Python] Ensure Buffer methods don’t crash with non-CPU data
|
||||
(#41889)
|
||||
* [C++][Python] PrettyPrint non-cpu data by copying to default
|
||||
CPU device (#42010)
|
||||
* [Python][Parquet] Update BYTE_STREAM_SPLIT description in
|
||||
write_table() docstring (#41759)
|
||||
* [Python] Add support for Pyodide (#37822)
|
||||
* [Python] Fix pandas tests to follow downstream datetime64 unit
|
||||
changes (#41979)
|
||||
* [Python] Allow Array.filter() to take general array input
|
||||
(#42051)
|
||||
* [Python] Expose new FLOAT16 logical type in the pyarrow.parquet
|
||||
bindings (#42103)
|
||||
* [Python] Array gracefully fails on non-cpu device (#42113)
|
||||
* [Python][Parquet] Pyarrow store decimal as integer (#42169)
|
||||
* [Python] Add CI job for Numpy 1.X (#42189)
|
||||
* [CI][Python] Pin openjdk=17 in python substrait integration
|
||||
(#43051)
|
||||
- Drop pyarrow-pr41319-numpy2-tests.patch
|
||||
- Add pyarrow-pr433325-extradirs.patch gh#apache/arrow/pull/43325
|
||||
|
||||
-------------------------------------------------------------------
|
||||
Thu Apr 25 08:58:22 UTC 2024 - Ben Greiner <code@bnavigator.de>
|
||||
|
||||
@@ -252,12 +701,12 @@ Mon Jan 15 20:42:25 UTC 2024 - Ben Greiner <code@bnavigator.de>
|
||||
-------------------------------------------------------------------
|
||||
Tue Nov 14 23:29:03 UTC 2023 - Ondřej Súkup <mimi.vx@gmail.com>
|
||||
|
||||
- Fix cve in changelog
|
||||
- Fix cve in changelog
|
||||
|
||||
-------------------------------------------------------------------
|
||||
Tue Nov 14 09:28:23 UTC 2023 - Ondřej Súkup <mimi.vx@gmail.com>
|
||||
|
||||
- Update to 14.0.1
|
||||
- Update to 14.0.1
|
||||
- drop pyarrow-pr37481-pandas2.1.patch
|
||||
- fixes boo#1216991 CVE-2023-47248
|
||||
* GH-38431 - [Python][CI] Update fs.type_name checks for s3fs tests
|
||||
@@ -440,7 +889,7 @@ Sun Mar 12 05:31:32 UTC 2023 - Ben Greiner <code@bnavigator.de>
|
||||
* [Python][Docs] adding info about TableGroupBy.aggregation with empty list (#14482)
|
||||
* [Python] DataFrame Interchange Protocol for pyarrow Table
|
||||
* [Python] Drop older versions of Pandas (<1.0) (#14631)
|
||||
* [Python] Pass Cmake args to Python CPP
|
||||
* [Python] Pass Cmake args to Python CPP
|
||||
* [Docs][Python] Improve docs for S3FileSystem (#14599)
|
||||
* [Python] Add missing value accessor to temporal types (#14746)
|
||||
* [Python] Expose time32/time64 scalar values (#14637)
|
||||
@@ -468,7 +917,7 @@ Sun Mar 12 05:31:32 UTC 2023 - Ben Greiner <code@bnavigator.de>
|
||||
* [Python] Support passing create_dir thru pq.write_to_dataset (#14459)
|
||||
* [CI][Python] Fix pandas master/nightly build failure related to timedelta (#14460)
|
||||
* [Python] Fix writing files with multi-byte characters in file name (#14764)
|
||||
* [Python] Handle pytest 8 deprecations about pytest.warns(None)
|
||||
* [Python] Handle pytest 8 deprecations about pytest.warns(None)
|
||||
* [Python] Remove ARROW_BUILD_DIR in building pyarrow C++ (#14498)
|
||||
* [Python] Honor default memory pool in Dataset scanning (#14516)
|
||||
* [Python] Fully support filesystem in parquet.write_metadata (#14574)
|
||||
|
||||
@@ -1,7 +1,7 @@
|
||||
#
|
||||
# spec file for package python-pyarrow
|
||||
#
|
||||
# Copyright (c) 2024 SUSE LLC
|
||||
# Copyright (c) 2025 SUSE LLC and contributors
|
||||
#
|
||||
# All modifications and additions to the file contributed by third parties
|
||||
# remain the property of their copyright owners, unless otherwise agreed
|
||||
@@ -16,29 +16,38 @@
|
||||
#
|
||||
|
||||
|
||||
%{?sle15_python_module_pythons}
|
||||
%bcond_with xsimd
|
||||
%define plainpython python
|
||||
# See git submodule /testing pointing to the correct revision
|
||||
%define arrow_testing_commit fbf6b703dc93d17d75fa3664c5aa2c7873ebaf06
|
||||
# See git submodule /cpp/submodules/parquet-testing pointing to the correct revision
|
||||
%define parquet_testing_commit 18d17540097fca7c40be3d42c167e6bfad90763c
|
||||
%if %{suse_version} <= 1500
|
||||
# requires __has_builtin with keywords
|
||||
%define gccver 13
|
||||
%endif
|
||||
Name: python-pyarrow
|
||||
Version: 16.0.0
|
||||
Version: 21.0.0
|
||||
Release: 0
|
||||
Summary: Python library for Apache Arrow
|
||||
License: Apache-2.0 AND BSD-3-Clause AND BSD-2-Clause AND MIT
|
||||
URL: https://arrow.apache.org/
|
||||
# SourceRepository: https://github.com/apache/arrow
|
||||
Source0: apache-arrow-%{version}.tar.gz
|
||||
Source1: arrow-testing-%{version}.tar.gz
|
||||
Source2: parquet-testing-%{version}.tar.gz
|
||||
Source99: python-pyarrow.rpmlintrc
|
||||
# PATCH-FIX-UPSTREAM pyarrow-pr41319-numpy2-tests.patch gh#apache/arrow#41319
|
||||
Patch0: pyarrow-pr41319-numpy2-tests.patch
|
||||
BuildRequires: %{python_module Cython >= 0.29.31}
|
||||
BuildRequires: %{python_module devel >= 3.8}
|
||||
BuildRequires: %{python_module Cython >= 3}
|
||||
BuildRequires: %{python_module devel >= 3.9}
|
||||
BuildRequires: %{python_module numpy-devel >= 1.25}
|
||||
BuildRequires: %{python_module pip}
|
||||
BuildRequires: %{python_module setuptools_scm}
|
||||
BuildRequires: %{python_module setuptools}
|
||||
BuildRequires: %{python_module wheel}
|
||||
BuildRequires: cmake
|
||||
BuildRequires: cmake >= 3.25
|
||||
BuildRequires: fdupes
|
||||
BuildRequires: gcc-c++
|
||||
BuildRequires: gcc%{?gccver}-c++
|
||||
BuildRequires: openssl-devel
|
||||
BuildRequires: pkgconfig
|
||||
BuildRequires: python-rpm-macros
|
||||
@@ -88,12 +97,13 @@ This package provides the header files within the python
|
||||
platlib for consuming modules using cythonization.
|
||||
|
||||
%prep
|
||||
%autosetup -p1 -n arrow-apache-arrow-%{version}
|
||||
# we disabled the jemalloc backend in apache-arrow
|
||||
sed -i 's/should_have_jemalloc = sys.platform == "linux"/should_have_jemalloc = False/' python/pyarrow/tests/test_memory.py
|
||||
%setup -n arrow-apache-arrow-%{version} -a1 -a2
|
||||
%autopatch -p1
|
||||
|
||||
%build
|
||||
pushd python
|
||||
%{?gccver:export CXX=g++-%{gccver}}
|
||||
%{?gccver:export CC=gcc-%{gccver}}
|
||||
export CFLAGS="%{optflags}"
|
||||
export PYARROW_BUILD_TYPE=relwithdebinfo
|
||||
export PYARROW_BUILD_VERBOSE=1
|
||||
@@ -122,8 +132,15 @@ pushd python
|
||||
popd
|
||||
|
||||
%check
|
||||
# flaky
|
||||
%{?gccver:export CXX=g++-%{gccver}}
|
||||
%{?gccver:export CC=gcc-%{gccver}}
|
||||
export ARROW_TEST_DATA="${PWD}/arrow-testing-%{arrow_testing_commit}/data"
|
||||
export PARQUET_TEST_DATA="${PWD}/parquet-testing-%{parquet_testing_commit}/data"
|
||||
# flaky tests
|
||||
donttest="test_total_bytes_allocated"
|
||||
donttest="$donttest or test_batch_lifetime"
|
||||
# worker crashes, we don't have an s3 setup in obs anyway
|
||||
donttest="$donttest or test_s3fs_limited_permissions_create_bucket"
|
||||
%ifarch %{ix86} %{arm32}
|
||||
# tests conversion to 64bit datatypes
|
||||
donttest="$donttest or test_conversion"
|
||||
|
||||
Reference in New Issue
Block a user