This is an automated email from the ASF dual-hosted git repository.
jorisvandenbossche pushed a change to branch main
in repository https://gitbox.apache.org/repos/asf/arrow.git
from b20e0ae779 GH-37941: [R][CI][Release] Add checksum verification for pre-compiled binaries (#38115)
add 0793432ad0 GH-29238 [C++][Dataset][Parquet] Support parquet modular encryption in the new Dataset API (#34616)
No new revisions were added by this update.
Summary of changes:
cpp/src/arrow/dataset/CMakeLists.txt | 7 +
cpp/src/arrow/dataset/file_parquet.cc | 75 ++++++-
cpp/src/arrow/dataset/file_parquet.h | 8 +
.../arrow/dataset/file_parquet_encryption_test.cc | 216 +++++++++++++++++++++
cpp/src/arrow/dataset/file_parquet_test.cc | 27 +++
cpp/src/arrow/dataset/parquet_encryption_config.h | 75 +++++++
cpp/src/arrow/util/config.h.cmake | 1 +
cpp/src/parquet/properties.h | 46 ++++-
python/CMakeLists.txt | 6 +
python/examples/dataset/write_dataset_encrypted.py | 93 +++++++++
.../{_dataset_orc.pyx => _dataset_parquet.pxd} | 37 ++--
python/pyarrow/_dataset_parquet.pyx | 63 ++++--
python/pyarrow/_dataset_parquet_encryption.pyx | 170 ++++++++++++++++
python/pyarrow/_parquet_encryption.pxd | 119 ++----------
python/pyarrow/_parquet_encryption.pyx | 42 ++--
python/pyarrow/dataset.py | 9 +
.../pyarrow/includes/libarrow_dataset_parquet.pxd | 16 ++
.../libparquet_encryption.pxd} | 3 -
python/pyarrow/tests/test_dataset_encryption.py | 148 ++++++++++++++
19 files changed, 994 insertions(+), 167 deletions(-)
create mode 100644 cpp/src/arrow/dataset/file_parquet_encryption_test.cc
create mode 100644 cpp/src/arrow/dataset/parquet_encryption_config.h
create mode 100644 python/examples/dataset/write_dataset_encrypted.py
copy python/pyarrow/{_dataset_orc.pyx => _dataset_parquet.pxd} (56%)
create mode 100644 python/pyarrow/_dataset_parquet_encryption.pyx
copy python/pyarrow/{_parquet_encryption.pxd => includes/libparquet_encryption.pxd} (97%)
create mode 100644 python/pyarrow/tests/test_dataset_encryption.py