This is an automated email from the ASF dual-hosted git repository.
alamb pushed a change to tag 43.0.0
in repository https://gitbox.apache.org/repos/asf/arrow-rs.git
*** WARNING: tag 43.0.0 was modified! ***
from ffd216d574 (commit)
to 414235e763 (commit)
omit ffd216d574 Workaround new bug in parquet (#6344)
omit 774b721452 Prepare arrow/parquet `53.0.0` release (#6338)
omit 831a0804bf Specialize filter for structs and sparse unions (#6304)
omit 3a1f67fd6a parquet_derive: Match fields by name, support reading
selected fields rather than all (#6269)
omit 0c15191037 Support zero column `RecordBatch`es in pyarrow integration
(use RecordBatchOptions when converting a pyarrow RecordBatch) (#6320)
omit 6e505033b9 Derive PartialEq and Eq for parquet::arrow::ProjectionMask
(#6330)
omit acdd27a66a Fix writing of invalid Parquet ColumnIndex when row group
contains null pages (#6319)
omit 69e5e5f059 Minor: improve filter documentation (#6317)
omit 13369733af Pass empty vectors as min/max for all null pages when
building ColumnIndex (#6316)
omit 678517018d docs[object_store]: clarify the backoff strategy that is
actually implemented (#6325)
omit a937869f89 Update tonic-build requirement from =0.12.0 to =0.12.2
(#6314)
omit dc8427faaa Minor: Improve comments on
GenericByteViewArray::bytes_iter(), prefix_iter() and suffix_iter() (#6306)
omit b711f23a13 feat(parquet): add union method to RowSelection (#6308)
omit ee2f75a662 Err on `try_from_le_slice` (#6295)
omit 855666d9e9 Specialize Prefix/Suffix Match for `Like/ILike` between
Array and Scalar for StringViewArray (#6231)
omit f73dbc30bb Minor: improve `RowFilter` and `ArrowPredicate` docs (#6301)
omit 8c956a9f9a Support writing UTC adjusted time arrays to parquet (#6278)
omit 6dd4a5f590 Use `unary()` for array conversion in Parquet array
readers, speed up `Decimal128`, `Decimal256` and `Float16` (#6252)
omit 2795b94119 fix reference in doctest to size_of which is not imported
by default (#6286)
omit 56f6942e30 Fix panic in comparison_kernel benchmarks (#6284)
omit 30db5dce9c Update tower requirement from 0.4.13 to 0.5.0 (#6250)
omit 1dae743af5 ci: simplify octokit add assignee (#6280)
omit 6c59b76375 Minor: `pub use ByteView` in arrow and improve
documentation (#6275)
omit 0bbad36f7d Minor: move `FallibleRequestStream` and
`FallibleTonicResponseStream` to a module (#6258)
omit 23b6ff9f43 Only add encryption headers for SSE-C in get. (#6260)
omit 344ba1dd87 ci: use octokit to add assignee (#6267)
omit 7655cca530 Fix accessing name from ffi schema (#6273)
omit e5d9816dfb Add `Statistics::distinct_count_opt` and deprecate
`Statistics::distinct_count` (#6259)
omit c2d2311020 Do not print compression level in schema printer (#6271)
omit 663a6374b4 Improve documentation for MutableArrayData (#6272)
omit 25d39c13fc feat: further TLS options on ClientOptions: #5034 (#6148)
omit d7ad4fec7c Implement date_part for durations (#6246)
omit 27789d7c9a Update parquet object_store dependency to 0.11.0 (#6264)
omit c6bd492030 Add tests for bad parquet files (#6262)
omit 4a3422febf Make the bearer token visible in FlightSqlServiceClient
(#6254)
omit 042d725888 Avoid infinite loop in bad parquet by checking the number
of rep levels (#6232)
omit c835f88951 docs: Add parquet_opendal in related projects (#6236)
omit 0130af34ba Expose bulk ingest in flight sql client and server (#6201)
omit 8d1f0f5214 feat(object_store): add support for server-side encryption
with customer-provided keys (SSE-C) (#6230)
omit 0f7116bf81 Minor: Update DateType::Date64 docs (#6223)
omit 69b17ad402 parquet Statistics - deprecate `has_*` APIs and add `_opt`
functions that return `Option<T>` (#6216)
omit 2461a16c19 Implement PartialEq for GenericBinaryArray (#6241)
omit 4295d37b8e Add examples to `StringViewBuilder` and `BinaryViewBuilder`
(#6240)
omit 3e5c76f23f Remove unnecessary null buffer construction when converting
arrays to a different type (#6244)
omit 43b29b9cf3 minor enhance doc for ParquetField (#6239)
omit 9c4a7e3efa Improve performance of `FixedLengthBinary` decoding (#6220)
omit c1b3d98ce3 Modest improvement to FixedLenByteArray BYTE_STREAM_SPLIT
arrow decoder (#6222)
omit 468a5648f6 Move `ParquetMetadataWriter` to its own module, update
documentation (#6202)
omit 1238bb1d39 Add "take" workflow for self-assigning tickets, add "how to
find issues" to contributor guide (#6059)
omit 5868966259 Minor: Improve Type documentation (#6224)
omit 63d49c856d Minor: Remove non standard footer from LICENSE.txt (#6237)
omit 3cd8b763e1 Update changelog for object_store 0.11.0 release (#6238)
omit 61c0b7dbb4 Add LICENSE and NOTICE files to object_store (#6234)
omit a693f0f9c3 Improve interval parsing (#6211)
omit fe03d39393 Prepare for object_store `0.11.0` release (#6227)
omit bb363dc261 fix: lexsort_to_indices should not fallback to non-lexical
sort if the datatype is not supported (#6225)
omit 5c5a94a11f Implement specialized filter kernel for
`FixedSizeByteArray` (#6178)
omit 8a66174d2b use spaces not tabs everywhere (#6217)
omit 3e02689e34 Add time dictionary coercions (#6208)
omit 79ffdc4c67 update BYTE_STREAM_SPLIT documentation (#6212)
omit 130ba61e35 feat(object_store): add `PermissionDenied` variant to
top-level error (#6194)
omit 4bd737dab2 Support casting between BinaryView <--> Utf8 and LargeUtf8
(#6180)
omit e28cf44e65 fix(arrow): restrict the range of temporal values produced
via `data_gen` (#6205)
omit ace14018ed Add benchmarks for `BYTE_STREAM_SPLIT` encoded Parquet
`FIXED_LEN_BYTE_ARRAY` data (#6204)
omit bd75582fd0 Optimize `min_boolean` and `bool_and` (#6144)
omit 7f1bae205d Make it clear that StatisticsConverter can not panic (#6187)
omit 12ff1eac23 fix: Correctly handle take on dense union of a single
selected type (#6209)
omit b90c799afd fix: interleave docs suggests itself, not take (#6210)
omit 49840ec0f1 Remove duplicated statistics tests in parquet (#6190)
omit d7c57d09aa fix parquet type is_optional comment (#6192)
omit db239e5b3a Add (more) Parquet Metadata Documentation (#6184)
omit d5ed6b9f82 Add `ThriftMetadataWriter` for writing Parquet metadata
(#6197)
omit a235b9b295 Update zstd-sys requirement from >=2.0.0, <2.0.13 to
>=2.0.0, <2.0.14 (#6196)
omit 63a6209b87 Reduce bounds check in `RowIter`, add `unsafe
Rows::row_unchecked` (#6142)
omit 2a4f269e94 Support Parquet `BYTE_STREAM_SPLIT` for INT32, INT64, and
FIXED_LEN_BYTE_ARRAY primitive types (#6159)
omit 7f2d9ac14b feat(parquet): Implement AsyncFileWriter for
`object_store::buffered::BufWriter` (#6013)
omit 6133d18021 Fix typo in documentation of Float64Array (#6188)
omit 191c9d4553 Benchmarks for `bool_and` (#6189)
omit e6bd74b2c3 Add support for `StringView` and `BinaryView` statistics in
`StatisticsConverter` (#6181)
omit 36d567b4ca add filter benchmark for fsb (#6186)
omit f2de2cd3c8 No longer write Parquet column metadata after column chunks
*and* in the footer (#6117)
omit ee6fb8709b Update sysinfo requirement from 0.30.12 to 0.31.2 (#6182)
omit e6b794436c Update snafu (#5930) (#6070)
omit f708f3eaf7 Make object_store errors non-exhaustive (#6165)
omit df59cddcec Support `StringView` and `BinaryView` in CDataInterface
(#6171)
omit 01407f4824 Minor: improve comments in temporal.rs tests (#6140)
omit 0c3732fcae Optimize `take` kernel for `BinaryViewArray` and
`StringViewArray` (#6168)
omit ede5a64628 Minor: Update release schedule in README (#6125)
omit bf1a9ec7fa Add additional documentation and examples to ArrayAccessor
(#6141)
omit c14ade2b91 Upgrade protobuf definitions to flightsql 17.0 (#6133)
(#6169)
omit 2905ce6796 Update object store MSRV to `1.64` (#6123)
omit 6e893b5d41 Add `BooleanArray::new_from_packed` and
`BooleanArray::new_from_u8` (#6127)
omit bf0ea9129e improvements to `(i)starts_with` and `(i)ends_with`
performance (#6118)
omit bf9ce475df Improve `LIKE` performance for "contains" style queries
(#6128)
omit 0e99e3a645 improve LIKE regex (#6145)
omit bd1e76b085 Implement exponential block size growing strategy for
`StringViewBuilder` (#6136)
omit 11f2bb8076 Fix comparison kernel benchmarks (#6147)
omit 80ed712851 Use `LevelHistogram` in `PageIndex` (#6135)
omit 5f5a82cb38 Remove automatic buffering in `ipc::reader::FileReader` for
consistent buffering (#6132)
omit 705d3414eb Remove `SchemaBuilder` dependency from `StructArray`
constructors (#6139)
omit e815d06766 Implement date_part for intervals (#6071)
omit f42d242052 Add ArrowError::ArithmeticError (#6130)
omit b06ffceaab Add support for level histograms added in PARQUET-2261 to
`ParquetMetaData` (#6105)
omit 613e93e75f Merge `53.0.0-dev` dev branch to main (#6126)
omit 1ff4e21e80 Fix clippy in object_store crate (#6120)
omit 3ebb033266 Fix Clippy for the Rust 1.80 release (#6116)
omit fa2fbfdc8b added a flush method to IPC writers (#6108)
omit 49e714de6e Prepare `52.2.0` release (#6110)
omit af40ea3822 Implement specialized min/max for `GenericBinaryView`
(`StringView` and `BinaryView`) (#6089)
omit 93e4eb25c7 Faster `GenericByteView` construction (#6102)
omit 8aa91e519a Make bool_or an alias for max_boolean (#6100)
omit 658e58f882 add benchmark to track performance (#6101)
omit 5de1d5e741 Optimize `max_boolean` by operating on u64 chunks (#6098)
omit ee5694078c fix panic in `ParquetMetadata::memory_size`: check
has_min_max_set before invoking min()/max() (#6092)
omit 16915b57f0 Add PartialEq to ParquetMetaData and FileMetadata (#6082)
omit 8a5be1330e Enable casting from Utf8View (#6077)
omit 9be0eb530d Minor: Improve parquet PageIndex documentation (#6042)
omit b44497e1cd Prepare for object_store `0.10.2` release (#6079)
omit 41665ea138 Correct timeout in comment from 5s to 30s (#6073)
omit 94652e5e23 use GCE metadata server env var overrides (#6015)
omit 4978e32654 Sanitize error message for sensitive requests (#6074)
omit 62f9e72f74 Reorganize arrow-flight test code (#6065)
omit 6ab853d38f Do not write `ColumnIndex` for null columns when not
writing page statistics (#6011)
omit b72098fee5 Minor: clarify the relationship between `file::metadata`
and `format` (#6049)
omit b2458bd686 StringView support in arrow-csv (#6062)
omit 66390ff8ec Add parquet `StatisticsConverter` for arrow reader (#6046)
omit 6d4e2f2cea Implement min max support for string/binary view types
(#6053)
omit 31b8ba023e Add begin/end_transaction methods in FlightSqlServiceClient
(#6026)
omit 074bcb5793 Directly decode String/BinaryView types from arrow-row
format (#6044)
omit 0002b4ded7 Fix typo in GenericByteViewArray documentation (#6054)
omit 9acc9fa0b8 Minor API adjustments for StringViewBuilder (#6047)
omit 199ce9190c Fix 5592: Colon (:) in object_store::path::{Path} is not
handled on Windows (#5830)
omit 920a94470d Move avoid using copy-based buffer creation (#6039)
omit e70c16d67d Clean up unused code for view types in offset buffer (#6040)
omit 50b1e30aa6 Additional tests for parquet reader utf8 validation (#6023)
omit 2424da25dd Fix `hashbrown` version in `arrow-array`, remove from
`arrow-row` (#6035)
omit 826577a764 Update quick-xml requirement from 0.35.0 to 0.36.0 in
/object_store (#6032)
omit cb3babc9d1 Improve performance reading `ByteViewArray` from parquet by
removing an implicit copy (#6031)
omit 3ce8e842af Unsafe improvements: core `parquet` crate. (#6024)
omit c47f230c9c Update clap test (#6028)
omit 76fbdbc060 Update zstd-sys requirement from >=2.0.0, <2.0.12 to
>=2.0.0, <2.0.13 (#6019)
omit 8355823f74 Complete `StringViewArray` and `BinaryViewArray` parquet
decoder: implement delta byte array and delta length byte array encoding
(#6004)
omit b9e4497258 Rename `Schema::all_fields` to `flattened_fields` (#6001)
omit af4d6b624e Fast utf8 validation when loading string view from parquet
(#6009)
omit 2b986dfd5d Deduplicate strings/binarys when building view types (#6005)
omit b9562b9550 fix doc ci in latest rust nightly version (#6012)
omit a85768db9f Add FlightSqlServiceClient::new_from_inner (#6003)
omit fd5e67df9f Automatically cleanup empty dirs in LocalFileSystem (#5978)
omit bed37466af Add additional documentation and examples to DataType
(#5997)
omit 1f0b000958 implement `DataType::try_from(&str)` (#5994)
omit e7a0008e59 Implement dictionary support for reading ByteView from
parquet (#5973)
omit 035b5899f3 Prepare arrow `52.1.0` (#5992)
omit 5c6f857d9a feat(5851): ArrowWriter memory usage (#5967)
omit e61fb621d1 Add ParquetMetadata::memory_size size estimation (#5965)
omit ebc1cb1e5b fix: error in case of invalid interval expression (#5987)
omit 859c4ad486 Implement directly build byte view array on top of parquet
buffer (#5972)
omit 3b93a4b062 WriteMultipart Abort on MultipartUpload::complete Error
(#5974)
omit 63516742e7 Provide Arrow Schema Hint to Parquet Reader - Alternative 2
(#5939)
omit cad573571b Add user defined metadata (#5915)
omit bb1250ceb8 Minor: fix clippy complaint in parquet_derive (#5984)
omit 8284e5f4ff Reduce repo size by removing accumulative commits in CI job
(#5982)
omit 8e9bdceb44 Update quick-xml requirement from 0.34.0 to 0.35.0 in
/object_store (#5983)
omit 62c1615e8f feat: support reading OPTIONAL column in parquet_derive
(#5717)
omit 6230435b4f Add operation in ArrowNativeTypeOp::neg_check error message
(#5944) (#5980)
omit a4d21679d4 Make ObjectStoreScheme public (#5912)
omit 871c999601 Handle flight dictionary ID assignment automatically (#5971)
omit a7b4a3b10b Add view buffer for parquet reader (#5970)
omit c5b5eda77b Add benchmark for reading binary/binary view from parquet
(#5968)
omit 0a4d8a14b5 Fix FFI array offset handling (#5964)
omit 6bc9514aef implement sort for view types (#5963)
omit ee5572163a Expose `IntervalMonthDayNano` and `IntervalDayTime` and
update docs (#5928)
omit 1ef22e5a9b `like` benchmark for StringView (#5936)
omit e5604aae63 Document process for PRs with breaking changes (#5953)
omit 6b031629e1 Faster primitive arrays encoding into row format (#5858)
omit 45190ab528 feat: add max_bytes and min_bytes on PageIndex (#5950)
omit 4b326f6d05 Improve error message for unsupported nested comparison
(#5961)
omit 0e56fd5c4d chore(5797): change default data_page_row_limit to 20k
(#5957)
omit 901fbe877f Minor: fixup contribution guide (#5952)
omit 2323c74ce2 Update quick-xml requirement from 0.33.0 to 0.34.0 in
/object_store (#5954)
omit 460fd5506c test: Add unit test for extending slice of list array
(#5948)
omit 66bada54cf Implement like/ilike etc for StringViewArray (#5931)
omit 3139a08baf Update quick-xml requirement from 0.32.0 to 0.33.0 in
/object_store (#5946)
omit c084342aef Better document support for nested comparison (#5942)
omit 0c3a24d2a4 Implement arrow-row encoding/decoding for view types (#5922)
omit 063ac13af0 row format benches for bool & nullable int (#5943)
omit a35214f92a Fix typo in benchmarks (#5935)
omit 0ea074af77 Add `MultipartUpload` blanket implementation for `Box<W>`
(#5919)
omit 02fb714142 Update zstd-sys requirement from >=2.0.0, <2.0.10 to
>=2.0.0, <2.0.12 (#5913)
omit 86eb191fb2 fix(ipc): set correct row count when reading struct arrays
with zero fields (#5918)
omit 9413cd3ffd Add the ability for Maps to cast to another case where the
field names are different (#5703)
omit 13c9e9083e Add eq benchmark for StringArray/StringViewArray (#5924)
omit 7ef6be4cd9 Preallocate for `FixedSizeList` in `concat` (#5862)
omit 22e0b4432c Revert "Write Bloom filters between row groups instead of
the end (#5860)" (#5932)
omit 3930d5b056 Write Bloom filters between row groups instead of the end
(#5860)
omit 492bba98fb docs: Fix broken links of object_store_opendal README
(#5929)
omit 29c07d00ad docs: Add object_store_opendal as related projects (#5926)
omit 2f1c0147b2 Update proc-macro2 requirement from =1.0.85 to =1.0.86
(#5927)
omit 20a569a733 fix: Adjust FFI_ArrowArray offset based on the offset of
offset buffer (#5895)
omit c7e88a257c fix: prevent potential out-of-range access in
FixedSizeListArray (#5902)
omit d0a88c6519 Implement compare operations for view types (#5900)
omit 72467c670f Minor: expose timestamp_tz_format for csv writing (#5890)
omit 0d1511cfaf minor: use as_primitive replace downcast_ref (#5898)
omit d89b3b9ae1 Document parquet ArrowWriter type limitations (#5875)
omit ed018a34d9 Minor: Clarify when page index structures are read (#5886)
omit c191294826 Document when the ParquetRecordBatchReader will re-read
metadata (#5887)
omit c7513bd7a9 implement new null for view types (#5894)
omit 3e7c40c14a chore: update RunArray reference in run_iterator.rs (#5892)
omit cc0ce1b479 add view type single column tests (#5891)
omit 9949dfe22e chore: implement error handling for object_store (#5889)
omit aab9a6cee0 chore: Remove not used cache in InstanceCredentialProvider
(#5888)
omit 956fe76731 Add simple GC for view array types (#5885)
omit e8285bea0e clean up ByteView construction (#5879)
omit d32f68d6ec Fix clippy for object_store (#5883)
omit 3715d5447e new clippy rules (#5881)
omit 8e476aee95 feat: implement take for dense union array (#5873)
omit 8752e01be6 Improve performance of casting `StringView`/`BinaryView` to
`DictionaryArray` (#5872)
omit c6359bf78d Avoid copy/allocation when read view types from parquet
(#5877)
omit 2d17bf09d0 feat: recursively merge Field when datatype is
DataType::List and DataType::LargeList (#5852)
omit 77271c4984 Improve performance of casting `DictionaryArray` to
`StringViewArray` (#5871)
omit 601a722206 feat(object_store): Add `put` API for buffered::BufWriter
(#5835)
omit 4fc9ad126f Benchmark for casting view to dict arrays (and the reverse)
(#5874)
omit 0cc1416800 Update quick-xml requirement from 0.31.0 to 0.32.0 in
/object_store (#5870)
omit 8bee08bf3c Improve Parquet reader/writer properties docs (#5863)
omit a20116ec36 Make RowSelection's from_consecutive_ranges public (#5848)
omit b8c2741491 Minor: refine row selection example more (#5850)
omit 298bf481ad parquet: Fix warning about unused import (#5865)
omit 7f66b77af9 fix: msrv CI for object_store (#5866)
omit 76d04a8fa4 Added panic message to docs. (#5857)
omit 087f34b70e Refine documentation for `unary_mut` and `binary_mut`
(#5798)
omit fa8d350238 Add exposing fields from parquet row (#5842)
omit bca2f3ab9f Derive `Copy` for `TimeUnit` and `IntervalUnit` (#5840)
omit f42218ae5d Update proc-macro2 requirement from =1.0.84 to =1.0.85
(#5838)
omit ce1a8fc664 Add repr(C) to i256 (#5837)
omit 176a2d781b Prepare arrow 52.0.0 (#5836)
omit 57c4748fa9 Minor: Document timestamp with/without cast behavior (#5826)
omit 198af7a3f4 chore: Make binary_mut kernel accept different type for
second arg (#5833)
omit 13a26d6cb0 feat: impl *Assign ops for types in arrow-buffer (#5832)
omit 065151be78 fix: invalid examples/documentation in parquet_derive doc
(#5823)
omit fe071eb6a3 Minor: Improve ArrowReaderBuilder::with_row_selection docs
(#5824)
omit e4b28bd787 Relax zstd-sys Version Pin (#5829)
omit 5a24119f66 Minor: Improve arrow_cast documentation (#5825)
omit c2b05cdbcb Check length of `FIXED_LEN_BYTE_ARRAY` for `uuid` logical
parquet type (#5821)
omit 95ef912632 fix(flightsql): remove Any encoding of
DoPutPreparedStatementUpdateResult (#5817)
omit 1634a65ee7 Allow constructing ByteViewArray from existing blocks
(#5796)
omit 7fe01bb432 Allow overriding the inferred parquet scheme root (#5814)
omit 09e58a435a fix: serialization of decimal (#5801)
omit 12f57af595 Minor: Clarify docs on `EnabledStatistics` (#5812)
omit c6d089b6a8 Minor: Add examples for ColumnPath::from (#5813)
omit 9828bf0bcd Push SortOptions into DynComparator Allowing Nested
Comparisons (#5426) (#5792)
omit 54efb65bb1 Revisit List Row Encoding (#5807) (#5811)
omit 1ebd2a4d1b Add parquet-derive to repository README (#5795)
omit 95791f1c31 Update proc-macro2 requirement from =1.0.83 to =1.0.84
(#5805)
omit 4b5d9bfc95 Fix issue #5800: Handle missing files in
list_with_delimiter (#5803)
omit 7342d363d7 Fix typo continuation maker -> marker (#5802)
omit 4b1feaad98 Update nix requirement from 0.28.0 to 0.29.0 in
/object_store (#5799)
omit bd5d4a59db chore: update docs to delineate which are recursive (#5794)
omit 5e9919fd2b Fix incorrect URL to Parquet CPP types.h (#5790)
omit d65240c120 Refine ParquetRecordBatchReaderBuilder docs (#5774)
omit b07fd5dc4e feat(arrow-json): encode `Binary` and `LargeBinary` types
as hex when writing JSON (#5785)
omit 3e7e701db7 Update proc-macro2 requirement from =1.0.82 to =1.0.83
(#5789)
omit 3b7923c77c Update prost-build requirement from =0.12.4 to =0.12.6
(#5788)
omit c6b3eaa963 Refine parquet documentation on types and metadata (#5786)
omit cf59b6cd82 Structured interval types for `IntervalMonthDayNano` or
`IntervalDayTime` (#3125) (#5654) (#5769)
omit ce8363af34 Set the default size of BitWriter for DeltaBitPackEncoder
to 1MB (#5776)
omit c498eb7485 feat: support encoding of binary in CSV writer (#5782)
omit 2534976a56 fix broken link to ballista crate (#5784)
omit a126d5097b Support casting a `FixedSizedList<T>[1]` to `T` (#5779)
omit 30762e81be Encode UUID as FixedLenByteArray in parquet_derive (#5773)
omit dfe0f2627b Update itertools requirement from 0.12.0 to 0.13.0 in
/object_store (#5780)
omit 28c1cae83f Fix documentation for parquet `parse_metadata`,
`decode_metadata` and `decode_footer` (#5781)
omit fa2ba9efc7 Improve error message for timestamp queries outside
supported range (#5730)
omit 0c1e3b893b Remove harmful table lookup optimization for bit operations
(#5772)
omit 30767a687b Remove deprecated comparison kernels (#4733) (#5768)
omit d17b2067d6 feat: Make AsyncArrowWriter accepts AsyncFileWriter (#5753)
omit 178ef99d9a Add environment variable definitions to run the nanoarrow
integration tests (#5764)
omit 78bda14f4c Expose boolean builder contents (#5760)
omit 7d465b87cc Expose the null buffer of every builder that has one (#5754)
omit 3566328e04 Improve repository readme (#5752)
omit 326231e3fb fix: parse string of scientific notation to decimal when
the scale is 0 (#5740)
omit c08feb41a7 Downgrade to Rust 1.77 in integration pipeline to fix CI
(#5719) (#5761)
omit 6ab67df984 Allow specifying comment character for CSV reader (#5759)
omit cd39b8c024 Compute data buffer length by using start and end values in
offset buffer (#5741)
omit 1c869214e2 Minor: Document object store release cadence (#5750)
omit 68ecc16654 Document planned release cadence for arrow/parquet/etc
(#5737)
omit 158e54da2c Fix nested nullability when randomly generating arrays
(#5713)
omit 7efe6c2053 Add additional WriteMultipart tests (#5743) (#5746)
omit 3d3ddb2108 Prepare object_store 0.10.1 (#5745)
omit 02be02bb51 Fix PutPayloadMut::push not updating content_length (#5743)
(#5744)
omit b25c441745 Change `UnionArray` constructors (#5623)
omit 4045fb5ba2 csv: Add support for flexible column lengths (#5679)
omit f67a5cec22 Update brotli requirement from 5.0 to 6.0 (#5726)
omit 68d1eef689 Minor: avoid (likely unreachable) panic in FlightClient
(#5734)
omit e3f1c9669c Refactor to share code between do_put and do_exchange calls
(#5728)
omit 119db5cdc6 Update proc-macro2 requirement from =1.0.81 to =1.0.82
(#5732)
omit 98784bd059 Fix "Rustdocs (amd64, nightly)" CI check (#5727)
omit 7568178e37 Support casting `StringView`/`BinaryView` -->
`StringArray`/`BinaryArray`. (#5704)
omit 8f8fb2e2a9 Fix `GenericListBuilder` test typo (#5724)
omit 520ad68bee Export object_store integration tests (#5709)
omit 0d0c02e71e Tweak Private Sbbf::new_with_ndv_fpp Documentation (#5718)
omit d9206ba83f Deprecate NullBuilder capacity, as it behaves in a
surprising way (#5721)
omit 2bdc9c1eec docs: add sizing explanation to bloom filter docs in
parquet (#5705)
omit b3f06f6cc4 Fix up clippy for Rust 1.78 (#5710)
omit eb2d00b3ab Fallible stream for arrow-flight do_exchange call (#3462)
(#5698)
omit 6348dc3d0c Accept parquet schemas without explicitly required Map keys
(#5630)
omit bbd85ed3d2 Add `ListView` & `LargeListView` basic construction and
validation (#5664)
omit a20d2e51e9 Fix documentation around handling of nulls in cmp kernels
(#5697)
omit a61f1dc8ea Support casting `StringArray`/`BinaryArray` -->
`StringView` / `BinaryView` (#5686)
omit 08af4710fc Add `BufWriter::with_attributes` and `::with_tags` in
`object_store` (#5693)
omit 7feb5425e6 Add more attributes (#5690)
omit 11450ae8dd Arrow Flight SQL example JDBC driver incompatibility (#5666)
omit 0230795384 Remove deprecated JSON writer (#5651)
omit ae9b0dbaa8 Move ffi stream and utils from arrow to arrow-array (#5670)
omit c5b33049d5 Update object_store 0.10.0 (#5675)
omit 50358f6ccb Fix integration tests by downgrading jobserver (#5673)
(#5674)
omit cd3331989d Prepare object_store 0.10.0 (#5658)
omit 884a13614f Update proc-macro2 requirement from =1.0.80 to =1.0.81
(#5659)
omit 4b49c34440 Add put_multipart_opts (#5435) (#5652)
omit f2765283b6 Add Attributes API (#5329) (#5650)
omit 34e2ac2e71 Modify decimal regex to accept positive exponent specifier
(#5649)
omit 0d031cc8aa feat: JSON encoding of FixedSizeList (#5646)
omit 012430759f Fix flaky test_cleanup_intermediate_files (#5645)
omit 873176078a Support non-contiguous put payloads / vectored writes
(#5514) (#5538)
omit b9a373d878 Update proc-macro2 requirement from =1.0.79 to =1.0.80
(#5644)
omit e88e5aa92e Implement `filter` kernel for byte view arrays. (#5624)
omit fee692189f fix: panic when casting `ListArray` to `FixedSizeList`
(#5643)
omit 883c13ae21 Add more invalid utf8 parquet reader tests (#5639)
omit 7d929f0aec feat(ffi): add run end encoded arrays (#5632)
omit d84a1a6152 String to decimal conversion written using E/scientific
notation (#5611)
omit 89767ccb1d Account for Timezone when Casting Timestamp to Date32
(#5605)
omit 905c46be1a PrettyPrint support for `StringViewArray` and
`BinaryViewArray` (#5634)
omit a999fb8676 Increase BinaryViewArray test coverage (#5635)
omit 6450527c4f feat: encode FixedSizeBinary in JSON as hex string (#5622)
omit 0a1dfb3045 Update brotli requirement from 4.0 to 5.0 (#5637)
omit a094863452 Update flatbuffers requirement from 23.1.21 to 24.3.25
(#5636)
omit a15adf66a8 Fixed typos in object store (#5629)
omit 36a6e515f9 Update Flight crate README version (#5621)
omit 91f0b17713 feat: support reading and writing `StringView` and
`BinaryView` in parquet (part 1) (#5618)
omit 2c4b321d3b Bump peaceiris/actions-gh-pages from 3.9.3 to 4.0.0 (#5617)
omit 755616fd36 Use FixedSizeListArray::new in FixedSizeListBuilder (#5612)
omit 12c0d00794 Update prost-build requirement from =0.12.3 to =0.12.4
(#5604)
omit 0b0d64b627 Adds send_retry_with_idempotency and retry more kinds of
transport errors (#5609)
omit f38283b49b test: Add a test for RowFilter with nested type (#5600)
omit 144c9c7f6d Implement `take` kernel for byte view array. (#5602)
omit 16f4a7f970 fix: https://github.com/apache/arrow-rs/issues/5599 (#5603)
omit 1852c3327a Minor: Add docs for GenericBinaryBuilder, links to
`GenericStringBuilder` (#5597)
omit c203785ca3 Add `UnionArray::into_parts` (#5585)
omit 1b3d1a9f58 feat: implemented with_field() for FixedSizeListBuilder
(#5541)
omit 51c1b4b2ed Add tests for Arrow Flight support for `StringViewArray`
and `BinaryViewArray` (#5601)
omit 9fda7eab0c Bump chrono-tz from 0.8 to 0.9 (#5596)
omit e8c6d95191 Fix handling of empty multipart uploads for GCS (#5590)
omit 1b0ef0224e Update pyo3 from 0.20 to 0.21 (#5566)
omit bc2a73d1de filter for run end array (#5573)
omit 5a0baf1aee Add GCS signed URL support (#5300)
omit eddef43d1c Optionally require alignment when reading IPC, respect
alignment when writing (#5554)
omit 6306df0828 Update brotli requirement from 3.3 to 4.0 (#5586)
omit 40409e4038 Split arrow_cast::cast::string into its own submodule
(#5563)
omit 888408309f Expose ArrowReaderMetadata::try_new (#5583)
omit ec85145f4b Add `try_filter_leaves` to propagate error from filter
closure (#5575)
omit 77a3132bbd using latest chrono (#5578)
omit 17058c76be IPC format support for StringViewArray and BinaryViewArray
(#5525)
omit 9f36c88345 Implement MultipartStore for ThrottledStore (#5533)
omit 40fa58edae Update localstack 3.3 (#5570)
omit 8d344a6312 Update error message tests (#5569)
omit f8acd2b66e Add OffsetBufferBuilder (#5532)
omit 3c50d47833 Pin zstd-sys to `v2.0.9` in parquet (#5567)
omit cdb7b6f15b Update reqwest 0.12 and http 1.0 (#5536)
omit ff86119429 Split cast::dictionary into a submodule of cast (#5555)
omit 51ea38814c Correct example code for column (#5560) (#5561)
omit 9a5ea83885 Implement FlightSQL spec change to support stateless
prepared statements (#5433)
omit e1e1fb8b30 Split arrow_cast::cast::decimal into its own submodule
(#5552)
omit 4e13f92c0b query.to_any() please (#5543)
omit e8b424ab29 Fix Clippy Lints object_store (#5546)
omit a8c4232b58 Add IPC StreamDecoder (#5531)
omit 37d1d3d4e6 Fix new clippy lints (#5544)
omit 78762dcf20 Split arrow_cast::cast::list into its own submodule (#5537)
omit 161924e830 Bump black from 22.10.0 to 24.3.0 in /parquet/pytest (#5535)
omit f5c2686296 fix: copy/rename return error if source is nonexistent
(#5528)
omit 96c4c0b168 Replace AsyncWrite with Upload trait and rename
MultiPartStore to MultipartStore (#5458) (#5500)
omit f41c2a4e5a Minor: add additional documentation about `BufWriter`
(#5519)
omit 7e5f523a17 impl `From<ScalarBuffer<T>>` for `Vec<T>` (#5518)
omit ae42b3b688 parquet: Use specific error variant when codec is disabled
(#5521)
omit ada986c7ec Prepare arrow 51.0.0 (#5516)
omit 78aff9c401 update arrow-format (#5502)
omit 14bd53dc12 Support dictionary encoding in structures for
`FlightDataEncoder`, add documentation for `arrow_flight::encode::Dictionary`
(#5488)
omit 773cf18e2a feat: clarifying comments in struct_builder.rs #5494
(#5499)
omit 5dd5418070 Minor: Add doc comments to `GenericByteViewArray` (#5512)
omit 4d0316da10 Deprecate array_to_json_array (#5515)
omit c3899cea0c Fix integer parsing of empty strings (#5504) (#5505)
omit d39cf283e9 feat: initial support string_view and binary_view,
supports layout and basic construction + tests (#5481)
omit ad3b4c9250 Add DataType::ListView and DataType::LargeListView (#5493)
omit 19a3bb0d26 Remove internal buffering from AsyncArrowWriter (#5484)
(#5485)
omit c252a18844 Implement MultiPartStore for InMemory (#5495)
omit 6fd3a16a02 Update proc-macro2 requirement from =1.0.78 to =1.0.79
(#5498)
omit 51bcadbcd1 Better document parquet pushdown (#5491)
omit aad42b52f8 Remove unused import detected by nightly rust (#5477)
omit 94da02f043 Fix NullBufferBuilder::new_from_buffer wrong size assertion
(#5489)
omit 82fc0df73a Add MapBuilder::with_values_field to support non-nullable
values (#5482) (#5483)
omit e2b1f22012 Provide access to inner Write for parquet writers (#5471)
omit 79634c0f4b Document parquet writer memory limiting (#5450) (#5457)
omit c6ba0f764a Add more comprehensive documentation on testing and
benchmarking to CONTRIBUTING.md (#5478)
omit ae1d10fd6b Update latest chrono (#5479)
omit 8caec3b28b add support for gcp application default auth on windows in
object store (#5473)
omit 1553267fbe Add RecordBatch::schema_ref (#5474)
omit ace6d9058c Enhancement: Replace unsafe code (#5460)
omit 7eb866dd32 Add DataType::Utf8View and DataType::BinaryView (#5470)
omit d350ac5be1 Update base64 requirement from 0.21 to 0.22 in
/object_store (#5465)
omit 629ec077d9 Minor: Fix formatting typo in `Field::new_list_field`
(#5464)
omit 924e17e5c5 Update base64 requirement from 0.21 to 0.22 (#5467)
omit a02cebac91 Update localstack (#5283) (#5462)
omit 386bf49a1c Uses ResourceType for filtering directories instead of
workaround (#5452)
omit 0b977c6954 Fix test_string_dictionary_merge (#5255) (#5461)
omit 885461eb36 Document UnionArray Panics (#5456)
omit c5ab64cdc1 fix: lexsort_to_indices unsupported mixed types with list
(#5455)
omit 30151220c2 Prepare object_store 0.9.1 (#5449)
omit 877e870ee0 Refine `Display` and `Source` implementation for error
types (#5439)
omit ed996da97a Update local.rs (#5441)
omit ef5c45cf41 Add BufWriter for Adaptive Put / Multipart Upload (#5431)
omit 37cf8a6c19 Improve debug output of Time32/Time64 arrays (#5428)
omit ab59080169 Improve docs for logical and physical nulls even more
(#5434)
omit 282123441c Update nix requirement from 0.27.1 to 0.28.0 in
/object_store (#5432)
omit 48fbb293c2 feat: S3 server-side encryption (#5402)
omit 0fd9b8af8f Enable anonymous access for MicrosoftAzure (#5425)
omit 4325900818 Bring some methods over from ArrowWriter to the async
version (#5251)
omit 1e0a264371 Ensure addition/multiplications in when allocating buffers
don't overflow (#5417)
omit e7ce4bbd66 Update Flight proto: PollFlightInfo & expiration time
(#5413)
omit e09896d9ae Miri fix: Rename invalid_mut to without_provenance_mut
(#5418)
omit ef63fb9faf fix(object_store): Include Content-MD5 header for S3
DeleteObjects (#5415)
omit 5bb226cc79 docds(object_store): Mention HTTP/WebDAV in README (#5409)
omit 1a880d632e Improve float to string cast by ~20%-40% (#5401)
omit 2e6c7b94b7 Enable running arrow-array and arrow-arith with miri and
avoid strict provenance warning (#5387)
omit cc48095d4f [object_store] Fix empty Multipart Upload for AWS S3 (#5405)
omit eb4be68a82 Return null for overflow when casting string to integer
under safe option enabled (#5398)
omit a88d70dc14 feat: utility functions for creating fsl dtype (#5373)
omit 48246fff71 Add tests for serializing list of dictionary encoded values
to json (#5399)
omit 0d96f1eb36 Improve like kernel by ~2% (#5390)
omit 1b06d78db5 Propagate error instead of panic for `take_bytes` (#5395)
omit c9029c5388 Don't omit schema metadata when removing column (#5328)
omit 0b45993f9c Update to chrono 0.4.34 (#5385)
omit 9d0abcc6f4 Return error instead of panic when reading invalid Parquet
metadata (#5382)
omit 1f8470dfd0 Update tonic-build requirement from =0.10.2 to =0.11.0
(#5379)
omit 865a9d3fe8 Update tonic requirement from 0.10.0 to 0.11.0 (#5380)
omit b25fe56b8f Fix latest clippy lints (#5376)
omit bc824d216b Pull container name from URL for Azure blob in
https://<account>.blob.core.windows.net/<container> case (#5371)
omit 55723980d3 docs(object-store): add warning to flush (#5369)
omit ae85263a97 feat: support casting FixedSizeList with new child type
(#5360)
omit bd19a62446 Add example of converting RecordBatches to JSON objects
(#5364)
omit 0dda129be7 Return an error instead of a panic when reading a corrupted
Parquet file with mismatched column counts (#5362)
omit 79721ec408 Minor: support cast values to fixedsizelist (#5340)
omit f303c9e112 pyarrow: Preserve RecordBatch's schema metadata (#5355)
omit 5093b787c4 Minor(docs): update master to main for DataFusion/Ballista
(#5363)
omit 121666e464 Add more debugging info to StructBuilder validate_content
(#5357)
omit f5097b07cb Make ArrayBuilder also Sync (#5353)
omit 1237c89922 Enhance Time32/Time64 support in date_part (#5337)
omit c096172b76 Track the memory usage of custom allocations so that their
size can be reported via Array::get_buffer_memory_size (#5347)
omit 93c7a12cff Mark Encoding::BIT_PACKED as deprecated and document its
compatibility issues (#5348)
omit 31cf5ce23f Exclude questions from changelog (#5349)
omit 8e9d7132f3 fix: Return an error on type mismatch rather than panic
(#4995) (#5341)
omit 5117b38d99 feat: add `take_record_batch`. (#5333)
omit 8fff5e4a07 Add ListBuilder::with_field to support non nullable list
fields (#5330) (#5331)
omit 514641918a Raw JSON writer (~10x faster) (#5314) (#5318)
omit 20e723e523 Refactor temporal extract date part kernels (#5319)
omit a0148ba4ce Add JSON writer benchmarks (#5314) (#5317)
omit e36c5fd94c Update proc-macro2 requirement from =1.0.76 to =1.0.78
(#5324)
omit cf8084940d Minor/Doc Expand FlightSqlServiceClient::handshake doc
(#5321)
omit e47e2f19d1 fix panic when decode a group with no child (#5322)
omit b594d9063a Enhance Date64 type documentation (#5323)
omit ce589325d8 parquet: Add ArrowWriterOptions to skip embedding the arrow
metadata (#5299)
omit b03613eb00 Test parse_url_opts for HTTP (#5310) (#5316)
omit 639e81e98c Update IOx links (#5312)
omit ff5a84df39 Pass options to HTTPBuilder in parse_url_opts (#5310)
(#5311)
omit 8301b23845 Bump actions/cache from 3 to 4 (#5308)
omit 3ed7cc61d4 Remove localstack DynamoDB workaround (#5267) (#5307)
omit 202e9a1c29 Avro block decompression (#5306)
omit ba6dbb8e27 Add support for more fused boolean operations (#5298)
omit 8345991ad6 Result into error in case of endianness mismatches (#5301)
omit 07fa7f6f0b Update localstack 3.0.2 (#5302)
omit 4c3e9be465 Support Parquet Byte Stream Split Encoding (#5293)
omit 4a6ae68ad8 Map AvroSchema to Arrow (#4886) (#5009)
omit 72d8a78317 Extend string parsing support for Date32 to encompass the
timestamp format (#5282)
omit fcfe36fa2c refactor: log server error during object store retries
(#5294)
omit db81108366 Prepare arrow 50.0.0 (#5291)
omit ca14f6f6d0 Update parquet object_store dependency to 0.9.0 (#5290)
omit e831d5c8c3 Update proc-macro2 requirement from =1.0.75 to =1.0.76
(#5289)
omit a61e824abd Enable JS tests again (#5287)
omit cb16050ec7 Prepare object_store 0.9.0 (#5224) (#5285)
omit 2e86650529 Print container logs in CI (#5286)
omit f7101ec3a2 Support S3 Express One Zone (#5268)
omit 2f5dcdffb0 object_store: full HTTP range support (#5222)
omit cf61bb89d8 DynamoDB ConditionalPut (#5247)
omit 2f383e764a feat(object_store): Azure url signing (#5259)
omit a9470d3eb0 Update proc-macro2 requirement from =1.0.74 to =1.0.75
(#5279)
omit 8fda518891 Retry Safe/Read-Only Requests on Timeout (#5278)
omit 5a67f1f1e8 Fix ObjectMeta::size for range requests (#5272) (#5276)
omit 2460c88a33 docs(object_store): Mention `with_allow_http` in docs of
`with_endpoint` (#5275)
omit b2b4e7a44f Update proc-macro2 requirement from =1.0.73 to =1.0.74
(#5271)
omit dece26367a Update proc-macro2 requirement from =1.0.71 to =1.0.73
(#5265)
omit e6395e21d9 Make regexp_match take scalar pattern and flag (#5245)
omit b00f4e09ab Update docs for datatypes (#5260)
omit c57857031f Default AWS region to us-east-1 (#5211) (#5244)
omit 9863486299 Add IPC FileDecoder (#5249)
omit fad103a80a Further Clippy Lints and Temporarily disable JS integration
tests (#5258)
omit eeaff99113 Don't suppress errors in ArrowArrayStreamReader (#5256)
omit cbb2f3449a Clippy lints 1.75 (#5257)
omit 31b865ebcb use from_ffi_and_data_type instead (#5248)
omit 3cd6da0a6b Add `Field::new_list_field` and improve
`DataType::new_list` docs (#4627)
omit 844b8519bf Implement `copy_if_not_exist` for `AmazonS3` using DynamoDB
(#4880) (#4918)
omit add8f567c8 Add FileReaderBuilder for arrow-ipc to allow reading large
no. of column files (#5136)
omit ff951b42f5 ci: Fail Miri CI on first failure (#5243)
omit 0eb8a08f88 Remove 'unwrap' from Result (#5241)
omit 3b3bd604bb update (#5239)
omit a9d219bb49 Remove deprecated try_with_option methods (#5237)
omit c6f8bb5b91 Document default value of InstanceCredentialProvider (#5188)
omit 72c9505bed Improve regexp kernels performance by avoiding cloning
Regex (#5235)
omit 859edc6173 Update proc-macro2 requirement from =1.0.70 to =1.0.71
(#5231)
omit 9d3a80042e make with_schema's error more readable (#5228)
omit 41fda0bb98 Minor: Improve comments and errors for ArrowPredicate
(#5230)
omit 0a4eb81698 Bump actions/upload-pages-artifact from 2 to 3 (#5229)
omit 1fa7afdb84 Use `try_new` when casting between structs to propagate
error (#5226)
omit fc266f94d8 feat(cast): support cast between struct (#5221)
omit c0b805597c Fix inferring object after field was null. (#5216)
omit 9e060dc6c6 Add `entries` to `MapBuilder` to return both key and value
array builders (#5218)
omit 9a1e8b572d Use Vec in ColumnReader (#5177) (#5193)
omit b8ca86a8e3 Support MapBuilder in make_builder (#5210)
omit 8b816d31f9 Revert "Bump actions/download-artifact from 3 to 4 (#5212)"
(#5213)
omit 6d5d9007d9 Bump actions/download-artifact from 3 to 4 (#5212)
omit 802ed428f8 Support quote and escape in Csv WriterBuilder (#5196)
omit bc39f25e0f refactor: simplify cast_string_to_interval (#5195)
omit 7fd2d4248f impl `From<BufferBuilder<T>>` for `ScalarBuffer<T>` (#5201)
omit 2a84e85de1 feat(object_store): use http1 by default (#5204)
omit 8aa55ddc1c impl `From<BufferBuilder<T>>` for `Buffer` (#5202)
omit 15535457ff impl `From<OffsetBuffer<T>>` for `ScalarBuffer<T>` (#5203)
omit 9630aaf55b Blockwise IO in IPC FileReader (#5153) (#5179)
omit c5a9953f2a Clarify interval comparison behavior with documentation and
tests (#5192)
omit 7e289134a8 Simplify parquet statistics generation (#5183)
omit 2a213bc36f Remove ScalarBuffer from parquet (#1849) (#5177) (#5178)
omit a43e82c630 Add `BooleanArray::into_parts` method (#5191)
omit c821ae7287 Fix deprecated note for `Buffer::from_raw_parts` (#5190)
omit 93a28a5457 Fixed issue where timestamp parser incorrectly accepted
characters after 'Z (#5189)
omit d41e90e31d Remove SIMD Feature (#5184)
omit b06ab13fa2 Use Total Ordering for Aggregates and Refactor for Better
Auto-Vectorization (#5100)
omit 490c080e5b Parquet: Ensure page statistics are written only when
conifgured from the Arrow Writer (#5181)
omit 1534cc196c Bump actions/setup-python from 4 to 5 (#5175)
omit 2923243d1c Labeller attempt 2 (#5174)
omit 298ddfdbc4 ci: Add cargo audit CI action (#5160)
omit 95f03ac945 improve: make RunArray displayable (#5166)
omit 32b68f7207 Add LargeListBuilder to make_builder (#5171)
omit ea3aca1d6f fix: Changed labeler.yml to latest format (#5172)
omit f4bad6871f fix: ensure take_fixed_size_list can handle null indices
(#5170)
omit 46bbd7debe Removing redundant as casts (#5168)
omit f352cdc532 Bump actions/labeler from 4.3.0 to 5.0.0 (#5167)
omit cb338c94a9 Update rustls-pemfile requirement from 1.0 to 2.0 in
/object_store (#5155)
omit a36bf7ade4 Parquet: clear metadata and project fields of
ParquetRecordBatchStream::schema (#5135)
omit f16d2f516d Parquet: write column_orders in FileMetaData (#5158)
omit b8d3f3380c Parquet: don't truncate f16/decimal min/max stats (#5154)
omit 6b905fe232 Removing ahash (#5156)
omit 9efaf06247 Adding `is_null` datatype shortcut method (#5157)
omit 5788c69958 object_store: fix failing doctest with default features
(#5161)
omit f621d28db5 Parquet: omit min/max for interval columns when writing
stats (#5147)
omit 6d4b8bbad9 Support nested schema projection (#5148) (#5149)
omit 8867a1f433 Allow 403 for overwrite prevention (#5134)
omit cfdb505c97 Deprecate Fields::remove Schema::remove (#5144)
omit ef6932f31e JSON: write struct array nulls as null (#5133)
omit c161456158 Support casting of Float16 with other numeric types (#5139)
omit 093a10e462 Parquet: Make `MetadataLoader` public (#5137)
omit a361ce13c0 Fix 'ColumnPath not found' error reading Parquet files with
nested REPEATED fields (#5102)
omit 58c80e6d7d Update localstack to 3.0.1 (#5028)
omit 34a816d4fc Parquet: derive boundary order when writing (#5110)
omit 8a0b5cb252 Fix negative decimal string (#5128)
omit e26fa4f395 Update proc-macro2 requirement from =1.0.69 to =1.0.70
(#5131)
omit 4b7405ccc4 Improve cast docs (#5114)
omit 435b53ded3 Cast from numeric/timestamp to timestamp/numeric (#5123)
omit d5a6cf4e5a Fix ObjectStore.LocalFileSystem.put_opts for blobfuse
(#5094)
omit 409bb81a69 [fix #5044] Support converting 'yyyymmdd' format to date
(#5078)
omit ef1cc38bbf Cleanup list casting and support nested lists (#5113)
(#5124)
omit e1bafdf703 Remove empty source file (#5119)
omit 200e8c8008 Implementing `ArrayBuilder` for `Box<dyn ArrayBuilder>`
(#5109)
omit 410fcbba51 Update prost-build requirement from =0.12.2 to =0.12.3
(#5112)
omit 06a3a2e467 Fix integration tests (#5111)
omit df69ef57d0 fix: coerce_primitive for serde decoded data (#5101)
omit fbbb61d942 Allow writing null valued keys in JSON (#5065)
omit b7248497a4 Improve C Data Interface and Add Integration Testing
Entrypoints (#5080)
omit 4d141a34cb Allow 'zip' compute function to operate on Scalar arrays
(#5086)
omit 6815bf153d Expand parquet crate overview doc (#5093)
omit 61da64a055 Extend aggregation benchmarks (#5096)
omit dc75a280b4 feat: cast (Large)List to FixedSizeList (#5081)
omit bfe396e3fc Ensure arrays passed to MutableArrayData have same type
(#5091) (#5092)
omit 481652a4f8 Fix latest clippy lints (#5090)
omit 873d277af4 Update prost-build requirement from =0.12.1 to =0.12.2
(#5088)
omit a3687a7506 Add FFI from_raw (#5082)
omit aff86e704d Implement Arrow PyCapsule Interface (#5070)
omit 4b9d789885 Update itertools requirement from 0.11.0 to 0.12.0 in
/object_store (#5077)
omit 7fa78b79b5 Support multiple GZip members in parquet page (#4951)
omit 7941577d41 Enable truncation of binary statistics columns (#5076)
omit 7ba36b0123 Parquet: read/write f16 for Arrow (#5003)
omit 924b6e9d0e IPC writer truncated sliced list/map values (#5071)
omit 31b5724332 Add a PR under "Breaking changes" in the object_store 0.8.0
changelog (#5063)
omit f53f284b3e docs: re-order `object_store` intro (#5058)
omit 0cb30bb51e refactor: change `object_store` CA handling (#5056)
omit 1635f5bfdd Remove ByteBufferPtr and replace with Bytes (#5055)
omit 747dcbf067 Update parquet encoding docs (#5053)
omit 1d1693777e Prepare arrow 49.0.0 (#5054)
omit ffeda62fc9 Parquet f32/f64 handle signed zeros in statistics (#5048)
omit 20f10dcd21 Fix RowSelection::intersection (#5036) (#5041)
omit 8c20c98c1e Cast from integer/timestamp to timestamp/integer (#5040)
omit 91acfb07a9 Fix serialization of large integers (#5038) (#5042)
omit dcbe546529 Update object_store 0.8.0 (#5043)
omit 7705acad84 Support casting from integer to binary (#5015)
omit a447bcf0ee doc: update comment on sort_to_indices to reflect that IEE
754 totalOrder is used (#5033)
omit 1807abace4 chore: Update docs to refer to non deprecated function
(`partition`) (#5027)
omit e4689e6de7 Fix invalid_path test (#5026)
omit 829708d491 Verify object_store with all features (#5024)
omit ad211fe324 Prepare object_store 0.8.0 (#5010) (#5023)
omit ab53d2dd5f Support onelake fabric paths in parse_url (#5000) (#5002)
omit 7281a0c167 Relax path safety (#5019) (#5020)
omit 78735002d9 ObjectStore: make error msg thrown from retry more detailed
(#5012)
omit ec788e15a9 Decode URL paths (#5017) (#5018)
omit 94fe6bb4b0 Remove ObjectStore::append (#5016)
omit 65f7be8560 Return row count when inferring schema from JSON (#5008)
omit be093cb442 Simplify datetime conversion (#5006)
omit cc23cacd12 Improve object_store docs (#4978)
omit d9aaa437ca Add `RecordReader` trait and proc macro to implement it for
a struct (#4773)
omit 890823b6bc feat(flight-sql): Allow custom commands in get-flight-info
(#4997)
omit 11b2f5fecc Object tagging (#4754) (#4999)
omit e4bb1e9ec0 Support list_with_offset for GCS (#4993)
omit e3cce56979 Conditional Put (#4879) (#4984)
omit 5601b7a8c8 Add `Field::remove()`, `Schema::remove()`, and
`RecordBatch::remove_column()` APIs (#4959)
omit cd069ea28b Update tracing-log requirement from 0.1 to 0.2 (#4998)
omit b07dabea87 Use new integration scripts (#4963) (#4988)
omit 3dbe45b658 [MINOR] No need to jump to web pages (#4994)
omit 6b4fd2f222 Don't panic on invalid Azure access key (#4972) (#4974)
omit 1708b0bae0 Support metadata in SchemaBuilder (#4987)
omit 570c91eb06 Support bucket name with `.` when parsing GCS URL (#4991)
(#4992)
omit e78d1409c2 Add MultiPartStore (#4961) (#4608) (#4971)
omit a6a512f387 Fix pre commit (#4990)
omit a33d42f591 Increase default timeout to 30 seconds (#4989)
omit c90aff3cc9 feat: support schema change by idx and reverse (#4985)
omit 4748b6187a Bump actions/setup-node from 3 to 4 (#4982)
omit 2f3379559f Update quick-xml requirement from 0.30.0 to 0.31.0 in
/object_store (#4983)
omit e79b3bcd70 Support ImdsManagedIdentityProvider in Azure Functions
(#4976) (#4977)
omit 14d6c8df12 Add arrow_cast::base64 and document usage in arrow_json
(#4975)
omit 03d0505fc8 Add SchemaBuilder::remove (#4952) (#4964)
omit f4a2a88a65 Add ObjectMeta::version and GetOptions::version (#4925)
(#4935)
omit 0b9105d704 Temporarily Disable Java Integration Tests (#4957)
omit 7e134f4d27 Use rustfmt default line width (#4960)
omit f597d3a687 Split gcp Module (#4956)
omit efd4d1900a Add module links in docs root (#4955)
omit a425e7e7fa Split azure Module (#4954)
omit 62ca5f37d1 Split aws Module (#4953)
omit 4cca029144 Return `PutResult` with an ETag from ObjectStore::put
(#4934) (#4944)
omit 51ac6fec87 Respect ARROW_TEST_DATA in apache-avro tests (#4950)
omit 6e332b8f57 Prepare arrow 48.0.0 (#4948)
omit 4964d84431 Add `ReaderBuilder::with_header` for csv reader (#4949)
omit a94ccff9de feat: support parsing for parquet writer option (#4938)
omit 952cd2efcb Expose SubstraitPlan structure in arrow_flight::sql (#4932)
(#4933)
omit 511ac44cf9 Fix object_store docs (#4947)
omit fa7a61a4b0 Remove Nested async and Fallibility from ObjectStore::list
(#4930)
omit d4d11fe7a4 Assume Pages Delimit Records When Offset Index Loaded
(#4921) (#4943)
omit ab87abdd69 Generate `ETag`s for `InMemory` and `LocalFileSystem`
(#4879) (#4922)
omit 95b015cf7b Evaluate null_regex for string type in csv (now such values
will be parsed as `Null` rather than `""`) (#4942)
omit ce2a958055 Add `FileWriter` schema getter (#4940)
omit 69c937565f Support service_account in ApplicationDefaultCredentials
and Use SelfSignedJwt (#4926)
omit 4a23ab9333 Update pyo3 requirement from 0.19 to 0.20 (#4941)
omit 31bc84c91e Default connection and request timeouts of 5 seconds (#4928)
omit 57cd0945db Allow opting out of request signing (#4927) (#4929)
omit bb8e42f639 Add GetOptions::head (#4931)
omit 90bc5ec96b Support Arbitrary JSON values in JSON Reader (#4905) (#4911)
omit 6e49f31e6f feat: add method for async read bloom filter (#4917)
omit 0503d65b36 Update zstd requirement from 0.12.0 to 0.13.0 (#4923)
omit 11205a891c Add AWS presigned URL support (#4876)
omit d5a655d21f Add option to `FlightDataEncoder` to always resend batch
dictionaries (#4896)
omit 556c5ff819 Cleanup CSV WriterBuilder, Default to AutoSI Second
Precision (#4735) (#4909)
omit d83008bc03 Cleanup `object_store::retry` client error handling (#4915)
omit 181cb3d66e Minor: Clarify rationale for FlightDataEncoder API, add
examples (#4916)
omit 4aabd2c5de feat: document & streamline flight SQL CLI (#4912)
omit d3e1302a69 Update regex-syntax requirement from 0.7.1 to 0.8.0 (#4914)
omit 538a7bfed5 Specialize Thrift Decoding (~40% Faster) (#4891) (#4892)
omit c6387c1ffc fix(csv)!: infer null for empty column. (#4910)
omit 16f59056a4 feat: log headers/trailers in flight CLI (+ minor fixes)
(#4898)
omit 2af51631e4 Allow merge of Null to any datatype. (#4902)
omit ed58e767d7 chore: add csv example (#4904)
omit c7911286cc Update proc-macro2 requirement from =1.0.68 to =1.0.69
(#4907)
omit 431df704d3 Update proc-macro2 requirement from =1.0.67 to =1.0.68
(#4900)
omit 2c4bc5449f Upgrade to Rust 1.73.0 (#4899)
omit 2214fda3a9 fix(arrow-json)!: include null fields in schema inference
with a type of Null (#4894)
omit 208da03979 mark OnCloseRowGroup Send (#4893)
omit 97a82c01d4 Fix integration tests (#4889)
omit f0455d12dd Support Parsing Avro File Headers (#4888)
omit 4320a753be Implement Take for UnionArray (#4883)
omit 39e4d94364 Update ring requirement from 0.16 to 0.17 in /object_store
(#4887)
omit d941ff1c37 Support parquet bloom filter length (#4885)
omit 3b0ede4fbb Replace lz4 with lz4_flex Allowing Compilation for WASM
(#4884)
omit 8c495b6002 parquet: Read field IDs from Parquet Schema (#4878)
omit 3ac0053772 Support Encoding Parquet Columns in Parallel (#4871)
omit 0e04757d90 Update tonic-build requirement from =0.10.1 to =0.10.2
(#4881)
omit 471f6dd291 Flush in creates_dir_if_not_present_append (#4872) (#4874)
omit 284556e55a feat: improve flight CLI error handling (#4873)
omit 62bb64cf9f Check precision overflow for casting floating to decimal
(#4866)
omit 786760a8f2 Flush in multiple_append test (#4868) (#4869)
omit b600e202f4 Enable new integration tests (#4828) (#4862)
omit 8a07be3a51 Make align_buffers as public API (#4863)
omit 4ef7917bd5 Prepare object_store 0.7.1 (#4860)
omit fbd9008d31 Faster Serde Integration (~80% faster) (#4861)
omit 2c9e2e9a95 Add ObjectStore BufReader (#4762) (#4857)
omit 74e2c5cd23 Make ArrowRowGroupWriter Public and
SerializedRowGroupWriter Send (#4850)
omit 7e7ac153c6 fix: add missing precision overflow checking for
`cast_string_to_decimal` (#4830)
omit b35511d293 Allow overriding azure endpoint (#4853) (#4854)
omit 72a2dab54a Allow Constructing Non-Empty StructArray with no Fields
(#4842) (#4845)
omit 6d5d7e36ef Minor: Improve object_store docs.rs landing page (#4849)
omit 431be3facb Perform HEAD request for HttpStore::head (#4837)
omit 1de21d29ad fix: make_primitive_scalar bug (#4852)
omit 8465ed4729 Update tonic-build requirement from =0.10.0 to =0.10.1
(#4846)
omit f9cd26f7bc Refine documentation to `Array::is_null` (#4838)
omit 407e575f41 Error if Remote Ignores HTTP Range Header (#4841)
omit a03ce564f1 fix: object store http header last modified (#4834)
omit 1d6feeaceb Prepare arrow 47.0.0 (#4827)
omit e214d6b612 Respect FormatOption::nulls for NullArray (#4836)
omit f7464bc056 Fix merge_dictionary_values in selection kernels (#4833)
omit 47e8a8ddb3 Fix flight sql do put handling, add bind parameter support
to FlightSQL cli client (#4797)
omit 33b881dc18 Fix like scalar null (#4832)
omit 175c776593 Fix typo in docstring (#4826)
omit 95ee5d3c57 feat: FixedSizeBinaryArray::value_data return reference
(#4821)
omit a6dffca082 Update prost (#4825)
omit 7b785310c0 Update chrono pin (#4824)
omit 9cb4a75f18 Stateless Row Encoding / Don't Preserve Dictionaries in
`RowConverter` (#4811) (#4819)
omit b64e362f04 Adaptive Row Block Size (#4812) (#4818)
omit 80b0888fa1 fix: export record batch through stream (#4806)
omit d960379f3d Do not check schema for equality in `concat_batches` (#4815)
omit d2be733f44 More chrono deprecations (#4822)
omit 7355e8392d Update proc-macro2 requirement from =1.0.66 to =1.0.67
(#4816)
omit 229bf8b614 ObjectStore Wasm32 Fixes (#4775) (#4776) (#4796)
omit 2075cd125d csv: Add option to specify custom null values (#4795)
omit 77455d48cd fix: entries field is non-nullable (#4808)
omit b4997bc35c Improved csv_reader benchmarks with smaller integers (#4803)
omit 878217b9e3 Add docstring and example to `Scalar` (#4793)
omit 1e46f8f08a Best effort cleanup of staged upload files (#4778) (#4792)
omit 15dde87d4e Re-export array crate root (#4780) (#4779) (#4791)
omit dd0c4ab980 Relaxing type bounds on coalesce_ranges and collect_bytes
(#4787)
omit 2fe71ca52d Allow custom tree builder for parquet::record::RowIter
(#4783)
omit 83390ed13a Fix DictionaryArray::normalized_keys (#4788) (#4789)
omit 6fdbc263b0 Make coalesce_ranges and collect_bytes available to the
users (#4784)
omit 0847c9aa8b Update object_store chrono deprecations (#4786)
omit 65edbb1702 Re-encode dictionaries in selection kernels (#3558)
omit db5314c5c2 Fix List Sorting, Revert Removal of Rank Kernels (#4747)
omit b66c57c4b4 Bump actions/checkout from 3 to 4 (#4767)
omit 587250c8e0 fix: avoid panic if offset index not exists. (#4761)
omit 611b129e39 Remove unused dyn_cmp_dict feature (#4766)
omit 6e28c03ff6 Make ObjectStore::copy Atomic and Automatically Create
Parent Directories (#4758) (#4760) (#4759)
omit 4927c1ef1c Implement PyArrowType for `Box<dyn RecordBatchReader +
Send>` (#4751)
omit eeba0a3792 Relax constraints on PyArrowType (#4757)
omit 735f48d1f2 return error (#4752)
omit 32e973d7fd Chrono deprecations (#4748)
omit cb793a5d54 Update nix requirement from 0.26.1 to 0.27.1 in
/object_store (#4744)
omit 4888dbf1d9 Clear row buffer before reuse (#4742)
omit 221f5d2fe9 Datum based like kernels (#4595) (#4732)
omit 4533271b4b feat: expose DoGet response headers & trailers (#4727)
omit 2fe9ef11e5 Cleanup length and bit_length kernels (#4718)
omit f332e23b3d chore: fix libpython in CI (#4738)
omit f2ba18b89a Add `with_proxy_ca_certificate` and `with_proxy_excludes`
(#4714)
omit dfb1ea2469 Fix new clippy lints (#4734)
omit d9381c66c2 Add `IpcError` variant to replace some uses of
`IoError`that don't have underlying `std::io::Error` (#4726)
omit 90449ffb2e Prepare Arrow 46.0.0 (#4720)
omit bce0b418b6 Add distinct kernels (#960) (#4438) (#4716)
omit 23db567d05 Cleanup redundant link targets (#4719)
omit 2c487d0eba Parquet doc tweaks (#4680)
omit 1afc7c32bf Update parquet object_store 0.7 (#4715)
omit 8bbb5c1877 Datum based comparison kernels (#4596) (#4701)
omit b810e8f207 Support Field ID in ArrowWriter (#4702) (#4710)
omit a19ff2bacd Tweak docs (#4711)
omit f0200dbec1 Add AnyDictionary Abstraction and Take ArrayRef in
DictionaryArray::with_values (#4707)
omit 31c81c5fd9 Fix nightly tests (#4709)
omit 810291179f Take kernel dyn Array (#4705)
omit 44b644d47c Cleanup parquet type builders (#4706)
omit d8381943cc Improve ergonomics of Scalar (#4704)
omit fc6f528705 Remove rank kernels (#4703)
omit b581ef51b0 Add safe zero-copy converion from bytes::Bytes (#4254)
(#4260)
omit cbff4d818d Update object_store Dependencies and Configure Dependabot
(#4700)
omit 197c425285 Validate ArrayData Buffer Alignment and Automatically Align
IPC buffers (#4255) (#4681)
omit 77fe72ddd4 Prepare object_store 0.7.0 (#4699)
omit abd80ae014 Support references in i256 arithmetic ops (#4692)
omit 979a070dc8 Logical Nullability (#4691)
omit 820e40a278 Add range and ObjectMeta to GetResult (#4352) (#4495)
(#4677)
omit cd0e5513c9 Add AzureConfigKey::ContainerName (#4629) (#4686)
omit ec273e76db Cleanup DynComparator (#2654) (#4687)
omit 230612eedc Add Support for Microsoft Fabric / OneLake (#4573)
omit 65c24d6cee Faster stream_get test (#4685)
omit df28eafb08 Fix object_store docs and Add CI job (#4684)
omit f9f6eeae55 Check object_store format in CI (#4679)
omit 4200bedd61 Minor: improve object_store docs.rs library landing page
(#4682)
omit c618438924 Faster i256 Division (2-100x) (#4663) (#4672)
omit ea19ce86d6 Separate metadata fetch from `ArrowReaderBuilder`
construction (#4674) (#4676)
omit a41248ad8d Fix equality of nested nullable FixedSizeBinary (#4637)
(#4670)
omit 2139fa5317 cleanup some assert() with error propagation (#4673)
omit cefb8c1bbb Use ArrayFormatter in cast kernel (#4668)
omit 5023ea8438 Fix MSRV CI (#4671)
omit 92d8ee682f More intuitive bool-to-string casting (#4666)
omit 946e17d792 Minor: Improve API docs for FlightSQL metadata builders
(#4667)
omit 0ded0ce1be Account for child `Bucket` size in OrderPreservingInterner
(#4646)
omit 97eba43b01 enhancement: batches_to_flight_data require a schema ref as
param. (#4665)
omit eb8edc4122 bug: Add some missing field in row group metadata: ordinal,
total co… (#4636)
omit 696cbdbb72 Support `concat_batches` for 0 columns (#4662)
omit 50f161eafb fix ownership of c stream error (#4660)
omit f16ceedf98 minor: move comment to the correct location (#4655)
omit ab8d918cd5 Fix illustration for dict encoding (#4657)
omit 1f466dc62c Support copy_if_not_exists for Cloudflare R2 (#4190) (#4239)
omit 3b24ca1e62 Update packed_simd and run miri tests on simd code (#4654)
omit bcc04a40fd impl `From<Vec<T>>` for `BufferBuilder` and `MutableBuffer`
(#4650)
omit 6fd50329b1 Filter record batch with 0 columns (#4648)
omit 0aa49fc08b Pin latest nightly (#4652)
omit 273dcc18a8 refactor: from_thrift avoid panic (#4642)
omit b15838cfc1 Implement `Default`,`Extend` and `FromIterator` for
`BufferBuilder` (#4638)
omit a81da6c89c Cleanup sort (#4613)
omit 841a6a981d Vectorized lexicographical_partition_ranges (~80% faster)
(#4575)
omit c2b0aa5fae fix(select): handle `NullArray` in `nullif` (#4635)
omit 00be18dda5 fix: compute_dictionary_mapping use wrong offsetSize (#4625)
omit 08e4692b2e Add more docs and examples for ListArray and OffsetsBuffer
(#4607)
omit 0eb9049ff7 allow zero sized empty fixed (#4626)
omit 30a5b8d83f Minor: improve docs and add example for
lexicographical_partition_ranges (#4615)
omit 8a9dd842fc Use Config System for Object Store Integration Tests (#4628)
omit 70094a5eb3 expand docs for FixedSizeListArray (#4622)
omit 399a3d1bfd Move `BufferBuilder` to `arrow-buffer` (#4630)
omit 74889255f1 impl `FromIterator` for `MutableBuffer` (#4624)
omit de5aa483a5 chore: add datatype new_list (#4561)
omit a016654cfb impl `Default` for `arrow_buffer::buffer::MutableBuffer`
(#4619)
omit d5b713ada2 fix(buffer): panic on end index overflow in
`MutableBuffer::set_null_bits` (#4621)
omit 5724cf21c2 Use contains_nulls in ArrayData equality of byte arrays
(#4582)
omit ae0d82ccb8 Test Disabled Page Statistics (#4587) (#4589)
omit a5d9118c7b Cleanup ArrayData::buffers (#4583)
omit a2e2fa762e Don't Reorder Nulls in sort_to_indices (#4545) (#4603)
omit 86c3fdba21 Add rank function (#4606) (#4609)
omit 149a3f8c9f Remove deprecated arithmetic kernels (#4481) (#4594)
omit caa37fed52 Simplify dictionary sort (#4605)
omit a5519d6ac2 Consolidate sort benchmarks (#4604)
omit c663d88327 fix(data): map type ID to child index before indexing a
union child array (#4598)
omit b597a206a5 Use u32 metadata_len when parsing footer of parquet. (#4599)
omit d1fb2c6a0a fix(data): create child arrays of correct length when
building a sparse union null array (#4601)
omit 95683439fa Remove deprecated limit kernel (#4597)
omit 16744e5ac0 Prepare arrow 45 (#4590)
omit 2950d8b8fe Fix pretty hours duration display (#4591)
omit fb926a4ff9 Configurable Duration Display (#4581)
omit 1e0f02ffc0 refactor: simplify hour_dyn() with time_fraction_dyn()
(#4588)
omit 2adb64d113 Move from_iter_values to GenericByteArray (#4586)
omit a31005605e Mark GenericByteArray::new_unchecked unsafe (#4584)
omit 18385e5634 Fix take_bytes Null and Overflow Handling (#4576) (#4579)
omit 8c85d34869 Write Page Offset Index For All-Nan Pages (#4567)
omit fba19b0142 Cleanup multipart upload trait (#4572)
omit b27dc7e741 Move chrono-tz arithmetic tests to integration (#4571)
omit 96886303df Fix interval to duration casting (#4553) (#4562)
omit bff6155d38 Make object_store::multipart public (#4570)
omit 0b75e8fbb1 Fix timezoned timestamp arithmetic (#4546)
omit dfb642809e support NullArray un arith/boolean kernel (#4566)
omit 918959b4ac Remove Sync from arrow-flight example (#4564)
omit d9719d1f2d Fix field docs (#4563)
omit fc21cfbb9c Clarify GenericColumnReader::read_records (#4540)
omit 92e1e9ad80 docs: fix wrong parameter name (#4559)
omit 48cd0cfaae Fix FixedSizeListBuilder capacity (#4549) (#4552)
omit 6ee30a57e9 fix multiline likes (#4548)
omit 6e4d7008db docs: fix wrong inline code snippet in parquet document
(#4550)
omit 4e8e1b3890 Minor: Make arrow blog link about row format more
discoverable (#4551)
omit 72cafde586 Provide default `is_empty` impl for
`arrow::array::ArrayBuilder` (#4543)
omit 730941f09a feat: Support `FixedSizedListArray` for `length` kernel
(#4520)
omit 47f288c166 Initial loongarch port (#4538)
omit 276d8c5770 Add RowConverter::append (#4479) (#4541)
omit b71c0d9527 Update proc-macro2 requirement from =1.0.64 to =1.0.66
(#4537)
omit be8bd13aed add a validity slice access for boolean array builders
(#4536)
omit 13fdfa472b use new num version instead of explicit num-complex
dependency (#4532)
omit 8f44472e5c Prepare arrow 44.0.0 (#4528)
omit 6909db8b76 Use Parser for cast kernel (#4512) (#4513)
omit f951c8f6e3 Fix AsyncArrowWriter flush for large buffer sizes (#4526)
(#4527)
omit edeb7bbd92 Handle empty S3 payloads (#4514) (#4518)
omit 43712ac843 fix: clippy problem (#4521)
omit c0444642b4 object_store: Export `ClientConfigKey` and add
`HttpBuilder::with_config` (#4516)
omit e169355220 Cleanup cast_primitive_to_list (#4511)
omit 8bcb3fc4ec Support Date - Date (#4383) (#4504)
omit 6e0faaf24d Bump actions/upload-pages-artifact from 1 to 2 (#4508)
omit 8da2f97bfd object_store: Implement `ObjectStore` for `Arc` (#4502)
omit 6bbf2f0ce3 Add Datum Arithmetic tests, Fix Interval Substraction
(#4480) (#4493)
omit 6f2231353f fix incorrect buffer size limiting in parquet async writer
(#4478)
omit 72b2ec53aa ci: verify MSRV on CI (#4490)
omit 29d4ae3c32 Bump actions/labeler from 4.2.0 to 4.3.0 (#4501)
omit 20af94b0ac Add negate kernels (#4488) (#4494)
omit e5378be5cf object_store/InMemory: Add `fork()` fn and deprecate
`clone()` fn (#4499)
omit 1f56959cd8 Update proc-macro2 requirement from =1.0.63 to =1.0.64
(#4500)
omit 66aab5a622 add num-complex requirement (#4482)
omit 9649d08149 support FixedSizeBinary types in
eq_dyn_binary_scalar/neq_dyn_binary_scalar (#4492)
omit ee2c292360 Add Datum based arithmetic kernels (#3999) (#4465)
omit 08a57e9b3b Add default implementations to the FlightSqlService trait
(#4485)
omit aac3aa9939 Improve in-place primitive sorts by 13-67% (#4473)
omit 9ee36b216c Add Scalar/Datum abstraction (#1047) (#4393)
omit 5ea197dd9d feat: support RecordBatchReader on boxed trait objects
(#4475)
This update removed existing revisions from the reference, leaving the
reference pointing at a previous point in the repository history.
 * -- * -- N   refs/tags/43.0.0 (414235e763)
            \
             O -- O -- O   (ffd216d574)
Any revisions marked "omit" are not gone; other references still
refer to them. Any revisions marked "discard" are gone forever.
No new revisions were added by this update.
Summary of changes:
.github/dependabot.yml | 11 +-
.github/workflows/arrow.yml | 75 +-
.github/workflows/arrow_flight.yml | 6 +-
.github/workflows/audit.yml | 43 -
.github/workflows/coverage.yml | 4 +-
.github/workflows/dev.yml | 8 +-
.github/workflows/dev_pr.yml | 4 +-
.github/workflows/dev_pr/labeler.yml | 50 +-
.github/workflows/docs.yml | 14 +-
.github/workflows/integration.yml | 75 +-
.github/workflows/miri.sh | 8 +-
.github/workflows/miri.yaml | 3 +-
.github/workflows/object_store.yml | 97 +-
.github/workflows/parquet.yml | 19 +-
.github/workflows/parquet_derive.yml | 4 +-
.github/workflows/rust.yml | 44 +-
.github/workflows/take.yml | 39 -
.github_changelog_generator | 2 +-
.gitignore | 2 -
CHANGELOG-old.md | 1092 ----
CHANGELOG.md | 169 +-
CONTRIBUTING.md | 101 +-
Cargo.toml | 35 +-
LICENSE.txt | 10 +
README.md | 107 +-
arrow-arith/Cargo.toml | 5 +-
arrow-arith/src/aggregate.rs | 1301 ++---
arrow-arith/src/arithmetic.rs | 3723 ++++++++++++-
arrow-arith/src/arity.rs | 238 +-
arrow-arith/src/bitwise.rs | 60 +-
arrow-arith/src/boolean.rs | 102 +-
arrow-arith/src/lib.rs | 2 -
arrow-arith/src/numeric.rs | 1523 ------
arrow-arith/src/temporal.rs | 1502 ++----
arrow-array/Cargo.toml | 20 +-
arrow-array/benches/fixed_size_list_array.rs | 51 -
arrow-array/benches/gc_view_types.rs | 48 -
arrow-array/src/arithmetic.rs | 110 +-
arrow-array/src/array/binary_array.rs | 83 +-
arrow-array/src/array/boolean_array.rs | 121 +-
arrow-array/src/array/byte_array.rs | 64 +-
arrow-array/src/array/byte_view_array.rs | 999 ----
arrow-array/src/array/dictionary_array.rs | 247 +-
arrow-array/src/array/fixed_size_binary_array.rs | 66 +-
arrow-array/src/array/fixed_size_list_array.rs | 168 +-
arrow-array/src/array/list_array.rs | 232 +-
arrow-array/src/array/map_array.rs | 69 +-
arrow-array/src/array/mod.rs | 286 +-
arrow-array/src/array/null_array.rs | 40 +-
arrow-array/src/array/primitive_array.rs | 584 +-
arrow-array/src/array/run_array.rs | 129 +-
arrow-array/src/array/string_array.rs | 151 +-
arrow-array/src/array/struct_array.rs | 85 +-
arrow-array/src/array/union_array.rs | 447 +-
arrow-array/src/builder/boolean_builder.rs | 28 +-
arrow-array/src/builder/buffer_builder.rs | 356 +-
.../src/builder/fixed_size_binary_builder.rs | 33 +-
arrow-array/src/builder/fixed_size_list_builder.rs | 261 +-
.../src/builder/generic_byte_run_builder.rs | 28 +-
arrow-array/src/builder/generic_bytes_builder.rs | 46 +-
.../builder/generic_bytes_dictionary_builder.rs | 72 +-
.../src/builder/generic_bytes_view_builder.rs | 713 ---
arrow-array/src/builder/generic_list_builder.rs | 396 +-
arrow-array/src/builder/map_builder.rs | 160 +-
arrow-array/src/builder/mod.rs | 47 +-
arrow-array/src/builder/null_builder.rs | 22 +-
arrow-array/src/builder/primitive_builder.rs | 34 +-
.../src/builder/primitive_dictionary_builder.rs | 29 +-
arrow-array/src/builder/primitive_run_builder.rs | 5 +
arrow-array/src/builder/struct_builder.rs | 207 +-
arrow-array/src/builder/union_builder.rs | 91 +-
arrow-array/src/cast.rs | 112 +-
arrow-array/src/delta.rs | 66 +-
arrow-array/src/iterator.rs | 26 +-
arrow-array/src/lib.rs | 10 +-
arrow-array/src/numeric.rs | 633 ++-
arrow-array/src/record_batch.rs | 192 +-
arrow-array/src/run_iterator.rs | 24 +-
arrow-array/src/scalar.rs | 152 -
arrow-array/src/temporal_conversions.rs | 59 +-
arrow-array/src/timezone.rs | 16 +-
arrow-array/src/trusted_len.rs | 2 +-
arrow-array/src/types.rs | 930 ++--
arrow-avro/Cargo.toml | 56 -
arrow-avro/src/codec.rs | 315 --
arrow-avro/src/compression.rs | 83 -
arrow-avro/src/lib.rs | 40 -
arrow-avro/src/reader/block.rs | 141 -
arrow-avro/src/reader/header.rs | 345 --
arrow-avro/src/reader/mod.rs | 107 -
arrow-avro/src/reader/vlq.rs | 46 -
arrow-avro/src/schema.rs | 512 --
arrow-buffer/Cargo.toml | 5 -
arrow-buffer/benches/i256.rs | 53 +-
arrow-buffer/benches/offset.rs | 49 -
arrow-buffer/src/alloc/alignment.rs | 16 +-
arrow-buffer/src/alloc/mod.rs | 21 +-
arrow-buffer/src/arith.rs | 77 -
arrow-buffer/src/{bigint/mod.rs => bigint.rs} | 241 +-
arrow-buffer/src/bigint/div.rs | 302 --
arrow-buffer/src/buffer/boolean.rs | 39 +-
arrow-buffer/src/buffer/immutable.rs | 128 +-
arrow-buffer/src/buffer/mutable.rs | 137 +-
arrow-buffer/src/buffer/null.rs | 5 +-
arrow-buffer/src/buffer/offset.rs | 56 +-
arrow-buffer/src/buffer/ops.rs | 23 +-
arrow-buffer/src/buffer/run.rs | 6 +-
arrow-buffer/src/buffer/scalar.rs | 99 +-
arrow-buffer/src/builder/boolean.rs | 12 +-
arrow-buffer/src/builder/mod.rs | 400 +-
arrow-buffer/src/builder/null.rs | 10 +-
arrow-buffer/src/builder/offset.rs | 125 -
arrow-buffer/src/bytes.rs | 43 +-
arrow-buffer/src/interval.rs | 574 --
arrow-buffer/src/lib.rs | 14 +-
arrow-buffer/src/native.rs | 109 +-
arrow-buffer/src/util/bit_chunk_iterator.rs | 39 +-
arrow-buffer/src/util/bit_iterator.rs | 4 +-
arrow-buffer/src/util/bit_mask.rs | 38 +-
arrow-buffer/src/util/bit_util.rs | 92 +-
arrow-cast/Cargo.toml | 11 +-
arrow-cast/benches/parse_date.rs | 34 -
arrow-cast/src/base64.rs | 120 -
arrow-cast/src/{cast/mod.rs => cast.rs} | 5584 ++++++++++----------
arrow-cast/src/cast/decimal.rs | 573 --
arrow-cast/src/cast/dictionary.rs | 390 --
arrow-cast/src/cast/list.rs | 182 -
arrow-cast/src/cast/map.rs | 74 -
arrow-cast/src/cast/string.rs | 380 --
arrow-cast/src/display.rs | 544 +-
arrow-cast/src/lib.rs | 6 +-
arrow-cast/src/parse.rs | 4977 ++++++++---------
arrow-cast/src/pretty.rs | 268 +-
arrow-csv/Cargo.toml | 4 +-
arrow-csv/examples/README.md | 21 -
arrow-csv/examples/csv_calculation.rs | 56 -
arrow-csv/src/reader/mod.rs | 731 +--
arrow-csv/src/reader/records.rs | 54 +-
arrow-csv/src/writer.rs | 393 +-
arrow-csv/test/data/custom_null_test.csv | 6 -
arrow-csv/test/data/example.csv | 4 -
arrow-csv/test/data/init_null_test.csv | 6 -
arrow-csv/test/data/scientific_notation_test.csv | 19 -
arrow-csv/test/data/truncated_rows.csv | 8 -
arrow-data/src/byte_view.rs | 130 -
arrow-data/src/data/buffers.rs | 96 +
arrow-data/src/{data.rs => data/mod.rs} | 597 +--
arrow-data/src/decimal.rs | 617 +--
arrow-data/src/equal/boolean.rs | 11 +-
arrow-data/src/equal/byte_view.rs | 74 -
arrow-data/src/equal/fixed_binary.rs | 24 +-
arrow-data/src/equal/mod.rs | 71 +-
arrow-data/src/equal/primitive.rs | 22 +-
arrow-data/src/equal/run.rs | 10 +-
arrow-data/src/equal/union.rs | 5 +-
arrow-data/src/equal/utils.rs | 14 +-
arrow-data/src/equal/variable_size.rs | 34 +-
arrow-data/src/ffi.rs | 24 +-
arrow-data/src/lib.rs | 3 -
arrow-data/src/transform/list.rs | 15 +-
arrow-data/src/transform/mod.rs | 348 +-
arrow-data/src/transform/primitive.rs | 5 +-
arrow-data/src/transform/union.rs | 13 +-
arrow-data/src/transform/utils.rs | 4 +-
arrow-data/src/transform/variable_size.rs | 15 +-
arrow-flight/Cargo.toml | 31 +-
arrow-flight/README.md | 34 +-
arrow-flight/examples/flight_sql_server.rs | 144 +-
arrow-flight/examples/server.rs | 45 +-
arrow-flight/gen/Cargo.toml | 6 +-
arrow-flight/src/arrow.flight.protocol.rs | 381 +-
arrow-flight/src/bin/flight_sql_client.rs | 304 +-
arrow-flight/src/client.rs | 248 +-
arrow-flight/src/decode.rs | 84 +-
arrow-flight/src/encode.rs | 1020 +---
arrow-flight/src/error.rs | 19 +-
arrow-flight/src/lib.rs | 217 +-
arrow-flight/src/sql/arrow.flight.protocol.sql.rs | 393 +-
arrow-flight/src/sql/client.rs | 304 +-
arrow-flight/src/sql/metadata/db_schemas.rs | 21 +-
arrow-flight/src/sql/metadata/mod.rs | 6 +-
arrow-flight/src/sql/metadata/sql_info.rs | 41 +-
arrow-flight/src/sql/metadata/tables.rs | 28 +-
arrow-flight/src/sql/metadata/xdbc_info.rs | 23 +-
arrow-flight/src/sql/mod.rs | 16 +-
arrow-flight/src/sql/server.rs | 645 +--
arrow-flight/src/streams.rs | 134 -
arrow-flight/src/trailers.rs | 92 -
arrow-flight/src/utils.rs | 41 +-
arrow-flight/tests/client.rs | 388 +-
arrow-flight/tests/common/fixture.rs | 118 -
arrow-flight/tests/common/server.rs | 102 +-
arrow-flight/tests/common/trailers_layer.rs | 124 -
arrow-flight/tests/common/utils.rs | 118 -
arrow-flight/tests/encode_decode.rs | 129 +-
arrow-flight/tests/flight_sql_client.rs | 216 -
arrow-flight/tests/flight_sql_client_cli.rs | 634 ++-
arrow-integration-test/src/datatype.rs | 26 +-
arrow-integration-test/src/field.rs | 106 +-
arrow-integration-test/src/lib.rs | 227 +-
arrow-integration-test/src/schema.rs | 29 +-
arrow-integration-testing/Cargo.toml | 9 +-
arrow-integration-testing/README.md | 2 +-
.../src/bin/arrow-json-integration-test.rs | 63 +-
.../src/bin/flight-test-integration-client.rs | 3 +-
.../flight_client_scenarios/auth_basic_proto.rs | 10 +-
.../flight_client_scenarios/integration_test.rs | 59 +-
.../src/flight_client_scenarios/middleware.rs | 3 +-
.../src/flight_server_scenarios.rs | 2 -
.../flight_server_scenarios/auth_basic_proto.rs | 36 +-
.../flight_server_scenarios/integration_test.rs | 51 +-
.../src/flight_server_scenarios/middleware.rs | 16 +-
arrow-integration-testing/src/lib.rs | 232 +-
arrow-integration-testing/tests/ipc_reader.rs | 82 +-
arrow-integration-testing/tests/ipc_writer.rs | 65 +-
arrow-ipc/Cargo.toml | 10 +-
arrow-ipc/src/compression.rs | 76 +-
arrow-ipc/src/convert.rs | 157 +-
arrow-ipc/src/gen/File.rs | 47 +-
arrow-ipc/src/gen/Message.rs | 199 +-
arrow-ipc/src/gen/Schema.rs | 823 +--
arrow-ipc/src/gen/SparseTensor.rs | 244 +-
arrow-ipc/src/gen/Tensor.rs | 188 +-
arrow-ipc/src/reader.rs | 1333 ++---
arrow-ipc/src/reader/stream.rs | 318 --
arrow-ipc/src/writer.rs | 1287 ++---
arrow-json/Cargo.toml | 21 +-
arrow-json/benches/serde.rs | 62 -
arrow-json/src/lib.rs | 67 +-
arrow-json/src/reader/decimal_array.rs | 26 -
arrow-json/src/reader/list_array.rs | 5 +-
arrow-json/src/reader/map_array.rs | 5 +-
arrow-json/src/reader/mod.rs | 241 +-
arrow-json/src/reader/primitive_array.rs | 55 +-
arrow-json/src/reader/schema.rs | 228 +-
arrow-json/src/reader/serializer.rs | 102 +-
arrow-json/src/reader/string_array.rs | 36 +-
arrow-json/src/reader/struct_array.rs | 18 +-
arrow-json/src/reader/tape.rs | 138 +-
arrow-json/src/reader/timestamp_array.rs | 18 +-
arrow-json/src/writer.rs | 1379 ++---
arrow-json/src/writer/encoder.rs | 547 --
arrow-json/test/data/basic.json | 4 +-
arrow-json/test/data/nested_with_nulls.json | 4 -
arrow-ord/Cargo.toml | 7 +
arrow-ord/src/cmp.rs | 855 ---
arrow-ord/src/comparison.rs | 5014 ++++++++++++++----
arrow-ord/src/lib.rs | 3 -
arrow-ord/src/ord.rs | 933 +---
arrow-ord/src/partition.rs | 511 +-
arrow-ord/src/rank.rs | 189 -
arrow-ord/src/sort.rs | 1793 ++++---
arrow-pyarrow-integration-testing/Cargo.toml | 2 +-
arrow-pyarrow-integration-testing/README.md | 2 -
arrow-pyarrow-integration-testing/pyproject.toml | 2 +-
arrow-pyarrow-integration-testing/src/lib.rs | 56 +-
.../tests/test_sql.py | 214 +-
arrow-row/Cargo.toml | 1 +
arrow-row/src/dictionary.rs | 296 ++
arrow-row/src/fixed.rs | 135 +-
arrow-row/src/interner.rs | 430 ++
arrow-row/src/lib.rs | 872 ++-
arrow-row/src/list.rs | 136 +-
arrow-row/src/variable.rs | 249 +-
arrow-schema/src/datatype.rs | 355 +-
arrow-schema/src/datatype_parse.rs | 783 ---
arrow-schema/src/error.rs | 26 +-
arrow-schema/src/ffi.rs | 105 +-
arrow-schema/src/field.rs | 205 +-
arrow-schema/src/fields.rs | 333 +-
arrow-schema/src/lib.rs | 1 -
arrow-schema/src/schema.rs | 223 +-
arrow-select/Cargo.toml | 1 -
arrow-select/src/concat.rs | 508 +-
arrow-select/src/dictionary.rs | 331 --
arrow-select/src/filter.rs | 627 +--
arrow-select/src/interleave.rs | 185 +-
arrow-select/src/lib.rs | 1 -
arrow-select/src/nullif.rs | 48 +-
arrow-select/src/take.rs | 722 +--
arrow-select/src/zip.rs | 156 +-
arrow-string/Cargo.toml | 9 +-
arrow-string/src/concat_elements.rs | 19 +-
arrow-string/src/length.rs | 317 +-
arrow-string/src/lib.rs | 1 -
arrow-string/src/like.rs | 1783 ++++---
arrow-string/src/predicate.rs | 461 --
arrow-string/src/regexp.rs | 310 +-
arrow-string/src/substring.rs | 65 +-
arrow/CONTRIBUTING.md | 12 +
arrow/Cargo.toml | 40 +-
arrow/README.md | 19 +-
arrow/benches/aggregate_kernels.rs | 165 +-
arrow/benches/arithmetic_kernels.rs | 40 +-
arrow/benches/array_data_validate.rs | 3 +-
arrow/benches/array_from_vec.rs | 6 +-
arrow/benches/bitwise_kernel.rs | 12 +-
arrow/benches/buffer_bit_ops.rs | 12 +-
arrow/benches/buffer_create.rs | 13 +-
arrow/benches/builder.rs | 5 +-
arrow/benches/cast_kernels.rs | 74 +-
arrow/benches/comparison_kernels.rs | 326 +-
arrow/benches/concatenate_kernel.rs | 42 -
arrow/benches/csv_reader.rs | 106 +-
arrow/benches/csv_writer.rs | 7 +-
arrow/benches/decimal_validate.rs | 4 +-
arrow/benches/equal.rs | 10 +
arrow/benches/filter_kernels.rs | 73 +-
arrow/benches/interleave_kernels.rs | 31 +-
arrow/benches/json_writer.rs | 198 -
arrow/benches/lexsort.rs | 69 +-
arrow/benches/partition_kernels.rs | 45 +-
arrow/benches/primitive_run_accessor.rs | 7 +-
arrow/benches/primitive_run_take.rs | 4 +-
arrow/benches/regexp_kernels.rs | 51 -
arrow/benches/row_format.rs | 127 +-
arrow/benches/sort_kernel.rs | 248 +-
arrow/benches/string_run_builder.rs | 4 +-
arrow/benches/string_run_iterator.rs | 4 +-
arrow/benches/take_kernels.rs | 40 +-
arrow/examples/builders.rs | 13 +-
arrow/examples/dynamic_types.rs | 5 +-
arrow/examples/tensor_builder.rs | 2 +-
arrow/src/array/ffi.rs | 262 +
arrow/src/array/mod.rs | 12 +-
arrow/src/compute/kernels/limit.rs | 208 +
arrow/src/compute/{kernels.rs => kernels/mod.rs} | 6 +-
arrow/src/compute/mod.rs | 2 +-
.../common/mod.rs => arrow/src/datatypes/ffi.rs | 5 -
arrow/src/datatypes/mod.rs | 15 +-
{arrow-array => arrow}/src/ffi.rs | 784 +--
{arrow-array => arrow}/src/ffi_stream.rs | 159 +-
arrow/src/lib.rs | 48 +-
arrow/src/pyarrow.rs | 319 +-
arrow/src/tensor.rs | 31 +-
arrow/src/util/bench_util.rs | 156 +-
arrow/src/util/data_gen.rs | 490 +-
arrow/src/util/string_writer.rs | 8 +-
arrow/src/util/test_util.rs | 1 +
arrow/tests/arithmetic.rs | 190 -
arrow/tests/array_cast.rs | 93 +-
arrow/tests/array_equal.rs | 214 +-
arrow/tests/array_transform.rs | 351 +-
arrow/tests/array_validation.rs | 172 +-
arrow/tests/csv.rs | 48 +-
arrow/tests/pyarrow.rs | 4 +-
arrow/tests/timezone.rs | 4 +-
dev/release/README.md | 1 -
dev/release/update_change_log.sh | 6 +-
format/Flight.proto | 152 +-
format/FlightSql.proto | 174 +-
format/Message.fbs | 18 +-
format/Schema.fbs | 46 +-
object_store/.github_changelog_generator | 2 +-
object_store/CHANGELOG-old.md | 393 --
object_store/CHANGELOG.md | 28 +-
object_store/CONTRIBUTING.md | 87 +-
object_store/Cargo.toml | 40 +-
object_store/LICENSE.txt | 204 -
object_store/NOTICE.txt | 5 -
object_store/README.md | 7 +-
object_store/dev/release/update_change_log.sh | 5 +-
.../dev/release/verify-release-candidate.sh | 2 +-
object_store/src/attributes.rs | 248 -
object_store/src/aws/builder.rs | 1458 -----
object_store/src/aws/checksum.rs | 15 +
object_store/src/aws/client.rs | 702 +--
object_store/src/aws/credential.rs | 393 +-
object_store/src/aws/dynamo.rs | 593 ---
object_store/src/aws/mod.rs | 1750 ++++--
object_store/src/aws/precondition.rs | 252 -
object_store/src/aws/resolve.rs | 103 -
object_store/src/azure/builder.rs | 1106 ----
object_store/src/azure/client.rs | 481 +-
object_store/src/azure/credential.rs | 506 +-
object_store/src/azure/mod.rs | 1267 ++++-
object_store/src/buffered.rs | 662 ---
object_store/src/chunked.rs | 172 +-
object_store/src/client/backoff.rs | 21 +-
object_store/src/client/get.rs | 410 +-
object_store/src/client/header.rs | 88 +-
object_store/src/client/list.rs | 33 +-
.../src/client/{s3.rs => list_response.rs} | 47 +-
object_store/src/client/mock_server.rs | 92 +-
object_store/src/client/mod.rs | 245 +-
object_store/src/client/parts.rs | 48 -
object_store/src/client/retry.rs | 547 +-
object_store/src/client/token.rs | 18 +-
object_store/src/delimited.rs | 3 +-
object_store/src/gcp/builder.rs | 674 ---
object_store/src/gcp/client.rs | 663 ---
object_store/src/gcp/credential.rs | 724 +--
object_store/src/gcp/mod.rs | 1377 ++++-
object_store/src/http/client.rs | 186 +-
object_store/src/http/mod.rs | 120 +-
object_store/src/integration.rs | 1105 ----
object_store/src/lib.rs | 1980 +++----
object_store/src/limit.rs | 187 +-
object_store/src/local.rs | 1276 +++--
object_store/src/memory.rs | 563 +-
object_store/src/multipart.rs | 287 +-
object_store/src/parse.rs | 148 +-
object_store/src/path/mod.rs | 90 +-
object_store/src/path/parts.rs | 23 +-
object_store/src/payload.rs | 328 --
object_store/src/prefix.rs | 67 +-
object_store/src/signer.rs | 50 -
object_store/src/tags.rs | 60 -
object_store/src/throttle.rs | 232 +-
object_store/src/upload.rs | 341 --
object_store/src/util.rs | 242 +-
object_store/tests/get_range_file.rs | 80 +-
parquet-testing | 2 +-
parquet/CONTRIBUTING.md | 12 +-
parquet/Cargo.toml | 69 +-
parquet/README.md | 21 +-
parquet/benches/arrow_reader.rs | 739 +--
parquet/benches/arrow_statistics.rs | 269 -
parquet/benches/arrow_writer.rs | 39 +-
parquet/benches/compression.rs | 96 -
parquet/benches/encoding.rs | 105 -
parquet/benches/metadata.rs | 42 -
parquet/examples/async_read_parquet.rs | 5 +-
parquet/examples/read_with_rowgroup.rs | 17 +-
parquet/examples/write_parquet.rs | 139 -
parquet/pytest/requirements.txt | 63 +-
parquet/regen.sh | 43 -
parquet/src/arrow/array_reader/builder.rs | 28 +-
parquet/src/arrow/array_reader/byte_array.rs | 188 +-
.../arrow/array_reader/byte_array_dictionary.rs | 94 +-
parquet/src/arrow/array_reader/byte_view_array.rs | 751 ---
.../src/arrow/array_reader/fixed_len_byte_array.rs | 239 +-
parquet/src/arrow/array_reader/list_array.rs | 2 +-
parquet/src/arrow/array_reader/mod.rs | 53 +-
parquet/src/arrow/array_reader/null_array.rs | 17 +-
parquet/src/arrow/array_reader/primitive_array.rs | 154 +-
parquet/src/arrow/array_reader/test_util.rs | 11 +-
parquet/src/arrow/arrow_reader/filter.rs | 25 +-
parquet/src/arrow/arrow_reader/mod.rs | 1697 +-----
parquet/src/arrow/arrow_reader/selection.rs | 461 +-
parquet/src/arrow/arrow_reader/statistics.rs | 1599 ------
parquet/src/arrow/arrow_writer/byte_array.rs | 144 +-
parquet/src/arrow/arrow_writer/levels.rs | 610 +--
parquet/src/arrow/arrow_writer/mod.rs | 1101 +---
parquet/src/arrow/async_reader/metadata.rs | 37 +-
parquet/src/arrow/async_reader/mod.rs | 796 +--
parquet/src/arrow/async_reader/store.rs | 42 +-
parquet/src/arrow/async_writer/mod.rs | 383 +-
parquet/src/arrow/async_writer/store.rs | 157 -
parquet/src/arrow/buffer/bit_util.rs | 7 +-
parquet/src/arrow/buffer/dictionary_buffer.rs | 97 +-
parquet/src/arrow/buffer/mod.rs | 1 -
parquet/src/arrow/buffer/offset_buffer.rs | 67 +-
parquet/src/arrow/buffer/view_buffer.rs | 193 -
parquet/src/arrow/decoder/delta_byte_array.rs | 21 +-
parquet/src/arrow/decoder/dictionary_index.rs | 20 +-
parquet/src/arrow/mod.rs | 88 +-
parquet/src/arrow/record_reader/buffer.rs | 186 +-
.../src/arrow/record_reader/definition_levels.rs | 99 +-
parquet/src/arrow/record_reader/mod.rs | 119 +-
parquet/src/arrow/schema/complex.rs | 36 +-
parquet/src/arrow/schema/mod.rs | 483 +-
parquet/src/arrow/schema/primitive.rs | 30 +-
parquet/src/basic.rs | 316 +-
parquet/src/bin/parquet-fromcsv.rs | 103 +-
parquet/src/bin/parquet-index.rs | 16 +-
parquet/src/bin/parquet-layout.rs | 9 +-
parquet/src/bin/parquet-read.rs | 3 +-
parquet/src/bin/parquet-rewrite.rs | 46 +-
parquet/src/bin/parquet-rowcount.rs | 3 +-
parquet/src/bin/parquet-show-bloom-filter.rs | 4 +-
parquet/src/bloom_filter/mod.rs | 143 +-
parquet/src/column/mod.rs | 12 +-
parquet/src/column/page.rs | 65 +-
parquet/src/column/reader.rs | 377 +-
parquet/src/column/reader/decoder.rs | 202 +-
parquet/src/column/writer/encoder.rs | 122 +-
parquet/src/column/writer/mod.rs | 1729 ++----
parquet/src/compression.rs | 121 +-
parquet/src/data_type.rs | 223 +-
parquet/src/encodings/decoding.rs | 562 +-
.../decoding/byte_stream_split_decoder.rs | 256 -
.../encoding/byte_stream_split_encoder.rs | 231 -
parquet/src/encodings/encoding/dict_encoder.rs | 28 +-
parquet/src/encodings/encoding/mod.rs | 206 +-
parquet/src/encodings/levels.rs | 2 -
parquet/src/encodings/rle.rs | 99 +-
parquet/src/errors.rs | 7 -
parquet/src/file/footer.rs | 84 +-
parquet/src/file/{metadata/mod.rs => metadata.rs} | 765 +--
parquet/src/file/metadata/memory.rs | 239 -
parquet/src/file/metadata/writer.rs | 683 ---
parquet/src/file/mod.rs | 13 +-
parquet/src/file/page_encoding_stats.rs | 5 +-
parquet/src/file/page_index/index.rs | 250 +-
parquet/src/file/page_index/index_reader.rs | 82 +-
parquet/src/file/page_index/mod.rs | 1 -
parquet/src/file/page_index/offset_index.rs | 59 -
parquet/src/file/properties.rs | 360 +-
parquet/src/file/reader.rs | 49 +-
parquet/src/file/serialized_reader.rs | 287 +-
parquet/src/file/statistics.rs | 563 +-
parquet/src/file/writer.rs | 922 +---
parquet/src/format.rs | 1360 +++--
parquet/src/lib.rs | 79 +-
parquet/src/record/api.rs | 151 +-
parquet/src/record/mod.rs | 5 +-
parquet/src/record/reader.rs | 344 +-
parquet/src/record/record_reader.rs | 30 -
parquet/src/record/record_writer.rs | 4 -
parquet/src/record/triplet.rs | 79 +-
parquet/src/schema/mod.rs | 16 +-
parquet/src/schema/parser.rs | 458 +-
parquet/src/schema/printer.rs | 133 +-
parquet/src/schema/types.rs | 406 +-
parquet/src/schema/visitor.rs | 24 +-
parquet/src/thrift.rs | 282 -
parquet/src/util/bit_util.rs | 139 +-
parquet/src/util/interner.rs | 12 -
parquet/src/util/memory.rs | 149 +
parquet/src/util/mod.rs | 1 +
parquet/src/util/test_common/page_util.rs | 50 +-
parquet/src/util/test_common/rand_gen.rs | 4 +-
parquet/tests/arrow_reader/bad_data.rs | 162 -
parquet/tests/arrow_reader/bad_raw_metadata.bin | Bin 35456 -> 0 bytes
parquet/tests/arrow_reader/mod.rs | 1045 ----
parquet/tests/arrow_reader/statistics.rs | 2624 ---------
parquet/tests/arrow_writer_layout.rs | 75 +-
parquet_derive/README.md | 51 +-
parquet_derive/src/lib.rs | 116 +-
parquet_derive/src/parquet_field.rs | 480 +-
parquet_derive_test/Cargo.toml | 3 +-
parquet_derive_test/src/lib.rs | 204 +-
pre-commit.sh | 6 +-
rustfmt.toml | 6 +
testing | 2 +-
536 files changed, 43730 insertions(+), 88553 deletions(-)
delete mode 100644 .github/workflows/audit.yml
delete mode 100644 .github/workflows/take.yml
delete mode 100644 arrow-arith/src/numeric.rs
delete mode 100644 arrow-array/benches/fixed_size_list_array.rs
delete mode 100644 arrow-array/benches/gc_view_types.rs
delete mode 100644 arrow-array/src/array/byte_view_array.rs
delete mode 100644 arrow-array/src/builder/generic_bytes_view_builder.rs
delete mode 100644 arrow-array/src/scalar.rs
delete mode 100644 arrow-avro/Cargo.toml
delete mode 100644 arrow-avro/src/codec.rs
delete mode 100644 arrow-avro/src/compression.rs
delete mode 100644 arrow-avro/src/lib.rs
delete mode 100644 arrow-avro/src/reader/block.rs
delete mode 100644 arrow-avro/src/reader/header.rs
delete mode 100644 arrow-avro/src/reader/mod.rs
delete mode 100644 arrow-avro/src/reader/vlq.rs
delete mode 100644 arrow-avro/src/schema.rs
delete mode 100644 arrow-buffer/benches/offset.rs
delete mode 100644 arrow-buffer/src/arith.rs
rename arrow-buffer/src/{bigint/mod.rs => bigint.rs} (90%)
delete mode 100644 arrow-buffer/src/bigint/div.rs
delete mode 100644 arrow-buffer/src/builder/offset.rs
delete mode 100644 arrow-buffer/src/interval.rs
delete mode 100644 arrow-cast/benches/parse_date.rs
delete mode 100644 arrow-cast/src/base64.rs
rename arrow-cast/src/{cast/mod.rs => cast.rs} (66%)
delete mode 100644 arrow-cast/src/cast/decimal.rs
delete mode 100644 arrow-cast/src/cast/dictionary.rs
delete mode 100644 arrow-cast/src/cast/list.rs
delete mode 100644 arrow-cast/src/cast/map.rs
delete mode 100644 arrow-cast/src/cast/string.rs
delete mode 100644 arrow-csv/examples/README.md
delete mode 100644 arrow-csv/examples/csv_calculation.rs
delete mode 100644 arrow-csv/test/data/custom_null_test.csv
delete mode 100644 arrow-csv/test/data/example.csv
delete mode 100644 arrow-csv/test/data/init_null_test.csv
delete mode 100644 arrow-csv/test/data/scientific_notation_test.csv
delete mode 100644 arrow-csv/test/data/truncated_rows.csv
delete mode 100644 arrow-data/src/byte_view.rs
create mode 100644 arrow-data/src/data/buffers.rs
rename arrow-data/src/{data.rs => data/mod.rs} (80%)
delete mode 100644 arrow-data/src/equal/byte_view.rs
delete mode 100644 arrow-flight/src/streams.rs
delete mode 100644 arrow-flight/src/trailers.rs
delete mode 100644 arrow-flight/tests/common/fixture.rs
delete mode 100644 arrow-flight/tests/common/trailers_layer.rs
delete mode 100644 arrow-flight/tests/common/utils.rs
delete mode 100644 arrow-flight/tests/flight_sql_client.rs
delete mode 100644 arrow-ipc/src/reader/stream.rs
delete mode 100644 arrow-json/benches/serde.rs
delete mode 100644 arrow-json/src/writer/encoder.rs
delete mode 100644 arrow-json/test/data/nested_with_nulls.json
delete mode 100644 arrow-ord/src/cmp.rs
delete mode 100644 arrow-ord/src/rank.rs
create mode 100644 arrow-row/src/dictionary.rs
create mode 100644 arrow-row/src/interner.rs
delete mode 100644 arrow-schema/src/datatype_parse.rs
delete mode 100644 arrow-select/src/dictionary.rs
delete mode 100644 arrow-string/src/predicate.rs
delete mode 100644 arrow/benches/json_writer.rs
delete mode 100644 arrow/benches/regexp_kernels.rs
create mode 100644 arrow/src/array/ffi.rs
create mode 100644 arrow/src/compute/kernels/limit.rs
rename arrow/src/compute/{kernels.rs => kernels/mod.rs} (94%)
rename arrow-flight/tests/common/mod.rs => arrow/src/datatypes/ffi.rs (91%)
rename {arrow-array => arrow}/src/ffi.rs (61%)
rename {arrow-array => arrow}/src/ffi_stream.rs (76%)
delete mode 100644 arrow/tests/arithmetic.rs
delete mode 100644 object_store/LICENSE.txt
delete mode 100644 object_store/NOTICE.txt
delete mode 100644 object_store/src/attributes.rs
delete mode 100644 object_store/src/aws/builder.rs
delete mode 100644 object_store/src/aws/dynamo.rs
delete mode 100644 object_store/src/aws/precondition.rs
delete mode 100644 object_store/src/aws/resolve.rs
delete mode 100644 object_store/src/azure/builder.rs
delete mode 100644 object_store/src/buffered.rs
rename object_store/src/client/{s3.rs => list_response.rs} (67%)
delete mode 100644 object_store/src/client/parts.rs
delete mode 100644 object_store/src/gcp/builder.rs
delete mode 100644 object_store/src/gcp/client.rs
delete mode 100644 object_store/src/integration.rs
delete mode 100644 object_store/src/payload.rs
delete mode 100644 object_store/src/signer.rs
delete mode 100644 object_store/src/tags.rs
delete mode 100644 object_store/src/upload.rs
delete mode 100644 parquet/benches/arrow_statistics.rs
delete mode 100644 parquet/benches/compression.rs
delete mode 100644 parquet/benches/encoding.rs
delete mode 100644 parquet/benches/metadata.rs
delete mode 100644 parquet/examples/write_parquet.rs
delete mode 100755 parquet/regen.sh
delete mode 100644 parquet/src/arrow/array_reader/byte_view_array.rs
delete mode 100644 parquet/src/arrow/arrow_reader/statistics.rs
delete mode 100644 parquet/src/arrow/async_writer/store.rs
delete mode 100644 parquet/src/arrow/buffer/view_buffer.rs
delete mode 100644 parquet/src/encodings/decoding/byte_stream_split_decoder.rs
delete mode 100644 parquet/src/encodings/encoding/byte_stream_split_encoder.rs
rename parquet/src/file/{metadata/mod.rs => metadata.rs} (53%)
delete mode 100644 parquet/src/file/metadata/memory.rs
delete mode 100644 parquet/src/file/metadata/writer.rs
delete mode 100644 parquet/src/file/page_index/offset_index.rs
delete mode 100644 parquet/src/record/record_reader.rs
delete mode 100644 parquet/src/thrift.rs
create mode 100644 parquet/src/util/memory.rs
delete mode 100644 parquet/tests/arrow_reader/bad_data.rs
delete mode 100644 parquet/tests/arrow_reader/bad_raw_metadata.bin
delete mode 100644 parquet/tests/arrow_reader/mod.rs
delete mode 100644 parquet/tests/arrow_reader/statistics.rs