This is an automated email from the ASF dual-hosted git repository.
alamb pushed a commit to branch main
in repository https://gitbox.apache.org/repos/asf/arrow-rs.git
The following commit(s) were added to refs/heads/main by this push:
new e5e66fa05c Add test for `parquet-testing/bad_data/ARROW-GH-47662.parquet` (#10077)
e5e66fa05c is described below
commit e5e66fa05ce986fa6a3f61c36c11ff6b476cb76c
Author: Ed Seidl <[email protected]>
AuthorDate: Fri Jun 5 03:06:25 2026 -0700
Add test for `parquet-testing/bad_data/ARROW-GH-47662.parquet` (#10077)
# Which issue does this PR close?
- Issue raised in #9110
# Rationale for this change
Add a "bad_data" test for the newly added file in parquet-testing.
# What changes are included in this PR?
Adds a new test so the `bad_data` unit test doesn't fail.
# Are these changes tested?
Yes
# Are there any user-facing changes?
No, only tests
---
parquet-testing | 2 +-
parquet/tests/arrow_reader/bad_data.rs | 10 ++++++++++
2 files changed, 11 insertions(+), 1 deletion(-)
diff --git a/parquet-testing b/parquet-testing
index 5a6cf84678..ffdcbb5e22 160000
--- a/parquet-testing
+++ b/parquet-testing
@@ -1 +1 @@
-Subproject commit 5a6cf84678df3af65c231109b78b86ba9bf495df
+Subproject commit ffdcbb5e22828186c7461e56dbd26a0fe3caee56
diff --git a/parquet/tests/arrow_reader/bad_data.rs b/parquet/tests/arrow_reader/bad_data.rs
index 9a110c1361..b3173138fb 100644
--- a/parquet/tests/arrow_reader/bad_data.rs
+++ b/parquet/tests/arrow_reader/bad_data.rs
@@ -33,6 +33,7 @@ static KNOWN_FILES: &[&str] = &[
"ARROW-RS-GH-6229-DICTHEADER.parquet",
"ARROW-RS-GH-6229-LEVELS.parquet",
"ARROW-GH-45185.parquet",
+ "ARROW-GH-47662.parquet",
"README.md",
];
@@ -132,6 +133,15 @@ fn test_arrow_rs_gh_45185_dict_levels() {
);
}
+#[test]
+fn test_arrow_gh_47662() {
+ let err = read_file("ARROW-GH-47662.parquet").unwrap_err();
+ assert_eq!(
+ err.to_string(),
+ "External: Parquet argument error: Parquet error: insufficient values read from column - expected: 100, got: 91"
+ );
+}
+
/// Reads the file and tries to return the total row count
/// Returns an error if the file is invalid
fn read_file(name: &str) -> Result<usize, ParquetError> {