This is an automated email from the ASF dual-hosted git repository.

alamb pushed a commit to branch main
in repository https://gitbox.apache.org/repos/asf/arrow-rs.git


The following commit(s) were added to refs/heads/main by this push:
     new e5e66fa05c Add test for `parquet-testing/bad_data/ARROW-GH-47662.parquet` (#10077)
e5e66fa05c is described below

commit e5e66fa05ce986fa6a3f61c36c11ff6b476cb76c
Author: Ed Seidl <[email protected]>
AuthorDate: Fri Jun 5 03:06:25 2026 -0700

    Add test for `parquet-testing/bad_data/ARROW-GH-47662.parquet` (#10077)
    
    # Which issue does this PR close?
    
    - Issue raised in #9110
    
    # Rationale for this change
    Add a "bad_data" test for the newly added file in parquet-testing.
    
    # What changes are included in this PR?
    
    Adds a new test so the `bad_data` unit test doesn't fail.
    
    # Are these changes tested?
    
    Yes
    
    # Are there any user-facing changes?
    
    No, only tests
---
 parquet-testing                        |  2 +-
 parquet/tests/arrow_reader/bad_data.rs | 10 ++++++++++
 2 files changed, 11 insertions(+), 1 deletion(-)

diff --git a/parquet-testing b/parquet-testing
index 5a6cf84678..ffdcbb5e22 160000
--- a/parquet-testing
+++ b/parquet-testing
@@ -1 +1 @@
-Subproject commit 5a6cf84678df3af65c231109b78b86ba9bf495df
+Subproject commit ffdcbb5e22828186c7461e56dbd26a0fe3caee56
diff --git a/parquet/tests/arrow_reader/bad_data.rs b/parquet/tests/arrow_reader/bad_data.rs
index 9a110c1361..b3173138fb 100644
--- a/parquet/tests/arrow_reader/bad_data.rs
+++ b/parquet/tests/arrow_reader/bad_data.rs
@@ -33,6 +33,7 @@ static KNOWN_FILES: &[&str] = &[
     "ARROW-RS-GH-6229-DICTHEADER.parquet",
     "ARROW-RS-GH-6229-LEVELS.parquet",
     "ARROW-GH-45185.parquet",
+    "ARROW-GH-47662.parquet",
     "README.md",
 ];
 
@@ -132,6 +133,15 @@ fn test_arrow_rs_gh_45185_dict_levels() {
     );
 }
 
+#[test]
+fn test_arrow_gh_47662() {
+    let err = read_file("ARROW-GH-47662.parquet").unwrap_err();
+    assert_eq!(
+        err.to_string(),
+        "External: Parquet argument error: Parquet error: insufficient values read from column - expected: 100, got: 91"
+    );
+}
+
 /// Reads the file and tries to return the total row count
 /// Returns an error if the file is invalid
 fn read_file(name: &str) -> Result<usize, ParquetError> {

Reply via email to