alamb commented on code in PR #8313:
URL: https://github.com/apache/arrow-rs/pull/8313#discussion_r2345281913
##########
parquet/src/file/metadata/reader.rs:
##########
@@ -1065,116 +962,17 @@ impl ParquetMetaDataReader {
///
/// [Parquet Spec]: https://github.com/apache/parquet-format#metadata
pub fn decode_metadata(buf: &[u8]) -> Result<ParquetMetaData> {
- let mut prot = TCompactSliceInputProtocol::new(buf);
-
- let t_file_metadata =
crate::format::FileMetaData::read_from_in_protocol(&mut prot)
- .map_err(|e| general_err!("Could not parse metadata: {}", e))?;
- let schema = types::from_thrift(&t_file_metadata.schema)?;
- let schema_descr = Arc::new(SchemaDescriptor::new(schema));
-
- let mut row_groups = Vec::new();
- for rg in t_file_metadata.row_groups {
-
row_groups.push(RowGroupMetaData::from_thrift(schema_descr.clone(), rg)?);
- }
- let column_orders =
- Self::parse_column_orders(t_file_metadata.column_orders,
&schema_descr)?;
-
- let key_value_metadata = t_file_metadata.key_value_metadata.map(|vkv| {
- vkv.into_iter()
- .map(|kv| KeyValue::new(kv.key, kv.value))
- .collect::<Vec<KeyValue>>()
- });
-
- let file_metadata = FileMetaData::new(
- t_file_metadata.version,
- t_file_metadata.num_rows,
- t_file_metadata.created_by,
- key_value_metadata,
- schema_descr,
- column_orders,
- );
-
- Ok(ParquetMetaData::new(file_metadata, row_groups))
- }
-
- /// create meta data from thrift encoded bytes
- pub fn decode_file_metadata(buf: &[u8]) -> Result<ParquetMetaData> {
let mut prot = ThriftCompactInputProtocol::new(buf);
Review Comment:

##########
parquet/src/file/metadata/reader.rs:
##########
@@ -960,101 +947,11 @@ impl ParquetMetaDataReader {
encrypted_footer: bool,
file_decryption_properties: Option<&FileDecryptionProperties>,
) -> Result<ParquetMetaData> {
- let mut prot = TCompactSliceInputProtocol::new(buf);
Review Comment:
FYI, I am also changing this code as part of
https://github.com/apache/arrow-rs/pull/8340 (mostly I moved where it lives).
That isn't a problem per se; I am just giving you a heads-up so we can
coordinate what to merge, when, and in what order, etc.
--
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.
To unsubscribe, e-mail: [email protected]
For queries about this service, please contact Infrastructure at:
[email protected]