alamb commented on code in PR #16971:
URL: https://github.com/apache/datafusion/pull/16971#discussion_r2246489431
##########
datafusion/common/src/config.rs:
##########
@@ -549,6 +549,12 @@ config_namespace! {
/// (reading) Use any available bloom filters when reading parquet files
pub bloom_filter_on_read: bool, default = true
+ /// (reading) Whether or not to enable the caching of embedded metadata of Parquet files
+ /// (footer and page metadata). Enabling it can offer substantial performance improvements
+ /// for repeated queries over large files. By default, the cache is automatically
+ /// invalidated when the underlying file is modified.
+ pub cache_metadata: bool, default = false
Review Comment:
See https://github.com/apache/datafusion/issues/17001
##########
datafusion/common/src/config.rs:
##########
@@ -549,6 +549,12 @@ config_namespace! {
/// (reading) Use any available bloom filters when reading parquet files
pub bloom_filter_on_read: bool, default = true
+ /// (reading) Whether or not to enable the caching of embedded metadata of Parquet files
+ /// (footer and page metadata). Enabling it can offer substantial performance improvements
+ /// for repeated queries over large files. By default, the cache is automatically
+ /// invalidated when the underlying file is modified.
+ pub cache_metadata: bool, default = false
Review Comment:
- See https://github.com/apache/datafusion/issues/17001
--
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.
To unsubscribe, e-mail: [email protected]
For queries about this service, please contact Infrastructure at:
[email protected]
---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]