From f605f28d989536ef4044d818c91fcd00fa624a9f Mon Sep 17 00:00:00 2001 From: Sagar Sumit Date: Fri, 13 Sep 2024 14:45:25 +0530 Subject: [PATCH] [HUDI-8102] Turn on data skipping and position-based record merging by default (#11620) --- .../java/org/apache/hudi/common/config/HoodieReaderConfig.java | 2 +- .../src/main/scala/org/apache/hudi/DataSourceOptions.scala | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/hudi-common/src/main/java/org/apache/hudi/common/config/HoodieReaderConfig.java b/hudi-common/src/main/java/org/apache/hudi/common/config/HoodieReaderConfig.java index bb29e090ec32..452dcb670207 100644 --- a/hudi-common/src/main/java/org/apache/hudi/common/config/HoodieReaderConfig.java +++ b/hudi-common/src/main/java/org/apache/hudi/common/config/HoodieReaderConfig.java @@ -68,7 +68,7 @@ public class HoodieReaderConfig extends HoodieConfig { public static final ConfigProperty MERGE_USE_RECORD_POSITIONS = ConfigProperty .key("hoodie.merge.use.record.positions") - .defaultValue(false) + .defaultValue(true) .markAdvanced() .sinceVersion("1.0.0") .withDocumentation("Whether to use positions in the block header for data blocks containing updates and delete blocks for merging."); diff --git a/hudi-spark-datasource/hudi-spark-common/src/main/scala/org/apache/hudi/DataSourceOptions.scala b/hudi-spark-datasource/hudi-spark-common/src/main/scala/org/apache/hudi/DataSourceOptions.scala index 2f77f5bce9e9..82d8e2ad2f67 100644 --- a/hudi-spark-datasource/hudi-spark-common/src/main/scala/org/apache/hudi/DataSourceOptions.scala +++ b/hudi-spark-datasource/hudi-spark-common/src/main/scala/org/apache/hudi/DataSourceOptions.scala @@ -157,7 +157,7 @@ object DataSourceReadOptions { val ENABLE_DATA_SKIPPING: ConfigProperty[Boolean] = ConfigProperty .key("hoodie.enable.data.skipping") - .defaultValue(false) + .defaultValue(true) .markAdvanced() .sinceVersion("0.10.0") .withDocumentation("Enables data-skipping allowing queries to leverage indexes to reduce the search space by " +