This is an automated email from the ASF dual-hosted git repository.
vhs pushed a commit to branch master
in repository https://gitbox.apache.org/repos/asf/hudi.git
The following commit(s) were added to refs/heads/master by this push:
new 433bf82a8d29 fix: Prevent HiveSyncTool from running twice in meta sync (#17937)
433bf82a8d29 is described below
commit 433bf82a8d29c98e28398e6241754293cfe3b63c
Author: Surya Prasanna <[email protected]>
AuthorDate: Sun Jan 18 20:26:59 2026 -0800
fix: Prevent HiveSyncTool from running twice in meta sync (#17937)
* Make sure HiveSyncTool does not run twice
* Refactor code
* Fix checkstyle issues
---
.../src/main/java/org/apache/hudi/utilities/streamer/StreamSync.java | 3 ++-
1 file changed, 2 insertions(+), 1 deletion(-)
diff --git a/hudi-utilities/src/main/java/org/apache/hudi/utilities/streamer/StreamSync.java b/hudi-utilities/src/main/java/org/apache/hudi/utilities/streamer/StreamSync.java
index 6591c39fbb12..25a16acdf8a8 100644
--- a/hudi-utilities/src/main/java/org/apache/hudi/utilities/streamer/StreamSync.java
+++ b/hudi-utilities/src/main/java/org/apache/hudi/utilities/streamer/StreamSync.java
@@ -138,6 +138,7 @@ import java.util.Collections;
import java.util.HashMap;
import java.util.List;
import java.util.Map;
+import java.util.Set;
import java.util.concurrent.atomic.AtomicLong;
import java.util.function.Function;
import java.util.function.Supplier;
@@ -1009,7 +1010,7 @@ public class StreamSync implements Serializable, Closeable {
}
public void runMetaSync() {
- List<String> syncClientToolClasses =
Arrays.stream(cfg.syncClientToolClassNames.split(",")).distinct().collect(Collectors.toList());
+ Set<String> syncClientToolClasses =
Arrays.stream(cfg.syncClientToolClassNames.split(",")).collect(Collectors.toSet());
// for backward compatibility
if (cfg.enableHiveSync) {
cfg.enableMetaSync = true;