This is an automated email from the ASF dual-hosted git repository.

kerwinzhang pushed a commit to branch main
in repository https://gitbox.apache.org/repos/asf/incubator-gluten.git


The following commit(s) were added to refs/heads/main by this push:
     new 32808dd22 [CELEBORN] Upgrade celeborn to 0.4.1 to support scala 2.13-based compilation (#6226)
32808dd22 is described below

commit 32808dd22a0384d0e0bb5011bf2393710a4d5942
Author: Kerwin Zhang <[email protected]>
AuthorDate: Thu Jun 27 09:58:25 2024 +0800

    [CELEBORN] Upgrade celeborn to 0.4.1 to support scala 2.13-based compilation (#6226)
---
 .github/workflows/velox_docker.yml                         |  6 +++---
 docs/get-started/ClickHouse.md                             | 12 ++++++------
 .../shuffle/gluten/celeborn/CelebornShuffleManager.java    |  8 +++++++-
 .../spark/shuffle/gluten/celeborn/CelebornUtils.java       | 14 ++++++++++++--
 pom.xml                                                    |  2 +-
 tools/gluten-it/pom.xml                                    |  4 ++--
 6 files changed, 31 insertions(+), 15 deletions(-)

diff --git a/.github/workflows/velox_docker.yml 
b/.github/workflows/velox_docker.yml
index 31796c15b..d110d0a6d 100644
--- a/.github/workflows/velox_docker.yml
+++ b/.github/workflows/velox_docker.yml
@@ -521,7 +521,7 @@ jobs:
       fail-fast: false
       matrix:
         spark: ["spark-3.2"]
-        celeborn: ["celeborn-0.4.0", "celeborn-0.3.2"]
+        celeborn: ["celeborn-0.4.1", "celeborn-0.3.2-incubating"]
     runs-on: ubuntu-20.04
     container: ubuntu:22.04
     steps:
@@ -557,8 +557,8 @@ jobs:
           fi
           echo "EXTRA_PROFILE: ${EXTRA_PROFILE}"
           cd /opt && mkdir -p celeborn && \
-          wget https://archive.apache.org/dist/incubator/celeborn/${{ 
matrix.celeborn }}-incubating/apache-${{ matrix.celeborn }}-incubating-bin.tgz 
&& \
-          tar xzf apache-${{ matrix.celeborn }}-incubating-bin.tgz -C 
/opt/celeborn --strip-components=1 && cd celeborn && \
+          wget https://archive.apache.org/dist/celeborn/${{ matrix.celeborn 
}}/apache-${{ matrix.celeborn }}-bin.tgz && \
+          tar xzf apache-${{ matrix.celeborn }}-bin.tgz -C /opt/celeborn 
--strip-components=1 && cd celeborn && \
           mv ./conf/celeborn-env.sh.template ./conf/celeborn-env.sh && \
           bash -c "echo -e 
'CELEBORN_MASTER_MEMORY=4g\nCELEBORN_WORKER_MEMORY=4g\nCELEBORN_WORKER_OFFHEAP_MEMORY=8g'
 > ./conf/celeborn-env.sh" && \
           bash -c "echo -e 'celeborn.worker.commitFiles.threads 
128\nceleborn.worker.sortPartition.threads 64' > ./conf/celeborn-defaults.conf" 
&& \
diff --git a/docs/get-started/ClickHouse.md b/docs/get-started/ClickHouse.md
index 4352a99e5..ab24de7a4 100644
--- a/docs/get-started/ClickHouse.md
+++ b/docs/get-started/ClickHouse.md
@@ -679,13 +679,13 @@ 
spark.shuffle.manager=org.apache.spark.shuffle.gluten.celeborn.CelebornShuffleMa
 
 quickly start a celeborn cluster
 ```shell
-wget 
https://archive.apache.org/dist/incubator/celeborn/celeborn-0.3.0-incubating/apache-celeborn-0.3.0-incubating-bin.tgz
 && \
-tar -zxvf apache-celeborn-0.3.0-incubating-bin.tgz && \
-mv apache-celeborn-0.3.0-incubating-bin/conf/celeborn-defaults.conf.template 
apache-celeborn-0.3.0-incubating-bin/conf/celeborn-defaults.conf && \
-mv apache-celeborn-0.3.0-incubating-bin/conf/log4j2.xml.template 
apache-celeborn-0.3.0-incubating-bin/conf/log4j2.xml && \
+wget 
https://archive.apache.org/dist/celeborn/celeborn-0.3.2-incubating/apache-celeborn-0.3.2-incubating-bin.tgz
 && \
+tar -zxvf apache-celeborn-0.3.2-incubating-bin.tgz && \
+mv apache-celeborn-0.3.2-incubating-bin/conf/celeborn-defaults.conf.template 
apache-celeborn-0.3.2-incubating-bin/conf/celeborn-defaults.conf && \
+mv apache-celeborn-0.3.2-incubating-bin/conf/log4j2.xml.template 
apache-celeborn-0.3.2-incubating-bin/conf/log4j2.xml && \
 mkdir /opt/hadoop && chmod 777 /opt/hadoop && \
-echo -e "celeborn.worker.flusher.threads 4\nceleborn.worker.storage.dirs 
/tmp\nceleborn.worker.monitor.disk.enabled false" > 
apache-celeborn-0.3.0-incubating-bin/conf/celeborn-defaults.conf && \
-bash apache-celeborn-0.3.0-incubating-bin/sbin/start-master.sh && bash 
apache-celeborn-0.3.0-incubating-bin/sbin/start-worker.sh
+echo -e "celeborn.worker.flusher.threads 4\nceleborn.worker.storage.dirs 
/tmp\nceleborn.worker.monitor.disk.enabled false" > 
apache-celeborn-0.3.2-incubating-bin/conf/celeborn-defaults.conf && \
+bash apache-celeborn-0.3.2-incubating-bin/sbin/start-master.sh && bash 
apache-celeborn-0.3.2-incubating-bin/sbin/start-worker.sh
 ```
 
 ### Columnar shuffle mode
diff --git 
a/gluten-celeborn/common/src/main/java/org/apache/spark/shuffle/gluten/celeborn/CelebornShuffleManager.java
 
b/gluten-celeborn/common/src/main/java/org/apache/spark/shuffle/gluten/celeborn/CelebornShuffleManager.java
index f454cf00c..d196691d1 100644
--- 
a/gluten-celeborn/common/src/main/java/org/apache/spark/shuffle/gluten/celeborn/CelebornShuffleManager.java
+++ 
b/gluten-celeborn/common/src/main/java/org/apache/spark/shuffle/gluten/celeborn/CelebornShuffleManager.java
@@ -217,7 +217,13 @@ public class CelebornShuffleManager implements 
ShuffleManager {
       }
     }
     return CelebornUtils.unregisterShuffle(
-        lifecycleManager, shuffleClient, shuffleIdTracker, shuffleId, 
appUniqueId, isDriver());
+        lifecycleManager,
+        shuffleClient,
+        shuffleIdTracker,
+        shuffleId,
+        appUniqueId,
+        throwsFetchFailure,
+        isDriver());
   }
 
   @Override
diff --git 
a/gluten-celeborn/common/src/main/java/org/apache/spark/shuffle/gluten/celeborn/CelebornUtils.java
 
b/gluten-celeborn/common/src/main/java/org/apache/spark/shuffle/gluten/celeborn/CelebornUtils.java
index 9dd4e1d11..6b4229ad3 100644
--- 
a/gluten-celeborn/common/src/main/java/org/apache/spark/shuffle/gluten/celeborn/CelebornUtils.java
+++ 
b/gluten-celeborn/common/src/main/java/org/apache/spark/shuffle/gluten/celeborn/CelebornUtils.java
@@ -49,11 +49,21 @@ public class CelebornUtils {
       Object shuffleIdTracker,
       int appShuffleId,
       String appUniqueId,
+      boolean throwsFetchFailure,
       boolean isDriver) {
     try {
-      // for Celeborn 0.4.0
       try {
-        if (lifecycleManager != null) {
+        try {
+          // for Celeborn 0.4.1
+          if (lifecycleManager != null) {
+            Method unregisterAppShuffle =
+                lifecycleManager
+                    .getClass()
+                    .getMethod("unregisterAppShuffle", int.class, 
boolean.class);
+            unregisterAppShuffle.invoke(lifecycleManager, appShuffleId, 
throwsFetchFailure);
+          }
+        } catch (NoSuchMethodException ex) {
+          // for Celeborn 0.4.0
           Method unregisterAppShuffle =
               lifecycleManager.getClass().getMethod("unregisterAppShuffle", 
int.class);
           unregisterAppShuffle.invoke(lifecycleManager, appShuffleId);
diff --git a/pom.xml b/pom.xml
index 81ce0e5d4..887839ce5 100644
--- a/pom.xml
+++ b/pom.xml
@@ -53,7 +53,7 @@
     <delta.package.name>delta-core</delta.package.name>
     <delta.version>2.4.0</delta.version>
     <delta.binary.version>24</delta.binary.version>
-    <celeborn.version>0.3.2-incubating</celeborn.version>
+    <celeborn.version>0.4.1</celeborn.version>
     <uniffle.version>0.8.0</uniffle.version>
     <arrow.version>15.0.0</arrow.version>
     <arrow-gluten.version>15.0.0-gluten</arrow-gluten.version>
diff --git a/tools/gluten-it/pom.xml b/tools/gluten-it/pom.xml
index 3f1760069..71db637a8 100644
--- a/tools/gluten-it/pom.xml
+++ b/tools/gluten-it/pom.xml
@@ -21,7 +21,7 @@
     <spark.version>3.4.2</spark.version>
     <scala.binary.version>2.12</scala.binary.version>
     <spark.major.version>3</spark.major.version>
-    <celeborn.version>0.3.0-incubating</celeborn.version>
+    <celeborn.version>0.3.2-incubating</celeborn.version>
     <uniffle.version>0.8.0</uniffle.version>
     <gluten.version>1.2.0-SNAPSHOT</gluten.version>
     <guava.version>32.0.1-jre</guava.version>
@@ -167,7 +167,7 @@
     <profile>
       <id>celeborn-0.4</id>
       <properties>
-        <celeborn.version>0.4.0-incubating</celeborn.version>
+        <celeborn.version>0.4.1</celeborn.version>
       </properties>
     </profile>
   </profiles>


---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]

Reply via email to