This is an automated email from the ASF dual-hosted git repository.

yuanzhou pushed a commit to branch main
in repository https://gitbox.apache.org/repos/asf/incubator-gluten.git


The following commit(s) were added to refs/heads/main by this push:
     new 664ef23270 [VL] Use clean docker image for Celeborn tests (#11250)
664ef23270 is described below

commit 664ef2327051a26d9d05aad8ff97341f5abc829c
Author: Yuan <[email protected]>
AuthorDate: Fri Dec 5 01:16:28 2025 +0000

    [VL] Use clean docker image for Celeborn tests (#11250)
    
    * use clean docker image for celeborn
    
    Signed-off-by: Yuan <[email protected]>
    
    * speedup download with apache mirror
    
    Signed-off-by: Yuan <[email protected]>
    
    ---------
    
    Signed-off-by: Yuan <[email protected]>
---
 .github/workflows/velox_backend_x86.yml | 17 ++++++++++++++---
 1 file changed, 14 insertions(+), 3 deletions(-)

diff --git a/.github/workflows/velox_backend_x86.yml b/.github/workflows/velox_backend_x86.yml
index 420763dd1b..d2a9768dde 100644
--- a/.github/workflows/velox_backend_x86.yml
+++ b/.github/workflows/velox_backend_x86.yml
@@ -561,7 +561,7 @@ jobs:
         celeborn: [ "celeborn-0.6.1", "celeborn-0.5.4"]
         writer: ["sort", "hash"]
     runs-on: ubuntu-22.04
-    container: apache/gluten:centos-8-jdk8
+    container: centos:8
     steps:
       - uses: actions/checkout@v2
       - name: Download All Native Artifacts
@@ -574,6 +574,17 @@ jobs:
         with:
           name: arrow-jars-centos-7-${{github.sha}}
           path: /root/.m2/repository/org/apache/arrow/
+      - name: Update mirror list
+        run: |
+          sed -i -e "s|mirrorlist=|#mirrorlist=|g" /etc/yum.repos.d/CentOS-* || true
+          sed -i -e "s|#baseurl=http://mirror.centos.org|baseurl=http://vault.centos.org|g" /etc/yum.repos.d/CentOS-* || true
+      - name: Setup java and maven
+        run: |
+          yum update -y && yum install -y java-1.8.0-openjdk-devel wget
+          $SETUP install_maven
+      - name: Set environment variables
+        run: |
+          echo "JAVA_HOME=/usr/lib/jvm/java-1.8.0-openjdk" >> $GITHUB_ENV
       - name: Build for Spark ${{ matrix.spark }}
         run: |
           cd $GITHUB_WORKSPACE/
@@ -589,7 +600,7 @@ jobs:
           echo "EXTRA_PROFILE: ${EXTRA_PROFILE}"
           if [ ! -e "/opt/apache-${{ matrix.celeborn }}-bin.tgz" ]; then
             echo "WARNING: please pre-install your required package in docker image since the downloading is throttled by this site."
-            wget -nv https://archive.apache.org/dist/celeborn/${{ matrix.celeborn }}/apache-${{ matrix.celeborn }}-bin.tgz -P /opt/
+            wget -nv https://www.apache.org/dyn/closer.lua/celeborn/${{ matrix.celeborn }}/apache-${{ matrix.celeborn }}-bin.tgz?action=download -O /opt/apache-${{ matrix.celeborn }}-bin.tgz
           fi
           cd /opt && rm -rf shims && mkdir -p celeborn && \
           tar xzf apache-${{ matrix.celeborn }}-bin.tgz -C /opt/celeborn --strip-components=1 && cd celeborn && \
@@ -610,7 +621,7 @@ jobs:
             --extra-conf=spark.celeborn.client.eagerlyCreateInputStream.threads=4 \
             --benchmark-type=ds --error-on-memleak \
             --off-heap-size=16g -s=1.0 --threads=16 --iterations=1
-          if false; then # TODO: fix celeborn rss sort issue
+          if [ "${{ matrix.writer }}" = "sort" ]; then
             GLUTEN_IT_JVM_ARGS=-Xmx16G sbin/gluten-it.sh queries-compare \
               --local --preset=velox-with-celeborn --extra-conf=spark.celeborn.client.spark.shuffle.writer=${{ matrix.writer }} \
               --extra-conf=spark.gluten.sql.columnar.shuffle.celeborn.useRssSort=false \


---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]

Reply via email to