This is an automated email from the ASF dual-hosted git repository.

agrove pushed a commit to branch main
in repository https://gitbox.apache.org/repos/asf/datafusion-comet.git


The following commit(s) were added to refs/heads/main by this push:
     new fc122e806 build: Set thread thresholds envs for spark test on macOS 
(#2987)
fc122e806 is described below

commit fc122e806fcb9f82b79bd1541b61ce995881a9e6
Author: Zhen Wang <[email protected]>
AuthorDate: Fri Dec 26 22:42:01 2025 +0800

    build: Set thread thresholds envs for spark test on macOS (#2987)
---
 .github/workflows/pr_build_macos.yml                     | 16 ++++++++--------
 .../test/scala/org/apache/spark/sql/CometTestBase.scala  |  8 ++++++++
 2 files changed, 16 insertions(+), 8 deletions(-)

diff --git a/.github/workflows/pr_build_macos.yml 
b/.github/workflows/pr_build_macos.yml
index da06bff87..0ad40c193 100644
--- a/.github/workflows/pr_build_macos.yml
+++ b/.github/workflows/pr_build_macos.yml
@@ -132,14 +132,6 @@ jobs:
             value: |
               org.apache.spark.sql.CometToPrettyStringSuite
 
-        exclude:
-          # Skip fuzz suite for Spark 4.0
-          # https://github.com/apache/datafusion-comet/issues/2965
-          - profile:
-              name: "Spark 4.0, JDK 17, Scala 2.13"
-            suite:
-              name: "fuzz"
-
       fail-fast: false
     name: ${{ matrix.os }}/${{ matrix.profile.name }} [${{ matrix.suite.name 
}}]
     runs-on: ${{ matrix.os }}
@@ -152,6 +144,14 @@ jobs:
           jdk-version: ${{ matrix.profile.java_version }}
           jdk-architecture: aarch64
           protoc-architecture: aarch_64
+      - name: Set thread thresholds envs for spark test on macOS
+        # see: https://github.com/apache/datafusion-comet/issues/2965
+        shell: bash
+        run: |
+          echo "SPARK_TEST_SQL_SHUFFLE_EXCHANGE_MAX_THREAD_THRESHOLD=256" >> 
$GITHUB_ENV
+          echo "SPARK_TEST_SQL_RESULT_QUERY_STAGE_MAX_THREAD_THRESHOLD=256" >> 
$GITHUB_ENV
+          echo "SPARK_TEST_HIVE_SHUFFLE_EXCHANGE_MAX_THREAD_THRESHOLD=48" >> 
$GITHUB_ENV
+          echo "SPARK_TEST_HIVE_RESULT_QUERY_STAGE_MAX_THREAD_THRESHOLD=48" >> 
$GITHUB_ENV
       - name: Java test steps
         uses: ./.github/actions/java-test
         with:
diff --git a/spark/src/test/scala/org/apache/spark/sql/CometTestBase.scala 
b/spark/src/test/scala/org/apache/spark/sql/CometTestBase.scala
index 8011e5e70..7dba24bff 100644
--- a/spark/src/test/scala/org/apache/spark/sql/CometTestBase.scala
+++ b/spark/src/test/scala/org/apache/spark/sql/CometTestBase.scala
@@ -89,6 +89,14 @@ abstract class CometTestBase
     // this is an edge case, and we expect most users to allow sorts on 
floating point, so we
     // enable this for the tests
     conf.set(CometConf.getExprAllowIncompatConfigKey("SortOrder"), "true")
+    // For spark 4.0 tests, we need limit the thread threshold to avoid OOM, 
see:
+    //  https://github.com/apache/datafusion-comet/issues/2965
+    conf.set(
+      "spark.sql.shuffleExchange.maxThreadThreshold",
+      
sys.env.getOrElse("SPARK_TEST_SQL_SHUFFLE_EXCHANGE_MAX_THREAD_THRESHOLD", 
"1024"))
+    conf.set(
+      "spark.sql.resultQueryStage.maxThreadThreshold",
+      
sys.env.getOrElse("SPARK_TEST_SQL_RESULT_QUERY_STAGE_MAX_THREAD_THRESHOLD", 
"1024"))
     conf
   }
 


---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]

Reply via email to