From 1b27f12f683c67d60ca4dab8624065516dc53054 Mon Sep 17 00:00:00 2001
From: James Xu <xumingmingv@gmail.com>
Date: Thu, 25 Jun 2026 11:37:28 +0800
Subject: [PATCH 1/3] [SPARK-57688][SQL] Add
 spark.sql.execution.bypassPartialAggregation to skip pre-shuffle partial agg

Adds a new SQL config spark.sql.execution.bypassPartialAggregation
(default false). When set to true, planAggregateWithoutDistinct skips
the pre-shuffle Partial-mode aggregation and runs a single Complete-mode
aggregation after the shuffle instead. This can improve performance when
group cardinality is high and the pre-shuffle reduction ratio is low.

The bypass is suppressed when a session_window grouping key is present,
since MergingSessionsExec must be inserted in the Partial+Merge+Final
path to correctly merge overlapping sessions.

The config has no effect on queries containing DISTINCT aggregate
functions, where the partial aggregation phases are required for
correctness and are always applied.
---
 .../apache/spark/sql/internal/SQLConf.scala   |  13 ++
 .../sql/execution/aggregate/AggUtils.scala    |  23 +++
 .../PartialAggregationBypassSuite.scala       | 178 ++++++++++++++++++
 3 files changed, 214 insertions(+)
 create mode 100644 sql/core/src/test/scala/org/apache/spark/sql/execution/aggregate/PartialAggregationBypassSuite.scala

diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/internal/SQLConf.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/internal/SQLConf.scala
index ff2dd2dbd4833..87dbc05770b2b 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/internal/SQLConf.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/internal/SQLConf.scala
@@ -3869,6 +3869,17 @@ object SQLConf {
     .booleanConf
     .createWithDefault(true)
 
+  val BYPASS_PARTIAL_AGGREGATION = buildConf("spark.sql.execution.bypassPartialAggregation")
+    .doc("When true, skips the pre-shuffle partial aggregation and runs a single Complete-mode " +
+      "aggregation after the shuffle. Bypassing partial aggregation can improve performance " +
+      "when group cardinality is high and the pre-shuffle reduction ratio is low. " +
+      "When false (default), uses a two-phase Partial+Final aggregation across a shuffle. " +
+      "This setting has no effect on queries containing DISTINCT aggregate functions, where " +
+      "the partial aggregation phases are required for correctness and are always applied.")
+    .version("3.3.1")
+    .booleanConf
+    .createWithDefault(false)
+
   val JSON_GENERATOR_IGNORE_NULL_FIELDS =
     buildConf("spark.sql.jsonGenerator.ignoreNullFields")
       .doc("Whether to ignore null fields when generating JSON objects in JSON data source and " +
@@ -8324,6 +8335,8 @@ class SQLConf extends Serializable with Logging with SqlApiConf {
 
   def useHashAggregation: Boolean = getConf(USE_HASH_AGG)
 
+  def bypassPartialAggregation: Boolean = getConf(BYPASS_PARTIAL_AGGREGATION)
+
   def objectAggSortBasedFallbackThreshold: Int = getConf(OBJECT_AGG_SORT_BASED_FALLBACK_THRESHOLD)
 
   def variableSubstituteEnabled: Boolean = getConf(VARIABLE_SUBSTITUTE_ENABLED)
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/AggUtils.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/AggUtils.scala
index c2a7024367afd..40b720b63fa47 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/AggUtils.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/AggUtils.scala
@@ -129,6 +129,29 @@ object AggUtils {
       child: SparkPlan): Seq[SparkPlan] = {
     // Check if we can use HashAggregate.
 
+    // When partial aggregation is disabled, skip the pre-shuffle partial aggregation and run a
+    // single Complete-mode aggregation after the shuffle. This can improve performance when the
+    // group cardinality is high and the pre-shuffle reduction ratio is low.
+    //
+    // session_window requires MergingSessionsExec (inserted below via mayAppendMergingSessionExec)
+    // to sort and merge overlapping sessions before the final aggregation. The bypass is skipped
+    // when a session_window grouping key is present so that the normal Partial+Merge+Final path
+    // runs and MergingSessionsExec is correctly inserted.
+    val hasSessionWindow = groupingExpressions.exists(_.metadata.contains(SessionWindow.marker))
+    if (child.conf.bypassPartialAggregation && !hasSessionWindow) {
+      val completeAggregateExpressions = aggregateExpressions.map(_.copy(mode = Complete))
+      val completeAggregateAttributes = completeAggregateExpressions.map(_.resultAttribute)
+      val completeAggregate = createAggregate(
+        requiredChildDistributionExpressions = Some(groupingExpressions),
+        groupingExpressions = groupingExpressions,
+        aggregateExpressions = completeAggregateExpressions,
+        aggregateAttributes = completeAggregateAttributes,
+        initialInputBufferOffset = 0,
+        resultExpressions = resultExpressions,
+        child = child)
+      return completeAggregate :: Nil
+    }
+
     // 1. Create an Aggregate Operator for partial aggregations.
 
     val groupingAttributes = groupingExpressions.map(_.toAttribute)
diff --git a/sql/core/src/test/scala/org/apache/spark/sql/execution/aggregate/PartialAggregationBypassSuite.scala b/sql/core/src/test/scala/org/apache/spark/sql/execution/aggregate/PartialAggregationBypassSuite.scala
new file mode 100644
index 0000000000000..2ffe5731078d6
--- /dev/null
+++ b/sql/core/src/test/scala/org/apache/spark/sql/execution/aggregate/PartialAggregationBypassSuite.scala
@@ -0,0 +1,178 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License.  You may obtain a copy of the License at
+ *
+ *    http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.execution.aggregate
+
+import org.apache.spark.sql.{functions => F, QueryTest}
+import org.apache.spark.sql.catalyst.expressions.aggregate.{Complete, Final, Partial}
+import org.apache.spark.sql.execution.SparkPlan
+import org.apache.spark.sql.execution.adaptive.AdaptiveSparkPlanHelper
+import org.apache.spark.sql.functions.{collect_list, count, session_window, sum}
+import org.apache.spark.sql.internal.SQLConf
+import org.apache.spark.sql.test.SharedSparkSession
+
+class PartialAggregationBypassSuite
+    extends QueryTest
+    with SharedSparkSession
+    with AdaptiveSparkPlanHelper {
+
+  private def aggNodes(plan: SparkPlan): Seq[BaseAggregateExec] =
+    collectWithSubqueries(plan) { case a: BaseAggregateExec => a }
+
+  private def withAndWithoutAQE(f: => Unit): Unit = {
+    Seq("true", "false").foreach { aqe =>
+      withSQLConf(SQLConf.ADAPTIVE_EXECUTION_ENABLED.key -> aqe)(f)
+    }
+  }
+
+  test("bypassPartialAggregation=true produces no Partial-mode node and one Complete-mode node") {
+    withAndWithoutAQE {
+      withSQLConf(SQLConf.BYPASS_PARTIAL_AGGREGATION.key -> "true") {
+        val df = spark.range(100).toDF("v")
+          .groupBy((F.col("v") % 10).as("k"))
+          .agg(F.sum("v"), F.count("v"))
+        val aggs = aggNodes(df.queryExecution.executedPlan)
+        assert(aggs.forall(_.aggregateExpressions.forall(_.mode != Partial)),
+          "expected no Partial-mode aggregation nodes")
+        assert(aggs.exists(_.aggregateExpressions.exists(_.mode == Complete)),
+          "expected at least one Complete-mode aggregation node")
+        assert(!aggs.exists(_.aggregateExpressions.exists(_.mode == Final)),
+          "expected no Final-mode aggregation nodes")
+      }
+    }
+  }
+
+  test("bypassPartialAggregation=false (default) produces Partial+Final plan") {
+    withAndWithoutAQE {
+      val df = spark.range(100).toDF("v")
+        .groupBy((F.col("v") % 10).as("k"))
+        .agg(F.sum("v"))
+      val aggs = aggNodes(df.queryExecution.executedPlan)
+      assert(aggs.exists(_.aggregateExpressions.exists(_.mode == Partial)),
+        "expected a Partial-mode aggregation node")
+      assert(aggs.exists(_.aggregateExpressions.exists(_.mode == Final)),
+        "expected a Final-mode aggregation node")
+    }
+  }
+
+  test("results are identical with and without partial aggregation — SUM") {
+    withAndWithoutAQE {
+      val data = spark.range(1000).selectExpr("id % 7 as k", "id as v")
+      val expected = data.groupBy("k").sum("v").orderBy("k").collect()
+      withSQLConf(SQLConf.BYPASS_PARTIAL_AGGREGATION.key -> "true") {
+        val actual = data.groupBy("k").sum("v").orderBy("k").collect()
+        assert(actual.toSeq == expected.toSeq)
+      }
+    }
+  }
+
+  test("results are identical with and without partial aggregation — COUNT") {
+    withAndWithoutAQE {
+      val data = spark.range(1000).selectExpr("id % 13 as k")
+      val expected = data.groupBy("k").count().orderBy("k").collect()
+      withSQLConf(SQLConf.BYPASS_PARTIAL_AGGREGATION.key -> "true") {
+        val actual = data.groupBy("k").count().orderBy("k").collect()
+        assert(actual.toSeq == expected.toSeq)
+      }
+    }
+  }
+
+  test("results are identical with and without partial aggregation — AVG") {
+    withAndWithoutAQE {
+      val data = spark.range(1000).selectExpr("id % 5 as k", "id as v")
+      val expected = data.groupBy("k").avg("v").orderBy("k").collect()
+      withSQLConf(SQLConf.BYPASS_PARTIAL_AGGREGATION.key -> "true") {
+        val actual = data.groupBy("k").avg("v").orderBy("k").collect()
+        assert(actual.toSeq == expected.toSeq)
+      }
+    }
+  }
+
+  test("results are identical with and without partial aggregation — collect_list " +
+      "(TypedImperativeAggregate via ObjectHashAggregateExec)") {
+    // collect_list is a TypedImperativeAggregate whose buffer cannot be expressed as fixed-width
+    // slots, so createAggregate routes it through ObjectHashAggregateExec rather than
+    // HashAggregateExec. This test verifies that the bypass correctly produces a single
+    // Complete-mode ObjectHashAggregateExec and that its results match the normal Partial+Final
+    // path.
+    withAndWithoutAQE {
+      val data = spark.range(20).selectExpr("id % 4 as k", "id as v")
+      val expected = data.groupBy("k").agg(collect_list("v"))
+        .orderBy("k").collect()
+      withSQLConf(SQLConf.BYPASS_PARTIAL_AGGREGATION.key -> "true") {
+        val df = data.groupBy("k").agg(collect_list("v")).orderBy("k")
+        val aggs = aggNodes(df.queryExecution.executedPlan)
+        assert(aggs.exists(_.isInstanceOf[ObjectHashAggregateExec]),
+          "expected ObjectHashAggregateExec for TypedImperativeAggregate")
+        assert(aggs.forall(_.aggregateExpressions.forall(_.mode != Partial)),
+          "expected no Partial-mode aggregation nodes")
+        // collect_list output order within each group may differ between runs; sort before compare.
+        val actual = df.collect()
+        assert(actual.length == expected.length)
+        actual.zip(expected).foreach { case (a, e) =>
+          assert(a.getLong(0) == e.getLong(0))
+          assert(a.getSeq[Long](1).sorted == e.getSeq[Long](1).sorted)
+        }
+      }
+    }
+  }
+
+  test("session_window with bypassPartialAggregation=true merges overlapping sessions correctly") {
+    // Regression test: when bypassPartialAggregation=true, the early-return path in
+    // planAggregateWithoutDistinct skipped mayAppendMergingSessionExec, so overlapping
+    // sessions were never merged and the aggregation produced wrong row counts / sums.
+    import testImplicits._
+    // Two events for key "a" fall within 10s of each other and must merge into one session.
+    // One event for key "b" stands alone.
+    val df = Seq(
+      ("2016-03-27 19:39:34", 1, "a"),
+      ("2016-03-27 19:39:39", 2, "a"), // within 10s of the first "a" — same session
+      ("2016-03-27 19:39:56", 3, "a"), // > 10s gap — separate session
+      ("2016-03-27 19:39:27", 4, "b")
+    ).toDF("time", "value", "id")
+
+    val expected = df
+      .groupBy(session_window($"time", "10 seconds"), $"id")
+      .agg(count("*").as("cnt"), sum("value").as("total"))
+      .orderBy($"session_window.start".asc)
+      .selectExpr(
+        "CAST(session_window.start AS STRING)",
+        "CAST(session_window.end AS STRING)",
+        "id", "cnt", "total")
+      .collect()
+
+    // With the bug, bypassPartialAggregation=true skips MergingSessionsExec and the two
+    // "a" events that belong to the same session appear as separate rows.
+    withAndWithoutAQE {
+      withSQLConf(SQLConf.BYPASS_PARTIAL_AGGREGATION.key -> "true") {
+        val actual = df
+          .groupBy(session_window($"time", "10 seconds"), $"id")
+          .agg(count("*").as("cnt"), sum("value").as("total"))
+          .orderBy($"session_window.start".asc)
+          .selectExpr(
+            "CAST(session_window.start AS STRING)",
+            "CAST(session_window.end AS STRING)",
+            "id", "cnt", "total")
+          .collect()
+
+        assert(actual.toSeq == expected.toSeq,
+          s"session_window results differ with bypassPartialAggregation=true.\n" +
+            s"Expected:\n${expected.mkString("\n")}\nActual:\n${actual.mkString("\n")}")
+      }
+    }
+  }
+}

From 037f169dfe0e0fee78e0a6c11434d5aba947e01f Mon Sep 17 00:00:00 2001
From: James Xu <xumingmingv@gmail.com>
Date: Fri, 26 Jun 2026 14:06:16 +0800
Subject: [PATCH 2/3] [SPARK-57688][SQL] Use checkAnswer in
 PartialAggregationBypassSuite for better diagnostics
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Switch scalar-aggregate tests (SUM, COUNT, AVG, session_window) to use
checkAnswer instead of raw actual.toSeq == expected.toSeq, providing
better error messages when comparisons fail by pinpointing the
mismatched row and column.

Keep manual zip-and-sort for the collect_list test since checkAnswer
does not sort nested arrays — collect_list output order within groups
is non-deterministic between Partial+Final and Complete aggregation
paths.

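Also replace non-ASCII em-dashes with ASCII equivalents (--, -, :) in
test names and comments to satisfy scalastyle.

In SQLConf, correct the version of
spark.sql.execution.bypassPartialAggregation from 3.3.1 to 4.3.0 and
declare its binding policy as ConfigBindingPolicy.SESSION.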
---
 .../apache/spark/sql/internal/SQLConf.scala   |  3 +-
 .../PartialAggregationBypassSuite.scala       | 35 +++++++++----------
 2 files changed, 19 insertions(+), 19 deletions(-)

diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/internal/SQLConf.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/internal/SQLConf.scala
index 87dbc05770b2b..a373e13da54a2 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/internal/SQLConf.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/internal/SQLConf.scala
@@ -3876,7 +3876,8 @@ object SQLConf {
       "When false (default), uses a two-phase Partial+Final aggregation across a shuffle. " +
       "This setting has no effect on queries containing DISTINCT aggregate functions, where " +
       "the partial aggregation phases are required for correctness and are always applied.")
-    .version("3.3.1")
+    .version("4.3.0")
+    .withBindingPolicy(ConfigBindingPolicy.SESSION)
     .booleanConf
     .createWithDefault(false)
 
diff --git a/sql/core/src/test/scala/org/apache/spark/sql/execution/aggregate/PartialAggregationBypassSuite.scala b/sql/core/src/test/scala/org/apache/spark/sql/execution/aggregate/PartialAggregationBypassSuite.scala
index 2ffe5731078d6..0e8962ecad7bf 100644
--- a/sql/core/src/test/scala/org/apache/spark/sql/execution/aggregate/PartialAggregationBypassSuite.scala
+++ b/sql/core/src/test/scala/org/apache/spark/sql/execution/aggregate/PartialAggregationBypassSuite.scala
@@ -69,40 +69,40 @@ class PartialAggregationBypassSuite
     }
   }
 
-  test("results are identical with and without partial aggregation — SUM") {
+  test("results are identical with and without partial aggregation - SUM") {
     withAndWithoutAQE {
       val data = spark.range(1000).selectExpr("id % 7 as k", "id as v")
       val expected = data.groupBy("k").sum("v").orderBy("k").collect()
       withSQLConf(SQLConf.BYPASS_PARTIAL_AGGREGATION.key -> "true") {
-        val actual = data.groupBy("k").sum("v").orderBy("k").collect()
-        assert(actual.toSeq == expected.toSeq)
+        val actual = data.groupBy("k").sum("v").orderBy("k")
+        checkAnswer(actual, expected)
       }
     }
   }
 
-  test("results are identical with and without partial aggregation — COUNT") {
+  test("results are identical with and without partial aggregation - COUNT") {
     withAndWithoutAQE {
       val data = spark.range(1000).selectExpr("id % 13 as k")
       val expected = data.groupBy("k").count().orderBy("k").collect()
       withSQLConf(SQLConf.BYPASS_PARTIAL_AGGREGATION.key -> "true") {
-        val actual = data.groupBy("k").count().orderBy("k").collect()
-        assert(actual.toSeq == expected.toSeq)
+        val actual = data.groupBy("k").count().orderBy("k")
+        checkAnswer(actual, expected)
       }
     }
   }
 
-  test("results are identical with and without partial aggregation — AVG") {
+  test("results are identical with and without partial aggregation - AVG") {
     withAndWithoutAQE {
       val data = spark.range(1000).selectExpr("id % 5 as k", "id as v")
       val expected = data.groupBy("k").avg("v").orderBy("k").collect()
       withSQLConf(SQLConf.BYPASS_PARTIAL_AGGREGATION.key -> "true") {
-        val actual = data.groupBy("k").avg("v").orderBy("k").collect()
-        assert(actual.toSeq == expected.toSeq)
+        val actual = data.groupBy("k").avg("v").orderBy("k")
+        checkAnswer(actual, expected)
       }
     }
   }
 
-  test("results are identical with and without partial aggregation — collect_list " +
+  test("results are identical with and without partial aggregation - collect_list " +
       "(TypedImperativeAggregate via ObjectHashAggregateExec)") {
     // collect_list is a TypedImperativeAggregate whose buffer cannot be expressed as fixed-width
     // slots, so createAggregate routes it through ObjectHashAggregateExec rather than
@@ -120,7 +120,10 @@ class PartialAggregationBypassSuite
           "expected ObjectHashAggregateExec for TypedImperativeAggregate")
         assert(aggs.forall(_.aggregateExpressions.forall(_.mode != Partial)),
           "expected no Partial-mode aggregation nodes")
-        // collect_list output order within each group may differ between runs; sort before compare.
+        // checkAnswer is not used here because it does not sort nested arrays, and
+        // collect_list output order within each group is non-deterministic: it depends
+        // on row processing order which can differ between Partial+Final and Complete
+        // aggregation paths. Sort the arrays before comparing.
         val actual = df.collect()
         assert(actual.length == expected.length)
         actual.zip(expected).foreach { case (a, e) =>
@@ -140,8 +143,8 @@ class PartialAggregationBypassSuite
     // One event for key "b" stands alone.
     val df = Seq(
       ("2016-03-27 19:39:34", 1, "a"),
-      ("2016-03-27 19:39:39", 2, "a"), // within 10s of the first "a" — same session
-      ("2016-03-27 19:39:56", 3, "a"), // > 10s gap — separate session
+      ("2016-03-27 19:39:39", 2, "a"), // within 10s of the first "a" -- same session
+      ("2016-03-27 19:39:56", 3, "a"), // > 10s gap -- separate session
       ("2016-03-27 19:39:27", 4, "b")
     ).toDF("time", "value", "id")
 
@@ -167,11 +170,7 @@ class PartialAggregationBypassSuite
             "CAST(session_window.start AS STRING)",
             "CAST(session_window.end AS STRING)",
             "id", "cnt", "total")
-          .collect()
-
-        assert(actual.toSeq == expected.toSeq,
-          s"session_window results differ with bypassPartialAggregation=true.\n" +
-            s"Expected:\n${expected.mkString("\n")}\nActual:\n${actual.mkString("\n")}")
+        checkAnswer(actual, expected)
       }
     }
   }

From c8a214a883c6443193a5223c730e739820cb8ff7 Mon Sep 17 00:00:00 2001
From: James Xu <xumingmingv@gmail.com>
Date: Fri, 26 Jun 2026 14:29:14 +0800
Subject: [PATCH 3/3] [SPARK-57688][SQL] Skip partial aggregation bypass for
 global aggregations
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Global aggregations (no GROUP BY) always produce a single output row, so
the pre-shuffle partial aggregation achieves the maximum possible
reduction ratio. Bypassing it would shuffle all raw rows to a single
partition with no benefit — strictly worse than Partial+Final.

Extract hasGroupingKeys = groupingExpressions.nonEmpty and add it to the
bypass gate alongside hasSessionWindow, so the bypass only fires when
there are grouping keys to hash-partition on.

Add a test verifying that global aggregations continue to produce
Partial+Final plans even with bypassPartialAggregation=true.
---
 .../sql/execution/aggregate/AggUtils.scala    | 11 ++++++++--
 .../PartialAggregationBypassSuite.scala       | 21 +++++++++++++++++++
 2 files changed, 30 insertions(+), 2 deletions(-)

diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/AggUtils.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/AggUtils.scala
index 40b720b63fa47..7fda560863809 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/AggUtils.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/AggUtils.scala
@@ -129,16 +129,23 @@ object AggUtils {
       child: SparkPlan): Seq[SparkPlan] = {
     // Check if we can use HashAggregate.
 
-    // When partial aggregation is disabled, skip the pre-shuffle partial aggregation and run a
+    // When partial aggregation is bypassed, skip the pre-shuffle partial aggregation and run a
     // single Complete-mode aggregation after the shuffle. This can improve performance when the
     // group cardinality is high and the pre-shuffle reduction ratio is low.
     //
+    // The bypass is only beneficial when there are grouping keys (groupingExpressions.nonEmpty):
+    // global aggregations (no GROUP BY) always produce a single output row, so the pre-shuffle
+    // partial aggregation achieves the maximum possible reduction ratio and should never be
+    // skipped. Bypassing a global aggregation would shuffle all raw rows to a single partition
+    // with no benefit, which is strictly worse than the normal Partial+Final path.
+    val hasGroupingKeys = groupingExpressions.nonEmpty
+
     // session_window requires MergingSessionsExec (inserted below via mayAppendMergingSessionExec)
     // to sort and merge overlapping sessions before the final aggregation. The bypass is skipped
     // when a session_window grouping key is present so that the normal Partial+Merge+Final path
     // runs and MergingSessionsExec is correctly inserted.
     val hasSessionWindow = groupingExpressions.exists(_.metadata.contains(SessionWindow.marker))
-    if (child.conf.bypassPartialAggregation && !hasSessionWindow) {
+    if (child.conf.bypassPartialAggregation && hasGroupingKeys && !hasSessionWindow) {
       val completeAggregateExpressions = aggregateExpressions.map(_.copy(mode = Complete))
       val completeAggregateAttributes = completeAggregateExpressions.map(_.resultAttribute)
       val completeAggregate = createAggregate(
diff --git a/sql/core/src/test/scala/org/apache/spark/sql/execution/aggregate/PartialAggregationBypassSuite.scala b/sql/core/src/test/scala/org/apache/spark/sql/execution/aggregate/PartialAggregationBypassSuite.scala
index 0e8962ecad7bf..b64bd9fe37f95 100644
--- a/sql/core/src/test/scala/org/apache/spark/sql/execution/aggregate/PartialAggregationBypassSuite.scala
+++ b/sql/core/src/test/scala/org/apache/spark/sql/execution/aggregate/PartialAggregationBypassSuite.scala
@@ -56,6 +56,27 @@ class PartialAggregationBypassSuite
     }
   }
 
+  test("bypassPartialAggregation=true does not bypass global aggregation " +
+      "(groupingExpressions.isEmpty)") {
+    // Global aggregations (no GROUP BY) always produce a single output row, so the
+    // pre-shuffle partial aggregation achieves the maximum possible reduction ratio.
+    // Bypassing it would shuffle all raw rows to a single partition with no benefit,
+    // which is strictly worse than the normal Partial+Final path. The bypass is
+    // therefore skipped for global aggregations.
+    withAndWithoutAQE {
+      withSQLConf(SQLConf.BYPASS_PARTIAL_AGGREGATION.key -> "true") {
+        val df = spark.range(100).agg(F.sum("id"), F.count("id"))
+        val aggs = aggNodes(df.queryExecution.executedPlan)
+        assert(aggs.exists(_.aggregateExpressions.exists(_.mode == Partial)),
+          "expected a Partial-mode node for global aggregation")
+        assert(aggs.exists(_.aggregateExpressions.exists(_.mode == Final)),
+          "expected a Final-mode node for global aggregation")
+        assert(!aggs.exists(_.aggregateExpressions.exists(_.mode == Complete)),
+          "expected no Complete-mode nodes for global aggregation")
+      }
+    }
+  }
+
   test("bypassPartialAggregation=false (default) produces Partial+Final plan") {
     withAndWithoutAQE {
       val df = spark.range(100).toDF("v")