apache · c21 · Nov 24, 2021 · Nov 26, 2021 · Nov 27, 2021 · Dec 1, 2021
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/internal/SQLConf.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/internal/SQLConf.scala
@@ -1504,6 +1504,13 @@ object SQLConf {
     .booleanConf
     .createWithDefault(true)
 
+  val REPLACE_HASH_WITH_SORT_AGG_ENABLED = buildConf("spark.sql.execution.replaceHashWithSortAgg")
+    .internal() // feature flag for the `ReplaceHashWithSortAgg` rule over `SparkPlan`
+    .doc("Whether to replace hash aggregate node with sort aggregate based on children's ordering")
+    .version("3.3.0")
+    .booleanConf
+    .createWithDefault(true) // when false, `ReplaceHashWithSortAgg.apply` returns the plan as is
+
   val STATE_STORE_PROVIDER_CLASS =
     buildConf("spark.sql.streaming.stateStore.providerClass")
       .internal()

diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/QueryExecution.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/QueryExecution.scala
@@ -423,6 +423,9 @@ object QueryExecution {
       PlanSubqueries(sparkSession),
       RemoveRedundantProjects,
       EnsureRequirements(),
+      // `ReplaceHashWithSortAgg` needs to be added after `EnsureRequirements` to guarantee the
+      // sort order of each node is checked to be valid.
+      ReplaceHashWithSortAgg,
       // `RemoveRedundantSorts` needs to be added after `EnsureRequirements` to guarantee the same
       // number of partitions when instantiating PartitioningCollection.
       RemoveRedundantSorts,

diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/ReplaceHashWithSortAgg.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/ReplaceHashWithSortAgg.scala
@@ -0,0 +1,139 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License.  You may obtain a copy of the License at
+ *
+ *    http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.execution
+
+import org.apache.spark.sql.catalyst.expressions.SortOrder
+import org.apache.spark.sql.catalyst.expressions.aggregate.{Complete, Final, Partial}
+import org.apache.spark.sql.catalyst.rules.Rule
+import org.apache.spark.sql.execution.aggregate.HashAggregateExec
+import org.apache.spark.sql.internal.SQLConf
+
+/**
+ * Replace [[HashAggregateExec]] with [[SortAggregateExec]] in the spark plan if:
+ *
+ * 1. The plan is a pair of partial and final [[HashAggregateExec]], and the child of partial
+ *    aggregate satisfies the sort order of corresponding [[SortAggregateExec]].
+ * or
+ * 2. The plan is a [[HashAggregateExec]], and the child satisfies the sort order of
+ *    corresponding [[SortAggregateExec]].
+ *
+ * Examples:
+ * 1. aggregate after join:
+ *
+ *  HashAggregate(t1.i, SUM, final)
+ *               |                         SortAggregate(t1.i, SUM, complete)
+ * HashAggregate(t1.i, SUM, partial)   =>                |
+ *               |                            SortMergeJoin(t1.i = t2.j)
+ *    SortMergeJoin(t1.i = t2.j)
+ *
+ * 2. aggregate after sort:
+ *
+ * HashAggregate(t1.i, SUM, partial)         SortAggregate(t1.i, SUM, partial)
+ *               |                     =>                  |
+ *           Sort(t1.i)                                Sort(t1.i)
+ *
+ * [[HashAggregateExec]] can be replaced when its child satisfies the sort order of
+ * corresponding [[SortAggregateExec]]. [[SortAggregateExec]] is faster in the sense that
+ * it does not have hashing overhead of [[HashAggregateExec]].
+ */
+object ReplaceHashWithSortAgg extends Rule[SparkPlan] {
+  /** Entry point of the rule: the plan is rewritten only while the feature flag is on. */
+  def apply(plan: SparkPlan): SparkPlan = {
+    val enabled = conf.getConf(SQLConf.REPLACE_HASH_WITH_SORT_AGG_ENABLED)
+    if (enabled) replaceHashAgg(plan) else plan
+  }
+
+  /**
+   * Walks the plan top-down and turns each [[HashAggregateExec]] that has grouping keys into
+   * the [[SortAggregateExec]] built by `toSortAggregate`, provided the input already satisfies
+   * the child ordering that sort aggregate requires. A partial/final pair is folded into one
+   * `Complete` sort aggregate when the input of the partial side satisfies that ordering.
+   */
+  private def replaceHashAgg(plan: SparkPlan): SparkPlan = {
+    plan.transformDown {
+      case hashAgg: HashAggregateExec if hashAgg.groupingExpressions.nonEmpty =>
+        val sortAgg = hashAgg.toSortAggregate
+        val requiredOrdering = sortAgg.requiredChildOrdering.head
+        // True when `input` already emits rows in the order the sort aggregate asks for.
+        def isSorted(input: SparkPlan): Boolean =
+          SortOrder.orderingSatisfies(input.outputOrdering, requiredOrdering)
+
+        hashAgg.child match {
+          case partialAgg: HashAggregateExec if isPartialAgg(partialAgg, hashAgg) =>
+            if (!isSorted(partialAgg.child)) {
+              hashAgg
+            } else {
+              // Bypass the partial stage: aggregate its input directly in `Complete` mode.
+              val completeExprs = sortAgg.aggregateExpressions.map(_.copy(mode = Complete))
+              sortAgg.copy(aggregateExpressions = completeExprs, child = partialAgg.child)
+            }
+          case input if isSorted(input) => sortAgg
+          case _ => hashAgg
+        }
+      case other => other
+    }
+  }
+
+  /**
+   * Decides whether `partialAgg` and `finalAgg` are the partial and the final stage of one and
+   * the same aggregation. All of the checks below have to pass; every sequence comparison is
+   * positional (same length, pairwise `semanticEquals`). The checks are written as local
+   * `def`s so that evaluation stops at the first one that fails.
+   */
+  private def isPartialAgg(partialAgg: HashAggregateExec, finalAgg: HashAggregateExec): Boolean = {
+    val partialKeys = partialAgg.groupingExpressions
+    val finalKeys = finalAgg.groupingExpressions
+    val partialFuncs = partialAgg.aggregateExpressions
+    val finalFuncs = finalAgg.aggregateExpressions
+
+    // Both stages group by the same keys.
+    def sameKeys: Boolean = partialKeys.corresponds(finalKeys)(_.semanticEquals(_))
+
+    // Every function is `Partial` below and `Final` above, and the functions pair up.
+    def sameFunctions: Boolean =
+      partialFuncs.forall(_.mode == Partial) && finalFuncs.forall(_.mode == Final) &&
+        partialFuncs.corresponds(finalFuncs) { (lower, upper) =>
+          lower.aggregateFunction.semanticEquals(upper.aggregateFunction)
+        }
+
+    // The partial stage's aggregate attributes are its functions' `aggBufferAttributes`.
+    def partialAttrsValid: Boolean =
+      partialFuncs.flatMap(_.aggregateFunction.aggBufferAttributes)
+        .corresponds(partialAgg.aggregateAttributes)(_.semanticEquals(_))
+
+    // The final stage's aggregate attributes are its functions' `resultAttribute`s.
+    def finalAttrsValid: Boolean =
+      finalFuncs.map(_.resultAttribute)
+        .corresponds(finalAgg.aggregateAttributes)(_.semanticEquals(_))
+
+    // The partial stage outputs its keys followed by its `inputAggBufferAttributes`.
+    def partialOutputValid: Boolean =
+      (partialKeys ++ partialFuncs.flatMap(_.aggregateFunction.inputAggBufferAttributes))
+        .corresponds(partialAgg.resultExpressions)(_.semanticEquals(_))
+
+    // Only the final stage declares distribution expressions, and they are the grouping keys.
+    def distributionValid: Boolean =
+      partialAgg.requiredChildDistributionExpressions.isEmpty &&
+        finalAgg.requiredChildDistributionExpressions.exists { exprs =>
+          exprs.corresponds(finalKeys)(_.semanticEquals(_))
+        }
+
+    sameKeys && sameFunctions && partialAttrsValid && finalAttrsValid &&
+      partialOutputValid && distributionValid
+  }
+}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/adaptive/AdaptiveSparkPlanExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/adaptive/AdaptiveSparkPlanExec.scala
@@ -116,6 +116,7 @@ case class AdaptiveSparkPlanExec(
     Seq(
       RemoveRedundantProjects,
       ensureRequirements,
+      ReplaceHashWithSortAgg,
       RemoveRedundantSorts,
       DisableUnnecessaryBucketedScan,
       OptimizeSkewedJoin(ensureRequirements)

diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/HashAggregateExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/HashAggregateExec.scala
@@ -1153,6 +1153,15 @@ case class HashAggregateExec(
     }
   }
 
+  /**
+   * Creates a [[SortAggregateExec]] from this node's own distribution requirement, grouping and
+   * aggregate expressions, aggregate attributes, input buffer offset, result expressions and
+   * child, all passed along unchanged.
+   */
+  def toSortAggregate: SortAggregateExec = SortAggregateExec(
+    requiredChildDistributionExpressions, groupingExpressions, aggregateExpressions,
+    aggregateAttributes, initialInputBufferOffset, resultExpressions, child)
+
   override protected def withNewChildInternal(newChild: SparkPlan): HashAggregateExec =
     copy(child = newChild)
 }

diff --git a/sql/core/src/test/resources/tpcds-plan-stability/approved-plans-v1_4/q16.sf100/explain.txt b/sql/core/src/test/resources/tpcds-plan-stability/approved-plans-v1_4/q16.sf100/explain.txt
@@ -3,7 +3,7 @@
 +- Exchange (44)
    +- * HashAggregate (43)
       +- * HashAggregate (42)
-         +- * HashAggregate (41)
+         +- SortAggregate (41)
             +- * Project (40)
                +- * BroadcastHashJoin Inner BuildRight (39)
                   :- * Project (33)
@@ -221,21 +221,21 @@ Join condition: None
 Output [3]: [cs_order_number#5, cs_ext_ship_cost#6, cs_net_profit#7]
 Input [5]: [cs_ship_date_sk#1, cs_order_number#5, cs_ext_ship_cost#6, cs_net_profit#7, d_date_sk#23]
 
-(41) HashAggregate [codegen id : 11]
+(41) SortAggregate
 Input [3]: [cs_order_number#5, cs_ext_ship_cost#6, cs_net_profit#7]
 Keys [1]: [cs_order_number#5]
 Functions [2]: [partial_sum(UnscaledValue(cs_ext_ship_cost#6)), partial_sum(UnscaledValue(cs_net_profit#7))]
 Aggregate Attributes [2]: [sum(UnscaledValue(cs_ext_ship_cost#6))#26, sum(UnscaledValue(cs_net_profit#7))#27]
 Results [3]: [cs_order_number#5, sum#28, sum#29]
 
-(42) HashAggregate [codegen id : 11]
+(42) HashAggregate [codegen id : 12]
 Input [3]: [cs_order_number#5, sum#28, sum#29]
 Keys [1]: [cs_order_number#5]
 Functions [2]: [merge_sum(UnscaledValue(cs_ext_ship_cost#6)), merge_sum(UnscaledValue(cs_net_profit#7))]
 Aggregate Attributes [2]: [sum(UnscaledValue(cs_ext_ship_cost#6))#26, sum(UnscaledValue(cs_net_profit#7))#27]
 Results [3]: [cs_order_number#5, sum#28, sum#29]
 
-(43) HashAggregate [codegen id : 11]
+(43) HashAggregate [codegen id : 12]
 Input [3]: [cs_order_number#5, sum#28, sum#29]
 Keys: []
 Functions [3]: [merge_sum(UnscaledValue(cs_ext_ship_cost#6)), merge_sum(UnscaledValue(cs_net_profit#7)), partial_count(distinct cs_order_number#5)]
@@ -246,7 +246,7 @@ Results [3]: [sum#28, sum#29, count#31]
 Input [3]: [sum#28, sum#29, count#31]
 Arguments: SinglePartition, ENSURE_REQUIREMENTS, [id=#32]
 
-(45) HashAggregate [codegen id : 12]
+(45) HashAggregate [codegen id : 13]
 Input [3]: [sum#28, sum#29, count#31]
 Keys: []
 Functions [3]: [sum(UnscaledValue(cs_ext_ship_cost#6)), sum(UnscaledValue(cs_net_profit#7)), count(distinct cs_order_number#5)]