
[SPARK-22084][SQL] Fix performance regression in aggregation strategy #19301

Status: Closed · wants to merge 7 commits · Changes from 4 commits
@@ -38,7 +38,7 @@ import org.apache.spark.sql.internal.SQLConf
* view resolution, in this way, we are able to get the correct view column ordering and
* omit the extra columns that we don't require);
* 1.2. Else set the child output attributes to `queryOutput`.
- * 2. Map the `queryQutput` to view output by index, if the corresponding attributes don't match,
+ * 2. Map the `queryOutput` to view output by index, if the corresponding attributes don't match,
Contributor: It looks all the same?

Contributor (Author): Q -> O

* try to up cast and alias the attribute in `queryOutput` to the attribute in the view output.
* 3. Add a Project over the child, with the new output generated by the previous steps.
* If the view output doesn't have the same number of columns neither with the child output, nor
@@ -17,6 +17,8 @@

package org.apache.spark.sql.catalyst.expressions.aggregate

import java.util.Objects

import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.analysis.UnresolvedAttribute
import org.apache.spark.sql.catalyst.expressions._
@@ -72,11 +74,19 @@ object AggregateExpression {
aggregateFunction: AggregateFunction,
mode: AggregateMode,
isDistinct: Boolean): AggregateExpression = {
val state = if (aggregateFunction.resolved) {
Seq(aggregateFunction.toString, aggregateFunction.dataType,
aggregateFunction.nullable, mode, isDistinct)
} else {
Seq(aggregateFunction.toString, mode, isDistinct)
}
val hashCode = state.map(Objects.hashCode).foldLeft(0)((a, b) => 31 * a + b)
Contributor: what's the purpose here?


AggregateExpression(
aggregateFunction,
mode,
isDistinct,
-    NamedExpression.newExprId)
+    ExprId(hashCode))
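Taken on its own, the id scheme in this diff can be sketched as a standalone snippet: fold the aggregate function's semantic state into one `Int` with the same `31 * a + b` fold, so two semantically identical aggregates (e.g. `SUM(b) AS b0` and `SUM(b) AS b1`) receive the same `ExprId`. `SemanticState` and `stableId` below are hypothetical names for illustration, not Spark's API.

```scala
import java.util.Objects

object StableIdDemo {
  // Hypothetical container for the pieces of state the diff hashes.
  final case class SemanticState(
      funcString: String,
      dataType: String,
      nullable: Boolean,
      mode: String,
      isDistinct: Boolean)

  def stableId(s: SemanticState): Int = {
    val state: Seq[Any] =
      Seq(s.funcString, s.dataType, s.nullable, s.mode, s.isDistinct)
    // Same fold as the diff: Objects.hashCode over each (boxed) element.
    state
      .map(x => Objects.hashCode(x.asInstanceOf[AnyRef]))
      .foldLeft(0)((a, b) => 31 * a + b)
  }

  def main(args: Array[String]): Unit = {
    // Two aggregates with identical semantic state, as in
    // SELECT SUM(b) AS b0, SUM(b) AS b1.
    val b0 = SemanticState("sum(b)", "LongType", nullable = true, "Complete", isDistinct = false)
    val b1 = SemanticState("sum(b)", "LongType", nullable = true, "Complete", isDistinct = false)
    // Identical state yields identical ids, so both collapse onto one ExprId.
    assert(stableId(b0) == stableId(b1))
    println("ok")
  }
}
```

This is exactly what the reviewers object to below: the id is derived from semantics rather than being freshly allocated.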
Contributor (@cloud-fan, Sep 22, 2017):
I don't think this is the right fix. Semantically the b0 and b1 in SELECT SUM(b) AS b0, SUM(b) AS b1 are different aggregate functions, so they should have different resultId.

It's kind of an optimization in aggregate planner, we should detect these semantically different but duplicated aggregate functions and only plan one of them.
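A planner-side version of that suggestion could look roughly like the sketch below (the `Agg` type and `planOnce` are illustrative stand-ins, not Spark's planner API): each aggregate keeps its own distinct id, but the planner groups semantically equal ones, evaluates one representative, and rewrites the remaining result expressions to reference it.

```scala
object DedupDemo {
  // Hypothetical stand-in for an aggregate expression: a unique id plus a
  // key describing its semantics (function, input, mode, distinctness).
  final case class Agg(id: Long, semanticKey: String, alias: String)

  // Returns the representatives to physically evaluate, plus a rewrite
  // table mapping every duplicate's id to its representative's id.
  def planOnce(aggs: Seq[Agg]): (Seq[Agg], Map[Long, Long]) = {
    // One representative per semantic key.
    val reps = aggs.groupBy(_.semanticKey).map { case (_, vs) => vs.head }.toSeq
    val repId = reps.map(a => a.semanticKey -> a.id).toMap
    // Every id points at its representative's id.
    val rewrite = aggs.map(a => a.id -> repId(a.semanticKey)).toMap
    (reps, rewrite)
  }

  def main(args: Array[String]): Unit = {
    // SELECT SUM(b) AS b0, SUM(b) AS b1: different ids, same semantics.
    val aggs = Seq(Agg(0L, "sum(b)", "b0"), Agg(1L, "sum(b)", "b1"))
    val (planned, rewrite) = planOnce(aggs)
    assert(planned.size == 1)  // SUM(b) is physically evaluated once
    assert(rewrite(1L) == 0L)  // b1 is rewritten to reuse b0's result
    println("ok")
  }
}
```

The open question, raised by the author further down, is what to use as the semantic key; the thread shows why a string-based key breaks for typed aggregators.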

Member: I agree with @cloud-fan. This should be an optimization done in the aggregate planner, instead of forcibly setting the expr id here.

Contributor (Author, @stanzhai, Sep 25, 2017):
@cloud-fan @viirya I've tried to optimize this in the aggregate planner (https://github.com/apache/spark/blob/master/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/planning/patterns.scala#L211).

      // A single aggregate expression might appear multiple times in resultExpressions.
      // In order to avoid evaluating an individual aggregate function multiple times, we'll
      // build a set of the distinct aggregate expressions and build a function which can
      // be used to re-write expressions so that they reference the single copy of the
      // aggregate function which actually gets computed.
      val aggregateExpressions = resultExpressions.flatMap { expr =>
        expr.collect {
          case agg: AggregateExpression =>
            val aggregateFunction = agg.aggregateFunction
            val state = if (aggregateFunction.resolved) {
              Seq(aggregateFunction.toString, aggregateFunction.dataType,
                aggregateFunction.nullable, agg.mode, agg.isDistinct)
            } else {
              Seq(aggregateFunction.toString, agg.mode, agg.isDistinct)
            }
            val hashCode = state.map(Objects.hashCode).foldLeft(0)((a, b) => 31 * a + b)
            (hashCode, agg)
        }
      }.groupBy(_._1).map { case (_, values) =>
        values.head._2
      }.toSeq

But it's difficult to distinguish between different typed aggregators without an expr id. The current solution works well for all aggregate functions.

I'm not familiar with typed aggregators; any suggestions would be appreciated.
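The difficulty the author mentions can be illustrated with a small sketch: a key built only from `toString`/mode/`isDistinct` cannot tell apart two *different* typed aggregators that happen to print identically, so a planner keyed on that state would wrongly merge them. `TypedAgg` below is a hypothetical stand-in, not Spark's `TypedAggregateExpression`.

```scala
object TypedKeyCollision {
  // A toy "typed aggregator": its behavior lives in a closure that is not
  // reflected in its string form.
  class TypedAgg(val reduce: Int => Int) {
    override def toString: String = "TypedAgg"
  }

  def main(args: Array[String]): Unit = {
    val double = new TypedAgg(_ * 2)
    val triple = new TypedAgg(_ * 3)
    // Indistinguishable by a string-based semantic key...
    assert(double.toString == triple.toString)
    // ...yet semantically different aggregations.
    assert(double.reduce(1) != triple.reduce(1))
    println("ok")
  }
}
```

This is why the thread leans on expr ids (or a real semantic-equality check) rather than a purely string-derived key for typed aggregators.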

}
}

@@ -20,6 +20,7 @@ package org.apache.spark.sql.expressions
import org.apache.spark.annotation.{Experimental, InterfaceStability}
import org.apache.spark.sql.{Dataset, Encoder, TypedColumn}
import org.apache.spark.sql.catalyst.encoders.encoderFor
import org.apache.spark.sql.catalyst.expressions.NamedExpression
import org.apache.spark.sql.catalyst.expressions.aggregate.{AggregateExpression, Complete}
import org.apache.spark.sql.execution.aggregate.TypedAggregateExpression

@@ -104,7 +105,8 @@ abstract class Aggregator[-IN, BUF, OUT] extends Serializable {
AggregateExpression(
TypedAggregateExpression(this),
Complete,
-      isDistinct = false)
+      isDistinct = false,
+      NamedExpression.newExprId)

new TypedColumn[IN, OUT](expr, encoderFor[OUT])
}