[SPARK-51371][SQL] Change toString to toPrettySQL when building Aliases in ResolveAggregateFunctions

mihailoale-db · cloud-fan · commit 6ba4771842a7 · 2025-03-05T21:41:17.000+08:00
### What changes were proposed in this pull request? In this PR I propose that we use `toPrettySQL` instead of `toString` when building `Alias`es in `ResolveAggregateFunctions`. ### Why are the changes needed? Right now you can write a DataFrame program that references a column whose implicit alias contains an expression id in its name. If we switch from `toString` to `toPrettySQL`, the `Alias` name will no longer contain expression ids, and thus users won't be able to rely on this. For example: ``` import org.apache.spark.sql.functions._ val df = spark.sql("SELECT col1 FROM VALUES (1, 2) GROUP BY col1 ORDER BY MAX(col2)") df.queryExecution.analyzed df.where(col("max(col2#10)") === 0).queryExecution.analyzed ``` The program above can work (if `df.queryExecution.analyzed` shows that the name of the `AggregateExpression` alias is `max(col2#10)`). But when it is run again it might fail, because expression ids can be generated differently, so we want to disable that (to enforce deterministic behavior in DataFrame programs). ### Does this PR introduce _any_ user-facing change? Some DataFrame programs are going to fail (but they would fail with every cluster reset anyway, as explained above). ### How was this patch tested? Existing tests. ### Was this patch authored or co-authored using generative AI tooling? No. Closes #50136 from mihailoale-db/toprettysqlresolveaggregatefunctions. Authored-by: mihailoale-db <mihailo.aleksic@databricks.com> Signed-off-by: Wenchen Fan <wenchen@databricks.com>
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/Analyzer.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/Analyzer.scala
@@ -2768,7 +2768,7 @@ class Analyzer(override val catalogManager: CatalogManager) extends RuleExecutor
         expr match {
           case ae: AggregateExpression =>
             val cleaned = trimTempResolvedColumn(ae)
-            val alias = Alias(cleaned, cleaned.toString)()
+            val alias = Alias(cleaned, toPrettySQL(cleaned))()
             aggExprList += alias
             alias.toAttribute
           case grouping: Expression if agg.groupingExpressions.exists(grouping.semanticEquals) =>
@@ -2777,7 +2777,7 @@ class Analyzer(override val catalogManager: CatalogManager) extends RuleExecutor
                 aggExprList += ne
                 ne.toAttribute
               case other =>
-                val alias = Alias(other, other.toString)()
+                val alias = Alias(other, toPrettySQL(other))()
                 aggExprList += alias
                 alias.toAttribute
             }
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/bitwise.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/bitwise.sql.out
@@ -248,8 +248,8 @@ Aggregate [(b1#x & 1)], [bit_xor(b3#x) AS bit_xor(b3)#x]
 SELECT b1, bit_xor(b2) FROM bitwise_test GROUP BY b1 HAVING bit_and(b2) < 7
 -- !query analysis
 Project [b1#x, bit_xor(b2)#x]
-+- Filter (bit_and(b2#x)#x < 7)
-   +- Aggregate [b1#x], [b1#x, bit_xor(b2#x) AS bit_xor(b2)#x, bit_and(b2#x) AS bit_and(b2#x)#x]
++- Filter (bit_and(b2)#x < 7)
+   +- Aggregate [b1#x], [b1#x, bit_xor(b2#x) AS bit_xor(b2)#x, bit_and(b2#x) AS bit_and(b2)#x]
       +- SubqueryAlias bitwise_test
          +- View (`bitwise_test`, [b1#x, b2#x, b3#x, b4#xL])
             +- Project [cast(b1#x as int) AS b1#x, cast(b2#x as int) AS b2#x, cast(b3#x as int) AS b3#x, cast(b4#xL as bigint) AS b4#xL]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/group-by-all-mosha.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/group-by-all-mosha.sql.out
@@ -91,8 +91,8 @@ SELECT s AS s, COUNT(*) c FROM stuff GROUP BY ALL HAVING SUM(f) > 0 ORDER BY s
 -- !query analysis
 Sort [s#x ASC NULLS FIRST], true
 +- Project [s#x, c#xL]
-   +- Filter (sum(f#x)#x > cast(cast(0 as decimal(1,0)) as decimal(16,4)))
-      +- Aggregate [s#x], [s#x AS s#x, count(1) AS c#xL, sum(f#x) AS sum(f#x)#x]
+   +- Filter (sum(f)#x > cast(cast(0 as decimal(1,0)) as decimal(16,4)))
+      +- Aggregate [s#x], [s#x AS s#x, count(1) AS c#xL, sum(f#x) AS sum(f)#x]
          +- SubqueryAlias stuff
             +- View (`stuff`, [i#x, f#x, s#x, t#x, d#x, a#x])
                +- Project [cast(i#x as int) AS i#x, cast(f#x as decimal(6,4)) AS f#x, cast(s#x as string) AS s#x, cast(t#x as string) AS t#x, cast(d#x as string) AS d#x, cast(a#x as array<int>) AS a#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/group-by.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/group-by.sql.out
@@ -315,8 +315,8 @@ Filter cast(true as boolean)
 SELECT 1 FROM range(10) HAVING MAX(id) > 0
 -- !query analysis
 Project [1#x]
-+- Filter (max(id#xL)#xL > cast(0 as bigint))
-   +- Aggregate [1 AS 1#x, max(id#xL) AS max(id#xL)#xL]
++- Filter (max(id)#xL > cast(0 as bigint))
+   +- Aggregate [1 AS 1#x, max(id#xL) AS max(id)#xL]
       +- Range (0, 10, step=1)
 
 
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/having.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/having.sql.out
@@ -35,8 +35,8 @@ Filter (sum(v)#xL > cast(2 as bigint))
 SELECT count(k) FROM hav GROUP BY v + 1 HAVING v + 1 = 2
 -- !query analysis
 Project [count(k)#xL]
-+- Filter ((v#x + 1)#x = 2)
-   +- Aggregate [(v#x + 1)], [count(k#x) AS count(k)#xL, (v#x + 1) AS (v#x + 1)#x]
++- Filter ((v + 1)#x = 2)
+   +- Aggregate [(v#x + 1)], [count(k#x) AS count(k)#xL, (v#x + 1) AS (v + 1)#x]
       +- SubqueryAlias hav
          +- View (`hav`, [k#x, v#x])
             +- Project [cast(k#x as string) AS k#x, cast(v#x as int) AS v#x]
@@ -199,9 +199,9 @@ Sort [sum(v)#xL ASC NULLS FIRST], true
 SELECT k, sum(v) FROM hav GROUP BY k HAVING sum(v) > 2 ORDER BY avg(v)
 -- !query analysis
 Project [k#x, sum(v)#xL]
-+- Sort [avg(v#x)#x ASC NULLS FIRST], true
++- Sort [avg(v)#x ASC NULLS FIRST], true
    +- Filter (sum(v)#xL > cast(2 as bigint))
-      +- Aggregate [k#x], [k#x, sum(v#x) AS sum(v)#xL, avg(v#x) AS avg(v#x)#x]
+      +- Aggregate [k#x], [k#x, sum(v#x) AS sum(v)#xL, avg(v#x) AS avg(v)#x]
          +- SubqueryAlias hav
             +- View (`hav`, [k#x, v#x])
                +- Project [cast(k#x as string) AS k#x, cast(v#x as int) AS v#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/aggregates_part3.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/aggregates_part3.sql.out
@@ -38,13 +38,13 @@ group by ten
 having exists (select 1 from onek b where sum(distinct a.four) = b.four)
 -- !query analysis
 Project [ten#x, sum(DISTINCT four) FILTER (WHERE (four > 10))#xL]
-+- Filter exists#x [sum(distinct four#x)#xL]
++- Filter exists#x [sum(DISTINCT four)#xL]
    :  +- Project [1 AS 1#x]
-   :     +- Filter (outer(sum(distinct four#x)#xL) = cast(four#x as bigint))
+   :     +- Filter (outer(sum(DISTINCT four)#xL) = cast(four#x as bigint))
    :        +- SubqueryAlias b
    :           +- SubqueryAlias spark_catalog.default.onek
    :              +- Relation spark_catalog.default.onek[unique1#x,unique2#x,two#x,four#x,ten#x,twenty#x,hundred#x,thousand#x,twothousand#x,fivethous#x,tenthous#x,odd#x,even#x,stringu1#x,stringu2#x,string4#x] parquet
-   +- Aggregate [ten#x], [ten#x, sum(distinct four#x) FILTER (WHERE (four#x > 10)) AS sum(DISTINCT four) FILTER (WHERE (four > 10))#xL, sum(distinct four#x) AS sum(distinct four#x)#xL]
+   +- Aggregate [ten#x], [ten#x, sum(distinct four#x) FILTER (WHERE (four#x > 10)) AS sum(DISTINCT four) FILTER (WHERE (four > 10))#xL, sum(distinct four#x) AS sum(DISTINCT four)#xL]
       +- SubqueryAlias a
          +- SubqueryAlias spark_catalog.default.onek
             +- Relation spark_catalog.default.onek[unique1#x,unique2#x,two#x,four#x,ten#x,twenty#x,hundred#x,thousand#x,twothousand#x,fivethous#x,tenthous#x,odd#x,even#x,stringu1#x,stringu2#x,string4#x] parquet
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/select_having.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/select_having.sql.out
@@ -115,8 +115,8 @@ SELECT c, max(a) FROM test_having
 -- !query analysis
 Sort [c#x ASC NULLS FIRST], true
 +- Project [c#x, max(a)#x]
-   +- Filter ((count(1)#xL > cast(2 as bigint)) OR (min(a#x)#x = max(a)#x))
-      +- Aggregate [c#x], [c#x, max(a#x) AS max(a)#x, count(1) AS count(1)#xL, min(a#x) AS min(a#x)#x]
+   +- Filter ((count(1)#xL > cast(2 as bigint)) OR (min(a)#x = max(a)#x))
+      +- Aggregate [c#x], [c#x, max(a#x) AS max(a)#x, count(1) AS count(1)#xL, min(a#x) AS min(a)#x]
          +- SubqueryAlias spark_catalog.default.test_having
             +- Relation spark_catalog.default.test_having[a#x,b#x,c#x,d#x] parquet
 
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/select_implicit.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/select_implicit.sql.out
@@ -310,8 +310,8 @@ GROUP BY lower(test_missing_target.c)
 ORDER BY lower(test_missing_target.c)
 -- !query analysis
 Project [count(c)#xL]
-+- Sort [lower(c#x)#x ASC NULLS FIRST], true
-   +- Aggregate [lower(c#x)], [count(c#x) AS count(c)#xL, lower(c#x) AS lower(c#x)#x]
++- Sort [lower(c)#x ASC NULLS FIRST], true
+   +- Aggregate [lower(c#x)], [count(c#x) AS count(c)#xL, lower(c#x) AS lower(c)#x]
       +- SubqueryAlias spark_catalog.default.test_missing_target
          +- Relation spark_catalog.default.test_missing_target[a#x,b#x,c#x,d#x] parquet
 
@@ -341,8 +341,8 @@ org.apache.spark.sql.catalyst.ExtendedAnalysisException
 SELECT count(b) FROM test_missing_target GROUP BY b/2 ORDER BY b/2
 -- !query analysis
 Project [count(b)#xL]
-+- Sort [(cast(b#x as double) / cast(2 as double))#x ASC NULLS FIRST], true
-   +- Aggregate [(cast(b#x as double) / cast(2 as double))], [count(b#x) AS count(b)#xL, (cast(b#x as double) / cast(2 as double)) AS (cast(b#x as double) / cast(2 as double))#x]
++- Sort [(b / 2)#x ASC NULLS FIRST], true
+   +- Aggregate [(cast(b#x as double) / cast(2 as double))], [count(b#x) AS count(b)#xL, (cast(b#x as double) / cast(2 as double)) AS (b / 2)#x]
       +- SubqueryAlias spark_catalog.default.test_missing_target
          +- Relation spark_catalog.default.test_missing_target[a#x,b#x,c#x,d#x] parquet
 
@@ -372,8 +372,8 @@ SELECT count(b) FROM test_missing_target
 	GROUP BY (b + 1) / 2 ORDER BY (b + 1) / 2 desc
 -- !query analysis
 Project [count(b)#xL]
-+- Sort [(cast((b#x + 1) as double) / cast(2 as double))#x DESC NULLS LAST], true
-   +- Aggregate [(cast((b#x + 1) as double) / cast(2 as double))], [count(b#x) AS count(b)#xL, (cast((b#x + 1) as double) / cast(2 as double)) AS (cast((b#x + 1) as double) / cast(2 as double))#x]
++- Sort [((b + 1) / 2)#x DESC NULLS LAST], true
+   +- Aggregate [(cast((b#x + 1) as double) / cast(2 as double))], [count(b#x) AS count(b)#xL, (cast((b#x + 1) as double) / cast(2 as double)) AS ((b + 1) / 2)#x]
       +- SubqueryAlias spark_catalog.default.test_missing_target
          +- Relation spark_catalog.default.test_missing_target[a#x,b#x,c#x,d#x] parquet
 
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/sql-session-variables.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/sql-session-variables.sql.out
@@ -1995,8 +1995,8 @@ Aggregate [(c1#x + variablereference(system.session.var1=1))], [1 AS 1#x]
 SELECT c1, sum(c2) FROM VALUES(1, 2) AS T(c1, c2) GROUP BY c1 HAVING sum(c1) != var1
 -- !query analysis
 Project [c1#x, sum(c2)#xL]
-+- Filter NOT (sum(c1#x)#xL = cast(variablereference(system.session.var1=1) as bigint))
-   +- Aggregate [c1#x], [c1#x, sum(c2#x) AS sum(c2)#xL, sum(c1#x) AS sum(c1#x)#xL]
++- Filter NOT (sum(c1)#xL = cast(variablereference(system.session.var1=1) as bigint))
+   +- Aggregate [c1#x], [c1#x, sum(c2#x) AS sum(c2)#xL, sum(c1#x) AS sum(c1)#xL]
       +- SubqueryAlias T
          +- LocalRelation [c1#x, c2#x]
 
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/subquery/exists-subquery/exists-having.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/subquery/exists-subquery/exists-having.sql.out
@@ -75,14 +75,14 @@ HAVING EXISTS (SELECT 1
                WHERE  bonus_amt < min(emp.salary))
 -- !query analysis
 Project [dept_id#x, count(1)#xL]
-+- Filter exists#x [min(salary#x)#x]
++- Filter exists#x [min(salary)#x]
    :  +- Project [1 AS 1#x]
-   :     +- Filter (bonus_amt#x < outer(min(salary#x)#x))
+   :     +- Filter (bonus_amt#x < outer(min(salary)#x))
    :        +- SubqueryAlias bonus
    :           +- View (`BONUS`, [emp_name#x, bonus_amt#x])
    :              +- Project [cast(col1#x as string) AS emp_name#x, cast(col2#x as double) AS bonus_amt#x]
    :                 +- LocalRelation [col1#x, col2#x]
-   +- Aggregate [dept_id#x], [dept_id#x, count(1) AS count(1)#xL, min(salary#x) AS min(salary#x)#x]
+   +- Aggregate [dept_id#x], [dept_id#x, count(1) AS count(1)#xL, min(salary#x) AS min(salary)#x]
       +- SubqueryAlias emp
          +- View (`EMP`, [id#x, emp_name#x, hiredate#x, salary#x, dept_id#x])
             +- Project [cast(col1#x as int) AS id#x, cast(col2#x as string) AS emp_name#x, cast(col3#x as date) AS hiredate#x, cast(col4#x as double) AS salary#x, cast(col5#x as int) AS dept_id#x]
@@ -103,14 +103,14 @@ WHERE  EXISTS (SELECT dept_id,
 Project [dept_id#x, dept_name#x, state#x]
 +- Filter exists#x []
    :  +- Project [dept_id#x, count(1)#xL]
-   :     +- Filter exists#x [min(salary#x)#x]
+   :     +- Filter exists#x [min(salary)#x]
    :        :  +- Project [1 AS 1#x]
-   :        :     +- Filter (bonus_amt#x < outer(min(salary#x)#x))
+   :        :     +- Filter (bonus_amt#x < outer(min(salary)#x))
    :        :        +- SubqueryAlias bonus
    :        :           +- View (`BONUS`, [emp_name#x, bonus_amt#x])
    :        :              +- Project [cast(col1#x as string) AS emp_name#x, cast(col2#x as double) AS bonus_amt#x]
    :        :                 +- LocalRelation [col1#x, col2#x]
-   :        +- Aggregate [dept_id#x], [dept_id#x, count(1) AS count(1)#xL, min(salary#x) AS min(salary#x)#x]
+   :        +- Aggregate [dept_id#x], [dept_id#x, count(1) AS count(1)#xL, min(salary#x) AS min(salary)#x]
    :           +- SubqueryAlias emp
    :              +- View (`EMP`, [id#x, emp_name#x, hiredate#x, salary#x, dept_id#x])
    :                 +- Project [cast(col1#x as int) AS id#x, cast(col2#x as string) AS emp_name#x, cast(col3#x as date) AS hiredate#x, cast(col4#x as double) AS salary#x, cast(col5#x as int) AS dept_id#x]
@@ -137,14 +137,14 @@ GROUP  BY gp.dept_id
 Aggregate [dept_id#x], [dept_id#x, max(salary#x) AS max(salary)#x]
 +- Filter exists#x []
    :  +- Project [dept_id#x, count(1)#xL]
-   :     +- Filter exists#x [min(salary#x)#x]
+   :     +- Filter exists#x [min(salary)#x]
    :        :  +- Project [1 AS 1#x]
-   :        :     +- Filter (bonus_amt#x < outer(min(salary#x)#x))
+   :        :     +- Filter (bonus_amt#x < outer(min(salary)#x))
    :        :        +- SubqueryAlias bonus
    :        :           +- View (`BONUS`, [emp_name#x, bonus_amt#x])
    :        :              +- Project [cast(col1#x as string) AS emp_name#x, cast(col2#x as double) AS bonus_amt#x]
    :        :                 +- LocalRelation [col1#x, col2#x]
-   :        +- Aggregate [dept_id#x], [dept_id#x, count(1) AS count(1)#xL, min(salary#x) AS min(salary#x)#x]
+   :        +- Aggregate [dept_id#x], [dept_id#x, count(1) AS count(1)#xL, min(salary#x) AS min(salary)#x]
    :           +- SubqueryAlias p
    :              +- SubqueryAlias emp
    :                 +- View (`EMP`, [id#x, emp_name#x, hiredate#x, salary#x, dept_id#x])
@@ -171,14 +171,14 @@ WHERE  EXISTS (SELECT dept_id,
 Project [dept_id#x, dept_name#x, state#x]
 +- Filter exists#x []
    :  +- Project [dept_id#x, count(1)#xL]
-   :     +- Filter exists#x [min(salary#x)#x]
+   :     +- Filter exists#x [min(salary)#x]
    :        :  +- Project [1 AS 1#x]
-   :        :     +- Filter (bonus_amt#x > outer(min(salary#x)#x))
+   :        :     +- Filter (bonus_amt#x > outer(min(salary)#x))
    :        :        +- SubqueryAlias bonus
    :        :           +- View (`BONUS`, [emp_name#x, bonus_amt#x])
    :        :              +- Project [cast(col1#x as string) AS emp_name#x, cast(col2#x as double) AS bonus_amt#x]
    :        :                 +- LocalRelation [col1#x, col2#x]
-   :        +- Aggregate [dept_id#x], [dept_id#x, count(1) AS count(1)#xL, min(salary#x) AS min(salary#x)#x]
+   :        +- Aggregate [dept_id#x], [dept_id#x, count(1) AS count(1)#xL, min(salary#x) AS min(salary)#x]
    :           +- SubqueryAlias emp
    :              +- View (`EMP`, [id#x, emp_name#x, hiredate#x, salary#x, dept_id#x])
    :                 +- Project [cast(col1#x as int) AS id#x, cast(col2#x as string) AS emp_name#x, cast(col3#x as date) AS hiredate#x, cast(col4#x as double) AS salary#x, cast(col5#x as int) AS dept_id#x]
@@ -205,14 +205,14 @@ WHERE  EXISTS (SELECT dept_id,
 Project [dept_id#x, dept_name#x, state#x]
 +- Filter exists#x [dept_id#x]
    :  +- Project [dept_id#x, count(dept_id)#xL]
-   :     +- Filter exists#x [min(salary#x)#x && count(dept_id)#xL]
+   :     +- Filter exists#x [min(salary)#x && count(dept_id)#xL]
    :        :  +- Project [1 AS 1#x]
-   :        :     +- Filter ((bonus_amt#x > outer(min(salary#x)#x)) AND (outer(count(dept_id)#xL) > cast(1 as bigint)))
+   :        :     +- Filter ((bonus_amt#x > outer(min(salary)#x)) AND (outer(count(dept_id)#xL) > cast(1 as bigint)))
    :        :        +- SubqueryAlias bonus
    :        :           +- View (`BONUS`, [emp_name#x, bonus_amt#x])
    :        :              +- Project [cast(col1#x as string) AS emp_name#x, cast(col2#x as double) AS bonus_amt#x]
    :        :                 +- LocalRelation [col1#x, col2#x]
-   :        +- Aggregate [dept_id#x], [dept_id#x, count(dept_id#x) AS count(dept_id)#xL, min(salary#x) AS min(salary#x)#x]
+   :        +- Aggregate [dept_id#x], [dept_id#x, count(dept_id#x) AS count(dept_id)#xL, min(salary#x) AS min(salary)#x]
    :           +- Filter (outer(dept_id#x) = dept_id#x)
    :              +- SubqueryAlias emp
    :                 +- View (`EMP`, [id#x, emp_name#x, hiredate#x, salary#x, dept_id#x])
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/subquery/in-subquery/in-having.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/subquery/in-subquery/in-having.sql.out
@@ -203,8 +203,8 @@ GROUP BY t1a, t1b, t1c
 HAVING COUNT (DISTINCT t1b) < 10
 -- !query analysis
 Project [t1a#x, t1b#x, t1c#x]
-+- Filter (count(distinct t1b#x)#xL < cast(10 as bigint))
-   +- Aggregate [t1a#x, t1b#x, t1c#x], [t1a#x, t1b#x, t1c#x, count(distinct t1b#x) AS count(distinct t1b#x)#xL]
++- Filter (count(DISTINCT t1b)#xL < cast(10 as bigint))
+   +- Aggregate [t1a#x, t1b#x, t1c#x], [t1a#x, t1b#x, t1c#x, count(distinct t1b#x) AS count(DISTINCT t1b)#xL]
       +- Filter t1b#x IN (list#x [t1c#x])
          :  +- Project [t2b#x]
          :     +- Filter (outer(t1c#x) = t2c#x)
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/subquery/in-subquery/not-in-joins.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/subquery/in-subquery/not-in-joins.sql.out
@@ -341,8 +341,8 @@ GROUP BY t1b,
 HAVING   t1b < sum(t1c)
 -- !query analysis
 Project [count(DISTINCT t1a)#xL, t1b#x, t1c#x, t1d#xL]
-+- Filter (cast(t1b#x as bigint) < sum(t1c#x)#xL)
-   +- Aggregate [t1b#x, t1c#x, t1d#xL], [count(distinct t1a#x) AS count(DISTINCT t1a)#xL, t1b#x, t1c#x, t1d#xL, sum(t1c#x) AS sum(t1c#x)#xL]
++- Filter (cast(t1b#x as bigint) < sum(t1c)#xL)
+   +- Aggregate [t1b#x, t1c#x, t1d#xL], [count(distinct t1a#x) AS count(DISTINCT t1a)#xL, t1b#x, t1c#x, t1d#xL, sum(t1c#x) AS sum(t1c)#xL]
       +- Filter NOT t1a#x IN (list#x [])
          :  +- Project [t2a#x]
          :     +- Join Inner, (t1a#x = t2a#x)
@@ -390,8 +390,8 @@ GROUP BY t1b,
 HAVING   t1b < sum(t1c)
 -- !query analysis
 Project [count(DISTINCT t1a)#xL, t1b#x, t1c#x, t1d#xL]
-+- Filter (cast(t1b#x as bigint) < sum(t1c#x)#xL)
-   +- Aggregate [t1b#x, t1c#x, t1d#xL], [count(distinct t1a#x) AS count(DISTINCT t1a)#xL, t1b#x, t1c#x, t1d#xL, sum(t1c#x) AS sum(t1c#x)#xL]
++- Filter (cast(t1b#x as bigint) < sum(t1c)#xL)
+   +- Aggregate [t1b#x, t1c#x, t1d#xL], [count(distinct t1a#x) AS count(DISTINCT t1a)#xL, t1b#x, t1c#x, t1d#xL, sum(t1c#x) AS sum(t1c)#xL]
       +- Filter (NOT t1a#x IN (list#x []) AND NOT t1d#xL IN (list#x []))
          :  :- Project [t2a#x]
          :  :  +- Join Inner, (t1a#x = t2a#x)
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/subquery/scalar-subquery/scalar-subquery-predicate.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/subquery/scalar-subquery/scalar-subquery-predicate.sql.out
@@ -862,7 +862,7 @@ HAVING   max(t1b) <= (SELECT   max(t2b)
                       GROUP BY t2c)
 -- !query analysis
 Project [t1a#x]
-+- Filter (max(t1b#x)#x <= scalar-subquery#x [t1c#x])
++- Filter (max(t1b)#x <= scalar-subquery#x [t1c#x])
    :  +- Aggregate [t2c#x], [max(t2b#x) AS max(t2b)#x]
    :     +- Filter (t2c#x = outer(t1c#x))
    :        +- SubqueryAlias t2
@@ -871,7 +871,7 @@ Project [t1a#x]
    :                 +- Project [t2a#x, t2b#x, t2c#x, t2d#xL, t2e#x, t2f#x, t2g#x, t2h#x, t2i#x]
    :                    +- SubqueryAlias t2
    :                       +- LocalRelation [t2a#x, t2b#x, t2c#x, t2d#xL, t2e#x, t2f#x, t2g#x, t2h#x, t2i#x]
-   +- Aggregate [t1a#x, t1c#x], [t1a#x, max(t1b#x) AS max(t1b#x)#x, t1c#x]
+   +- Aggregate [t1a#x, t1c#x], [t1a#x, max(t1b#x) AS max(t1b)#x, t1c#x]
       +- SubqueryAlias t1
          +- View (`t1`, [t1a#x, t1b#x, t1c#x, t1d#xL, t1e#x, t1f#x, t1g#x, t1h#x, t1i#x])
             +- Project [cast(t1a#x as string) AS t1a#x, cast(t1b#x as smallint) AS t1b#x, cast(t1c#x as int) AS t1c#x, cast(t1d#xL as bigint) AS t1d#xL, cast(t1e#x as float) AS t1e#x, cast(t1f#x as double) AS t1f#x, cast(t1g#x as decimal(4,0)) AS t1g#x, cast(t1h#x as timestamp) AS t1h#x, cast(t1i#x as date) AS t1i#x]
@@ -1204,8 +1204,8 @@ Project [t1a#x, t1b#x]
    :  +- GlobalLimit 1
    :     +- LocalLimit 1
    :        +- Project [max(t2c)#x]
-   :           +- Sort [min(t2c#x)#x ASC NULLS FIRST], true
-   :              +- Aggregate [max(t2c#x) AS max(t2c)#x, min(t2c#x) AS min(t2c#x)#x]
+   :           +- Sort [min(t2c)#x ASC NULLS FIRST], true
+   :              +- Aggregate [max(t2c#x) AS max(t2c)#x, min(t2c#x) AS min(t2c)#x]
    :                 +- Filter (cast(outer(t1b#x) as bigint) < outer(t1d#xL))
    :                    +- SubqueryAlias t2
    :                       +- View (`t2`, [t2a#x, t2b#x, t2c#x, t2d#xL, t2e#x, t2f#x, t2g#x, t2h#x, t2i#x])
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/udf/postgreSQL/udf-aggregates_part1.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/udf/postgreSQL/udf-aggregates_part1.sql.out
@@ -454,13 +454,13 @@ group by ten
 having exists (select 1 from onek b where udf(sum(distinct a.four)) = b.four)
 -- !query analysis
 Project [ten#x, udf(sum(DISTINCT four))#xL]
-+- Filter exists#x [sum(distinct four#x)#xL]
++- Filter exists#x [sum(DISTINCT four)#xL]
    :  +- Project [1 AS 1#x]
    :     +- Filter (outer(udf(sum(DISTINCT four))#xL) = cast(four#x as bigint))
    :        +- SubqueryAlias b
    :           +- SubqueryAlias spark_catalog.default.onek
    :              +- Relation spark_catalog.default.onek[unique1#x,unique2#x,two#x,four#x,ten#x,twenty#x,hundred#x,thousand#x,twothousand#x,fivethous#x,tenthous#x,odd#x,even#x,stringu1#x,stringu2#x,string4#x] parquet
-   +- Aggregate [ten#x], [ten#x, cast(udf(cast(sum(distinct four#x) as string)) as bigint) AS udf(sum(DISTINCT four))#xL, sum(distinct four#x) AS sum(distinct four#x)#xL]
+   +- Aggregate [ten#x], [ten#x, cast(udf(cast(sum(distinct four#x) as string)) as bigint) AS udf(sum(DISTINCT four))#xL, sum(distinct four#x) AS sum(DISTINCT four)#xL]
       +- SubqueryAlias a
          +- SubqueryAlias spark_catalog.default.onek
             +- Relation spark_catalog.default.onek[unique1#x,unique2#x,two#x,four#x,ten#x,twenty#x,hundred#x,thousand#x,twothousand#x,fivethous#x,tenthous#x,odd#x,even#x,stringu1#x,stringu2#x,string4#x] parquet
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/udf/postgreSQL/udf-aggregates_part2.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/udf/postgreSQL/udf-aggregates_part2.sql.out
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/udf/postgreSQL/udf-select_having.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/udf/postgreSQL/udf-select_having.sql.out
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/udf/postgreSQL/udf-select_implicit.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/udf/postgreSQL/udf-select_implicit.sql.out
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/udf/udf-group-by.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/udf/udf-group-by.sql.out
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/udf/udf-having.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/udf/udf-having.sql.out
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/udf/udf-outer-join.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/udf/udf-outer-join.sql.out
diff --git a/sql/core/src/test/resources/tpch-plan-stability/q18/explain.txt b/sql/core/src/test/resources/tpch-plan-stability/q18/explain.txt