Commit 3298ddc (parent 88407e3)

    fix some test

22 files changed, +1167 −1197 lines

mllib/src/test/scala/org/apache/spark/ml/feature/VectorSizeHintSuite.scala (+26 −23)

@@ -22,6 +22,7 @@ import org.apache.spark.ml.attribute.AttributeGroup
 import org.apache.spark.ml.linalg.{Vector, Vectors}
 import org.apache.spark.ml.util.{DefaultReadWriteTest, MLTest}
 import org.apache.spark.sql.execution.streaming.MemoryStream
+import org.apache.spark.sql.internal.SQLConf
 import org.apache.spark.sql.streaming.StreamTest

 class VectorSizeHintSuite
@@ -55,29 +56,31 @@ class VectorSizeHintSuite
   }

   test("Adding size to column of vectors.") {
-    val size = 3
-    val vectorColName = "vector"
-    val denseVector = Vectors.dense(1, 2, 3)
-    val sparseVector = Vectors.sparse(size, Array(), Array())
-
-    val data = Seq(denseVector, denseVector, sparseVector).map(Tuple1.apply)
-    val dataFrame = data.toDF(vectorColName)
-    assert(
-      AttributeGroup.fromStructField(dataFrame.schema(vectorColName)).size == -1,
-      s"This test requires that column '$vectorColName' not have size metadata.")
-
-    for (handleInvalid <- VectorSizeHint.supportedHandleInvalids) {
-      val transformer = new VectorSizeHint()
-        .setInputCol(vectorColName)
-        .setSize(size)
-        .setHandleInvalid(handleInvalid)
-      testTransformerByGlobalCheckFunc[Tuple1[Vector]](dataFrame, transformer, vectorColName) {
-        rows => {
-          assert(
-            AttributeGroup.fromStructField(rows.head.schema(vectorColName)).size == size,
-            "Transformer did not add expected size data.")
-          val numRows = rows.length
-          assert(numRows === data.length, s"Expecting ${data.length} rows, got $numRows.")
+    withSQLConf(SQLConf.ALWAYS_INLINE_COMMON_EXPR.key -> "true") {
+      val size = 3
+      val vectorColName = "vector"
+      val denseVector = Vectors.dense(1, 2, 3)
+      val sparseVector = Vectors.sparse(size, Array(), Array())
+
+      val data = Seq(denseVector, denseVector, sparseVector).map(Tuple1.apply)
+      val dataFrame = data.toDF(vectorColName)
+      assert(
+        AttributeGroup.fromStructField(dataFrame.schema(vectorColName)).size == -1,
+        s"This test requires that column '$vectorColName' not have size metadata.")
+
+      for (handleInvalid <- VectorSizeHint.supportedHandleInvalids) {
+        val transformer = new VectorSizeHint()
+          .setInputCol(vectorColName)
+          .setSize(size)
+          .setHandleInvalid(handleInvalid)
+        testTransformerByGlobalCheckFunc[Tuple1[Vector]](dataFrame, transformer, vectorColName) {
+          rows => {
+            assert(
+              AttributeGroup.fromStructField(rows.head.schema(vectorColName)).size == size,
+              "Transformer did not add expected size data.")
+            val numRows = rows.length
+            assert(numRows === data.length, s"Expecting ${data.length} rows, got $numRows.")
+          }
         }
       }
     }
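Note on the new conf usage: withSQLConf (from Spark's SQLHelper test trait) sets the given SQLConf entries only for the duration of the block and restores the previous values afterwards, so pinning ALWAYS_INLINE_COMMON_EXPR here cannot leak into other tests. A minimal sketch of that scoping pattern, simplified rather than the verbatim helper:

    import org.apache.spark.sql.internal.SQLConf

    def withSQLConf(pairs: (String, String)*)(f: => Unit): Unit = {
      val conf = SQLConf.get
      // Remember each key's previous value (None if it was unset) for restoration.
      val previous = pairs.map { case (k, _) =>
        k -> (if (conf.contains(k)) Some(conf.getConfString(k)) else None)
      }
      pairs.foreach { case (k, v) => conf.setConfString(k, v) }
      try f finally previous.foreach {
        case (k, Some(v)) => conf.setConfString(k, v)
        case (k, None) => conf.unsetConf(k)
      }
    }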

sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/Optimizer.scala (+11 −10)

@@ -1281,8 +1281,8 @@ object CollapseProject extends Rule[LogicalPlan] with AliasHelper {
       } else {
         true
       }
-    // Alias, ExtractValue and CreateNamedStruct are very cheap.
-    case _: Alias | _: ExtractValue | _: CreateNamedStruct => e.children.forall(isCheap)
+    // Alias and ExtractValue are very cheap.
+    case _: Alias | _: ExtractValue => e.children.forall(isCheap)
     case _ => false
   }
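Context for the isCheap change: CollapseProject uses isCheap to decide whether an aliased expression may be inlined at every place that references it, and the filter-pushdown code below reuses the same check. With CreateNamedStruct no longer treated as cheap, struct construction is not duplicated per reference. A hypothetical illustration in the Catalyst test DSL (testRelation is defined here just for the example):

    import org.apache.spark.sql.catalyst.dsl.expressions._
    import org.apache.spark.sql.catalyst.dsl.plans._
    import org.apache.spark.sql.catalyst.expressions.{CreateNamedStruct, GetStructField, Literal}
    import org.apache.spark.sql.catalyst.plans.logical.LocalRelation

    val testRelation = LocalRelation($"a".int, $"b".int)

    // "s" is referenced twice below. When CreateNamedStruct counted as cheap,
    // collapsing the two projects rebuilt the struct at both references; now
    // isCheap returns false and the lower project is kept.
    val query = testRelation
      .select(CreateNamedStruct(Seq(Literal("x"), $"a" + $"b")) as "s")
      .select(GetStructField($"s", 0) as "x1", (GetStructField($"s", 0) + 1) as "x2")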

@@ -1855,13 +1855,13 @@ object PushPredicateThroughNonJoin extends Rule[LogicalPlan] with PredicateHelpe
     }

     if (pushDown.nonEmpty) {
-      // Different from Project, Aggregate is not suitable for using With to push down, because
-      // propagate the attributes directly need add the groupingExpressions may cause regression.
-      // So Aggregate only need inline common expression from parent for original project
-      // inheritance.
+      // Unlike Project, Aggregate cannot use With to push down by propagating the attributes
+      // directly, since adding them to the groupingExpressions may cause regressions. So for
+      // Aggregate we only inline common expressions inherited from the parent Project and
+      // rewrite the originalAttribute of the pushed-down With.
       val newAggregateExpressions = aggregate.aggregateExpressions ++
         getWithAlias(pushDown.reduce(And)).map(replaceAliasButKeepName(_, aliasMap))
-      val replaced = removeOriginAttribute(rewriteCondition(pushDown.reduce(And), aliasMap))
+      val replaced = rewriteOriginalAttribute(rewriteCondition(pushDown.reduce(And), aliasMap))
       val newAggregate = aggregate.copy(child = Filter(replaced, aggregate.child),
         aggregateExpressions = newAggregateExpressions)
       // If there is no more filter to stay up, just eliminate the filter.
@@ -2020,9 +2020,10 @@ object PushPredicateThroughNonJoin extends Rule[LogicalPlan] with PredicateHelpe
     }
   }

-  private def removeOriginAttribute(expr: Expression): Expression = {
+  private def rewriteOriginalAttribute(expr: Expression): Expression = {
     expr.transform {
-      case ced: CommonExpressionDef => ced.copy(originalAttribute = None)
+      case ced @ CommonExpressionDef(_, _, Some(a)) =>
+        ced.copy(originalAttribute = Some(a.withExprId(NamedExpression.newExprId)))
     }
   }

@@ -2042,7 +2043,7 @@ object PushPredicateThroughNonJoin extends Rule[LogicalPlan] with PredicateHelpe
     val replaceWithMap = cond.references.toSeq
       .filter(attr => aliasMap.contains(attr))
      .map(attr => attr -> aliasMap(attr))
-      .filter(m => !CollapseProject.isCheap(m._2))
+      .filterNot(m => CollapseProject.isCheap(m._2))
     if (replaceWithMap.isEmpty) {
       cond
     } else {
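Note on the rename: removeOriginAttribute erased originalAttribute whenever a With was pushed below an Aggregate; rewriteOriginalAttribute keeps it but under a fresh ExprId, so the pushed-down definition cannot collide with the same-named attribute still produced above the Aggregate. A hypothetical before/after in plan notation (add#N stands for an attribute named "add" with ExprId N; this patch's three-field CommonExpressionDef is assumed):

    // Before: the original attribute was dropped, losing the user-facing name.
    //   CommonExpressionDef(a + a, id = 0, originalAttribute = None)
    // After: the name survives under a new ExprId (add#1 above, add#7 below),
    // so RewriteWithExpression can still emit "add" below the Aggregate without
    // clashing with the add#1 produced by the Aggregate itself.
    //   CommonExpressionDef(a + a, id = 0, originalAttribute = Some(add#7))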

sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/RewriteWithExpression.scala (+1 −1)

@@ -148,7 +148,7 @@ object RewriteWithExpression extends Rule[LogicalPlan] {
       refToExpr(id) = child
     } else if (originalAttr.nonEmpty &&
         inputPlans.head.output.contains(originalAttr.get.toAttribute)) {
-      // originAlias only exists in Project or Filter. If the child already contains this
+      // originAttr only exists in Project or Filter. If the child already contains this
       // attribute, extend it.
       refToExpr(id) = originalAttr.get.toAttribute
     } else {
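Illustration of the "extend it" branch, in plan notation (hypothetical, with add#7 as the original attribute): if a pushed-down definition carries originalAttribute = add#7 and the child plan already outputs add#7, the With reference is rewritten to that attribute directly instead of synthesizing a new _common_expr_N column:

    // Filter(With(ref0 > 10, def0 = (a + a) [originalAttribute = add#7]),
    //        Project(a, (a + a) AS add#7, child))
    // ==> Filter(add#7 > 10, Project(a, (a + a) AS add#7, child))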

sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/joins.scala (+7 −1)

@@ -210,7 +210,13 @@ object EliminateOuterJoin extends Rule[LogicalPlan] with PredicateHelper {
     case f @ Filter(condition, j @ Join(_, _, RightOuter | LeftOuter | FullOuter, _, _)) =>
       val newJoinType = buildNewJoinType(f, j)
       if (j.joinType == newJoinType) f else Filter(condition, j.copy(joinType = newJoinType))
-
+    case f @ Filter(condition,
+        p @ Project(_, j @ Join(_, _, RightOuter | LeftOuter | FullOuter, _, _))) =>
+      val aliasMap = getAliasMap(p)
+      val newFilter = f.copy(condition = replaceAlias(condition, aliasMap))
+      val newJoinType = buildNewJoinType(newFilter, j)
+      if (j.joinType == newJoinType) f
+      else Filter(condition, p.copy(child = j.copy(joinType = newJoinType)))
     case a @ Aggregate(_, _, Join(left, _, LeftOuter, _, _), _)
         if a.references.subsetOf(left.outputSet) && allDuplicateAgnostic(a) =>
       a.copy(child = left)
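The new case lets EliminateOuterJoin look through an intervening Project: replaceAlias first substitutes the filter's aliases back to the join's own attributes, so buildNewJoinType can test null-intolerance against the join sides. A hypothetical example in the Catalyst test DSL:

    import org.apache.spark.sql.catalyst.dsl.expressions._
    import org.apache.spark.sql.catalyst.dsl.plans._
    import org.apache.spark.sql.catalyst.plans.LeftOuter
    import org.apache.spark.sql.catalyst.plans.logical.LocalRelation

    val t1 = LocalRelation($"id".int, $"a".int)
    val t2 = LocalRelation($"id2".int, $"b".int)

    // After replaceAlias, $"bb" > 0 becomes $"b" > 0, which is null-intolerant on
    // t2's side, so the LeftOuter join can safely be rewritten to an Inner join.
    val query = t1
      .join(t2, LeftOuter, Some($"id" === $"id2"))
      .select($"a", $"b" as "bb")
      .where($"bb" > 0)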

sql/catalyst/src/test/scala/org/apache/spark/sql/catalyst/optimizer/FilterPushdownOnePassSuite.scala (−4)

@@ -148,10 +148,6 @@ class FilterPushdownOnePassSuite extends PlanTest {
     val optimized = Optimize.execute(originalQuery.analyze)
     val correctAnswer =
       x.where($"b" > 0)
-        .select(($"a" + 1) as "a1", $"b")
-        .select(($"a1" + 1) as "a2", $"b")
-        .select(($"a2" + 1) as "a3", $"b")
-        .select(($"a3" + 1) as "a4", $"b")
         .select($"b").analyze

     comparePlans(optimized, correctAnswer)

sql/catalyst/src/test/scala/org/apache/spark/sql/catalyst/optimizer/FilterPushdownSuite.scala (+45 −48)

@@ -27,7 +27,6 @@ import org.apache.spark.sql.catalyst.expressions._
 import org.apache.spark.sql.catalyst.plans._
 import org.apache.spark.sql.catalyst.plans.logical._
 import org.apache.spark.sql.catalyst.rules._
-import org.apache.spark.sql.internal.SQLConf
 import org.apache.spark.sql.types._
 import org.apache.spark.unsafe.types.CalendarInterval

@@ -762,8 +761,9 @@ class FilterPushdownSuite extends PlanTest {
     val optimized = Optimize.execute(originalQuery.analyze)

     val correctAnswer = testRelation
-      .where($"a" + 1 < 3)
-      .select($"a", $"b")
+      .select($"a", $"b", $"c", ($"a" + 1) as "aa")
+      .where($"aa" < 3)
+      .select($"a", $"b", $"aa")
       .groupBy($"a")(($"a" + 1) as "aa", count($"b") as "c")
       .where($"c" === 2L || $"aa" > 4)
       .analyze
@@ -1524,50 +1524,47 @@
   }

   test("SPARK-50589: avoid extra expression duplication when push filter") {
-    withSQLConf(SQLConf.USE_COMMON_EXPR_ID_FOR_ALIAS.key -> "false") {
-      // through project
-      val originalQuery1 = testRelation
-        .select($"a" + $"b" as "add", $"a" - $"b" as "sub")
-        .where($"add" < 10 && $"add" + $"add" > 10 && $"sub" > 0)
-      val correctAnswer1 = testRelation
-        .select($"a", $"b", $"c", $"a" + $"b" as "add", $"a" - $"b" as "sub")
-        .where($"add" < 10 && $"add" + $"add" > 10 && $"sub" > 0)
-        .select($"add", $"sub")
-        .analyze
-      val optimized1 = Optimize.execute(originalQuery1.analyze)
-      comparePlans(optimized1, correctAnswer1)
-
-      // through aggregate
-      val originalQuery2 = testRelation
-        .groupBy($"a")($"a", $"a" + $"a" as "add", abs($"a") as "abs", count(1) as "ct")
-        .where($"add" < 10 && $"add" + $"add" > 10 && $"abs" > 5)
-      val optimized2 = Optimize.execute(originalQuery2.analyze)
-      val correctAnswer2 = testRelation
-        .select($"a", $"b", $"c", $"a" + $"a" as "_common_expr_0")
-        .where($"_common_expr_0" < 10 &&
-          $"_common_expr_0" + $"_common_expr_0" > 10 &&
-          abs($"a") > 5)
-        .select($"a", $"b", $"c")
-        .groupBy($"a")($"a", $"a" + $"a" as "add", abs($"a") as "abs", count(1) as "ct")
-        .analyze
-      comparePlans(optimized2, correctAnswer2)
-    }
-    withSQLConf(SQLConf.USE_COMMON_EXPR_ID_FOR_ALIAS.key -> "false") {
-      // partial push down
-      val originalQuery3 = testRelation
-        .groupBy($"a")($"a", count(1) as "ct")
-        .select($"a" + $"a" as "add", $"ct")
-        .where($"add" + $"add" > 10 && $"add" > $"ct")
-      val optimized3 = Optimize.execute(originalQuery3.analyze)
-      val correctAnswer3 = testRelation
-        .select($"a", $"b", $"c", $"a" + $"a" as "_common_expr_0")
-        .where($"_common_expr_0" + $"_common_expr_0" > 10)
-        .select($"a", $"b", $"c")
-        .groupBy($"a")($"a", count(1) as "ct", $"a" + $"a" as "add")
-        .where($"add" > $"ct")
-        .select($"add", $"ct")
-        .analyze
-      comparePlans(optimized3, correctAnswer3)
-    }
+    // through project
+    val originalQuery1 = testRelation
+      .select($"a" + $"b" as "add", $"a" - $"b" as "sub")
+      .where($"add" < 10 && $"add" + $"add" > 10 && $"sub" > 0)
+    val correctAnswer1 = testRelation
+      .select($"a", $"b", $"c", $"a" + $"b" as "add", $"a" - $"b" as "sub")
+      .where($"add" < 10 && $"add" + $"add" > 10 && $"sub" > 0)
+      .select($"add", $"sub")
+      .analyze
+    val optimized1 = Optimize.execute(originalQuery1.analyze)
+    comparePlans(optimized1, correctAnswer1)
+
+    // through aggregate
+    val originalQuery2 = testRelation
+      .groupBy($"a")($"a", $"a" + $"a" as "add", abs($"a") as "abs", count(1) as "ct")
+      .where($"add" < 10 && $"add" + $"add" > 10 && $"abs" > 5)
+    val optimized2 = Optimize.execute(originalQuery2.analyze)
+    val correctAnswer2 = testRelation
+      .select($"a", $"b", $"c", $"a" + $"a" as "add", abs($"a") as "abs")
+      .where($"add" < 10 &&
+        $"add" + $"add" > 10 &&
+        $"abs" > 5)
+      .select($"a", $"b", $"c", $"add", $"abs")
+      .groupBy($"a")($"a", $"a" + $"a" as "add", abs($"a") as "abs", count(1) as "ct")
+      .analyze
+    comparePlans(optimized2, correctAnswer2)
+
+    // partial push down
+    val originalQuery3 = testRelation
+      .groupBy($"a")($"a", count(1) as "ct")
+      .select($"a" + $"a" as "add", $"ct")
+      .where($"add" + $"add" > 10 && $"add" > $"ct")
+    val optimized3 = Optimize.execute(originalQuery3.analyze)
+    val correctAnswer3 = testRelation
+      .select($"a", $"b", $"c", $"a" + $"a" as "add")
+      .where($"add" + $"add" > 10)
+      .select($"a", $"b", $"c", $"add")
+      .groupBy($"a")($"a", count(1) as "ct", $"a" + $"a" as "add")
+      .where($"add" > $"ct")
+      .select($"add", $"ct")
+      .analyze
+    comparePlans(optimized3, correctAnswer3)
   }
 }
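Reviewer context for the new expectations: with the USE_COMMON_EXPR_ID_FOR_ALIAS override removed, the test now exercises the default path, where the pushed-down common expression keeps the query's own alias names (add, abs) instead of a synthesized _common_expr_0. In the partial-pushdown case, only the conjunct that can be evaluated below the Aggregate ($"add" + $"add" > 10, rewritten against the pushed-down definition of add) moves down, while $"add" > $"ct" stays above because ct is an aggregate result. A minimal sketch of that split, with replaceableRefs as a hypothetical stand-in for the attributes available below the Aggregate:

    // Deterministic conjuncts whose references are all available below the
    // Aggregate may be pushed; anything touching aggregate results stays up.
    val (pushDown, stayUp) = splitConjunctivePredicates(condition)
      .partition(c => c.deterministic && c.references.subsetOf(replaceableRefs))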
