Github user rberenguel commented on a diff in the pull request: https://github.com/apache/spark/pull/17100#discussion_r146177263 --- Diff: sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/CheckAnalysis.scala --- @@ -270,12 +271,25 @@ trait CheckAnalysis extends PredicateHelper { operator match { case o if o.children.nonEmpty && o.missingInput.nonEmpty => + val resolver = plan.conf.resolver + val attrsWithSameName = o.missingInput.filter(x => + o.inputSet.exists(y => resolver(x.name, y.name))) val missingAttributes = o.missingInput.mkString(",") - val input = o.inputSet.mkString(",") + val availableAttributes = o.inputSet.mkString(",") + val repeatedNameHint = if (attrsWithSameName.size > 0) { + val commonNames = attrsWithSameName.map(_.name).mkString(",") + s"""\n|Attribute(s) `$commonNames` seem to appear in two + |different datasets, with the same name.""" --- End diff -- I have changed it. I agree that "datasets" may not be the best word to describe this.
--- --------------------------------------------------------------------- To unsubscribe, e-mail: reviews-unsubscr...@spark.apache.org For additional commands, e-mail: reviews-h...@spark.apache.org