Github user misutoth commented on a diff in the pull request:

    https://github.com/apache/spark/pull/20853#discussion_r175664716
  
    --- Diff: core/src/main/scala/org/apache/spark/deploy/DependencyUtils.scala 
---
    @@ -137,16 +138,32 @@ private[deploy] object DependencyUtils {
       def resolveGlobPaths(paths: String, hadoopConf: Configuration): String = 
{
         require(paths != null, "paths cannot be null.")
         Utils.stringToSeq(paths).flatMap { path =>
    -      val uri = Utils.resolveURI(path)
    -      uri.getScheme match {
    -        case "local" | "http" | "https" | "ftp" => Array(path)
    -        case _ =>
    -          val fs = FileSystem.get(uri, hadoopConf)
    -          Option(fs.globStatus(new Path(uri))).map { status =>
    -            status.filter(_.isFile).map(_.getPath.toUri.toString)
    -          }.getOrElse(Array(path))
    +      val (base, fragment) = splitOnFragment(path)
    +      (resolveGlobPath(base, hadoopConf), fragment) match {
    +        case (resolved, Some(_)) if resolved.length > 1 => throw new 
SparkException(
    +            s"${base.toString} resolves ambiguously to multiple files: 
${resolved.mkString(",")}")
    --- End diff --
    
    There was no space used here before, and there should not be any space 
in the resulting list; the tests also rely on this.


---

---------------------------------------------------------------------
To unsubscribe, e-mail: reviews-unsubscr...@spark.apache.org
For additional commands, e-mail: reviews-h...@spark.apache.org

Reply via email to