Repository: spark
Updated Branches:
  refs/heads/branch-1.4 6c5e9a3a0 -> 4f98014b9


[SPARK-11188] [SQL] Elide stacktraces in bin/spark-sql for AnalysisExceptions

Only print the error message to the console for AnalysisExceptions in the SQL shell.

Author: Dilip Biswal <dbis...@us.ibm.com>

Closes #9375 from dilipbiswal/spark-11188-v142.
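
For context: AnalysisException is raised while a query is analyzed, before any
execution starts (for example, when a referenced table does not exist), so its
stack trace carries no information that is useful to an interactive user. A
hedged sketch of observing such an error programmatically (the helper name
`messageFor` is illustrative and not part of this patch):

    import org.apache.spark.sql.AnalysisException
    import org.apache.spark.sql.hive.HiveContext

    // Return only the analysis error message for a failing query, mirroring
    // what bin/spark-sql now prints as "Error in query: ...".
    def messageFor(ctx: HiveContext, query: String): Option[String] =
      try { ctx.sql(query); None }
      catch { case ae: AnalysisException => Some(ae.getMessage) }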


Project: http://git-wip-us.apache.org/repos/asf/spark/repo
Commit: http://git-wip-us.apache.org/repos/asf/spark/commit/4f98014b
Tree: http://git-wip-us.apache.org/repos/asf/spark/tree/4f98014b
Diff: http://git-wip-us.apache.org/repos/asf/spark/diff/4f98014b

Branch: refs/heads/branch-1.4
Commit: 4f98014b9b2ad66e356dbbbfdc8df4fb0f497dd9
Parents: 6c5e9a3
Author: Dilip Biswal <dbis...@us.ibm.com>
Authored: Thu Nov 5 16:52:22 2015 -0800
Committer: Michael Armbrust <mich...@databricks.com>
Committed: Thu Nov 5 16:52:22 2015 -0800

----------------------------------------------------------------------
 .../thriftserver/AbstractSparkSQLDriver.scala   | 23 ++++++++++++---
 .../hive/thriftserver/SparkSQLCLIDriver.scala   | 24 +++++++++-------
 .../spark/sql/hive/thriftserver/CliSuite.scala  | 30 +++++++++++++++++++-
 3 files changed, 62 insertions(+), 15 deletions(-)
----------------------------------------------------------------------


http://git-wip-us.apache.org/repos/asf/spark/blob/4f98014b/sql/hive-thriftserver/src/main/scala/org/apache/spark/sql/hive/thriftserver/AbstractSparkSQLDriver.scala
----------------------------------------------------------------------
diff --git a/sql/hive-thriftserver/src/main/scala/org/apache/spark/sql/hive/thriftserver/AbstractSparkSQLDriver.scala b/sql/hive-thriftserver/src/main/scala/org/apache/spark/sql/hive/thriftserver/AbstractSparkSQLDriver.scala
index 48ac906..df025d0 100644
--- a/sql/hive-thriftserver/src/main/scala/org/apache/spark/sql/hive/thriftserver/AbstractSparkSQLDriver.scala
+++ b/sql/hive-thriftserver/src/main/scala/org/apache/spark/sql/hive/thriftserver/AbstractSparkSQLDriver.scala
@@ -25,6 +25,7 @@ import org.apache.hadoop.hive.ql.Driver
 import org.apache.hadoop.hive.ql.processors.CommandProcessorResponse
 
 import org.apache.spark.Logging
+import org.apache.spark.sql.AnalysisException
 import org.apache.spark.sql.hive.{HiveContext, HiveMetastoreTypes}
 
 private[hive] abstract class AbstractSparkSQLDriver(
@@ -58,13 +59,23 @@ private[hive] abstract class AbstractSparkSQLDriver(
       hiveResponse = execution.stringResult()
       tableSchema = getResultSetSchema(execution)
       new CommandProcessorResponse(0)
-    } catch {
-      case cause: Throwable =>
-        logError(s"Failed in [$command]", cause)
-        new CommandProcessorResponse(1, ExceptionUtils.getStackTrace(cause), null)
     }
   }
 
+  def runWrapper(command: String): CommandProcessorResponseWrapper = try {
+    val result = run(command)
+    new CommandProcessorResponseWrapper(result, null)
+  } catch {
+    case ae: AnalysisException =>
+      logDebug(s"Failed in [$command]", ae)
+      new CommandProcessorResponseWrapper(new CommandProcessorResponse(1,
+        ExceptionUtils.getStackTrace(ae), null), ae)
+    case cause: Throwable =>
+      logError(s"Failed in [$command]", cause)
+      new CommandProcessorResponseWrapper(new CommandProcessorResponse(1,
+        ExceptionUtils.getStackTrace(cause), null), cause)
+  }
+
   override def close(): Int = {
     hiveResponse = null
     tableSchema = null
@@ -79,3 +90,7 @@ private[hive] abstract class AbstractSparkSQLDriver(
     tableSchema = null
   }
 }
+
+private[hive] case class CommandProcessorResponseWrapper(
+    rc : CommandProcessorResponse,
+    cause : Throwable)
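
The wrapper introduced above leaves run()'s external behavior unchanged while
also exposing the original exception to callers. In isolation the pattern looks
like this (a minimal, dependency-free sketch; Response and ResponseWrapper are
stand-ins for Hive's CommandProcessorResponse and the new wrapper class):

    // Simplified stand-ins for the Hive types used in the patch.
    case class Response(code: Int, errorMessage: String = null)
    case class ResponseWrapper(rc: Response, cause: Throwable)

    // The body may throw; runWrapper never does. On failure it pairs the
    // error response with the exception so callers can inspect its type.
    def runWrapper(body: => Response): ResponseWrapper =
      try {
        ResponseWrapper(body, null)
      } catch {
        case t: Throwable => ResponseWrapper(Response(1, t.getMessage), t)
      }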

http://git-wip-us.apache.org/repos/asf/spark/blob/4f98014b/sql/hive-thriftserver/src/main/scala/org/apache/spark/sql/hive/thriftserver/SparkSQLCLIDriver.scala
----------------------------------------------------------------------
diff --git a/sql/hive-thriftserver/src/main/scala/org/apache/spark/sql/hive/thriftserver/SparkSQLCLIDriver.scala b/sql/hive-thriftserver/src/main/scala/org/apache/spark/sql/hive/thriftserver/SparkSQLCLIDriver.scala
index c56d807..3928f7b 100644
--- a/sql/hive-thriftserver/src/main/scala/org/apache/spark/sql/hive/thriftserver/SparkSQLCLIDriver.scala
+++ b/sql/hive-thriftserver/src/main/scala/org/apache/spark/sql/hive/thriftserver/SparkSQLCLIDriver.scala
@@ -17,13 +17,12 @@
 
 package org.apache.spark.sql.hive.thriftserver
 
-import scala.collection.JavaConversions._
-
 import java.io._
 import java.util.{ArrayList => JArrayList}
 
-import jline.{ConsoleReader, History}
+import scala.collection.JavaConversions._
 
+import jline.{ConsoleReader, History}
 import org.apache.commons.lang3.StringUtils
 import org.apache.commons.logging.LogFactory
 import org.apache.hadoop.conf.Configuration
@@ -32,13 +31,14 @@ import org.apache.hadoop.hive.common.{HiveInterruptCallback, HiveInterruptUtils}
 import org.apache.hadoop.hive.conf.HiveConf
 import org.apache.hadoop.hive.ql.Driver
 import org.apache.hadoop.hive.ql.exec.Utilities
-import org.apache.hadoop.hive.ql.processors.{AddResourceProcessor, SetProcessor, CommandProcessor}
+import org.apache.hadoop.hive.ql.processors.{AddResourceProcessor, CommandProcessor, SetProcessor}
 import org.apache.hadoop.hive.ql.session.SessionState
 import org.apache.thrift.transport.TSocket
 
 import org.apache.spark.Logging
+import org.apache.spark.sql.AnalysisException
 import org.apache.spark.sql.hive.{HiveContext, HiveShim}
-import org.apache.spark.util.{ShutdownHookManager, Utils}
+import org.apache.spark.util.ShutdownHookManager
 
 private[hive] object SparkSQLCLIDriver {
   private var prompt = "spark-sql"
@@ -276,19 +276,23 @@ private[hive] class SparkSQLCLIDriver extends CliDriver with Logging {
 
           driver.init()
           val out = sessionState.out
+          val err = sessionState.err
           val start: Long = System.currentTimeMillis()
           if (sessionState.getIsVerbose) {
             out.println(cmd)
           }
-          val rc = driver.run(cmd)
+          val rcWrapper = driver.runWrapper(cmd)
           val end = System.currentTimeMillis()
           val timeTaken: Double = (end - start) / 1000.0
 
-          ret = rc.getResponseCode
+          ret = rcWrapper.rc.getResponseCode
           if (ret != 0) {
-            console.printError(rc.getErrorMessage())
-            driver.close()
-            return ret
+            // For analysis exceptions, only the error message is printed to the console.
+            rcWrapper.cause match {
+              case e: AnalysisException =>
+                err.println(s"""Error in query: ${e.getMessage}""")
+              case _ => err.println(rcWrapper.rc.getErrorMessage())
+            }
           }
 
           val res = new JArrayList[String]()
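
On the consumer side, the CLI now branches on the wrapped cause instead of
unconditionally printing the response's error text. A hedged sketch of that
branch, reusing the simplified stand-in types from the previous sketch:

    import org.apache.spark.sql.AnalysisException

    case class Response(code: Int, errorMessage: String)
    case class ResponseWrapper(rc: Response, cause: Throwable)

    // Analysis errors get a single-line message; any other failure falls
    // back to the response's error text (a full stack trace in practice).
    def printFailure(err: java.io.PrintStream, w: ResponseWrapper): Unit =
      if (w.rc.code != 0) {
        w.cause match {
          case e: AnalysisException => err.println(s"Error in query: ${e.getMessage}")
          case _ => err.println(w.rc.errorMessage)
        }
      }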

http://git-wip-us.apache.org/repos/asf/spark/blob/4f98014b/sql/hive-thriftserver/src/test/scala/org/apache/spark/sql/hive/thriftserver/CliSuite.scala
----------------------------------------------------------------------
diff --git a/sql/hive-thriftserver/src/test/scala/org/apache/spark/sql/hive/thriftserver/CliSuite.scala b/sql/hive-thriftserver/src/test/scala/org/apache/spark/sql/hive/thriftserver/CliSuite.scala
index 13b0c59..1e28de4 100644
--- a/sql/hive-thriftserver/src/test/scala/org/apache/spark/sql/hive/thriftserver/CliSuite.scala
+++ b/sql/hive-thriftserver/src/test/scala/org/apache/spark/sql/hive/thriftserver/CliSuite.scala
@@ -48,9 +48,21 @@ class CliSuite extends SparkFunSuite with BeforeAndAfter with Logging {
       metastorePath.delete()
   }
 
+  /**
+   * Run a CLI operation and expect all the queries and expected answers to be returned.
+   * @param timeout maximum time for the commands to complete
+   * @param extraArgs any extra arguments
+   * @param errorResponses a sequence of strings whose presence in the stdout of the forked process
+   *                       is taken as an immediate error condition. That is: if a line containing
+   *                       one of these strings is found, fail the test immediately.
+   *                       The default value is `Seq("Error:")`.
+   *
+   * @param queriesAndExpectedAnswers one or more tuples of query + answer
+   */
   def runCliWithin(
       timeout: FiniteDuration,
-      extraArgs: Seq[String] = Seq.empty)(
+      extraArgs: Seq[String] = Seq.empty,
+      errorResponses: Seq[String] = Seq("Error:"))(
       queriesAndExpectedAnswers: (String, String)*): Unit = {
 
     val (queries, expectedAnswers) = queriesAndExpectedAnswers.unzip
@@ -82,6 +94,14 @@ class CliSuite extends SparkFunSuite with BeforeAndAfter with Logging {
           foundAllExpectedAnswers.trySuccess(())
         }
       }
+      else {
+        errorResponses.foreach { r =>
+          if (line.contains(r)) {
+            foundAllExpectedAnswers.tryFailure(
+              new RuntimeException(s"Failed with error line '$line'"))
+          }
+        }
+      }
     }
 
     // Searching expected output line from both stdout and stderr of the CLI process
@@ -184,4 +204,12 @@ class CliSuite extends SparkFunSuite with BeforeAndAfter with Logging {
         -> "OK"
     )
   }
+
+  test("SPARK-11188 Analysis error reporting") {
+    runCliWithin(timeout = 2.minute,
+      errorResponses = Seq("AnalysisException"))(
+        "select * from nonexistent_table;"
+          -> "Error in query: no such table nonexistent_table;"
+      )
+  }
 }
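
The new errorResponses hook lets the suite fail fast when a known error marker
appears in the CLI output, instead of waiting for the whole timeout to expire.
A sketch of that core check, assuming the test's Promise-based plumbing (the
name `scanLine` is illustrative):

    import scala.concurrent.Promise

    // Fail the pending result as soon as an output line contains one of
    // the configured error markers.
    def scanLine(line: String, errorResponses: Seq[String], result: Promise[Unit]): Unit =
      errorResponses.foreach { marker =>
        if (line.contains(marker)) {
          result.tryFailure(new RuntimeException(s"Failed with error line '$line'"))
        }
      }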

