[SPARK-5213] [SQL] Remove the duplicated SparkSQLParser

This is a follow-up to #5827 that removes the duplicated `SparkSQLParser`. Author: Cheng Hao <hao.cheng@intel.com>. Closes #5965 from chenghao-intel/remove_sparksqlparser and squashes the following commits: 509a233 [Cheng Hao] Remove the HiveQlQueryExecution; a5f9e3b [Cheng Hao] Remove the duplicated SparkSQLParser (cherry picked from commit 074d75d4c8). Signed-off-by: Michael Armbrust <michael@databricks.com>
2015-05-07 12:09:54 -07:00 · 2015-05-07 12:09:54 -07:00 · 2b0c423856
parent 86f141c90a
commit 2b0c423856
4 changed files with 11 additions and 23 deletions
--- a/sql/hive/src/main/scala/org/apache/spark/sql/hive/HiveQl.scala
+++ b/sql/hive/src/main/scala/org/apache/spark/sql/hive/HiveQl.scala
@ -28,7 +28,7 @@ import org.apache.hadoop.hive.ql.lib.Node
 import org.apache.hadoop.hive.ql.metadata.Table
 import org.apache.hadoop.hive.ql.parse._
 import org.apache.hadoop.hive.ql.plan.PlanUtils
-import org.apache.spark.sql.{AnalysisException, SparkSQLParser}
+import org.apache.spark.sql.AnalysisException
 import org.apache.spark.sql.catalyst.analysis._
 import org.apache.spark.sql.catalyst.expressions._
@ -140,10 +140,7 @@ private[hive] object HiveQl {
    "TOK_TRUNCATETABLE"     // "truncate table" is a NativeCommand and does not need to be explained.
  ) ++ nativeCommands
-  protected val hqlParser = {
+  protected val hqlParser = new ExtendedHiveQlParser
    val fallback = new ExtendedHiveQlParser
    new SparkSQLParser(fallback.parse(_))
  }
  /**
   * A set of implicit transformations that allow Hive ASTNodes to be rewritten by transformations
--- a/sql/hive/src/main/scala/org/apache/spark/sql/hive/test/TestHive.scala
+++ b/sql/hive/src/main/scala/org/apache/spark/sql/hive/test/TestHive.scala
@ -94,7 +94,8 @@ class TestHiveContext(sc: SparkContext) extends HiveContext(sc) {
  lazy val hiveDevHome = envVarToFile("HIVE_DEV_HOME")
  // Override so we can intercept relative paths and rewrite them to point at hive.
-  override def runSqlHive(sql: String): Seq[String] = super.runSqlHive(rewritePaths(sql))
+  override def runSqlHive(sql: String): Seq[String] =
    super.runSqlHive(rewritePaths(substitutor.substitute(this.hiveconf, sql)))
  override def executePlan(plan: LogicalPlan): this.QueryExecution =
    new this.QueryExecution(plan)
@ -157,22 +158,12 @@ class TestHiveContext(sc: SparkContext) extends HiveContext(sc) {
  val describedTable = "DESCRIBE (\\w+)".r
  val vs = new VariableSubstitution()
  // We must substitute variables in the HQL text before passing it to parseSql() as a parameter.
  // The Hive parser needs the substituted text. HiveContext.sql() does this but returns a
  // DataFrame, while we need a LogicalPlan, so we cannot reuse it.
  protected[hive] class HiveQLQueryExecution(hql: String)
    extends this.QueryExecution(HiveQl.parseSql(vs.substitute(hiveconf, hql))) {
    def hiveExec(): Seq[String] = runSqlHive(hql)
    override def toString: String = hql + "\n" + super.toString
  }
  /**
   * Override QueryExecution with special debug workflow.
   */
  class QueryExecution(logicalPlan: LogicalPlan)
    extends super.QueryExecution(logicalPlan) {
    def this(sql: String) = this(parseSql(sql))
    override lazy val analyzed = {
      val describedTables = logical match {
        case HiveNativeCommand(describedTable(tbl)) => tbl :: Nil
@ -196,7 +187,7 @@ class TestHiveContext(sc: SparkContext) extends HiveContext(sc) {
  protected[hive] implicit class SqlCmd(sql: String) {
    def cmd: () => Unit = {
-      () => new HiveQLQueryExecution(sql).stringResult(): Unit
+      () => new QueryExecution(sql).stringResult(): Unit
    }
  }
--- a/sql/hive/src/test/scala/org/apache/spark/sql/hive/execution/HiveComparisonTest.scala
+++ b/sql/hive/src/test/scala/org/apache/spark/sql/hive/execution/HiveComparisonTest.scala
@ -129,7 +129,7 @@ abstract class HiveComparisonTest
  }
  protected def prepareAnswer(
-    hiveQuery: TestHive.type#HiveQLQueryExecution,
+    hiveQuery: TestHive.type#QueryExecution,
    answer: Seq[String]): Seq[String] = {
    def isSorted(plan: LogicalPlan): Boolean = plan match {
@ -298,7 +298,7 @@ abstract class HiveComparisonTest
            hiveCachedResults
          } else {
-            val hiveQueries = queryList.map(new TestHive.HiveQLQueryExecution(_))
+            val hiveQueries = queryList.map(new TestHive.QueryExecution(_))
            // Make sure we can at least parse everything before attempting hive execution.
            hiveQueries.foreach(_.logical)
            val computedResults = (queryList.zipWithIndex, hiveQueries, hiveCacheFiles).zipped.map {
@ -346,7 +346,7 @@ abstract class HiveComparisonTest
        // Run w/ catalyst
        val catalystResults = queryList.zip(hiveResults).map { case (queryString, hive) =>
-          val query = new TestHive.HiveQLQueryExecution(queryString)
+          val query = new TestHive.QueryExecution(queryString)
          try { (query, prepareAnswer(query, query.stringResult())) } catch {
            case e: Throwable =>
              val errorMessage =
@ -402,7 +402,7 @@ abstract class HiveComparisonTest
            // okay by running a simple query. If this fails then we halt testing since
            // something must have gone seriously wrong.
            try {
-              new TestHive.HiveQLQueryExecution("SELECT key FROM src").stringResult()
+              new TestHive.QueryExecution("SELECT key FROM src").stringResult()
              TestHive.runSqlHive("SELECT key FROM src")
            } catch {
              case e: Exception =>
--- a/sql/hive/src/test/scala/org/apache/spark/sql/hive/execution/PruningSuite.scala
+++ b/sql/hive/src/test/scala/org/apache/spark/sql/hive/execution/PruningSuite.scala
@ -145,7 +145,7 @@ class PruningSuite extends HiveComparisonTest with BeforeAndAfter {
      expectedScannedColumns: Seq[String],
      expectedPartValues: Seq[Seq[String]]): Unit = {
    test(s"$testCaseName - pruning test") {
-      val plan = new TestHive.HiveQLQueryExecution(sql).executedPlan
+      val plan = new TestHive.QueryExecution(sql).executedPlan
      val actualOutputColumns = plan.output.map(_.name)
      val (actualScannedColumns, actualPartValues) = plan.collect {
        case p @ HiveTableScan(columns, relation, _) =>