apache
diff --git a/‎sql/api/src/test/scala/org/apache/spark/sql/CheckAnswerHelper.scala‎
Lines changed: 196 additions & 0 deletions b/‎sql/api/src/test/scala/org/apache/spark/sql/CheckAnswerHelper.scala‎
Lines changed: 196 additions & 0 deletions
diff --git a/‎sql/api/src/test/scala/org/apache/spark/sql/QueryCleanupHelper.scala‎
Lines changed: 68 additions & 0 deletions b/‎sql/api/src/test/scala/org/apache/spark/sql/QueryCleanupHelper.scala‎
Lines changed: 68 additions & 0 deletions
diff --git a/‎sql/api/src/test/scala/org/apache/spark/sql/SessionQueryTestBase.scala‎
Lines changed: 28 additions & 0 deletions b/‎sql/api/src/test/scala/org/apache/spark/sql/SessionQueryTestBase.scala‎
Lines changed: 28 additions & 0 deletions
diff --git a/‎…che/spark/sql/SparkSessionProvider.scala‎ ‎…che/spark/sql/SparkSessionProvider.scala‎sql/core/src/test/scala/org/apache/spark/sql/SparkSessionProvider.scala renamed to sql/api/src/test/scala/org/apache/spark/sql/SparkSessionProvider.scala b/‎…che/spark/sql/SparkSessionProvider.scala‎ ‎…che/spark/sql/SparkSessionProvider.scala‎sql/core/src/test/scala/org/apache/spark/sql/SparkSessionProvider.scala renamed to sql/api/src/test/scala/org/apache/spark/sql/SparkSessionProvider.scala
diff --git a/‎sql/connect/server/src/test/scala/org/apache/spark/sql/connect/DataSourceV2DataFrameConnectSuite.scala‎
Lines changed: 1 addition & 2 deletions b/‎sql/connect/server/src/test/scala/org/apache/spark/sql/connect/DataSourceV2DataFrameConnectSuite.scala‎
Lines changed: 1 addition & 2 deletions
diff --git a/‎sql/connect/server/src/test/scala/org/apache/spark/sql/connect/ExampleConnectSuite.scala‎
Lines changed: 1 addition & 1 deletion b/‎sql/connect/server/src/test/scala/org/apache/spark/sql/connect/ExampleConnectSuite.scala‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎…apache/spark/sql/connect/QueryTest.scala‎ ‎…spark/sql/connect/SessionQueryTest.scala‎sql/connect/server/src/test/scala/org/apache/spark/sql/connect/QueryTest.scala renamed to sql/connect/server/src/test/scala/org/apache/spark/sql/connect/SessionQueryTest.scala
Lines changed: 4 additions & 19 deletions b/‎…apache/spark/sql/connect/QueryTest.scala‎ ‎…spark/sql/connect/SessionQueryTest.scala‎sql/connect/server/src/test/scala/org/apache/spark/sql/connect/QueryTest.scala renamed to sql/connect/server/src/test/scala/org/apache/spark/sql/connect/SessionQueryTest.scala
Lines changed: 4 additions & 19 deletions
diff --git a/‎sql/connect/server/src/test/scala/org/apache/spark/sql/connect/SparkSessionBinder.scala‎
Lines changed: 2 additions & 9 deletions b/‎sql/connect/server/src/test/scala/org/apache/spark/sql/connect/SparkSessionBinder.scala‎
Lines changed: 2 additions & 9 deletions
@@ -0,0 +1,196 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License.  You may obtain a copy of the License at
+ *
+ *    http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql
+
+import java.util.TimeZone
+
+import scala.jdk.CollectionConverters._
+import scala.language.implicitConversions
+
+import org.scalatest.Assertions
+
+import org.apache.spark.util.{SparkErrorUtils, SparkStringUtils}
+import org.apache.spark.util.ArrayImplicits._
+
+trait CheckAnswerHelper extends Assertions {
+
+  /**
+   * Executes `df` and fails the current test when its rows differ from `expectedAnswer`.
+   *
+   * The failure message is the one produced by `getErrorMessageInCheckAnswer`; when that
+   * helper returns no message the check passes silently.
+   *
+   * @param df the DataFrame to be executed
+   * @param expectedAnswer the expected result in a Seq of Rows.
+   */
+  protected def checkAnswer(df: => DataFrame, expectedAnswer: Seq[Row]): Unit =
+    getErrorMessageInCheckAnswer(df, expectedAnswer).foreach(message => fail(message))
+
+  /** Overload of `checkAnswer` for a result that is expected to consist of a single row. */
+  protected def checkAnswer(df: => DataFrame, expectedAnswer: Row): Unit =
+    checkAnswer(df, expectedAnswer :: Nil)
+
+  /** Overload of `checkAnswer` that collects `expectedAnswer` and uses its rows as expectation. */
+  protected def checkAnswer(df: => DataFrame, expectedAnswer: DataFrame): Unit = {
+    val expectedRows = expectedAnswer.collect().toImmutableArraySeq
+    checkAnswer(df, expectedRows)
+  }
+
+  /** Overload of `checkAnswer` that takes the expected rows as an array. */
+  protected def checkAnswer(df: => DataFrame, expectedAnswer: Array[Row]): Unit = {
+    val expectedRows = expectedAnswer.toImmutableArraySeq
+    checkAnswer(df, expectedRows)
+  }
+
+  /**
+   * Overload of `checkAnswer` that takes the expected rows as a Java list.
+   * Note that `df` is a by-value parameter here, unlike in the other overloads.
+   */
+  protected def checkAnswer(df: DataFrame, expectedAnswer: java.util.List[Row]): Unit = {
+    val expectedRows = expectedAnswer.asScala.toSeq
+    checkAnswer(df, expectedRows)
+  }
+
+  /**
+   * Tells whether the rows of `df` must be compared in the order in which they were returned.
+   *
+   * The result is forwarded as the `isSorted` flag of `sameRows`: when it is `false`, both the
+   * expected and the actual rows are sorted by their string form before being compared.
+   *
+   * @param df the DataFrame whose result is being checked
+   */
+  protected def isDfSorted(df: DataFrame): Boolean
+
+  /**
+   * Collects `df` and compares its rows with `expectedAnswer`.
+   *
+   * Returns `None` when the rows match. Returns `Some(message)` when `collect()` throws an
+   * `Exception` (the message carries the query execution and the stack trace), or when the
+   * collected rows differ from the expected ones (the message carries the time zone, the query
+   * execution and the report produced by `sameRows`).
+   *
+   * @param df the DataFrame to be executed
+   * @param expectedAnswer the expected result in a Seq of Rows.
+   */
+  private def getErrorMessageInCheckAnswer(
+      df: DataFrame,
+      expectedAnswer: Seq[Row]): Option[String] = {
+    // Message used when the collected rows differ from the expected ones.
+    def mismatchMessage(results: String): String =
+      s"""
+         |Results do not match for query:
+         |Timezone: ${TimeZone.getDefault}
+         |Timezone Env: ${sys.env.getOrElse("TZ", "")}
+         |
+         |${df.queryExecution}
+         |== Results ==
+         |$results
+       """.stripMargin
+
+    // Only the collect() call is guarded; a failure there becomes a Left carrying the message.
+    val collected: Either[String, Seq[Row]] = try Right(df.collect().toSeq) catch {
+      case e: Exception =>
+        val errorMessage =
+          s"""
+             |Exception thrown while executing query:
+             |${df.queryExecution}
+             |== Exception ==
+             |$e
+             |${SparkErrorUtils.stackTraceToString(e)}
+          """.stripMargin
+        Left(errorMessage)
+    }
+
+    collected match {
+      case Left(failure) => Some(failure)
+      case Right(sparkAnswer) =>
+        sameRows(expectedAnswer, sparkAnswer, isDfSorted(df)).map(mismatchMessage)
+    }
+  }
+
+  /**
+   * Normalizes `answer` so that the rows can be compared with Scala collection equality.
+   *
+   * Every row goes through `prepareRow`: BigDecimal values become Scala `BigDecimal`, whose
+   * equality is better defined (similar to `java.math.BigDecimal.compareTo`), and arrays become
+   * `Seq` so that the comparison does not rely on `java.util.Arrays.equals`.
+   * When `isSorted` is `false` the rows are additionally ordered by their string form.
+   */
+  private def prepareAnswer(answer: Seq[Row], isSorted: Boolean): Seq[Row] = {
+    val normalized = answer.map(prepareRow)
+    if (isSorted) normalized else normalized.sortBy(_.toString())
+  }
+
+  /**
+   * Rebuilds `row` with every cell converted to a form that supports equality comparison.
+   * Nested rows are converted recursively so that schemas with struct types are handled.
+   */
+  private def prepareRow(row: Row): Row = {
+    // Equality of WrappedArray differs for AnyVal and AnyRef in Scala 2.12.2+, so boxed
+    // numerics found inside a sequence are mapped through their primitive value.
+    def unboxElement(element: Any): Any = element match {
+      case b: java.lang.Byte => b.byteValue
+      case s: java.lang.Short => s.shortValue
+      case i: java.lang.Integer => i.intValue
+      case l: java.lang.Long => l.longValue
+      case f: java.lang.Float => f.floatValue
+      case d: java.lang.Double => d.doubleValue
+      case other => other
+    }
+
+    def normalizeCell(cell: Any): Any = cell match {
+      case null => null
+      case decimal: java.math.BigDecimal => BigDecimal(decimal)
+      case elements: Seq[_] => elements.map(unboxElement)
+      // Convert array to Seq for easy equality check.
+      case array: Array[_] => array.toSeq
+      case nested: Row => prepareRow(nested)
+      // SPARK-51349: "null" and null had the same precedence in sorting
+      case "null" => "__null_string__"
+      case other => other
+    }
+
+    Row.fromSeq(row.toSeq.map(normalizeCell))
+  }
+
+  /**
+   * Builds the side-by-side report used when the expected and the actual rows differ.
+   *
+   * Each side starts with a header carrying the number of rows, followed by the schema of the
+   * first row (`struct<>` when there is no row or the row has no schema) and the prepared rows.
+   */
+  private def genError(
+      expectedAnswer: Seq[Row],
+      sparkAnswer: Seq[Row],
+      isSorted: Boolean = false): String = {
+    // Schema string of the first row, or "struct<>" when there is no row or no schema.
+    def describeSchema(firstRow: Option[Row]): String = firstRow match {
+      case Some(row) if row.schema != null => s"${row.schema.catalogString}"
+      case _ => "struct<>"
+    }
+
+    val expectedSide =
+      s"== Correct Answer - ${expectedAnswer.size} ==" +:
+        describeSchema(expectedAnswer.headOption) +:
+        prepareAnswer(expectedAnswer, isSorted).map(_.toString())
+    val actualSide =
+      s"== Spark Answer - ${sparkAnswer.size} ==" +:
+        describeSchema(sparkAnswer.headOption) +:
+        prepareAnswer(sparkAnswer, isSorted).map(_.toString())
+    val comparison = SparkStringUtils.sideBySide(expectedSide, actualSide).mkString("\n")
+
+    s"""
+       |== Results ==
+       |$comparison
+    """.stripMargin
+  }
+
+  /**
+   * Structural equality used to compare expected and actual results.
+   *
+   * The cases are tried from top to bottom, so their order matters:
+   *  - two nulls are equal, a null never equals a non-null value;
+   *  - arrays must have the same length and pairwise-equal elements;
+   *  - maps must have the same size, and every key of `obj1` must have a matching key in `obj2`
+   *    whose value compares equal;
+   *  - other iterables must have the same size and pairwise-equal elements in iteration order;
+   *  - products are compared through their `productIterator`, rows through `toSeq`;
+   *  - doubles and floats are equal when both are NaN or when their raw bits are identical;
+   *  - everything else falls back to `==`.
+   *
+   * @param obj1 first value, may be null
+   * @param obj2 second value, may be null
+   * @return true when both values are considered equal
+   */
+  private def compare(obj1: Any, obj2: Any): Boolean = (obj1, obj2) match {
+    case (null, null) => true
+    case (null, _) => false
+    case (_, null) => false
+    case (a: Array[_], b: Array[_]) =>
+      a.length == b.length && a.zip(b).forall { case (l, r) => compare(l, r)}
+    case (a: Map[_, _], b: Map[_, _]) =>
+      // Keys are matched with compare() rather than looked up directly; only the first matching
+      // key of `b` is considered for the value comparison.
+      a.size == b.size && a.keys.forall { aKey =>
+        b.keys.find(bKey => compare(aKey, bKey)).exists(bKey => compare(a(aKey), b(bKey)))
+      }
+    case (a: Iterable[_], b: Iterable[_]) =>
+      a.size == b.size && a.zip(b).forall { case (l, r) => compare(l, r)}
+    case (a: Product, b: Product) =>
+      compare(a.productIterator.toSeq, b.productIterator.toSeq)
+    case (a: Row, b: Row) =>
+      compare(a.toSeq, b.toSeq)
+    // 0.0 == -0.0, turn float/double to bits before comparison, to distinguish 0.0 and -0.0.
+    // in some hardware NaN can be represented with different bits, so first check for it
+    case (a: Double, b: Double) =>
+      a.isNaN && b.isNaN ||
+        java.lang.Double.doubleToRawLongBits(a) == java.lang.Double.doubleToRawLongBits(b)
+    case (a: Float, b: Float) =>
+      a.isNaN && b.isNaN ||
+        java.lang.Float.floatToRawIntBits(a) == java.lang.Float.floatToRawIntBits(b)
+    case (a, b) => a == b
+  }
+
+  /**
+   * Compares the two row sets after normalizing both with `prepareAnswer`.
+   *
+   * @return `None` when they are equal according to `compare`, otherwise the report built by
+   *         `genError`
+   */
+  private def sameRows(
+      expectedAnswer: Seq[Row],
+      sparkAnswer: Seq[Row],
+      isSorted: Boolean = false): Option[String] = {
+    val expectedRows = prepareAnswer(expectedAnswer, isSorted)
+    val actualRows = prepareAnswer(sparkAnswer, isSorted)
+    if (compare(expectedRows, actualRows)) None
+    else Some(genError(expectedAnswer, sparkAnswer, isSorted))
+  }
+}
@@ -0,0 +1,68 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License.  You may obtain a copy of the License at
+ *
+ *    http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql
+
+import org.scalatest.Assertions
+
+import org.apache.spark.annotation.Experimental
+import org.apache.spark.util.SparkErrorUtils
+
+/**
+ * Cleanup helpers for tests that create catalog objects: [[withTable]], [[withView]] and
+ * [[withUserDefinedFunction]] run a test body and drop the named objects afterwards by issuing
+ * SQL through `spark`.
+ */
+@Experimental
+trait QueryCleanupHelper extends SparkSessionProvider with Assertions {
+
+  /**
+   * Runs `f`, then drops every table in `tableNames` (`DROP TABLE IF EXISTS`), whether or not
+   * `f` completed normally.
+   */
+  protected def withTable(tableNames: String*)(f: => Unit): Unit = {
+    SparkErrorUtils.tryWithSafeFinally(f) {
+      tableNames.foreach { name =>
+        spark.sql(s"DROP TABLE IF EXISTS $name")
+      }
+    }
+  }
+
+  /**
+   * Runs `f`, then drops every view in `viewNames` (`DROP VIEW IF EXISTS`), whether or not
+   * `f` completed normally.
+   */
+  protected def withView(viewNames: String*)(f: => Unit): Unit = {
+    SparkErrorUtils.tryWithSafeFinally(f) {
+      viewNames.foreach { name =>
+        spark.sql(s"DROP VIEW IF EXISTS $name")
+      }
+    }
+  }
+
+  /**
+   * Runs `f`, then drops every function in `functions` and asserts that it no longer exists.
+   *
+   * @param functions pairs of (function name, whether the function is temporary)
+   * @param f the test body
+   */
+  protected def withUserDefinedFunction(functions: (String, Boolean)*)(f: => Unit): Unit = {
+    // Same wrapper as withTable/withView: if `f` already failed, an error raised while cleaning
+    // up is attached to that failure as a suppressed exception instead of replacing it.
+    SparkErrorUtils.tryWithSafeFinally(f) {
+      functions.foreach { case (functionName, isTemporary) =>
+        val withTemporary = if (isTemporary) "TEMPORARY" else ""
+        spark.sql(s"DROP $withTemporary FUNCTION IF EXISTS $functionName")
+        assert(
+          !spark.catalog.functionExists(functionName),
+          s"Function $functionName should have been dropped. But, it still exists.")
+      }
+    }
+  }
+}
@@ -0,0 +1,28 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License.  You may obtain a copy of the License at
+ *
+ *    http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql
+
+// scalastyle:off funsuite
+import org.scalatest.funsuite.AnyFunSuite
+// scalastyle:on
+
+/**
+ * Base trait for session-backed query suites: an `AnyFunSuite` combined with
+ * [[SparkSessionProvider]], the `checkAnswer` helpers of [[CheckAnswerHelper]] and the cleanup
+ * helpers of [[QueryCleanupHelper]].
+ *
+ * [[CheckAnswerHelper]] leaves `isDfSorted` abstract, so it still has to be implemented further
+ * down the hierarchy.
+ */
+trait SessionQueryTestBase
+  extends AnyFunSuite
+    with SparkSessionProvider
+    with CheckAnswerHelper
+    with QueryCleanupHelper
@@ -34,7 +34,7 @@ import org.apache.spark.sql.connector.catalog.{CachingInMemoryTableCatalog, InMe
  * this class only provides the Connect-specific session, catalog access, and result comparison.
  */
 class DataSourceV2DataFrameConnectSuite
-    extends SparkSessionBinder
+    extends SessionQueryTest
     with DSv2TempViewWithStoredPlanTests
     with DSv2RepeatedTableAccessTests
     with DSv2IncrementallyConstructedQueryTests
@@ -53,7 +53,6 @@ class DataSourceV2DataFrameConnectSuite
     .set("spark.sql.catalog.nullbothidscat.copyOnLoad", "true")
 
   override protected def testPrefix: String = "[connect] "
-  override protected def isConnect: Boolean = true
 
   override protected def getTableCatalog[C <: TableCatalog: ClassTag](
       session: SparkSession,
 
@@ -19,4 +19,4 @@ package org.apache.spark.sql.connect
 
 import org.apache.spark.sql
 
-class ExampleConnectSuite extends sql.SparkSessionBinder
+class ExampleConnectSuite extends sql.ExampleSuite with SessionQueryTest
@@ -14,28 +14,13 @@
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */
-
 package org.apache.spark.sql.connect
 
-import org.apache.spark.{sql => sqlApi}
+import org.apache.spark.sql
 
 /**
- * Extends [[sqlApi.QueryTest]] to provide connect-specific overrides to helpers like
- * [[checkAnswer]] that avoid classic-only APIs.
- *
- * Can be used together with [[SparkSessionBinder connect.SparkSessionBinder]] to create a
- * 'connect variant' of a test.
- *
- * Note: broader use will require more overrides.
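+ * Connect variant of [[sql.SessionQueryTest]], combined with the Connect [[SparkSessionBinder]].
+ *
+ * TODO: `isDfSorted` is a placeholder that always returns `false`.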
  */
-trait QueryTest extends sqlApi.QueryTest with SparkSessionProvider {
-
-  override protected def checkAnswer(
-    df: => sqlApi.DataFrame, expectedAnswer: Seq[sqlApi.Row]): Unit = {
-    val sparkAnswer = df.collect().toSeq
-    sqlApi.QueryTest.sameRows(expectedAnswer, sparkAnswer) match {
-      case Some(errorMessage) => fail(errorMessage)
-      case None =>
-    }
-  }
+trait SessionQueryTest extends sql.SessionQueryTest with SparkSessionBinder {
+  override def isDfSorted(df: sql.DataFrame): Boolean = false // TODO
 }
@@ -19,7 +19,7 @@ package org.apache.spark.sql.connect
 
 import java.util.UUID
 
-import org.apache.spark.SparkEnv
+import org.apache.spark.{SparkEnv, SparkFunSuite}
 import org.apache.spark.sql
 import org.apache.spark.sql.classic
 import org.apache.spark.sql.connect.client.SparkConnectClient
@@ -31,15 +31,8 @@ import org.apache.spark.sql.connect.service.SparkConnectService
  * Extends [[sql.SparkSessionBinder sql.SparkSessionBinder]] (which creates a
  * [[classic.SparkSession classic.SparkSession]] and SparkContext), then layers a Connect client
  * session on top by starting the gRPC service in-process.
- *
- * Mix in this trait to exercise existing sql/core test suites through the Connect path:
- * {{{
- * class FooWithConnectSuite
- *   extends FooSuite
- *   with connect.SparkSessionBinder
- * }}}
  */
-trait SparkSessionBinder extends sql.SparkSessionBinder with QueryTest {
+trait SparkSessionBinder extends sql.SparkSessionBinder { self: SparkFunSuite =>
 
   private var _connectSpark: SparkSession = _
Original file line number	Diff line number	Diff line change
`@@ -19,4 +19,4 @@ package org.apache.spark.sql.connect`
`19`	`19`
`20`	`20`	`import org.apache.spark.sql`
`21`	`21`
`22`		`-class ExampleConnectSuite extends sql.SparkSessionBinder`
	`22`	`+class ExampleConnectSuite extends sql.ExampleSuite with SessionQueryTest`