Instantiate execution plan capture callback via shim loader #9113

Merged
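This PR moves the concrete ExecutionPlanCaptureCallback logic behind the shim loader: the unshimmed object becomes a thin facade that delegates every call to an ExecutionPlanCaptureCallbackBase implementation which ShimLoader instantiates reflectively (ShimmedExecutionPlanCaptureCallbackImpl). Below is a minimal sketch of that delegation pattern; CaptureCallbackBase, ReflectionSketch, and CaptureCallbackFacade are simplified stand-in names for illustration, not the real spark-rapids classes, and plain Class.forName stands in for the shim-aware classloader lookup.

// Minimal sketch of the shim-loader delegation pattern; names other than the
// implementation class string are stand-ins, not the real spark-rapids types.
trait CaptureCallbackBase {
  def captureIfNeeded(qe: AnyRef): Unit
  def startCapture(): Unit
}

object ReflectionSketch {
  // Instantiate an implementation class by name so the common (unshimmed) module
  // never links directly against version-specific code.
  def newInstanceOf[T](className: String): T =
    Class.forName(className).getDeclaredConstructor().newInstance().asInstanceOf[T]
}

object CaptureCallbackFacade extends CaptureCallbackBase {
  // Resolve the concrete shimmed implementation lazily, on first use.
  private lazy val impl: CaptureCallbackBase =
    ReflectionSketch.newInstanceOf[CaptureCallbackBase](
      "org.apache.spark.sql.rapids.ShimmedExecutionPlanCaptureCallbackImpl")

  // Every public entry point simply forwards to the loaded implementation.
  override def captureIfNeeded(qe: AnyRef): Unit = impl.captureIfNeeded(qe)
  override def startCapture(): Unit = impl.startCapture()
}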
@@ -35,7 +35,7 @@ import org.apache.spark.sql.Strategy
import org.apache.spark.sql.catalyst.plans.logical.LogicalPlan
import org.apache.spark.sql.catalyst.rules.Rule
import org.apache.spark.sql.execution.{ColumnarRule, SparkPlan}
import org.apache.spark.sql.rapids.AdaptiveSparkPlanHelperShim
import org.apache.spark.sql.rapids.{AdaptiveSparkPlanHelperShim, ExecutionPlanCaptureCallbackBase}
import org.apache.spark.sql.rapids.execution.UnshimmedTrampolineUtil
import org.apache.spark.util.MutableURLClassLoader

@@ -421,4 +421,9 @@ object ShimLoader extends Logging {
ShimReflectionUtils.newInstanceOf[AdaptiveSparkPlanHelperShim](
"com.nvidia.spark.rapids.AdaptiveSparkPlanHelperImpl"
)

def newExecutionPlanCaptureCallbackBase(): ExecutionPlanCaptureCallbackBase =
ShimReflectionUtils.
newInstanceOf[ExecutionPlanCaptureCallbackBase](
"org.apache.spark.sql.rapids.ShimmedExecutionPlanCaptureCallbackImpl")
}
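With the new newExecutionPlanCaptureCallbackBase() factory in place, callers obtain the callback through the loader rather than referencing the shimmed class directly. A hypothetical call site (not part of this diff) would look like:

// Resolve the shimmed callback implementation via the loader and use the trait API.
val callback = ShimLoader.newExecutionPlanCaptureCallbackBase()
callback.startCapture()                       // begin recording executed plans
val plans = callback.getResultsWithTimeout()  // collect whatever plans were captured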
@@ -16,238 +16,104 @@

package org.apache.spark.sql.rapids

import scala.collection.convert.ImplicitConversions.`collection AsScalaIterable`
import scala.collection.mutable.{ArrayBuffer, Map => MutableMap}
import scala.util.matching.Regex
import com.nvidia.spark.rapids.ShimLoader

import com.nvidia.spark.rapids.{PlanShims, PlanUtils, ShimLoader}

import org.apache.spark.sql.{DataFrame, SparkSession}
import org.apache.spark.sql.catalyst.expressions.Expression
import org.apache.spark.sql.execution.{ExecSubqueryExpression, QueryExecution, ReusedSubqueryExec, SparkPlan}
import org.apache.spark.sql.execution.adaptive.{AdaptiveSparkPlanExec, QueryStageExec}
import org.apache.spark.sql.execution.exchange.ReusedExchangeExec
import org.apache.spark.sql.DataFrame
import org.apache.spark.sql.execution.{QueryExecution, SparkPlan}
import org.apache.spark.sql.util.QueryExecutionListener

object ExecutionPlanCaptureCallback {
private[this] var shouldCapture: Boolean = false
private[this] val execPlans: ArrayBuffer[SparkPlan] = ArrayBuffer.empty

private def captureIfNeeded(qe: QueryExecution): Unit = synchronized {
if (shouldCapture) {
execPlans.append(qe.executedPlan)
}
}

// Avoiding the use of default arguments since this is called from Python
def startCapture(): Unit = startCapture(10000)

def startCapture(timeoutMillis: Long): Unit = {
SparkSession.getActiveSession.foreach { spark =>
spark.sparkContext.listenerBus.waitUntilEmpty(timeoutMillis)
}
synchronized {
execPlans.clear()
shouldCapture = true
}
}

def getResultsWithTimeout(timeoutMs: Long = 10000): Array[SparkPlan] = {
try {
val spark = SparkSession.active
spark.sparkContext.listenerBus.waitUntilEmpty(timeoutMs)
synchronized {
execPlans.toArray
}
} finally {
synchronized {
shouldCapture = false
execPlans.clear()
}
}
}

def extractExecutedPlan(plan: SparkPlan): SparkPlan = {
plan match {
case p: AdaptiveSparkPlanExec => p.executedPlan
case p => PlanShims.extractExecutedPlan(p)
}
}

trait ExecutionPlanCaptureCallbackBase {
def captureIfNeeded(qe: QueryExecution): Unit
def startCapture(): Unit
def startCapture(timeoutMillis: Long): Unit
def getResultsWithTimeout(timeoutMs: Long = 10000): Array[SparkPlan]
def extractExecutedPlan(plan: SparkPlan): SparkPlan
def assertContains(gpuPlan: SparkPlan, className: String): Unit
def assertContains(df: DataFrame, gpuClass: String): Unit
def assertContainsAnsiCast(df: DataFrame): Unit
def assertNotContain(gpuPlan: SparkPlan, className: String): Unit
def assertNotContain(df: DataFrame, gpuClass: String): Unit
def assertDidFallBack(gpuPlan: SparkPlan, fallbackCpuClass: String): Unit
def assertDidFallBack(df: DataFrame, fallbackCpuClass: String): Unit
def assertDidFallBack(gpuPlans: Array[SparkPlan], fallbackCpuClass: String): Unit
def assertCapturedAndGpuFellBack(
// used by python code, should not be Array[String]
fallbackCpuClassList: java.util.ArrayList[String],
timeoutMs: Long): Unit = {
val gpuPlans = getResultsWithTimeout(timeoutMs = timeoutMs)
assert(gpuPlans.nonEmpty, "Did not capture a plan")
fallbackCpuClassList.foreach(fallbackCpuClass => assertDidFallBack(gpuPlans, fallbackCpuClass))
}

/**
* This method is used by the Python integration tests.
* The method checks the schemata used in the GPU and CPU executed plans and compares them to the
* expected schema to make sure we are not reading more data than needed.
*/
def assertSchemataMatch(cpuDf: DataFrame, gpuDf: DataFrame, expectedSchema: String): Unit = {
import org.apache.spark.sql.execution.FileSourceScanExec
import org.apache.spark.sql.types.StructType
import org.apache.spark.sql.catalyst.parser.CatalystSqlParser

val adaptiveSparkPlanHelper = ShimLoader.newAdaptiveSparkPlanHelperShim()
val cpuFileSourceScanSchemata =
adaptiveSparkPlanHelper.collect(cpuDf.queryExecution.executedPlan) {
case scan: FileSourceScanExec => scan.requiredSchema
}
val gpuFileSourceScanSchemata =
adaptiveSparkPlanHelper.collect(gpuDf.queryExecution.executedPlan) {
case scan: GpuFileSourceScanExec => scan.requiredSchema
}
assert(cpuFileSourceScanSchemata.size == gpuFileSourceScanSchemata.size,
s"Found ${cpuFileSourceScanSchemata.size} file sources in dataframe, " +
s"but expected ${gpuFileSourceScanSchemata.size}")

cpuFileSourceScanSchemata.zip(gpuFileSourceScanSchemata).foreach {
case (cpuScanSchema, gpuScanSchema) =>
cpuScanSchema match {
case otherType: StructType =>
assert(gpuScanSchema.sameType(otherType))
val expectedStructType = CatalystSqlParser.parseDataType(expectedSchema)
assert(gpuScanSchema.sameType(expectedStructType),
s"Type GPU schema ${gpuScanSchema.toDDL} doesn't match $expectedSchema")
assert(cpuScanSchema.sameType(expectedStructType),
s"Type CPU schema ${cpuScanSchema.toDDL} doesn't match $expectedSchema")
case otherType => assert(false, s"The expected type $cpuScanSchema" +
s" doesn't match the actual type $otherType")
}
}
}

def assertCapturedAndGpuFellBack(fallbackCpuClass: String, timeoutMs: Long = 2000): Unit = {
val gpuPlans = getResultsWithTimeout(timeoutMs = timeoutMs)
assert(gpuPlans.nonEmpty, "Did not capture a plan")
assertDidFallBack(gpuPlans, fallbackCpuClass)
}

def assertDidFallBack(gpuPlans: Array[SparkPlan], fallbackCpuClass: String): Unit = {
val executedPlans = gpuPlans.map(extractExecutedPlan)
// Verify at least one of the plans has the fallback class
val found = executedPlans.exists { executedPlan =>
executedPlan.find(didFallBack(_, fallbackCpuClass)).isDefined
}
assert(found, s"Could not find $fallbackCpuClass in the GPU plans:\n" +
executedPlans.mkString("\n"))
}

def assertDidFallBack(gpuPlan: SparkPlan, fallbackCpuClass: String): Unit = {
val executedPlan = ExecutionPlanCaptureCallback.extractExecutedPlan(gpuPlan)
assert(executedPlan.find(didFallBack(_, fallbackCpuClass)).isDefined,
s"Could not find $fallbackCpuClass in the GPU plan\n$executedPlan")
}

def assertDidFallBack(df: DataFrame, fallbackCpuClass: String): Unit = {
val executedPlan = df.queryExecution.executedPlan
assertDidFallBack(Array(executedPlan), fallbackCpuClass)
}

def assertContains(gpuPlan: SparkPlan, className: String): Unit = {
assert(containsPlan(gpuPlan, className),
s"Could not find $className in the Spark plan\n$gpuPlan")
}

def assertContains(df: DataFrame, gpuClass: String): Unit = {
val executedPlan = df.queryExecution.executedPlan
assertContains(executedPlan, gpuClass)
}

def assertNotContain(gpuPlan: SparkPlan, className: String): Unit = {
assert(!containsPlan(gpuPlan, className),
s"We found $className in the Spark plan\n$gpuPlan")
}

def assertNotContain(df: DataFrame, gpuClass: String): Unit = {
val executedPlan = df.queryExecution.executedPlan
assertNotContain(executedPlan, gpuClass)
}

def assertContainsAnsiCast(df: DataFrame): Unit = {
val executedPlan = ExecutionPlanCaptureCallback
.extractExecutedPlan(df.queryExecution.executedPlan)
assert(containsPlanMatching(executedPlan,
_.expressions.exists(PlanShims.isAnsiCastOptionallyAliased)),
"Plan does not contain an ansi cast")
}

def didFallBack(exp: Expression, fallbackCpuClass: String): Boolean = {
!exp.getClass.getCanonicalName.equals("com.nvidia.spark.rapids.GpuExpression") &&
PlanUtils.getBaseNameFromClass(exp.getClass.getName) == fallbackCpuClass ||
exp.children.exists(didFallBack(_, fallbackCpuClass))
}

def didFallBack(plan: SparkPlan, fallbackCpuClass: String): Boolean = {
val executedPlan = ExecutionPlanCaptureCallback.extractExecutedPlan(plan)
!executedPlan.getClass.getCanonicalName.equals("com.nvidia.spark.rapids.GpuExec") &&
PlanUtils.sameClass(executedPlan, fallbackCpuClass) ||
executedPlan.expressions.exists(didFallBack(_, fallbackCpuClass))
}

private def containsExpression(exp: Expression, className: String,
regexMap: MutableMap[String, Regex] // regex memoization
): Boolean = exp.find {
case e if PlanUtils.getBaseNameFromClass(e.getClass.getName) == className => true
case e: ExecSubqueryExpression => containsPlan(e.plan, className, regexMap)
case _ => false
}.nonEmpty

private def containsPlan(plan: SparkPlan, className: String,
regexMap: MutableMap[String, Regex] = MutableMap.empty // regex memoization
): Boolean = plan.find {
case p if PlanUtils.sameClass(p, className) =>
true
case p: AdaptiveSparkPlanExec =>
containsPlan(p.executedPlan, className, regexMap)
case p: QueryStageExec =>
containsPlan(p.plan, className, regexMap)
case p: ReusedSubqueryExec =>
containsPlan(p.child, className, regexMap)
case p: ReusedExchangeExec =>
containsPlan(p.child, className, regexMap)
case p if p.expressions.exists(containsExpression(_, className, regexMap)) =>
true
case p: SparkPlan =>
val sparkPlanStringForRegex = p.verboseStringWithSuffix(1000)
regexMap.getOrElseUpdate(className, className.r)
.findFirstIn(sparkPlanStringForRegex)
.nonEmpty
}.nonEmpty

private def containsPlanMatching(plan: SparkPlan, f: SparkPlan => Boolean): Boolean = plan.find {
case p if f(p) =>
true
case p: AdaptiveSparkPlanExec =>
containsPlanMatching(p.executedPlan, f)
case p: QueryStageExec =>
containsPlanMatching(p.plan, f)
case p: ReusedSubqueryExec =>
containsPlanMatching(p.child, f)
case p: ReusedExchangeExec =>
containsPlanMatching(p.child, f)
case p =>
p.children.exists(plan => containsPlanMatching(plan, f))
}.nonEmpty
timeoutMs: Long): Unit
def assertCapturedAndGpuFellBack(fallbackCpuClass: String, timeoutMs: Long = 2000): Unit
def assertSchemataMatch(cpuDf: DataFrame, gpuDf: DataFrame, expectedSchema: String): Unit
def didFallBack(plan: SparkPlan, fallbackCpuClass: String): Boolean
}

object ExecutionPlanCaptureCallback extends ExecutionPlanCaptureCallbackBase {
lazy val impl = ShimLoader.newExecutionPlanCaptureCallbackBase()

override def captureIfNeeded(qe: QueryExecution): Unit =
impl.captureIfNeeded(qe)

override def startCapture(): Unit =
impl.startCapture()

override def startCapture(timeoutMillis: Long): Unit =
impl.startCapture(timeoutMillis)

override def getResultsWithTimeout(timeoutMs: Long = 10000): Array[SparkPlan] =
impl.getResultsWithTimeout(timeoutMs)

override def extractExecutedPlan(plan: SparkPlan): SparkPlan =
impl.extractExecutedPlan(plan)

override def assertContains(gpuPlan: SparkPlan, className: String): Unit =
impl.assertContains(gpuPlan, className)

override def assertContains(df: DataFrame, gpuClass: String): Unit =
impl.assertContains(df, gpuClass)

override def assertContainsAnsiCast(df: DataFrame): Unit =
impl.assertContainsAnsiCast(df)

override def assertNotContain(gpuPlan: SparkPlan, className: String): Unit =
impl.assertNotContain(gpuPlan, className)

override def assertNotContain(df: DataFrame, gpuClass: String): Unit =
impl.assertNotContain(df, gpuClass)

override def assertDidFallBack(gpuPlan: SparkPlan, fallbackCpuClass: String): Unit =
impl.assertDidFallBack(gpuPlan, fallbackCpuClass)

override def assertDidFallBack(df: DataFrame, fallbackCpuClass: String): Unit =
impl.assertDidFallBack(df, fallbackCpuClass)

override def assertDidFallBack(gpuPlans: Array[SparkPlan], fallbackCpuClass: String): Unit =
impl.assertDidFallBack(gpuPlans, fallbackCpuClass)

override def assertCapturedAndGpuFellBack(
// used by python code, should not be Array[String]
fallbackCpuClassList: java.util.ArrayList[String],
timeoutMs: Long): Unit =
impl.assertCapturedAndGpuFellBack(fallbackCpuClassList, timeoutMs)

override def assertCapturedAndGpuFellBack(
fallbackCpuClass: String, timeoutMs: Long = 2000): Unit =
impl.assertCapturedAndGpuFellBack(fallbackCpuClass, timeoutMs)

override def assertSchemataMatch(
cpuDf: DataFrame, gpuDf: DataFrame, expectedSchema: String): Unit =
impl.assertSchemataMatch(cpuDf, gpuDf, expectedSchema)

override def didFallBack(plan: SparkPlan, fallbackCpuClass: String): Boolean =
impl.didFallBack(plan, fallbackCpuClass)
}

/**
* Used as a part of testing to capture the executed query plan.
*/
class ExecutionPlanCaptureCallback extends QueryExecutionListener {
import ExecutionPlanCaptureCallback._

override def onSuccess(funcName: String, qe: QueryExecution, durationNs: Long): Unit =
captureIfNeeded(qe)
ExecutionPlanCaptureCallback.captureIfNeeded(qe)

override def onFailure(funcName: String, qe: QueryExecution, exception: Exception): Unit =
captureIfNeeded(qe)
ExecutionPlanCaptureCallback.captureIfNeeded(qe)
}

trait AdaptiveSparkPlanHelperShim {
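For reference, here is a sketch of how a test could drive the capture callback once the listener is registered with Spark. It assumes a local session with the spark-rapids jars on the classpath and uses the listener class name shown in this diff; the query itself is arbitrary.

import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.rapids.ExecutionPlanCaptureCallback

val spark = SparkSession.builder()
  .master("local[*]")
  // register the listener class so onSuccess/onFailure feed captureIfNeeded
  .config("spark.sql.queryExecutionListeners",
    "org.apache.spark.sql.rapids.ExecutionPlanCaptureCallback")
  .getOrCreate()

ExecutionPlanCaptureCallback.startCapture()     // begin recording executed plans
spark.range(10).selectExpr("id * 2").collect()  // run any query
val plans = ExecutionPlanCaptureCallback.getResultsWithTimeout()
assert(plans.nonEmpty, "expected at least one captured plan")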