Skip to content

Commit cb0ff92

Browse files
committed
[SPARK-56346][SQL] Use PartitionPredicate in DSV2 Metadata Only Delete
When `OptimizeMetadataOnlyDeleteFromTable` fails to push standard V2 predicates for a metadata-only delete, it now falls back to a second pass that converts partition-column filters to `PartitionPredicate`s (SPARK-55596) and combines them with translated V2 data filters.
1 parent 4142bc2 commit cb0ff92

5 files changed

Lines changed: 621 additions & 48 deletions

File tree

Lines changed: 146 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,146 @@
1+
/*
2+
* Licensed to the Apache Software Foundation (ASF) under one or more
3+
* contributor license agreements. See the NOTICE file distributed with
4+
* this work for additional information regarding copyright ownership.
5+
* The ASF licenses this file to You under the Apache License, Version 2.0
6+
* (the "License"); you may not use this file except in compliance with
7+
* the License. You may obtain a copy of the License at
8+
*
9+
* http://www.apache.org/licenses/LICENSE-2.0
10+
*
11+
* Unless required by applicable law or agreed to in writing, software
12+
* distributed under the License is distributed on an "AS IS" BASIS,
13+
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14+
* See the License for the specific language governing permissions and
15+
* limitations under the License.
16+
*/
17+
18+
package org.apache.spark.sql.connector.catalog
19+
20+
import java.util
21+
22+
import org.apache.spark.sql.catalyst.InternalRow
23+
import org.apache.spark.sql.catalyst.analysis.TableAlreadyExistsException
24+
import org.apache.spark.sql.connector.catalog.CatalogV2Implicits.MultipartIdentifierHelper
25+
import org.apache.spark.sql.connector.expressions.Transform
26+
import org.apache.spark.sql.connector.expressions.filter.{PartitionPredicate, Predicate}
27+
import org.apache.spark.sql.types.StructType
28+
import org.apache.spark.util.ArrayImplicits._
29+
30+
/**
 * In-memory table that supports row-level operations and accepts [[PartitionPredicate]]s
 * in V2 [[canDeleteWhere]]/[[deleteWhere]] for metadata-only deletes.
 *
 * Contains some knobs to control acceptance of various partition and data predicates.
 *
 * @param name fully qualified table name
 * @param schema table schema
 * @param partitioning partition transforms
 * @param properties table properties; see the companion object for recognized knob keys
 */
class InMemoryPartitionPredicateDeleteTable(
    name: String,
    schema: StructType,
    partitioning: Array[Transform],
    properties: util.Map[String, String])
  extends InMemoryRowLevelOperationTable(name, schema, partitioning, properties) {

  // Knob: whether canDeleteWhere accepts PartitionPredicate instances (default: true).
  private val acceptPartitionPredicates: Boolean =
    properties.getOrDefault(
      InMemoryPartitionPredicateDeleteTable.AcceptPartitionPredicatesKey, "true").toBoolean

  // Knob: whether canDeleteWhere accepts standard predicates referencing non-partition
  // (data) columns (default: false).
  private val acceptDataPredicates: Boolean =
    properties.getOrDefault(
      InMemoryPartitionPredicateDeleteTable.AcceptDataPredicatesKey, "false").toBoolean

  // Dotted paths of all partition columns (e.g. "s.tz" for a nested partition field).
  private val partPaths = partCols.map(_.mkString(".")).toSet

  // True iff every column reference in the predicate resolves to a partition column.
  private def refsOnlyPartCols(p: Predicate): Boolean =
    p.references().forall(ref => partPaths.contains(ref.fieldNames().mkString(".")))

  /**
   * Accepts a predicate set when each [[PartitionPredicate]] is allowed by the
   * partition-predicate knob, and each standard predicate is both supported by
   * [[InMemoryTableWithV2Filter]] and either allowed by the data-predicate knob or
   * references only partition columns. An empty array is trivially accepted.
   */
  override def canDeleteWhere(predicates: Array[Predicate]): Boolean = {
    predicates.forall {
      case _: PartitionPredicate => acceptPartitionPredicates
      case p =>
        InMemoryTableWithV2Filter.supportsPredicates(Array(p)) &&
          (acceptDataPredicates || refsOnlyPartCols(p))
    }
  }

  /**
   * Deletes matching rows directly against the in-memory partition map.
   *
   * [[PartitionPredicate]]s and partition-column-only standard predicates are applied at
   * partition granularity; remaining standard predicates are evaluated row by row,
   * simulating a source that can evaluate data predicates during a metadata-only delete.
   */
  override def deleteWhere(predicates: Array[Predicate]): Unit = dataMap.synchronized {
    val (partPreds, standardPreds) = predicates.partition(_.isInstanceOf[PartitionPredicate])
    val (partStdPreds, dataStdPreds) = standardPreds.partition(refsOnlyPartCols)

    // Narrow candidate partitions using standard predicates on partition columns.
    val candidateKeys = if (partStdPreds.nonEmpty) {
      InMemoryTableWithV2Filter.filtersToKeys(
        dataMap.keys, partCols.map(_.toSeq.quoted).toImmutableArraySeq, partStdPreds)
    } else {
      dataMap.keys
    }

    // Narrow further by evaluating PartitionPredicates against each partition row.
    val keysToProcess = if (partPreds.nonEmpty) {
      val pArr = partPreds.map(_.asInstanceOf[PartitionPredicate])
      candidateKeys.filter { key =>
        val partRow = PartitionInternalRow(key.toArray)
        pArr.forall(_.eval(partRow))
      }
    } else {
      candidateKeys
    }

    // Handle data predicates (simulate data source with data column statistics).
    if (dataStdPreds.isEmpty) {
      // Materialize the keys before removal: when no predicate narrowed the set,
      // keysToProcess aliases dataMap.keys, and removing entries while iterating that
      // live key view of a mutable map is undefined.
      dataMap --= keysToProcess.toSeq
    } else {
      for (key <- keysToProcess.toSeq) {
        dataMap.get(key).foreach { splits =>
          // Keep only rows that do NOT match every data predicate.
          val filtered = splits.map { buffered =>
            val kept = new BufferedRows(key, buffered.schema)
            buffered.rows
              .filterNot(rowMatchesAll(_, dataStdPreds, buffered.schema))
              .foreach(kept.withRow)
            kept
          }
          // Drop the partition entirely once all of its splits are empty.
          if (filtered.forall(_.rows.isEmpty)) {
            dataMap.remove(key)
          } else {
            dataMap.update(key, filtered)
          }
        }
      }
    }
  }

  /**
   * Returns true iff the row satisfies every predicate, resolving column names to
   * values through the row's schema via [[InMemoryTableWithV2Filter.evalPredicate]].
   */
  private def rowMatchesAll(
      row: InternalRow,
      preds: Array[Predicate],
      rowSchema: StructType): Boolean = {
    val resolve: String => Any = colName => {
      val idx = rowSchema.fieldIndex(colName)
      row.get(idx, rowSchema(idx).dataType)
    }
    preds.forall(
      InMemoryTableWithV2Filter.evalPredicate(_, resolve))
  }
}
122+
123+
/** Table property keys recognized by [[InMemoryPartitionPredicateDeleteTable]]. */
object InMemoryPartitionPredicateDeleteTable {
  // Boolean property: whether canDeleteWhere accepts PartitionPredicates ("true" default).
  private[catalog] val AcceptPartitionPredicatesKey = "accept-partition-predicates"
  // Boolean property: whether canDeleteWhere accepts data-column predicates ("false" default).
  private[catalog] val AcceptDataPredicatesKey = "accept-data-predicates"
}
127+
128+
/**
 * Test catalog whose tables are [[InMemoryPartitionPredicateDeleteTable]]s, so deletes
 * routed through this catalog can receive [[PartitionPredicate]]s.
 */
class InMemoryPartitionPredicateDeleteCatalog extends InMemoryTableCatalog {
  import CatalogV2Implicits._

  /**
   * Creates and registers an [[InMemoryPartitionPredicateDeleteTable]] for the given
   * identifier, failing if a table with that identifier already exists.
   */
  override def createTable(ident: Identifier, tableInfo: TableInfo): Table = {
    if (tables.containsKey(ident)) {
      throw new TableAlreadyExistsException(ident.asMultipartIdentifier)
    }

    // Honor the test hook that forces table creation to fail.
    InMemoryTableCatalog.maybeSimulateFailedTableCreation(tableInfo.properties)

    val qualifiedName = s"$name.${ident.quoted}"
    val structType = CatalogV2Util.v2ColumnsToStructType(tableInfo.columns)
    val newTable = new InMemoryPartitionPredicateDeleteTable(
      qualifiedName, structType, tableInfo.partitions, tableInfo.properties)
    tables.put(ident, newTable)
    namespaces.putIfAbsent(ident.namespace.toList, Map())
    newTable
  }
}

sql/catalyst/src/test/scala/org/apache/spark/sql/connector/catalog/InMemoryTableWithV2Filter.scala

Lines changed: 30 additions & 25 deletions
Original file line numberDiff line numberDiff line change
@@ -140,31 +140,36 @@ object InMemoryTableWithV2Filter {
140140
partitionNames: Seq[String],
141141
filters: Array[Predicate]): Iterable[Seq[Any]] = {
142142
keys.filter { partValues =>
143-
filters.flatMap(splitAnd).forall {
144-
case p: Predicate if p.name().equals("=") =>
145-
p.children()(1).asInstanceOf[LiteralValue[_]].value ==
146-
InMemoryBaseTable.extractValue(p.children()(0).toString, partitionNames, partValues)
147-
case p: Predicate if p.name().equals("<=>") =>
148-
val attrVal = InMemoryBaseTable
149-
.extractValue(p.children()(0).toString, partitionNames, partValues)
150-
val value = p.children()(1).asInstanceOf[LiteralValue[_]].value
151-
if (attrVal == null && value == null) {
152-
true
153-
} else if (attrVal == null || value == null) {
154-
false
155-
} else {
156-
value == attrVal
157-
}
158-
case p: Predicate if p.name().equals("IS_NULL") =>
159-
val attr = p.children()(0).toString
160-
null == InMemoryBaseTable.extractValue(attr, partitionNames, partValues)
161-
case p: Predicate if p.name().equals("IS_NOT_NULL") =>
162-
val attr = p.children()(0).toString
163-
null != InMemoryBaseTable.extractValue(attr, partitionNames, partValues)
164-
case p: Predicate if p.name().equals("ALWAYS_TRUE") => true
165-
case f =>
166-
throw new IllegalArgumentException(s"Unsupported filter type: $f")
167-
}
143+
val resolve: String => Any = attr =>
144+
InMemoryBaseTable.extractValue(attr, partitionNames, partValues)
145+
filters.flatMap(splitAnd).forall(evalPredicate(_, resolve))
146+
}
147+
}
148+
149+
/**
 * Evaluates a single V2 predicate by resolving column values through the
 * given function. Supports =, <=>, IS_NULL, IS_NOT_NULL, and ALWAYS_TRUE.
 *
 * @param pred the predicate to evaluate
 * @param resolveValue resolves a column name to its value for the current row/partition
 * @throws IllegalArgumentException for any predicate name outside the supported set
 */
def evalPredicate(
    pred: Predicate,
    resolveValue: String => Any): Boolean = {
  // Deferred accessors: only touched by cases that actually have these children,
  // so ALWAYS_TRUE (no children) never evaluates them.
  def columnValue: Any = resolveValue(pred.children()(0).toString)
  def literalValue: Any = pred.children()(1).asInstanceOf[LiteralValue[_]].value
  pred.name() match {
    case "ALWAYS_TRUE" => true
    case "IS_NULL" => columnValue == null
    case "IS_NOT_NULL" => columnValue != null
    case "=" => columnValue == literalValue
    case "<=>" =>
      // Null-safe equality: two nulls match, one null never matches.
      val left = columnValue
      val right = literalValue
      if (left == null || right == null) left == null && right == null else left == right
    case other =>
      throw new IllegalArgumentException(
        s"Unsupported filter type: $other")
  }
}
170175

sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/OptimizeMetadataOnlyDeleteFromTable.scala

Lines changed: 39 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -43,13 +43,12 @@ object OptimizeMetadataOnlyDeleteFromTable extends Rule[LogicalPlan] with Predic
4343
case table: SupportsDeleteV2 if !SubqueryExpression.hasSubquery(cond) =>
4444
val predicates = splitConjunctivePredicates(cond)
4545
val normalizedPredicates = DataSourceStrategy.normalizeExprs(predicates, relation.output)
46-
val filters = toDataSourceV2Filters(normalizedPredicates)
47-
val allPredicatesTranslated = normalizedPredicates.size == filters.length
48-
if (allPredicatesTranslated && table.canDeleteWhere(filters)) {
49-
logDebug(s"Switching to delete with filters: ${filters.mkString("[", ", ", "]")}")
50-
DeleteFromTableWithFilters(relation, filters.toImmutableArraySeq)
46+
val filtersOpt = tryTranslateToV2(normalizedPredicates)
47+
if (filtersOpt.exists(table.canDeleteWhere)) {
48+
DeleteFromTableWithFilters(relation, filtersOpt.get.toImmutableArraySeq)
5149
} else {
52-
rowLevelPlan
50+
tryDeleteWithPartitionPredicates(table, relation, normalizedPredicates)
51+
.getOrElse(rowLevelPlan)
5352
}
5453

5554
case _: TruncatableTable if cond == TrueLiteral =>
@@ -70,6 +69,40 @@ object OptimizeMetadataOnlyDeleteFromTable extends Rule[LogicalPlan] with Predic
7069
}.toArray
7170
}
7271

72+
/**
 * Attempts to convert partition-column filters to [[PartitionPredicate]]s and
 * combine them with translated V2 data filters for a metadata-only delete. (See SPARK-55596)
 *
 * Returns [[Some]] with the plan if the table accepts the combined predicates,
 * or [[None]] if partition predicates cannot be created or the table rejects them.
 */
private def tryDeleteWithPartitionPredicates(
    table: SupportsDeleteV2,
    relation: DataSourceV2Relation,
    normalizedPredicates: Seq[Expression]): Option[LogicalPlan] = {
  PushDownUtils.getPartitionPredicateSchema(relation).flatMap { partitionFields =>
    // Flatten nested partition field references so they match the partition fields.
    val flattenedFilters = PushDownUtils.flattenNestedPartitionFilters(
      normalizedPredicates, partitionFields).keys.toSeq
    val (candidatePredicates, remainingFilters) =
      PushDownUtils.createPartitionPredicates(flattenedFilters, partitionFields)
    if (candidatePredicates.isEmpty) {
      // No partition predicates could be created; nothing to gain over the row-level plan.
      None
    } else {
      // Every remaining filter must translate to a V2 predicate, or we bail out.
      tryTranslateToV2(remainingFilters).flatMap { dataV2Filters =>
        val combined = candidatePredicates.toArray ++ dataV2Filters
        if (table.canDeleteWhere(combined)) {
          Some(DeleteFromTableWithFilters(relation, combined.toImmutableArraySeq))
        } else {
          None
        }
      }
    }
  }
}
99+
100+
/** Translates all expressions to V2 filters, or returns [[None]] if any fail. */
private def tryTranslateToV2(predicates: Seq[Expression]): Option[Array[Predicate]] = {
  val translated = toDataSourceV2Filters(predicates)
  // A dropped filter means at least one expression was untranslatable.
  if (translated.length == predicates.size) Some(translated) else None
}
105+
73106
private object RewrittenRowLevelCommand {
74107
type ReturnType = (RowLevelWrite, RowLevelOperation.Command, Expression, LogicalPlan)
75108

sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/PushDownUtils.scala

Lines changed: 36 additions & 17 deletions
Original file line numberDiff line numberDiff line change
@@ -149,7 +149,7 @@ object PushDownUtils extends Logging {
149149
case _ => None
150150
}
151151
if (fields.length == transforms.length) {
152-
Some(fields.toSeq)
152+
Some(fields.toSeq).filter(_.nonEmpty)
153153
} else {
154154
None
155155
}
@@ -177,6 +177,32 @@ object PushDownUtils extends Logging {
177177
}
178178
}
179179

180+
/**
 * Separates partition filters from data filters and converts pushable partition
 * filters to [[PartitionPredicateImpl]] instances.
 *
 * Callers must first flatten nested partition field references via
 * [[flattenNestedPartitionFilters]] with [[ExprId]] matching the [[PartitionPredicateField]]s.
 *
 * @param flattenedFilters Catalyst filter expressions with partition field references
 *                         already flattened.
 * @param partitionFields Partition field metadata.
 * @return a pair of (created partition predicates, remaining filters not converted).
 */
private[v2] def createPartitionPredicates(
    flattenedFilters: Seq[Expression],
    partitionFields: Seq[PartitionPredicateField])
  : (Seq[PartitionPredicateImpl], Seq[Expression]) = {
  val partitionAttrs = partitionFields.map(_.attrRef)
  val (partitionFilters, dataFilters) =
    DataSourceUtils.getPartitionFiltersAndDataFilters(partitionAttrs, flattenedFilters)
  val (pushableFilters, unpushableFilters) =
    partitionFilters.partition(isPushablePartitionFilter)
  // Attempt conversion per filter; keep the original expression for any that fail.
  val conversions = pushableFilters.map(e => (e, PartitionPredicateImpl(e, partitionFields)))
  val createdPredicates = conversions.collect { case (_, Some(predicate)) => predicate }
  val failedFilters = conversions.collect { case (e, None) => e }
  (createdPredicates, dataFilters ++ unpushableFilters ++ failedFilters)
}
205+
180206
/**
181207
* If the scan supports iterative filtering, infer additional partition filters,
182208
* convert these and unused partition filters to PartitionPredicates,
@@ -186,22 +212,15 @@ object PushDownUtils extends Logging {
186212
scanBuilder: SupportsPushDownV2Filters,
187213
partitionFields: Seq[PartitionPredicateField],
188214
remainingFilters: Seq[Expression]): Seq[Expression] = {
189-
val normalizedToOriginal = normalizeNestedPartitionFilters(remainingFilters, partitionFields)
190-
val normalized = normalizedToOriginal.keys.toSeq
191-
val partitionAttributes = partitionFields.map(_.attrRef)
192-
// may infer additional partition filters
193-
val (partFilters, nonPartitionFilters) =
194-
DataSourceUtils.getPartitionFiltersAndDataFilters(partitionAttributes, normalized)
195-
val (pushable, nonPushable) = partFilters.partition(isPushablePartitionFilter)
196-
val (partitionPredicates, errorPartitionPredicates) = pushable.partitionMap { e =>
197-
PartitionPredicateImpl(e, partitionFields).toLeft(e)
198-
}
199-
val rejectedPartitionFilters = scanBuilder.pushPredicates(partitionPredicates.toArray).map {
215+
val flattenedToOriginal = flattenNestedPartitionFilters(remainingFilters, partitionFields)
216+
val flattened = flattenedToOriginal.keys.toSeq
217+
val (partPredicates, remaining) = createPartitionPredicates(flattened, partitionFields)
218+
val rejectedPartitionFilters = scanBuilder.pushPredicates(partPredicates.toArray).map {
200219
p => p.asInstanceOf[PartitionPredicateImpl].expression
201220
}.toSeq
202-
(nonPartitionFilters ++ nonPushable ++ errorPartitionPredicates ++ rejectedPartitionFilters)
203-
.filter(normalizedToOriginal.contains)
204-
.map(normalizedToOriginal)
221+
(remaining ++ rejectedPartitionFilters)
222+
.filter(flattenedToOriginal.contains)
223+
.map(flattenedToOriginal)
205224
}
206225

207226
private def isPushablePartitionFilter(f: Expression) =
@@ -218,9 +237,9 @@ object PushDownUtils extends Logging {
218237
* (identity transform on a nested field), the analyzer produces
219238
* `GetStructField(attr("s"), "tz")`. This method replaces that chain with `attr("s.tz")`.
220239
*
221-
* Returns a map from normalized expression to original.
240+
* Returns a map from flattened expression to original.
222241
*/
223-
private def normalizeNestedPartitionFilters(
242+
private[v2] def flattenNestedPartitionFilters(
224243
filters: Seq[Expression],
225244
partitionFields: Seq[PartitionPredicateField])
226245
: Map[Expression, Expression] = {

0 commit comments

Comments
 (0)