
Commit c17c6b9

Szehon Ho (szehon-ho) authored and committed
Send DML metrics from job to V2Write
1 parent 5e6e8f1 commit c17c6b9

7 files changed, +181 −12 lines changed

sql/catalyst/src/main/java/org/apache/spark/sql/connector/write/BatchWrite.java
Lines changed: 16 additions & 0 deletions

@@ -18,6 +18,7 @@
 package org.apache.spark.sql.connector.write;
 
 import org.apache.spark.annotation.Evolving;
+import org.apache.spark.sql.connector.metric.CustomTaskMetric;
 
 /**
  * An interface that defines how to write the data to data source for batch processing.
@@ -104,4 +105,19 @@ default void onDataWriterCommit(WriterCommitMessage message) {}
    * clean up the data left by data writers.
    */
   void abort(WriterCommitMessage[] messages);
+
+
+  /**
+   * Whether this batch write requests execution metrics. Returns the row-level operation command
+   * this batch write is part of, if requested; returns null if not requested.
+   */
+  default RowLevelOperation.Command requestExecMetrics() {
+    return null;
+  }
+
+  /**
+   * Provides an array of query execution metrics to the batch write prior to commit.
+   * @param metrics an array of execution metrics
+   */
+  default void execMetrics(CustomTaskMetric[] metrics) {}
 }
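For context, a connector could wire the two new hooks up roughly as follows. This is a minimal sketch: the class name, the metric handling, and the commit-property storage are illustrative assumptions, not part of this commit.

  import scala.collection.mutable

  import org.apache.spark.sql.connector.metric.CustomTaskMetric
  import org.apache.spark.sql.connector.write.{BatchWrite, DataWriterFactory, PhysicalWriteInfo,
    RowLevelOperation, WriterCommitMessage}

  // Hypothetical connector write that asks Spark for MERGE execution metrics and
  // stores them alongside the table commit.
  class MetricsAwareBatchWrite extends BatchWrite {
    private val commitProperties = mutable.Map.empty[String, String]

    // Declare that this write belongs to a MERGE, so the exec node forwards metrics.
    override def requestExecMetrics(): RowLevelOperation.Command = RowLevelOperation.Command.MERGE

    // Called on the driver prior to commit with the collected execution metrics.
    override def execMetrics(metrics: Array[CustomTaskMetric]): Unit =
      metrics.foreach(m => commitProperties += (m.name() -> m.value().toString))

    override def createBatchWriterFactory(info: PhysicalWriteInfo): DataWriterFactory =
      throw new UnsupportedOperationException("illustration only")

    override def commit(messages: Array[WriterCommitMessage]): Unit = {
      // Persist commitProperties together with the table commit (connector-specific).
    }

    override def abort(messages: Array[WriterCommitMessage]): Unit = ()
  }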

sql/catalyst/src/main/java/org/apache/spark/sql/connector/write/Write.java
Lines changed: 0 additions & 1 deletion

@@ -86,5 +86,4 @@ default CustomMetric[] supportedCustomMetrics() {
   default CustomTaskMetric[] reportDriverMetrics() {
     return new CustomTaskMetric[]{};
   }
-
 }

sql/catalyst/src/test/scala/org/apache/spark/sql/connector/catalog/InMemoryBaseTable.scala
Lines changed: 42 additions & 0 deletions

@@ -23,6 +23,7 @@ import java.util
 import java.util.OptionalLong
 
 import scala.collection.mutable
+import scala.collection.mutable.ListBuffer
 
 import com.google.common.base.Objects
 
@@ -144,6 +145,8 @@ abstract class InMemoryBaseTable(
   // The key `Seq[Any]` is the partition values, value is a set of splits, each with a set of rows.
   val dataMap: mutable.Map[Seq[Any], Seq[BufferedRows]] = mutable.Map.empty
 
+  val commits: ListBuffer[Commit] = ListBuffer[Commit]()
+
   def data: Array[BufferedRows] = dataMap.values.flatten.toArray
 
   def rows: Seq[InternalRow] = dataMap.values.flatten.flatMap(_.rows).toSeq
@@ -498,13 +501,32 @@ abstract class InMemoryBaseTable(
       options: CaseInsensitiveStringMap)
     extends BatchScanBaseClass(_data, readSchema, tableSchema) with SupportsRuntimeFiltering {
 
+    var setFilters = Array.empty[Filter]
+
+    override def reportDriverMetrics(): Array[CustomTaskMetric] =
+      Array(new CustomTaskMetric {
+        override def name(): String = "numSplits"
+        override def value(): Long = 1L
+      })
+
+    override def supportedCustomMetrics(): Array[CustomMetric] = {
+      Array(new CustomMetric {
+        override def name(): String = "numSplits"
+        override def description(): String = "number of splits in the scan"
+        override def aggregateTaskMetrics(taskMetrics: Array[Long]): String = {
+          taskMetrics.sum.toString
+        }
+      })
+    }
+
     override def filterAttributes(): Array[NamedReference] = {
       val scanFields = readSchema.fields.map(_.name).toSet
       partitioning.flatMap(_.references)
         .filter(ref => scanFields.contains(ref.fieldNames.mkString(".")))
     }
 
     override def filter(filters: Array[Filter]): Unit = {
+      this.setFilters = filters
       if (partitioning.length == 1 && partitioning.head.references().length == 1) {
         val ref = partitioning.head.references().head
         filters.foreach {
@@ -575,6 +597,9 @@ abstract class InMemoryBaseTable(
   }
 
   protected abstract class TestBatchWrite extends BatchWrite {
+
+    var commitProperties: mutable.Map[String, String] = mutable.Map.empty[String, String]
+
     override def createBatchWriterFactory(info: PhysicalWriteInfo): DataWriterFactory = {
       BufferedRowsWriterFactory
     }
@@ -583,8 +608,11 @@ abstract class InMemoryBaseTable(
   }
 
   class Append(val info: LogicalWriteInfo) extends TestBatchWrite {
+
     override def commit(messages: Array[WriterCommitMessage]): Unit = dataMap.synchronized {
       withData(messages.map(_.asInstanceOf[BufferedRows]))
+      commits += Commit(Instant.now().toEpochMilli, commitProperties.toMap)
+      commitProperties.clear()
     }
   }
 
@@ -593,13 +621,17 @@ abstract class InMemoryBaseTable(
       val newData = messages.map(_.asInstanceOf[BufferedRows])
       dataMap --= newData.flatMap(_.rows.map(getKey))
       withData(newData)
+      commits += Commit(Instant.now().toEpochMilli, commitProperties.toMap)
+      commitProperties.clear()
     }
   }
 
   class TruncateAndAppend(val info: LogicalWriteInfo) extends TestBatchWrite {
    override def commit(messages: Array[WriterCommitMessage]): Unit = dataMap.synchronized {
      dataMap.clear()
      withData(messages.map(_.asInstanceOf[BufferedRows]))
+      commits += Commit(Instant.now().toEpochMilli, commitProperties.toMap)
+      commitProperties.clear()
     }
   }
 
@@ -747,6 +779,14 @@ private class BufferedRowsReader(
 
   override def close(): Unit = {}
 
+  override def currentMetricsValues(): Array[CustomTaskMetric] =
+    Array[CustomTaskMetric](
+      new CustomTaskMetric {
+        override def name(): String = "numSplits"
+        override def value(): Long = 1
+      }
+    )
+
   private def extractFieldValue(
       field: StructField,
       schema: StructType,
@@ -841,6 +881,8 @@ class InMemoryCustomDriverTaskMetric(value: Long) extends CustomTaskMetric {
   override def value(): Long = value
 }
 
+case class Commit(id: Long, properties: Map[String, String])
+
 sealed trait Operation
 case object Write extends Operation
 case object Delete extends Operation
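For intuition, the new "numSplits" metric is reported once per task (currentMetricsValues) and once from the driver (reportDriverMetrics), and the matching CustomMetric above folds the per-task values into the displayed string by summing them. A small, hypothetical illustration of that aggregation contract (not part of this commit):

  import org.apache.spark.sql.connector.metric.CustomMetric

  // Hypothetical stand-in mirroring the "numSplits" metric defined above: Spark hands the
  // per-task values to aggregateTaskMetrics and displays the returned string in the SQL UI.
  val numSplits: CustomMetric = new CustomMetric {
    override def name(): String = "numSplits"
    override def description(): String = "number of splits in the scan"
    override def aggregateTaskMetrics(taskMetrics: Array[Long]): String = taskMetrics.sum.toString
  }

  // Three tasks each reporting one split aggregate to "3".
  assert(numSplits.aggregateTaskMetrics(Array(1L, 1L, 1L)) == "3")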

sql/catalyst/src/test/scala/org/apache/spark/sql/connector/catalog/InMemoryRowLevelOperationTable.scala
Lines changed: 62 additions & 7 deletions

@@ -17,13 +17,17 @@
 
 package org.apache.spark.sql.connector.catalog
 
+import java.time.Instant
 import java.util
 
+import scala.collection.mutable.ListBuffer
+
 import org.apache.spark.sql.catalyst.InternalRow
 import org.apache.spark.sql.catalyst.expressions.GenericInternalRow
 import org.apache.spark.sql.connector.catalog.constraints.Constraint
 import org.apache.spark.sql.connector.distributions.{Distribution, Distributions}
 import org.apache.spark.sql.connector.expressions.{FieldReference, LogicalExpressions, NamedReference, SortDirection, SortOrder, Transform}
+import org.apache.spark.sql.connector.metric.CustomTaskMetric
 import org.apache.spark.sql.connector.read.{Scan, ScanBuilder}
 import org.apache.spark.sql.connector.write.{BatchWrite, DeltaBatchWrite, DeltaWrite, DeltaWriteBuilder, DeltaWriter, DeltaWriterFactory, LogicalWriteInfo, PhysicalWriteInfo, RequiresDistributionAndOrdering, RowLevelOperation, RowLevelOperationBuilder, RowLevelOperationInfo, SupportsDelta, Write, WriteBuilder, WriterCommitMessage}
 import org.apache.spark.sql.connector.write.RowLevelOperation.Command
@@ -46,6 +50,8 @@ class InMemoryRowLevelOperationTable(
     constraints)
   with SupportsRowLevelOperations {
 
+  private val _scans = ListBuffer.empty[Scan]
+
   private final val PARTITION_COLUMN_REF = FieldReference(PartitionKeyColumn.name)
   private final val INDEX_COLUMN_REF = FieldReference(IndexColumn.name)
   private final val SUPPORTS_DELTAS = "supports-deltas"
@@ -68,6 +74,16 @@ class InMemoryRowLevelOperationTable(
     }
   }
 
+  class InMemoryRowLevelOperationScanBuilder(tableSchema: StructType,
+      options: CaseInsensitiveStringMap)
+    extends InMemoryScanBuilder(tableSchema, options) {
+    override def build: Scan = {
+      val scan = super.build
+      _scans += scan
+      scan
+    }
+  }
+
   case class PartitionBasedOperation(command: Command) extends RowLevelOperation {
     var configuredScan: InMemoryBatchScan = _
 
@@ -101,7 +117,7 @@ class InMemoryRowLevelOperationTable(
           SortDirection.ASCENDING.defaultNullOrdering()))
       }
 
-      override def toBatch: BatchWrite = PartitionBasedReplaceData(configuredScan)
+      override def toBatch: BatchWrite = PartitionBasedReplaceData(configuredScan, command)
 
       override def description: String = "InMemoryWrite"
     }
@@ -111,9 +127,46 @@ class InMemoryRowLevelOperationTable(
     override def description(): String = "InMemoryPartitionReplaceOperation"
   }
 
-  private case class PartitionBasedReplaceData(scan: InMemoryBatchScan) extends TestBatchWrite {
+  abstract class RowLevelOperationBatchWrite(command: Command) extends TestBatchWrite {
+    override def requestExecMetrics(): Command = command
+
+    override def execMetrics(metrics: Array[CustomTaskMetric]): Unit = {
+      metrics.foreach(m => commitProperties += (m.name() -> m.value().toString))
+    }
+
+    override def commit(messages: Array[WriterCommitMessage]): Unit = {
+      assert(_scans.size <= 2, "Expected at most two scans in row-level operations")
+      assert(_scans.count { case s: InMemoryBatchScan => s.setFilters.nonEmpty } <= 1,
+        "Expected at most one scan with runtime filters in row-level operations")
+      assert(_scans.count { case s: InMemoryBatchScan => s.setFilters.isEmpty } <= 1,
+        "Expected at most one scan without runtime filters in row-level operations")
+
+      _scans.foreach {
+        case s: InMemoryBatchScan =>
+          val prefix = if (s.setFilters.isEmpty) {
+            ""
+          } else {
+            "secondScan."
+          }
+          s.reportDriverMetrics().foreach { metric =>
+            commitProperties += (prefix + metric.name() -> metric.value().toString)
+          }
+        case _ =>
+      }
+      _scans.clear()
+      doCommit(messages)
+      commits += Commit(Instant.now().toEpochMilli, commitProperties.toMap)
+      commitProperties.clear()
+    }
+
+    def doCommit(messages: Array[WriterCommitMessage]): Unit
+  }
+
+  private case class PartitionBasedReplaceData(scan: InMemoryBatchScan,
+      command: RowLevelOperation.Command)
+    extends RowLevelOperationBatchWrite(command) {
 
-    override def commit(messages: Array[WriterCommitMessage]): Unit = dataMap.synchronized {
+    override def doCommit(messages: Array[WriterCommitMessage]): Unit = dataMap.synchronized {
       val newData = messages.map(_.asInstanceOf[BufferedRows])
       val readRows = scan.data.flatMap(_.asInstanceOf[BufferedRows].rows)
       val readPartitions = readRows.map(r => getKey(r, schema)).distinct
@@ -134,7 +187,7 @@ class InMemoryRowLevelOperationTable(
     override def rowId(): Array[NamedReference] = Array(PK_COLUMN_REF)
 
     override def newScanBuilder(options: CaseInsensitiveStringMap): ScanBuilder = {
-      new InMemoryScanBuilder(schema, options)
+      new InMemoryRowLevelOperationScanBuilder(schema, options)
     }
 
     override def newWriteBuilder(info: LogicalWriteInfo): DeltaWriteBuilder = {
@@ -155,7 +208,7 @@ class InMemoryRowLevelOperationTable(
       )
     }
 
-      override def toBatch: DeltaBatchWrite = TestDeltaBatchWrite
+      override def toBatch: DeltaBatchWrite = TestDeltaBatchWrite(command)
     }
   }
 }
@@ -165,12 +218,14 @@ class InMemoryRowLevelOperationTable(
    }
  }
 
-  private object TestDeltaBatchWrite extends DeltaBatchWrite {
+  private case class TestDeltaBatchWrite(command: Command)
+    extends RowLevelOperationBatchWrite(command) with DeltaBatchWrite {
+
    override def createBatchWriterFactory(info: PhysicalWriteInfo): DeltaWriterFactory = {
      DeltaBufferedRowsWriterFactory
    }
 
-    override def commit(messages: Array[WriterCommitMessage]): Unit = {
+    override def doCommit(messages: Array[WriterCommitMessage]): Unit = {
      val newData = messages.map(_.asInstanceOf[BufferedRows])
      withDeletes(newData)
      withData(newData)
sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/WriteToDataSourceV2Exec.scala
Lines changed: 21 additions & 3 deletions

@@ -30,10 +30,11 @@ import org.apache.spark.sql.catalyst.util.{removeInternalMetadata, CharVarcharUt
 import org.apache.spark.sql.catalyst.util.RowDeltaUtils.{DELETE_OPERATION, INSERT_OPERATION, REINSERT_OPERATION, UPDATE_OPERATION, WRITE_OPERATION, WRITE_WITH_METADATA_OPERATION}
 import org.apache.spark.sql.connector.catalog.{CatalogV2Util, Column, Identifier, StagedTable, StagingTableCatalog, Table, TableCatalog, TableInfo, TableWritePrivilege}
 import org.apache.spark.sql.connector.expressions.Transform
-import org.apache.spark.sql.connector.metric.CustomMetric
-import org.apache.spark.sql.connector.write.{BatchWrite, DataWriter, DataWriterFactory, DeltaWrite, DeltaWriter, PhysicalWriteInfoImpl, Write, WriterCommitMessage}
+import org.apache.spark.sql.connector.metric.{CustomMetric, CustomTaskMetric}
+import org.apache.spark.sql.connector.write.{BatchWrite, DataWriter, DataWriterFactory, DeltaWrite, DeltaWriter, PhysicalWriteInfoImpl, RowLevelOperation, Write, WriterCommitMessage}
 import org.apache.spark.sql.errors.{QueryCompilationErrors, QueryExecutionErrors}
 import org.apache.spark.sql.execution.{SparkPlan, SQLExecution, UnaryExecNode}
+import org.apache.spark.sql.execution.adaptive.AdaptiveSparkPlanHelper
 import org.apache.spark.sql.execution.metric.{CustomMetrics, SQLMetric, SQLMetrics}
 import org.apache.spark.sql.types.StructType
 import org.apache.spark.util.{LongAccumulator, Utils}
@@ -398,7 +399,7 @@ trait V2ExistingTableWriteExec extends V2TableWriteExec {
 /**
  * The base physical plan for writing data into data source v2.
  */
-trait V2TableWriteExec extends V2CommandExec with UnaryExecNode {
+trait V2TableWriteExec extends V2CommandExec with UnaryExecNode with AdaptiveSparkPlanHelper {
   def query: SparkPlan
   def writingTask: WritingSparkTask[_] = DataWritingSparkTask
 
@@ -422,6 +423,22 @@ trait V2TableWriteExec extends V2CommandExec with UnaryExecNode {
         tempRdd
       }
     }
+
+    val metricsOpt = batchWrite.requestExecMetrics() match {
+      case RowLevelOperation.Command.MERGE =>
+        collectFirst(query) {
+          case m: MergeRowsExec => m.metrics
+        }
+      case _ => None
+    }
+    metricsOpt.foreach { metrics =>
+      batchWrite.execMetrics(
+        metrics.map {
+          case (k, v) => V2ExecMetric(k, v.value)
+        }.toArray
+      )
+    }
+
     // introduce a local var to avoid serializing the whole class
     val task = writingTask
     val writerFactory = batchWrite.createBatchWriterFactory(
@@ -729,3 +746,4 @@ private[v2] case class DataWritingSparkTaskResult(
  */
 private[sql] case class StreamWriterCommitProgress(numOutputRows: Long)
 
+private[v2] case class V2ExecMetric(name: String, value: Long) extends CustomTaskMetric
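In short, when the incoming BatchWrite reports that it is part of a MERGE, the exec node snapshots the SQLMetric values of the MergeRowsExec node found in the physical plan and hands them to the write as plain name/value carriers; mixing in AdaptiveSparkPlanHelper presumably lets collectFirst look through the AQE plan wrapper when adaptive execution is on. A minimal sketch of the conversion step, assuming a metrics map shaped like MergeRowsExec.metrics (illustrative helper, not part of the commit):

  import org.apache.spark.sql.connector.metric.CustomTaskMetric
  import org.apache.spark.sql.execution.metric.SQLMetric

  // Hypothetical helper: snapshot each named SQLMetric into an immutable name/value
  // carrier, the same role V2ExecMetric plays above.
  def toExecMetrics(metrics: Map[String, SQLMetric]): Array[CustomTaskMetric] =
    metrics.map { case (metricName, metric) =>
      new CustomTaskMetric {
        override def name(): String = metricName
        override def value(): Long = metric.value
      }
    }.toArray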

sql/core/src/test/scala/org/apache/spark/sql/connector/MergeIntoTableSuiteBase.scala
Lines changed: 39 additions & 0 deletions

@@ -2045,6 +2045,45 @@ abstract class MergeIntoTableSuiteBase extends RowLevelOperationSuiteBase
     }
   }
 
+  test("V2 write metrics for merge") {
+
+    Seq("true", "false").foreach { aqeEnabled: String =>
+      withTempView("source") {
+        withSQLConf(SQLConf.ADAPTIVE_EXECUTION_ENABLED.key -> aqeEnabled) {
+          createAndInitTable("pk INT NOT NULL, salary INT, dep STRING",
+            """{ "pk": 1, "salary": 100, "dep": "hr" }
+              |{ "pk": 2, "salary": 200, "dep": "software" }
+              |{ "pk": 3, "salary": 300, "dep": "hr" }
+              |{ "pk": 4, "salary": 400, "dep": "marketing" }
+              |{ "pk": 5, "salary": 500, "dep": "executive" }
+              |""".stripMargin)
+
+          val sourceDF = Seq(1, 2, 6, 10).toDF("pk")
+          sourceDF.createOrReplaceTempView("source")
+
+          sql(
+            s"""MERGE INTO $tableNameAsString t
+               |USING source s
+               |ON t.pk = s.pk
+               |WHEN MATCHED AND salary < 200 THEN
+               | DELETE
+               |WHEN NOT MATCHED AND s.pk < 10 THEN
+               | INSERT (pk, salary, dep) VALUES (s.pk, -1, "dummy")
+               |WHEN NOT MATCHED BY SOURCE AND salary > 400 THEN
+               | DELETE
+               |""".stripMargin
+          )
+
+          val table = catalog.loadTable(ident)
+          // scalastyle:off println
+          println(table)
+          // scalastyle:on println
+          sql(s"DROP TABLE $tableNameAsString")
+        }
+      }
+    }
+  }
+
   private def findMergeExec(query: String): MergeRowsExec = {
     val plan = executeAndKeepPlan {
       sql(query)
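The new test currently only prints the loaded table for inspection. Once the expected metric names settle, it could instead assert against the commits recorded by the in-memory table. A hypothetical follow-up, building on the test's local "table" value and assuming the catalog returns an InMemoryRowLevelOperationTable as in the other suites in this package:

  // Hypothetical assertions (not in this commit): check that scan driver metrics and
  // forwarded MERGE execution metrics ended up in the last commit's properties.
  val inMemTable = table.asInstanceOf[InMemoryRowLevelOperationTable]
  assert(inMemTable.commits.nonEmpty)
  val props = inMemTable.commits.last.properties
  // "numSplits" comes from the scan without runtime filters; a runtime-filtered scan
  // would add a "secondScan.numSplits" entry per RowLevelOperationBatchWrite above.
  assert(props.contains("numSplits"))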

sql/hive/src/test/scala/org/apache/spark/sql/hive/execution/HiveDDLSuite.scala
Lines changed: 1 addition & 1 deletion

@@ -36,7 +36,7 @@ import org.apache.spark.sql.catalyst.TableIdentifier
 import org.apache.spark.sql.catalyst.analysis.TableAlreadyExistsException
 import org.apache.spark.sql.catalyst.catalog._
 import org.apache.spark.sql.catalyst.parser.{CatalystSqlParser, ParseException}
-import org.apache.spark.sql.connector.catalog.{CatalogManager, CatalogV2Util, Identifier, TableChange, TableInfo}
+import org.apache.spark.sql.connector.catalog.{CatalogManager, CatalogV2Util, Identifier, TableCatalog, TableChange, TableInfo}
 import org.apache.spark.sql.connector.catalog.CatalogManager.SESSION_CATALOG_NAME
 import org.apache.spark.sql.connector.catalog.SupportsNamespaces.PROP_OWNER
 import org.apache.spark.sql.execution.command.{DDLSuite, DDLUtils}