[SPARK-48037][CORE] Fix SortShuffleWriter lacks shuffle write related metrics resulting in potentially inaccurate data #46273

Closed · wants to merge 4 commits · changes shown from 3 commits
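
In brief, as the diff below shows: SortShuffleWriter used to ignore the metrics reporter passed to SortShuffleManager.getWriter and always wrote to context.taskMetrics().shuffleWriteMetrics. For SQL queries that reporter is a SQLShuffleWriteMetricsReporter, which also updates the SQL-level shuffle write metrics consumed by the UI and by adaptive query execution, so those metrics could be missing or inaccurate. The change threads the reporter through SortShuffleWriter and ExternalSorter.writePartitionedMapOutput and updates the affected tests.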

SortShuffleManager.scala
@@ -176,7 +176,7 @@ private[spark] class SortShuffleManager(conf: SparkConf) extends ShuffleManager
metrics,
shuffleExecutorComponents)
case other: BaseShuffleHandle[K @unchecked, V @unchecked, _] =>
- new SortShuffleWriter(other, mapId, context, shuffleExecutorComponents)
+ new SortShuffleWriter(other, mapId, context, metrics, shuffleExecutorComponents)
}
}

SortShuffleWriter.scala
@@ -21,13 +21,15 @@ import org.apache.spark._
import org.apache.spark.internal.{config, Logging}
import org.apache.spark.scheduler.MapStatus
import org.apache.spark.shuffle.{BaseShuffleHandle, ShuffleWriter}
+ import org.apache.spark.shuffle.ShuffleWriteMetricsReporter
import org.apache.spark.shuffle.api.ShuffleExecutorComponents
import org.apache.spark.util.collection.ExternalSorter

private[spark] class SortShuffleWriter[K, V, C](
handle: BaseShuffleHandle[K, V, C],
mapId: Long,
context: TaskContext,
+ writeMetrics: ShuffleWriteMetricsReporter,
shuffleExecutorComponents: ShuffleExecutorComponents)
extends ShuffleWriter[K, V] with Logging {

@@ -46,8 +48,6 @@ private[spark] class SortShuffleWriter[K, V, C](

private var partitionLengths: Array[Long] = _

- private val writeMetrics = context.taskMetrics().shuffleWriteMetrics

/** Write a bunch of records to this task's output */
override def write(records: Iterator[Product2[K, V]]): Unit = {
sorter = if (dep.mapSideCombine) {
@@ -67,7 +67,7 @@
// (see SPARK-3570).
val mapOutputWriter = shuffleExecutorComponents.createMapOutputWriter(
dep.shuffleId, mapId, dep.partitioner.numPartitions)
- sorter.writePartitionedMapOutput(dep.shuffleId, mapId, mapOutputWriter)
+ sorter.writePartitionedMapOutput(dep.shuffleId, mapId, mapOutputWriter, writeMetrics)
partitionLengths = mapOutputWriter.commitAllPartitions(sorter.getChecksums).getPartitionLengths
mapStatus = MapStatus(blockManager.shuffleServerId, partitionLengths, mapId)
}

ExternalSorter.scala
@@ -30,7 +30,7 @@ import org.apache.spark._
import org.apache.spark.executor.ShuffleWriteMetrics
import org.apache.spark.internal.{config, Logging}
import org.apache.spark.serializer._
- import org.apache.spark.shuffle.ShufflePartitionPairsWriter
+ import org.apache.spark.shuffle.{ShufflePartitionPairsWriter, ShuffleWriteMetricsReporter}
import org.apache.spark.shuffle.api.{ShuffleMapOutputWriter, ShufflePartitionWriter}
import org.apache.spark.shuffle.checksum.ShuffleChecksumSupport
import org.apache.spark.storage.{BlockId, DiskBlockObjectWriter, ShuffleBlockId}
@@ -693,7 +693,8 @@ private[spark] class ExternalSorter[K, V, C](
def writePartitionedMapOutput(
shuffleId: Int,
mapId: Long,
- mapOutputWriter: ShuffleMapOutputWriter): Unit = {
+ mapOutputWriter: ShuffleMapOutputWriter,
+ writeMetrics: ShuffleWriteMetricsReporter): Unit = {
if (spills.isEmpty) {
// Case where we only have in-memory data
val collection = if (aggregator.isDefined) map else buffer
@@ -710,7 +711,7 @@
serializerManager,
serInstance,
blockId,
- context.taskMetrics().shuffleWriteMetrics,

Review comment (Member):
Hmm, the metrics passed to getWriter also look like they come from context.taskMetrics().shuffleWriteMetrics; aren't they the same?

Reply (Contributor Author):
It may be a SQLShuffleWriteMetricsReporter, which may not be the same as context.taskMetrics().shuffleWriteMetrics:

    writer = manager.getWriter[Any, Any](
      dep.shuffleHandle,
      mapId,
      context,
      createMetricsReporter(context))
    writer.write(inputs.asInstanceOf[Iterator[_ <: Product2[Any, Any]]])

    def createShuffleWriteProcessor(metrics: Map[String, SQLMetric]): ShuffleWriteProcessor = {
      new ShuffleWriteProcessor {
        override protected def createMetricsReporter(
            context: TaskContext): ShuffleWriteMetricsReporter = {
          new SQLShuffleWriteMetricsReporter(context.taskMetrics().shuffleWriteMetrics, metrics)
        }
      }
    }
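
For context, a minimal self-contained sketch of the wrapping pattern discussed above. The names below are illustrative stand-ins (assumptions), not the actual Spark classes (ShuffleWriteMetricsReporter, ShuffleWriteMetrics, SQLShuffleWriteMetricsReporter): the SQL-side reporter forwards each update to the task-level metrics and to its own SQL counters, so a writer that goes straight to context.taskMetrics().shuffleWriteMetrics keeps the task metrics correct but leaves the SQL-side counters untouched.

    // Illustrative stand-ins only (assumed, simplified shapes of the real interfaces).
    trait WriteMetricsReporter {
      def incBytesWritten(v: Long): Unit
      def incRecordsWritten(v: Long): Unit
    }

    // Stand-in for the task-level metrics behind context.taskMetrics().shuffleWriteMetrics.
    class TaskWriteMetrics extends WriteMetricsReporter {
      var bytesWritten = 0L
      var recordsWritten = 0L
      def incBytesWritten(v: Long): Unit = bytesWritten += v
      def incRecordsWritten(v: Long): Unit = recordsWritten += v
    }

    // Stand-in for the SQL-side reporter: every update goes to the task metrics and to the
    // SQL counters that feed the UI and AQE. A writer that bypasses this wrapper leaves the
    // SQL counters at zero even though the task metrics look correct.
    class SqlWriteMetrics(task: TaskWriteMetrics) extends WriteMetricsReporter {
      var sqlBytesWritten = 0L
      var sqlRecordsWritten = 0L
      def incBytesWritten(v: Long): Unit = { task.incBytesWritten(v); sqlBytesWritten += v }
      def incRecordsWritten(v: Long): Unit = { task.incRecordsWritten(v); sqlRecordsWritten += v }
    }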

+ writeMetrics,
if (partitionChecksums.nonEmpty) partitionChecksums(partitionId) else null)
while (it.hasNext && it.nextPartition() == partitionId) {
it.writeNext(partitionPairsWriter)
@@ -734,7 +735,7 @@
serializerManager,
serInstance,
blockId,
- context.taskMetrics().shuffleWriteMetrics,
+ writeMetrics,
if (partitionChecksums.nonEmpty) partitionChecksums(id) else null)
if (elements.hasNext) {
for (elem <- elements) {

SortShuffleWriterSuite.scala
@@ -85,6 +85,7 @@ class SortShuffleWriterSuite
shuffleHandle,
mapId = 1,
context,
+ context.taskMetrics().shuffleWriteMetrics,
shuffleExecutorComponents)
writer.write(Iterator.empty)
writer.stop(success = true)
@@ -102,6 +103,7 @@ class SortShuffleWriterSuite
shuffleHandle,
mapId = 2,
context,
+ context.taskMetrics().shuffleWriteMetrics,
shuffleExecutorComponents)
writer.write(records.iterator)
writer.stop(success = true)
@@ -158,6 +160,7 @@ class SortShuffleWriterSuite
shuffleHandle,
mapId = 0,
context,
+ context.taskMetrics().shuffleWriteMetrics,
new LocalDiskShuffleExecutorComponents(
conf, shuffleBlockResolver._blockManager, shuffleBlockResolver))
writer.write(records.iterator)

UnsafeRowSerializerSuite.scala
@@ -130,7 +130,8 @@ class UnsafeRowSerializerSuite extends SparkFunSuite with LocalSparkSession {
assert(sorter.numSpills > 0)

// Merging spilled files should not throw assertion error
- sorter.writePartitionedMapOutput(0, 0, mapOutputWriter)
+ sorter.writePartitionedMapOutput(0, 0, mapOutputWriter,
+   taskContext.taskMetrics.shuffleWriteMetrics)
}

test("SPARK-10403: unsafe row serializer with SortShuffleManager") {

AdaptiveQueryExecSuite.scala
@@ -2502,6 +2502,26 @@ class AdaptiveQueryExecSuite
}
}

test("SPARK-48037: Fix SortShuffleWriter lacks shuffle write related metrics " +
"resulting in potentially inaccurate data") {
withTable("t3") {
withSQLConf(
SQLConf.ADAPTIVE_EXECUTION_ENABLED.key -> "true",
SQLConf.SHUFFLE_PARTITIONS.key -> "16777217") {
sql("CREATE TABLE t3 USING PARQUET AS SELECT id FROM range(2)")
val (plan, adaptivePlan) = runAdaptiveAndVerifyResult(
"""
|SELECT id, count(*)
|FROM t3
|GROUP BY id
|LIMIT 1
|""".stripMargin, skipCheckAnswer = true)

Review comment (Contributor):
Do we have to skip checking the answer? I think the query could use LIMIT 10 so that the result is deterministic.

Reply (Contributor Author):
Because AQE is disabled when the results are checked, there are many partitions and the row order is not guaranteed; when AQE is enabled they are merged into one partition. For example:

set spark.sql.adaptive.enabled=false;
set spark.sql.shuffle.partitions=1000;
create table foo as select id from range(2);
select id, count(*) from foo group by id limit 1;

Output:

1	1

Review comment (Contributor):
AFAIK the checkAnswer util will sort the data before comparison.

Reply (Contributor Author, @cxzl25, May 7, 2024):
It does sort, but only locally on the collected result; because the rows returned by the LIMIT are themselves nondeterministic, the local sort does not make the comparison deterministic:

    def getErrorMessageInCheckAnswer(
        df: DataFrame,
        expectedAnswer: Seq[Row],
        checkToRDD: Boolean = true): Option[String] = {
      val isSorted = df.logicalPlan.collect { case s: logical.Sort => s }.nonEmpty
      if (checkToRDD) {
        SQLExecution.withSQLConfPropagated(df.sparkSession) {
          df.rdd.count() // Also attempt to deserialize as an RDD [SPARK-15791]
        }
      }
      val sparkAnswer = try df.collect().toSeq catch {

Review comment (Contributor):
Could we make it deterministic by making the limit larger than the number of result rows?

Reply (Contributor Author):
In this test case the answer check runs with spark.sql.adaptive.enabled=false, so partitions are not merged; with such a large number of partitions and tasks, it would take a large amount of driver memory to execute successfully.

assert(findTopLevelLimit(plan).size == 1)
assert(findTopLevelLimit(adaptivePlan).size == 1)

Review comment (Member):
Hmm, this only verifies that a specific operator (i.e., Limit) is in the query plan; how is it related to the metrics you want to fix?

Follow-up (Member):
Oh, I see. It is due to AQE's use of runtime metrics.

}
}
}
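
A note on the test setup, as an inference from reading the shuffle manager code rather than something stated in this thread: spark.sql.shuffle.partitions is set to 16777217, one more than 2^24, so that neither the bypass-merge-sort path nor the serialized (unsafe) path is eligible and the shuffle falls back to SortShuffleWriter, the writer this PR fixes; AQE's runtime statistics for the stage are then derived from the metrics that writer reports. A simplified sketch of the writer selection, with thresholds that are assumptions from my reading of SortShuffleManager:

    // Simplified sketch; see SortShuffleManager.registerShuffle and
    // SortShuffleWriter.shouldBypassMergeSort for the authoritative logic.
    def chooseWriter(
        numPartitions: Int,
        mapSideCombine: Boolean,
        serializerSupportsRelocation: Boolean): String = {
      val bypassMergeThreshold = 200         // assumed default of spark.shuffle.sort.bypassMergeThreshold
      val maxSerializedPartitions = 1 << 24  // assumed PackedRecordPointer partition-id limit (16777216)
      if (!mapSideCombine && numPartitions <= bypassMergeThreshold) {
        "BypassMergeSortShuffleWriter"
      } else if (!mapSideCombine && serializerSupportsRelocation &&
          numPartitions <= maxSerializedPartitions) {
        "UnsafeShuffleWriter"
      } else {
        "SortShuffleWriter" // 16777217 reduce partitions always ends up here
      }
    }

    // e.g. chooseWriter(16777217, mapSideCombine = false, serializerSupportsRelocation = true)
    // returns "SortShuffleWriter"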

test("SPARK-37063: OptimizeSkewInRebalancePartitions support optimize non-root node") {
withTempView("v") {
withSQLConf(