
Commit 06674ba

[SPARK-53942][SS] Support changing stateless shuffle partitions upon restart of streaming query
### What changes were proposed in this pull request?

This PR proposes to support changing stateless shuffle partitions upon restart of a streaming query. We don't introduce a new config for this; users can simply do the following to change the number of shuffle partitions:

* stop the query
* change the value of `spark.sql.shuffle.partitions`
* restart the query for the change to take effect

Note that state partitions remain fixed and are unaffected by this. That is, the value of `spark.sql.shuffle.partitions` at batch 0 becomes the number of state partitions and does not change even if the value of the config is changed upon restart.

As an implementation detail, this PR adds a new "internal" SQL config, `spark.sql.streaming.internal.stateStore.partitions`, to distinguish stateless shuffle partitions from stateful shuffle partitions. Unlike other internal configs, where we still expect someone (an admin?) to use them, this config is NOT meant to be user-facing, and no one should set it directly. We add this config purely as a compatibility trick, nothing else. We don't support compatibility for this config, and there is no promise it will remain available in the future. The config description states this as a WARN. That said, the value of the new config is expected to be inherited from `spark.sql.shuffle.partitions`, assuming no one sets it directly.

To support compatibility, we employ a trick in the offset log: for stateful shuffle partitions, we refer to `spark.sql.streaming.internal.stateStore.partitions` in the session config but keep using `spark.sql.shuffle.partitions` in the offset log. We handle the rebinding between the two configs so that the persistence layer is unchanged. This way, the query can be both upgraded and downgraded.

### Why are the changes needed?

Whenever there is a need to change the parallelism of processing (e.g., the input volume changes over time, the size of a static table changes over time, or there is skew in a stream-static join, though AQE may help resolve this a bit), the only official approach was to discard the checkpoint and start a new query, implying a full backfill. (For workloads with a foreachBatch (FEB) sink, advanced (and adventurous) users could change the config in their user function, but that's arguably a hack.) Having to discard the checkpoint is one of the major pain points of using Structured Streaming, and we want to address one of its known causes.

### Does this PR introduce _any_ user-facing change?

Yes. Users can change shuffle partitions for stateless operators upon restart by changing the config `spark.sql.shuffle.partitions`.

### How was this patch tested?

New UTs.

### Was this patch authored or co-authored using generative AI tooling?

No.

Closes #52645 from HeartSaVioR/WIP-change-stateless-shuffle-partitions-in-streaming-query.

Authored-by: Jungtaek Lim <[email protected]>
Signed-off-by: Jungtaek Lim <[email protected]>
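As a concrete illustration of the restart flow described above, here is a minimal sketch of a stateless streaming query (the rate source, static table name, and paths are hypothetical illustrations, not part of this PR):

```scala
import org.apache.spark.sql.SparkSession

val spark = SparkSession.builder().getOrCreate()

// A stateless query with a shuffle: a stream-static join on a hypothetical table.
def startQuery() = {
  val static = spark.read.table("dim_table")        // hypothetical static table
  spark.readStream.format("rate").load()
    .selectExpr("value % 100 AS key", "timestamp")
    .join(static, "key")                            // stateless shuffle
    .writeStream
    .format("parquet")
    .option("path", "/tmp/demo/out")                // hypothetical paths
    .option("checkpointLocation", "/tmp/demo/ckpt")
    .start()
}

// Run 1: start with the default parallelism, then stop the query.
spark.conf.set("spark.sql.shuffle.partitions", "200")
val q1 = startQuery()
// ... after some batches ...
q1.stop()

// Run 2: change the config and restart. With this PR, the stateless shuffle now
// uses 50 partitions, while stateful operators would keep the partitioning
// recorded in the checkpoint.
spark.conf.set("spark.sql.shuffle.partitions", "50")
val q2 = startQuery()
```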
1 parent a1f3dcb commit 06674ba

File tree: 15 files changed, +289 −23 lines changed


sql/catalyst/src/main/scala/org/apache/spark/sql/internal/SQLConf.scala

Lines changed: 17 additions & 3 deletions
@@ -877,9 +877,7 @@ object SQLConf {
       .createOptional
 
   val SHUFFLE_PARTITIONS = buildConf("spark.sql.shuffle.partitions")
-    .doc("The default number of partitions to use when shuffling data for joins or aggregations. " +
-      "Note: For structured streaming, this configuration cannot be changed between query " +
-      "restarts from the same checkpoint location.")
+    .doc("The default number of partitions to use when shuffling data for joins or aggregations.")
     .version("1.1.0")
     .intConf
     .checkValue(_ > 0, "The value of spark.sql.shuffle.partitions must be positive")
@@ -2627,6 +2625,22 @@ object SQLConf {
       .checkValue(k => k >= 0, "Must be greater than or equal to 0")
       .createWithDefault(5)
 
+  val STATEFUL_SHUFFLE_PARTITIONS_INTERNAL =
+    buildConf("spark.sql.streaming.internal.stateStore.partitions")
+      .doc("WARN: This config is used internally and is not intended to be user-facing. This " +
+        "config can be removed without support of compatibility in any time. " +
+        "DO NOT USE THIS CONFIG DIRECTLY AND USE THE CONFIG `spark.sql.shuffle.partitions`. " +
+        "The default number of partitions to use when shuffling data for stateful operations. " +
+        "If not specified, this config picks up the value of `spark.sql.shuffle.partitions`. " +
+        "Note: For structured streaming, this configuration cannot be changed between query " +
+        "restarts from the same checkpoint location.")
+      .internal()
+      .intConf
+      .checkValue(_ > 0,
+        "The value of spark.sql.streaming.internal.stateStore.partitions must be a positive " +
+        "integer.")
+      .createOptional
+
   val FLATMAPGROUPSWITHSTATE_STATE_FORMAT_VERSION =
     buildConf("spark.sql.streaming.flatMapGroupsWithState.stateFormatVersion")
       .internal()

sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/checkpointing/OffsetSeq.scala

Lines changed: 72 additions & 18 deletions
@@ -17,11 +17,14 @@
 
 package org.apache.spark.sql.execution.streaming.checkpointing
 
+import scala.language.existentials
+
 import org.json4s.{Formats, NoTypeHints}
 import org.json4s.jackson.Serialization
 
 import org.apache.spark.internal.Logging
 import org.apache.spark.internal.LogKeys.{CONFIG, DEFAULT_VALUE, NEW_VALUE, OLD_VALUE, TIP}
+import org.apache.spark.internal.config.ConfigEntry
 import org.apache.spark.io.CompressionCodec
 import org.apache.spark.sql.RuntimeConfig
 import org.apache.spark.sql.connector.read.streaming.{Offset => OffsetV2, SparkDataStream}
@@ -85,6 +88,11 @@ object OffsetSeq {
  * @param batchTimestampMs: The current batch processing timestamp.
  *                          Time unit: milliseconds
  * @param conf: Additional conf_s to be persisted across batches, e.g. number of shuffle partitions.
+ *              CAVEAT: This does not apply the logic we handle in [[OffsetSeqMetadata]] object, e.g.
+ *              deducing the default value of SQL config if the entry does not exist in the offset log,
+ *              resolving the re-bind of config key (the config key in offset log is not same with the
+ *              actual key in session), etc. If you need to get the value with applying the logic, use
+ *              [[OffsetSeqMetadata.readValue()]].
  */
 case class OffsetSeqMetadata(
     batchWatermarkMs: Long = 0,
@@ -101,13 +109,35 @@ object OffsetSeqMetadata extends Logging {
    * log in the checkpoint position.
    */
   private val relevantSQLConfs = Seq(
-    SHUFFLE_PARTITIONS, STATE_STORE_PROVIDER_CLASS, STREAMING_MULTIPLE_WATERMARK_POLICY,
+    STATE_STORE_PROVIDER_CLASS, STREAMING_MULTIPLE_WATERMARK_POLICY,
     FLATMAPGROUPSWITHSTATE_STATE_FORMAT_VERSION, STREAMING_AGGREGATION_STATE_FORMAT_VERSION,
     STREAMING_JOIN_STATE_FORMAT_VERSION, STATE_STORE_COMPRESSION_CODEC,
     STATE_STORE_ROCKSDB_FORMAT_VERSION, STATEFUL_OPERATOR_USE_STRICT_DISTRIBUTION,
     PRUNE_FILTERS_CAN_PRUNE_STREAMING_SUBPLAN, STREAMING_STATE_STORE_ENCODING_FORMAT
   )
 
+  /**
+   * This is an extension of `relevantSQLConfs`. The characteristic is the same, but we persist the
+   * value of config A as config B in offset log. This exists for compatibility purpose e.g. if
+   * user upgrades Spark and runs a streaming query, but has to downgrade due to some issues.
+   *
+   * A config should be only bound to either `relevantSQLConfs` or `rebindSQLConfs` (key or value).
+   */
+  private val rebindSQLConfsSessionToOffsetLog: Map[ConfigEntry[_], ConfigEntry[_]] = {
+    Map(
+      // TODO: The proper way to handle this is to make the number of partitions in the state
+      // metadata as the source of truth, but it requires major changes if we want to take care
+      // of compatibility.
+      STATEFUL_SHUFFLE_PARTITIONS_INTERNAL -> SHUFFLE_PARTITIONS
+    )
+  }
+
+  /**
+   * Reversed index of `rebindSQLConfsSessionToOffsetLog`.
+   */
+  private val rebindSQLConfsOffsetLogToSession: Map[ConfigEntry[_], ConfigEntry[_]] =
+    rebindSQLConfsSessionToOffsetLog.map { case (k, v) => (v, k) }.toMap
+
   /**
    * Default values of relevant configurations that are used for backward compatibility.
    * As new configurations are added to the metadata, existing checkpoints may not have those
@@ -132,56 +162,80 @@ object OffsetSeqMetadata extends Logging {
     STREAMING_STATE_STORE_ENCODING_FORMAT.key -> "unsaferow"
   )
 
+  def readValue[T](metadataLog: OffsetSeqMetadata, confKey: ConfigEntry[T]): String = {
+    readValueOpt(metadataLog, confKey).getOrElse(confKey.defaultValueString)
+  }
+
+  def readValueOpt[T](
+      metadataLog: OffsetSeqMetadata,
+      confKey: ConfigEntry[T]): Option[String] = {
+    val actualKey = if (rebindSQLConfsSessionToOffsetLog.contains(confKey)) {
+      rebindSQLConfsSessionToOffsetLog(confKey)
+    } else confKey
+
+    metadataLog.conf.get(actualKey.key).orElse(relevantSQLConfDefaultValues.get(actualKey.key))
+  }
+
   def apply(json: String): OffsetSeqMetadata = Serialization.read[OffsetSeqMetadata](json)
 
   def apply(
       batchWatermarkMs: Long,
       batchTimestampMs: Long,
       sessionConf: RuntimeConfig): OffsetSeqMetadata = {
     val confs = relevantSQLConfs.map { conf => conf.key -> sessionConf.get(conf.key) }.toMap
-    OffsetSeqMetadata(batchWatermarkMs, batchTimestampMs, confs)
+    val confsFromRebind = rebindSQLConfsSessionToOffsetLog.map {
+      case (confInSession, confInOffsetLog) =>
+        confInOffsetLog.key -> sessionConf.get(confInSession.key)
+    }.toMap
+    OffsetSeqMetadata(batchWatermarkMs, batchTimestampMs, confs ++ confsFromRebind)
   }
 
   /** Set the SparkSession configuration with the values in the metadata */
   def setSessionConf(metadata: OffsetSeqMetadata, sessionConf: SQLConf): Unit = {
-    val configs = sessionConf.getAllConfs
-    OffsetSeqMetadata.relevantSQLConfs.map(_.key).foreach { confKey =>
-
-      metadata.conf.get(confKey) match {
+    def setOneSessionConf(confKeyInOffsetLog: String, confKeyInSession: String): Unit = {
+      metadata.conf.get(confKeyInOffsetLog) match {
 
         case Some(valueInMetadata) =>
           // Config value exists in the metadata, update the session config with this value
-          val optionalValueInSession = sessionConf.getConfString(confKey, null)
+          val optionalValueInSession = sessionConf.getConfString(confKeyInSession, null)
           if (optionalValueInSession != null && optionalValueInSession != valueInMetadata) {
-            logWarning(log"Updating the value of conf '${MDC(CONFIG, confKey)}' in current " +
-              log"session from '${MDC(OLD_VALUE, optionalValueInSession)}' " +
+            logWarning(log"Updating the value of conf '${MDC(CONFIG, confKeyInSession)}' in " +
+              log"current session from '${MDC(OLD_VALUE, optionalValueInSession)}' " +
              log"to '${MDC(NEW_VALUE, valueInMetadata)}'.")
           }
-          sessionConf.setConfString(confKey, valueInMetadata)
+          sessionConf.setConfString(confKeyInSession, valueInMetadata)
 
         case None =>
           // For backward compatibility, if a config was not recorded in the offset log,
           // then either inject a default value (if specified in `relevantSQLConfDefaultValues`) or
          // let the existing conf value in SparkSession prevail.
-          relevantSQLConfDefaultValues.get(confKey) match {
+          relevantSQLConfDefaultValues.get(confKeyInOffsetLog) match {

            case Some(defaultValue) =>
-              sessionConf.setConfString(confKey, defaultValue)
-              logWarning(log"Conf '${MDC(CONFIG, confKey)}' was not found in the offset log, " +
-                log"using default value '${MDC(DEFAULT_VALUE, defaultValue)}'")
+              sessionConf.setConfString(confKeyInSession, defaultValue)
+              logWarning(log"Conf '${MDC(CONFIG, confKeyInSession)}' was not found in the offset " +
+                log"log, using default value '${MDC(DEFAULT_VALUE, defaultValue)}'")

            case None =>
-              val value = sessionConf.getConfString(confKey, null)
+              val value = sessionConf.getConfString(confKeyInSession, null)
              val valueStr = if (value != null) {
                s" Using existing session conf value '$value'."
              } else {
                " No value set in session conf."
              }
-              logWarning(log"Conf '${MDC(CONFIG, confKey)}' was not found in the offset log. " +
-                log"${MDC(TIP, valueStr)}")
+              logWarning(log"Conf '${MDC(CONFIG, confKeyInSession)}' was not found in the " +
+                log"offset log. ${MDC(TIP, valueStr)}")
          }
      }
    }
+
+    OffsetSeqMetadata.relevantSQLConfs.map(_.key).foreach { confKey =>
+      setOneSessionConf(confKey, confKey)
+    }
+
+    rebindSQLConfsOffsetLogToSession.foreach {
+      case (confInOffsetLog, confInSession) =>
+        setOneSessionConf(confInOffsetLog.key, confInSession.key)
+    }
   }
 }
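To make the rebinding concrete, here is a self-contained toy model of the round trip (plain Scala maps standing in for the session conf and the offset log; an illustration, not Spark API):

```scala
// In the session, the stateful partition count lives under the internal key,
// but it is persisted in the offset log under the legacy key so that older
// Spark versions can still read the checkpoint.
val internalKey = "spark.sql.streaming.internal.stateStore.partitions"
val legacyKey = "spark.sql.shuffle.partitions"

// Write path: session -> offset log (key rebound, value preserved).
def toOffsetLog(session: Map[String, String]): Map[String, String] =
  session.get(internalKey).map(v => Map(legacyKey -> v)).getOrElse(Map.empty)

// Read path: offset log -> session (key rebound back).
def fromOffsetLog(offsetLog: Map[String, String]): Map[String, String] =
  offsetLog.get(legacyKey).map(v => Map(internalKey -> v)).getOrElse(Map.empty)

// The session may carry a different stateless value (50) without affecting
// what gets persisted for stateful operators (5).
val session = Map(internalKey -> "5", legacyKey -> "50")
val persisted = toOffsetLog(session)
assert(persisted == Map(legacyKey -> "5"))
assert(fromOffsetLog(persisted) == Map(internalKey -> "5"))
```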

sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/IncrementalExecution.scala

Lines changed: 2 additions & 1 deletion
@@ -105,7 +105,8 @@ class IncrementalExecution(
 
   private lazy val hadoopConf = sparkSession.sessionState.newHadoopConf()
 
-  private[sql] val numStateStores = offsetSeqMetadata.conf.get(SQLConf.SHUFFLE_PARTITIONS.key)
+  private[sql] val numStateStores = OffsetSeqMetadata.readValueOpt(offsetSeqMetadata,
+    SQLConf.STATEFUL_SHUFFLE_PARTITIONS_INTERNAL)
     .map(SQLConf.SHUFFLE_PARTITIONS.valueConverter)
     .getOrElse(sparkSession.sessionState.conf.numShufflePartitions)
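The resolution order here can be summarized as a small sketch (plain Scala, not the real classes): prefer the value recorded in the offset log (rebound from the legacy key), and fall back to the session's current shuffle partitions only for checkpoints written before this change.

```scala
def numStateStores(offsetLogValue: Option[String], sessionShufflePartitions: Int): Int =
  offsetLogValue.map(_.toInt).getOrElse(sessionShufflePartitions)

assert(numStateStores(Some("5"), 200) == 5)  // checkpoint pins state partitions
assert(numStateStores(None, 200) == 200)     // legacy checkpoint: use session value
```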

sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/StreamExecution.scala

Lines changed: 11 additions & 1 deletion
@@ -155,7 +155,7 @@ abstract class StreamExecution(
   protected def sources: Seq[SparkDataStream]
 
   /** Isolated spark session to run the batches with. */
-  protected val sparkSessionForStream: SparkSession = sparkSession.cloneSession()
+  protected[sql] val sparkSessionForStream: SparkSession = sparkSession.cloneSession()
 
   /**
    * Manages the metadata from this checkpoint location.
@@ -320,6 +320,16 @@ abstract class StreamExecution(
       sparkSessionForStream.conf.set(SQLConf.ADAPTIVE_EXECUTION_ENABLED.key, "false")
     }
 
+    sparkSessionForStream.conf.get(SQLConf.STATEFUL_SHUFFLE_PARTITIONS_INTERNAL) match {
+      case Some(_) => // no-op
+      case None =>
+        // Take the default value of `spark.sql.shuffle.partitions`.
+        val shufflePartitionValue = sparkSessionForStream.conf.get(SQLConf.SHUFFLE_PARTITIONS)
+        sparkSessionForStream.conf.set(
+          SQLConf.STATEFUL_SHUFFLE_PARTITIONS_INTERNAL.key,
+          shufflePartitionValue)
+    }
+
     getLatestExecutionContext().updateStatusMessage("Initializing sources")
     // force initialization of the logical plan so that the sources can be created
     logicalPlan
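Putting the seeding above together with the offset-log rebind, an end-to-end toy timeline of a restart looks like this (plain Scala maps, not Spark API):

```scala
val internalKey = "spark.sql.streaming.internal.stateStore.partitions"
val statelessKey = "spark.sql.shuffle.partitions"

// Run 1, batch 0: the internal config is unset, so it is seeded from the
// stateless value, and the seeded value is persisted under the legacy key.
var session = Map(statelessKey -> "200")
session += internalKey -> session(statelessKey)
val offsetLog = Map(statelessKey -> session(internalKey))

// Restart with a different stateless parallelism.
session = Map(statelessKey -> "50")
// Restoring the offset log rebinds the legacy key back to the internal key,
// leaving the session's stateless value untouched.
session += internalKey -> offsetLog(statelessKey)

assert(session(statelessKey) == "50")  // stateless shuffles: changed on restart
assert(session(internalKey) == "200")  // stateful operators: pinned by checkpoint
```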
Lines changed: 2 additions & 0 deletions (new checkpoint resource file; path not shown)
@@ -0,0 +1,2 @@
+v1
+{"nextBatchWatermarkMs":0}

Lines changed: 1 addition & 0 deletions (new checkpoint resource file; path not shown)
@@ -0,0 +1 @@
+{"id":"295ee44f-dd99-45cf-a21d-9a760b439c45"}

Lines changed: 3 additions & 0 deletions (new checkpoint resource file; path not shown)
@@ -0,0 +1,3 @@
+v1
+{"batchWatermarkMs":0,"batchTimestampMs":1760948082021,"conf":{"spark.sql.streaming.stateStore.providerClass":"org.apache.spark.sql.execution.streaming.state.HDFSBackedStateStoreProvider","spark.sql.streaming.stateStore.rocksdb.formatVersion":"5","spark.sql.streaming.stateStore.encodingFormat":"unsaferow","spark.sql.streaming.statefulOperator.useStrictDistribution":"true","spark.sql.streaming.flatMapGroupsWithState.stateFormatVersion":"2","spark.sql.streaming.multipleWatermarkPolicy":"min","spark.sql.streaming.aggregation.stateFormatVersion":"2","spark.sql.shuffle.partitions":"5","spark.sql.streaming.join.stateFormatVersion":"2","spark.sql.streaming.stateStore.compression.codec":"lz4","spark.sql.optimizer.pruneFiltersCanPruneStreamingSubplan":"false"}}
+0
