Commit 63dfb5d

Change the strategy: "add new option" -> "apply by default, but keep backward compatible"
1 parent: 977428c

8 files changed: +78 −63 lines changed


sql/catalyst/src/main/scala/org/apache/spark/sql/internal/SQLConf.scala

Lines changed: 8 additions & 11 deletions
@@ -871,15 +871,15 @@ object SQLConf {
       .intConf
       .createWithDefault(2)
 
-  val ADVANCED_REMOVE_REDUNDANT_IN_STATEFUL_AGGREGATION =
-    buildConf("spark.sql.streaming.advanced.removeRedundantInStatefulAggregation")
+  val STREAMING_AGGREGATION_STATE_FORMAT_VERSION =
+    buildConf("spark.sql.streaming.streamingAggregation.stateFormatVersion")
       .internal()
-      .doc("ADVANCED: When true, stateful aggregation tries to remove redundant data " +
-        "between key and value in state. Enabling this option helps minimizing state size, " +
-        "but no longer be compatible with state with disabling this option." +
-        "You can't change this option after starting the query.")
-      .booleanConf
-      .createWithDefault(false)
+      .doc("State format version used by streaming aggregation operations triggered " +
+        "explicitly or implicitly via agg() in a streaming query. State between versions " +
+        "tends to be incompatible, so the format version shouldn't be modified after running.")
+      .intConf
+      .checkValue(v => Set(1, 2).contains(v), "Valid versions are 1 and 2")
+      .createWithDefault(2)
 
   val UNSUPPORTED_OPERATION_CHECK_ENABLED =
     buildConf("spark.sql.streaming.unsupportedOperationCheck")
 
@@ -1628,9 +1628,6 @@ class SQLConf extends Serializable with Logging {
   def advancedPartitionPredicatePushdownEnabled: Boolean =
     getConf(ADVANCED_PARTITION_PREDICATE_PUSHDOWN)
 
-  def advancedRemoveRedundantInStatefulAggregation: Boolean =
-    getConf(ADVANCED_REMOVE_REDUNDANT_IN_STATEFUL_AGGREGATION)
-
   def fallBackToHdfsForStatsEnabled: Boolean = getConf(ENABLE_FALL_BACK_TO_HDFS_FOR_STATS)
 
   def preferSortMergeJoin: Boolean = getConf(PREFER_SORTMERGEJOIN)
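
For context, a hedged usage sketch (not part of this commit): since the default is now version 2, the only reason to touch this internal conf is to pin a brand-new query to the legacy layout, and the value must then stay fixed for the lifetime of the checkpoint.

    // Illustrative only: pin the legacy (version 1) state format before
    // starting a brand-new query. State written by one version is not
    // readable by the other, so this must never change once the query runs.
    spark.conf.set(
      "spark.sql.streaming.streamingAggregation.stateFormatVersion", "1")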

sql/core/src/main/scala/org/apache/spark/sql/execution/SparkStrategies.scala

Lines changed: 3 additions & 0 deletions
@@ -328,10 +328,13 @@ abstract class SparkStrategies extends QueryPlanner[SparkPlan] {
             "Streaming aggregation doesn't support group aggregate pandas UDF")
         }
 
+        val stateVersion = conf.getConf(SQLConf.STREAMING_AGGREGATION_STATE_FORMAT_VERSION)
+
         aggregate.AggUtils.planStreamingAggregation(
           namedGroupingExpressions,
           aggregateExpressions.map(expr => expr.asInstanceOf[AggregateExpression]),
           rewrittenResultExpressions,
+          stateVersion,
           planLater(child))
 
       case _ => Nil
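
Note that the version is resolved from the session conf once, at planning time, and threaded explicitly into the physical operators, replacing the old pattern in which each stateful operator looked the flag up via sqlContext.conf inside doExecute().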

sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/AggUtils.scala

Lines changed: 4 additions & 1 deletion
@@ -256,6 +256,7 @@ object AggUtils {
       groupingExpressions: Seq[NamedExpression],
       functionsWithoutDistinct: Seq[AggregateExpression],
       resultExpressions: Seq[NamedExpression],
+      stateFormatVersion: Int,
       child: SparkPlan): Seq[SparkPlan] = {
 
     val groupingAttributes = groupingExpressions.map(_.toAttribute)
 
@@ -287,7 +288,8 @@
         child = partialAggregate)
     }
 
-    val restored = StateStoreRestoreExec(groupingAttributes, None, partialMerged1)
+    val restored = StateStoreRestoreExec(groupingAttributes, None, stateFormatVersion,
+      partialMerged1)
 
     val partialMerged2: SparkPlan = {
       val aggregateExpressions = functionsWithoutDistinct.map(_.copy(mode = PartialMerge))
 
@@ -311,6 +313,7 @@
         stateInfo = None,
         outputMode = None,
         eventTimeWatermark = None,
+        stateFormatVersion = stateFormatVersion,
         partialMerged2)
 
     val finalAndCompleteAggregate: SparkPlan = {

sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/IncrementalExecution.scala

Lines changed: 4 additions & 2 deletions
@@ -100,19 +100,21 @@ class IncrementalExecution(
   val state = new Rule[SparkPlan] {
 
     override def apply(plan: SparkPlan): SparkPlan = plan transform {
-      case StateStoreSaveExec(keys, None, None, None,
+      case StateStoreSaveExec(keys, None, None, None, stateFormatVersion,
         UnaryExecNode(agg,
-          StateStoreRestoreExec(_, None, child))) =>
+          StateStoreRestoreExec(_, None, _, child))) =>
         val aggStateInfo = nextStatefulOperationStateInfo
         StateStoreSaveExec(
           keys,
           Some(aggStateInfo),
           Some(outputMode),
           Some(offsetSeqMetadata.batchWatermarkMs),
+          stateFormatVersion,
           agg.withNewChildren(
             StateStoreRestoreExec(
               keys,
               Some(aggStateInfo),
+              stateFormatVersion,
               child) :: Nil))
 
       case StreamingDeduplicateExec(keys, child, None, None) =>

sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/OffsetSeq.scala

Lines changed: 4 additions & 2 deletions
@@ -89,7 +89,7 @@ object OffsetSeqMetadata extends Logging {
   private implicit val format = Serialization.formats(NoTypeHints)
   private val relevantSQLConfs = Seq(
     SHUFFLE_PARTITIONS, STATE_STORE_PROVIDER_CLASS, STREAMING_MULTIPLE_WATERMARK_POLICY,
-    FLATMAPGROUPSWITHSTATE_STATE_FORMAT_VERSION, ADVANCED_REMOVE_REDUNDANT_IN_STATEFUL_AGGREGATION)
+    FLATMAPGROUPSWITHSTATE_STATE_FORMAT_VERSION, STREAMING_AGGREGATION_STATE_FORMAT_VERSION)
 
   /**
    * Default values of relevant configurations that are used for backward compatibility.
 
@@ -104,7 +104,9 @@ object OffsetSeqMetadata extends Logging {
   private val relevantSQLConfDefaultValues = Map[String, String](
     STREAMING_MULTIPLE_WATERMARK_POLICY.key -> MultipleWatermarkPolicy.DEFAULT_POLICY_NAME,
     FLATMAPGROUPSWITHSTATE_STATE_FORMAT_VERSION.key ->
-      FlatMapGroupsWithStateExecHelper.legacyVersion.toString
+      FlatMapGroupsWithStateExecHelper.legacyVersion.toString,
+    STREAMING_AGGREGATION_STATE_FORMAT_VERSION.key ->
+      StatefulOperatorsHelper.legacyVersion.toString
   )
 
   def apply(json: String): OffsetSeqMetadata = Serialization.read[OffsetSeqMetadata](json)
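
This default-value map is what makes "apply by default, but keep backward compatible" work: new checkpoints record the conf (now defaulting to 2) in their offset log, while a checkpoint written before the conf existed has no entry and falls back to StatefulOperatorsHelper.legacyVersion, i.e. version 1, so its old state stays readable. A rough sketch of that fallback rule, assuming missing recorded confs are resolved through this map (the helper below is illustrative, not actual OffsetSeqMetadata code):

    // Hypothetical helper: a conf key absent from an old offset log resolves to
    // its backward-compatible default rather than the current session default.
    def resolveForRestart(key: String, recorded: Map[String, String]): Option[String] =
      recorded.get(key).orElse(relevantSQLConfDefaultValues.get(key))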

sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StatefulOperatorsHelper.scala

Lines changed: 10 additions & 9 deletions
@@ -22,10 +22,13 @@ import org.apache.spark.sql.catalyst.InternalRow
 import org.apache.spark.sql.catalyst.expressions.{Attribute, UnsafeRow}
 import org.apache.spark.sql.catalyst.expressions.codegen.{GenerateUnsafeProjection, GenerateUnsafeRowJoiner}
 import org.apache.spark.sql.execution.streaming.state.{StateStore, UnsafeRowPair}
-import org.apache.spark.sql.internal.SQLConf
 import org.apache.spark.sql.types.StructType
 
 object StatefulOperatorsHelper {
+
+  val supportedVersions = Seq(1, 2)
+  val legacyVersion = 1
+
   sealed trait StreamingAggregationStateManager extends Serializable {
     def extractKey(row: InternalRow): UnsafeRow
     def getValueExpressions: Seq[Attribute]
 
@@ -35,16 +38,14 @@ object StatefulOperatorsHelper {
   }
 
   object StreamingAggregationStateManager extends Logging {
-    def newImpl(
+    def createStateManager(
         keyExpressions: Seq[Attribute],
         childOutput: Seq[Attribute],
-        conf: SQLConf): StreamingAggregationStateManager = {
-
-      if (conf.advancedRemoveRedundantInStatefulAggregation) {
-        log.info("Advanced option removeRedundantInStatefulAggregation activated!")
-        new StreamingAggregationStateManagerImplV2(keyExpressions, childOutput)
-      } else {
-        new StreamingAggregationStateManagerImplV1(keyExpressions, childOutput)
+        stateFormatVersion: Int): StreamingAggregationStateManager = {
+      stateFormatVersion match {
+        case 1 => new StreamingAggregationStateManagerImplV1(keyExpressions, childOutput)
+        case 2 => new StreamingAggregationStateManagerImplV2(keyExpressions, childOutput)
+        case _ => throw new IllegalArgumentException(s"Version $stateFormatVersion is invalid")
       }
     }
   }
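
The two implementations correspond to what the old boolean toggled. Going by the removed option's description ("remove redundant data between key and value in state"), version 1 keeps the grouping keys duplicated in the state value, while version 2 drops them from the value to shrink state size. A minimal sketch of the factory, with placeholder attributes standing in for a real plan's output:

    // Placeholders for a real operator's grouping keys and child output.
    val keyAttrs: Seq[Attribute] = ???
    val childOutput: Seq[Attribute] = ???

    // Version 1 (legacy): value rows duplicate the grouping keys.
    // Version 2 (default): value rows carry only the non-key columns.
    val manager = StreamingAggregationStateManager.createStateManager(
      keyAttrs, childOutput, stateFormatVersion = 2)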

sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/statefulOperators.scala

Lines changed: 8 additions & 5 deletions
@@ -200,13 +200,15 @@ object WatermarkSupport {
 case class StateStoreRestoreExec(
     keyExpressions: Seq[Attribute],
     stateInfo: Option[StatefulOperatorStateInfo],
+    stateFormatVersion: Int,
     child: SparkPlan)
   extends UnaryExecNode with StateStoreReader {
 
+  private[sql] val stateManager = StreamingAggregationStateManager.createStateManager(
+    keyExpressions, child.output, stateFormatVersion)
+
   override protected def doExecute(): RDD[InternalRow] = {
     val numOutputRows = longMetric("numOutputRows")
-    val stateManager = StreamingAggregationStateManager.newImpl(keyExpressions, child.output,
-      sqlContext.conf)
 
     child.execute().mapPartitionsWithStateStore(
       getStateInfo,
 
@@ -255,17 +257,18 @@ case class StateStoreSaveExec(
     stateInfo: Option[StatefulOperatorStateInfo] = None,
     outputMode: Option[OutputMode] = None,
     eventTimeWatermark: Option[Long] = None,
+    stateFormatVersion: Int,
     child: SparkPlan)
   extends UnaryExecNode with StateStoreWriter with WatermarkSupport {
 
+  private[sql] val stateManager = StreamingAggregationStateManager.createStateManager(
+    keyExpressions, child.output, stateFormatVersion)
+
   override protected def doExecute(): RDD[InternalRow] = {
     metrics // force lazy init at driver
     assert(outputMode.nonEmpty,
       "Incorrect planning in IncrementalExecution, outputMode has not been set")
 
-    val stateManager = StreamingAggregationStateManager.newImpl(keyExpressions, child.output,
-      sqlContext.conf)
-
     child.execute().mapPartitionsWithStateStore(
       getStateInfo,
       keyExpressions.toStructType,
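
A structural point worth noting: the state manager is now a constructor-time val driven by the version carried in the plan, instead of being rebuilt inside doExecute() from sqlContext.conf; the private[sql] visibility presumably also lets other sql-internal code and tests inspect which format an operator will use.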

sql/core/src/test/scala/org/apache/spark/sql/streaming/StreamingAggregationSuite.scala

Lines changed: 37 additions & 33 deletions
@@ -19,8 +19,7 @@ package org.apache.spark.sql.streaming
 
 import java.util.{Locale, TimeZone}
 
-import org.scalatest.Assertions
-import org.scalatest.BeforeAndAfterAll
+import org.scalatest.{Assertions, BeforeAndAfterAll}
 
 import org.apache.spark.{SparkEnv, SparkException}
 import org.apache.spark.rdd.BlockRDD
 
@@ -54,30 +53,35 @@ class StreamingAggregationSuite extends StateStoreMetricsTest
 
   import testImplicits._
 
-  val confAndTestNamePostfixMatrix = List(
-    (Seq(SQLConf.ADVANCED_REMOVE_REDUNDANT_IN_STATEFUL_AGGREGATION.key -> "false"), ""),
-    (Seq(SQLConf.ADVANCED_REMOVE_REDUNDANT_IN_STATEFUL_AGGREGATION.key -> "true"),
-      " : enable remove redundant in stateful aggregation")
-  )
+  def executeFuncWithStateVersionSQLConf(
+      stateVersion: Int,
+      confPairs: Seq[(String, String)],
+      func: => Any): Unit = {
+    withSQLConf(confPairs ++
+      Seq(SQLConf.STREAMING_AGGREGATION_STATE_FORMAT_VERSION.key -> stateVersion.toString): _*) {
+      func
+    }
+  }
 
-  def testWithAggrOptions(testName: String, pairs: (String, String)*)(testFun: => Any): Unit = {
-    confAndTestNamePostfixMatrix.foreach {
-      case (conf, testNamePostfix) => withSQLConf(pairs ++ conf: _*) {
-        test(testName + testNamePostfix)(testFun)
+  def testWithAllStateVersions(name: String, confPairs: (String, String)*)
+      (func: => Any): Unit = {
+    for (version <- StatefulOperatorsHelper.supportedVersions) {
+      test(s"$name - state format version $version") {
+        executeFuncWithStateVersionSQLConf(version, confPairs, func)
       }
     }
   }
 
-  def testQuietlyWithAggrOptions(testName: String, pairs: (String, String)*)
-      (testFun: => Any): Unit = {
-    confAndTestNamePostfixMatrix.foreach {
-      case (conf, testNamePostfix) => withSQLConf(pairs ++ conf: _*) {
-        testQuietly(testName + testNamePostfix)(testFun)
+  def testQuietlyWithAllStateVersions(name: String, confPairs: (String, String)*)
      (func: => Any): Unit = {
+    for (version <- StatefulOperatorsHelper.supportedVersions) {
+      testQuietly(s"$name - state format version $version") {
+        executeFuncWithStateVersionSQLConf(version, confPairs, func)
       }
     }
   }
 
-  testWithAggrOptions("simple count, update mode") {
+  testWithAllStateVersions("simple count, update mode") {
     val inputData = MemoryStream[Int]
 
     val aggregated =
 
@@ -101,7 +105,7 @@ class StreamingAggregationSuite extends StateStoreMetricsTest
     )
   }
 
-  testWithAggrOptions("count distinct") {
+  testWithAllStateVersions("count distinct") {
     val inputData = MemoryStream[(Int, Seq[Int])]
 
     val aggregated =
 
@@ -117,7 +121,7 @@ class StreamingAggregationSuite extends StateStoreMetricsTest
     )
   }
 
-  testWithAggrOptions("simple count, complete mode") {
+  testWithAllStateVersions("simple count, complete mode") {
     val inputData = MemoryStream[Int]
 
     val aggregated =
 
@@ -140,7 +144,7 @@ class StreamingAggregationSuite extends StateStoreMetricsTest
     )
   }
 
-  testWithAggrOptions("simple count, append mode") {
+  testWithAllStateVersions("simple count, append mode") {
     val inputData = MemoryStream[Int]
 
     val aggregated =
 
@@ -157,7 +161,7 @@ class StreamingAggregationSuite extends StateStoreMetricsTest
     }
   }
 
-  testWithAggrOptions("sort after aggregate in complete mode") {
+  testWithAllStateVersions("sort after aggregate in complete mode") {
     val inputData = MemoryStream[Int]
 
     val aggregated =
 
@@ -182,7 +186,7 @@ class StreamingAggregationSuite extends StateStoreMetricsTest
     )
   }
 
-  testWithAggrOptions("state metrics") {
+  testWithAllStateVersions("state metrics") {
     val inputData = MemoryStream[Int]
 
     val aggregated =
 
@@ -235,7 +239,7 @@ class StreamingAggregationSuite extends StateStoreMetricsTest
     )
   }
 
-  testWithAggrOptions("multiple keys") {
+  testWithAllStateVersions("multiple keys") {
     val inputData = MemoryStream[Int]
 
     val aggregated =
 
@@ -252,7 +256,7 @@ class StreamingAggregationSuite extends StateStoreMetricsTest
     )
   }
 
-  testQuietlyWithAggrOptions("midbatch failure") {
+  testQuietlyWithAllStateVersions("midbatch failure") {
     val inputData = MemoryStream[Int]
     FailureSingleton.firstTime = true
     val aggregated =
 
@@ -278,7 +282,7 @@ class StreamingAggregationSuite extends StateStoreMetricsTest
     )
   }
 
-  testWithAggrOptions("typed aggregators") {
+  testWithAllStateVersions("typed aggregators") {
     val inputData = MemoryStream[(String, Int)]
     val aggregated = inputData.toDS().groupByKey(_._1).agg(typed.sumLong(_._2))
 
@@ -288,7 +292,7 @@ class StreamingAggregationSuite extends StateStoreMetricsTest
     )
   }
 
-  testWithAggrOptions("prune results by current_time, complete mode") {
+  testWithAllStateVersions("prune results by current_time, complete mode") {
     import testImplicits._
     val clock = new StreamManualClock
     val inputData = MemoryStream[Long]
 
@@ -340,7 +344,7 @@ class StreamingAggregationSuite extends StateStoreMetricsTest
     )
   }
 
-  testWithAggrOptions("prune results by current_date, complete mode") {
+  testWithAllStateVersions("prune results by current_date, complete mode") {
     import testImplicits._
     val clock = new StreamManualClock
     val tz = TimeZone.getDefault.getID
 
@@ -389,7 +393,7 @@ class StreamingAggregationSuite extends StateStoreMetricsTest
     )
   }
 
-  testWithAggrOptions("SPARK-19690: do not convert batch aggregation in streaming query " +
+  testWithAllStateVersions("SPARK-19690: do not convert batch aggregation in streaming query " +
     "to streaming") {
     val streamInput = MemoryStream[Int]
     val batchDF = Seq(1, 2, 3, 4, 5)
 
@@ -454,7 +458,7 @@ class StreamingAggregationSuite extends StateStoreMetricsTest
     true
   }
 
-  testWithAggrOptions("SPARK-21977: coalesce(1) with 0 partition RDD should be " +
+  testWithAllStateVersions("SPARK-21977: coalesce(1) with 0 partition RDD should be " +
     "repartitioned to 1") {
     val inputSource = new BlockRDDBackedSource(spark)
     MockSourceProvider.withMockSources(inputSource) {
 
@@ -493,8 +497,8 @@ class StreamingAggregationSuite extends StateStoreMetricsTest
     }
   }
 
-  testWithAggrOptions("SPARK-21977: coalesce(1) with aggregation should still be repartitioned " +
-    "when it has non-empty grouping keys") {
+  testWithAllStateVersions("SPARK-21977: coalesce(1) with aggregation should still be " +
+    "repartitioned when it has non-empty grouping keys") {
     val inputSource = new BlockRDDBackedSource(spark)
     MockSourceProvider.withMockSources(inputSource) {
       withTempDir { tempDir =>
 
@@ -546,7 +550,7 @@ class StreamingAggregationSuite extends StateStoreMetricsTest
     }
   }
 
-  testWithAggrOptions("SPARK-22230: last should change with new batches") {
+  testWithAllStateVersions("SPARK-22230: last should change with new batches") {
    val input = MemoryStream[Int]
 
     val aggregated = input.toDF().agg(last('value))
 
@@ -562,7 +566,7 @@ class StreamingAggregationSuite extends StateStoreMetricsTest
     )
   }
 
-  testWithAggrOptions("SPARK-23004: Ensure that TypedImperativeAggregate functions " +
+  testWithAllStateVersions("SPARK-23004: Ensure that TypedImperativeAggregate functions " +
     "do not throw errors", SQLConf.SHUFFLE_PARTITIONS.key -> "1") {
     // See the JIRA SPARK-23004 for more details. In short, this test reproduces the error
     // by ensuring the following.
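
The net effect of the new helpers is that every aggregation test now runs once per supported state format instead of opting into a conf matrix. Conceptually, a single declaration expands into two named tests (a sketch using the suite's own helper):

    // One declaration...
    testWithAllStateVersions("simple count, update mode") { /* test body */ }
    // ...registers "simple count, update mode - state format version 1" and
    // "simple count, update mode - state format version 2", each executed with
    // spark.sql.streaming.streamingAggregation.stateFormatVersion set to match.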
