address

brkyvz · brkyvz · commit be3912552d20 · 2017-09-17T18:32:40.000-07:00
diff --git a/sql/core/src/test/scala/org/apache/spark/sql/execution/SparkPlanTest.scala b/sql/core/src/test/scala/org/apache/spark/sql/execution/SparkPlanTest.scala
@@ -231,10 +231,6 @@ object SparkPlanTest {
     }
   }
 
-  /**
-   *
-   */
-
   /**
    * Runs the plan
    * @param outputPlan SparkPlan to be executed
diff --git a/sql/core/src/test/scala/org/apache/spark/sql/streaming/FlatMapGroupsWithStateSuite.scala b/sql/core/src/test/scala/org/apache/spark/sql/streaming/FlatMapGroupsWithStateSuite.scala
@@ -17,25 +17,23 @@
 
 package org.apache.spark.sql.streaming
 
-import java.io.File
 import java.sql.Date
 import java.util.concurrent.ConcurrentHashMap
 
 import org.scalatest.BeforeAndAfterAll
 
 import org.apache.spark.SparkException
 import org.apache.spark.api.java.function.FlatMapGroupsWithStateFunction
-import org.apache.spark.sql.{DataFrame, Dataset, Encoder}
+import org.apache.spark.sql.Encoder
 import org.apache.spark.sql.catalyst.expressions.{GenericInternalRow, UnsafeProjection, UnsafeRow}
 import org.apache.spark.sql.catalyst.plans.logical.FlatMapGroupsWithState
 import org.apache.spark.sql.catalyst.plans.physical.UnknownPartitioning
 import org.apache.spark.sql.catalyst.streaming.InternalOutputModes._
-import org.apache.spark.sql.execution.{RDDScanExec, WholeStageCodegenExec}
-import org.apache.spark.sql.execution.exchange.ShuffleExchange
-import org.apache.spark.sql.execution.streaming.{FlatMapGroupsWithStateExec, GroupStateImpl, MemoryStream, StreamingQueryWrapper}
+import org.apache.spark.sql.execution.RDDScanExec
+import org.apache.spark.sql.execution.streaming.{FlatMapGroupsWithStateExec, GroupStateImpl, MemoryStream}
 import org.apache.spark.sql.execution.streaming.state.{StateStore, StateStoreId, StateStoreMetrics, UnsafeRowPair}
 import org.apache.spark.sql.streaming.FlatMapGroupsWithStateSuite.MemoryStateStore
-import org.apache.spark.sql.streaming.util.{MockSourceProvider, StreamManualClock}
+import org.apache.spark.sql.streaming.util.StreamManualClock
 import org.apache.spark.sql.types.{DataType, IntegerType}
 
 /** Class to check custom state types */
diff --git a/sql/core/src/test/scala/org/apache/spark/sql/streaming/StreamTest.scala b/sql/core/src/test/scala/org/apache/spark/sql/streaming/StreamTest.scala
@@ -351,6 +351,8 @@ trait StreamTest extends QueryTest with SharedSQLContext with TimeLimits with Be
     }
 
     var manualClockExpectedTime = -1L
+    val defaultCheckpointLocation =
+      Utils.createTempDir(namePrefix = "streaming.metadata").getCanonicalPath
     try {
       startedTest.foreach { action =>
         logInfo(s"Processing test stream action: $action")
@@ -363,8 +365,7 @@ trait StreamTest extends QueryTest with SharedSQLContext with TimeLimits with Be
             if (triggerClock.isInstanceOf[StreamManualClock]) {
               manualClockExpectedTime = triggerClock.asInstanceOf[StreamManualClock].getTimeMillis()
             }
-            val metadataRoot = Option(checkpointLocation).getOrElse(
-              Utils.createTempDir(namePrefix = "streaming.metadata").getCanonicalPath)
+            val metadataRoot = Option(checkpointLocation).getOrElse(defaultCheckpointLocation)
 
             additionalConfs.foreach(pair => {
               val value =
diff --git a/sql/core/src/test/scala/org/apache/spark/sql/streaming/StreamingAggregationSuite.scala b/sql/core/src/test/scala/org/apache/spark/sql/streaming/StreamingAggregationSuite.scala
@@ -24,22 +24,20 @@ import org.scalatest.Assertions
 import org.scalatest.BeforeAndAfterAll
 
 import org.apache.spark.{SparkEnv, SparkException}
-import org.apache.spark.rdd.{BlockRDD, RDD}
+import org.apache.spark.rdd.BlockRDD
 import org.apache.spark.sql.{AnalysisException, DataFrame, Dataset, SparkSession}
 import org.apache.spark.sql.catalyst.InternalRow
-import org.apache.spark.sql.catalyst.expressions.{Attribute, AttributeReference}
 import org.apache.spark.sql.catalyst.plans.logical.Aggregate
-import org.apache.spark.sql.catalyst.plans.physical.{ClusteredDistribution, Distribution, HashPartitioning}
 import org.apache.spark.sql.catalyst.util.DateTimeUtils
-import org.apache.spark.sql.execution.{SparkPlan, SparkPlanTest, UnaryExecNode}
-import org.apache.spark.sql.execution.exchange.{Exchange, ShuffleExchange}
+import org.apache.spark.sql.execution.{SparkPlan, UnaryExecNode}
+import org.apache.spark.sql.execution.exchange.Exchange
 import org.apache.spark.sql.execution.streaming._
 import org.apache.spark.sql.execution.streaming.state.StateStore
 import org.apache.spark.sql.expressions.scalalang.typed
 import org.apache.spark.sql.functions._
 import org.apache.spark.sql.streaming.OutputMode._
 import org.apache.spark.sql.streaming.util.{MockSourceProvider, StreamManualClock}
-import org.apache.spark.sql.types.{IntegerType, StructType}
+import org.apache.spark.sql.types.StructType
 import org.apache.spark.storage.{BlockId, StorageLevel, TestBlockId}
 
 object FailureSingleton {
@@ -435,64 +433,68 @@ class StreamingAggregationSuite extends StateStoreMetricsTest
   /** Add blocks of data to the `BlockRDDBackedSource`. */
   case class AddBlockData(source: BlockRDDBackedSource, data: Seq[Int]*) extends AddData {
     override def addData(query: Option[StreamExecution]): (Source, Offset) = {
-      if (data.nonEmpty) {
-        data.foreach(source.addData)
-      } else {
-        // we would like to create empty blockRDD's so add an empty block here.
-        source.addData()
-      }
-      source.releaseLock()
+      source.addBlocks(data: _*)
       (source, LongOffset(source.counter))
     }
   }
 
   test("SPARK-21977: coalesce(1) with 0 partition RDD should be repartitioned to 1") {
     val inputSource = new BlockRDDBackedSource(spark)
     MockSourceProvider.withMockSources(inputSource) {
-      withTempDir { tempDir =>
-        val aggregated: Dataset[Long] =
-          spark.readStream
-            .format((new MockSourceProvider).getClass.getCanonicalName)
-            .load()
-            .coalesce(1)
-            .groupBy()
-            .count()
-            .as[Long]
-
-        testStream(aggregated, Complete())(
-          AddBlockData(inputSource, Seq(1)),
-          CheckLastBatch(1),
-          AssertOnQuery("Verify no shuffling") { se =>
-            checkAggregationChain(se, expectShuffling = false, 1)
-          },
-          AddBlockData(inputSource), // create an empty trigger
-          CheckLastBatch(1),
-          AssertOnQuery("Verify addition of exchange operator") { se =>
-            checkAggregationChain(se, expectShuffling = true, 1)
-          },
-          AddBlockData(inputSource, Seq(2, 3)),
-          CheckLastBatch(3),
-          AddBlockData(inputSource),
-          CheckLastBatch(3),
-          StopStream
-        )
-      }
+      // `coalesce(1)` changes the partitioning of data to `SinglePartition` which by default
+      // satisfies the required distributions of all aggregations. Therefore in our SparkPlan, we
+      // don't have any shuffling. However, `coalesce(1)` only guarantees that the RDD has at most 1
+      // partition, which means that if we have an input RDD with 0 partitions, nothing gets
+      // executed. Therefore the StateStores don't save any delta files for a given trigger. This
+      // then leads to `FileNotFoundException`s in the subsequent batch.
+      // This isn't the only problem though. Once we introduce a shuffle before
+      // `StateStoreRestoreExec`, the input to the operator is an empty iterator. When performing
+      // `groupBy().agg(...)`, `HashAggregateExec` returns a `0` value for all aggregations. If
+      // we fail to restore the previous state in `StateStoreRestoreExec`, we save the 0 value in
+      // `StateStoreSaveExec` losing all previous state.
+      val aggregated: Dataset[Long] =
+        spark.readStream.format((new MockSourceProvider).getClass.getCanonicalName)
+        .load().coalesce(1).groupBy().count().as[Long]
+
+      testStream(aggregated, Complete())(
+        AddBlockData(inputSource, Seq(1)),
+        CheckLastBatch(1),
+        AssertOnQuery("Verify no shuffling") { se =>
+          checkAggregationChain(se, expectShuffling = false, 1)
+        },
+        AddBlockData(inputSource), // create an empty trigger
+        CheckLastBatch(1),
+        AssertOnQuery("Verify addition of exchange operator") { se =>
+          checkAggregationChain(se, expectShuffling = true, 1)
+        },
+        AddBlockData(inputSource, Seq(2, 3)),
+        CheckLastBatch(3),
+        AddBlockData(inputSource),
+        CheckLastBatch(3),
+        StopStream
+      )
     }
   }
 
-  test("SPARK-21977: coalesce(1) should still be repartitioned when it has keyExpressions") {
+  test("SPARK-21977: coalesce(1) with aggregation should still be repartitioned when it " +
+    "has non-empty grouping keys") {
     val inputSource = new BlockRDDBackedSource(spark)
     MockSourceProvider.withMockSources(inputSource) {
       withTempDir { tempDir =>
 
+        // `coalesce(1)` changes the partitioning of data to `SinglePartition` which by default
+        // satisfies the required distributions of all aggregations. However, when we have
+        // non-empty grouping keys, in streaming, we must repartition to
+        // `spark.sql.shuffle.partitions`, otherwise only a single StateStore is used to process
+        // all keys. This may be fine; however, if the user removes the `coalesce(1)` or changes
+        // it to a `coalesce(2)`, for example, then the default behavior is to shuffle to
+        // `spark.sql.shuffle.partitions` many StateStores. When this happens, all StateStores
+        // except 1 will be missing their previous delta files, which causes the stream to fail
+        // with FileNotFoundException.
         def createDf(partitions: Int): Dataset[(Long, Long)] = {
           spark.readStream
             .format((new MockSourceProvider).getClass.getCanonicalName)
-            .load()
-            .coalesce(partitions)
-            .groupBy('a % 1) // just to give it a fake key
-            .count()
-            .as[(Long, Long)]
+            .load().coalesce(partitions).groupBy('a % 1).count().as[(Long, Long)]
         }
 
         testStream(createDf(1), Complete())(
@@ -536,29 +538,18 @@ class BlockRDDBackedSource(spark: SparkSession) extends Source {
   private val blockMgr = SparkEnv.get.blockManager
   private var blocks: Seq[BlockId] = Seq.empty
 
-  private var streamLock: CountDownLatch = new CountDownLatch(1)
-
-  def addData(data: Int*): Unit = {
-    if (streamLock.getCount == 0) {
-      streamLock = new CountDownLatch(1)
-    }
-    synchronized {
-      if (data.nonEmpty) {
-        val id = TestBlockId(counter.toString)
-        blockMgr.putIterator(id, data.iterator, StorageLevel.MEMORY_ONLY)
-        blocks ++= id :: Nil
-      }
+  def addBlocks(dataBlocks: Seq[Int]*): Unit = synchronized {
+    dataBlocks.foreach { data =>
+      val id = TestBlockId(counter.toString)
+      blockMgr.putIterator(id, data.iterator, StorageLevel.MEMORY_ONLY)
+      blocks ++= id :: Nil
       counter += 1
     }
+    counter += 1
   }
 
-  def releaseLock(): Unit = streamLock.countDown()
-
-  override def getOffset: Option[Offset] = {
-    streamLock.await()
-    synchronized {
-      if (counter == 0) None else Some(LongOffset(counter))
-    }
+  override def getOffset: Option[Offset] = synchronized {
+    if (counter == 0) None else Some(LongOffset(counter))
   }
 
   override def getBatch(start: Option[Offset], end: Offset): DataFrame = synchronized {

Original file line number	Diff line number	Diff line change
`@@ -231,10 +231,6 @@ object SparkPlanTest {`
`231`	`231`	`}`
`232`	`232`	`}`
`233`	`233`
`234`		`- /**`
`235`		`- *`
`236`		`- */`
`237`		`-`
`238`	`234`	`/**`
`239`	`235`	`* Runs the plan`
`240`	`236`	`* @param outputPlan SparkPlan to be executed`