From a33bf483760f6721dfd80ea96a1ad89a89d6c2f1 Mon Sep 17 00:00:00 2001 From: Tathagata Das Date: Fri, 3 Oct 2014 17:22:55 -0700 Subject: [PATCH 01/10] Initial version of ReceivedDataManager --- .../receiver/ReceiverSupervisorImpl.scala | 46 ++++---- .../streaming/scheduler/ReceiverTracker.scala | 73 +++++++++--- .../storage/ReceivedDataManager.scala | 91 +++++++++++++++ .../storage/WriteAheadLogManager.scala | 108 ++++++++++++++++++ 4 files changed, 281 insertions(+), 37 deletions(-) create mode 100644 streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedDataManager.scala create mode 100644 streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogManager.scala diff --git a/streaming/src/main/scala/org/apache/spark/streaming/receiver/ReceiverSupervisorImpl.scala b/streaming/src/main/scala/org/apache/spark/streaming/receiver/ReceiverSupervisorImpl.scala index 53a3e6200e340..ef2a22a363374 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/receiver/ReceiverSupervisorImpl.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/receiver/ReceiverSupervisorImpl.scala @@ -35,6 +35,7 @@ import org.apache.spark.storage.StreamBlockId import org.apache.spark.streaming.scheduler.DeregisterReceiver import org.apache.spark.streaming.scheduler.AddBlock import org.apache.spark.streaming.scheduler.RegisterReceiver +import org.apache.spark.streaming.storage._ /** * Concrete implementation of [[org.apache.spark.streaming.receiver.ReceiverSupervisor]] @@ -47,9 +48,8 @@ private[streaming] class ReceiverSupervisorImpl( env: SparkEnv ) extends ReceiverSupervisor(receiver, env.conf) with Logging { - private val blockManager = env.blockManager - - private val storageLevel = receiver.storageLevel + private val receivedBlockHandler = + new BlockManagerBasedBlockHandler(env.blockManager, receiver.streamId, receiver.storageLevel) /** Remote Akka actor for the ReceiverTracker */ private val trackerActor = { @@ -108,11 +108,7 @@ private[streaming] class ReceiverSupervisorImpl( optionalMetadata: Option[Any], optionalBlockId: Option[StreamBlockId] ) { - val blockId = optionalBlockId.getOrElse(nextBlockId) - val time = System.currentTimeMillis - blockManager.putArray(blockId, arrayBuffer.toArray[Any], storageLevel, tellMaster = true) - logDebug("Pushed block " + blockId + " in " + (System.currentTimeMillis - time) + " ms") - reportPushedBlock(blockId, arrayBuffer.size, optionalMetadata) + pushAndReportBlock(ArrayBufferBlock(arrayBuffer), optionalMetadata, optionalBlockId) } /** Store a iterator of received data as a data block into Spark's memory. */ @@ -121,11 +117,7 @@ private[streaming] class ReceiverSupervisorImpl( optionalMetadata: Option[Any], optionalBlockId: Option[StreamBlockId] ) { - val blockId = optionalBlockId.getOrElse(nextBlockId) - val time = System.currentTimeMillis - blockManager.putIterator(blockId, iterator, storageLevel, tellMaster = true) - logDebug("Pushed block " + blockId + " in " + (System.currentTimeMillis - time) + " ms") - reportPushedBlock(blockId, -1, optionalMetadata) + pushAndReportBlock(IteratorBlock(iterator), optionalMetadata, optionalBlockId) } /** Store the bytes of received data as a data block into Spark's memory. 
*/ @@ -134,16 +126,30 @@ private[streaming] class ReceiverSupervisorImpl( optionalMetadata: Option[Any], optionalBlockId: Option[StreamBlockId] ) { + pushAndReportBlock(ByteBufferBlock(bytes), optionalMetadata, optionalBlockId) + } + + /** Store block and report it to driver */ + def pushAndReportBlock( + receivedBlock: ReceivedBlock, + optionalMetadata: Option[Any], + optionalBlockId: Option[StreamBlockId] + ) { val blockId = optionalBlockId.getOrElse(nextBlockId) + val numRecords = receivedBlock match { + case ArrayBufferBlock(arrayBuffer) => arrayBuffer.size + case _ => -1 + } + val time = System.currentTimeMillis - blockManager.putBytes(blockId, bytes, storageLevel, tellMaster = true) - logDebug("Pushed block " + blockId + " in " + (System.currentTimeMillis - time) + " ms") - reportPushedBlock(blockId, -1, optionalMetadata) - } + val fileSegmentOption = receivedBlockHandler.store(blockId, receivedBlock) match { + case f: FileSegment => Some(f) + case _ => None + } + logDebug("Pushed block " + blockId + " in " + (System.currentTimeMillis - time) + " ms") - /** Report pushed block */ - def reportPushedBlock(blockId: StreamBlockId, numRecords: Long, optionalMetadata: Option[Any]) { - val blockInfo = ReceivedBlockInfo(streamId, blockId, numRecords, optionalMetadata.orNull) + val blockInfo = ReceivedBlockInfo(streamId, + blockId, numRecords, optionalMetadata.orNull, fileSegmentOption) trackerActor ! AddBlock(blockInfo) logDebug("Reported block " + blockId) } diff --git a/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceiverTracker.scala b/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceiverTracker.scala index 5307fe189d717..9f88d21a56da3 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceiverTracker.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceiverTracker.scala @@ -21,19 +21,24 @@ import scala.collection.mutable.{HashMap, SynchronizedMap, SynchronizedQueue} import scala.language.existentials import akka.actor._ -import org.apache.spark.{Logging, SparkEnv, SparkException} +import org.apache.hadoop.conf.Configuration +import org.apache.spark.{SparkConf, Logging, SparkEnv, SparkException} import org.apache.spark.SparkContext._ import org.apache.spark.storage.StreamBlockId import org.apache.spark.streaming.{StreamingContext, Time} import org.apache.spark.streaming.receiver.{Receiver, ReceiverSupervisorImpl, StopReceiver} -import org.apache.spark.util.AkkaUtils +import org.apache.spark.streaming.storage.{WriteAheadLogManager, FileSegment} +import org.apache.spark.util.Utils +import org.apache.hadoop.fs.Path +import java.nio.ByteBuffer /** Information about blocks received by the receiver */ private[streaming] case class ReceivedBlockInfo( streamId: Int, blockId: StreamBlockId, numRecords: Long, - metadata: Any + metadata: Any, + fileSegmentOption: Option[FileSegment] ) /** @@ -53,6 +58,28 @@ private[streaming] case class ReportError(streamId: Int, message: String, error: private[streaming] case class DeregisterReceiver(streamId: Int, msg: String, error: String) extends ReceiverTrackerMessage + +class ReceivedBlockInfoCheckpointer( + logDirectory: String, conf: SparkConf, hadoopConf: Configuration) { + + private val logManager = new WriteAheadLogManager(logDirectory, conf, hadoopConf) + + def read(): Iterator[ReceivedBlockInfo] = { + logManager.readFromLog().map { byteBuffer => + Utils.deserialize[ReceivedBlockInfo](byteBuffer.array) + } + } + + def write(receivedBlockInfo: ReceivedBlockInfo) { + val 
bytes = Utils.serialize(receivedBlockInfo) + logManager.writeToLog(ByteBuffer.wrap(bytes)) + } + + def clear(threshTime: Long) { + logManager.clear(threshTime) + } +} + /** * This class manages the execution of the receivers of NetworkInputDStreams. Instance of * this class must be created after all input streams have been added and StreamingContext.start() @@ -61,20 +88,32 @@ private[streaming] case class DeregisterReceiver(streamId: Int, msg: String, err private[streaming] class ReceiverTracker(ssc: StreamingContext) extends Logging { - val receiverInputStreams = ssc.graph.getReceiverInputStreams() - val receiverInputStreamMap = Map(receiverInputStreams.map(x => (x.id, x)): _*) - val receiverExecutor = new ReceiverLauncher() - val receiverInfo = new HashMap[Int, ReceiverInfo] with SynchronizedMap[Int, ReceiverInfo] - val receivedBlockInfo = new HashMap[Int, SynchronizedQueue[ReceivedBlockInfo]] + private val receiverInputStreams = ssc.graph.getReceiverInputStreams() + private val receiverInputStreamMap = Map(receiverInputStreams.map(x => (x.id, x)): _*) + private val receiverExecutor = new ReceiverLauncher() + private val receiverInfo = new HashMap[Int, ReceiverInfo] with SynchronizedMap[Int, ReceiverInfo] + private val receivedBlockInfo = new HashMap[Int, SynchronizedQueue[ReceivedBlockInfo]] with SynchronizedMap[Int, SynchronizedQueue[ReceivedBlockInfo]] - val timeout = AkkaUtils.askTimeout(ssc.conf) - val listenerBus = ssc.scheduler.listenerBus + private val listenerBus = ssc.scheduler.listenerBus + private val receivedBlockCheckpointerOption = Option(ssc.checkpointDir) map { _ => + new ReceivedBlockInfoCheckpointer( + new Path(ssc.checkpointDir, "receivedBlockMetadata").toString, + ssc.sparkContext.conf, + ssc.sparkContext.hadoopConfiguration + ) + } // actor is created when generator starts. // This not being null means the tracker has been started and not stopped var actor: ActorRef = null var currentTime: Time = null + receivedBlockCheckpointerOption.foreach { checkpointer => + checkpointer.read().foreach { info => + getReceivedBlockInfoQueue(info.streamId) += info + } + } + /** Start the actor and receiver execution thread. 
*/ def start() = synchronized { if (actor != null) { @@ -126,7 +165,7 @@ class ReceiverTracker(ssc: StreamingContext) extends Logging { } receiverInfo(streamId) = ReceiverInfo( streamId, s"${typ}-${streamId}", receiverActor, true, host) - ssc.scheduler.listenerBus.post(StreamingListenerReceiverStarted(receiverInfo(streamId))) + listenerBus.post(StreamingListenerReceiverStarted(receiverInfo(streamId))) logInfo("Registered receiver for stream " + streamId + " from " + sender.path.address) } @@ -140,7 +179,7 @@ class ReceiverTracker(ssc: StreamingContext) extends Logging { ReceiverInfo(streamId, "", null, false, "", lastErrorMessage = message, lastError = error) } receiverInfo(streamId) = newReceiverInfo - ssc.scheduler.listenerBus.post(StreamingListenerReceiverStopped(receiverInfo(streamId))) + listenerBus.post(StreamingListenerReceiverStopped(receiverInfo(streamId))) val messageWithError = if (error != null && !error.isEmpty) { s"$message - $error" } else { @@ -150,10 +189,10 @@ class ReceiverTracker(ssc: StreamingContext) extends Logging { } /** Add new blocks for the given stream */ - def addBlocks(receivedBlockInfo: ReceivedBlockInfo) { + def addBlock(receivedBlockInfo: ReceivedBlockInfo) { + receivedBlockCheckpointerOption.foreach { _.write(receivedBlockInfo) } getReceivedBlockInfoQueue(receivedBlockInfo.streamId) += receivedBlockInfo - logDebug("Stream " + receivedBlockInfo.streamId + " received new blocks: " + - receivedBlockInfo.blockId) + logDebug(s"Stream ${receivedBlockInfo.streamId} received block ${receivedBlockInfo.blockId}") } /** Report error sent by a receiver */ @@ -166,7 +205,7 @@ class ReceiverTracker(ssc: StreamingContext) extends Logging { ReceiverInfo(streamId, "", null, false, "", lastErrorMessage = message, lastError = error) } receiverInfo(streamId) = newReceiverInfo - ssc.scheduler.listenerBus.post(StreamingListenerReceiverError(receiverInfo(streamId))) + listenerBus.post(StreamingListenerReceiverError(receiverInfo(streamId))) val messageWithError = if (error != null && !error.isEmpty) { s"$message - $error" } else { @@ -187,7 +226,7 @@ class ReceiverTracker(ssc: StreamingContext) extends Logging { registerReceiver(streamId, typ, host, receiverActor, sender) sender ! 
true case AddBlock(receivedBlockInfo) => - addBlocks(receivedBlockInfo) + addBlock(receivedBlockInfo) case ReportError(streamId, message, error) => reportError(streamId, message, error) case DeregisterReceiver(streamId, message, error) => diff --git a/streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedDataManager.scala b/streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedDataManager.scala new file mode 100644 index 0000000000000..dd3818df2ae67 --- /dev/null +++ b/streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedDataManager.scala @@ -0,0 +1,91 @@ +package org.apache.spark.streaming.storage + +import scala.language.postfixOps + +import java.nio.ByteBuffer +import java.util.concurrent.Executors + +import scala.collection.mutable.ArrayBuffer +import scala.concurrent.{Await, ExecutionContext, Future} +import scala.concurrent.duration._ + +import org.apache.hadoop.conf.Configuration +import org.apache.hadoop.fs.Path +import org.apache.spark.{Logging, SparkConf} +import org.apache.spark.storage.{BlockManager, StorageLevel, StreamBlockId} + +private[streaming] sealed trait ReceivedBlock +private[streaming] case class ArrayBufferBlock(arrayBuffer: ArrayBuffer[_]) extends ReceivedBlock +private[streaming] case class IteratorBlock(iterator: Iterator[_]) extends ReceivedBlock +private[streaming] case class ByteBufferBlock(byteBuffer: ByteBuffer) extends ReceivedBlock + +private[streaming] trait ReceivedBlockHandler { + def store(blockId: StreamBlockId, receivedBlock: ReceivedBlock): Option[AnyRef] + def clear(threshTime: Long) { } +} + +private[streaming] class BlockManagerBasedBlockHandler( + blockManager: BlockManager, + streamId: Int, + storageLevel: StorageLevel + ) extends ReceivedBlockHandler { + + def store(blockId: StreamBlockId, receivedBlock: ReceivedBlock): Option[AnyRef] = { + receivedBlock match { + case ArrayBufferBlock(arrayBuffer) => + blockManager.putIterator(blockId, arrayBuffer.iterator, storageLevel, tellMaster = true) + case IteratorBlock(iterator) => + blockManager.putIterator(blockId, iterator, storageLevel, tellMaster = true) + case ByteBufferBlock(byteBuffer) => + blockManager.putBytes(blockId, byteBuffer, storageLevel, tellMaster = true) + case _ => + throw new Exception(s"Could not push $blockId to block manager, unexpected block type") + } + None + } +} + +private[streaming] class WriteAheadLogBasedBlockHandler( + blockManager: BlockManager, + streamId: Int, + storageLevel: StorageLevel, + conf: SparkConf, + hadoopConf: Configuration, + checkpointDir: String + ) extends ReceivedBlockHandler with Logging { + + private val logManager = new WriteAheadLogManager( + new Path(checkpointDir, new Path("receivedData", streamId.toString)).toString, + conf, hadoopConf + ) + + private val blockStoreTimeout = + conf.getInt("spark.streaming.receiver.blockStoreTimeout", 30) seconds + + implicit private val executionContext = + ExecutionContext.fromExecutorService(Executors.newFixedThreadPool(2)) + + def store(blockId: StreamBlockId, receivedBlock: ReceivedBlock): Option[AnyRef] = { + val serializedBlock = receivedBlock match { + case ArrayBufferBlock(arrayBuffer) => + blockManager.dataSerialize(blockId, arrayBuffer.iterator) + case IteratorBlock(iterator) => + blockManager.dataSerialize(blockId, iterator) + case ByteBufferBlock(byteBuffer) => + byteBuffer + case _ => + throw new Exception(s"Could not push $blockId to block manager, unexpected block type") + } + + val pushToBlockManagerFuture = Future { + blockManager.putBytes(blockId, 
serializedBlock, storageLevel, tellMaster = true) + } + val pushToLogFuture = Future { logManager.writeToLog(serializedBlock) } + val combinedFuture = for { + _ <- pushToBlockManagerFuture + fileSegment <- pushToLogFuture + } yield fileSegment + + Some(Await.result(combinedFuture, blockStoreTimeout)) + } +} diff --git a/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogManager.scala b/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogManager.scala new file mode 100644 index 0000000000000..68e148ab0802c --- /dev/null +++ b/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogManager.scala @@ -0,0 +1,108 @@ +package org.apache.spark.streaming.storage + +import java.nio.ByteBuffer +import java.util.concurrent.Executors + +import scala.collection.mutable.ArrayBuffer +import scala.concurrent.{Future, ExecutionContext} + +import org.apache.hadoop.conf.Configuration +import org.apache.hadoop.fs.Path +import org.apache.spark.{Logging, SparkConf} + +class WriteAheadLogManager(logDirectory: String, conf: SparkConf, hadoopConf: Configuration) + extends Logging { + + private case class LogInfo(startTime: Long, endTime: Long, path: String) + + private val logWriterChangeIntervalSeconds = + conf.getInt("spark.streaming.wal.interval", 60) + private val logWriterMaxFailures = + conf.getInt("spark.streaming.wal.maxRetries", 3) + private val pastLogs = new ArrayBuffer[LogInfo] + implicit private val executionContext = + ExecutionContext.fromExecutorService(Executors.newFixedThreadPool(2)) + + private var currentLogWriter: WriteAheadLogWriter = null + private var currentLogWriterStartTime: Long = -1L + + def writeToLog(byteBuffer: ByteBuffer): FileSegment = synchronized { + var failures = 0 + var lastException: Exception = null + var fileSegment: FileSegment = null + var succeeded = false + while (!succeeded && failures < logWriterMaxFailures) { + try { + fileSegment = logWriter.write(byteBuffer) + succeeded = true + } catch { + case ex: Exception => + lastException = ex + logWarning("Failed to ...") + reset() + failures += 1 + } + } + if (fileSegment == null) { + throw lastException + } + fileSegment + } + + def readFromLog(): Iterator[ByteBuffer] = { + WriteAheadLogManager.logsToIterator(pastLogs sortBy { _.startTime} map { _.path}, hadoopConf) + } + + def clear(threshTime: Long): Unit = { + // Get the log files that are older than the threshold time, while accounting for possible + // time skew between the node issues the threshTime (say, driver node), and the local time at + // the node this is being executed (say, worker node) + val maxTimeSkewMs = 60 * 1000 // 1 minute + val oldLogFiles = synchronized { pastLogs.filter { _.endTime < threshTime - maxTimeSkewMs } } + logDebug(s"Attempting to clear ${oldLogFiles.size} old log files in $logDirectory " + + s"older than $threshTime: ${oldLogFiles.map { _.path }.mkString("\n")}") + + def deleteFiles() { + oldLogFiles.foreach { logInfo => + try { + val path = new Path(logInfo.path) + val fs = hadoopConf.synchronized { path.getFileSystem(hadoopConf) } + fs.delete(path, true) + synchronized { pastLogs -= logInfo } + logDebug(s"Cleared log file $logInfo") + } catch { + case ex: Exception => logWarning("Could not delete ...") + } + } + logInfo(s"Cleared log files in $logDirectory older than $threshTime") + } + + Future { deleteFiles() } + } + + private def logWriter: WriteAheadLogWriter = synchronized { + val currentTime = System.currentTimeMillis + if (currentLogWriter == null || + currentTime - 
currentLogWriterStartTime > logWriterChangeIntervalSeconds * 1000) { + pastLogs += LogInfo(currentLogWriterStartTime, currentTime, currentLogWriter.path) + val newLogPath = new Path(logDirectory, s"data-$currentTime".toString) + currentLogWriter = new WriteAheadLogWriter(newLogPath.toString, hadoopConf) + currentLogWriterStartTime = currentTime + } + currentLogWriter + } + + private def reset(): Unit = synchronized { + currentLogWriter.close() + currentLogWriter = null + } +} + +object WriteAheadLogManager { + def logsToIterator( + chronologicallySortedLogFiles: Seq[String], + hadoopConf: Configuration + ): Iterator[ByteBuffer] = { + chronologicallySortedLogFiles map { new WriteAheadLogReader(_, hadoopConf) } flatMap { x => x } + } +} From a49fd1d7a30d9fe3e38211e8703a7ec53636d0cc Mon Sep 17 00:00:00 2001 From: Tathagata Das Date: Fri, 3 Oct 2014 19:28:06 -0700 Subject: [PATCH 02/10] Fixed compilation errors. --- .../streaming/scheduler/ReceiverTracker.scala | 4 ++-- .../storage/ReceivedDataManager.scala | 11 +++++----- .../storage/WriteAheadLogManager.scala | 22 +++++++++++-------- 3 files changed, 20 insertions(+), 17 deletions(-) diff --git a/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceiverTracker.scala b/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceiverTracker.scala index 9f88d21a56da3..081e1c4bd8141 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceiverTracker.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceiverTracker.scala @@ -58,11 +58,11 @@ private[streaming] case class ReportError(streamId: Int, message: String, error: private[streaming] case class DeregisterReceiver(streamId: Int, msg: String, error: String) extends ReceiverTrackerMessage - class ReceivedBlockInfoCheckpointer( logDirectory: String, conf: SparkConf, hadoopConf: Configuration) { - private val logManager = new WriteAheadLogManager(logDirectory, conf, hadoopConf) + private val logManager = new WriteAheadLogManager( + logDirectory, conf, hadoopConf, "ReceiverTracker.WriteAheadLogManager") def read(): Iterator[ReceivedBlockInfo] = { logManager.readFromLog().map { byteBuffer => diff --git a/streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedDataManager.scala b/streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedDataManager.scala index dd3818df2ae67..0c4db076eb357 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedDataManager.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedDataManager.scala @@ -1,18 +1,17 @@ package org.apache.spark.streaming.storage -import scala.language.postfixOps - import java.nio.ByteBuffer -import java.util.concurrent.Executors import scala.collection.mutable.ArrayBuffer import scala.concurrent.{Await, ExecutionContext, Future} import scala.concurrent.duration._ +import scala.language.postfixOps import org.apache.hadoop.conf.Configuration import org.apache.hadoop.fs.Path import org.apache.spark.{Logging, SparkConf} import org.apache.spark.storage.{BlockManager, StorageLevel, StreamBlockId} +import org.apache.spark.util.Utils private[streaming] sealed trait ReceivedBlock private[streaming] case class ArrayBufferBlock(arrayBuffer: ArrayBuffer[_]) extends ReceivedBlock @@ -56,14 +55,14 @@ private[streaming] class WriteAheadLogBasedBlockHandler( private val logManager = new WriteAheadLogManager( new Path(checkpointDir, new Path("receivedData", streamId.toString)).toString, - conf, hadoopConf + conf, 
hadoopConf, "WriteAheadLogBasedHandler.WriteAheadLogManager" ) private val blockStoreTimeout = conf.getInt("spark.streaming.receiver.blockStoreTimeout", 30) seconds - implicit private val executionContext = - ExecutionContext.fromExecutorService(Executors.newFixedThreadPool(2)) + implicit private val executionContext = ExecutionContext.fromExecutorService( + Utils.newDaemonFixedThreadPool(1, "WriteAheadLogBasedBlockHandler")) def store(blockId: StreamBlockId, receivedBlock: ReceivedBlock): Option[AnyRef] = { val serializedBlock = receivedBlock match { diff --git a/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogManager.scala b/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogManager.scala index 68e148ab0802c..8a2eda1962946 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogManager.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogManager.scala @@ -1,17 +1,17 @@ package org.apache.spark.streaming.storage import java.nio.ByteBuffer -import java.util.concurrent.Executors import scala.collection.mutable.ArrayBuffer -import scala.concurrent.{Future, ExecutionContext} +import scala.concurrent.{ExecutionContext, Future} import org.apache.hadoop.conf.Configuration import org.apache.hadoop.fs.Path import org.apache.spark.{Logging, SparkConf} +import org.apache.spark.util.Utils -class WriteAheadLogManager(logDirectory: String, conf: SparkConf, hadoopConf: Configuration) - extends Logging { +private[streaming] class WriteAheadLogManager(logDirectory: String, conf: SparkConf, + hadoopConf: Configuration, threadPoolName: String = "WriteAheadLogManager") extends Logging { private case class LogInfo(startTime: Long, endTime: Long, path: String) @@ -21,8 +21,9 @@ class WriteAheadLogManager(logDirectory: String, conf: SparkConf, hadoopConf: Co conf.getInt("spark.streaming.wal.maxRetries", 3) private val pastLogs = new ArrayBuffer[LogInfo] implicit private val executionContext = - ExecutionContext.fromExecutorService(Executors.newFixedThreadPool(2)) + ExecutionContext.fromExecutorService(Utils.newDaemonFixedThreadPool(1, threadPoolName)) + private var currentLogPath: String = null private var currentLogWriter: WriteAheadLogWriter = null private var currentLogWriterStartTime: Long = -1L @@ -84,9 +85,10 @@ class WriteAheadLogManager(logDirectory: String, conf: SparkConf, hadoopConf: Co val currentTime = System.currentTimeMillis if (currentLogWriter == null || currentTime - currentLogWriterStartTime > logWriterChangeIntervalSeconds * 1000) { - pastLogs += LogInfo(currentLogWriterStartTime, currentTime, currentLogWriter.path) + pastLogs += LogInfo(currentLogWriterStartTime, currentTime, currentLogPath) val newLogPath = new Path(logDirectory, s"data-$currentTime".toString) - currentLogWriter = new WriteAheadLogWriter(newLogPath.toString, hadoopConf) + currentLogPath = newLogPath.toString + currentLogWriter = new WriteAheadLogWriter(currentLogPath, hadoopConf) currentLogWriterStartTime = currentTime } currentLogWriter @@ -98,11 +100,13 @@ class WriteAheadLogManager(logDirectory: String, conf: SparkConf, hadoopConf: Co } } -object WriteAheadLogManager { +private[storage] object WriteAheadLogManager { def logsToIterator( chronologicallySortedLogFiles: Seq[String], hadoopConf: Configuration ): Iterator[ByteBuffer] = { - chronologicallySortedLogFiles map { new WriteAheadLogReader(_, hadoopConf) } flatMap { x => x } + chronologicallySortedLogFiles.iterator.map { file => + new WriteAheadLogReader(file, 
hadoopConf) + } flatMap { x => x } } } From 5eafb2e2853f19558624d9e0a680fa6e9c0f88ab Mon Sep 17 00:00:00 2001 From: Tathagata Das Date: Mon, 6 Oct 2014 15:21:54 -0700 Subject: [PATCH 03/10] Added checkpoint data of ReceiverInputDStream, improved WALManager, refactored WALSuite. --- .../dstream/DStreamCheckpointData.scala | 2 +- .../dstream/ReceiverInputDStream.scala | 25 +- .../receiver/ReceiverSupervisorImpl.scala | 2 +- .../streaming/scheduler/ReceiverTracker.scala | 4 +- ...nager.scala => ReceivedBlockHandler.scala} | 30 ++- .../storage/WriteAheadLogManager.scala | 124 +++++++--- .../storage/WriteAheadLogReader.scala | 30 +-- .../storage/WriteAheadLogSuite.scala | 215 ++++++++++-------- 8 files changed, 288 insertions(+), 144 deletions(-) rename streaming/src/main/scala/org/apache/spark/streaming/storage/{ReceivedDataManager.scala => ReceivedBlockHandler.scala} (75%) diff --git a/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStreamCheckpointData.scala b/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStreamCheckpointData.scala index f33c0ceafdf42..544cf57587e57 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStreamCheckpointData.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStreamCheckpointData.scala @@ -26,7 +26,7 @@ import org.apache.spark.Logging import org.apache.spark.streaming.Time private[streaming] -class DStreamCheckpointData[T: ClassTag] (dstream: DStream[T]) +class DStreamCheckpointData[T: ClassTag](dstream: DStream[T]) extends Serializable with Logging { protected val data = new HashMap[Time, AnyRef]() diff --git a/streaming/src/main/scala/org/apache/spark/streaming/dstream/ReceiverInputDStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/dstream/ReceiverInputDStream.scala index 391e40924f38a..e53af30836a0a 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/dstream/ReceiverInputDStream.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/dstream/ReceiverInputDStream.scala @@ -40,7 +40,8 @@ abstract class ReceiverInputDStream[T: ClassTag](@transient ssc_ : StreamingCont extends InputDStream[T](ssc_) { /** Keeps all received blocks information */ - private lazy val receivedBlockInfo = new HashMap[Time, Array[ReceivedBlockInfo]] + private[streaming] lazy val receivedBlockInfo = new HashMap[Time, Array[ReceivedBlockInfo]] + private[streaming] override val checkpointData = new ReceiverInputDStreamCheckpointData(this) /** This is an unique identifier for the network input stream. 
*/ val id = ssc.getNewReceiverStreamId() @@ -92,3 +93,25 @@ abstract class ReceiverInputDStream[T: ClassTag](@transient ssc_ : StreamingCont } } +private[streaming] class ReceiverInputDStreamCheckpointData[T: ClassTag]( + dstream: ReceiverInputDStream[T]) extends DStreamCheckpointData[T](dstream) { + + private var timeToReceivedBlockInfo: Seq[(Time, Array[ReceivedBlockInfo])] = _ + + override def update(time: Time) { + timeToReceivedBlockInfo = dstream.receivedBlockInfo.toSeq + } + + override def cleanup(time: Time) { + // not required, as block info copied in whole every time update is called + } + + override def restore() { + Option(timeToReceivedBlockInfo).foreach { blockInfo => + dstream.receivedBlockInfo.clear() + dstream.receivedBlockInfo ++= blockInfo + } + } +} + + diff --git a/streaming/src/main/scala/org/apache/spark/streaming/receiver/ReceiverSupervisorImpl.scala b/streaming/src/main/scala/org/apache/spark/streaming/receiver/ReceiverSupervisorImpl.scala index ef2a22a363374..017cbae5060b5 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/receiver/ReceiverSupervisorImpl.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/receiver/ReceiverSupervisorImpl.scala @@ -142,7 +142,7 @@ private[streaming] class ReceiverSupervisorImpl( } val time = System.currentTimeMillis - val fileSegmentOption = receivedBlockHandler.store(blockId, receivedBlock) match { + val fileSegmentOption = receivedBlockHandler.storeBlock(blockId, receivedBlock) match { case f: FileSegment => Some(f) case _ => None } diff --git a/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceiverTracker.scala b/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceiverTracker.scala index 081e1c4bd8141..36a55e64409b6 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceiverTracker.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceiverTracker.scala @@ -62,7 +62,7 @@ class ReceivedBlockInfoCheckpointer( logDirectory: String, conf: SparkConf, hadoopConf: Configuration) { private val logManager = new WriteAheadLogManager( - logDirectory, conf, hadoopConf, "ReceiverTracker.WriteAheadLogManager") + logDirectory, hadoopConf, threadPoolName = "ReceiverTracker.WriteAheadLogManager") def read(): Iterator[ReceivedBlockInfo] = { logManager.readFromLog().map { byteBuffer => @@ -76,7 +76,7 @@ class ReceivedBlockInfoCheckpointer( } def clear(threshTime: Long) { - logManager.clear(threshTime) + logManager.clearOldLogs(threshTime) } } diff --git a/streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedDataManager.scala b/streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedBlockHandler.scala similarity index 75% rename from streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedDataManager.scala rename to streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedBlockHandler.scala index 0c4db076eb357..052bb59c9c324 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedDataManager.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedBlockHandler.scala @@ -19,8 +19,8 @@ private[streaming] case class IteratorBlock(iterator: Iterator[_]) extends Recei private[streaming] case class ByteBufferBlock(byteBuffer: ByteBuffer) extends ReceivedBlock private[streaming] trait ReceivedBlockHandler { - def store(blockId: StreamBlockId, receivedBlock: ReceivedBlock): Option[AnyRef] - def clear(threshTime: Long) { } + def storeBlock(blockId: 
StreamBlockId, receivedBlock: ReceivedBlock): Option[AnyRef] + def clearOldBlocks(threshTime: Long) } private[streaming] class BlockManagerBasedBlockHandler( @@ -29,7 +29,7 @@ private[streaming] class BlockManagerBasedBlockHandler( storageLevel: StorageLevel ) extends ReceivedBlockHandler { - def store(blockId: StreamBlockId, receivedBlock: ReceivedBlock): Option[AnyRef] = { + def storeBlock(blockId: StreamBlockId, receivedBlock: ReceivedBlock): Option[AnyRef] = { receivedBlock match { case ArrayBufferBlock(arrayBuffer) => blockManager.putIterator(blockId, arrayBuffer.iterator, storageLevel, tellMaster = true) @@ -42,6 +42,11 @@ private[streaming] class BlockManagerBasedBlockHandler( } None } + + def clearOldBlocks(threshTime: Long) { + // this is not used as blocks inserted into the BlockManager are cleared by DStream's clearing + // of BlockRDDs. + } } private[streaming] class WriteAheadLogBasedBlockHandler( @@ -53,18 +58,23 @@ private[streaming] class WriteAheadLogBasedBlockHandler( checkpointDir: String ) extends ReceivedBlockHandler with Logging { + private val blockStoreTimeout = conf.getInt( + "spark.streaming.receiver.blockStoreTimeout", 30).seconds + private val rotationInterval = conf.getInt( + "spark.streaming.receiver.writeAheadLog.rotationInterval", 60) + private val maxFailures = conf.getInt( + "spark.streaming.receiver.writeAheadLog.maxFailures", 3) + private val logManager = new WriteAheadLogManager( new Path(checkpointDir, new Path("receivedData", streamId.toString)).toString, - conf, hadoopConf, "WriteAheadLogBasedHandler.WriteAheadLogManager" + hadoopConf, rotationInterval, maxFailures, + "WriteAheadLogBasedHandler.WriteAheadLogManager" ) - private val blockStoreTimeout = - conf.getInt("spark.streaming.receiver.blockStoreTimeout", 30) seconds - implicit private val executionContext = ExecutionContext.fromExecutorService( Utils.newDaemonFixedThreadPool(1, "WriteAheadLogBasedBlockHandler")) - def store(blockId: StreamBlockId, receivedBlock: ReceivedBlock): Option[AnyRef] = { + def storeBlock(blockId: StreamBlockId, receivedBlock: ReceivedBlock): Option[AnyRef] = { val serializedBlock = receivedBlock match { case ArrayBufferBlock(arrayBuffer) => blockManager.dataSerialize(blockId, arrayBuffer.iterator) @@ -87,4 +97,8 @@ private[streaming] class WriteAheadLogBasedBlockHandler( Some(Await.result(combinedFuture, blockStoreTimeout)) } + + def clearOldBlocks(threshTime: Long) { + logManager.clearOldLogs(threshTime) + } } diff --git a/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogManager.scala b/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogManager.scala index 8a2eda1962946..62086a3194cad 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogManager.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogManager.scala @@ -7,18 +7,20 @@ import scala.concurrent.{ExecutionContext, Future} import org.apache.hadoop.conf.Configuration import org.apache.hadoop.fs.Path -import org.apache.spark.{Logging, SparkConf} +import org.apache.spark.Logging +import org.apache.spark.streaming.storage.WriteAheadLogManager._ +import org.apache.spark.streaming.util.{Clock, ManualClock, SystemClock} import org.apache.spark.util.Utils -private[streaming] class WriteAheadLogManager(logDirectory: String, conf: SparkConf, - hadoopConf: Configuration, threadPoolName: String = "WriteAheadLogManager") extends Logging { +private[streaming] class WriteAheadLogManager( + logDirectory: String, + 
hadoopConf: Configuration, + rollingIntervalSecs: Int = 60, + maxFailures: Int = 3, + threadPoolName: String = "WriteAheadLogManager", + clock: Clock = new SystemClock + ) extends Logging { - private case class LogInfo(startTime: Long, endTime: Long, path: String) - - private val logWriterChangeIntervalSeconds = - conf.getInt("spark.streaming.wal.interval", 60) - private val logWriterMaxFailures = - conf.getInt("spark.streaming.wal.maxRetries", 3) private val pastLogs = new ArrayBuffer[LogInfo] implicit private val executionContext = ExecutionContext.fromExecutorService(Utils.newDaemonFixedThreadPool(1, threadPoolName)) @@ -26,21 +28,24 @@ private[streaming] class WriteAheadLogManager(logDirectory: String, conf: SparkC private var currentLogPath: String = null private var currentLogWriter: WriteAheadLogWriter = null private var currentLogWriterStartTime: Long = -1L + private var currentLogWriterStopTime: Long = -1L + + recoverPastLogs() def writeToLog(byteBuffer: ByteBuffer): FileSegment = synchronized { + var fileSegment: FileSegment = null var failures = 0 var lastException: Exception = null - var fileSegment: FileSegment = null var succeeded = false - while (!succeeded && failures < logWriterMaxFailures) { + while (!succeeded && failures < maxFailures) { try { - fileSegment = logWriter.write(byteBuffer) + fileSegment = getLogWriter.write(byteBuffer) succeeded = true } catch { case ex: Exception => lastException = ex logWarning("Failed to ...") - reset() + resetWriter() failures += 1 } } @@ -51,10 +56,10 @@ private[streaming] class WriteAheadLogManager(logDirectory: String, conf: SparkC } def readFromLog(): Iterator[ByteBuffer] = { - WriteAheadLogManager.logsToIterator(pastLogs sortBy { _.startTime} map { _.path}, hadoopConf) + logsToIterator(pastLogs.map{ _.path}, hadoopConf) } - def clear(threshTime: Long): Unit = { + def clearOldLogs(threshTime: Long): Unit = { // Get the log files that are older than the threshold time, while accounting for possible // time skew between the node issues the threshTime (say, driver node), and the local time at // the node this is being executed (say, worker node) @@ -72,7 +77,8 @@ private[streaming] class WriteAheadLogManager(logDirectory: String, conf: SparkC synchronized { pastLogs -= logInfo } logDebug(s"Cleared log file $logInfo") } catch { - case ex: Exception => logWarning("Could not delete ...") + case ex: Exception => + logWarning(s"Error clearing log file $logInfo", ex) } } logInfo(s"Cleared log files in $logDirectory older than $threshTime") @@ -81,31 +87,97 @@ private[streaming] class WriteAheadLogManager(logDirectory: String, conf: SparkC Future { deleteFiles() } } - private def logWriter: WriteAheadLogWriter = synchronized { - val currentTime = System.currentTimeMillis - if (currentLogWriter == null || - currentTime - currentLogWriterStartTime > logWriterChangeIntervalSeconds * 1000) { - pastLogs += LogInfo(currentLogWriterStartTime, currentTime, currentLogPath) - val newLogPath = new Path(logDirectory, s"data-$currentTime".toString) + private def getLogWriter: WriteAheadLogWriter = synchronized { + val currentTime = clock.currentTime() + if (currentLogPath == null || currentTime > currentLogWriterStopTime) { + resetWriter() + if (currentLogPath != null) { + pastLogs += LogInfo(currentLogWriterStartTime, currentLogWriterStopTime, currentLogPath) + } + currentLogWriterStartTime = currentTime + currentLogWriterStopTime = currentTime + (rollingIntervalSecs * 1000) + val newLogPath = new Path(logDirectory, + 
timeToLogFile(currentLogWriterStartTime, currentLogWriterStopTime)) currentLogPath = newLogPath.toString currentLogWriter = new WriteAheadLogWriter(currentLogPath, hadoopConf) - currentLogWriterStartTime = currentTime } currentLogWriter } - private def reset(): Unit = synchronized { - currentLogWriter.close() - currentLogWriter = null + private def recoverPastLogs(): Unit = synchronized { + val logDirectoryPath = new Path(logDirectory) + val fs = logDirectoryPath.getFileSystem(hadoopConf) + if (fs.exists(logDirectoryPath) && fs.getFileStatus(logDirectoryPath).isDir) { + val logFiles = fs.listStatus(logDirectoryPath).map { _.getPath } + pastLogs.clear() + pastLogs ++= logFilesTologInfo(logFiles) + logInfo(s"Recovered ${logFiles.size} log files from $logDirectory") + logDebug(s"Recoved files are:\n${logFiles.mkString("\n")}") + } + } + + private def resetWriter(): Unit = synchronized { + if (currentLogWriter != null) { + currentLogWriter.close() + currentLogWriter = null + } } + +/* + private def tryMultipleTimes[T](message: String)(body: => T): T = { + var result: T = null.asInstanceOf[T] + var failures = 0 + var lastException: Exception = null + var succeeded = false + while (!succeeded && failures < maxFailures) { + try { + result = body + succeeded = true + } catch { + case ex: Exception => + lastException = ex + resetWriter() + failures += 1 + logWarning(message, ex) + } + } + if (!succeeded) { + throw new Exception(s"Failed $message after $failures failures", lastException) + } + result + } */ } private[storage] object WriteAheadLogManager { + + case class LogInfo(startTime: Long, endTime: Long, path: String) + + val logFileRegex = """log-(\d+)-(\d+)""".r + + def timeToLogFile(startTime: Long, stopTime: Long): String = { + s"log-$startTime-$stopTime" + } + + def logFilesTologInfo(files: Seq[Path]): Seq[LogInfo] = { + println("Creating log info with " + files.mkString("[","],[","]")) + files.flatMap { file => + logFileRegex.findFirstIn(file.getName()) match { + case logFileRegex(startTimeStr, stopTimeStr) => + val startTime = startTimeStr.toLong + val stopTime = stopTimeStr.toLong + Some(LogInfo(startTime, stopTime, file.toString)) + case _ => None + } + }.sortBy { _.startTime } + } + def logsToIterator( chronologicallySortedLogFiles: Seq[String], hadoopConf: Configuration ): Iterator[ByteBuffer] = { + println("Creating iterator with " + chronologicallySortedLogFiles.mkString("[", "],[", "]")) chronologicallySortedLogFiles.iterator.map { file => + println(s"Creating log reader with $file") new WriteAheadLogReader(file, hadoopConf) } flatMap { x => x } } diff --git a/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogReader.scala b/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogReader.scala index 724549e216e93..35d3e7fb2b873 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogReader.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogReader.scala @@ -29,7 +29,10 @@ private[streaming] class WriteAheadLogReader(path: String, conf: Configuration) private var nextItem: Option[ByteBuffer] = None override def hasNext: Boolean = synchronized { - assertOpen() + if (closed) { + return false + } + if (nextItem.isDefined) { // handle the case where hasNext is called without calling next true } else { @@ -40,31 +43,30 @@ private[streaming] class WriteAheadLogReader(path: String, conf: Configuration) nextItem = Some(ByteBuffer.wrap(buffer)) true } catch { - case e: EOFException => false 
- case e: Exception => throw e + case e: EOFException => + close() + false + case e: Exception => + close() + throw e } } } override def next(): ByteBuffer = synchronized { - // TODO: Possible error case where there are not enough bytes in the stream - // TODO: How to handle that? val data = nextItem.getOrElse { - throw new IllegalStateException("next called without calling hasNext or after hasNext " + - "returned false") + close() + throw new IllegalStateException( + "next called without calling hasNext or after hasNext returned false") } nextItem = None // Ensure the next hasNext call loads new data. data } override def close(): Unit = synchronized { + if (!closed) { + instream.close() + } closed = true - instream.close() } - - private def assertOpen() { - HdfsUtils.checkState(!closed, "Stream is closed. Create a new Reader to read from the " + - "file.") - } - } diff --git a/streaming/src/test/scala/org/apache/spark/streaming/storage/WriteAheadLogSuite.scala b/streaming/src/test/scala/org/apache/spark/streaming/storage/WriteAheadLogSuite.scala index ed21bdbb399fd..b2114dfbc7b12 100644 --- a/streaming/src/test/scala/org/apache/spark/streaming/storage/WriteAheadLogSuite.scala +++ b/streaming/src/test/scala/org/apache/spark/streaming/storage/WriteAheadLogSuite.scala @@ -16,145 +16,178 @@ */ package org.apache.spark.streaming.storage -import java.io.{RandomAccessFile, File} +import java.io.{File, RandomAccessFile} import java.nio.ByteBuffer -import java.util.Random +import scala.util.Random import scala.collection.mutable.ArrayBuffer +import scala.language.implicitConversions import com.google.common.io.Files import org.apache.hadoop.conf.Configuration +import org.scalatest.{BeforeAndAfter, FunSuite} +import org.apache.commons.io.FileUtils +import org.apache.spark.streaming.util.ManualClock +import org.apache.spark.util.Utils -import org.apache.spark.streaming.TestSuiteBase - -class WriteAheadLogSuite extends TestSuiteBase { +class WriteAheadLogSuite extends FunSuite with BeforeAndAfter { val hadoopConf = new Configuration() - val random = new Random() - - test("Test successful writes") { - val dir = Files.createTempDir() - val file = new File(dir, "TestWriter") - try { - val dataToWrite = for (i <- 1 to 50) yield generateRandomData() - val writer = new WriteAheadLogWriter("file:///" + file.toString, hadoopConf) - val segments = dataToWrite.map(writer.write) - writer.close() - val writtenData = readData(segments, file) - assert(writtenData.toArray === dataToWrite.toArray) - } finally { - file.delete() - dir.delete() + var tempDirectory: File = null + + before { + tempDirectory = Files.createTempDir() + } + + after { + if (tempDirectory != null && tempDirectory.exists()) { + FileUtils.deleteDirectory(tempDirectory) + tempDirectory = null } } - test("Test successful reads using random reader") { - val file = File.createTempFile("TestRandomReads", "") - file.deleteOnExit() - val writtenData = writeData(50, file) - val reader = new WriteAheadLogRandomReader("file:///" + file.toString, hadoopConf) - writtenData.foreach { - x => - val length = x._1.remaining() - assert(x._1 === reader.read(new FileSegment(file.toString, x._2, length))) + test("WriteAheadLogWriter - writing data") { + val file = new File(tempDirectory, Random.nextString(10)) + val dataToWrite = generateRandomData() + val writer = new WriteAheadLogWriter("file:///" + file, hadoopConf) + val segments = dataToWrite.map(data => writer.write(data)) + writer.close() + val writtenData = readDataFromLogManually(file, segments) + 
assert(writtenData.toArray === dataToWrite.toArray) + } + + test("WriteAheadLogWriter - syncing of data by writing and reading immediately") { + val file = new File(tempDirectory, Random.nextString(10)) + val dataToWrite = generateRandomData() + val writer = new WriteAheadLogWriter("file:///" + file, hadoopConf) + dataToWrite.foreach { data => + val segment = writer.write(data) + assert(readDataFromLogManually(file, Seq(segment)).head === data) } - reader.close() + writer.close() } - test("Test reading data using random reader written with writer") { - val dir = Files.createTempDir() - val file = new File(dir, "TestRandomReads") - try { - val dataToWrite = for (i <- 1 to 50) yield generateRandomData() - val segments = writeUsingWriter(file, dataToWrite) - val iter = dataToWrite.iterator - val reader = new WriteAheadLogRandomReader("file:///" + file.toString, hadoopConf) - val writtenData = segments.map { x => - reader.read(x) - } - assert(dataToWrite.toArray === writtenData.toArray) - } finally { - file.delete() - dir.delete() + test("WriteAheadLogReader - sequentially reading data") { + val file = File.createTempFile("TestSequentialReads", "", tempDirectory) + val writtenData = writeRandomDataToLogManually(50, file) + val reader = new WriteAheadLogReader("file:///" + file.toString, hadoopConf) + val readData = reader.toSeq.map(byteBufferToString) + assert(readData.toList === writtenData.map { _._1 }.toList) + assert(reader.hasNext === false) + intercept[Exception] { + reader.next() } + reader.close() } - test("Test successful reads using sequential reader") { - val file = File.createTempFile("TestSequentialReads", "") - file.deleteOnExit() - val writtenData = writeData(50, file) + test("WriteAheadLogReader - sequentially reading data written with writer") { + val file = new File(tempDirectory, "TestWriter") + val dataToWrite = generateRandomData() + writeDataUsingWriter(file, dataToWrite) + val iter = dataToWrite.iterator val reader = new WriteAheadLogReader("file:///" + file.toString, hadoopConf) - val iter = writtenData.iterator - iter.foreach { x => - assert(reader.hasNext === true) - assert(reader.next() === x._1) + reader.foreach { byteBuffer => + assert(byteBufferToString(byteBuffer) === iter.next()) + } + } + + test("WriteAheadLogRandomReader - reading data using random reader") { + val file = File.createTempFile("TestRandomReads", "", tempDirectory) + val writtenData = writeRandomDataToLogManually(50, file) + val reader = new WriteAheadLogRandomReader("file:///" + file.toString, hadoopConf) + val reorderedWrittenData = writtenData.toSeq.permutations.next() + reorderedWrittenData.foreach { case (data, offset, length) => + val segment = new FileSegment(file.toString, offset, length) + assert(data === byteBufferToString(reader.read(segment))) } reader.close() } + test("WriteAheadLogRandomReader - reading data using random reader written with writer") { + val file = new File(tempDirectory, "TestRandomReads") + val dataToWrite = generateRandomData() + val segments = writeDataUsingWriter(file, dataToWrite) + val reader = new WriteAheadLogRandomReader("file:///" + file.toString, hadoopConf) + val writtenData = segments.map { byteBuffer => byteBufferToString(reader.read(byteBuffer)) } + assert(dataToWrite.toList === writtenData.toList) + } - test("Test reading data using sequential reader written with writer") { - val dir = Files.createTempDir() - val file = new File(dir, "TestWriter") - try { - val dataToWrite = for (i <- 1 to 50) yield generateRandomData() - val segments = 
writeUsingWriter(file, dataToWrite) - val iter = dataToWrite.iterator - val reader = new WriteAheadLogReader("file:///" + file.toString, hadoopConf) - reader.foreach { x => - assert(x === iter.next()) - } - } finally { - file.delete() - dir.delete() + test("WriteAheadLogManager - write rotating logs and reading from them") { + val fakeClock = new ManualClock + val manager = new WriteAheadLogManager(tempDirectory.toString, hadoopConf, + rollingIntervalSecs = 1, clock = fakeClock) + val dataToWrite = generateRandomData(10) + dataToWrite.foreach { data => + fakeClock.addToTime(500) + manager.writeToLog(data) } + println(tempDirectory.list().mkString("\n")) + assert(tempDirectory.list().size > 1) + + val readData = manager.readFromLog().map(byteBufferToString).toSeq + println("Generated data") + printData(dataToWrite) + println("Read data") + printData(readData) + assert(dataToWrite.toList === readData.toList) } /** - * Writes data to the file and returns the an array of the bytes written. - * @param count - * @return + * Write data to the file and returns the an array of the bytes written. + * This is used to test the WAL reader independently of the WAL writer. */ - // We don't want to be using the WAL writer to test the reader - it will be painful to figure - // out where the bug is. Instead generate the file by hand and see if the WAL reader can - // handle it. - def writeData(count: Int, file: File): ArrayBuffer[(ByteBuffer, Long)] = { - val writtenData = new ArrayBuffer[(ByteBuffer, Long)]() + def writeRandomDataToLogManually(count: Int, file: File): ArrayBuffer[(String, Long, Int)] = { + val writtenData = new ArrayBuffer[(String, Long, Int)]() val writer = new RandomAccessFile(file, "rw") - var i = 0 - while (i < count) { - val data = generateRandomData() - writtenData += ((data, writer.getFilePointer)) - data.rewind() - writer.writeInt(data.remaining()) - writer.write(data.array()) - i += 1 + for (i <- 1 to count) { + val data = generateRandomData(1).head + val offset = writer.getFilePointer() + val bytes = Utils.serialize(data) + writer.writeInt(bytes.size) + writer.write(bytes) + writtenData += ((data, offset, bytes.size)) } writer.close() writtenData } - def readData(segments: Seq[FileSegment], file: File): Seq[ByteBuffer] = { + /** + * Read data from the given segments of log file and returns the read list of byte buffers. + * This is used to test the WAL writer independently of the WAL reader. 
+ */ + def readDataFromLogManually(file: File, segments: Seq[FileSegment]): Seq[String] = { val reader = new RandomAccessFile(file, "r") + println("File " + file + " has " + reader.length() + " bytes ") segments.map { x => reader.seek(x.offset) val data = new Array[Byte](x.length) reader.readInt() reader.readFully(data) - ByteBuffer.wrap(data) + Utils.deserialize[String](data) } } - def generateRandomData(): ByteBuffer = { - val data = new Array[Byte](random.nextInt(50)) - random.nextBytes(data) - ByteBuffer.wrap(data) + def generateRandomData(numItems: Int = 50, itemSize: Int = 50): Seq[String] = { + (1 to numItems).map { _.toString } } - def writeUsingWriter(file: File, input: Seq[ByteBuffer]): Seq[FileSegment] = { + def printData(data: Seq[String]) { + println("# items in data = " + data.size) + println(data.mkString("\n")) + } + + def writeDataUsingWriter(file: File, input: Seq[String]): Seq[FileSegment] = { val writer = new WriteAheadLogWriter(file.toString, hadoopConf) - val segments = input.map(writer.write) + val segments = input.map { data => writer.write(data) } writer.close() segments } + + implicit def stringToByteBuffer(str: String): ByteBuffer = { + ByteBuffer.wrap(Utils.serialize(str)) + } + + implicit def byteBufferToString(byteBuffer: ByteBuffer): String = { + Utils.deserialize[String](byteBuffer.array) + } } From b86af2dbf1a7d7e3f3803314d9d42a56c4c06cce Mon Sep 17 00:00:00 2001 From: Tathagata Das Date: Tue, 7 Oct 2014 11:11:20 -0700 Subject: [PATCH 04/10] Improved WALSuite, and added ReceivedBlockHandlerSuite. --- streaming/pom.xml | 5 + .../storage/ReceivedBlockHandler.scala | 26 ++- .../storage/WriteAheadLogManager.scala | 48 ++--- .../storage/WriteAheadLogWriter.scala | 2 + .../storage/ReceivedBlockHandlerSuite.scala | 138 ++++++++++++++ .../storage/WriteAheadLogSuite.scala | 173 +++++++++++++----- 6 files changed, 320 insertions(+), 72 deletions(-) create mode 100644 streaming/src/test/scala/org/apache/spark/streaming/storage/ReceivedBlockHandlerSuite.scala diff --git a/streaming/pom.xml b/streaming/pom.xml index 12f900c91eb98..002c35f251390 100644 --- a/streaming/pom.xml +++ b/streaming/pom.xml @@ -68,6 +68,11 @@ junit-interface test + + org.mockito + mockito-all + test + target/scala-${scala.binary.version}/classes diff --git a/streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedBlockHandler.scala b/streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedBlockHandler.scala index 052bb59c9c324..299d6069d7018 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedBlockHandler.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedBlockHandler.scala @@ -7,10 +7,12 @@ import scala.concurrent.{Await, ExecutionContext, Future} import scala.concurrent.duration._ import scala.language.postfixOps +import WriteAheadLogBasedBlockHandler._ import org.apache.hadoop.conf.Configuration import org.apache.hadoop.fs.Path import org.apache.spark.{Logging, SparkConf} import org.apache.spark.storage.{BlockManager, StorageLevel, StreamBlockId} +import org.apache.spark.streaming.util.{Clock, SystemClock} import org.apache.spark.util.Utils private[streaming] sealed trait ReceivedBlock @@ -55,20 +57,22 @@ private[streaming] class WriteAheadLogBasedBlockHandler( storageLevel: StorageLevel, conf: SparkConf, hadoopConf: Configuration, - checkpointDir: String + checkpointDir: String, + clock: Clock = new SystemClock ) extends ReceivedBlockHandler with Logging { private val blockStoreTimeout = conf.getInt( 
"spark.streaming.receiver.blockStoreTimeout", 30).seconds - private val rotationInterval = conf.getInt( - "spark.streaming.receiver.writeAheadLog.rotationInterval", 60) + private val rollingInterval = conf.getInt( + "spark.streaming.receiver.writeAheadLog.rollingInterval", 60) private val maxFailures = conf.getInt( "spark.streaming.receiver.writeAheadLog.maxFailures", 3) private val logManager = new WriteAheadLogManager( - new Path(checkpointDir, new Path("receivedData", streamId.toString)).toString, - hadoopConf, rotationInterval, maxFailures, - "WriteAheadLogBasedHandler.WriteAheadLogManager" + checkpointDirToLogDir(checkpointDir, streamId), + hadoopConf, rollingInterval, maxFailures, + threadPoolName = "WriteAheadLogBasedHandler.WriteAheadLogManager", + clock = clock ) implicit private val executionContext = ExecutionContext.fromExecutorService( @@ -101,4 +105,14 @@ private[streaming] class WriteAheadLogBasedBlockHandler( def clearOldBlocks(threshTime: Long) { logManager.clearOldLogs(threshTime) } + + def stop() { + logManager.stop() + } +} + +private[streaming] object WriteAheadLogBasedBlockHandler { + def checkpointDirToLogDir(checkpointDir: String, streamId: Int): String = { + new Path(checkpointDir, new Path("receivedData", streamId.toString)).toString + } } diff --git a/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogManager.scala b/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogManager.scala index 62086a3194cad..ff878e7b8bc31 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogManager.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogManager.scala @@ -9,7 +9,7 @@ import org.apache.hadoop.conf.Configuration import org.apache.hadoop.fs.Path import org.apache.spark.Logging import org.apache.spark.streaming.storage.WriteAheadLogManager._ -import org.apache.spark.streaming.util.{Clock, ManualClock, SystemClock} +import org.apache.spark.streaming.util.{Clock, SystemClock} import org.apache.spark.util.Utils private[streaming] class WriteAheadLogManager( @@ -55,17 +55,26 @@ private[streaming] class WriteAheadLogManager( fileSegment } - def readFromLog(): Iterator[ByteBuffer] = { - logsToIterator(pastLogs.map{ _.path}, hadoopConf) + def readFromLog(): Iterator[ByteBuffer] = synchronized { + val logFilesToRead = pastLogs.map{ _.path} ++ Option(currentLogPath) + println("Reading from the logs: " + logFilesToRead.mkString("\n")) + logFilesToRead.iterator.map { file => + println(s"Creating log reader with $file") + new WriteAheadLogReader(file, hadoopConf) + } flatMap { x => x } } + /** + * Delete the log files that are older than the threshold time. + * + * Its important to note that the threshold time is based on the time stamps used in the log + * files, and is therefore based on the local system time. So if there is coordination necessary + * between the node calculating the threshTime (say, driver node), and the local system time + * (say, worker node), the caller has to take account of possible time skew. 
+ */ def clearOldLogs(threshTime: Long): Unit = { - // Get the log files that are older than the threshold time, while accounting for possible - // time skew between the node issues the threshTime (say, driver node), and the local time at - // the node this is being executed (say, worker node) - val maxTimeSkewMs = 60 * 1000 // 1 minute - val oldLogFiles = synchronized { pastLogs.filter { _.endTime < threshTime - maxTimeSkewMs } } - logDebug(s"Attempting to clear ${oldLogFiles.size} old log files in $logDirectory " + + val oldLogFiles = synchronized { pastLogs.filter { _.endTime < threshTime } } + println(s"Attempting to clear ${oldLogFiles.size} old log files in $logDirectory " + s"older than $threshTime: ${oldLogFiles.map { _.path }.mkString("\n")}") def deleteFiles() { @@ -87,6 +96,13 @@ private[streaming] class WriteAheadLogManager( Future { deleteFiles() } } + def stop(): Unit = synchronized { + println("Stopping log manager") + if (currentLogWriter != null) { + currentLogWriter.close() + } + } + private def getLogWriter: WriteAheadLogWriter = synchronized { val currentTime = clock.currentTime() if (currentLogPath == null || currentTime > currentLogWriterStopTime) { @@ -112,12 +128,13 @@ private[streaming] class WriteAheadLogManager( pastLogs.clear() pastLogs ++= logFilesTologInfo(logFiles) logInfo(s"Recovered ${logFiles.size} log files from $logDirectory") - logDebug(s"Recoved files are:\n${logFiles.mkString("\n")}") + logDebug(s"Recovered files are:\n${logFiles.mkString("\n")}") } } private def resetWriter(): Unit = synchronized { if (currentLogWriter != null) { + currentLogWriter currentLogWriter.close() currentLogWriter = null } @@ -170,15 +187,4 @@ private[storage] object WriteAheadLogManager { } }.sortBy { _.startTime } } - - def logsToIterator( - chronologicallySortedLogFiles: Seq[String], - hadoopConf: Configuration - ): Iterator[ByteBuffer] = { - println("Creating iterator with " + chronologicallySortedLogFiles.mkString("[", "],[", "]")) - chronologicallySortedLogFiles.iterator.map { file => - println(s"Creating log reader with $file") - new WriteAheadLogReader(file, hadoopConf) - } flatMap { x => x } - } } diff --git a/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogWriter.scala b/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogWriter.scala index 8a2db8305a7e2..f8f6089318344 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogWriter.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogWriter.scala @@ -55,10 +55,12 @@ private[streaming] class WriteAheadLogWriter(path: String, conf: Configuration) override private[streaming] def close(): Unit = synchronized { closed = true + hflushOrSync() stream.close() } private def hflushOrSync() { + stream.getWrappedStream.flush() hflushMethod.foreach(_.invoke(stream)) } diff --git a/streaming/src/test/scala/org/apache/spark/streaming/storage/ReceivedBlockHandlerSuite.scala b/streaming/src/test/scala/org/apache/spark/streaming/storage/ReceivedBlockHandlerSuite.scala new file mode 100644 index 0000000000000..9c493210d2575 --- /dev/null +++ b/streaming/src/test/scala/org/apache/spark/streaming/storage/ReceivedBlockHandlerSuite.scala @@ -0,0 +1,138 @@ +package org.apache.spark.streaming.storage + +import java.io.File + +import scala.concurrent.duration._ +import scala.language.postfixOps + +import akka.actor.{ActorSystem, Props} +import com.google.common.io.Files +import org.apache.commons.io.FileUtils +import 
org.apache.hadoop.conf.Configuration +import org.scalatest.{BeforeAndAfter, FunSuite, Matchers} +import org.scalatest.concurrent.Eventually._ + +import org.apache.spark.{MapOutputTrackerMaster, SecurityManager, SparkConf} +import org.apache.spark.network.nio.NioBlockTransferService +import org.apache.spark.scheduler.LiveListenerBus +import org.apache.spark.serializer.KryoSerializer +import org.apache.spark.shuffle.hash.HashShuffleManager +import org.apache.spark.storage._ +import org.apache.spark.streaming.util.ManualClock +import org.apache.spark.util.AkkaUtils +import WriteAheadLogBasedBlockHandler._ +import WriteAheadLogSuite._ + +class ReceivedBlockHandlerSuite extends FunSuite with BeforeAndAfter with Matchers { + + val conf = new SparkConf() + .set("spark.authenticate", "false") + .set("spark.kryoserializer.buffer.mb", "1") + .set("spark.streaming.receiver.writeAheadLog.rollingInterval", "1") + val hadoopConf = new Configuration() + val storageLevel = StorageLevel.MEMORY_ONLY_SER + val streamId = 1 + val securityMgr = new SecurityManager(conf) + val mapOutputTracker = new MapOutputTrackerMaster(conf) + val shuffleManager = new HashShuffleManager(conf) + val serializer = new KryoSerializer(conf) + val manualClock = new ManualClock + + var actorSystem: ActorSystem = null + var blockManagerMaster: BlockManagerMaster = null + var blockManager: BlockManager = null + var receivedBlockHandler: ReceivedBlockHandler = null + var tempDirectory: File = null + + before { + val (actorSystem, boundPort) = AkkaUtils.createActorSystem( + "test", "localhost", 0, conf = conf, securityManager = securityMgr) + this.actorSystem = actorSystem + + conf.set("spark.driver.port", boundPort.toString) + + blockManagerMaster = new BlockManagerMaster( + actorSystem.actorOf(Props(new BlockManagerMasterActor(true, conf, new LiveListenerBus))), + conf, true) + blockManager = new BlockManager("bm", actorSystem, blockManagerMaster, serializer, 100000, + conf, mapOutputTracker, shuffleManager, new NioBlockTransferService(conf, securityMgr)) + tempDirectory = Files.createTempDir() + manualClock.setTime(0) + } + + after { + actorSystem.shutdown() + actorSystem.awaitTermination() + actorSystem = null + blockManagerMaster = null + + if (blockManager != null) { + blockManager.stop() + blockManager = null + } + + if (tempDirectory != null && tempDirectory.exists()) { + FileUtils.deleteDirectory(tempDirectory) + tempDirectory = null + } + } + + test("WriteAheadLogBasedBlockHandler - store block") { + createWriteAheadLogBasedBlockHandler() + val (data, blockIds) = generateAndStoreData(receivedBlockHandler) + receivedBlockHandler.asInstanceOf[WriteAheadLogBasedBlockHandler].stop() + + // Check whether blocks inserted in the block manager are correct + val blockManagerData = blockIds.flatMap { blockId => + blockManager.getLocal(blockId).map { _.data }.getOrElse(Iterator.empty) + } + blockManagerData.toList shouldEqual data.toList + + // Check whether the blocks written to the write ahead log are correct + val logFiles = getLogFiles() + logFiles.size should be > 1 + + val logData = logFiles.flatMap { + file => new WriteAheadLogReader(file.toString, hadoopConf).toSeq + }.flatMap { blockManager.dataDeserialize(StreamBlockId(streamId, 0), _ )} + logData.toList shouldEqual data.toList + } + + test("WriteAheadLogBasedBlockHandler - clear old blocks") { + createWriteAheadLogBasedBlockHandler() + generateAndStoreData(receivedBlockHandler) + val preCleanupLogFiles = getLogFiles() + preCleanupLogFiles.size should be > 1 + + // this 
depends on the number of blocks inserted using generateAndStoreData() + manualClock.currentTime() shouldEqual 5000L + + val cleanupThreshTime = 3000L + receivedBlockHandler.clearOldBlocks(cleanupThreshTime) + eventually(timeout(10000 millis), interval(10 millis)) { + getLogFiles().size should be < preCleanupLogFiles.size + } + } + + def createWriteAheadLogBasedBlockHandler() { + receivedBlockHandler = new WriteAheadLogBasedBlockHandler(blockManager, 1, + storageLevel, conf, hadoopConf, tempDirectory.toString, manualClock) + } + + def generateAndStoreData( + receivedBlockHandler: ReceivedBlockHandler): (Seq[String], Seq[StreamBlockId]) = { + val data = (1 to 100).map { _.toString } + val blocks = data.grouped(10).map { _.toIterator }.toSeq + val blockIds = (0 until blocks.size).map { i => StreamBlockId(streamId, i) } + blocks.zip(blockIds).foreach { case (block, id) => + manualClock.addToTime(500) // log rolling interval set to 1000 ms through SparkConf + receivedBlockHandler.storeBlock(id, IteratorBlock(block)) + } + (data, blockIds) + } + + def getLogFiles(): Seq[File] = { + getLogFilesInDirectory( + new File(checkpointDirToLogDir(tempDirectory.toString, streamId))) + } +} diff --git a/streaming/src/test/scala/org/apache/spark/streaming/storage/WriteAheadLogSuite.scala b/streaming/src/test/scala/org/apache/spark/streaming/storage/WriteAheadLogSuite.scala index b2114dfbc7b12..1ba6e0e45bc16 100644 --- a/streaming/src/test/scala/org/apache/spark/streaming/storage/WriteAheadLogSuite.scala +++ b/streaming/src/test/scala/org/apache/spark/streaming/storage/WriteAheadLogSuite.scala @@ -16,7 +16,7 @@ */ package org.apache.spark.streaming.storage -import java.io.{File, RandomAccessFile} +import java.io.{DataInputStream, FileInputStream, File, RandomAccessFile} import java.nio.ByteBuffer import scala.util.Random @@ -29,9 +29,10 @@ import org.scalatest.{BeforeAndAfter, FunSuite} import org.apache.commons.io.FileUtils import org.apache.spark.streaming.util.ManualClock import org.apache.spark.util.Utils +import WriteAheadLogSuite._ class WriteAheadLogSuite extends FunSuite with BeforeAndAfter { - + val hadoopConf = new Configuration() var tempDirectory: File = null @@ -52,7 +53,7 @@ class WriteAheadLogSuite extends FunSuite with BeforeAndAfter { val writer = new WriteAheadLogWriter("file:///" + file, hadoopConf) val segments = dataToWrite.map(data => writer.write(data)) writer.close() - val writtenData = readDataFromLogManually(file, segments) + val writtenData = readDataManually(file, segments) assert(writtenData.toArray === dataToWrite.toArray) } @@ -62,17 +63,19 @@ class WriteAheadLogSuite extends FunSuite with BeforeAndAfter { val writer = new WriteAheadLogWriter("file:///" + file, hadoopConf) dataToWrite.foreach { data => val segment = writer.write(data) - assert(readDataFromLogManually(file, Seq(segment)).head === data) + assert(readDataManually(file, Seq(segment)).head === data) } writer.close() } test("WriteAheadLogReader - sequentially reading data") { + // Write data manually for testing the sequential reader val file = File.createTempFile("TestSequentialReads", "", tempDirectory) - val writtenData = writeRandomDataToLogManually(50, file) + val writtenData = generateRandomData() + writeDataManually(writtenData, file) val reader = new WriteAheadLogReader("file:///" + file.toString, hadoopConf) val readData = reader.toSeq.map(byteBufferToString) - assert(readData.toList === writtenData.map { _._1 }.toList) + assert(readData.toList === writtenData.toList) assert(reader.hasNext === false) 
intercept[Exception] { reader.next() @@ -81,6 +84,7 @@ class WriteAheadLogSuite extends FunSuite with BeforeAndAfter { } test("WriteAheadLogReader - sequentially reading data written with writer") { + // Write data manually for testing the sequential reader val file = new File(tempDirectory, "TestWriter") val dataToWrite = generateRandomData() writeDataUsingWriter(file, dataToWrite) @@ -89,73 +93,130 @@ class WriteAheadLogSuite extends FunSuite with BeforeAndAfter { reader.foreach { byteBuffer => assert(byteBufferToString(byteBuffer) === iter.next()) } + reader.close() } test("WriteAheadLogRandomReader - reading data using random reader") { + // Write data manually for testing the random reader val file = File.createTempFile("TestRandomReads", "", tempDirectory) - val writtenData = writeRandomDataToLogManually(50, file) + val writtenData = generateRandomData() + val segments = writeDataManually(writtenData, file) + + // Get a random order of these segments and read them back + val writtenDataAndSegments = writtenData.zip(segments).toSeq.permutations.take(10).flatten val reader = new WriteAheadLogRandomReader("file:///" + file.toString, hadoopConf) - val reorderedWrittenData = writtenData.toSeq.permutations.next() - reorderedWrittenData.foreach { case (data, offset, length) => - val segment = new FileSegment(file.toString, offset, length) + writtenDataAndSegments.foreach { case (data, segment) => assert(data === byteBufferToString(reader.read(segment))) } reader.close() } test("WriteAheadLogRandomReader - reading data using random reader written with writer") { + // Write data using writer for testing the random reader val file = new File(tempDirectory, "TestRandomReads") - val dataToWrite = generateRandomData() - val segments = writeDataUsingWriter(file, dataToWrite) + val data = generateRandomData() + val segments = writeDataUsingWriter(file, data) + + // Read a random sequence of segments and verify read data + val dataAndSegments = data.zip(segments).toSeq.permutations.take(10).flatten val reader = new WriteAheadLogRandomReader("file:///" + file.toString, hadoopConf) - val writtenData = segments.map { byteBuffer => byteBufferToString(reader.read(byteBuffer)) } - assert(dataToWrite.toList === writtenData.toList) + dataAndSegments.foreach { case(data, segment) => + assert(data === byteBufferToString(reader.read(segment))) + } + reader.close() } - test("WriteAheadLogManager - write rotating logs and reading from them") { - val fakeClock = new ManualClock - val manager = new WriteAheadLogManager(tempDirectory.toString, hadoopConf, - rollingIntervalSecs = 1, clock = fakeClock) + test("WriteAheadLogManager - write rotating logs") { + // Write data using manager val dataToWrite = generateRandomData(10) - dataToWrite.foreach { data => - fakeClock.addToTime(500) - manager.writeToLog(data) - } - println(tempDirectory.list().mkString("\n")) - assert(tempDirectory.list().size > 1) - - val readData = manager.readFromLog().map(byteBufferToString).toSeq - println("Generated data") - printData(dataToWrite) - println("Read data") - printData(readData) + writeDataUsingManager(tempDirectory, dataToWrite) + + // Read data manually to verify the written data + val logFiles = getLogFilesInDirectory(tempDirectory) + assert(logFiles.size > 1) + val writtenData = logFiles.flatMap { file => readDataManually(file) } + assert(writtenData.toList === dataToWrite.toList) + } + + test("WriteAheadLogManager - read rotating logs") { + // Write data manually for testing reading through manager + val writtenData = (1 to 
10).map { i => + val data = generateRandomData(10) + val file = new File(tempDirectory, s"log-$i-${i + 1}") + writeDataManually(data, file) + println(s"Generated log file $file") + data + }.flatten + + // Read data using manager and verify + val readData = readDataUsingManager(tempDirectory) + assert(readData.toList === writtenData.toList) + } + + test("WriteAheadLogManager - recover past logs when creating new manager") { + // Write data with manager, recover with new manager and verify + val dataToWrite = generateRandomData(100) + writeDataUsingManager(tempDirectory, dataToWrite) + val logFiles = getLogFilesInDirectory(tempDirectory) + println("==========\n" + logFiles.mkString("\n") + "\n==========\n" ) + + assert(logFiles.size > 1) + val readData = readDataUsingManager(tempDirectory) assert(dataToWrite.toList === readData.toList) } + // TODO (Hari, TD): Test different failure conditions of writers and readers. + // - Failure in the middle of write + // - Failure while reading incomplete/corrupt file +} + +object WriteAheadLogSuite { + + private val hadoopConf = new Configuration() + /** * Write data to the file and returns the an array of the bytes written. * This is used to test the WAL reader independently of the WAL writer. */ - def writeRandomDataToLogManually(count: Int, file: File): ArrayBuffer[(String, Long, Int)] = { - val writtenData = new ArrayBuffer[(String, Long, Int)]() + def writeDataManually(data: Seq[String], file: File): Seq[FileSegment] = { + val segments = new ArrayBuffer[FileSegment]() val writer = new RandomAccessFile(file, "rw") - for (i <- 1 to count) { - val data = generateRandomData(1).head + data.foreach { item => val offset = writer.getFilePointer() - val bytes = Utils.serialize(data) + val bytes = Utils.serialize(item) writer.writeInt(bytes.size) writer.write(bytes) - writtenData += ((data, offset, bytes.size)) + segments += FileSegment(file.toString, offset, bytes.size) } writer.close() - writtenData + segments + } + + def writeDataUsingWriter(file: File, data: Seq[String]): Seq[FileSegment] = { + val writer = new WriteAheadLogWriter(file.toString, hadoopConf) + val segments = data.map { + item => writer.write(item) + } + writer.close() + segments + } + + def writeDataUsingManager(logDirectory: File, data: Seq[String]) { + val fakeClock = new ManualClock + val manager = new WriteAheadLogManager(logDirectory.toString, hadoopConf, + rollingIntervalSecs = 1, clock = fakeClock) + data.foreach { item => + fakeClock.addToTime(500) + manager.writeToLog(item) + } + manager.stop() } /** * Read data from the given segments of log file and returns the read list of byte buffers. * This is used to test the WAL writer independently of the WAL reader. 
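 * Each record is assumed to be framed as a 4-byte length followed by the serialized payload,
 * the same layout produced by writeDataManually above (writeInt(bytes.size) then write(bytes)),
 * so this reader seeks to the segment offset, skips the length field and reads exactly
 * segment.length bytes.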
*/ - def readDataFromLogManually(file: File, segments: Seq[FileSegment]): Seq[String] = { + def readDataManually(file: File, segments: Seq[FileSegment]): Seq[String] = { val reader = new RandomAccessFile(file, "r") println("File " + file + " has " + reader.length() + " bytes ") segments.map { x => @@ -167,22 +228,44 @@ class WriteAheadLogSuite extends FunSuite with BeforeAndAfter { } } + def readDataManually(file: File): Seq[String] = { + val reader = new DataInputStream(new FileInputStream(file)) + val buffer = new ArrayBuffer[String] + try { + while (reader.available > 0) { + val length = reader.readInt() + val bytes = new Array[Byte](length) + reader.read(bytes) + buffer += Utils.deserialize[String](bytes) + } + } finally { + reader.close() + } + buffer + } + + def readDataUsingManager(logDirectory: File): Seq[String] = { + val manager = new WriteAheadLogManager(logDirectory.toString, hadoopConf) + val data = manager.readFromLog().map(byteBufferToString).toSeq + manager.stop() + data + } + def generateRandomData(numItems: Int = 50, itemSize: Int = 50): Seq[String] = { (1 to numItems).map { _.toString } } + def getLogFilesInDirectory(directory: File): Seq[File] = { + println("[ " + directory.listFiles().filter(_.getName().startsWith("log-")).mkString(" | ") + " ]") + directory.listFiles().filter(_.getName().startsWith("log-")) + .sortBy(_.getName.split("-")(1).toLong) + } + def printData(data: Seq[String]) { println("# items in data = " + data.size) println(data.mkString("\n")) } - def writeDataUsingWriter(file: File, input: Seq[String]): Seq[FileSegment] = { - val writer = new WriteAheadLogWriter(file.toString, hadoopConf) - val segments = input.map { data => writer.write(data) } - writer.close() - segments - } - implicit def stringToByteBuffer(str: String): ByteBuffer = { ByteBuffer.wrap(Utils.serialize(str)) } From 4d9c830d91af30dc1daaa21064d64d1583e7d9d5 Mon Sep 17 00:00:00 2001 From: Tathagata Das Date: Tue, 7 Oct 2014 18:33:02 -0700 Subject: [PATCH 05/10] Added ReceiverTrackerSuite --- .../receiver/ReceiverSupervisorImpl.scala | 3 +- .../streaming/scheduler/ReceiverTracker.scala | 79 ++++++++--- .../storage/ReceivedBlockHandler.scala | 2 +- .../storage/WriteAheadLogManager.scala | 60 +++----- .../storage/WriteAheadLogReader.scala | 6 +- .../storage/WriteAheadLogWriter.scala | 2 - .../streaming/ReceiverTrackerSuite.scala | 133 ++++++++++++++++++ .../storage/ReceivedBlockHandlerSuite.scala | 8 +- .../storage/WriteAheadLogSuite.scala | 19 +-- 9 files changed, 231 insertions(+), 81 deletions(-) create mode 100644 streaming/src/test/scala/org/apache/spark/streaming/ReceiverTrackerSuite.scala diff --git a/streaming/src/main/scala/org/apache/spark/streaming/receiver/ReceiverSupervisorImpl.scala b/streaming/src/main/scala/org/apache/spark/streaming/receiver/ReceiverSupervisorImpl.scala index 017cbae5060b5..01d3e3f497500 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/receiver/ReceiverSupervisorImpl.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/receiver/ReceiverSupervisorImpl.scala @@ -150,7 +150,8 @@ private[streaming] class ReceiverSupervisorImpl( val blockInfo = ReceivedBlockInfo(streamId, blockId, numRecords, optionalMetadata.orNull, fileSegmentOption) - trackerActor ! 
AddBlock(blockInfo) + val future = trackerActor.ask(AddBlock(blockInfo))(askTimeout) + Await.result(future, askTimeout) logDebug("Reported block " + blockId) } diff --git a/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceiverTracker.scala b/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceiverTracker.scala index 36a55e64409b6..582df6889c24b 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceiverTracker.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceiverTracker.scala @@ -58,16 +58,23 @@ private[streaming] case class ReportError(streamId: Int, message: String, error: private[streaming] case class DeregisterReceiver(streamId: Int, msg: String, error: String) extends ReceiverTrackerMessage -class ReceivedBlockInfoCheckpointer( - logDirectory: String, conf: SparkConf, hadoopConf: Configuration) { +/** + * + */ +private[streaming] class ReceivedBlockInfoCheckpointer( + checkpointDirectory: String, conf: SparkConf, hadoopConf: Configuration) { + + import ReceivedBlockInfoCheckpointer._ + + private val logDirectory = checkpointDirToLogDir(checkpointDirectory) private val logManager = new WriteAheadLogManager( - logDirectory, hadoopConf, threadPoolName = "ReceiverTracker.WriteAheadLogManager") + logDirectory, hadoopConf, callerName = "ReceiverTracker") - def read(): Iterator[ReceivedBlockInfo] = { + def recover(): Seq[ReceivedBlockInfo] = { logManager.readFromLog().map { byteBuffer => Utils.deserialize[ReceivedBlockInfo](byteBuffer.array) - } + }.toSeq } def write(receivedBlockInfo: ReceivedBlockInfo) { @@ -78,15 +85,27 @@ class ReceivedBlockInfoCheckpointer( def clear(threshTime: Long) { logManager.clearOldLogs(threshTime) } + + def stop() { + logManager.stop() + } +} + +private[streaming] object ReceivedBlockInfoCheckpointer { + def checkpointDirToLogDir(checkpointDir: String): String = { + new Path(checkpointDir, "receivedBlockMetadata").toString + } } /** * This class manages the execution of the receivers of NetworkInputDStreams. Instance of * this class must be created after all input streams have been added and StreamingContext.start() * has been called because it needs the final set of input streams at the time of instantiation. + * + * @param skipReceiverLaunch Do not launch the receiver. This is useful for testing. */ private[streaming] -class ReceiverTracker(ssc: StreamingContext) extends Logging { +class ReceiverTracker(ssc: StreamingContext, skipReceiverLaunch: Boolean = false) extends Logging { private val receiverInputStreams = ssc.graph.getReceiverInputStreams() private val receiverInputStreamMap = Map(receiverInputStreams.map(x => (x.id, x)): _*) @@ -95,12 +114,9 @@ class ReceiverTracker(ssc: StreamingContext) extends Logging { private val receivedBlockInfo = new HashMap[Int, SynchronizedQueue[ReceivedBlockInfo]] with SynchronizedMap[Int, SynchronizedQueue[ReceivedBlockInfo]] private val listenerBus = ssc.scheduler.listenerBus - private val receivedBlockCheckpointerOption = Option(ssc.checkpointDir) map { _ => - new ReceivedBlockInfoCheckpointer( - new Path(ssc.checkpointDir, "receivedBlockMetadata").toString, - ssc.sparkContext.conf, - ssc.sparkContext.hadoopConfiguration - ) + val receivedBlockCheckpointerOption = Option(ssc.checkpointDir) map { dir => + new ReceivedBlockInfoCheckpointer(dir, ssc.sparkContext.conf, + ssc.sparkContext.hadoopConfiguration) } // actor is created when generator starts. 
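The recover() path above turns each ByteBuffer read from the write-ahead log back into a ReceivedBlockInfo via Java deserialization; the write() path presumably stores the serialized form the same way. A self-contained sketch of that round trip, with a hypothetical BlockMeta case class standing in for ReceivedBlockInfo:

import java.io.{ByteArrayInputStream, ByteArrayOutputStream, ObjectInputStream, ObjectOutputStream}
import java.nio.ByteBuffer

// Hypothetical stand-in for ReceivedBlockInfo (the real class also carries the block id,
// record count, metadata and the optional FileSegment).
case class BlockMeta(streamId: Int, uniqueId: Long)

object BlockMetaCodec {
  // Serialize to the ByteBuffer form that would be handed to WriteAheadLogManager.writeToLog()
  def toByteBuffer(meta: BlockMeta): ByteBuffer = {
    val bytes = new ByteArrayOutputStream()
    val out = new ObjectOutputStream(bytes)
    out.writeObject(meta)
    out.close()
    ByteBuffer.wrap(bytes.toByteArray)
  }

  // Mirror of the recover() path: rebuild the metadata from the buffer's backing array
  def fromByteBuffer(buffer: ByteBuffer): BlockMeta = {
    val in = new ObjectInputStream(new ByteArrayInputStream(buffer.array))
    in.readObject().asInstanceOf[BlockMeta]
  }
}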
@@ -109,9 +125,11 @@ class ReceiverTracker(ssc: StreamingContext) extends Logging { var currentTime: Time = null receivedBlockCheckpointerOption.foreach { checkpointer => - checkpointer.read().foreach { info => + val recoveredBlockInfo = checkpointer.recover() + recoveredBlockInfo.foreach { info => getReceivedBlockInfoQueue(info.streamId) += info } + logInfo(s"Recovered info on ${recoveredBlockInfo.size} blocks from write ahead log") } /** Start the actor and receiver execution thread. */ @@ -123,7 +141,7 @@ class ReceiverTracker(ssc: StreamingContext) extends Logging { if (!receiverInputStreams.isEmpty) { actor = ssc.env.actorSystem.actorOf(Props(new ReceiverTrackerActor), "ReceiverTracker") - receiverExecutor.start() + if (!skipReceiverLaunch) receiverExecutor.start() logInfo("ReceiverTracker started") } } @@ -132,11 +150,13 @@ class ReceiverTracker(ssc: StreamingContext) extends Logging { def stop() = synchronized { if (!receiverInputStreams.isEmpty && actor != null) { // First, stop the receivers - receiverExecutor.stop() + if (!skipReceiverLaunch) receiverExecutor.stop() // Finally, stop the actor ssc.env.actorSystem.stop(actor) actor = null + + receivedBlockCheckpointerOption.foreach { _.stop() } logInfo("ReceiverTracker stopped") } } @@ -148,6 +168,10 @@ class ReceiverTracker(ssc: StreamingContext) extends Logging { receivedBlockInfo.toArray } + def getReceiverInfo(streamId: Int): Option[ReceiverInfo] = { + receiverInfo.get(streamId) + } + private def getReceivedBlockInfoQueue(streamId: Int) = { receivedBlockInfo.getOrElseUpdate(streamId, new SynchronizedQueue[ReceivedBlockInfo]) } @@ -189,10 +213,17 @@ class ReceiverTracker(ssc: StreamingContext) extends Logging { } /** Add new blocks for the given stream */ - def addBlock(receivedBlockInfo: ReceivedBlockInfo) { - receivedBlockCheckpointerOption.foreach { _.write(receivedBlockInfo) } - getReceivedBlockInfoQueue(receivedBlockInfo.streamId) += receivedBlockInfo - logDebug(s"Stream ${receivedBlockInfo.streamId} received block ${receivedBlockInfo.blockId}") + def addBlock(receivedBlockInfo: ReceivedBlockInfo): Boolean = { + try { + receivedBlockCheckpointerOption.foreach { _.write(receivedBlockInfo) } + getReceivedBlockInfoQueue(receivedBlockInfo.streamId) += receivedBlockInfo + logDebug(s"Stream ${receivedBlockInfo.streamId} received block ${receivedBlockInfo.blockId}") + true + } catch { + case e: Exception => + logError("Error adding block " + receivedBlockInfo, e) + false + } } /** Report error sent by a receiver */ @@ -226,7 +257,7 @@ class ReceiverTracker(ssc: StreamingContext) extends Logging { registerReceiver(streamId, typ, host, receiverActor, sender) sender ! true case AddBlock(receivedBlockInfo) => - addBlock(receivedBlockInfo) + sender ! addBlock(receivedBlockInfo) case ReportError(streamId, message, error) => reportError(streamId, message, error) case DeregisterReceiver(streamId, message, error) => @@ -299,9 +330,11 @@ class ReceiverTracker(ssc: StreamingContext) extends Logging { "Could not start receiver as object not found.") } val receiver = iterator.next() - val executor = new ReceiverSupervisorImpl(receiver, SparkEnv.get) - executor.start() - executor.awaitTermination() + val supervisor = new ReceiverSupervisorImpl(receiver, SparkEnv.get) + supervisor.start() + logInfo("Supervisor started()") + supervisor.awaitTermination() + logInfo("Supervisor terminated") } // Run the dummy Spark job to ensure that all slaves have registered. // This avoids all the receivers to be scheduled on the same node. 
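The addBlock() change above makes block reporting an acknowledged operation: the actor replies with the Boolean result, so the receiver learns whether the metadata was durably recorded. A condensed, self-contained sketch of that semantics, with String standing in for ReceivedBlockInfo and writeToLog standing in for the optional ReceivedBlockInfoCheckpointer:

import scala.collection.mutable

// Reply true only after the metadata has been (optionally) logged and queued; any failure
// while logging is reported back to the caller as false instead of being swallowed.
object AddBlockSketch {
  def addBlock(
      queue: mutable.Queue[String],
      writeToLog: Option[String => Unit],
      blockInfo: String): Boolean = {
    try {
      writeToLog.foreach(write => write(blockInfo)) // may throw if durable logging fails
      queue += blockInfo
      true
    } catch {
      case e: Exception =>
        println("Error adding block " + blockInfo + ": " + e)
        false
    }
  }
}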
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedBlockHandler.scala b/streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedBlockHandler.scala index 299d6069d7018..fe36dbc210f24 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedBlockHandler.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedBlockHandler.scala @@ -71,7 +71,7 @@ private[streaming] class WriteAheadLogBasedBlockHandler( private val logManager = new WriteAheadLogManager( checkpointDirToLogDir(checkpointDir, streamId), hadoopConf, rollingInterval, maxFailures, - threadPoolName = "WriteAheadLogBasedHandler.WriteAheadLogManager", + callerName = "WriteAheadLogBasedHandler", clock = clock ) diff --git a/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogManager.scala b/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogManager.scala index ff878e7b8bc31..0c104c1609e9a 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogManager.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogManager.scala @@ -17,13 +17,15 @@ private[streaming] class WriteAheadLogManager( hadoopConf: Configuration, rollingIntervalSecs: Int = 60, maxFailures: Int = 3, - threadPoolName: String = "WriteAheadLogManager", + callerName: String = null, clock: Clock = new SystemClock ) extends Logging { private val pastLogs = new ArrayBuffer[LogInfo] - implicit private val executionContext = - ExecutionContext.fromExecutorService(Utils.newDaemonFixedThreadPool(1, threadPoolName)) + private val threadpoolName = "WriteAheadLogManager" + + Option(callerName).map { s => s" for $s" }.getOrElse("") + implicit private val executionContext = ExecutionContext.fromExecutorService( + Utils.newDaemonFixedThreadPool(1, threadpoolName)) private var currentLogPath: String = null private var currentLogWriter: WriteAheadLogWriter = null @@ -57,9 +59,9 @@ private[streaming] class WriteAheadLogManager( def readFromLog(): Iterator[ByteBuffer] = synchronized { val logFilesToRead = pastLogs.map{ _.path} ++ Option(currentLogPath) - println("Reading from the logs: " + logFilesToRead.mkString("\n")) + logInfo("Reading from the logs: " + logFilesToRead.mkString("\n")) logFilesToRead.iterator.map { file => - println(s"Creating log reader with $file") + logDebug(s"Creating log reader with $file") new WriteAheadLogReader(file, hadoopConf) } flatMap { x => x } } @@ -74,7 +76,7 @@ private[streaming] class WriteAheadLogManager( */ def clearOldLogs(threshTime: Long): Unit = { val oldLogFiles = synchronized { pastLogs.filter { _.endTime < threshTime } } - println(s"Attempting to clear ${oldLogFiles.size} old log files in $logDirectory " + + logInfo(s"Attempting to clear ${oldLogFiles.size} old log files in $logDirectory " + s"older than $threshTime: ${oldLogFiles.map { _.path }.mkString("\n")}") def deleteFiles() { @@ -92,15 +94,17 @@ private[streaming] class WriteAheadLogManager( } logInfo(s"Cleared log files in $logDirectory older than $threshTime") } - - Future { deleteFiles() } + if (!executionContext.isShutdown) { + Future { deleteFiles() } + } } def stop(): Unit = synchronized { - println("Stopping log manager") if (currentLogWriter != null) { currentLogWriter.close() } + executionContext.shutdown() + logInfo("Stopped log manager") } private def getLogWriter: WriteAheadLogWriter = synchronized { @@ -124,11 +128,11 @@ private[streaming] class WriteAheadLogManager( val logDirectoryPath = 
new Path(logDirectory) val fs = logDirectoryPath.getFileSystem(hadoopConf) if (fs.exists(logDirectoryPath) && fs.getFileStatus(logDirectoryPath).isDir) { - val logFiles = fs.listStatus(logDirectoryPath).map { _.getPath } + val logFileInfo = logFilesTologInfo(fs.listStatus(logDirectoryPath).map { _.getPath }) pastLogs.clear() - pastLogs ++= logFilesTologInfo(logFiles) - logInfo(s"Recovered ${logFiles.size} log files from $logDirectory") - logDebug(s"Recovered files are:\n${logFiles.mkString("\n")}") + pastLogs ++= logFileInfo + logInfo(s"Recovered ${logFileInfo.size} log files from $logDirectory") + logDebug(s"Recovered files are:\n${logFileInfo.map(_.path).mkString("\n")}") } } @@ -139,30 +143,6 @@ private[streaming] class WriteAheadLogManager( currentLogWriter = null } } - -/* - private def tryMultipleTimes[T](message: String)(body: => T): T = { - var result: T = null.asInstanceOf[T] - var failures = 0 - var lastException: Exception = null - var succeeded = false - while (!succeeded && failures < maxFailures) { - try { - result = body - succeeded = true - } catch { - case ex: Exception => - lastException = ex - resetWriter() - failures += 1 - logWarning(message, ex) - } - } - if (!succeeded) { - throw new Exception(s"Failed $message after $failures failures", lastException) - } - result - } */ } private[storage] object WriteAheadLogManager { @@ -176,14 +156,14 @@ private[storage] object WriteAheadLogManager { } def logFilesTologInfo(files: Seq[Path]): Seq[LogInfo] = { - println("Creating log info with " + files.mkString("[","],[","]")) files.flatMap { file => logFileRegex.findFirstIn(file.getName()) match { - case logFileRegex(startTimeStr, stopTimeStr) => + case Some(logFileRegex(startTimeStr, stopTimeStr)) => val startTime = startTimeStr.toLong val stopTime = stopTimeStr.toLong Some(LogInfo(startTime, stopTime, file.toString)) - case _ => None + case None => + None } }.sortBy { _.startTime } } diff --git a/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogReader.scala b/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogReader.scala index 35d3e7fb2b873..5e0dc1d49a89a 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogReader.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogReader.scala @@ -20,9 +20,10 @@ import java.io.{EOFException, Closeable} import java.nio.ByteBuffer import org.apache.hadoop.conf.Configuration +import org.apache.spark.Logging private[streaming] class WriteAheadLogReader(path: String, conf: Configuration) - extends Iterator[ByteBuffer] with Closeable { + extends Iterator[ByteBuffer] with Closeable with Logging { private val instream = HdfsUtils.getInputStream(path, conf) private var closed = false @@ -41,12 +42,15 @@ private[streaming] class WriteAheadLogReader(path: String, conf: Configuration) val buffer = new Array[Byte](length) instream.readFully(buffer) nextItem = Some(ByteBuffer.wrap(buffer)) + logTrace("Read next item " + nextItem.get) true } catch { case e: EOFException => + logDebug("Error reading next item, EOF reached", e) close() false case e: Exception => + logDebug("Error reading next item, EOF reached", e) close() throw e } diff --git a/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogWriter.scala b/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogWriter.scala index f8f6089318344..8a2db8305a7e2 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogWriter.scala 
+++ b/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogWriter.scala @@ -55,12 +55,10 @@ private[streaming] class WriteAheadLogWriter(path: String, conf: Configuration) override private[streaming] def close(): Unit = synchronized { closed = true - hflushOrSync() stream.close() } private def hflushOrSync() { - stream.getWrappedStream.flush() hflushMethod.foreach(_.invoke(stream)) } diff --git a/streaming/src/test/scala/org/apache/spark/streaming/ReceiverTrackerSuite.scala b/streaming/src/test/scala/org/apache/spark/streaming/ReceiverTrackerSuite.scala new file mode 100644 index 0000000000000..7d4473e27f6a5 --- /dev/null +++ b/streaming/src/test/scala/org/apache/spark/streaming/ReceiverTrackerSuite.scala @@ -0,0 +1,133 @@ +package org.apache.spark.streaming + +import java.io.File + +import scala.concurrent.{Await, Future} +import scala.concurrent.ExecutionContext.Implicits.global +import scala.concurrent.duration._ +import scala.language.postfixOps +import scala.util.Random + +import akka.pattern.ask +import com.google.common.io.Files +import org.apache.commons.io.FileUtils +import org.scalatest.{BeforeAndAfter, BeforeAndAfterAll, FunSuite, Matchers} +import org.scalatest.concurrent.Eventually._ + +import org.apache.spark.{Logging, SparkConf, SparkContext} +import org.apache.spark.storage.{StorageLevel, StreamBlockId} +import org.apache.spark.streaming.receiver.Receiver +import org.apache.spark.streaming.scheduler.{AddBlock, ReceivedBlockInfo, ReceivedBlockInfoCheckpointer, ReceiverTracker} +import org.apache.spark.streaming.storage.{FileSegment, WriteAheadLogReader} +import org.apache.spark.streaming.storage.WriteAheadLogSuite._ +import org.apache.spark.util.Utils + +class ReceiverTrackerSuite + extends FunSuite with BeforeAndAfter with BeforeAndAfterAll with Matchers with Logging { + + val conf = new SparkConf().setMaster("local[2]").setAppName("ReceiverTrackerSuite") + val sc = new SparkContext(conf) + val akkaTimeout = 10 seconds + + var ssc: StreamingContext = null + var receiverTracker: ReceiverTracker = null + var checkpointDirectory: File = null + + before { + checkpointDirectory = Files.createTempDir() + } + + after { + if (receiverTracker != null) { + receiverTracker.stop() + receiverTracker = null + } + if (ssc != null) { + ssc.stop(stopSparkContext = false) + ssc = null + } + if (checkpointDirectory != null && checkpointDirectory.exists()) { + FileUtils.deleteDirectory(checkpointDirectory) + checkpointDirectory = null + } + } + + override def afterAll() { + sc.stop() + } + + test("add blocks info and retrieve them") { + createTracker(enableCheckpoint = false) + val blockIds = (1 to 10).map { _ => math.abs(Random.nextInt()) } + val futures = blockIds.map { id => + receiverTracker.actor.ask(AddBlock(createBlockInfo(id, 1)))(akkaTimeout).mapTo[Boolean] + } + Await.ready(Future.sequence(futures), akkaTimeout) + + val recordedBlockIds = receiverTracker.getReceivedBlockInfo(1) + recordedBlockIds.map { _.blockId.uniqueId } shouldEqual blockIds + } + + test("add block info with checkpoint enabled, and recover them") { + createTracker(enableCheckpoint = true) + val blockIds = (1 to 10).map { _ => math.abs(Random.nextInt()) } + val futures = blockIds.map { id => + receiverTracker.actor.ask(AddBlock(createBlockInfo(id, 1)))(akkaTimeout).mapTo[Boolean] + } + Await.ready(Future.sequence(futures), akkaTimeout) + receiverTracker.stop() + + val logFiles = getWriteAheadLogFiles() + logFiles.size should be > 0 + + val logData = logFiles.flatMap { + file => new 
WriteAheadLogReader(file.toString, sc.hadoopConfiguration).toSeq + }.map { byteBuffer => + Utils.deserialize[ReceivedBlockInfo](byteBuffer.array) + } + logData foreach { _.blockId.streamId shouldEqual 1 } + logData.map { _.blockId.uniqueId }.toList shouldEqual blockIds + + createTracker(enableCheckpoint = true) + val recoveredBlockIds = receiverTracker.getReceivedBlockInfo(1) + recoveredBlockIds.map { _.blockId.uniqueId } shouldEqual blockIds + } + + ignore("clean old block info") { + // TODO (TD) + } + + def createTracker(enableCheckpoint: Boolean) { + ssc = new StreamingContext(sc, Seconds(1)) + if (enableCheckpoint) { + ssc.checkpoint(checkpointDirectory.toString) + assert(ssc.checkpointDir != null) + } + + val receiver = new Receiver[String](StorageLevel.MEMORY_ONLY) { + def onStart(): Unit = { } + def onStop(): Unit = { } + } + ssc.receiverStream(receiver) + receiverTracker = new ReceiverTracker(ssc, skipReceiverLaunch = true) + receiverTracker.start() + if (enableCheckpoint) { + assert(receiverTracker.receivedBlockCheckpointerOption.isDefined) + } + + // Wait for the receiver to be start before doing anything with it + eventually(timeout(akkaTimeout), interval(10 milliseconds)) { + receiverTracker.getReceivedBlockInfo(0) should not be None + } + } + + def createBlockInfo(blockUniqueId: Long, streamId: Int): ReceivedBlockInfo = { + new ReceivedBlockInfo(streamId, + StreamBlockId(streamId, blockUniqueId), 0, null, None) + } + + def getWriteAheadLogFiles(): Seq[File] = { + getLogFilesInDirectory( + new File(ReceivedBlockInfoCheckpointer.checkpointDirToLogDir(checkpointDirectory.toString))) + } +} diff --git a/streaming/src/test/scala/org/apache/spark/streaming/storage/ReceivedBlockHandlerSuite.scala b/streaming/src/test/scala/org/apache/spark/streaming/storage/ReceivedBlockHandlerSuite.scala index 9c493210d2575..784d615cf499c 100644 --- a/streaming/src/test/scala/org/apache/spark/streaming/storage/ReceivedBlockHandlerSuite.scala +++ b/streaming/src/test/scala/org/apache/spark/streaming/storage/ReceivedBlockHandlerSuite.scala @@ -89,7 +89,7 @@ class ReceivedBlockHandlerSuite extends FunSuite with BeforeAndAfter with Matche blockManagerData.toList shouldEqual data.toList // Check whether the blocks written to the write ahead log are correct - val logFiles = getLogFiles() + val logFiles = getWriteAheadLogFiles() logFiles.size should be > 1 val logData = logFiles.flatMap { @@ -101,7 +101,7 @@ class ReceivedBlockHandlerSuite extends FunSuite with BeforeAndAfter with Matche test("WriteAheadLogBasedBlockHandler - clear old blocks") { createWriteAheadLogBasedBlockHandler() generateAndStoreData(receivedBlockHandler) - val preCleanupLogFiles = getLogFiles() + val preCleanupLogFiles = getWriteAheadLogFiles() preCleanupLogFiles.size should be > 1 // this depends on the number of blocks inserted using generateAndStoreData() @@ -110,7 +110,7 @@ class ReceivedBlockHandlerSuite extends FunSuite with BeforeAndAfter with Matche val cleanupThreshTime = 3000L receivedBlockHandler.clearOldBlocks(cleanupThreshTime) eventually(timeout(10000 millis), interval(10 millis)) { - getLogFiles().size should be < preCleanupLogFiles.size + getWriteAheadLogFiles().size should be < preCleanupLogFiles.size } } @@ -131,7 +131,7 @@ class ReceivedBlockHandlerSuite extends FunSuite with BeforeAndAfter with Matche (data, blockIds) } - def getLogFiles(): Seq[File] = { + def getWriteAheadLogFiles(): Seq[File] = { getLogFilesInDirectory( new File(checkpointDirToLogDir(tempDirectory.toString, streamId))) } diff --git 
a/streaming/src/test/scala/org/apache/spark/streaming/storage/WriteAheadLogSuite.scala b/streaming/src/test/scala/org/apache/spark/streaming/storage/WriteAheadLogSuite.scala index 1ba6e0e45bc16..88b2b5095ceb6 100644 --- a/streaming/src/test/scala/org/apache/spark/streaming/storage/WriteAheadLogSuite.scala +++ b/streaming/src/test/scala/org/apache/spark/streaming/storage/WriteAheadLogSuite.scala @@ -18,6 +18,7 @@ package org.apache.spark.streaming.storage import java.io.{DataInputStream, FileInputStream, File, RandomAccessFile} import java.nio.ByteBuffer + import scala.util.Random import scala.collection.mutable.ArrayBuffer @@ -144,7 +145,6 @@ class WriteAheadLogSuite extends FunSuite with BeforeAndAfter { val data = generateRandomData(10) val file = new File(tempDirectory, s"log-$i-${i + 1}") writeDataManually(data, file) - println(s"Generated log file $file") data }.flatten @@ -158,8 +158,6 @@ class WriteAheadLogSuite extends FunSuite with BeforeAndAfter { val dataToWrite = generateRandomData(100) writeDataUsingManager(tempDirectory, dataToWrite) val logFiles = getLogFilesInDirectory(tempDirectory) - println("==========\n" + logFiles.mkString("\n") + "\n==========\n" ) - assert(logFiles.size > 1) val readData = readDataUsingManager(tempDirectory) assert(dataToWrite.toList === readData.toList) @@ -204,7 +202,7 @@ object WriteAheadLogSuite { def writeDataUsingManager(logDirectory: File, data: Seq[String]) { val fakeClock = new ManualClock val manager = new WriteAheadLogManager(logDirectory.toString, hadoopConf, - rollingIntervalSecs = 1, clock = fakeClock) + rollingIntervalSecs = 1, callerName = "WriteAheadLogSuite", clock = fakeClock) data.foreach { item => fakeClock.addToTime(500) manager.writeToLog(item) @@ -218,7 +216,6 @@ object WriteAheadLogSuite { */ def readDataManually(file: File, segments: Seq[FileSegment]): Seq[String] = { val reader = new RandomAccessFile(file, "r") - println("File " + file + " has " + reader.length() + " bytes ") segments.map { x => reader.seek(x.offset) val data = new Array[Byte](x.length) @@ -245,7 +242,8 @@ object WriteAheadLogSuite { } def readDataUsingManager(logDirectory: File): Seq[String] = { - val manager = new WriteAheadLogManager(logDirectory.toString, hadoopConf) + val manager = new WriteAheadLogManager(logDirectory.toString, hadoopConf, + callerName = "WriteAheadLogSuite") val data = manager.readFromLog().map(byteBufferToString).toSeq manager.stop() data @@ -256,9 +254,12 @@ object WriteAheadLogSuite { } def getLogFilesInDirectory(directory: File): Seq[File] = { - println("[ " + directory.listFiles().filter(_.getName().startsWith("log-")).mkString(" | ") + " ]") - directory.listFiles().filter(_.getName().startsWith("log-")) - .sortBy(_.getName.split("-")(1).toLong) + if (directory.exists) { + directory.listFiles().filter(_.getName().startsWith("log-")) + .sortBy(_.getName.split("-")(1).toLong) + } else { + Seq.empty + } } def printData(data: Seq[String]) { From 9be5f227761bbcfaee37af5d5abc5a73a171104c Mon Sep 17 00:00:00 2001 From: Tathagata Das Date: Wed, 8 Oct 2014 18:07:04 -0700 Subject: [PATCH 06/10] Initial implementation of DriverFailureSuite unit test for testing with receivers + write ahead log. 
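This suite drives a StreamingContext on the real clock through repeated simulated driver failures, recovering from the checkpoint directory each time. A condensed sketch of that cycle follows; the object and helper names are illustrative, not taken from the patch.

import org.apache.spark.streaming.StreamingContext

// Let some batches run, stop the context to simulate a driver crash, then recover it
// purely from the checkpoint via StreamingContext.getOrCreate.
object DriverFailureSketch {
  def runWithSimulatedFailures(
      checkpointDir: String,
      rounds: Int,
      createContext: () => StreamingContext): Unit = {
    var ssc = StreamingContext.getOrCreate(checkpointDir, createContext)
    (1 to rounds).foreach { _ =>
      ssc.start()
      ssc.awaitTermination(5000)           // let a few batches complete
      ssc.stop(stopSparkContext = false)   // simulate the driver going down
      ssc = StreamingContext.getOrCreate(checkpointDir,
        () => sys.error("expected to recover from an existing checkpoint"))
    }
  }
}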
--- .../receiver/ReceiverSupervisorImpl.scala | 35 +- .../streaming/scheduler/ReceiverTracker.scala | 20 +- .../spark/streaming/DriverFailureSuite.scala | 348 ++++++++++++++++++ .../apache/spark/streaming/FailureSuite.scala | 56 --- 4 files changed, 383 insertions(+), 76 deletions(-) create mode 100644 streaming/src/test/scala/org/apache/spark/streaming/DriverFailureSuite.scala delete mode 100644 streaming/src/test/scala/org/apache/spark/streaming/FailureSuite.scala diff --git a/streaming/src/main/scala/org/apache/spark/streaming/receiver/ReceiverSupervisorImpl.scala b/streaming/src/main/scala/org/apache/spark/streaming/receiver/ReceiverSupervisorImpl.scala index 01d3e3f497500..97677491cd0b2 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/receiver/ReceiverSupervisorImpl.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/receiver/ReceiverSupervisorImpl.scala @@ -25,17 +25,13 @@ import scala.concurrent.Await import akka.actor.{Actor, Props} import akka.pattern.ask - import com.google.common.base.Throwables - -import org.apache.spark.{Logging, SparkEnv} -import org.apache.spark.streaming.scheduler._ -import org.apache.spark.util.{Utils, AkkaUtils} +import org.apache.hadoop.conf.Configuration +import org.apache.spark.{SparkException, Logging, SparkEnv} import org.apache.spark.storage.StreamBlockId -import org.apache.spark.streaming.scheduler.DeregisterReceiver -import org.apache.spark.streaming.scheduler.AddBlock -import org.apache.spark.streaming.scheduler.RegisterReceiver +import org.apache.spark.streaming.scheduler._ import org.apache.spark.streaming.storage._ +import org.apache.spark.util.{AkkaUtils, Utils} /** * Concrete implementation of [[org.apache.spark.streaming.receiver.ReceiverSupervisor]] @@ -45,11 +41,26 @@ import org.apache.spark.streaming.storage._ */ private[streaming] class ReceiverSupervisorImpl( receiver: Receiver[_], - env: SparkEnv + env: SparkEnv, + hadoopConf: Configuration, + checkpointDirOption: Option[String] ) extends ReceiverSupervisor(receiver, env.conf) with Logging { - private val receivedBlockHandler = - new BlockManagerBasedBlockHandler(env.blockManager, receiver.streamId, receiver.storageLevel) + private val receivedBlockHandler: ReceivedBlockHandler = { + if (env.conf.getBoolean("spark.streaming.receiver.writeAheadLog.enable", false)) { + if (checkpointDirOption.isEmpty) { + throw new SparkException( + "Cannot enable receiver write-ahead log without checkpoint directory set. " + + "Please use streamingContext.checkpoint() to set the checkpoint directory. 
" + + "See documentation for more details.") + } + new WriteAheadLogBasedBlockHandler(env.blockManager, receiver.streamId, + receiver.storageLevel, env.conf, hadoopConf, checkpointDirOption.get) + } else { + new BlockManagerBasedBlockHandler(env.blockManager, receiver.streamId, receiver.storageLevel) + } + } + /** Remote Akka actor for the ReceiverTracker */ private val trackerActor = { @@ -143,7 +154,7 @@ private[streaming] class ReceiverSupervisorImpl( val time = System.currentTimeMillis val fileSegmentOption = receivedBlockHandler.storeBlock(blockId, receivedBlock) match { - case f: FileSegment => Some(f) + case Some(f: FileSegment) => Some(f) case _ => None } logDebug("Pushed block " + blockId + " in " + (System.currentTimeMillis - time) + " ms") diff --git a/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceiverTracker.scala b/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceiverTracker.scala index 582df6889c24b..8c39aae1d601e 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceiverTracker.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceiverTracker.scala @@ -17,20 +17,22 @@ package org.apache.spark.streaming.scheduler +import java.nio.ByteBuffer + import scala.collection.mutable.{HashMap, SynchronizedMap, SynchronizedQueue} import scala.language.existentials import akka.actor._ import org.apache.hadoop.conf.Configuration -import org.apache.spark.{SparkConf, Logging, SparkEnv, SparkException} +import org.apache.hadoop.fs.Path +import org.apache.spark.{Logging, SparkConf, SparkEnv, SparkException} import org.apache.spark.SparkContext._ +import org.apache.spark.SerializableWritable import org.apache.spark.storage.StreamBlockId import org.apache.spark.streaming.{StreamingContext, Time} import org.apache.spark.streaming.receiver.{Receiver, ReceiverSupervisorImpl, StopReceiver} -import org.apache.spark.streaming.storage.{WriteAheadLogManager, FileSegment} +import org.apache.spark.streaming.storage.{FileSegment, WriteAheadLogManager} import org.apache.spark.util.Utils -import org.apache.hadoop.fs.Path -import java.nio.ByteBuffer /** Information about blocks received by the receiver */ private[streaming] case class ReceivedBlockInfo( @@ -323,6 +325,9 @@ class ReceiverTracker(ssc: StreamingContext, skipReceiverLaunch: Boolean = false ssc.sc.makeRDD(receivers, receivers.size) } + val checkpointDirOption = Option(ssc.checkpointDir) + val serializableHadoopConf = new SerializableWritable(ssc.sparkContext.hadoopConfiguration) + // Function to start the receiver on the worker node val startReceiver = (iterator: Iterator[Receiver[_]]) => { if (!iterator.hasNext) { @@ -330,11 +335,10 @@ class ReceiverTracker(ssc: StreamingContext, skipReceiverLaunch: Boolean = false "Could not start receiver as object not found.") } val receiver = iterator.next() - val supervisor = new ReceiverSupervisorImpl(receiver, SparkEnv.get) + val supervisor = new ReceiverSupervisorImpl( + receiver, SparkEnv.get, serializableHadoopConf.value, checkpointDirOption) supervisor.start() - logInfo("Supervisor started()") supervisor.awaitTermination() - logInfo("Supervisor terminated") } // Run the dummy Spark job to ensure that all slaves have registered. // This avoids all the receivers to be scheduled on the same node. 
@@ -344,7 +348,7 @@ class ReceiverTracker(ssc: StreamingContext, skipReceiverLaunch: Boolean = false // Distribute the receivers and start them logInfo("Starting " + receivers.length + " receivers") - ssc.sparkContext.runJob(tempRDD, startReceiver) + ssc.sparkContext.runJob(tempRDD, ssc.sparkContext.clean(startReceiver)) logInfo("All of the receivers have been terminated") } diff --git a/streaming/src/test/scala/org/apache/spark/streaming/DriverFailureSuite.scala b/streaming/src/test/scala/org/apache/spark/streaming/DriverFailureSuite.scala new file mode 100644 index 0000000000000..38fe35d283f34 --- /dev/null +++ b/streaming/src/test/scala/org/apache/spark/streaming/DriverFailureSuite.scala @@ -0,0 +1,348 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one or more + * contributor license agreements. See the NOTICE file distributed with + * this work for additional information regarding copyright ownership. + * The ASF licenses this file to You under the Apache License, Version 2.0 + * (the "License"); you may not use this file except in compliance with + * the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.spark.streaming + +import java.io.File +import java.util.UUID +import java.util.concurrent.atomic.AtomicInteger + +import scala.util.Random + +import org.apache.hadoop.conf.Configuration +import org.apache.hadoop.fs.Path +import org.apache.spark.{Logging, SparkConf} +import org.apache.spark.rdd.RDD +import org.apache.spark.storage.StorageLevel +import org.apache.spark.streaming.StreamingContext._ +import org.apache.spark.streaming.dstream.DStream +import org.apache.spark.streaming.receiver.Receiver +import org.apache.spark.streaming.scheduler.{StreamingListener, StreamingListenerBatchCompleted} +import org.apache.spark.util.Utils + +/** + * This testsuite tests master failures at random times while the stream is running using + * the real clock. 
+ */ +class DriverFailureSuite extends TestSuiteBase with Logging { + + var directory = "FailureSuite" + val numBatches = 30 + + override def batchDuration = Milliseconds(1000) + + override def useManualClock = false + + override def beforeFunction() { + super.beforeFunction() + Utils.deleteRecursively(new File(directory)) + } + + override def afterFunction() { + super.afterFunction() + Utils.deleteRecursively(new File(directory)) + } +/* + test("multiple failures with map") { + MasterFailureTest.testMap(directory, numBatches, batchDuration) + } + + test("multiple failures with updateStateByKey") { + MasterFailureTest.testUpdateStateByKey(directory, numBatches, batchDuration) + } +*/ + test("multiple failures with receiver and updateStateByKey") { + val operation = (st: DStream[String]) => { + val updateFunc = (values: Seq[Long], state: Option[Long]) => { + Some(values.foldLeft(0L)(_ + _) + state.getOrElse(0L)) + } + st.flatMap(_.split(" ")).map(x => (x, 1L)).updateStateByKey[Long](updateFunc) + .checkpoint(batchDuration * 5) + } + + val expectedOutput = + (1L to DriverFailureTestReceiver.maxRecordsPerBlock).map(x => (1L to x).sum).toSet + + val verify = (time: Time, output: Seq[(String, Long)]) => { + println(s"$time: ${output.mkString(", ")}") + if (!output.map { _._2 }.forall(expectedOutput.contains)) { + throw new Exception(s"Incorrect output: $output\nExpected output: $expectedOutput") + } + } + + val driverTest = new ReceiverBasedDriverFailureTest[(String, Long)]( + "./driver-test/", batchDuration.milliseconds.toInt, 120, operation, verify) + driverTest.testAndGetError().map(errorMessage => fail(errorMessage)) + } +} + + +abstract class DriverFailureTest( + testDirectory: String, + batchDurationMillis: Int, + numBatchesToRun: Int + ) extends Logging { + + @transient private val checkpointDir = createCheckpointDir() + @transient private val timeoutMillis = batchDurationMillis * numBatchesToRun * 2 + + @transient @volatile private var killed = false + @transient @volatile private var killCount = 0 + @transient @volatile private var lastBatchCompleted = 0L + @transient @volatile private var batchesCompleted = 0 + @transient @volatile private var ssc: StreamingContext = null + + protected def setupContext(checkpointDirector: String): StreamingContext + + //---------------------------------------- + + /** + * Run the test and return an option string containing error message. + * @return None is test succeeded, or Some(errorMessage) if test failed + */ + def testAndGetError(): Option[String] = { + ssc = setupContext(checkpointDir.toString) + run() + } + + private def run(): Option[String] = { + + val runStartTime = System.currentTimeMillis + + def allBatchesCompleted = batchesCompleted >= numBatchesToRun + def timedOut = (System.currentTimeMillis - runStartTime) > timeoutMillis + def failed = DriverFailureSuite.failed + + while(!failed && !allBatchesCompleted && !timedOut) { + // Start the thread to kill the streaming after some time + killed = false + val killingThread = new KillingThread(ssc, batchDurationMillis * 10) + killingThread.start() + try { + // Start the streaming computation and let it run while ... 
+ // (i) StreamingContext has not been shut down yet + // (ii) The last expected output has not been generated yet + // (iii) Its not timed out yet + System.clearProperty("spark.streaming.clock") + System.clearProperty("spark.driver.port") + ssc.addStreamingListener(new BatchCompletionListener) + ssc.start() + while (!failed && !killed && !allBatchesCompleted && !timedOut) { + ssc.awaitTermination(100) + } + } catch { + case e: Exception => + logError("Error running streaming context", e) + DriverFailureSuite.fail("Error running streaming context: " + e) + } + + logInfo(s"Failed = $failed") + logInfo(s"Killed = $killed") + logInfo(s"All batches completed = $allBatchesCompleted") + logInfo(s"Timed out = $timedOut") + + if (killingThread.isAlive) { + killingThread.interrupt() + ssc.stop() + } + + if (!timedOut) { + val sleepTime = Random.nextInt(batchDurationMillis * 10) + logInfo( + "\n-------------------------------------------\n" + + " Restarting stream computation in " + sleepTime + " ms " + + "\n-------------------------------------------\n" + ) + Thread.sleep(sleepTime) + // Recreate the streaming context from checkpoint + ssc = StreamingContext.getOrCreate(checkpointDir.toString, () => { + throw new Exception("Trying to create new context when it " + + "should be reading from checkpoint file") + }) + } + } + + if (failed) { + Some(s"Failed with message: ${DriverFailureSuite.failureMessage}") + } else if (timedOut) { + Some(s"Timed out after $batchesCompleted/$numBatchesToRun batches, and " + + s"${System.currentTimeMillis} ms (time out = $timeoutMillis ms") + } else if (allBatchesCompleted) { + None + } else { + throw new Exception("Unexpected end of test") + } + } + + private def createCheckpointDir(): Path = { + // Create the directories for this test + val uuid = UUID.randomUUID().toString + val rootDir = new Path(testDirectory, uuid) + val fs = rootDir.getFileSystem(new Configuration()) + val dir = new Path(rootDir, "checkpoint") + fs.mkdirs(dir) + dir + } + + class BatchCompletionListener extends StreamingListener { + override def onBatchCompleted(batchCompleted: StreamingListenerBatchCompleted) { + if (batchCompleted.batchInfo.batchTime.milliseconds > lastBatchCompleted) { + batchesCompleted += 1 + lastBatchCompleted = batchCompleted.batchInfo.batchTime.milliseconds + } + } + } + + class KillingThread(ssc: StreamingContext, maxKillWaitTime: Long) extends Thread with Logging { + override def run() { + try { + // If it is the first killing, then allow the first checkpoint to be created + var minKillWaitTime = if (killCount == 0) 5000 else 2000 + val killWaitTime = minKillWaitTime + math.abs(Random.nextLong % maxKillWaitTime) + logInfo("Kill wait time = " + killWaitTime) + Thread.sleep(killWaitTime) + logInfo( + "\n---------------------------------------\n" + + "Killing streaming context after " + killWaitTime + " ms" + + "\n---------------------------------------\n" + ) + if (ssc != null) { + ssc.stop() + killed = true + killCount += 1 + } + logInfo("Killing thread finished normally") + } catch { + case ie: InterruptedException => logInfo("Killing thread interrupted") + case e: Exception => logWarning("Exception in killing thread", e) + } + + } + } +} + +object DriverFailureSuite { + @transient @volatile var failed = false + @transient @volatile var failureMessage = "NOT SET" + + def fail(message: String) { + failureMessage = message + } +} + +class ReceiverBasedDriverFailureTest[T]( + @transient testDirectory: String, + @transient batchDurationMillis: Int, + @transient 
numBatchesToRun: Int, + @transient operation: DStream[String] => DStream[T], + outputVerifyingFunction: (Time, Seq[T]) => Unit + ) extends DriverFailureTest( + testDirectory, batchDurationMillis, numBatchesToRun + ) { + + @transient val conf = new SparkConf() + conf.setMaster("local[4]") + .setAppName("ReceiverBasedDriverFailureTest") + .set("spark.streaming.receiver.writeAheadLog.enable", "true") + + override def setupContext(checkpointDirector: String): StreamingContext = { + + val context = StreamingContext.getOrCreate(checkpointDirector, () => { + val newSsc = new StreamingContext(conf, Milliseconds(batchDurationMillis)) + val inputStream = newSsc.receiverStream[String](new DriverFailureTestReceiver) + val operatedStream = operation(inputStream) + + val verify = outputVerifyingFunction + operatedStream.foreachRDD((rdd: RDD[T], time: Time) => { + val collected = rdd.collect() + try { + verify(time, collected) + } catch { + case e: Exception => + DriverFailureSuite.fail(e.toString) + } + }) + newSsc.checkpoint(checkpointDirector) + newSsc + }) + context + } +} + + + +class DriverFailureTestReceiver extends Receiver[String](StorageLevel.MEMORY_ONLY_SER) with Logging { + + import DriverFailureTestReceiver._ + @volatile var thread: Thread = null + + class ReceivingThread extends Thread() { + override def run() { + while (!isStopped() && !isInterrupted()) { + val block = getNextBlock() + store(block) + commitBlock() + try { + Thread.sleep(100) + } catch { + case ie: InterruptedException => + case e: Exception => + DriverFailureTestReceiver.this.stop("Error in receiving thread", e) + } + } + } + } + + def onStart() { + if (thread == null) { + thread = new ReceivingThread() + thread.start() + } else { + logError("Error starting receiver, previous receiver thread not stopped yet.") + } + } + + def onStop() { + if (thread != null) { + thread.interrupt() + thread = null + } + } +} + +object DriverFailureTestReceiver { + val maxRecordsPerBlock = 1000L + private val currentKey = new AtomicInteger() + private val counter = new AtomicInteger() + + counter.set(1) + currentKey.set(1) + + def getNextBlock(): Iterator[String] = { + val count = counter.get() + (1 to count).map { _ => "word" + currentKey.get() }.iterator + } + + def commitBlock() { + if (counter.incrementAndGet() > maxRecordsPerBlock) { + currentKey.incrementAndGet() + counter.set(1) + println("Stored " + counter.get()) + } + } +} + diff --git a/streaming/src/test/scala/org/apache/spark/streaming/FailureSuite.scala b/streaming/src/test/scala/org/apache/spark/streaming/FailureSuite.scala deleted file mode 100644 index 40434b1f9b709..0000000000000 --- a/streaming/src/test/scala/org/apache/spark/streaming/FailureSuite.scala +++ /dev/null @@ -1,56 +0,0 @@ -/* - * Licensed to the Apache Software Foundation (ASF) under one or more - * contributor license agreements. See the NOTICE file distributed with - * this work for additional information regarding copyright ownership. - * The ASF licenses this file to You under the Apache License, Version 2.0 - * (the "License"); you may not use this file except in compliance with - * the License. You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 
- * See the License for the specific language governing permissions and - * limitations under the License. - */ - -package org.apache.spark.streaming - -import org.apache.spark.Logging -import org.apache.spark.util.Utils - -import java.io.File - -/** - * This testsuite tests master failures at random times while the stream is running using - * the real clock. - */ -class FailureSuite extends TestSuiteBase with Logging { - - var directory = "FailureSuite" - val numBatches = 30 - - override def batchDuration = Milliseconds(1000) - - override def useManualClock = false - - override def beforeFunction() { - super.beforeFunction() - Utils.deleteRecursively(new File(directory)) - } - - override def afterFunction() { - super.afterFunction() - Utils.deleteRecursively(new File(directory)) - } - - test("multiple failures with map") { - MasterFailureTest.testMap(directory, numBatches, batchDuration) - } - - test("multiple failures with updateStateByKey") { - MasterFailureTest.testUpdateStateByKey(directory, numBatches, batchDuration) - } -} - From 09cda57739fd63a2cc1405a0932709d6bd7adfe4 Mon Sep 17 00:00:00 2001 From: Tathagata Das Date: Wed, 8 Oct 2014 18:41:02 -0700 Subject: [PATCH 07/10] Updated receiver input stream to use HDFSBackedBlockRDD. --- .../dstream/ReceiverInputDStream.scala | 16 +++++++--- .../storage/rdd/HDFSBackedBlockRDD.scala | 1 + .../spark/streaming/DriverFailureSuite.scala | 29 +++++++++++++------ 3 files changed, 33 insertions(+), 13 deletions(-) diff --git a/streaming/src/main/scala/org/apache/spark/streaming/dstream/ReceiverInputDStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/dstream/ReceiverInputDStream.scala index e53af30836a0a..eadd7f33d2096 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/dstream/ReceiverInputDStream.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/dstream/ReceiverInputDStream.scala @@ -21,10 +21,11 @@ import scala.collection.mutable.HashMap import scala.reflect.ClassTag import org.apache.spark.rdd.{BlockRDD, RDD} -import org.apache.spark.storage.BlockId +import org.apache.spark.storage.{StorageLevel, BlockId} import org.apache.spark.streaming._ import org.apache.spark.streaming.receiver.Receiver import org.apache.spark.streaming.scheduler.ReceivedBlockInfo +import org.apache.spark.streaming.storage.rdd.HDFSBackedBlockRDD /** * Abstract class for defining any [[org.apache.spark.streaming.dstream.InputDStream]] @@ -63,14 +64,21 @@ abstract class ReceiverInputDStream[T: ClassTag](@transient ssc_ : StreamingCont // If this is called for any time before the start time of the context, // then this returns an empty RDD. This may happen when recovering from a // master failure - if (validTime >= graph.startTime) { + val blockRDD = if (validTime >= graph.startTime) { val blockInfo = ssc.scheduler.receiverTracker.getReceivedBlockInfo(id) receivedBlockInfo(validTime) = blockInfo val blockIds = blockInfo.map(_.blockId.asInstanceOf[BlockId]) - Some(new BlockRDD[T](ssc.sc, blockIds)) + val fileSegments = blockInfo.flatMap(_.fileSegmentOption) + if (fileSegments.nonEmpty) { + new HDFSBackedBlockRDD[T](ssc.sparkContext, ssc.sparkContext.hadoopConfiguration, + blockIds, fileSegments, storeInBlockManager = false, StorageLevel.MEMORY_ONLY_SER) + } else { + new BlockRDD[T](ssc.sc, blockIds) + } } else { - Some(new BlockRDD[T](ssc.sc, Array[BlockId]())) + new BlockRDD[T](ssc.sc, Array[BlockId]()) } + Some(blockRDD) } /** Get information on received blocks. 
*/ diff --git a/streaming/src/main/scala/org/apache/spark/streaming/storage/rdd/HDFSBackedBlockRDD.scala b/streaming/src/main/scala/org/apache/spark/streaming/storage/rdd/HDFSBackedBlockRDD.scala index c672574ee2ed4..25f8363454394 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/storage/rdd/HDFSBackedBlockRDD.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/storage/rdd/HDFSBackedBlockRDD.scala @@ -68,6 +68,7 @@ class HDFSBackedBlockRDD[T: ClassTag]( block.data.asInstanceOf[Iterator[T]] // Data not found in Block Manager, grab it from HDFS case None => + logInfo("Reading partition data from write ahead log " + partition.segment.path) val reader = new WriteAheadLogRandomReader(partition.segment.path, hadoopConf) val dataRead = reader.read(partition.segment) reader.close() diff --git a/streaming/src/test/scala/org/apache/spark/streaming/DriverFailureSuite.scala b/streaming/src/test/scala/org/apache/spark/streaming/DriverFailureSuite.scala index 38fe35d283f34..98890f3b41143 100644 --- a/streaming/src/test/scala/org/apache/spark/streaming/DriverFailureSuite.scala +++ b/streaming/src/test/scala/org/apache/spark/streaming/DriverFailureSuite.scala @@ -115,6 +115,7 @@ abstract class DriverFailureTest( * @return None is test succeeded, or Some(errorMessage) if test failed */ def testAndGetError(): Option[String] = { + DriverFailureTest.reset() ssc = setupContext(checkpointDir.toString) run() } @@ -125,7 +126,7 @@ abstract class DriverFailureTest( def allBatchesCompleted = batchesCompleted >= numBatchesToRun def timedOut = (System.currentTimeMillis - runStartTime) > timeoutMillis - def failed = DriverFailureSuite.failed + def failed = DriverFailureTest.failed while(!failed && !allBatchesCompleted && !timedOut) { // Start the thread to kill the streaming after some time @@ -147,7 +148,7 @@ abstract class DriverFailureTest( } catch { case e: Exception => logError("Error running streaming context", e) - DriverFailureSuite.fail("Error running streaming context: " + e) + DriverFailureTest.fail("Error running streaming context: " + e) } logInfo(s"Failed = $failed") @@ -173,11 +174,12 @@ abstract class DriverFailureTest( throw new Exception("Trying to create new context when it " + "should be reading from checkpoint file") }) + println("Restarting") } } if (failed) { - Some(s"Failed with message: ${DriverFailureSuite.failureMessage}") + Some(s"Failed with message: ${DriverFailureTest.failureMessage}") } else if (timedOut) { Some(s"Timed out after $batchesCompleted/$numBatchesToRun batches, and " + s"${System.currentTimeMillis} ms (time out = $timeoutMillis ms") @@ -224,6 +226,7 @@ abstract class DriverFailureTest( ssc.stop() killed = true killCount += 1 + println("Killed") } logInfo("Killing thread finished normally") } catch { @@ -235,13 +238,19 @@ abstract class DriverFailureTest( } } -object DriverFailureSuite { - @transient @volatile var failed = false - @transient @volatile var failureMessage = "NOT SET" +object DriverFailureTest { + @transient @volatile var failed: Boolean = _ + @transient @volatile var failureMessage: String = _ def fail(message: String) { + failed = true failureMessage = message } + + def reset() { + failed = false + failureMessage = "NOT SET" + } } class ReceiverBasedDriverFailureTest[T]( @@ -268,12 +277,14 @@ class ReceiverBasedDriverFailureTest[T]( val verify = outputVerifyingFunction operatedStream.foreachRDD((rdd: RDD[T], time: Time) => { - val collected = rdd.collect() try { + val collected = rdd.collect() verify(time, collected) } catch { + case 
ie: InterruptedException => + // ignore case e: Exception => - DriverFailureSuite.fail(e.toString) + DriverFailureTest.fail(e.toString) } }) newSsc.checkpoint(checkpointDirector) @@ -338,10 +349,10 @@ object DriverFailureTestReceiver { } def commitBlock() { + println(s"Stored ${counter.get()} copies of word${currentKey.get}") if (counter.incrementAndGet() > maxRecordsPerBlock) { currentKey.incrementAndGet() counter.set(1) - println("Stored " + counter.get()) } } } From e390c718796767ba1a7c263a7e1149f27473f25e Mon Sep 17 00:00:00 2001 From: Tathagata Das Date: Wed, 8 Oct 2014 20:58:22 -0700 Subject: [PATCH 08/10] Made WriteAheadLogWriter use local fileoutputstream for local file system. --- .../storage/WriteAheadLogWriter.scala | 55 +++++++++++++------ .../spark/streaming/DriverFailureSuite.scala | 2 +- 2 files changed, 39 insertions(+), 18 deletions(-) diff --git a/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogWriter.scala b/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogWriter.scala index 8a2db8305a7e2..f292bd0f045a9 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogWriter.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogWriter.scala @@ -16,20 +16,36 @@ */ package org.apache.spark.streaming.storage -import java.io.Closeable -import java.lang.reflect.Method +import java.io.{BufferedOutputStream, Closeable, DataOutputStream, FileOutputStream} +import java.net.URI import java.nio.ByteBuffer import scala.util.Try import org.apache.hadoop.conf.Configuration -import org.apache.hadoop.fs.FSDataOutputStream +import org.apache.hadoop.fs.{FSDataOutputStream, FileSystem} private[streaming] class WriteAheadLogWriter(path: String, conf: Configuration) extends Closeable { - private val stream = HdfsUtils.getOutputStream(path, conf) - private var nextOffset = stream.getPos + private val underlyingStream: Either[DataOutputStream, FSDataOutputStream] = { + val uri = new URI(path) + val defaultFs = FileSystem.getDefaultUri(conf).getScheme + val isDefaultLocal = defaultFs == null || defaultFs == "file" + + if ((isDefaultLocal && uri.getScheme == null) || uri.getScheme == "file") { + Left(new DataOutputStream(new BufferedOutputStream(new FileOutputStream(uri.getPath)))) + } else { + Right(HdfsUtils.getOutputStream(path, conf)) + } + } + + private lazy val hadoopFlushMethod = { + val cls = classOf[FSDataOutputStream] + Try(cls.getMethod("hflush")).orElse(Try(cls.getMethod("sync"))).toOption + } + + private var nextOffset = getPosition() private var closed = false - private val hflushMethod = getHflushOrSync() + // Data is always written as: // - Length - Long @@ -48,8 +64,8 @@ private[streaming] class WriteAheadLogWriter(path: String, conf: Configuration) stream.write(data.get()) } } - hflushOrSync() - nextOffset = stream.getPos + flush() + nextOffset = getPosition() segment } @@ -58,17 +74,22 @@ private[streaming] class WriteAheadLogWriter(path: String, conf: Configuration) stream.close() } - private def hflushOrSync() { - hflushMethod.foreach(_.invoke(stream)) + private def stream(): DataOutputStream = { + underlyingStream.fold(x => x, x => x) + } + + private def getPosition(): Long = { + underlyingStream match { + case Left(localStream) => localStream.size + case Right(dfsStream) => dfsStream.getPos() + } } - private def getHflushOrSync(): Option[Method] = { - Try { - Some(classOf[FSDataOutputStream].getMethod("hflush")) - }.recover { - case e: NoSuchMethodException => - 
Some(classOf[FSDataOutputStream].getMethod("sync")) - }.getOrElse(None) + private def flush() { + underlyingStream match { + case Left(localStream) => localStream.flush + case Right(dfsStream) => hadoopFlushMethod.foreach { _.invoke(dfsStream) } + } } private def assertOpen() { diff --git a/streaming/src/test/scala/org/apache/spark/streaming/DriverFailureSuite.scala b/streaming/src/test/scala/org/apache/spark/streaming/DriverFailureSuite.scala index 98890f3b41143..664506f60f706 100644 --- a/streaming/src/test/scala/org/apache/spark/streaming/DriverFailureSuite.scala +++ b/streaming/src/test/scala/org/apache/spark/streaming/DriverFailureSuite.scala @@ -78,7 +78,7 @@ class DriverFailureSuite extends TestSuiteBase with Logging { (1L to DriverFailureTestReceiver.maxRecordsPerBlock).map(x => (1L to x).sum).toSet val verify = (time: Time, output: Seq[(String, Long)]) => { - println(s"$time: ${output.mkString(", ")}") + println(s"Count at $time: ${output.mkString(", ")}") if (!output.map { _._2 }.forall(expectedOutput.contains)) { throw new Exception(s"Incorrect output: $output\nExpected output: $expectedOutput") } From 6b612870cc1922445e5f7f84563c8541e12d5dea Mon Sep 17 00:00:00 2001 From: Tathagata Das Date: Mon, 20 Oct 2014 17:55:41 -0700 Subject: [PATCH 09/10] Added ReceivedBlockTracker to track all block metadata related actions. Updated ReceivedBlockTrackerSuite, and DriverFailureSuite. --- .../dstream/ReceiverInputDStream.scala | 47 +--- .../streaming/scheduler/JobGenerator.scala | 4 +- .../scheduler/ReceivedBlockTracker.scala | 172 ++++++++++++++ .../streaming/scheduler/ReceiverTracker.scala | 101 ++------- .../storage/ReceivedBlockHandler.scala | 8 +- .../storage/WriteAheadLogManager.scala | 34 +-- .../storage/WriteAheadLogWriter.scala | 4 +- .../spark/streaming/DriverFailureSuite.scala | 137 ++++++++---- .../streaming/ReceivedBlockTrackerSuite.scala | 210 ++++++++++++++++++ .../streaming/ReceiverTrackerSuite.scala | 133 ----------- 10 files changed, 534 insertions(+), 316 deletions(-) create mode 100644 streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceivedBlockTracker.scala create mode 100644 streaming/src/test/scala/org/apache/spark/streaming/ReceivedBlockTrackerSuite.scala delete mode 100644 streaming/src/test/scala/org/apache/spark/streaming/ReceiverTrackerSuite.scala diff --git a/streaming/src/main/scala/org/apache/spark/streaming/dstream/ReceiverInputDStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/dstream/ReceiverInputDStream.scala index eadd7f33d2096..f1645066cc815 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/dstream/ReceiverInputDStream.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/dstream/ReceiverInputDStream.scala @@ -40,10 +40,6 @@ import org.apache.spark.streaming.storage.rdd.HDFSBackedBlockRDD abstract class ReceiverInputDStream[T: ClassTag](@transient ssc_ : StreamingContext) extends InputDStream[T](ssc_) { - /** Keeps all received blocks information */ - private[streaming] lazy val receivedBlockInfo = new HashMap[Time, Array[ReceivedBlockInfo]] - private[streaming] override val checkpointData = new ReceiverInputDStreamCheckpointData(this) - /** This is an unique identifier for the network input stream. */ val id = ssc.getNewReceiverStreamId() @@ -65,10 +61,11 @@ abstract class ReceiverInputDStream[T: ClassTag](@transient ssc_ : StreamingCont // then this returns an empty RDD. 
This may happen when recovering from a // master failure val blockRDD = if (validTime >= graph.startTime) { - val blockInfo = ssc.scheduler.receiverTracker.getReceivedBlockInfo(id) - receivedBlockInfo(validTime) = blockInfo - val blockIds = blockInfo.map(_.blockId.asInstanceOf[BlockId]) - val fileSegments = blockInfo.flatMap(_.fileSegmentOption) + val blockInfo = getReceivedBlockInfo(validTime) + val blockIds = blockInfo.map(_.blockId).map { _.asInstanceOf[BlockId] } toArray + val fileSegments = blockInfo.flatMap(_.fileSegmentOption).toArray + logInfo("Stream " + id + ": allocated " + blockInfo.map(_.blockId).mkString(", ")) + if (fileSegments.nonEmpty) { new HDFSBackedBlockRDD[T](ssc.sparkContext, ssc.sparkContext.hadoopConfiguration, blockIds, fileSegments, storeInBlockManager = false, StorageLevel.MEMORY_ONLY_SER) @@ -82,8 +79,8 @@ abstract class ReceiverInputDStream[T: ClassTag](@transient ssc_ : StreamingCont } /** Get information on received blocks. */ - private[streaming] def getReceivedBlockInfo(time: Time) = { - receivedBlockInfo.get(time).getOrElse(Array.empty[ReceivedBlockInfo]) + private[streaming] def getReceivedBlockInfo(time: Time): Seq[ReceivedBlockInfo] = { + ssc.scheduler.receiverTracker.getReceivedBlocks(time, id) } /** @@ -94,32 +91,6 @@ abstract class ReceiverInputDStream[T: ClassTag](@transient ssc_ : StreamingCont */ private[streaming] override def clearMetadata(time: Time) { super.clearMetadata(time) - val oldReceivedBlocks = receivedBlockInfo.filter(_._1 <= (time - rememberDuration)) - receivedBlockInfo --= oldReceivedBlocks.keys - logDebug("Cleared " + oldReceivedBlocks.size + " RDDs that were older than " + - (time - rememberDuration) + ": " + oldReceivedBlocks.keys.mkString(", ")) + ssc.scheduler.receiverTracker.cleanupOldInfo(time - rememberDuration) } -} - -private[streaming] class ReceiverInputDStreamCheckpointData[T: ClassTag]( - dstream: ReceiverInputDStream[T]) extends DStreamCheckpointData[T](dstream) { - - private var timeToReceivedBlockInfo: Seq[(Time, Array[ReceivedBlockInfo])] = _ - - override def update(time: Time) { - timeToReceivedBlockInfo = dstream.receivedBlockInfo.toSeq - } - - override def cleanup(time: Time) { - // not required, as block info copied in whole every time update is called - } - - override def restore() { - Option(timeToReceivedBlockInfo).foreach { blockInfo => - dstream.receivedBlockInfo.clear() - dstream.receivedBlockInfo ++= blockInfo - } - } -} - - +} \ No newline at end of file diff --git a/streaming/src/main/scala/org/apache/spark/streaming/scheduler/JobGenerator.scala b/streaming/src/main/scala/org/apache/spark/streaming/scheduler/JobGenerator.scala index 374848358e700..ee00abdf3f4f0 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/scheduler/JobGenerator.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/scheduler/JobGenerator.scala @@ -222,10 +222,10 @@ class JobGenerator(jobScheduler: JobScheduler) extends Logging { case Success(jobs) => val receivedBlockInfo = graph.getReceiverInputStreams.map { stream => val streamId = stream.id - val receivedBlockInfo = stream.getReceivedBlockInfo(time) + val receivedBlockInfo = stream.getReceivedBlockInfo(time).toArray (streamId, receivedBlockInfo) }.toMap - jobScheduler.submitJobSet(JobSet(time, jobs, receivedBlockInfo)) + jobScheduler.submitJobSet(JobSet(time, jobs, receivedBlockInfo.toMap)) case Failure(e) => jobScheduler.reportError("Error generating jobs for time " + time, e) } diff --git 
a/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceivedBlockTracker.scala b/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceivedBlockTracker.scala new file mode 100644 index 0000000000000..25c0980d7462e --- /dev/null +++ b/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceivedBlockTracker.scala @@ -0,0 +1,172 @@ +package org.apache.spark.streaming.scheduler + +import java.nio.ByteBuffer + +import scala.collection.mutable +import scala.language.implicitConversions + +import org.apache.hadoop.conf.Configuration +import org.apache.hadoop.fs.Path +import org.apache.spark.{Logging, SparkConf} +import org.apache.spark.streaming.Time +import org.apache.spark.streaming.storage.WriteAheadLogManager +import org.apache.spark.util.Utils +import org.apache.spark.storage.StreamBlockId +import org.apache.spark.streaming.util.Clock + +private[streaming] sealed trait ReceivedBlockTrackerRecord + +private[streaming] case class BlockAddition(receivedBlockInfo: ReceivedBlockInfo) + extends ReceivedBlockTrackerRecord +private[streaming] case class BatchAllocations(time: Time, allocatedBlocks: AllocatedBlocks) + extends ReceivedBlockTrackerRecord +private[streaming] case class BatchCleanup(times: Seq[Time]) + extends ReceivedBlockTrackerRecord + +case class AllocatedBlocks(streamIdToAllocatedBlocks: Map[Int, Seq[ReceivedBlockInfo]]) { + def apply(streamId: Int) = streamIdToAllocatedBlocks(streamId) +} + +private[streaming] +class ReceivedBlockTracker( + conf: SparkConf, hadoopConf: Configuration, streamIds: Seq[Int], clock: Clock, + checkpointDirOption: Option[String]) extends Logging { + + private type ReceivedBlockQueue = mutable.Queue[ReceivedBlockInfo] + + private val streamIdToUnallocatedBlockInfo = new mutable.HashMap[Int, ReceivedBlockQueue] + private val timeToAllocatedBlockInfo = new mutable.HashMap[Time, AllocatedBlocks] + + private val logManagerRollingIntervalSecs = conf.getInt( + "spark.streaming.receivedBlockTracker.writeAheadLog.rotationIntervalSecs", 60) + private val logManagerOption = checkpointDirOption.map { checkpointDir => + new WriteAheadLogManager( + ReceivedBlockTracker.checkpointDirToLogDir(checkpointDir), + hadoopConf, + rollingIntervalSecs = logManagerRollingIntervalSecs, + callerName = "ReceivedBlockHandlerMaster", + clock = clock + ) + } + + // Recover block information from write ahead logs + recoverFromWriteAheadLogs() + + /** Add received block */ + def addBlock(receivedBlockInfo: ReceivedBlockInfo): Boolean = synchronized { + try { + writeToLog(BlockAddition(receivedBlockInfo)) + getReceivedBlockQueue(receivedBlockInfo.streamId) += receivedBlockInfo + logDebug(s"Stream ${receivedBlockInfo.streamId} received block ${receivedBlockInfo.blockId}") + true + } catch { + case e: Exception => + logError("Error adding block " + receivedBlockInfo, e) + false + } + } + + /** Get blocks that have been added but not yet allocated to any batch */ + def getUnallocatedBlocks(streamId: Int): Seq[ReceivedBlockInfo] = synchronized { + getReceivedBlockQueue(streamId).toSeq + } + + /** Get the blocks allocated to a batch, or allocate blocks to the batch and then get them */ + def getOrAllocateBlocksToBatch(batchTime: Time, streamId: Int): Seq[ReceivedBlockInfo] = { + synchronized { + if (!timeToAllocatedBlockInfo.contains(batchTime)) { + allocateAllUnallocatedBlocksToBatch(batchTime) + } + timeToAllocatedBlockInfo(batchTime)(streamId) + } + } + + /** Check if any blocks are left to be allocated to batches */ + def hasUnallocatedReceivedBlocks(): 
Boolean = synchronized { + !streamIdToUnallocatedBlockInfo.values.forall(_.isEmpty) + } + + /** Clean up block information of old batches */ + def cleanupOldBatches(cleanupThreshTime: Time): Unit = synchronized { + assert(cleanupThreshTime.milliseconds < clock.currentTime()) + val timesToCleanup = timeToAllocatedBlockInfo.keys.filter { _ < cleanupThreshTime }.toSeq + logInfo("Deleting batches " + timesToCleanup) + writeToLog(BatchCleanup(timesToCleanup)) + timeToAllocatedBlockInfo --= timesToCleanup + logManagerOption.foreach(_.cleanupOldLogs(cleanupThreshTime.milliseconds)) + log + } + + /** Stop the block tracker */ + def stop() { + logManagerOption.foreach { _.stop() } + } + + /** Allocate all unallocated blocks to the given batch */ + private def allocateAllUnallocatedBlocksToBatch(batchTime: Time): AllocatedBlocks = synchronized { + val allocatedBlockInfos = AllocatedBlocks(streamIds.map { streamId => + (streamId, getReceivedBlockQueue(streamId).dequeueAll(x => true)) + }.toMap) + writeToLog(BatchAllocations(batchTime, allocatedBlockInfos)) + timeToAllocatedBlockInfo(batchTime) = allocatedBlockInfos + allocatedBlockInfos + } + + private def getReceivedBlockQueue(streamId: Int): ReceivedBlockQueue = { + streamIdToUnallocatedBlockInfo.getOrElseUpdate(streamId, new ReceivedBlockQueue) + } + + /** Write an update to the tracker to the write ahead log */ + private def writeToLog(record: ReceivedBlockTrackerRecord) { + logDebug("Writing to log " + record) + logManagerOption.foreach { logManager => + logManager.writeToLog(ByteBuffer.wrap(Utils.serialize(record))) + } + } + + private def recoverFromWriteAheadLogs(): Unit = synchronized { + logInfo("Recovering from checkpoint") + val blockIdToblockInfo = new mutable.HashMap[StreamBlockId, ReceivedBlockInfo] + + def insertAddedBlock(receivedBlockInfo: ReceivedBlockInfo) { + logTrace(s"Recovery: Inserting added block $receivedBlockInfo") + println(s"Recovery: Inserting added block $receivedBlockInfo") + blockIdToblockInfo.put(receivedBlockInfo.blockId, receivedBlockInfo) + getReceivedBlockQueue(receivedBlockInfo.streamId) += receivedBlockInfo + } + + def insertAllocatedBatch(time: Time, allocatedBlocks: AllocatedBlocks) { + logTrace(s"Recovery: Inserting allocated batch for time $time to ${allocatedBlocks.streamIdToAllocatedBlocks}") + println(s"Recovery: Inserting allocated batch for time $time to ${allocatedBlocks.streamIdToAllocatedBlocks}") + streamIdToUnallocatedBlockInfo.values.foreach { _.clear() } + timeToAllocatedBlockInfo.put(time, allocatedBlocks) + } + + def cleanupBatches(batchTimes: Seq[Time]) { + logTrace(s"Recovery: Cleaning up batches ${batchTimes}") + println(s"Recovery: Cleaning up batches ${batchTimes}") + timeToAllocatedBlockInfo --= batchTimes + } + + logManagerOption.foreach { logManager => + logManager.readFromLog().foreach { byteBuffer => + logTrace("Recovering record " + byteBuffer) + Utils.deserialize[ReceivedBlockTrackerRecord](byteBuffer.array) match { + case BlockAddition(receivedBlockInfo) => + insertAddedBlock(receivedBlockInfo) + case BatchAllocations(time, allocatedBlocks) => + insertAllocatedBatch(time, allocatedBlocks) + case BatchCleanup(batchTimes) => + cleanupBatches(batchTimes) + } + } + } + blockIdToblockInfo.clear() + } +} + +private[streaming] object ReceivedBlockTracker { + def checkpointDirToLogDir(checkpointDir: String): String = { + new Path(checkpointDir, "receivedBlockMetadata").toString + } +} diff --git a/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceiverTracker.scala 
b/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceiverTracker.scala index 8c39aae1d601e..0eabffa66a9cb 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceiverTracker.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceiverTracker.scala @@ -60,45 +60,6 @@ private[streaming] case class ReportError(streamId: Int, message: String, error: private[streaming] case class DeregisterReceiver(streamId: Int, msg: String, error: String) extends ReceiverTrackerMessage - -/** - * - */ -private[streaming] class ReceivedBlockInfoCheckpointer( - checkpointDirectory: String, conf: SparkConf, hadoopConf: Configuration) { - - import ReceivedBlockInfoCheckpointer._ - - private val logDirectory = checkpointDirToLogDir(checkpointDirectory) - private val logManager = new WriteAheadLogManager( - logDirectory, hadoopConf, callerName = "ReceiverTracker") - - def recover(): Seq[ReceivedBlockInfo] = { - logManager.readFromLog().map { byteBuffer => - Utils.deserialize[ReceivedBlockInfo](byteBuffer.array) - }.toSeq - } - - def write(receivedBlockInfo: ReceivedBlockInfo) { - val bytes = Utils.serialize(receivedBlockInfo) - logManager.writeToLog(ByteBuffer.wrap(bytes)) - } - - def clear(threshTime: Long) { - logManager.clearOldLogs(threshTime) - } - - def stop() { - logManager.stop() - } -} - -private[streaming] object ReceivedBlockInfoCheckpointer { - def checkpointDirToLogDir(checkpointDir: String): String = { - new Path(checkpointDir, "receivedBlockMetadata").toString - } -} - /** * This class manages the execution of the receivers of NetworkInputDStreams. Instance of * this class must be created after all input streams have been added and StreamingContext.start() @@ -113,26 +74,18 @@ class ReceiverTracker(ssc: StreamingContext, skipReceiverLaunch: Boolean = false private val receiverInputStreamMap = Map(receiverInputStreams.map(x => (x.id, x)): _*) private val receiverExecutor = new ReceiverLauncher() private val receiverInfo = new HashMap[Int, ReceiverInfo] with SynchronizedMap[Int, ReceiverInfo] - private val receivedBlockInfo = new HashMap[Int, SynchronizedQueue[ReceivedBlockInfo]] - with SynchronizedMap[Int, SynchronizedQueue[ReceivedBlockInfo]] + private val receivedBlockTracker = new ReceivedBlockTracker( + ssc.sparkContext.conf, + ssc.sparkContext.hadoopConfiguration, + receiverInputStreams.map { _.id }, + ssc.scheduler.clock, + Option(ssc.checkpointDir) + ) private val listenerBus = ssc.scheduler.listenerBus - val receivedBlockCheckpointerOption = Option(ssc.checkpointDir) map { dir => - new ReceivedBlockInfoCheckpointer(dir, ssc.sparkContext.conf, - ssc.sparkContext.hadoopConfiguration) - } // actor is created when generator starts. // This not being null means the tracker has been started and not stopped - var actor: ActorRef = null - var currentTime: Time = null - - receivedBlockCheckpointerOption.foreach { checkpointer => - val recoveredBlockInfo = checkpointer.recover() - recoveredBlockInfo.foreach { info => - getReceivedBlockInfoQueue(info.streamId) += info - } - logInfo(s"Recovered info on ${recoveredBlockInfo.size} blocks from write ahead log") - } + private var actor: ActorRef = null /** Start the actor and receiver execution thread. 
*/ def start() = synchronized { @@ -157,29 +110,22 @@ class ReceiverTracker(ssc: StreamingContext, skipReceiverLaunch: Boolean = false // Finally, stop the actor ssc.env.actorSystem.stop(actor) actor = null - - receivedBlockCheckpointerOption.foreach { _.stop() } + receivedBlockTracker.stop() logInfo("ReceiverTracker stopped") } } /** Return all the blocks received from a receiver. */ - def getReceivedBlockInfo(streamId: Int): Array[ReceivedBlockInfo] = { - val receivedBlockInfo = getReceivedBlockInfoQueue(streamId).dequeueAll(x => true) - logInfo("Stream " + streamId + " received " + receivedBlockInfo.size + " blocks") - receivedBlockInfo.toArray + def getReceivedBlocks(batchTime: Time, streamId: Int): Seq[ReceivedBlockInfo] = { + receivedBlockTracker.getOrAllocateBlocksToBatch(batchTime, streamId) } - def getReceiverInfo(streamId: Int): Option[ReceiverInfo] = { - receiverInfo.get(streamId) - } - - private def getReceivedBlockInfoQueue(streamId: Int) = { - receivedBlockInfo.getOrElseUpdate(streamId, new SynchronizedQueue[ReceivedBlockInfo]) + def cleanupOldInfo(cleanupThreshTime: Time) { + receivedBlockTracker.cleanupOldBatches(cleanupThreshTime) } /** Register a receiver */ - def registerReceiver( + private def registerReceiver( streamId: Int, typ: String, host: String, @@ -196,7 +142,7 @@ class ReceiverTracker(ssc: StreamingContext, skipReceiverLaunch: Boolean = false } /** Deregister a receiver */ - def deregisterReceiver(streamId: Int, message: String, error: String) { + private def deregisterReceiver(streamId: Int, message: String, error: String) { val newReceiverInfo = receiverInfo.get(streamId) match { case Some(oldInfo) => oldInfo.copy(actor = null, active = false, lastErrorMessage = message, lastError = error) @@ -215,21 +161,12 @@ class ReceiverTracker(ssc: StreamingContext, skipReceiverLaunch: Boolean = false } /** Add new blocks for the given stream */ - def addBlock(receivedBlockInfo: ReceivedBlockInfo): Boolean = { - try { - receivedBlockCheckpointerOption.foreach { _.write(receivedBlockInfo) } - getReceivedBlockInfoQueue(receivedBlockInfo.streamId) += receivedBlockInfo - logDebug(s"Stream ${receivedBlockInfo.streamId} received block ${receivedBlockInfo.blockId}") - true - } catch { - case e: Exception => - logError("Error adding block " + receivedBlockInfo, e) - false - } + private def addBlock(receivedBlockInfo: ReceivedBlockInfo): Boolean = { + receivedBlockTracker.addBlock(receivedBlockInfo) } /** Report error sent by a receiver */ - def reportError(streamId: Int, message: String, error: String) { + private def reportError(streamId: Int, message: String, error: String) { val newReceiverInfo = receiverInfo.get(streamId) match { case Some(oldInfo) => oldInfo.copy(lastErrorMessage = message, lastError = error) @@ -249,7 +186,7 @@ class ReceiverTracker(ssc: StreamingContext, skipReceiverLaunch: Boolean = false /** Check if any blocks are left to be processed */ def hasMoreReceivedBlockIds: Boolean = { - !receivedBlockInfo.values.forall(_.isEmpty) + receivedBlockTracker.hasUnallocatedReceivedBlocks() } /** Actor to receive messages from the receivers. 
*/ diff --git a/streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedBlockHandler.scala b/streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedBlockHandler.scala index fe36dbc210f24..cc5b5b8136b81 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedBlockHandler.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedBlockHandler.scala @@ -71,7 +71,7 @@ private[streaming] class WriteAheadLogBasedBlockHandler( private val logManager = new WriteAheadLogManager( checkpointDirToLogDir(checkpointDir, streamId), hadoopConf, rollingInterval, maxFailures, - callerName = "WriteAheadLogBasedHandler", + callerName = "WriteAheadLogBasedBlockHandler", clock = clock ) @@ -93,7 +93,9 @@ private[streaming] class WriteAheadLogBasedBlockHandler( val pushToBlockManagerFuture = Future { blockManager.putBytes(blockId, serializedBlock, storageLevel, tellMaster = true) } - val pushToLogFuture = Future { logManager.writeToLog(serializedBlock) } + val pushToLogFuture = Future { + logManager.writeToLog(serializedBlock) + } val combinedFuture = for { _ <- pushToBlockManagerFuture fileSegment <- pushToLogFuture @@ -103,7 +105,7 @@ private[streaming] class WriteAheadLogBasedBlockHandler( } def clearOldBlocks(threshTime: Long) { - logManager.clearOldLogs(threshTime) + logManager.cleanupOldLogs(threshTime) } def stop() { diff --git a/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogManager.scala b/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogManager.scala index 0c104c1609e9a..c70ecb0da4e54 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogManager.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogManager.scala @@ -7,6 +7,7 @@ import scala.concurrent.{ExecutionContext, Future} import org.apache.hadoop.conf.Configuration import org.apache.hadoop.fs.Path +import org.apache.hadoop.fs.permission.FsPermission import org.apache.spark.Logging import org.apache.spark.streaming.storage.WriteAheadLogManager._ import org.apache.spark.streaming.util.{Clock, SystemClock} @@ -17,22 +18,24 @@ private[streaming] class WriteAheadLogManager( hadoopConf: Configuration, rollingIntervalSecs: Int = 60, maxFailures: Int = 3, - callerName: String = null, + callerName: String = "", clock: Clock = new SystemClock ) extends Logging { private val pastLogs = new ArrayBuffer[LogInfo] - private val threadpoolName = "WriteAheadLogManager" + - Option(callerName).map { s => s" for $s" }.getOrElse("") + private val callerNameTag = + if (callerName != null && callerName.nonEmpty) s" for $callerName" else "" + private val threadpoolName = s"WriteAheadLogManager $callerNameTag" implicit private val executionContext = ExecutionContext.fromExecutorService( Utils.newDaemonFixedThreadPool(1, threadpoolName)) + override protected val logName = s"WriteAheadLogManager $callerNameTag" private var currentLogPath: String = null private var currentLogWriter: WriteAheadLogWriter = null private var currentLogWriterStartTime: Long = -1L private var currentLogWriterStopTime: Long = -1L - recoverPastLogs() + initializeOrRecover() def writeToLog(byteBuffer: ByteBuffer): FileSegment = synchronized { var fileSegment: FileSegment = null @@ -41,7 +44,7 @@ private[streaming] class WriteAheadLogManager( var succeeded = false while (!succeeded && failures < maxFailures) { try { - fileSegment = getLogWriter.write(byteBuffer) + fileSegment = 
getLogWriter(clock.currentTime).write(byteBuffer) succeeded = true } catch { case ex: Exception => @@ -74,7 +77,7 @@ private[streaming] class WriteAheadLogManager( * between the node calculating the threshTime (say, driver node), and the local system time * (say, worker node), the caller has to take account of possible time skew. */ - def clearOldLogs(threshTime: Long): Unit = { + def cleanupOldLogs(threshTime: Long): Unit = { val oldLogFiles = synchronized { pastLogs.filter { _.endTime < threshTime } } logInfo(s"Attempting to clear ${oldLogFiles.size} old log files in $logDirectory " + s"older than $threshTime: ${oldLogFiles.map { _.path }.mkString("\n")}") @@ -107,9 +110,8 @@ private[streaming] class WriteAheadLogManager( logInfo("Stopped log manager") } - private def getLogWriter: WriteAheadLogWriter = synchronized { - val currentTime = clock.currentTime() - if (currentLogPath == null || currentTime > currentLogWriterStopTime) { + private def getLogWriter(currentTime: Long): WriteAheadLogWriter = synchronized { + if (currentLogWriter == null || currentTime > currentLogWriterStopTime) { resetWriter() if (currentLogPath != null) { pastLogs += LogInfo(currentLogWriterStartTime, currentLogWriterStopTime, currentLogPath) @@ -124,21 +126,25 @@ private[streaming] class WriteAheadLogManager( currentLogWriter } - private def recoverPastLogs(): Unit = synchronized { + private def initializeOrRecover(): Unit = synchronized { val logDirectoryPath = new Path(logDirectory) - val fs = logDirectoryPath.getFileSystem(hadoopConf) - if (fs.exists(logDirectoryPath) && fs.getFileStatus(logDirectoryPath).isDir) { - val logFileInfo = logFilesTologInfo(fs.listStatus(logDirectoryPath).map { _.getPath }) + val fileSystem = logDirectoryPath.getFileSystem(hadoopConf) + + if (fileSystem.exists(logDirectoryPath) && fileSystem.getFileStatus(logDirectoryPath).isDir) { + val logFileInfo = logFilesTologInfo(fileSystem.listStatus(logDirectoryPath).map { _.getPath }) pastLogs.clear() pastLogs ++= logFileInfo logInfo(s"Recovered ${logFileInfo.size} log files from $logDirectory") logDebug(s"Recovered files are:\n${logFileInfo.map(_.path).mkString("\n")}") + } else { + fileSystem.mkdirs(logDirectoryPath, + FsPermission.createImmutable(Integer.parseInt("770", 8).toShort)) + logInfo(s"Created ${logDirectory} for log files") } } private def resetWriter(): Unit = synchronized { if (currentLogWriter != null) { - currentLogWriter currentLogWriter.close() currentLogWriter = null } diff --git a/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogWriter.scala b/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogWriter.scala index f292bd0f045a9..68a1172d7d282 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogWriter.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/storage/WriteAheadLogWriter.scala @@ -16,7 +16,7 @@ */ package org.apache.spark.streaming.storage -import java.io.{BufferedOutputStream, Closeable, DataOutputStream, FileOutputStream} +import java.io._ import java.net.URI import java.nio.ByteBuffer @@ -24,6 +24,7 @@ import scala.util.Try import org.apache.hadoop.conf.Configuration import org.apache.hadoop.fs.{FSDataOutputStream, FileSystem} +import org.apache.spark.streaming.storage.FileSegment private[streaming] class WriteAheadLogWriter(path: String, conf: Configuration) extends Closeable { private val underlyingStream: Either[DataOutputStream, FSDataOutputStream] = { @@ -32,6 +33,7 @@ private[streaming] class 
WriteAheadLogWriter(path: String, conf: Configuration) val isDefaultLocal = defaultFs == null || defaultFs == "file" if ((isDefaultLocal && uri.getScheme == null) || uri.getScheme == "file") { + assert(!new File(uri.getPath).exists) Left(new DataOutputStream(new BufferedOutputStream(new FileOutputStream(uri.getPath)))) } else { Right(HdfsUtils.getOutputStream(path, conf)) diff --git a/streaming/src/test/scala/org/apache/spark/streaming/DriverFailureSuite.scala b/streaming/src/test/scala/org/apache/spark/streaming/DriverFailureSuite.scala index 664506f60f706..802b24e47e21c 100644 --- a/streaming/src/test/scala/org/apache/spark/streaming/DriverFailureSuite.scala +++ b/streaming/src/test/scala/org/apache/spark/streaming/DriverFailureSuite.scala @@ -25,7 +25,7 @@ import scala.util.Random import org.apache.hadoop.conf.Configuration import org.apache.hadoop.fs.Path -import org.apache.spark.{Logging, SparkConf} +import org.apache.spark.{HashPartitioner, Logging, SparkConf} import org.apache.spark.rdd.RDD import org.apache.spark.storage.StorageLevel import org.apache.spark.streaming.StreamingContext._ @@ -33,6 +33,7 @@ import org.apache.spark.streaming.dstream.DStream import org.apache.spark.streaming.receiver.Receiver import org.apache.spark.streaming.scheduler.{StreamingListener, StreamingListenerBatchCompleted} import org.apache.spark.util.Utils +import scala.collection.mutable.ArrayBuffer /** * This testsuite tests master failures at random times while the stream is running using @@ -66,27 +67,62 @@ class DriverFailureSuite extends TestSuiteBase with Logging { } */ test("multiple failures with receiver and updateStateByKey") { + + val operation = (st: DStream[String]) => { - val updateFunc = (values: Seq[Long], state: Option[Long]) => { - Some(values.foldLeft(0L)(_ + _) + state.getOrElse(0L)) + + val mapPartitionFunc = (iterator: Iterator[String]) => { + Iterator(iterator.flatMap(_.split(" ")).map(_ -> 1L).reduce((x, y) => (x._1, x._2 + y._2))) } - st.flatMap(_.split(" ")).map(x => (x, 1L)).updateStateByKey[Long](updateFunc) + + val updateFunc = (iterator: Iterator[(String, Seq[Long], Option[Seq[Long]])]) => { + iterator.map { case (key, values, state) => + val combined = (state.getOrElse(Seq.empty) ++ values).sorted + if (state.isEmpty || state.get.max != DriverFailureTestReceiver.maxRecordsPerBlock) { + val oldState = s"[${ state.map { _.max }.getOrElse(-1) }, ${state.map { _.distinct.sum }.getOrElse(0)}]" + val newState = s"[${combined.max}, ${combined.distinct.sum}]" + println(s"Updated state for $key: state = $oldState, new values = $values, new state = $newState") + } + (key, combined) + } + } + + st.mapPartitions(mapPartitionFunc) + .updateStateByKey[Seq[Long]](updateFunc, new HashPartitioner(2), rememberPartitioner = false) .checkpoint(batchDuration * 5) } - val expectedOutput = - (1L to DriverFailureTestReceiver.maxRecordsPerBlock).map(x => (1L to x).sum).toSet + val maxValue = DriverFailureTestReceiver.maxRecordsPerBlock + val expectedValues = (1L to maxValue).toSet - val verify = (time: Time, output: Seq[(String, Long)]) => { - println(s"Count at $time: ${output.mkString(", ")}") - if (!output.map { _._2 }.forall(expectedOutput.contains)) { - throw new Exception(s"Incorrect output: $output\nExpected output: $expectedOutput") + val verify = (time: Time, output: Seq[(String, Seq[Long])]) => { + val outputStr = output.map { x => (x._1, x._2.distinct.sum) }.sortBy(_._1).mkString(", ") + println(s"State at $time: $outputStr") + + val incompletelyReceivedWords = output.filter { _._2.max < 
maxValue } + if (incompletelyReceivedWords.size > 1) { + val debugStr = incompletelyReceivedWords.map { x => + s"""${x._1}: ${x._2.mkString(",")}, sum = ${x._2.distinct.sum}""" + }.mkString("\n") + throw new Exception(s"Incorrect processing of input, all input not processed:\n$debugStr\n") + } + + output.foreach { case (key, values) => + if (!values.forall(expectedValues.contains)) { + val sum = values.distinct.sum + val debugStr = values.zip(1L to values.size).map { + x => if (x._1 == x._2) x._1 else s"[${x._2}]" + }.mkString(",") + s", sum = $sum" + throw new Exception(s"Incorrect sequence of values in output:\n$debugStr\n") + } } } - val driverTest = new ReceiverBasedDriverFailureTest[(String, Long)]( - "./driver-test/", batchDuration.milliseconds.toInt, 120, operation, verify) - driverTest.testAndGetError().map(errorMessage => fail(errorMessage)) + val driverTest = new ReceiverBasedDriverFailureTest[(String, Seq[Long])]( + "./driver-test/", 200, 50, operation, verify) + driverTest.testAndGetError().map { errorMessage => + fail(errorMessage) + } } } @@ -98,7 +134,7 @@ abstract class DriverFailureTest( ) extends Logging { @transient private val checkpointDir = createCheckpointDir() - @transient private val timeoutMillis = batchDurationMillis * numBatchesToRun * 2 + @transient private val timeoutMillis = batchDurationMillis * numBatchesToRun * 4 @transient @volatile private var killed = false @transient @volatile private var killCount = 0 @@ -123,6 +159,7 @@ abstract class DriverFailureTest( private def run(): Option[String] = { val runStartTime = System.currentTimeMillis + var killingThread: Thread = null def allBatchesCompleted = batchesCompleted >= numBatchesToRun def timedOut = (System.currentTimeMillis - runStartTime) > timeoutMillis @@ -131,19 +168,15 @@ abstract class DriverFailureTest( while(!failed && !allBatchesCompleted && !timedOut) { // Start the thread to kill the streaming after some time killed = false - val killingThread = new KillingThread(ssc, batchDurationMillis * 10) - killingThread.start() try { - // Start the streaming computation and let it run while ... 
- // (i) StreamingContext has not been shut down yet - // (ii) The last expected output has not been generated yet - // (iii) Its not timed out yet - System.clearProperty("spark.streaming.clock") - System.clearProperty("spark.driver.port") ssc.addStreamingListener(new BatchCompletionListener) ssc.start() + + killingThread = new KillingThread(ssc, batchDurationMillis * 10) + killingThread.start() + while (!failed && !killed && !allBatchesCompleted && !timedOut) { - ssc.awaitTermination(100) + ssc.awaitTermination(1) } } catch { case e: Exception => @@ -169,20 +202,22 @@ abstract class DriverFailureTest( "\n-------------------------------------------\n" ) Thread.sleep(sleepTime) + // Recreate the streaming context from checkpoint + System.clearProperty("spark.driver.port") ssc = StreamingContext.getOrCreate(checkpointDir.toString, () => { throw new Exception("Trying to create new context when it " + "should be reading from checkpoint file") }) - println("Restarting") + println("Restarted") } } if (failed) { - Some(s"Failed with message: ${DriverFailureTest.failureMessage}") + Some(s"Failed with message: ${DriverFailureTest.firstFailureMessage}") } else if (timedOut) { Some(s"Timed out after $batchesCompleted/$numBatchesToRun batches, and " + - s"${System.currentTimeMillis} ms (time out = $timeoutMillis ms") + s"${System.currentTimeMillis} ms (time out = $timeoutMillis ms)") } else if (allBatchesCompleted) { None } else { @@ -222,12 +257,10 @@ abstract class DriverFailureTest( "Killing streaming context after " + killWaitTime + " ms" + "\n---------------------------------------\n" ) - if (ssc != null) { - ssc.stop() - killed = true - killCount += 1 - println("Killed") - } + ssc.stop() + killed = true + killCount += 1 + println("Killed") logInfo("Killing thread finished normally") } catch { case ie: InterruptedException => logInfo("Killing thread interrupted") @@ -240,16 +273,18 @@ abstract class DriverFailureTest( object DriverFailureTest { @transient @volatile var failed: Boolean = _ - @transient @volatile var failureMessage: String = _ + @transient @volatile var firstFailureMessage: String = _ def fail(message: String) { - failed = true - failureMessage = message + if (!failed) { + failed = true + firstFailureMessage = message + } } def reset() { failed = false - failureMessage = "NOT SET" + firstFailureMessage = "NOT SET" } } @@ -266,13 +301,29 @@ class ReceiverBasedDriverFailureTest[T]( @transient val conf = new SparkConf() conf.setMaster("local[4]") .setAppName("ReceiverBasedDriverFailureTest") - .set("spark.streaming.receiver.writeAheadLog.enable", "true") + .set("spark.streaming.receiver.writeAheadLog.enable", "true") // enable write ahead log + .set("spark.streaming.receiver.writeAheadLog.rotationIntervalSecs", "10") // rotate logs to test cleanup override def setupContext(checkpointDirector: String): StreamingContext = { val context = StreamingContext.getOrCreate(checkpointDirector, () => { val newSsc = new StreamingContext(conf, Milliseconds(batchDurationMillis)) val inputStream = newSsc.receiverStream[String](new DriverFailureTestReceiver) + /*inputStream.mapPartitions(iter => { + val sum = iter.map { _.split(" ").size }.fold(0)(_ + _) + Iterator(sum) + }).foreachRDD ((rdd: RDD[Int], time: Time) => { + try { + val collected = rdd.collect().sorted + println(s"# in partitions at $time = ${collected.mkString(", ")}") + } catch { + case ie: InterruptedException => + // ignore + case e: Exception => + DriverFailureTest.fail(e.toString) + } + + })*/ val operatedStream = 
operation(inputStream) val verify = outputVerifyingFunction @@ -304,11 +355,11 @@ class DriverFailureTestReceiver extends Receiver[String](StorageLevel.MEMORY_ONL class ReceivingThread extends Thread() { override def run() { while (!isStopped() && !isInterrupted()) { - val block = getNextBlock() - store(block) - commitBlock() try { - Thread.sleep(100) + val block = getNextBlock() + store(block) + commitBlock() + Thread.sleep(10) } catch { case ie: InterruptedException => case e: Exception => @@ -343,9 +394,9 @@ object DriverFailureTestReceiver { counter.set(1) currentKey.set(1) - def getNextBlock(): Iterator[String] = { + def getNextBlock(): ArrayBuffer[String] = { val count = counter.get() - (1 to count).map { _ => "word" + currentKey.get() }.iterator + new ArrayBuffer ++= (1 to count).map { _ => "word%03d".format(currentKey.get()) } } def commitBlock() { diff --git a/streaming/src/test/scala/org/apache/spark/streaming/ReceivedBlockTrackerSuite.scala b/streaming/src/test/scala/org/apache/spark/streaming/ReceivedBlockTrackerSuite.scala new file mode 100644 index 0000000000000..ef152ac538abe --- /dev/null +++ b/streaming/src/test/scala/org/apache/spark/streaming/ReceivedBlockTrackerSuite.scala @@ -0,0 +1,210 @@ +package org.apache.spark.streaming + +import java.io.File + +import scala.Some +import scala.collection.mutable.ArrayBuffer +import scala.concurrent.duration._ +import scala.language.{implicitConversions, postfixOps} +import scala.util.Random + +import com.google.common.io.Files +import org.apache.commons.io.FileUtils +import org.apache.hadoop.conf.Configuration +import org.apache.spark.{Logging, SparkConf} +import org.apache.spark.storage.StreamBlockId +import org.apache.spark.streaming.scheduler._ +import org.apache.spark.streaming.storage.WriteAheadLogReader +import org.apache.spark.streaming.storage.WriteAheadLogSuite._ +import org.apache.spark.streaming.util.{Clock, ManualClock, SystemClock} +import org.apache.spark.util.Utils +import org.scalatest.{BeforeAndAfter, FunSuite, Matchers} +import org.scalatest.concurrent.Eventually._ + +class ReceivedBlockTrackerSuite + extends FunSuite with BeforeAndAfter with Matchers with Logging { + + val conf = new SparkConf().setMaster("local[2]").setAppName("ReceivedBlockTrackerSuite") + conf.set("spark.streaming.receivedBlockTracker.writeAheadLog.rotationIntervalSecs", "1") + + val hadoopConf = new Configuration() + val akkaTimeout = 10 seconds + val streamId = 1 + + var allReceivedBlockTrackers = new ArrayBuffer[ReceivedBlockTracker]() + var checkpointDirectory: File = null + + before { + checkpointDirectory = Files.createTempDir() + } + + after { + allReceivedBlockTrackers.foreach { _.stop() } + if (checkpointDirectory != null && checkpointDirectory.exists()) { + FileUtils.deleteDirectory(checkpointDirectory) + checkpointDirectory = null + } + } + + test("block addition, and block to batch allocation") { + val receivedBlockTracker = createTracker(enableCheckpoint = false) + receivedBlockTracker.getUnallocatedBlocks(streamId) shouldEqual Seq.empty + + val blockInfos = generateBlockInfos() + blockInfos.map(receivedBlockTracker.addBlock) + + receivedBlockTracker.getUnallocatedBlocks(streamId) shouldEqual blockInfos + receivedBlockTracker.getOrAllocateBlocksToBatch(1, streamId) shouldEqual blockInfos + receivedBlockTracker.getUnallocatedBlocks(streamId) should have size 0 + receivedBlockTracker.getOrAllocateBlocksToBatch(1, streamId) shouldEqual blockInfos + receivedBlockTracker.getOrAllocateBlocksToBatch(2, streamId) should have size 0 + } + 
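The test above pins down the tracker's core allocation contract: newly added blocks wait in a per-stream unallocated queue, the first request for a batch time drains that queue into a fixed allocation, repeated requests for the same batch time return the same blocks, and a later batch time starts out empty. As a rough standalone sketch of just that contract (plain Scala collections only; AllocationModel, Block, and BatchTime are stand-ins, not the ReceivedBlockTracker, ReceivedBlockInfo, or Time classes from this patch):

import scala.collection.mutable

// Simplified model of the allocate-once semantics checked by the test above.
class AllocationModel[Block, BatchTime] {
  private val unallocated = new mutable.Queue[Block]
  private val allocated = new mutable.HashMap[BatchTime, Seq[Block]]

  def addBlock(block: Block): Unit = synchronized { unallocated += block }

  def getOrAllocate(batchTime: BatchTime): Seq[Block] = synchronized {
    // The first caller for a batch time drains the queue; later callers see the same result.
    allocated.getOrElseUpdate(batchTime, unallocated.dequeueAll(_ => true).toList)
  }
}

object AllocationModelDemo extends App {
  val model = new AllocationModel[String, Long]
  Seq("block-1", "block-2").foreach(model.addBlock)
  assert(model.getOrAllocate(1L) == Seq("block-1", "block-2")) // first request drains the queue
  assert(model.getOrAllocate(1L) == Seq("block-1", "block-2")) // same batch time, same blocks
  assert(model.getOrAllocate(2L).isEmpty)                      // nothing left for a later batch
}

Allocating on first request, and logging each addition and allocation as a record, is what lets a restarted driver replay the write ahead log and rebuild the same batch-to-block mapping; that recovery path is what the next test exercises.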
+ test("block addition, block to batch allocation and cleanup with write ahead log") { + val manualClock = new ManualClock + conf.getInt( + "spark.streaming.receivedBlockTracker.writeAheadLog.rotationIntervalSecs", -1) should be (1) + + // Set the time increment level to twice the rotation interval so that every increment creates + // a new log file + val timeIncrementMillis = 2000L + def incrementTime() { + manualClock.addToTime(timeIncrementMillis) + } + + // Generate and add blocks to the given tracker + def addBlockInfos(tracker: ReceivedBlockTracker): Seq[ReceivedBlockInfo] = { + val blockInfos = generateBlockInfos() + blockInfos.map(tracker.addBlock) + blockInfos + } + + // Print the data present in the log ahead files in the log directory + def printLogFiles(message: String) { + val fileContents = getWriteAheadLogFiles().map { file => + (s"\n>>>>> $file: <<<<<\n${getWrittenLogData(file).mkString("\n")}") + }.mkString("\n") + logInfo(s"\n\n=====================\n$message\n$fileContents\n=====================\n") + } + + // Start tracker and add blocks + val tracker1 = createTracker(enableCheckpoint = true, clock = manualClock) + val blockInfos1 = addBlockInfos(tracker1) + tracker1.getUnallocatedBlocks(streamId).toList shouldEqual blockInfos1 + + // Verify whether write ahead log has correct contents + val expectedWrittenData1 = blockInfos1.map(BlockAddition) + getWrittenLogData() shouldEqual expectedWrittenData1 + getWriteAheadLogFiles() should have size 1 + + // Restart tracker and verify recovered list of unallocated blocks + incrementTime() + val tracker2 = createTracker(enableCheckpoint = true, clock = manualClock) + tracker2.getUnallocatedBlocks(streamId).toList shouldEqual blockInfos1 + + // Allocate blocks to batch and verify whether the unallocated blocks got allocated + val batchTime1 = manualClock.currentTime + tracker2.getOrAllocateBlocksToBatch(batchTime1, streamId) shouldEqual blockInfos1 + + // Add more blocks and allocate to another batch + incrementTime() + val batchTime2 = manualClock.currentTime + val blockInfos2 = addBlockInfos(tracker2) + tracker2.getOrAllocateBlocksToBatch(batchTime2, streamId) shouldEqual blockInfos2 + + // Verify whether log has correct contents + val expectedWrittenData2 = expectedWrittenData1 ++ + Seq(createBatchAllocation(batchTime1, blockInfos1)) ++ + blockInfos2.map(BlockAddition) ++ + Seq(createBatchAllocation(batchTime2, blockInfos2)) + getWrittenLogData() shouldEqual expectedWrittenData2 + + // Restart tracker and verify recovered state + incrementTime() + val tracker3 = createTracker(enableCheckpoint = true, clock = manualClock) + tracker3.getOrAllocateBlocksToBatch(batchTime1, streamId) shouldEqual blockInfos1 + tracker3.getOrAllocateBlocksToBatch(batchTime2, streamId) shouldEqual blockInfos2 + tracker3.getUnallocatedBlocks(streamId) shouldBe empty + + // Cleanup first batch but not second batch + val oldestLogFile = getWriteAheadLogFiles().head + incrementTime() + tracker3.cleanupOldBatches(batchTime2) + + // Verify that the batch allocations have been cleaned, and the act has been written to log + tracker3.getOrAllocateBlocksToBatch(batchTime1, streamId) shouldEqual Seq.empty + getWrittenLogData(getWriteAheadLogFiles().last) should contain(createBatchCleanup(batchTime1)) + + // Verify that at least one log file gets deleted + eventually(timeout(10 seconds), interval(10 millisecond )) { + getWriteAheadLogFiles() should not contain oldestLogFile + } + printLogFiles("After cleanup") + + // Restart tracker and verify recovered state, 
specifically whether info about the first + // batch has been removed, but not the second batch + incrementTime() + val tracker4 = createTracker(enableCheckpoint = true, clock = manualClock) + tracker4.getUnallocatedBlocks(streamId) shouldBe empty + tracker4.getOrAllocateBlocksToBatch(batchTime1, streamId) shouldBe empty // should be cleaned + tracker4.getOrAllocateBlocksToBatch(batchTime2, streamId) shouldEqual blockInfos2 + } + + /** + * Create tracker object with the optional provided clock. Use fake clock if you + * want to control time by manually incrementing it to test log cleanup. + */ + def createTracker(enableCheckpoint: Boolean, clock: Clock = new SystemClock): ReceivedBlockTracker = { + val cpDirOption = if (enableCheckpoint) Some(checkpointDirectory.toString) else None + val tracker = new ReceivedBlockTracker(conf, hadoopConf, Seq(streamId), clock, cpDirOption) + allReceivedBlockTrackers += tracker + tracker + } + + /** Generate blocks infos using random ids */ + def generateBlockInfos(): Seq[ReceivedBlockInfo] = { + (1 to 5).map { id => + new ReceivedBlockInfo(streamId, + StreamBlockId(streamId, math.abs(Random.nextInt())), 0, null, None) + }.toList + } + + /** Get all the data written in the given write ahead log file. */ + def getWrittenLogData(logFile: String): Seq[ReceivedBlockTrackerRecord] = { + getWrittenLogData(Seq(logFile)) + } + + /** + * Get all the data written in the given write ahead log files. By default, it will read all + * files in the test log directory. + */ + def getWrittenLogData(logFiles: Seq[String] = getWriteAheadLogFiles): Seq[ReceivedBlockTrackerRecord] = { + logFiles.flatMap { + file => new WriteAheadLogReader(file, hadoopConf).toSeq + }.map { byteBuffer => + Utils.deserialize[ReceivedBlockTrackerRecord](byteBuffer.array) + }.toList + } + + /** Get all the write ahead log files in the test directory */ + def getWriteAheadLogFiles(): Seq[String] = { + import ReceivedBlockTracker._ + val logDir = checkpointDirToLogDir(checkpointDirectory.toString) + getLogFilesInDirectory(new File(logDir)).map { _.toString } + } + + /** Create batch allocation object from the given info */ + def createBatchAllocation(time: Long, blockInfos: Seq[ReceivedBlockInfo]): BatchAllocations = { + BatchAllocations(time, AllocatedBlocks(Map((streamId -> blockInfos)))) + } + + /** Create batch cleanup object from the given info */ + def createBatchCleanup(time: Long, moreTimes: Long*): BatchCleanup = { + BatchCleanup((Seq(time) ++ moreTimes).map(Time.apply)) + } + + implicit def millisToTime(milliseconds: Long): Time = Time(milliseconds) + + implicit def timeToMillis(time: Time): Long = time.milliseconds + +} diff --git a/streaming/src/test/scala/org/apache/spark/streaming/ReceiverTrackerSuite.scala b/streaming/src/test/scala/org/apache/spark/streaming/ReceiverTrackerSuite.scala deleted file mode 100644 index 7d4473e27f6a5..0000000000000 --- a/streaming/src/test/scala/org/apache/spark/streaming/ReceiverTrackerSuite.scala +++ /dev/null @@ -1,133 +0,0 @@ -package org.apache.spark.streaming - -import java.io.File - -import scala.concurrent.{Await, Future} -import scala.concurrent.ExecutionContext.Implicits.global -import scala.concurrent.duration._ -import scala.language.postfixOps -import scala.util.Random - -import akka.pattern.ask -import com.google.common.io.Files -import org.apache.commons.io.FileUtils -import org.scalatest.{BeforeAndAfter, BeforeAndAfterAll, FunSuite, Matchers} -import org.scalatest.concurrent.Eventually._ - -import org.apache.spark.{Logging, SparkConf, 
SparkContext} -import org.apache.spark.storage.{StorageLevel, StreamBlockId} -import org.apache.spark.streaming.receiver.Receiver -import org.apache.spark.streaming.scheduler.{AddBlock, ReceivedBlockInfo, ReceivedBlockInfoCheckpointer, ReceiverTracker} -import org.apache.spark.streaming.storage.{FileSegment, WriteAheadLogReader} -import org.apache.spark.streaming.storage.WriteAheadLogSuite._ -import org.apache.spark.util.Utils - -class ReceiverTrackerSuite - extends FunSuite with BeforeAndAfter with BeforeAndAfterAll with Matchers with Logging { - - val conf = new SparkConf().setMaster("local[2]").setAppName("ReceiverTrackerSuite") - val sc = new SparkContext(conf) - val akkaTimeout = 10 seconds - - var ssc: StreamingContext = null - var receiverTracker: ReceiverTracker = null - var checkpointDirectory: File = null - - before { - checkpointDirectory = Files.createTempDir() - } - - after { - if (receiverTracker != null) { - receiverTracker.stop() - receiverTracker = null - } - if (ssc != null) { - ssc.stop(stopSparkContext = false) - ssc = null - } - if (checkpointDirectory != null && checkpointDirectory.exists()) { - FileUtils.deleteDirectory(checkpointDirectory) - checkpointDirectory = null - } - } - - override def afterAll() { - sc.stop() - } - - test("add blocks info and retrieve them") { - createTracker(enableCheckpoint = false) - val blockIds = (1 to 10).map { _ => math.abs(Random.nextInt()) } - val futures = blockIds.map { id => - receiverTracker.actor.ask(AddBlock(createBlockInfo(id, 1)))(akkaTimeout).mapTo[Boolean] - } - Await.ready(Future.sequence(futures), akkaTimeout) - - val recordedBlockIds = receiverTracker.getReceivedBlockInfo(1) - recordedBlockIds.map { _.blockId.uniqueId } shouldEqual blockIds - } - - test("add block info with checkpoint enabled, and recover them") { - createTracker(enableCheckpoint = true) - val blockIds = (1 to 10).map { _ => math.abs(Random.nextInt()) } - val futures = blockIds.map { id => - receiverTracker.actor.ask(AddBlock(createBlockInfo(id, 1)))(akkaTimeout).mapTo[Boolean] - } - Await.ready(Future.sequence(futures), akkaTimeout) - receiverTracker.stop() - - val logFiles = getWriteAheadLogFiles() - logFiles.size should be > 0 - - val logData = logFiles.flatMap { - file => new WriteAheadLogReader(file.toString, sc.hadoopConfiguration).toSeq - }.map { byteBuffer => - Utils.deserialize[ReceivedBlockInfo](byteBuffer.array) - } - logData foreach { _.blockId.streamId shouldEqual 1 } - logData.map { _.blockId.uniqueId }.toList shouldEqual blockIds - - createTracker(enableCheckpoint = true) - val recoveredBlockIds = receiverTracker.getReceivedBlockInfo(1) - recoveredBlockIds.map { _.blockId.uniqueId } shouldEqual blockIds - } - - ignore("clean old block info") { - // TODO (TD) - } - - def createTracker(enableCheckpoint: Boolean) { - ssc = new StreamingContext(sc, Seconds(1)) - if (enableCheckpoint) { - ssc.checkpoint(checkpointDirectory.toString) - assert(ssc.checkpointDir != null) - } - - val receiver = new Receiver[String](StorageLevel.MEMORY_ONLY) { - def onStart(): Unit = { } - def onStop(): Unit = { } - } - ssc.receiverStream(receiver) - receiverTracker = new ReceiverTracker(ssc, skipReceiverLaunch = true) - receiverTracker.start() - if (enableCheckpoint) { - assert(receiverTracker.receivedBlockCheckpointerOption.isDefined) - } - - // Wait for the receiver to be start before doing anything with it - eventually(timeout(akkaTimeout), interval(10 milliseconds)) { - receiverTracker.getReceivedBlockInfo(0) should not be None - } - } - - def 
createBlockInfo(blockUniqueId: Long, streamId: Int): ReceivedBlockInfo = { - new ReceivedBlockInfo(streamId, - StreamBlockId(streamId, blockUniqueId), 0, null, None) - } - - def getWriteAheadLogFiles(): Seq[File] = { - getLogFilesInDirectory( - new File(ReceivedBlockInfoCheckpointer.checkpointDirToLogDir(checkpointDirectory.toString))) - } -} From acd94673948e4433fb216df5577c7f9e669c3bbc Mon Sep 17 00:00:00 2001 From: Tathagata Das Date: Mon, 20 Oct 2014 19:21:42 -0700 Subject: [PATCH 10/10] Moved around packages. --- .../streaming/{storage => }/rdd/HDFSBackedBlockRDD.scala | 0 .../apache/spark/streaming/scheduler/ReceiverTracker.scala | 2 +- .../spark/streaming/storage/ReceivedBlockHandler.scala | 6 +++--- .../{scheduler => storage}/ReceivedBlockTracker.scala | 3 ++- .../apache/spark/streaming/ReceivedBlockTrackerSuite.scala | 6 +++++- .../{storage => }/rdd/HDFSBackedBlockRDDSuite.scala | 0 .../spark/streaming/storage/ReceivedBlockHandlerSuite.scala | 2 +- 7 files changed, 12 insertions(+), 7 deletions(-) rename streaming/src/main/scala/org/apache/spark/streaming/{storage => }/rdd/HDFSBackedBlockRDD.scala (100%) rename streaming/src/main/scala/org/apache/spark/streaming/{scheduler => storage}/ReceivedBlockTracker.scala (98%) rename streaming/src/test/scala/org/apache/spark/streaming/{storage => }/rdd/HDFSBackedBlockRDDSuite.scala (100%) diff --git a/streaming/src/main/scala/org/apache/spark/streaming/storage/rdd/HDFSBackedBlockRDD.scala b/streaming/src/main/scala/org/apache/spark/streaming/rdd/HDFSBackedBlockRDD.scala similarity index 100% rename from streaming/src/main/scala/org/apache/spark/streaming/storage/rdd/HDFSBackedBlockRDD.scala rename to streaming/src/main/scala/org/apache/spark/streaming/rdd/HDFSBackedBlockRDD.scala diff --git a/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceiverTracker.scala b/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceiverTracker.scala index 0eabffa66a9cb..f2aa02d065222 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceiverTracker.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceiverTracker.scala @@ -31,7 +31,7 @@ import org.apache.spark.SerializableWritable import org.apache.spark.storage.StreamBlockId import org.apache.spark.streaming.{StreamingContext, Time} import org.apache.spark.streaming.receiver.{Receiver, ReceiverSupervisorImpl, StopReceiver} -import org.apache.spark.streaming.storage.{FileSegment, WriteAheadLogManager} +import org.apache.spark.streaming.storage.{ReceivedBlockTracker, FileSegment, WriteAheadLogManager} import org.apache.spark.util.Utils /** Information about blocks received by the receiver */ diff --git a/streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedBlockHandler.scala b/streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedBlockHandler.scala index cc5b5b8136b81..d0d2370201a8e 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedBlockHandler.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedBlockHandler.scala @@ -22,7 +22,7 @@ private[streaming] case class ByteBufferBlock(byteBuffer: ByteBuffer) extends Re private[streaming] trait ReceivedBlockHandler { def storeBlock(blockId: StreamBlockId, receivedBlock: ReceivedBlock): Option[AnyRef] - def clearOldBlocks(threshTime: Long) + def cleanupOldBlock(threshTime: Long) } private[streaming] class BlockManagerBasedBlockHandler( @@ -45,7 +45,7 @@ private[streaming] class 
BlockManagerBasedBlockHandler( None } - def clearOldBlocks(threshTime: Long) { + def cleanupOldBlock(threshTime: Long) { // this is not used as blocks inserted into the BlockManager are cleared by DStream's clearing // of BlockRDDs. } @@ -104,7 +104,7 @@ private[streaming] class WriteAheadLogBasedBlockHandler( Some(Await.result(combinedFuture, blockStoreTimeout)) } - def clearOldBlocks(threshTime: Long) { + def cleanupOldBlock(threshTime: Long) { logManager.cleanupOldLogs(threshTime) } diff --git a/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceivedBlockTracker.scala b/streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedBlockTracker.scala similarity index 98% rename from streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceivedBlockTracker.scala rename to streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedBlockTracker.scala index 25c0980d7462e..866d77dd25489 100644 --- a/streaming/src/main/scala/org/apache/spark/streaming/scheduler/ReceivedBlockTracker.scala +++ b/streaming/src/main/scala/org/apache/spark/streaming/storage/ReceivedBlockTracker.scala @@ -1,4 +1,4 @@ -package org.apache.spark.streaming.scheduler +package org.apache.spark.streaming.storage import java.nio.ByteBuffer @@ -13,6 +13,7 @@ import org.apache.spark.streaming.storage.WriteAheadLogManager import org.apache.spark.util.Utils import org.apache.spark.storage.StreamBlockId import org.apache.spark.streaming.util.Clock +import org.apache.spark.streaming.scheduler.ReceivedBlockInfo private[streaming] sealed trait ReceivedBlockTrackerRecord diff --git a/streaming/src/test/scala/org/apache/spark/streaming/ReceivedBlockTrackerSuite.scala b/streaming/src/test/scala/org/apache/spark/streaming/ReceivedBlockTrackerSuite.scala index ef152ac538abe..6b791df092f64 100644 --- a/streaming/src/test/scala/org/apache/spark/streaming/ReceivedBlockTrackerSuite.scala +++ b/streaming/src/test/scala/org/apache/spark/streaming/ReceivedBlockTrackerSuite.scala @@ -14,12 +14,16 @@ import org.apache.hadoop.conf.Configuration import org.apache.spark.{Logging, SparkConf} import org.apache.spark.storage.StreamBlockId import org.apache.spark.streaming.scheduler._ -import org.apache.spark.streaming.storage.WriteAheadLogReader +import org.apache.spark.streaming.storage._ import org.apache.spark.streaming.storage.WriteAheadLogSuite._ import org.apache.spark.streaming.util.{Clock, ManualClock, SystemClock} import org.apache.spark.util.Utils import org.scalatest.{BeforeAndAfter, FunSuite, Matchers} import org.scalatest.concurrent.Eventually._ +import org.apache.spark.streaming.scheduler.ReceivedBlockInfo +import org.apache.spark.storage.StreamBlockId +import scala.Some +import org.apache.spark.streaming.storage.BlockAddition class ReceivedBlockTrackerSuite extends FunSuite with BeforeAndAfter with Matchers with Logging { diff --git a/streaming/src/test/scala/org/apache/spark/streaming/storage/rdd/HDFSBackedBlockRDDSuite.scala b/streaming/src/test/scala/org/apache/spark/streaming/rdd/HDFSBackedBlockRDDSuite.scala similarity index 100% rename from streaming/src/test/scala/org/apache/spark/streaming/storage/rdd/HDFSBackedBlockRDDSuite.scala rename to streaming/src/test/scala/org/apache/spark/streaming/rdd/HDFSBackedBlockRDDSuite.scala diff --git a/streaming/src/test/scala/org/apache/spark/streaming/storage/ReceivedBlockHandlerSuite.scala b/streaming/src/test/scala/org/apache/spark/streaming/storage/ReceivedBlockHandlerSuite.scala index 784d615cf499c..654bc7bad92b6 100644 --- 
a/streaming/src/test/scala/org/apache/spark/streaming/storage/ReceivedBlockHandlerSuite.scala +++ b/streaming/src/test/scala/org/apache/spark/streaming/storage/ReceivedBlockHandlerSuite.scala @@ -108,7 +108,7 @@ class ReceivedBlockHandlerSuite extends FunSuite with BeforeAndAfter with Matche manualClock.currentTime() shouldEqual 5000L val cleanupThreshTime = 3000L - receivedBlockHandler.clearOldBlocks(cleanupThreshTime) + receivedBlockHandler.cleanupOldBlock(cleanupThreshTime) eventually(timeout(10000 millis), interval(10 millis)) { getWriteAheadLogFiles().size should be < preCleanupLogFiles.size }
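For reference, the handler contract this suite exercises reduces to a standalone sketch. BlockHandlerSketch and TimestampedStore below are hypothetical names; only the method shapes mirror ReceivedBlockHandler in this patch, whose write-ahead-log-based implementation delegates cleanupOldBlock to WriteAheadLogManager.cleanupOldLogs so that whole log files older than the threshold are deleted.

import scala.collection.mutable.ArrayBuffer

// Illustrative sketch of the store/cleanup contract; not the real ReceivedBlockHandler.
trait BlockHandlerSketch {
  def storeBlock(blockId: String, data: Seq[Any]): Option[AnyRef]
  def cleanupOldBlock(threshTime: Long): Unit
}

class TimestampedStore extends BlockHandlerSketch {
  private case class Entry(blockId: String, data: Seq[Any], insertionTime: Long)
  private val entries = new ArrayBuffer[Entry]

  def storeBlock(blockId: String, data: Seq[Any]): Option[AnyRef] = {
    entries += Entry(blockId, data, System.currentTimeMillis)
    None // nothing extra to report here (the WAL-based handler returns the segment it wrote)
  }

  def cleanupOldBlock(threshTime: Long): Unit = {
    // Drop everything recorded before the threshold, the same behaviour the suite checks
    // by comparing the set of write ahead log files before and after cleanup.
    entries --= entries.filter(_.insertionTime < threshTime)
  }
}

As the patch itself notes, the BlockManager-based handler leaves cleanupOldBlock a no-op, since blocks inserted into the BlockManager are cleared through the DStream's clearing of BlockRDDs; only the write-ahead-log-based handler has files of its own to prune.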