From c539c949abc5b8019e7fe79aa23fb440311d788f Mon Sep 17 00:00:00 2001
From: gss2002
Date: Wed, 14 Nov 2018 00:27:09 -0500
Subject: [PATCH] [SPARK-25778] WriteAheadLogBackedBlockRDD in YARN Cluster Mode
 Fails due to lack of access to java.io.tmpdir in HDFS

WriteAheadLogBackedBlockRDD's use of java.io.tmpdir fails when $PWD resolves to
a folder on HDFS and the Spark YARN cluster job does not have the required
access to that folder to create the dummy WAL directory. The fix is to pass the
locally resolved dummy directory, as a file: URI, to createLogForReceiver so
that nonExistentDirectory always points at the local filesystem.
---
 .../spark/streaming/rdd/WriteAheadLogBackedBlockRDD.scala | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/streaming/src/main/scala/org/apache/spark/streaming/rdd/WriteAheadLogBackedBlockRDD.scala b/streaming/src/main/scala/org/apache/spark/streaming/rdd/WriteAheadLogBackedBlockRDD.scala
index 844760ab61d2e..f677c492d561f 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/rdd/WriteAheadLogBackedBlockRDD.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/rdd/WriteAheadLogBackedBlockRDD.scala
@@ -136,7 +136,7 @@ class WriteAheadLogBackedBlockRDD[T: ClassTag](
         // this dummy directory should not already exist otherwise the WAL will try to recover
         // past events from the directory and throw errors.
         val nonExistentDirectory = new File(
-          System.getProperty("java.io.tmpdir"), UUID.randomUUID().toString).getAbsolutePath
+          System.getProperty("java.io.tmpdir"), UUID.randomUUID().toString).toURI.toString
         writeAheadLog = WriteAheadLogUtils.createLogForReceiver(
           SparkEnv.get.conf, nonExistentDirectory, hadoopConf)
         dataRead = writeAheadLog.read(partition.walRecordHandle)
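
For context, a minimal standalone sketch (not part of the patch) of why the URI
form matters: a bare absolute path carries no scheme, so Hadoop's Path resolves
it against fs.defaultFS (HDFS in YARN cluster mode), whereas File.toURI produces
a file: URI that always stays on the local filesystem. The object name
DummyWalDirCheck and the printed values are illustrative assumptions, not code
from the Spark tree.

import java.io.File
import java.util.UUID

import org.apache.hadoop.fs.Path

// Illustrative sketch: compares how the two forms of the dummy WAL directory
// path are interpreted by Hadoop's Path.
object DummyWalDirCheck {
  def main(args: Array[String]): Unit = {
    val dummy = new File(System.getProperty("java.io.tmpdir"), UUID.randomUUID().toString)

    // Before the patch: no scheme, so the WAL's Hadoop Path is resolved against
    // fs.defaultFS -- on a YARN cluster that is HDFS, where the job may lack access.
    val bare = new Path(dummy.getAbsolutePath)
    println(bare.toUri.getScheme)   // null

    // After the patch: an explicit file: scheme, so the dummy directory is always
    // treated as a local filesystem path regardless of fs.defaultFS.
    val asUri = new Path(dummy.toURI.toString)
    println(asUri.toUri.getScheme)  // file
  }
}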