From 6c6e47e3cd4b5c717517609a19632e61c02b7d51 Mon Sep 17 00:00:00 2001 From: Ankur Dave <ankurdave@gmail.com> Date: Fri, 9 Sep 2011 01:46:00 +0000 Subject: [PATCH] Use BufferedOutputStream in ShuffleMapTask --- core/src/main/scala/spark/ShuffleMapTask.scala | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/core/src/main/scala/spark/ShuffleMapTask.scala b/core/src/main/scala/spark/ShuffleMapTask.scala index b64401c2c7..eb6a5e2df3 100644 --- a/core/src/main/scala/spark/ShuffleMapTask.scala +++ b/core/src/main/scala/spark/ShuffleMapTask.scala @@ -1,5 +1,6 @@ package spark +import java.io.BufferedOutputStream import java.io.FileOutputStream import java.io.ObjectOutputStream import scala.collection.mutable.HashMap @@ -26,7 +27,7 @@ extends DAGTask[String](stageId) with Logging { val ser = SparkEnv.get.serializer.newInstance() for (i <- 0 until numOutputSplits) { val file = LocalFileShuffle.getOutputFile(dep.shuffleId, partition, i) - val out = ser.outputStream(new FileOutputStream(file)) + val out = ser.outputStream(new BufferedOutputStream(new FileOutputStream(file))) buckets(i).foreach(pair => out.writeObject(pair)) // TODO: have some kind of EOF marker out.close() -- GitLab