From 4e2fe0bdaf7c2626d8b8461fed36259c9830a25c Mon Sep 17 00:00:00 2001
From: Matei Zaharia <matei@eecs.berkeley.edu>
Date: Fri, 6 Jul 2012 16:33:40 -0700
Subject: [PATCH] Miscellaneous bug fixes

---
 core/src/main/scala/spark/SparkContext.scala           |  2 +-
 core/src/main/scala/spark/executor/Executor.scala      |  8 +++++---
 .../scala/spark/executor/MesosExecutorRunner.scala     |  3 ++-
 .../scala/spark/scheduler/cluster/TaskSetManager.scala |  1 +
 .../scala/spark/scheduler/mesos/MesosScheduler.scala   | 10 ++++++----
 5 files changed, 15 insertions(+), 9 deletions(-)

diff --git a/core/src/main/scala/spark/SparkContext.scala b/core/src/main/scala/spark/SparkContext.scala
index d35b2b1cac..2e8cb609b2 100644
--- a/core/src/main/scala/spark/SparkContext.scala
+++ b/core/src/main/scala/spark/SparkContext.scala
@@ -63,7 +63,7 @@ class SparkContext(
     System.setProperty("spark.master.port", "0")
   }
 
-  private val isLocal = master.startsWith("local") // TODO: better check for local
+  private val isLocal = (master == "local" || master.startsWith("local["))
 
   // Create the Spark execution environment (cache, map output tracker, etc)
   val env = SparkEnv.createFromSystemProperties(
diff --git a/core/src/main/scala/spark/executor/Executor.scala b/core/src/main/scala/spark/executor/Executor.scala
index ad02b85254..ac30ae9aec 100644
--- a/core/src/main/scala/spark/executor/Executor.scala
+++ b/core/src/main/scala/spark/executor/Executor.scala
@@ -69,17 +69,19 @@ class Executor extends Logging {
         val value = task.run(taskId.toInt)
         val accumUpdates = Accumulators.values
         val result = new TaskResult(value, accumUpdates)
-        context.statusUpdate(taskId, TaskState.FINISHED, ser.serialize(result))
+        val serializedResult = ser.serialize(result)
+        logInfo("Serialized size of result for " + taskId + " is " + serializedResult.limit)
+        context.statusUpdate(taskId, TaskState.FINISHED, serializedResult)
         logInfo("Finished task ID " + taskId)
       } catch {
         case ffe: FetchFailedException => {
           val reason = ffe.toTaskEndReason
-          context.statusUpdate(taskId, TaskState.FINISHED, ser.serialize(reason))
+          context.statusUpdate(taskId, TaskState.FAILED, ser.serialize(reason))
         }
 
         case t: Throwable => {
           val reason = ExceptionFailure(t)
-          context.statusUpdate(taskId, TaskState.FINISHED, ser.serialize(reason))
+          context.statusUpdate(taskId, TaskState.FAILED, ser.serialize(reason))
 
           // TODO: Should we exit the whole executor here? On the one hand, the failed task may
           // have left some weird state around depending on when the exception was thrown, but on
diff --git a/core/src/main/scala/spark/executor/MesosExecutorRunner.scala b/core/src/main/scala/spark/executor/MesosExecutorRunner.scala
index 7695cbdfd7..f97d9d0bfa 100644
--- a/core/src/main/scala/spark/executor/MesosExecutorRunner.scala
+++ b/core/src/main/scala/spark/executor/MesosExecutorRunner.scala
@@ -6,6 +6,7 @@ import org.apache.mesos.Protos.{TaskState => MesosTaskState, TaskStatus => Mesos
 import spark.TaskState.TaskState
 import com.google.protobuf.ByteString
 import spark.{Utils, Logging}
+import spark.TaskState
 
 class MesosExecutorRunner(executor: Executor)
   extends MesosExecutor
@@ -18,7 +19,7 @@ class MesosExecutorRunner(executor: Executor)
     val mesosTaskId = TaskID.newBuilder().setValue(taskId.toString).build()
     driver.sendStatusUpdate(MesosTaskStatus.newBuilder()
       .setTaskId(mesosTaskId)
-      .setState(MesosTaskState.TASK_FINISHED)
+      .setState(TaskState.toMesos(state))
       .setData(ByteString.copyFrom(data))
       .build())
   }
diff --git a/core/src/main/scala/spark/scheduler/cluster/TaskSetManager.scala b/core/src/main/scala/spark/scheduler/cluster/TaskSetManager.scala
index 75b67a0eb4..ab07f1c8c2 100644
--- a/core/src/main/scala/spark/scheduler/cluster/TaskSetManager.scala
+++ b/core/src/main/scala/spark/scheduler/cluster/TaskSetManager.scala
@@ -227,6 +227,7 @@ class TaskSetManager(
   }
 
   def statusUpdate(tid: Long, state: TaskState, serializedData: ByteBuffer) {
+    logInfo("statusUpdate: " + tid + " is now " + state + " " + serializedData)
     state match {
       case TaskState.FINISHED =>
         taskFinished(tid, state, serializedData)
diff --git a/core/src/main/scala/spark/scheduler/mesos/MesosScheduler.scala b/core/src/main/scala/spark/scheduler/mesos/MesosScheduler.scala
index 8131d84fdf..f5c35becda 100644
--- a/core/src/main/scala/spark/scheduler/mesos/MesosScheduler.scala
+++ b/core/src/main/scala/spark/scheduler/mesos/MesosScheduler.scala
@@ -188,10 +188,12 @@ class MesosScheduler(
       for ((taskList, index) <- taskLists.zipWithIndex) {
         if (!taskList.isEmpty) {
           val offerNum = offerableIndices(index)
+          val slaveId = offers(offerNum).getSlaveId.getValue
+          slaveIdsWithExecutors += slaveId
           mesosTasks(offerNum) = new JArrayList[MesosTaskInfo](taskList.size)
           for (taskDesc <- taskList) {
-            taskIdToSlaveId(taskDesc.taskId) = offers(offerNum).getSlaveId.getValue
-            mesosTasks(offerNum).add(createMesosTask(taskDesc, offers(offerNum).getSlaveId))
+            taskIdToSlaveId(taskDesc.taskId) = slaveId
+            mesosTasks(offerNum).add(createMesosTask(taskDesc, slaveId))
           }
         }
       }
@@ -214,7 +216,7 @@ class MesosScheduler(
   }
 
   /** Turn a Spark TaskDescription into a Mesos task */
-  def createMesosTask(task: TaskDescription, slaveId: SlaveID): MesosTaskInfo = {
+  def createMesosTask(task: TaskDescription, slaveId: String): MesosTaskInfo = {
     val taskId = TaskID.newBuilder().setValue(task.taskId.toString).build()
     val cpuResource = Resource.newBuilder()
       .setName("cpus")
@@ -223,7 +225,7 @@ class MesosScheduler(
       .build()
     return MesosTaskInfo.newBuilder()
       .setTaskId(taskId)
-      .setSlaveId(slaveId)
+      .setSlaveId(SlaveID.newBuilder().setValue(slaveId).build())
       .setExecutor(executorInfo)
       .setName(task.name)
       .addResources(cpuResource)
-- 
GitLab