Initial commit for job killing.
parent 3443d3fd43
commit cbc48be13b
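This commit threads a kill path through the whole stack: SparkContext.killJob delegates to DAGScheduler.killJob, which drops the job's stages and asks the TaskScheduler to kill their tasks; the standalone backend forwards a KillTask message to the executor, whose TaskRunner marks the Task killed and sets TaskContext.interrupted; the new InterruptibleIterator then stops yielding records. A hedged sketch of the driver-side call this adds (how a caller obtains the integer job id is not part of this diff, so the id below is a placeholder):

    // Sketch only; assumes a job is already running and that its id is known by other means.
    val sc = new SparkContext("local[2]", "kill-demo")
    val someJobId = 0            // placeholder, not provided by any API in this commit
    sc.killJob(someJobId)        // added in the SparkContext hunk below; forwards to DAGScheduler.killJob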
@@ -0,0 +1,26 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License.  You may obtain a copy of the License at
+ *
+ *    http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark
+
+class InterruptibleIterator[+T](val context: TaskContext, val delegate: Iterator[T])
+  extends Iterator[T] {
+
+  def hasNext: Boolean = !context.interrupted && delegate.hasNext
+
+  def next(): T = delegate.next()
+}
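InterruptibleIterator only consults context.interrupted in hasNext, so a kill takes effect between records rather than preempting user code mid-element. A minimal sketch, assuming the usual RDD plumbing (the record source below is made up for illustration, not part of this commit), of how a compute implementation could wrap its raw iterator:

    import org.apache.spark.{InterruptibleIterator, Partition, SparkContext, TaskContext}
    import org.apache.spark.rdd.RDD

    class SketchRDD(sc: SparkContext) extends RDD[Int](sc, Nil) {
      override def getPartitions: Array[Partition] =
        Array(new Partition { override val index = 0 })

      override def compute(split: Partition, context: TaskContext): Iterator[Int] = {
        val raw = Iterator.range(0, 1000000)   // stands in for real record reading
        // Once the task is killed, hasNext returns false and the consumer drains no more records.
        new InterruptibleIterator(context, raw)
      }
    }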
@@ -812,6 +812,13 @@ class SparkContext(
     result
   }
 
+  /**
+   * Kill a running job.
+   */
+  def killJob(jobId: Int) {
+    dagScheduler.killJob(jobId)
+  }
+
   /**
    * Clean a closure to make it ready to serialized and send to tasks
    * (removes unreferenced variables in $outer's, updates REPL variables)
@@ -25,6 +25,7 @@ class TaskContext(
   val splitId: Int,
   val attemptId: Long,
   val runningLocally: Boolean = false,
+  @volatile var interrupted: Boolean = false,
   val taskMetrics: TaskMetrics = TaskMetrics.empty()
 ) extends Serializable {
 
@@ -17,7 +17,7 @@
 
 package org.apache.spark.executor
 
-import java.io.{File}
+import java.io.File
 import java.lang.management.ManagementFactory
 import java.nio.ByteBuffer
 import java.util.concurrent._

@@ -31,7 +31,8 @@ import org.apache.spark.util.Utils
 
 /**
- * The Mesos executor for Spark.
+ * The backend executor for Spark. The executor maintains a thread pool and uses it to execute
+ * tasks.
  */
 private[spark] class Executor(
     executorId: String,

@@ -101,18 +102,38 @@ private[spark] class Executor(
   val executorSource = new ExecutorSource(this, executorId)
 
   // Initialize Spark environment (using system properties read above)
-  val env = SparkEnv.createFromSystemProperties(executorId, slaveHostname, 0, false, false)
+  private val env = SparkEnv.createFromSystemProperties(executorId, slaveHostname, 0,
+    isDriver = false, isLocal = false)
   SparkEnv.set(env)
   env.metricsSystem.registerSource(executorSource)
 
-  private val akkaFrameSize = env.actorSystem.settings.config.getBytes("akka.remote.netty.message-frame-size")
+  private val akkaFrameSize = {
+    env.actorSystem.settings.config.getBytes("akka.remote.netty.message-frame-size")
+  }
 
   // Start worker thread pool
   val threadPool = new ThreadPoolExecutor(
     1, 128, 600, TimeUnit.SECONDS, new SynchronousQueue[Runnable])
 
+  // Maintains the list of running tasks.
+  private val runningTasks = new ConcurrentHashMap[Long, TaskRunner]
+
   def launchTask(context: ExecutorBackend, taskId: Long, serializedTask: ByteBuffer) {
-    threadPool.execute(new TaskRunner(context, taskId, serializedTask))
+    val task = new TaskRunner(context, taskId, serializedTask)
+    runningTasks.put(taskId, task)
+    threadPool.execute(task)
   }
 
+  def killTask(taskId: Long) {
+    val task = runningTasks.get(taskId)
+    if (task != null) {
+      task.kill()
+      // We remove the task also in the finally block in TaskRunner.run.
+      // The reason we need to remove it here is because killTask might be called before the task
+      // is even launched, and never reaching that finally block. ConcurrentHashMap's remove is
+      // idempotent.
+      runningTasks.remove(taskId)
+    }
+  }
+
   /** Get the Yarn approved local directories. */
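The comment in killTask leans on the fact that removing an absent key from a ConcurrentHashMap is a harmless no-op, since the same task id may be removed both there and in the finally block added to TaskRunner.run further below. A tiny standalone illustration of that property (not Spark code):

    import java.util.concurrent.ConcurrentHashMap

    object RemoveTwice {
      def main(args: Array[String]) {
        val m = new ConcurrentHashMap[Long, String]
        m.put(1L, "task-1")
        m.remove(1L)           // removes the entry
        m.remove(1L)           // second removal does nothing and throws nothing
        println(m.isEmpty)     // prints: true
      }
    }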
@@ -124,15 +145,26 @@ private[spark] class Executor(
       .getOrElse(Option(System.getenv("LOCAL_DIRS"))
       .getOrElse(""))
 
-    if (localDirs.isEmpty()) {
+    if (localDirs.isEmpty) {
       throw new Exception("Yarn Local dirs can't be empty")
     }
-    return localDirs
+    localDirs
   }
 
   class TaskRunner(context: ExecutorBackend, taskId: Long, serializedTask: ByteBuffer)
     extends Runnable {
 
+    @volatile private var killed = false
+    @volatile private var task: Task[Any] = _
+
+    def kill() {
+      // Note that there is a tiny possibiliy of raising here.
+      killed = true
+      if (task != null) {
+        task.kill()
+      }
+    }
+
     override def run() {
       val startTime = System.currentTimeMillis()
       SparkEnv.set(env)

@@ -150,22 +182,29 @@ private[spark] class Executor(
         Accumulators.clear()
         val (taskFiles, taskJars, taskBytes) = Task.deserializeWithDependencies(serializedTask)
         updateDependencies(taskFiles, taskJars)
-        val task = ser.deserialize[Task[Any]](taskBytes, Thread.currentThread.getContextClassLoader)
+        task = ser.deserialize[Task[Any]](taskBytes, Thread.currentThread.getContextClassLoader)
+
+        // If this task has been killed before we deserialized it, let's quit now. Otherwise,
+        // continue executing the task.
+        if (killed) {
+          context.statusUpdate(taskId, TaskState.KILLED, ser.serialize(""))
+        }
+
         attemptedTask = Some(task)
-        logInfo("Its epoch is " + task.epoch)
+        logDebug("Its epoch is " + task.epoch)
         env.mapOutputTracker.updateEpoch(task.epoch)
         taskStart = System.currentTimeMillis()
         val value = task.run(taskId.toInt)
         val taskFinish = System.currentTimeMillis()
         for (m <- task.metrics) {
-          m.hostname = Utils.localHostName
+          m.hostname = Utils.localHostName()
           m.executorDeserializeTime = (taskStart - startTime).toInt
           m.executorRunTime = (taskFinish - taskStart).toInt
           m.jvmGCTime = getTotalGCTime - startGCTime
         }
-        //TODO I'd also like to track the time it takes to serialize the task results, but that is huge headache, b/c
-        // we need to serialize the task metrics first. If TaskMetrics had a custom serialized format, we could
-        // just change the relevants bytes in the byte buffer
+        // TODO I'd also like to track the time it takes to serialize the task results, but that is
+        // huge headache, b/c we need to serialize the task metrics first. If TaskMetrics had a
+        // custom serialized format, we could just change the relevants bytes in the byte buffer
         val accumUpdates = Accumulators.values
         val result = new TaskResult(value, accumUpdates, task.metrics.getOrElse(null))
         val serializedResult = ser.serialize(result)

@@ -198,6 +237,8 @@ private[spark] class Executor(
           logError("Exception in task ID " + taskId, t)
           //System.exit(1)
         }
+      } finally {
+        runningTasks.remove(taskId)
       }
     }
   }

@@ -207,7 +248,7 @@ private[spark] class Executor(
    * created by the interpreter to the search path
    */
   private def createClassLoader(): ExecutorURLClassLoader = {
-    var loader = this.getClass.getClassLoader
+    val loader = this.getClass.getClassLoader
 
     // For each of the jars in the jarSet, add them to the class loader.
     // We assume each of the files has already been fetched.

@@ -229,7 +270,7 @@ private[spark] class Executor(
         val klass = Class.forName("org.apache.spark.repl.ExecutorClassLoader")
           .asInstanceOf[Class[_ <: ClassLoader]]
         val constructor = klass.getConstructor(classOf[String], classOf[ClassLoader])
-        return constructor.newInstance(classUri, parent)
+        constructor.newInstance(classUri, parent)
       } catch {
         case _: ClassNotFoundException =>
           logError("Could not find org.apache.spark.repl.ExecutorClassLoader on classpath!")

@@ -237,7 +278,7 @@ private[spark] class Executor(
           null
       }
     } else {
-      return parent
+      parent
     }
   }
 
@@ -69,6 +69,12 @@ private[spark] class StandaloneExecutorBackend(
         executor.launchTask(this, taskDesc.taskId, taskDesc.serializedTask)
       }
 
+    case KillTask(taskId, _) =>
+      logInfo("Kill task %s %s".format(taskId, executorId))
+      if (executor != null) {
+        executor.killTask(taskId)
+      }
+
     case Terminated(_) | RemoteClientDisconnected(_, _) | RemoteClientShutdown(_, _) =>
       logError("Driver terminated or disconnected! Shutting down.")
       System.exit(1)
@@ -128,6 +128,7 @@ class DAGScheduler(
   // stray messages to detect.
   val failedEpoch = new HashMap[String, Long]
 
+  // stage id to the active job
   val idToActiveJob = new HashMap[Int, ActiveJob]
 
   val waiting = new HashSet[Stage] // Stages we need to run whose parents aren't done

@@ -334,6 +335,35 @@ class DAGScheduler(
     listener.awaitResult()    // Will throw an exception if the job fails
   }
 
+  def killJob(jobId: Int) {
+    activeJobs.find(job => job.jobId == jobId).foreach(job => killJob(job))
+  }
+
+  private def killJob(job: ActiveJob) {
+    logInfo("Killing Job and cleaning up stages %d".format(job.jobId))
+    activeJobs.remove(job)
+    idToActiveJob.remove(job.jobId)
+    val stage = job.finalStage
+    resultStageToJob.remove(stage)
+    killStage(stage)
+    // recursively remove all parent stages
+    stage.parents.foreach(p => killStage(p))
+    job.listener.jobFailed(new SparkException("Job killed"))
+  }
+
+  private def killStage(stage: Stage) {
+    logInfo("Killing Stage %s".format(stage.id))
+    stageIdToStage.remove(stage.id)
+    if (stage.isShuffleMap) {
+      shuffleToMapStage.remove(stage.id)
+    }
+    waiting.remove(stage)
+    pendingTasks.remove(stage)
+    running.remove(stage)
+    taskSched.killTasks(stage.id)
+    stage.parents.foreach(p => killStage(p))
+  }
+
   /**
    * Process one event retrieved from the event queue.
    * Returns true if we should stop the event loop.
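Because killJob fails the job's listener with SparkException("Job killed"), a driver thread blocked in runJob should see that failure surface as an exception. A hedged sketch of what a caller might observe (the exact propagation goes through JobWaiter, which this diff does not touch):

    import org.apache.spark.{SparkContext, SparkException}

    val sc = new SparkContext("local[2]", "kill-demo")
    val rdd = sc.parallelize(1 to 1000, 4)
    try {
      sc.runJob(rdd, (it: Iterator[Int]) => it.sum)   // blocks until the job finishes or fails
    } catch {
      case e: SparkException if e.getMessage.contains("Job killed") =>
        println("job was killed from another thread")
    }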
@@ -579,6 +609,11 @@ class DAGScheduler(
    */
   private def handleTaskCompletion(event: CompletionEvent) {
     val task = event.task
+
+    if (!stageIdToStage.contains(task.stageId)) {
+      // Skip all the actions if the stage has been cancelled.
+      return
+    }
     val stage = stageIdToStage(task.stageId)
 
     def markStageAsFinished(stage: Stage) = {
@@ -38,17 +38,17 @@ private[spark] object ResultTask {
     synchronized {
       val old = serializedInfoCache.get(stageId).orNull
       if (old != null) {
-        return old
+        old
       } else {
         val out = new ByteArrayOutputStream
-        val ser = SparkEnv.get.closureSerializer.newInstance
+        val ser = SparkEnv.get.closureSerializer.newInstance()
         val objOut = ser.serializeStream(new GZIPOutputStream(out))
         objOut.writeObject(rdd)
         objOut.writeObject(func)
         objOut.close()
         val bytes = out.toByteArray
         serializedInfoCache.put(stageId, bytes)
-        return bytes
+        bytes
       }
     }
   }

@@ -56,11 +56,11 @@ private[spark] object ResultTask {
   def deserializeInfo(stageId: Int, bytes: Array[Byte]): (RDD[_], (TaskContext, Iterator[_]) => _) = {
     val loader = Thread.currentThread.getContextClassLoader
     val in = new GZIPInputStream(new ByteArrayInputStream(bytes))
-    val ser = SparkEnv.get.closureSerializer.newInstance
+    val ser = SparkEnv.get.closureSerializer.newInstance()
     val objIn = ser.deserializeStream(in)
     val rdd = objIn.readObject().asInstanceOf[RDD[_]]
     val func = objIn.readObject().asInstanceOf[(TaskContext, Iterator[_]) => _]
-    return (rdd, func)
+    (rdd, func)
   }
 
   def clearCache() {

@@ -75,25 +75,20 @@ private[spark] class ResultTask[T, U](
     stageId: Int,
     var rdd: RDD[T],
     var func: (TaskContext, Iterator[T]) => U,
-    var partition: Int,
+    _partition: Int,
     @transient locs: Seq[TaskLocation],
     var outputId: Int)
-  extends Task[U](stageId) with Externalizable {
+  extends Task[U](stageId, _partition) with Externalizable {
 
   def this() = this(0, null, null, 0, null, 0)
 
-  var split = if (rdd == null) {
-    null
-  } else {
-    rdd.partitions(partition)
-  }
+  var split = if (rdd == null) null else rdd.partitions(partition)
 
   @transient private val preferredLocs: Seq[TaskLocation] = {
     if (locs == null) Nil else locs.toSet.toSeq
   }
 
-  override def run(attemptId: Long): U = {
-    val context = new TaskContext(stageId, partition, attemptId, runningLocally = false)
+  override def runTask(context: TaskContext): U = {
     metrics = Some(context.taskMetrics)
     try {
       func(context, rdd.iterator(split, context))
@@ -53,7 +53,7 @@ private[spark] object ShuffleMapTask {
       objOut.close()
       val bytes = out.toByteArray
       serializedInfoCache.put(stageId, bytes)
-      return bytes
+      bytes
     }
   }
 }

@@ -66,7 +66,7 @@ private[spark] object ShuffleMapTask {
     val objIn = ser.deserializeStream(in)
     val rdd = objIn.readObject().asInstanceOf[RDD[_]]
     val dep = objIn.readObject().asInstanceOf[ShuffleDependency[_,_]]
-    return (rdd, dep)
+    (rdd, dep)
   }
 }
 

@@ -75,7 +75,7 @@ private[spark] object ShuffleMapTask {
     val in = new GZIPInputStream(new ByteArrayInputStream(bytes))
     val objIn = new ObjectInputStream(in)
     val set = objIn.readObject().asInstanceOf[Array[(String, Long)]].toMap
-    return (HashMap(set.toSeq: _*))
+    HashMap(set.toSeq: _*)
   }
 
   def clearCache() {

@@ -89,9 +89,9 @@ private[spark] class ShuffleMapTask(
     stageId: Int,
     var rdd: RDD[_],
     var dep: ShuffleDependency[_,_],
-    var partition: Int,
+    _partition: Int,
     @transient private var locs: Seq[TaskLocation])
-  extends Task[MapStatus](stageId)
+  extends Task[MapStatus](stageId, _partition)
   with Externalizable
   with Logging {
 

@@ -129,11 +129,9 @@ private[spark] class ShuffleMapTask(
     split = in.readObject().asInstanceOf[Partition]
   }
 
-  override def run(attemptId: Long): MapStatus = {
+  override def runTask(context: TaskContext): MapStatus = {
     val numOutputSplits = dep.partitioner.numPartitions
-
-    val taskContext = new TaskContext(stageId, partition, attemptId, runningLocally = false)
-    metrics = Some(taskContext.taskMetrics)
+    metrics = Some(context.taskMetrics)
 
     val blockManager = SparkEnv.get.blockManager
     var shuffle: ShuffleBlocks = null

@@ -146,7 +144,7 @@ private[spark] class ShuffleMapTask(
       buckets = shuffle.acquireWriters(partition)
 
       // Write the map output to its associated buckets.
-      for (elem <- rdd.iterator(split, taskContext)) {
+      for (elem <- rdd.iterator(split, context)) {
         val pair = elem.asInstanceOf[Product2[Any, Any]]
         val bucketId = dep.partitioner.getPartition(pair._1)
         buckets.writers(bucketId).write(pair)

@@ -167,7 +165,7 @@ private[spark] class ShuffleMapTask(
       shuffleMetrics.shuffleBytesWritten = totalBytes
       metrics.get.shuffleWriteMetrics = Some(shuffleMetrics)
 
-      return new MapStatus(blockManager.blockManagerId, compressedSizes)
+      new MapStatus(blockManager.blockManagerId, compressedSizes)
     } catch { case e: Exception =>
       // If there is an exception from running the task, revert the partial writes
       // and throw the exception upstream to Spark.

@@ -181,7 +179,7 @@ private[spark] class ShuffleMapTask(
         shuffle.releaseWriters(buckets)
       }
       // Execute the callbacks on task completion.
-      taskContext.executeOnCompleteCallbacks()
+      context.executeOnCompleteCallbacks()
     }
   }
 
@@ -17,25 +17,59 @@
 
 package org.apache.spark.scheduler
 
-import org.apache.spark.serializer.SerializerInstance
 import java.io.{DataInputStream, DataOutputStream}
 import java.nio.ByteBuffer
-import it.unimi.dsi.fastutil.io.FastByteArrayOutputStream
-import org.apache.spark.util.ByteBufferInputStream
+
 import scala.collection.mutable.HashMap
+
+import it.unimi.dsi.fastutil.io.FastByteArrayOutputStream
+
+import org.apache.spark.TaskContext
 import org.apache.spark.executor.TaskMetrics
+import org.apache.spark.serializer.SerializerInstance
+import org.apache.spark.util.ByteBufferInputStream
 
 /**
  * A task to execute on a worker node.
  */
-private[spark] abstract class Task[T](val stageId: Int) extends Serializable {
-  def run(attemptId: Long): T
+private[spark] abstract class Task[T](val stageId: Int, var partition: Int) extends Serializable {
+
+  def run(attemptId: Long): T = {
+    context = new TaskContext(stageId, partition, attemptId, runningLocally = false)
+    if (killed) {
+      kill()
+    }
+    runTask(context)
+  }
+
+  def runTask(context: TaskContext): T
 
   def preferredLocations: Seq[TaskLocation] = Nil
 
-  var epoch: Long = -1   // Map output tracker epoch. Will be set by TaskScheduler.
+  // Map output tracker epoch. Will be set by TaskScheduler.
+  var epoch: Long = -1
 
   var metrics: Option[TaskMetrics] = None
+
+  // Task context, to be initialized in run().
+  @transient protected var context: TaskContext = _
+
+  // A flag to indicate whether the task is killed. This is used in case context is not yet
+  // initialized when kill() is invoked.
+  @volatile @transient private var killed = false
+
+  /**
+   * Kills a task by setting the interrupted flag to true. This relies on the upper level Spark
+   * code and user code to properly handle the flag. This function should be idempotent so it can
+   * be called multiple times.
+   */
+  def kill() {
+    killed = true
+    if (context != null) {
+      context.interrupted = true
+    }
+  }
 }
 
 /**
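Under the reworked base class, subclasses implement runTask(context) instead of run(attemptId): run() now builds the TaskContext, honours a kill that arrived before execution, and then delegates. A minimal hypothetical subclass (in the spirit of the FakeTask change in the test hunks further down, and assumed to live under the spark package so the private[spark] base class is visible) showing how a cooperative loop observes a kill:

    import org.apache.spark.TaskContext
    import org.apache.spark.scheduler.Task

    // Hypothetical example, not part of this commit.
    private[spark] class CountingTask(stageId: Int, partition: Int, n: Int)
      extends Task[Int](stageId, partition) {

      override def runTask(context: TaskContext): Int = {
        var i = 0
        while (i < n && !context.interrupted) {   // stop early once kill() flips the flag
          i += 1
        }
        i
      }
    }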
@@ -19,6 +19,7 @@ package org.apache.spark.scheduler
 
 import org.apache.spark.scheduler.cluster.Pool
 import org.apache.spark.scheduler.cluster.SchedulingMode.SchedulingMode
 
 /**
  * Low-level task scheduler interface, implemented by both ClusterScheduler and LocalScheduler.
  * These schedulers get sets of tasks submitted to them from the DAGScheduler for each stage,

@@ -44,6 +45,9 @@ private[spark] trait TaskScheduler {
   // Submit a sequence of tasks to run.
   def submitTasks(taskSet: TaskSet): Unit
 
+  // Kill the stage.
+  def killTasks(stageId: Int)
+
   // Set a listener for upcalls. This is guaranteed to be set before submitTasks is called.
   def setListener(listener: TaskSchedulerListener): Unit
 
@@ -31,5 +31,9 @@ private[spark] class TaskSet(
     val properties: Properties) {
   val id: String = stageId + "." + attempt
 
+  def kill() {
+    tasks.foreach(_.kill())
+  }
+
   override def toString: String = "TaskSet " + id
 }
@@ -166,6 +166,20 @@ private[spark] class ClusterScheduler(val sc: SparkContext)
     backend.reviveOffers()
   }
 
+  override def killTasks(stageId: Int) {
+    synchronized {
+      schedulableBuilder.popTaskSetManagers(stageId).foreach { t =>
+        val ts = t.asInstanceOf[TaskSetManager].taskSet
+        ts.kill()
+        val taskIds = taskSetTaskIds(ts.id)
+        taskIds.foreach { tid =>
+          val execId = taskIdToExecutorId(tid)
+          backend.killTask(tid, execId)
+        }
+      }
+    }
+  }
+
   def taskSetFinished(manager: TaskSetManager) {
     this.synchronized {
       activeTaskSets -= manager.taskSet.id
@@ -32,8 +32,17 @@ import org.apache.spark.scheduler.cluster.SchedulingMode.SchedulingMode
  * addTaskSetManager: build the leaf nodes(TaskSetManagers)
  */
 private[spark] trait SchedulableBuilder {
+  def rootPool: Pool
+
   def buildPools()
+
   def addTaskSetManager(manager: Schedulable, properties: Properties)
+
+  def popTaskSetManagers(stageId: Int): Iterable[Schedulable] = {
+    val taskSets = rootPool.schedulableQueue.filter(_.stageId == stageId)
+    taskSets.foreach(rootPool.removeSchedulable)
+    taskSets
+  }
 }
 
 private[spark] class FIFOSchedulableBuilder(val rootPool: Pool)
@@ -17,7 +17,7 @@
 
 package org.apache.spark.scheduler.cluster
 
-import org.apache.spark.{SparkContext}
+import org.apache.spark.SparkContext
 
 /**
  * A backend interface for cluster scheduling systems that allows plugging in different ones under

@@ -30,6 +30,10 @@ private[spark] trait SchedulerBackend {
   def reviveOffers(): Unit
   def defaultParallelism(): Int
 
+  def killTask(taskId: Long, executorId: String) {
+    throw new UnsupportedOperationException
+  }
+
   // Memory used by each executor (in megabytes)
   protected val executorMemory: Int = SparkContext.executorMemoryRequested
 
@@ -30,6 +30,8 @@ private[spark] object StandaloneClusterMessages {
   // Driver to executors
   case class LaunchTask(task: TaskDescription) extends StandaloneClusterMessage
 
+  case class KillTask(taskId: Long, executor: String) extends StandaloneClusterMessage
+
   case class RegisteredExecutor(sparkProperties: Seq[(String, String)])
     extends StandaloneClusterMessage
 
@@ -90,6 +90,9 @@ class StandaloneSchedulerBackend(scheduler: ClusterScheduler, actorSystem: Actor
       case ReviveOffers =>
         makeOffers()
 
+      case KillTask(taskId, executorId) =>
+        executorActor(executorId) ! KillTask(taskId, executorId)
+
       case StopDriver =>
         sender ! true
         context.stop(self)

@@ -179,6 +182,10 @@ class StandaloneSchedulerBackend(scheduler: ClusterScheduler, actorSystem: Actor
     driverActor ! ReviveOffers
   }
 
+  override def killTask(taskId: Long, executorId: String) {
+    driverActor ! KillTask(taskId, executorId)
+  }
+
   override def defaultParallelism() = Option(System.getProperty("spark.default.parallelism"))
     .map(_.toInt).getOrElse(math.max(totalCoreCount.get(), 2))
 
@@ -128,6 +128,12 @@ private[spark] class LocalScheduler(threads: Int, val maxFailures: Int, val sc:
     }
   }
 
+  override def killTasks(stageId: Int) = synchronized {
+    schedulableBuilder.popTaskSetManagers(stageId).foreach {
+      _.asInstanceOf[TaskSetManager].taskSet.kill()
+    }
+  }
+
   def resourceOffer(freeCores: Int): Seq[TaskDescription] = {
     synchronized {
       var freeCpuCores = freeCores
@@ -58,7 +58,8 @@ class CacheManagerSuite extends FunSuite with BeforeAndAfter with EasyMockSugar
     }
 
     whenExecuting(blockManager) {
-      val context = new TaskContext(0, 0, 0, runningLocally = false, null)
+      val context = new TaskContext(0, 0, 0, interrupted = false, runningLocally = false,
+        taskMetrics = null)
       val value = cacheManager.getOrCompute(rdd, split, context, StorageLevel.MEMORY_ONLY)
       assert(value.toList === List(1, 2, 3, 4))
     }

@@ -70,7 +71,8 @@ class CacheManagerSuite extends FunSuite with BeforeAndAfter with EasyMockSugar
     }
 
     whenExecuting(blockManager) {
-      val context = new TaskContext(0, 0, 0, runningLocally = false, null)
+      val context = new TaskContext(0, 0, 0, interrupted = false, runningLocally = false,
+        taskMetrics = null)
       val value = cacheManager.getOrCompute(rdd, split, context, StorageLevel.MEMORY_ONLY)
       assert(value.toList === List(5, 6, 7))
     }

@@ -83,7 +85,8 @@ class CacheManagerSuite extends FunSuite with BeforeAndAfter with EasyMockSugar
     }
 
     whenExecuting(blockManager) {
-      val context = new TaskContext(0, 0, 0, runningLocally = true, null)
+      val context = new TaskContext(0, 0, 0, runningLocally = true, interrupted = false,
+        taskMetrics = null)
       val value = cacheManager.getOrCompute(rdd, split, context, StorageLevel.MEMORY_ONLY)
       assert(value.toList === List(1, 2, 3, 4))
     }
@@ -495,7 +495,7 @@ public class JavaAPISuite implements Serializable {
   @Test
   public void iterator() {
     JavaRDD<Integer> rdd = sc.parallelize(Arrays.asList(1, 2, 3, 4, 5), 2);
-    TaskContext context = new TaskContext(0, 0, 0, false, null);
+    TaskContext context = new TaskContext(0, 0, 0, false, false, null);
     Assert.assertEquals(1, rdd.iterator(rdd.splits().get(0), context).next().intValue());
   }
 
@@ -29,12 +29,13 @@ import org.apache.spark.SparkContext
 import org.apache.spark.Partition
 import org.apache.spark.TaskContext
 import org.apache.spark.{Dependency, ShuffleDependency, OneToOneDependency}
-import org.apache.spark.{FetchFailed, Success, TaskEndReason}
+import org.apache.spark.{Success, TaskEndReason}
 import org.apache.spark.storage.{BlockManagerId, BlockManagerMaster}
 
 import org.apache.spark.scheduler.cluster.Pool
 import org.apache.spark.scheduler.cluster.SchedulingMode
 import org.apache.spark.scheduler.cluster.SchedulingMode.SchedulingMode
+import org.apache.spark.FetchFailed
 
 /**
  * Tests for DAGScheduler. These tests directly call the event processing functions in DAGScheduler

@@ -62,6 +63,7 @@ class DAGSchedulerSuite extends FunSuite with BeforeAndAfter with LocalSparkCont
       taskSet.tasks.foreach(_.epoch = mapOutputTracker.getEpoch)
       taskSets += taskSet
     }
+    override def killTasks(stageId: Int) {}
     override def setListener(listener: TaskSchedulerListener) = {}
     override def defaultParallelism() = 2
   }
@@ -17,10 +17,11 @@
 
 package org.apache.spark.scheduler.cluster
 
+import org.apache.spark.TaskContext
 import org.apache.spark.scheduler.{TaskLocation, Task}
 
-class FakeTask(stageId: Int, prefLocs: Seq[TaskLocation] = Nil) extends Task[Int](stageId) {
-  override def run(attemptId: Long): Int = 0
+class FakeTask(stageId: Int, prefLocs: Seq[TaskLocation] = Nil) extends Task[Int](stageId, 0) {
+  override def runTask(context: TaskContext): Int = 0
 
   override def preferredLocations: Seq[TaskLocation] = prefLocs
 }