Spark 1.1.0 Source Reading: TaskScheduler

1. createTaskScheduler in SparkContext

    case "yarn-standalone" | "yarn-cluster" =>
      if (master == "yarn-standalone") {
        logWarning(
          "\"yarn-standalone\" is deprecated as of Spark 1.0. Use \"yarn-cluster\" instead.")
      }
      val scheduler = try {
        val clazz = Class.forName("org.apache.spark.scheduler.cluster.YarnClusterScheduler")
        val cons = clazz.getConstructor(classOf[SparkContext])
        cons.newInstance(sc).asInstanceOf[TaskSchedulerImpl]
      } catch {
        // TODO: Enumerate the exact reasons why it can fail
        // But irrespective of it, it means we cannot proceed !
        case e: Exception => {
          throw new SparkException("YARN mode not available ?", e)
        }
      }
      val backend = new CoarseGrainedSchedulerBackend(scheduler, sc.env.actorSystem)
      scheduler.initialize(backend) // call initialize on the concrete scheduler implementation
      scheduler
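YarnClusterScheduler is loaded by reflection so that spark-core compiles and runs even when the YARN module is absent from the classpath. Here is a minimal sketch of the same three-step pattern; the Greeter trait and EnglishGreeter class are invented for illustration:

    // Look up a class by name, fetch a matching constructor, instantiate, downcast --
    // the same steps createTaskScheduler performs for YarnClusterScheduler.
    trait Greeter { def greet(): String }

    class EnglishGreeter(name: String) extends Greeter {
      def greet(): String = "hello, " + name
    }

    object ReflectionSketch {
      def main(args: Array[String]): Unit = {
        val clazz = Class.forName("EnglishGreeter") // works when compiled in the default package
        val cons = clazz.getConstructor(classOf[String])
        val greeter = cons.newInstance("spark").asInstanceOf[Greeter]
        println(greeter.greet()) // hello, spark
      }
    }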

In TaskSchedulerImpl.scala:

    def initialize(backend: SchedulerBackend) {
      this.backend = backend
      // temporarily set rootPool name to empty
      rootPool = new Pool("", schedulingMode, 0, 0)
      schedulableBuilder = {
        schedulingMode match {
          case SchedulingMode.FIFO =>
            new FIFOSchedulableBuilder(rootPool)
          case SchedulingMode.FAIR =>
            new FairSchedulableBuilder(rootPool, conf)
        }
      }
      schedulableBuilder.buildPools()
    }
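Which builder initialize picks is driven by the spark.scheduler.mode setting (FIFO by default, FAIR for the pool-based fair scheduler). A minimal configuration example:

    import org.apache.spark.SparkConf

    // With FAIR, initialize builds a FairSchedulableBuilder, whose buildPools()
    // reads pool definitions from the file named by spark.scheduler.allocation.file.
    val conf = new SparkConf()
      .setAppName("fair-scheduling-demo")
      .set("spark.scheduler.mode", "FAIR") // default is FIFO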

2. submitTasks

    override def submitTasks(taskSet: TaskSet) {
      val tasks = taskSet.tasks
      logInfo("Adding task set " + taskSet.id + " with " + tasks.length + " tasks")
      this.synchronized {
        val manager = new TaskSetManager(this, taskSet, maxTaskFailures)
        activeTaskSets(taskSet.id) = manager
        schedulableBuilder.addTaskSetManager(manager, manager.taskSet.properties)

        if (!isLocal && !hasReceivedTask) {
          starvationTimer.scheduleAtFixedRate(new TimerTask() {
            override def run() {
              if (!hasLaunchedTask) {
                logWarning("Initial job has not accepted any resources; " +
                  "check your cluster UI to ensure that workers are registered " +
                  "and have sufficient memory")
              } else {
                this.cancel()
              }
            }
          }, STARVATION_TIMEOUT, STARVATION_TIMEOUT)
        }
        hasReceivedTask = true
      }
      backend.reviveOffers()
    }
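The starvation warning is ordinary java.util.Timer usage: the task re-fires until something launches, then cancels itself. A self-contained sketch of the pattern (15 seconds matches the default of spark.starvation.timeout; the object and field names here are mine):

    import java.util.{Timer, TimerTask}

    object StarvationTimerSketch {
      @volatile var hasLaunchedTask = false
      val STARVATION_TIMEOUT = 15000L // Spark 1.1 default for spark.starvation.timeout

      def main(args: Array[String]): Unit = {
        val starvationTimer = new Timer("task-starvation-timer", true) // daemon thread
        starvationTimer.scheduleAtFixedRate(new TimerTask {
          override def run(): Unit = {
            if (!hasLaunchedTask) {
              println("Initial job has not accepted any resources; check the cluster UI")
            } else {
              this.cancel() // stop warning once the first task has launched
            }
          }
        }, STARVATION_TIMEOUT, STARVATION_TIMEOUT)
        Thread.sleep(35000) // keep the JVM alive long enough to see two warnings
      }
    }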

3. reviveOffers in CoarseGrainedSchedulerBackend

    override def reviveOffers() {
      driverActor ! ReviveOffers  // send the message to CoarseGrainedSchedulerBackend's DriverActor
    }
The DriverActor answers the message by calling makeOffers:

    case ReviveOffers =>
      makeOffers()

    // Make fake resource offers on all executors
    def makeOffers() {
      launchTasks(scheduler.resourceOffers(
        executorHost.toArray.map {case (id, host) => new WorkerOffer(id, host, freeCores(id))}))
    }

Each offer describes the free resources of one executor:

    /**
     * Represents free resources available on an executor.
     */
    private[spark]
    case class WorkerOffer(executorId: String, host: String, cores: Int)
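To make the mapping concrete, here is a standalone rendering of what makeOffers computes; the executorHost and freeCores contents are invented stand-ins for the DriverActor's bookkeeping maps:

    import scala.collection.mutable.HashMap

    object MakeOffersSketch {
      case class WorkerOffer(executorId: String, host: String, cores: Int)

      def main(args: Array[String]): Unit = {
        // Stand-ins for DriverActor's executorHost and freeCores maps.
        val executorHost = HashMap("exec-1" -> "hostA", "exec-2" -> "hostB")
        val freeCores    = HashMap("exec-1" -> 4, "exec-2" -> 2)

        val offers = executorHost.toArray.map { case (id, host) =>
          WorkerOffer(id, host, freeCores(id))
        }
        // Prints WorkerOffer(exec-1,hostA,4) and WorkerOffer(exec-2,hostB,2) (order may vary).
        offers.foreach(println)
      }
    }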
The scheduler side, TaskSchedulerImpl.resourceOffers, matches pending task sets against these offers:

    /**
     * Called by cluster manager to offer resources on slaves. We respond by asking our active task
     * sets for tasks in order of priority. We fill each node with tasks in a round-robin manner so
     * that tasks are balanced across the cluster.
     */
    def resourceOffers(offers: Seq[WorkerOffer]): Seq[Seq[TaskDescription]] = synchronized {
      SparkEnv.set(sc.env)

      // Mark each slave as alive and remember its hostname
      for (o <- offers) {
        executorIdToHost(o.executorId) = o.host
        if (!executorsByHost.contains(o.host)) {
          executorsByHost(o.host) = new HashSet[String]()
          executorAdded(o.executorId, o.host)
        }
      }

      // Randomly shuffle offers to avoid always placing tasks on the same set of workers.
      val shuffledOffers = Random.shuffle(offers)
      // Build a list of tasks to assign to each worker.
      val tasks = shuffledOffers.map(o => new ArrayBuffer[TaskDescription](o.cores))
      val availableCpus = shuffledOffers.map(o => o.cores).toArray
      val sortedTaskSets = rootPool.getSortedTaskSetQueue
      for (taskSet <- sortedTaskSets) {
        logDebug("parentName: %s, name: %s, runningTasks: %s".format(
          taskSet.parent.name, taskSet.name, taskSet.runningTasks))
      }

      // Take each TaskSet in our scheduling order, and then offer it each node in increasing order
      // of locality levels so that it gets a chance to launch local tasks on all of them.
      var launchedTask = false
      for (taskSet <- sortedTaskSets; maxLocality <- TaskLocality.values) {
        do {
          launchedTask = false
          for (i <- 0 until shuffledOffers.size) {
            val execId = shuffledOffers(i).executorId
            val host = shuffledOffers(i).host
            if (availableCpus(i) >= CPUS_PER_TASK) {
              for (task <- taskSet.resourceOffer(execId, host, maxLocality)) {
                tasks(i) += task
                val tid = task.taskId
                taskIdToTaskSetId(tid) = taskSet.taskSet.id
                taskIdToExecutorId(tid) = execId
                activeExecutorIds += execId
                executorsByHost(host) += execId
                availableCpus(i) -= CPUS_PER_TASK
                assert (availableCpus(i) >= 0)
                launchedTask = true
              }
            }
          }
        } while (launchedTask)
      }

      if (tasks.size > 0) {
        hasLaunchedTask = true
      }
      return tasks
    }
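The heart of the method is the do/while sweep: keep looping over the shuffled offers, handing out one task per offer per pass, until a full pass launches nothing. A simplified, runnable sketch of just that loop (Offer, pendingTasks, and the task IDs are invented; CPUS_PER_TASK mirrors spark.task.cpus, default 1):

    import scala.collection.mutable.ArrayBuffer
    import scala.util.Random

    object RoundRobinSketch {
      case class Offer(executorId: String, cores: Int)
      val CPUS_PER_TASK = 1

      def assign(offers: Seq[Offer], pendingTasks: Int): Seq[Seq[Int]] = {
        val shuffledOffers = Random.shuffle(offers)  // avoid always loading the same workers
        val tasks = shuffledOffers.map(_ => new ArrayBuffer[Int])
        val availableCpus = shuffledOffers.map(_.cores).toArray
        var remaining = pendingTasks
        var launchedTask = false
        do {
          launchedTask = false
          for (i <- shuffledOffers.indices if remaining > 0 && availableCpus(i) >= CPUS_PER_TASK) {
            tasks(i) += remaining            // "launch" one task on offer i
            availableCpus(i) -= CPUS_PER_TASK
            remaining -= 1
            launchedTask = true
          }
        } while (launchedTask)               // stop once a full sweep launches nothing
        tasks
      }

      def main(args: Array[String]): Unit = {
        // 3 free cores in total, 5 pending tasks: 3 get scheduled, 2 stay pending.
        println(assign(Seq(Offer("e1", 2), Offer("e2", 1)), pendingTasks = 5))
      }
    }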

4. launchTasks

    // Launch tasks returned by a set of resource offers
    def launchTasks(tasks: Seq[Seq[TaskDescription]]) {
      for (task <- tasks.flatten) {
        freeCores(task.executorId) -= scheduler.CPUS_PER_TASK
        executorActor(task.executorId) ! LaunchTask(task)
      }
    }
The freeCores and executorActor maps are bookkeeping state inside the DriverActor of CoarseGrainedSchedulerBackend:

    class CoarseGrainedSchedulerBackend(scheduler: TaskSchedulerImpl, actorSystem: ActorSystem)
      extends SchedulerBackend with Logging
    {
      // Use an atomic variable to track total number of cores in the cluster for simplicity and speed
      var totalCoreCount = new AtomicInteger(0)
      val conf = scheduler.sc.conf
      private val timeout = AkkaUtils.askTimeout(conf)

      class DriverActor(sparkProperties: Seq[(String, String)]) extends Actor {
        private val executorActor = new HashMap[String, ActorRef]
        private val executorAddress = new HashMap[String, Address]
        private val executorHost = new HashMap[String, String]
        private val freeCores = new HashMap[String, Int]
        private val totalCores = new HashMap[String, Int]
        private val addressToExecutorId = new HashMap[Address, String]

LaunchTask is the driver-to-executor message:

    // Driver to executors
    case class LaunchTask(task: TaskDescription) extends CoarseGrainedClusterMessage

TaskDescription carries the serialized task:

    private[spark] class TaskDescription(
        val taskId: Long,
        val executorId: String,
        val name: String,
        val index: Int,    // Index within this task's TaskSet
        _serializedTask: ByteBuffer)
      extends Serializable {

      // Because ByteBuffers are not serializable, wrap the task in a SerializableBuffer
      private val buffer = new SerializableBuffer(_serializedTask)

      def serializedTask: ByteBuffer = buffer.value

      override def toString: String = "TaskDescription(TID=%d, index=%d)".format(taskId, index)
    }
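SerializableBuffer exists because java.nio.ByteBuffer does not implement java.io.Serializable. A simplified sketch of the idea, with hand-written serialization hooks (this is not Spark's exact implementation, just the technique):

    import java.io.{ByteArrayInputStream, ByteArrayOutputStream, ObjectInputStream, ObjectOutputStream}
    import java.nio.ByteBuffer

    // Wrap a ByteBuffer and serialize its bytes manually.
    class SerializableBufferSketch(@transient private var buf: ByteBuffer) extends Serializable {
      def value: ByteBuffer = buf

      private def writeObject(out: ObjectOutputStream): Unit = {
        out.writeInt(buf.remaining())
        val bytes = new Array[Byte](buf.remaining())
        buf.duplicate().get(bytes) // duplicate() so the original position is untouched
        out.write(bytes)
      }

      private def readObject(in: ObjectInputStream): Unit = {
        val bytes = new Array[Byte](in.readInt())
        in.readFully(bytes)
        buf = ByteBuffer.wrap(bytes)
      }
    }

    object SerializableBufferDemo {
      def main(args: Array[String]): Unit = {
        val baos = new ByteArrayOutputStream()
        val oos = new ObjectOutputStream(baos)
        oos.writeObject(new SerializableBufferSketch(ByteBuffer.wrap("task bytes".getBytes)))
        oos.close()
        val ois = new ObjectInputStream(new ByteArrayInputStream(baos.toByteArray))
        val back = ois.readObject().asInstanceOf[SerializableBufferSketch]
        println(new String(back.value.array())) // task bytes
      }
    }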

5. When CoarseGrainedSchedulerBackend receives an executor's registration, it records the executor

    def receive = {
      case RegisterExecutor(executorId, hostPort, cores) =>
        Utils.checkHostPort(hostPort, "Host port expected " + hostPort)
        if (executorActor.contains(executorId)) {
          sender ! RegisterExecutorFailed("Duplicate executor ID: " + executorId)
        } else {
          logInfo("Registered executor: " + sender + " with ID " + executorId)
          sender ! RegisteredExecutor(sparkProperties)
          executorActor(executorId) = sender
          executorHost(executorId) = Utils.parseHostPort(hostPort)._1
          totalCores(executorId) = cores
          freeCores(executorId) = cores
          executorAddress(executorId) = sender.path.address
          addressToExecutorId(sender.path.address) = executorId
          totalCoreCount.addAndGet(cores)
          makeOffers()
        }

The executor first registers with CoarseGrainedSchedulerBackend; only then does CoarseGrainedSchedulerBackend send (serialized) tasks to that executor.
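The exchange is plain fire-and-forget Akka messaging. A minimal, self-contained sketch of the register-then-acknowledge handshake (the actor classes and message names here are invented, not Spark's):

    import akka.actor._

    case class Register(executorId: String)
    case object Registered

    class DriverSketch extends Actor {
      def receive = {
        case Register(id) =>
          println("registered executor " + id)
          sender ! Registered // acknowledge, like RegisteredExecutor
      }
    }

    class ExecutorSketch(driver: ActorRef) extends Actor {
      override def preStart(): Unit =
        driver ! Register("exec-1") // like preStart in CoarseGrainedExecutorBackend
      def receive = {
        case Registered => println("successfully registered with driver")
      }
    }

    object HandshakeDemo extends App {
      val system = ActorSystem("sketch")
      val driver = system.actorOf(Props[DriverSketch], "driver")
      system.actorOf(Props(new ExecutorSketch(driver)), "executor") // Ctrl-C to stop
    }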

6. CoarseGrainedExecutorBackend communicates with CoarseGrainedSchedulerBackend.

    private[spark] class CoarseGrainedExecutorBackend(
        driverUrl: String,
        executorId: String,
        hostPort: String,
        cores: Int,
        sparkProperties: Seq[(String, String)])
      extends Actor with ActorLogReceive with ExecutorBackend with Logging {

      Utils.checkHostPort(hostPort, "Expected hostport")

      var executor: Executor = null
      var driver: ActorSelection = null

      override def preStart() {
        logInfo("Connecting to driver: " + driverUrl)
        driver = context.actorSelection(driverUrl)
        driver ! RegisterExecutor(executorId, hostPort, cores) // register with the driver
        context.system.eventStream.subscribe(self, classOf[RemotingLifecycleEvent])
      }

      override def receiveWithLogging = {
        case RegisteredExecutor =>
          logInfo("Successfully registered with driver")
          // Make this host instead of hostPort ?
          executor = new Executor(executorId, Utils.parseHostPort(hostPort)._1, sparkProperties,
            false)

        case RegisterExecutorFailed(message) =>
          logError("Slave registration failed: " + message)
          System.exit(1)

        case LaunchTask(data) =>  // a task arrives from the driver
          if (executor == null) {
            logError("Received LaunchTask command but executor was null")
            System.exit(1)
          } else {
            val ser = SparkEnv.get.closureSerializer.newInstance()
            val taskDesc = ser.deserialize[TaskDescription](data.value)
            logInfo("Got assigned task " + taskDesc.taskId)
            executor.launchTask(this, taskDesc.taskId, taskDesc.name, taskDesc.serializedTask)
          }
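Note the symmetric serialize/deserialize pair: the driver serializes the task with its closure serializer, and the executor backend deserializes it with the same one. A sketch of that roundtrip using JavaSerializer, which is what closureSerializer defaults to (the payload here is arbitrary):

    import org.apache.spark.SparkConf
    import org.apache.spark.serializer.JavaSerializer

    object ClosureSerdeSketch {
      def main(args: Array[String]): Unit = {
        val ser = new JavaSerializer(new SparkConf()).newInstance()
        val payload: Seq[Int] = Seq(1, 2, 3)
        val buf = ser.serialize(payload)           // driver side: task -> ByteBuffer
        val back = ser.deserialize[Seq[Int]](buf)  // executor side: ByteBuffer -> task
        println(back) // List(1, 2, 3)
      }
    }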

7. executor.launchTask

    def launchTask(
        context: ExecutorBackend, taskId: Long, taskName: String, serializedTask: ByteBuffer) {
      val tr = new TaskRunner(context, taskId, taskName, serializedTask)
      runningTasks.put(taskId, tr)
      threadPool.execute(tr)
    }
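launchTask hands the TaskRunner to a thread pool and returns immediately; actual execution happens asynchronously in TaskRunner.run. A standalone sketch of the same pattern (the object, map, and helper names are mine; Spark's Executor uses a daemon cached thread pool and a ConcurrentHashMap of running tasks):

    import java.util.concurrent.{ConcurrentHashMap, Executors, TimeUnit}

    object LaunchTaskSketch {
      // Mirrors Executor's bookkeeping: a map of running tasks plus a cached thread pool.
      private val runningTasks = new ConcurrentHashMap[Long, Runnable]
      private val threadPool = Executors.newCachedThreadPool()

      def launchTask(taskId: Long, body: () => Unit): Unit = {
        val runner = new Runnable {
          override def run(): Unit =
            try body() finally runningTasks.remove(taskId) // drop the entry when the task finishes
        }
        runningTasks.put(taskId, runner)
        threadPool.execute(runner) // run asynchronously; launchTask itself returns at once
      }

      def main(args: Array[String]): Unit = {
        launchTask(1L, () => println("running task 1"))
        threadPool.shutdown()
        threadPool.awaitTermination(5, TimeUnit.SECONDS)
      }
    }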

To be continued in the next installment.

Original post: https://www.cnblogs.com/Torstan/p/4158650.html