Spark系列(八)Worker工作原理

时间：2016-04-10 20:52:09 阅读：428 评论：0 收藏：0 [点我收藏+]

标签：

工作原理图

源代码分析

包名：org.apache.spark.deploy.worker

启动driver入口点：registerWithMaster方法中的case LaunchDriver

            1            case LaunchDriver(driverId, driverDesc) => {       
         2                logInfo(s"Asked to launch driver $driverId")       
         3                // 创建DriverRunner对象启动Driver       
         4                val driver = new DriverRunner(       
         5                conf,       
         6                driverId,       
         7                workDir,       
         8                sparkHome,       
         9                driverDesc.copy(command = Worker.maybeUpdateSSLSettings(driverDesc.command, conf)),       
         10                self,       
         11                akkaUrl)       
         12                // 将driver加入本地缓存       
         13                drivers(driverId) = driver       
         14                driver.start()       
         15                    
         16                // 增加已使用core       
         17                coresUsed += driverDesc.cores       
         18                // 增加已使用内存       
         19                memoryUsed += driverDesc.mem       
         20            }       
 

DriverRunner

管理一个driver的执行，包括失败时自动重启driver,这种方式仅仅适用于standalone集群部署模式

DriverRunner类中start方法实现

            1            def start() = {       
         2                // 创建新线程       
         3                new Thread("DriverRunner for " + driverId) {       
         4                  override def run() {       
         5                    try {       
         6                      // 创建driver工作目录       
         7                      val driverDir = createWorkingDirectory()       
         8                      // 下载应用所需的的Jar包       
         9                      val localJarFilename = downloadUserJar(driverDir)       
         10                    
         11                      def substituteVariables(argument: String): String = argument match {       
         12                        case "{{WORKER_URL}}" => workerUrl       
         13                        case "{{USER_JAR}}" => localJarFilename       
         14                        case other => other       
         15                      }       
         16                    
         17                      // TODO: If we add ability to submit multiple jars they should also be added here       
         18                      // 构建ProcessBuilder对象，传入启动driver命令(所需内存大小)       
         19                      val builder = CommandUtils.buildProcessBuilder(driverDesc.command, driverDesc.mem,       
         20                        sparkHome.getAbsolutePath, substituteVariables)       
         21                      // 启动driver进程       
         22                      launchDriver(builder, driverDir, driverDesc.supervise)       
         23                    }       
         24                    catch {       
         25                      case e: Exception => finalException = Some(e)       
         26                    }       
         27                    
         28                    // Driver退出状态处理       
         29                    val state =       
         30                      if (killed) {       
         31                        DriverState.KILLED       
         32                      } else if (finalException.isDefined) {       
         33                        DriverState.ERROR       
         34                      } else {       
         35                        finalExitCode match {       
         36                          case Some(0) => DriverState.FINISHED       
         37                          case _ => DriverState.FAILED       
         38                        }       
         39                      }       
         40                    
         41                    finalState = Some(state)       
         42                    // 向Driver所属worker发送DriverStateChanged消息       
         43                    worker ! DriverStateChanged(driverId, state, finalException)       
         44                  }       
         45                }.start()       
         46            }       
 

LaunchExecutor

管理LaunchExecutor的启动

            1            case LaunchExecutor(masterUrl, appId, execId, appDesc, cores_, memory_) =>       
         2                if (masterUrl != activeMasterUrl) {       
         3                logWarning("Invalid Master (" + masterUrl + ") attempted to launch executor.")       
         4                } else {       
         5                try {       
         6                  logInfo("Asked to launch executor %s/%d for %s".format(appId, execId, appDesc.name))       
         7                    
         8                  // Create the executor‘s working directory       
         9                  // 创建executor本地工作目录       
         10                  val executorDir = new File(workDir, appId + "/" + execId)       
         11                  if (!executorDir.mkdirs()) {       
         12                    throw new IOException("Failed to create directory " + executorDir)       
         13                  }       
         14                    
         15                  // Create local dirs for the executor. These are passed to the executor via the       
         16                  // SPARK_LOCAL_DIRS environment variable, and deleted by the Worker when the       
         17                  // application finishes.       
         18                  val appLocalDirs = appDirectories.get(appId).getOrElse {       
         19                    Utils.getOrCreateLocalRootDirs(conf).map { dir =>       
         20                      Utils.createDirectory(dir).getAbsolutePath()       
         21                    }.toSeq       
         22                  }       
         23                  appDirectories(appId) = appLocalDirs       
         24                  // 创建ExecutorRunner对象       
         25                  val manager = new ExecutorRunner(       
         26                    appId,       
         27                    execId,       
         28                    appDesc.copy(command = Worker.maybeUpdateSSLSettings(appDesc.command, conf)),       
         29                    cores_,       
         30                    memory_,       
         31                    self,       
         32                    workerId,       
         33                    host,       
         34                    webUi.boundPort,       
         35                    publicAddress,       
         36                    sparkHome,       
         37                    executorDir,       
         38                    akkaUrl,       
         39                    conf,       
         40                    appLocalDirs, ExecutorState.LOADING)       
         41                  // executor加入本地缓存       
         42                  executors(appId + "/" + execId) = manager       
         43                  manager.start()       
         44                  // 增加worker已使用core       
         45                  coresUsed += cores_       
         46                  // 增加worker已使用memory       
         47                  memoryUsed += memory_       
         48                  // 通知master发送ExecutorStateChanged消息       
         49                  master ! ExecutorStateChanged(appId, execId, manager.state, None, None)       
         50                }       
         51                // 异常情况处理，通知master发送ExecutorStateChanged FAILED消息       
         52                catch {       
         53                  case e: Exception => {       
         54                    logError(s"Failed to launch executor $appId/$execId for ${appDesc.name}.", e)       
         55                    if (executors.contains(appId + "/" + execId)) {       
         56                      executors(appId + "/" + execId).kill()       
         57                      executors -= appId + "/" + execId       
         58                    }       
         59                    master ! ExecutorStateChanged(appId, execId, ExecutorState.FAILED,       
         60                      Some(e.toString), None)       
         61                  }       
         62                }       
         63            }       
 

总结

1、Worker、Driver、Application启动后都会向Master进行注册,并缓存到Master内存数据模型中
2、完成注册后发送LaunchExecutor、LaunchDriver到Worker
3、Worker收到消息后启动executor和driver进程，并调用Worker的ExecutorStateChanged和DriverStateChanged方法
4、发送ExecutorStateChanged和DriverStateChanged消息到Master的，根据各自的状态信息进行处理，最重要的是会调用schedule方法进行资源的重新调度

Spark系列(八)Worker工作原理

标签：

原文地址：http://www.cnblogs.com/jianyuan/p/Spark系列之Worker工作原理.html

踩

(0)

评论一句话评论（0）

分享档案

更多>

2021年07月29日 (22)
2021年07月28日 (40)
2021年07月27日 (32)
2021年07月26日 (79)
2021年07月23日 (29)
2021年07月22日 (30)
2021年07月21日 (42)
2021年07月20日 (16)
2021年07月19日 (90)
2021年07月16日 (35)

周排行

1	case LaunchDriver(driverId, driverDesc) => {
2	logInfo(s"Asked to launch driver $driverId")
3	// 创建DriverRunner对象启动Driver
4	val driver = new DriverRunner(
5	conf,
6	driverId,
7	workDir,
8	sparkHome,
9	driverDesc.copy(command = Worker.maybeUpdateSSLSettings(driverDesc.command, conf)),
10	self,
11	akkaUrl)
12	// 将driver加入本地缓存
13	drivers(driverId) = driver
14	driver.start()
15
16	// 增加已使用core
17	coresUsed += driverDesc.cores
18	// 增加已使用内存
19	memoryUsed += driverDesc.mem
20	}

1	def start() = {
2	// 创建新线程
3	new Thread("DriverRunner for " + driverId) {
4	override def run() {
5	try {
6	// 创建driver工作目录
7	val driverDir = createWorkingDirectory()
8	// 下载应用所需的的Jar包
9	val localJarFilename = downloadUserJar(driverDir)
10
11	def substituteVariables(argument: String): String = argument match {
12	case "{{WORKER_URL}}" => workerUrl
13	case "{{USER_JAR}}" => localJarFilename
14	case other => other
15	}
16
17	// TODO: If we add ability to submit multiple jars they should also be added here
18	// 构建ProcessBuilder对象，传入启动driver命令(所需内存大小)
19	val builder = CommandUtils.buildProcessBuilder(driverDesc.command, driverDesc.mem,
20	sparkHome.getAbsolutePath, substituteVariables)
21	// 启动driver进程
22	launchDriver(builder, driverDir, driverDesc.supervise)
23	}
24	catch {
25	case e: Exception => finalException = Some(e)
26	}
27
28	// Driver退出状态处理
29	val state =
30	if (killed) {
31	DriverState.KILLED
32	} else if (finalException.isDefined) {
33	DriverState.ERROR
34	} else {
35	finalExitCode match {
36	case Some(0) => DriverState.FINISHED
37	case _ => DriverState.FAILED
38	}
39	}
40
41	finalState = Some(state)
42	// 向Driver所属worker发送DriverStateChanged消息
43	worker ! DriverStateChanged(driverId, state, finalException)
44	}
45	}.start()
46	}

1	case LaunchExecutor(masterUrl, appId, execId, appDesc, cores_, memory_) =>
2	if (masterUrl != activeMasterUrl) {
3	logWarning("Invalid Master (" + masterUrl + ") attempted to launch executor.")
4	} else {
5	try {
6	logInfo("Asked to launch executor %s/%d for %s".format(appId, execId, appDesc.name))
7
8	// Create the executor‘s working directory
9	// 创建executor本地工作目录
10	val executorDir = new File(workDir, appId + "/" + execId)
11	if (!executorDir.mkdirs()) {
12	throw new IOException("Failed to create directory " + executorDir)
13	}
14
15	// Create local dirs for the executor. These are passed to the executor via the
16	// SPARK_LOCAL_DIRS environment variable, and deleted by the Worker when the
17	// application finishes.
18	val appLocalDirs = appDirectories.get(appId).getOrElse {
19	Utils.getOrCreateLocalRootDirs(conf).map { dir =>
20	Utils.createDirectory(dir).getAbsolutePath()
21	}.toSeq
22	}
23	appDirectories(appId) = appLocalDirs
24	// 创建ExecutorRunner对象
25	val manager = new ExecutorRunner(
26	appId,
27	execId,
28	appDesc.copy(command = Worker.maybeUpdateSSLSettings(appDesc.command, conf)),
29	cores_,
30	memory_,
31	self,
32	workerId,
33	host,
34	webUi.boundPort,
35	publicAddress,
36	sparkHome,
37	executorDir,
38	akkaUrl,
39	conf,
40	appLocalDirs, ExecutorState.LOADING)
41	// executor加入本地缓存
42	executors(appId + "/" + execId) = manager
43	manager.start()
44	// 增加worker已使用core
45	coresUsed += cores_
46	// 增加worker已使用memory
47	memoryUsed += memory_
48	// 通知master发送ExecutorStateChanged消息
49	master ! ExecutorStateChanged(appId, execId, manager.state, None, None)
50	}
51	// 异常情况处理，通知master发送ExecutorStateChanged FAILED消息
52	catch {
53	case e: Exception => {
54	logError(s"Failed to launch executor $appId/$execId for ${appDesc.name}.", e)
55	if (executors.contains(appId + "/" + execId)) {
56	executors(appId + "/" + execId).kill()
57	executors -= appId + "/" + execId
58	}
59	master ! ExecutorStateChanged(appId, execId, ExecutorState.FAILED,
60	Some(e.toString), None)
61	}
62	}
63	}