[SPARK-22839] [K8s] Refactor to unify driver and executor pod builder APIs #20910
**New file** (hunk `@@ -0,0 +1,158 @@`) — introduces `KubernetesConf`, a single configuration type shared by the driver and executor pod builders:

```scala
/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.spark.deploy.k8s

import io.fabric8.kubernetes.api.model.Pod

import org.apache.spark.SparkConf
import org.apache.spark.deploy.k8s.Config._
import org.apache.spark.deploy.k8s.Constants._
import org.apache.spark.deploy.k8s.submit.{JavaMainAppResource, MainAppResource}
import org.apache.spark.internal.config.ConfigEntry

private[spark] sealed trait KubernetesRoleSpecificConf

private[spark] case class KubernetesDriverSpecificConf(
    mainAppResource: Option[MainAppResource],
    mainClass: String,
    appName: String,
    appArgs: Seq[String]) extends KubernetesRoleSpecificConf

private[spark] case class KubernetesExecutorSpecificConf(
    executorId: String, driverPod: Pod)
  extends KubernetesRoleSpecificConf

private[spark] class KubernetesConf[T <: KubernetesRoleSpecificConf](
    val sparkConf: SparkConf,
    val roleSpecificConf: T,
    val appResourceNamePrefix: String,
    val appId: String,
    val roleLabels: Map[String, String],
    val roleAnnotations: Map[String, String],
    val roleSecretNamesToMountPaths: Map[String, String]) {

  def namespace(): String = sparkConf.get(KUBERNETES_NAMESPACE)

  def sparkJars(): Seq[String] = sparkConf
    .getOption("spark.jars")
    .map(str => str.split(",").toSeq)
    .getOrElse(Seq.empty[String])

  def sparkFiles(): Seq[String] = sparkConf
    .getOption("spark.files")
    .map(str => str.split(",").toSeq)
    .getOrElse(Seq.empty[String])

  def driverCustomEnvs(): Seq[(String, String)] =
    sparkConf.getAllWithPrefix(KUBERNETES_DRIVER_ENV_KEY).toSeq

  def imagePullPolicy(): String = sparkConf.get(CONTAINER_IMAGE_PULL_POLICY)

  def nodeSelector(): Map[String, String] =
    KubernetesUtils.parsePrefixedKeyValuePairs(sparkConf, KUBERNETES_NODE_SELECTOR_PREFIX)

  def get[T](config: ConfigEntry[T]): T = sparkConf.get(config)

  def get(conf: String, defaultValue: String): String = sparkConf.get(conf, defaultValue)

  def getOption(key: String): Option[String] = sparkConf.getOption(key)
}

private[spark] object KubernetesConf {
  def createDriverConf(
      sparkConf: SparkConf,
      appName: String,
      appResourceNamePrefix: String,
      appId: String,
      mainAppResource: Option[MainAppResource],
      mainClass: String,
      appArgs: Array[String]): KubernetesConf[KubernetesDriverSpecificConf] = {
    val sparkConfWithMainAppJar = sparkConf.clone()
    mainAppResource.foreach {
      case JavaMainAppResource(res) =>
        val previousJars = sparkConf
          .getOption("spark.jars")
          .map(_.split(","))
          .getOrElse(Array.empty)
        if (!previousJars.contains(res)) {
          sparkConfWithMainAppJar.setJars(previousJars ++ Seq(res))
        }
    }
    val driverCustomLabels = KubernetesUtils.parsePrefixedKeyValuePairs(
      sparkConf,
      KUBERNETES_DRIVER_LABEL_PREFIX)
    require(!driverCustomLabels.contains(SPARK_APP_ID_LABEL), "Label with key " +
      s"$SPARK_APP_ID_LABEL is not allowed as it is reserved for Spark bookkeeping " +
      "operations.")
    require(!driverCustomLabels.contains(SPARK_ROLE_LABEL), "Label with key " +
      s"$SPARK_ROLE_LABEL is not allowed as it is reserved for Spark bookkeeping " +
      "operations.")
    val driverLabels = driverCustomLabels ++ Map(
      SPARK_APP_ID_LABEL -> appId,
      SPARK_ROLE_LABEL -> SPARK_POD_DRIVER_ROLE)
    val driverAnnotations =
      KubernetesUtils.parsePrefixedKeyValuePairs(sparkConf, KUBERNETES_DRIVER_ANNOTATION_PREFIX)
    val driverSecretNamesToMountPaths =
      KubernetesUtils.parsePrefixedKeyValuePairs(sparkConf, KUBERNETES_DRIVER_SECRETS_PREFIX)
    new KubernetesConf(
      sparkConfWithMainAppJar,
      KubernetesDriverSpecificConf(mainAppResource, mainClass, appName, appArgs),
      appResourceNamePrefix,
      appId,
      driverLabels,
      driverAnnotations,
      driverSecretNamesToMountPaths)
  }

  def createExecutorConf(
      sparkConf: SparkConf,
      executorId: String,
      appId: String,
      driverPod: Pod): KubernetesConf[KubernetesExecutorSpecificConf] = {
    val executorCustomLabels = KubernetesUtils.parsePrefixedKeyValuePairs(
      sparkConf,
      KUBERNETES_EXECUTOR_LABEL_PREFIX)
    require(
      !executorCustomLabels.contains(SPARK_APP_ID_LABEL),
      s"Custom executor labels cannot contain $SPARK_APP_ID_LABEL as it is reserved for Spark.")
    require(
      !executorCustomLabels.contains(SPARK_EXECUTOR_ID_LABEL),
      s"Custom executor labels cannot contain $SPARK_EXECUTOR_ID_LABEL as it is reserved for" +
        " Spark.")
    require(
      !executorCustomLabels.contains(SPARK_ROLE_LABEL),
      s"Custom executor labels cannot contain $SPARK_ROLE_LABEL as it is reserved for Spark.")
    val executorLabels = Map(
      SPARK_EXECUTOR_ID_LABEL -> executorId,
      SPARK_APP_ID_LABEL -> appId,
      SPARK_ROLE_LABEL -> SPARK_POD_EXECUTOR_ROLE) ++
      executorCustomLabels
    val executorAnnotations =
      KubernetesUtils.parsePrefixedKeyValuePairs(sparkConf, KUBERNETES_EXECUTOR_ANNOTATION_PREFIX)
    val executorSecrets =
      KubernetesUtils.parsePrefixedKeyValuePairs(sparkConf, KUBERNETES_EXECUTOR_SECRETS_PREFIX)
    new KubernetesConf(
      sparkConf.clone(),
      KubernetesExecutorSpecificConf(executorId, driverPod),
      sparkConf.get(KUBERNETES_EXECUTOR_POD_NAME_PREFIX),
      appId,
      executorLabels,
      executorAnnotations,
      executorSecrets)
  }
}
```

> **Contributor** (inline comment on the `val driverCustomLabels = KubernetesUtils.parsePrefixedKeyValuePairs(` line): Can you add a new line before this line?
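For orientation, here is a minimal usage sketch of the driver factory above. It is not part of the PR: the label value and app coordinates are invented, it assumes `KUBERNETES_DRIVER_LABEL_PREFIX` resolves to the documented `spark.kubernetes.driver.label.` prefix, and since the API is `private[spark]` it would have to live under the `org.apache.spark` package:

```scala
import org.apache.spark.SparkConf
import org.apache.spark.deploy.k8s.KubernetesConf
import org.apache.spark.deploy.k8s.submit.JavaMainAppResource

// Custom label picked up by parsePrefixedKeyValuePairs (prefix assumed).
val conf = new SparkConf(false)
  .set("spark.kubernetes.driver.label.team", "data-eng")

val driverConf = KubernetesConf.createDriverConf(
  conf,
  appName = "demo",
  appResourceNamePrefix = "demo-prefix",  // illustrative values throughout
  appId = "spark-app-1",
  mainAppResource = Some(JavaMainAppResource("local:///opt/spark/app.jar")),
  mainClass = "org.example.Main",
  appArgs = Array.empty)

// roleLabels holds the custom label plus the two reserved bookkeeping
// labels (SPARK_APP_ID_LABEL -> appId, SPARK_ROLE_LABEL -> driver role).
assert(driverConf.roleLabels("team") == "data-eng")
```

The executor side is symmetric via `createExecutorConf`, which additionally stamps `SPARK_EXECUTOR_ID_LABEL` and rejects it in custom labels.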
**`DriverMountSecretsStep` replaced by `KubernetesSpec`** — the mount-secrets driver step gives way to a plain spec type (hunk `@@ -14,25 +14,18 @@`):

```diff
@@ -14,25 +14,18 @@
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */
-package org.apache.spark.deploy.k8s.submit.steps
+package org.apache.spark.deploy.k8s

-import org.apache.spark.deploy.k8s.MountSecretsBootstrap
-import org.apache.spark.deploy.k8s.submit.KubernetesDriverSpec
+import io.fabric8.kubernetes.api.model.HasMetadata

-/**
- * A driver configuration step for mounting user-specified secrets onto user-specified paths.
- *
- * @param bootstrap a utility actually handling mounting of the secrets.
- */
-private[spark] class DriverMountSecretsStep(
-    bootstrap: MountSecretsBootstrap) extends DriverConfigurationStep {
+private[k8s] case class KubernetesSpec(
+    pod: SparkPod,
+    additionalDriverKubernetesResources: Seq[HasMetadata],
+    podJavaSystemProperties: Map[String, String])

-  override def configureDriver(driverSpec: KubernetesDriverSpec): KubernetesDriverSpec = {
-    val pod = bootstrap.addSecretVolumes(driverSpec.driverPod)
-    val container = bootstrap.mountSecrets(driverSpec.driverContainer)
-    driverSpec.copy(
-      driverPod = pod,
-      driverContainer = container
-    )
-  }
+private[k8s] object KubernetesSpec {
+  def initialSpec(initialProps: Map[String, String]): KubernetesSpec = KubernetesSpec(
+    SparkPod.initialPod(),
+    Seq.empty,
+    initialProps)
 }
```
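A quick sketch of how the new spec is seeded (hedged: `KubernetesSpec` is `private[k8s]`, so this would sit inside `org.apache.spark.deploy.k8s`, and the property key is illustrative):

```scala
// Seed a spec: empty pod, no extra Kubernetes resources, and the
// caller-supplied Java system properties for the driver.
val spec = KubernetesSpec.initialSpec(Map("spark.app.id" -> "spark-app-1"))

assert(spec.additionalDriverKubernetesResources.isEmpty)
assert(spec.podJavaSystemProperties("spark.app.id") == "spark-app-1")
```

Downstream feature steps can then return enriched copies via the generated `copy` method instead of mutating shared state, which is the point of unifying the builder APIs around immutable values.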
**This file was deleted.** (Its contents are collapsed in the diff view.)
**`DriverConfigurationStep` replaced by `SparkPod`** — the step trait is replaced by an immutable pod-plus-container value (hunk `@@ -14,17 +14,16 @@`):

```diff
@@ -14,17 +14,16 @@
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */
-package org.apache.spark.deploy.k8s.submit.steps
+package org.apache.spark.deploy.k8s

-import org.apache.spark.deploy.k8s.submit.KubernetesDriverSpec
+import io.fabric8.kubernetes.api.model.{Container, ContainerBuilder, Pod, PodBuilder}

-/**
- * Represents a step in configuring the Spark driver pod.
- */
-private[spark] trait DriverConfigurationStep {
+private[spark] case class SparkPod(pod: Pod, container: Container)

-  /**
-   * Apply some transformation to the previous state of the driver to add a new feature to it.
-   */
-  def configureDriver(driverSpec: KubernetesDriverSpec): KubernetesDriverSpec
+private[spark] object SparkPod {
+  def initialPod(): SparkPod = {
+    SparkPod(
+      new PodBuilder().withNewMetadata().endMetadata().withNewSpec().endSpec().build(),
+      new ContainerBuilder().build())
+  }
 }
```
> **Review comment:** Maybe this should be a `case class`? This seems like a struct-like object, which inclines me to think using a `case class` is more idiomatic here.
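To illustrate the reviewer's point: with a `case class`, each builder step can return a fresh immutable snapshot via `copy`, and equality is structural rather than by reference. A hypothetical decoration step (the container name here is an assumption, not taken from this diff):

```scala
import io.fabric8.kubernetes.api.model.ContainerBuilder

val base = SparkPod.initialPod()
// fabric8 builders can start from an existing object, so a step can
// decorate the container without touching the original SparkPod.
val named = base.copy(
  container = new ContainerBuilder(base.container)
    .withName("spark-kubernetes-driver")  // hypothetical name
    .build())

assert(base != named)  // case classes compare by value, not by reference
```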