Changes from 1 commit
25 commits
fb5b9ed
initial architecture for PySpark w/o dockerfile work
ifilonenko Apr 16, 2018
b7b3db0
included entrypoint logic
ifilonenko Apr 17, 2018
98cef8c
satisfying integration tests
ifilonenko Apr 18, 2018
dc670dc
end-to-end working pyspark
ifilonenko Apr 18, 2018
eabe4b9
Merge pull request #1 from ifilonenko/py-spark
ifilonenko Apr 18, 2018
8d3debb
resolved comments and fixed --pyfiles issue and allowed for python2 o…
ifilonenko May 2, 2018
91e2a2c
Merge pull request #2 from ifilonenko/py-spark
ifilonenko May 2, 2018
5761ee8
Merge branch 'master' of https://github.com/ifilonenko/spark
ifilonenko May 2, 2018
98cc044
restructured step based pattern to resolve comments
ifilonenko May 7, 2018
678d381
Merge pull request #3 from ifilonenko/py-spark
ifilonenko May 7, 2018
bf738dc
resolved comments
ifilonenko May 8, 2018
c59068d
Merge pull request #4 from ifilonenko/py-spark
ifilonenko May 8, 2018
0344f90
resolving style issues
ifilonenko May 9, 2018
306f3ed
Merge pull request #5 from ifilonenko/py-spark
ifilonenko May 9, 2018
f2fc53e
resolved commits
ifilonenko May 13, 2018
6f66d60
merge conflicts
ifilonenko May 13, 2018
914ff75
resolve rebase conflicts
ifilonenko May 11, 2018
d400607
import statements refactoring
ifilonenko May 13, 2018
72953a3
Merge branch 'py-spark'
ifilonenko May 13, 2018
7bedeb6
resolved comments
ifilonenko May 31, 2018
1801e96
merge conflicts
ifilonenko May 31, 2018
24a704e
setIfMissing
ifilonenko Jun 1, 2018
6a6d69d
added e2e tests on --py-files and inclusion of docs on config values
ifilonenko Jun 7, 2018
ab92913
style issues
ifilonenko Jun 7, 2018
a61d897
resolve comments on docs and addition of unit test
ifilonenko Jun 8, 2018
satisfying integration tests
ifilonenko committed Apr 18, 2018
commit 98cef8ceb0f04cfcefbc482c2a0fe39c75f620c4
@@ -696,7 +696,9 @@ private[spark] class SparkSubmit extends Logging {
if (args.isPython) {
Contributor
This logic appears to be duplicated from YARN; would it make sense to factor this out into a common function?

Contributor
We chatted about this offline, and while it's close it's not exactly the same, so we can live with minor duplication for now.
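For illustration only, a minimal sketch of what a shared helper might look like if the logic were factored out. The helper name `pythonChildArgs` and its placement are assumptions, not code from this PR, and in practice the YARN and Kubernetes branches pass slightly different flag names, which is why (per the reply above) the duplication was kept.

```scala
// Hypothetical sketch (not part of this PR): a method inside SparkSubmit that both
// the YARN and Kubernetes branches could call to build the Python child arguments.
private def pythonChildArgs(args: SparkSubmitArguments): Seq[String] = {
  val base = Seq(
    "--primary-py-file", args.primaryResource,
    "--main-class", "org.apache.spark.deploy.PythonRunner")
  // Only forward --other-py-files when --py-files was actually supplied.
  val extra = Option(args.pyFiles).toSeq.flatMap(files => Seq("--other-py-files", files))
  base ++ extra
}
```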

childArgs ++= Array("--primary-py-file", args.primaryResource)
childArgs ++= Array("--main-class", "org.apache.spark.deploy.PythonRunner")
childArgs ++= Array("--other-py-files", args.pyFiles)
if (args.pyFiles != null) {
childArgs ++= Array("--other-py-files", args.pyFiles)
}
} else {
childArgs ++= Array("--primary-java-resource", args.primaryResource)
childArgs ++= Array("--main-class", args.mainClass)
@@ -67,10 +67,8 @@ private[spark] case class KubernetesConf[T <: KubernetesRoleSpecificConf](
.map(str => str.split(",").toSeq)
.getOrElse(Seq.empty[String])

- def pyFiles(): Seq[String] = sparkConf
+ def pyFiles(): Option[String] = sparkConf
  .get(KUBERNETES_PYSPARK_PY_FILES)
- .map(str => str.split(",").toSeq)
- .getOrElse(Seq.empty[String])

def pySparkMainResource(): Option[String] = sparkConf
Contributor
This seems redundant with the driver-specific Spark conf's MainAppResource. Perhaps remove the need to specify this twice?

Contributor Author
I need to parse out the MainAppResource (which I thought we should be doing only once); as such, I thought it would be cleaner to do it this way.

.get(KUBERNETES_PYSPARK_MAIN_APP_RESOURCE)
@@ -77,7 +77,7 @@ private[spark] class BasicDriverFeatureStep(
("cpu", new QuantityBuilder(false).withAmount(limitCores).build())
}

- val driverContainer = new ContainerBuilder(pod.container)
+ val withoutArgsDriverContainer: ContainerBuilder = new ContainerBuilder(pod.container)
Contributor
The previous name seemed clearer to me.

Contributor
Is there a corresponding driver container with args?

Contributor Author
Yes, look below.

Contributor
But we do set arguments on this one, right? If not, please insert whitespace so I can see the difference visually.

.withName(DRIVER_CONTAINER_NAME)
.withImage(driverContainerImage)
.withImagePullPolicy(conf.imagePullPolicy())
@@ -97,12 +97,20 @@ private[spark] class BasicDriverFeatureStep(
.addToArgs(driverDockerContainer)
.addToArgs("--properties-file", SPARK_CONF_PATH)
.addToArgs("--class", conf.roleSpecificConf.mainClass)
- // The user application jar is merged into the spark.jars list and managed through that
- // property, so there is no need to reference it explicitly here.
- .addToArgs(SparkLauncher.NO_RESOURCE)
- .addToArgs(conf.roleSpecificConf.appArgs: _*)
- .build()

+ val driverContainer =
+   if (driverDockerContainer == "driver-py") {
Contributor
Wondering if we can discover whether it's a Python application in a better way here. Probably using the built-up Spark conf?

Contributor Author
We can check the appResource, but that was already done. I thought it would be overkill to check twice since it was already handled when setting driverDockerContainer.

Contributor
I think in general I'd prefer having two separate step types here. They can share some logic in either a utils class or a shared superclass, but you would only apply one step type for Java apps and another for Python apps.

Another way is to have the basic driver step only do work that is strictly agnostic of Python vs. Java, and then have a separate step for either Java or Python; the orchestrator picks which one to invoke based on the app resource type. To do this I think the step's constructor needs to take more than just the KubernetesConf as an argument - it needs to take the appropriate specifically-typed MainAppResource as an argument in the constructor as well. This breaks the convention that we've set so far, but for now that's probably ok, as long as we don't get parameter-length blowup as we go forward.
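As a rough sketch of this second approach (the orchestrator selects the bindings step and hands it the specifically-typed resource); the constructor signature and the helper `selectBindingsStep` below are assumptions based on this comment, not code from the PR:

```scala
// Hypothetical sketch: a Python-specific step whose constructor receives the
// specifically-typed main app resource chosen by the orchestrator. In the real
// code this would extend the feature-config-step trait used by the other steps.
class PythonDriverFeatureStep(
    conf: KubernetesConf[KubernetesDriverSpecificConf],
    mainResource: PythonMainAppResource) {
  def configurePod(pod: SparkPod): SparkPod = {
    // ...set ENV_PYSPARK_PRIMARY / ENV_PYSPARK_FILES from mainResource and conf...
    pod
  }
}

// The orchestrator would then pick and construct the step from the typed resource:
def selectBindingsStep(conf: KubernetesConf[KubernetesDriverSpecificConf]) =
  conf.roleSpecificConf.mainAppResource.collect {
    case res: PythonMainAppResource => new PythonDriverFeatureStep(conf, res)
  }
```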

Contributor Author
The second way is the approach that I envisioned and tried to implement. It seems that the approach (without putting too much work on the KubernetesConf) breaks the contract we defined, though.

Contributor
So what about applications which need Python support (e.g. have Python UDFs) but don't use a Python driver process?

Contributor
> So what about applications which need Python support (e.g. have Python UDFs) but don't use a Python driver process?

I think that's up to the user to make it work; I don't see this being specifically handled by the other cluster managers.

The goal of this PR should be to bring Kubernetes up to par with the other cluster managers with respect to what they provide. Do the other cluster managers provide any specific support for this?

Contributor Author
We currently only run the Python (and future R) step when we are leveraging a Python (or R) driver process. Otherwise the user would just specify the spark-py Docker image, no? And then continue to run a non-Python driver process.

Contributor
Sorry, I forgot that folks could specify the driver container separately from the worker container; never mind.

Contributor
@ifilonenko I think this still needs some work to clean up.

What I expect to happen is to have three step types:

  1. BasicDriverFeatureStep, which is what's here except we don't provide the args to the container in this step anymore.
  2. PythonDriverFeatureStep, which does what the PythonDriverFeatureStep does currently, plus adds the driver-py argument
  3. JavaDriverFeatureStep, which only adds the arguments SparkLauncher.NO_RESOURCE, conf.roleSpecificConf.appArgs, etc.

Then in the KubernetesDriverBuilder, always apply the first step, and select which of 2 or 3 to apply based on the app resource type.
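A minimal sketch of how that selection could look in the KubernetesDriverBuilder; `provideBasicStep` and `provideJavaStep` are assumed names used for illustration (only `providePythonStep` appears in this PR), and the step bodies are elided:

```scala
// Sketch only: always apply the basic (args-free) step, then exactly one
// bindings step chosen from the typed main app resource.
val basicStep = provideBasicStep(kubernetesConf) // sets up the container without args

val bindingsStep = kubernetesConf.roleSpecificConf.mainAppResource match {
  case Some(PythonMainAppResource(_)) =>
    providePythonStep(kubernetesConf) // adds the driver-py arg and the PySpark envs
  case _ =>
    provideJavaStep(kubernetesConf)   // adds SparkLauncher.NO_RESOURCE and the app args
}

val allFeatures: Seq[KubernetesFeatureConfigStep] = Seq(basicStep, bindingsStep)
```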

Contributor Author
Agreed. I didn't know if we wanted to include a JavaDriverFeatureStep. I will do so then.

+     withoutArgsDriverContainer
+       .addToArgs(conf.roleSpecificConf.appArgs: _*)
+       .build()
+   } else {
+     // The user application jar is merged into the spark.jars list and managed through that
+     // property, so there is no need to reference it explicitly here.
+     withoutArgsDriverContainer
+       .addToArgs(SparkLauncher.NO_RESOURCE)
+       .addToArgs(conf.roleSpecificConf.appArgs: _*)
+       .build()
+   }
val driverPod = new PodBuilder(pod.pod)
.editOrNewMetadata()
.withName(driverPodName)
@@ -30,15 +30,17 @@ private[spark] class PythonDriverFeatureStep(
override def configurePod(pod: SparkPod): SparkPod = {
val mainResource = kubernetesConf.pySparkMainResource()
require(mainResource.isDefined, "PySpark Main Resource must be defined")
- val otherPyFiles = kubernetesConf.pyFiles()
+ val otherPyFiles = kubernetesConf.pyFiles().map(pyFile =>
+   KubernetesUtils.resolveFileUrisAndPath(pyFile.split(","))
+     .mkString(",")).getOrElse("null")
val withPythonPrimaryFileContainer = new ContainerBuilder(pod.container)
.addNewEnv()
.withName(ENV_PYSPARK_PRIMARY)
.withValue(KubernetesUtils.resolveFileUri(mainResource.get))
.endEnv()
.addNewEnv()
.withName(ENV_PYSPARK_FILES)
- .withValue(KubernetesUtils.resolveFileUrisAndPath(otherPyFiles).mkString(","))
+ .withValue(if (otherPyFiles == "") {"null"} else otherPyFiles)
.endEnv()
.build()
SparkPod(pod.pod, withPythonPrimaryFileContainer)
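For context on the `"null"` sentinel set above, a hedged sketch of how a consumer of that environment variable might interpret it; the variable name `PYSPARK_FILES` is an assumption about what `ENV_PYSPARK_FILES` resolves to, and this is not code from the PR:

```scala
// Sketch only: treat an unset, empty, or "null" PYSPARK_FILES value as "no extra files".
val extraPyFiles: Seq[String] = sys.env.get("PYSPARK_FILES") match {
  case None | Some("") | Some("null") => Seq.empty
  case Some(files)                    => files.split(",").toSeq
}
```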
@@ -45,9 +45,11 @@ private[spark] class KubernetesDriverBuilder(
provideServiceStep(kubernetesConf))
val maybeRoleSecretNamesStep = if (kubernetesConf.roleSecretNamesToMountPaths.nonEmpty) {
Some(provideSecretsStep(kubernetesConf)) } else None
- val maybeNonJVMBindings = kubernetesConf.roleSpecificConf.mainAppResource.map {
-   case PythonMainAppResource(_) =>
-     providePythonStep(kubernetesConf)
+ val maybeNonJVMBindings = kubernetesConf.roleSpecificConf.mainAppResource.getOrElse(None)
+   match {
+     case PythonMainAppResource(_) =>
+       Some(providePythonStep(kubernetesConf))
+     case _ => None
}
val allFeatures: Seq[KubernetesFeatureConfigStep] =
baseFeatures ++
@@ -65,4 +65,35 @@ class PythonDriverFeatureStepSuite extends SparkFunSuite {
assert(envs(ENV_PYSPARK_PRIMARY) === expectedMainResource)
assert(envs(ENV_PYSPARK_FILES) === expectedPySparkFiles)
}
test("Python Step testing empty pyfiles") {
val mainResource = "local:///main.py"
val baseDriverPod = SparkPod.initialPod()
val sparkConf = new SparkConf(false)
.set(KUBERNETES_PYSPARK_MAIN_APP_RESOURCE, mainResource)
.set(KUBERNETES_PYSPARK_PY_FILES, "")
val kubernetesConf = KubernetesConf(
sparkConf,
KubernetesDriverSpecificConf(
Some(PythonMainAppResource("local:///main.py")),
"test-app",
"python-runner",
Seq.empty[String]),
"",
"",
Map.empty,
Map.empty,
Map.empty,
Map.empty,
Seq.empty[String])
val step = new PythonDriverFeatureStep(kubernetesConf)
val driverPod = step.configurePod(baseDriverPod).pod
val driverContainerwithPySpark = step.configurePod(baseDriverPod).container
assert(driverContainerwithPySpark.getEnv.size === 2)
val envs = driverContainerwithPySpark
.getEnv
.asScala
.map(env => (env.getName, env.getValue))
.toMap
assert(envs(ENV_PYSPARK_FILES) === "null")
}
}