[GitHub] spark pull request #19954: [SPARK-22757][Kubernetes] Enable use of remote de...

vanzin Wed, 20 Dec 2017 16:11:35 -0800

Github user vanzin commented on a diff in the pull request:

    https://github.com/apache/spark/pull/19954#discussion_r158167023
  
    --- Diff: resource-managers/kubernetes/core/src/main/scala/org/apache/spark/deploy/rest/k8s/SparkPodInitContainer.scala ---
    @@ -0,0 +1,119 @@
    +/*
    + * Licensed to the Apache Software Foundation (ASF) under one or more
    + * contributor license agreements.  See the NOTICE file distributed with
    + * this work for additional information regarding copyright ownership.
    + * The ASF licenses this file to You under the Apache License, Version 2.0
    + * (the "License"); you may not use this file except in compliance with
    + * the License.  You may obtain a copy of the License at
    + *
    + *    http://www.apache.org/licenses/LICENSE-2.0
    + *
    + * Unless required by applicable law or agreed to in writing, software
    + * distributed under the License is distributed on an "AS IS" BASIS,
    + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
    + * See the License for the specific language governing permissions and
    + * limitations under the License.
    + */
    +package org.apache.spark.deploy.rest.k8s
    +
    +import java.io.File
    +import java.util.concurrent.TimeUnit
    +
    +import scala.concurrent.{ExecutionContext, Future}
    +
    +import org.apache.spark.{SecurityManager => SparkSecurityManager, 
SparkConf}
    +import org.apache.spark.deploy.SparkHadoopUtil
    +import org.apache.spark.deploy.k8s.Config._
    +import org.apache.spark.internal.Logging
    +import org.apache.spark.util.{ThreadUtils, Utils}
    +
    +/**
    + * Process that fetches files from a resource staging server and/or arbitrary remote locations.
    + *
    + * The init-container can handle fetching files from any of those sources, but not all of the
    + * sources need to be specified. This allows for composing multiple instances of this container
    + * with different configurations for different download sources, or using the same container to
    + * download everything at once.
    + */
    +private[spark] class SparkPodInitContainer(
    +    sparkConf: SparkConf,
    +    fileFetcher: FileFetcher) extends Logging {
    +
    +  private val maxThreadPoolSize = 
sparkConf.get(INIT_CONTAINER_MAX_THREAD_POOL_SIZE)
    +  private implicit val downloadExecutor = 
ExecutionContext.fromExecutorService(
    +    ThreadUtils.newDaemonCachedThreadPool("download-executor", 
maxThreadPoolSize))
    +
    +  private val jarsDownloadDir = new File(
    +    sparkConf.get(JARS_DOWNLOAD_LOCATION))
    +  private val filesDownloadDir = new File(
    +    sparkConf.get(FILES_DOWNLOAD_LOCATION))
    +
    +  private val remoteJars = sparkConf.get(INIT_CONTAINER_REMOTE_JARS)
    +  private val remoteFiles = sparkConf.get(INIT_CONTAINER_REMOTE_FILES)
    +
    +  private val downloadTimeoutMinutes = 
sparkConf.get(INIT_CONTAINER_MOUNT_TIMEOUT)
    +
    +  def run(): Unit = {
    +    logInfo(s"Downloading remote jars: $remoteJars")
    +    downloadFiles(
    +      remoteJars,
    +      jarsDownloadDir,
    +      s"Remote jars download directory specified at $jarsDownloadDir does 
not exist " +
    +        "or is not a directory.")
    +
    +    logInfo(s"Downloading remote files: $remoteFiles")
    +    downloadFiles(
    +      remoteFiles,
    +      filesDownloadDir,
    +      s"Remote files download directory specified at $filesDownloadDir 
does not exist " +
    +        "or is not a directory.")
    +
    +    downloadExecutor.shutdown()
    +    downloadExecutor.awaitTermination(downloadTimeoutMinutes, 
TimeUnit.MINUTES)
    +  }
    +
    +  private def downloadFiles(
    +      filesCommaSeparated: Option[String],
    +      downloadDir: File,
    +      errMessageOnDestinationNotADirectory: String): Unit = {
    +    filesCommaSeparated.foreach { files =>
    +      require(downloadDir.isDirectory, 
errMessageOnDestinationNotADirectory)
    +      Utils.stringToSeq(files).foreach { file =>
    +        Future[Unit] {
    +          fileFetcher.fetchFile(file, downloadDir)
    +        }
    +
    --- End diff --
    
    Nit: remove the empty line after the `Future { ... }` block.



---

---------------------------------------------------------------------
To unsubscribe, e-mail: reviews-unsubscribe@spark.apache.org
For additional commands, e-mail: reviews-help@spark.apache.org

[GitHub] spark pull request #19954: [SPARK-22757][Kubernetes] Enable use of remote de...

Reply via email to