Github user vanzin commented on a diff in the pull request:

    https://github.com/apache/spark/pull/22504#discussion_r228672761
  
    --- Diff: core/src/main/scala/org/apache/spark/util/logging/DriverLogger.scala ---
    @@ -0,0 +1,206 @@
    +/*
    + * Licensed to the Apache Software Foundation (ASF) under one or more
    + * contributor license agreements.  See the NOTICE file distributed with
    + * this work for additional information regarding copyright ownership.
    + * The ASF licenses this file to You under the Apache License, Version 2.0
    + * (the "License"); you may not use this file except in compliance with
    + * the License.  You may obtain a copy of the License at
    + *
    + *    http://www.apache.org/licenses/LICENSE-2.0
    + *
    + * Unless required by applicable law or agreed to in writing, software
    + * distributed under the License is distributed on an "AS IS" BASIS,
    + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
    + * See the License for the specific language governing permissions and
    + * limitations under the License.
    + */
    +
    +package org.apache.spark.util.logging
    +
    +import java.io._
    +import java.util.concurrent.TimeUnit
    +
    +import org.apache.commons.io.FileUtils
    +import org.apache.hadoop.conf.Configuration
    +import org.apache.hadoop.fs.{FileSystem, FSDataOutputStream, Path}
    +import org.apache.hadoop.fs.permission.FsPermission
    +import org.apache.log4j.{FileAppender => Log4jFileAppender, _}
    +
    +import org.apache.spark.SparkConf
    +import org.apache.spark.internal.Logging
    +import org.apache.spark.internal.config._
    +import org.apache.spark.network.util.JavaUtils
    +import org.apache.spark.util.{ThreadUtils, Utils}
    +
    +private[spark] class DriverLogger(conf: SparkConf) extends Logging {
    +
    +  private val UPLOAD_CHUNK_SIZE = 1024 * 1024
    +  private val UPLOAD_INTERVAL_IN_SECS = 5
    +  private val DEFAULT_LAYOUT = "%d{yy/MM/dd HH:mm:ss.SSS} %t %p %c{1}: 
%m%n"
    +  private val LOG_FILE_PERMISSIONS = new 
FsPermission(Integer.parseInt("770", 8).toShort)
    +
    +  private var localLogFile: String = FileUtils.getFile(
    +    Utils.getLocalDir(conf),
    +    DriverLogger.DRIVER_LOG_DIR,
    +    DriverLogger.DRIVER_LOG_FILE).getAbsolutePath()
    +  private var writer: Option[DfsAsyncWriter] = None
    +
    +  addLogAppender()
    +
    +  private def addLogAppender(): Unit = {
    +    val appenders = LogManager.getRootLogger().getAllAppenders()
    +    val layout = if (conf.get(DRIVER_LOG_LAYOUT).isDefined) {
    +      new PatternLayout(conf.get(DRIVER_LOG_LAYOUT).get)
    +    } else if (appenders.hasMoreElements()) {
    +      appenders.nextElement().asInstanceOf[Appender].getLayout()
    +    } else {
    +      new PatternLayout(DEFAULT_LAYOUT)
    +    }
    +    val fa = new Log4jFileAppender(layout, localLogFile)
    +    fa.setName(DriverLogger.APPENDER_NAME)
    +    LogManager.getRootLogger().addAppender(fa)
    +    logInfo(s"Added a local log appender at: ${localLogFile}")
    +  }
    +
    +  def startSync(hadoopConf: Configuration): Unit = {
    +    try {
    +      // Setup a writer which moves the local file to hdfs continuously
    +      val appId = Utils.sanitizeDirName(conf.getAppId)
    +      writer = Some(new DfsAsyncWriter(appId, hadoopConf))
    +    } catch {
    +      case e: Exception =>
    +        logError(s"Could not persist driver logs to dfs", e)
    +    }
    +  }
    +
    +  def stop(): Unit = {
    +    try {
    +      val fa = 
LogManager.getRootLogger.getAppender(DriverLogger.APPENDER_NAME)
    +      LogManager.getRootLogger().removeAppender(DriverLogger.APPENDER_NAME)
    +      Utils.tryLogNonFatalError(fa.close())
    +      writer.foreach(_.closeWriter())
    +    } catch {
    +      case e: Exception =>
    +        logError(s"Error in persisting driver logs", e)
    +    } finally {
    +      Utils.tryLogNonFatalError {
    +        
JavaUtils.deleteRecursively(FileUtils.getFile(localLogFile).getParentFile())
    +      }
    +    }
    +  }
    +
    +  // Visible for testing
    +  private[spark] class DfsAsyncWriter(appId: String, hadoopConf: 
Configuration) extends Runnable
    +      with Logging {
    +
    +    private var streamClosed = false
    +    private var fileSystem: FileSystem = _
    +    private val dfsLogFile: String = {
    +      val rootDir = conf.get(DRIVER_LOG_DFS_DIR).get
    +      fileSystem = new Path(rootDir).getFileSystem(hadoopConf)
    --- End diff --
    
    This is actually super weird: `fileSystem` is a separate field, but it is being initialized inside the initializer of this field (`dfsLogFile`).
    
    It looks like you should just have an `init()` function, or maybe make `rootDir` a field so that you can initialize `fileSystem` more directly...
    
    (Sometimes I really miss Java constructors.)


---

---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]

Reply via email to