Github user wzhfy commented on a diff in the pull request:
https://github.com/apache/spark/pull/20611#discussion_r172716633
--- Diff:
sql/core/src/main/scala/org/apache/spark/sql/execution/command/tables.scala ---
@@ -385,8 +385,12 @@ case class LoadDataCommand(
val hadoopConf = sparkSession.sessionState.newHadoopConf()
val srcPath = new Path(hdfsUri)
val fs = srcPath.getFileSystem(hadoopConf)
- if (!fs.exists(srcPath)) {
- throw new AnalysisException(s"LOAD DATA input path does not exist: $path")
+ // A validaton logic is been added for non local files, Error will be thrown
+ // If hdfs path doest not exist or if no files matches the wild card defined
+ // in load path
+ if (null == fs.globStatus(srcPath) || fs.globStatus(srcPath).isEmpty) {
--- End diff --
Please add test cases for this change, e.g. paths containing '*', '?', etc.
---
---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]