Github user HyukjinKwon commented on a diff in the pull request: https://github.com/apache/spark/pull/21192#discussion_r189043012 --- Diff: sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/json/JSONOptions.scala --- @@ -120,8 +120,26 @@ private[sql] class JSONOptions( enc } - val lineSeparatorInRead: Option[Array[Byte]] = lineSeparator.map { lineSep => - lineSep.getBytes(encoding.getOrElse("UTF-8")) + /** + * A sequence of bytes between two consecutive json records in read. + * Format of the `lineSep` option is: + * selector (1 char) + separator spec (any length) | sequence of chars + * + * Currently the following selectors are supported: + * - 'x' + sequence of bytes in hexadecimal format. For example: "x0a 0d". --- End diff -- BTW, I misunderstood this PR because you had also proposed regex support earlier.
--- --------------------------------------------------------------------- To unsubscribe, e-mail: reviews-unsubscr...@spark.apache.org For additional commands, e-mail: reviews-h...@spark.apache.org