cloud-fan commented on code in PR #42462:
URL: https://github.com/apache/spark/pull/42462#discussion_r1299684790
##########
sql/core/src/main/scala/org/apache/spark/sql/functions.scala:
##########
@@ -7314,6 +7314,136 @@ object functions {
*/
def to_csv(e: Column): Column = to_csv(e, Map.empty[String, String].asJava)
+ // scalastyle:off line.size.limit
+
+ /**
+ * Parses a column containing an XML string into a `StructType` with the
specified schema.
+ * Returns `null`, in the case of an unparseable string.
+ *
+ * @param e a string column containing XML data.
+ * @param schema the schema to use when parsing the XML string
+ * @param options options to control how the XML is parsed. Accepts the same
options as the
+ * XML data source.
+ * See
+ * <a href=
+ *
"https://spark.apache.org/docs/latest/sql-data-sources-xml.html#data-source-option">
+ * Data Source Option</a> in the version you use.
+ * @group collection_funcs
+ * @since
+ */
+ // scalastyle:on line.size.limit
+ def from_xml(e: Column, schema: StructType, options: Map[String, String]):
Column = withExpr {
+ XmlToStructs(CharVarcharUtils.failIfHasCharVarchar(schema), options,
e.expr)
+ }
+
+ // scalastyle:off line.size.limit
+
+ /**
+ * Parses a column containing an XML string into a `StructType` with the
specified schema.
+ * Returns `null`, in the case of an unparseable string.
+ *
+ * @param e a string column containing XML data.
+ * @param schema the schema to use when parsing the XML string
+ * @param options options to control how the XML is parsed. Accepts the
same options as the
+ * XML data source.
+ * See
+ * <a href=
+ *
"https://spark.apache.org/docs/latest/sql-data-sources-xml.html#data-source-option">
+ * Data Source Option</a> in the version you use.
+ * @group collection_funcs
+ * @since
+ */
+ // scalastyle:on line.size.limit
+ def from_xml(e: Column, schema: DataType, options: Map[String, String]):
Column = withExpr {
Review Comment:
why do we add this API? looking at the code, `XmlToStructs.schema` must be
`StructType`, right?
--
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.
To unsubscribe, e-mail: [email protected]
For queries about this service, please contact Infrastructure at:
[email protected]
---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]