Github user HyukjinKwon commented on a diff in the pull request:
https://github.com/apache/spark/pull/19325#discussion_r140623030
--- Diff: python/pyspark/sql/tests.py ---
@@ -3256,11 +3256,9 @@ def test_vectorized_udf_null_string(self):
def test_vectorized_udf_zero_parameter(self):
from pyspark.sql.functions import pandas_udf
- import pandas as pd
- df = self.spark.range(10)
- f0 = pandas_udf(lambda **kwargs:
pd.Series(1).repeat(kwargs['length']), LongType())
- res = df.select(f0())
- self.assertEquals(df.select(lit(1)).collect(), res.collect())
+ with QuietTest(self.sc):
+ with self.assertRaisesRegexp(Exception, '0-parameter
pandas_udfs.*not.*supported'):
--- End diff --
I believe we could catch a narrower exception here, `NotImplementedError`, instead of the generic `Exception`.
---
---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]