Github user HyukjinKwon commented on a diff in the pull request:
https://github.com/apache/spark/pull/21107#discussion_r183230073
--- Diff: python/pyspark/ml/tests.py ---
@@ -2136,17 +2136,23 @@ class ImageReaderTest2(PySparkTestCase):
@classmethod
def setUpClass(cls):
super(ImageReaderTest2, cls).setUpClass()
+ cls.hive_available = True
# Note that here we enable Hive's support.
cls.spark = None
try:
cls.sc._jvm.org.apache.hadoop.hive.conf.HiveConf()
except py4j.protocol.Py4JError:
cls.tearDownClass()
- raise unittest.SkipTest("Hive is not available")
+ cls.hive_available = False
except TypeError:
cls.tearDownClass()
- raise unittest.SkipTest("Hive is not available")
- cls.spark = HiveContext._createForTesting(cls.sc)
+ cls.hive_available = False
+ if cls.hive_available:
+ cls.spark = HiveContext._createForTesting(cls.sc)
+
+ def setUp(self):
+ if not self.hive_available:
+ self.skipTest("Hive is not available.")
--- End diff --
```
Finished test(python3): pyspark.sql.tests (51s) ... 93 tests were skipped
...
Skipped tests in pyspark.sql.tests with python3:
test_createDataFrame_column_name_encoding
(pyspark.sql.tests.ArrowTests) ... skipped 'PyArrow >= 0.8.0 must be installed;
however, it was not found.'
...
test_collect_functions (pyspark.sql.tests.HiveContextSQLTests) ...
skipped 'Hive is not available.'
test_datetime_functions (pyspark.sql.tests.HiveContextSQLTests) ...
skipped 'Hive is not available.'
...
test_query_execution_listener_on_collect
(pyspark.sql.tests.QueryExecutionListenerTests) ... skipped
"'org.apache.spark.sql.TestQueryExecutionListener' is not available. Will skip
the related tests."
...
```
@viirya, @bersprockets and @BryanCutler, this was the output from a
partial test run in my local environment.
---
---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]