This is an automated email from the ASF dual-hosted git repository. stigahuang pushed a commit to branch master in repository https://gitbox.apache.org/repos/asf/impala.git
commit 0e3ae5c339fad3183ba8ce5c0c7d954e50dee091
Author: stiga-huang <[email protected]>
AuthorDate: Sun Apr 27 16:45:57 2025 +0800

IMPALA-13996: Deflake test_too_many_files by creating dedicated tables

TestAllowIncompleteData.test_too_many_files depends on tpch_parquet.lineitem having exactly 3 data files. This is false in erasure coding builds, in which tpch_parquet.lineitem has only 2 data files.

This fixes the test to use dedicated tables created in the test.

Change-Id: I28cec8ec4bc59f066aa15a7243b7163639706cc7
Reviewed-on: http://gerrit.cloudera.org:8080/22824
Reviewed-by: Jason Fehr <[email protected]>
Tested-by: Impala Public Jenkins <[email protected]>
---
 tests/custom_cluster/test_local_catalog.py | 14 +++++++++-----
 1 file changed, 9 insertions(+), 5 deletions(-)

diff --git a/tests/custom_cluster/test_local_catalog.py b/tests/custom_cluster/test_local_catalog.py
index 3f7da98d8..c4e92e9ba 100644
--- a/tests/custom_cluster/test_local_catalog.py
+++ b/tests/custom_cluster/test_local_catalog.py
@@ -713,11 +713,15 @@ class TestAllowIncompleteData(CustomClusterTestSuite):
       catalogd_args="--catalog_topic_mode=minimal --catalog_partial_fetch_max_files=1")
   def test_too_many_files(self, unique_database):
     """Test the error reporting the limit is too small"""
-    exception = self.execute_query_expect_failure(
-        self.client, "show files in tpch_parquet.lineitem")
-    err = ("Too many files to collect in table tpch_parquet.lineitem: 3. Current limit "
-           "is 1 configured by startup flag 'catalog_partial_fetch_max_files'. Consider "
-           "compacting files of the table.")
+    # Create a non-partitioned table with multiple files
+    tbl = unique_database + ".tbl"
+    self.execute_query("create table {0} (i int)".format(tbl))
+    self.execute_query("insert into {0} values (0)".format(tbl))
+    self.execute_query("insert into {0} values (1)".format(tbl))
+    exception = self.execute_query_expect_failure(self.client, "show files in " + tbl)
+    err = ("Too many files to collect in table {0}: 2. Current limit is 1 configured by "
+           "startup flag 'catalog_partial_fetch_max_files'. Consider compacting files of"
+           " the table.").format(tbl)
     assert err in str(exception)
     self.assert_catalogd_log_contains("ERROR", err)
