[
https://issues.apache.org/jira/browse/IMPALA-14692?page=com.atlassian.jira.plugin.system.issuetabpanels:all-tabpanel
]
Dániel Gábor Vankó updated IMPALA-14692:
----------------------------------------
Labels: broken-build (was: )
> test_spilling_hash_join is failing without greedy regex
> -------------------------------------------------------
>
> Key: IMPALA-14692
> URL: https://issues.apache.org/jira/browse/IMPALA-14692
> Project: IMPALA
> Issue Type: Bug
> Reporter: Dániel Gábor Vankó
> Assignee: Dániel Gábor Vankó
> Priority: Major
> Labels: broken-build
>
> query_test/test_join_queries.py::TestSpillingHashJoin::test_spilling_hash_join
> has been failing since IMPALA-14680, seemingly for no reason. However, other
> row_regex lines have a space between "row_regex:" and the pattern,
> which is missing here.
>
> This test runs only in exhaustive mode.
>
> h4. Stacktrace:
> {noformat}
> query_test/test_join_queries.py:247: in test_spilling_hash_join
> self.run_test_case('QueryTest/query-impala-13138', vector,
> unique_database)
> i = 0
> self = <test_join_queries.TestSpillingHashJoin object at
> 0x7f36a4cab9a0>
> unique_database = 'test_spilling_hash_join_28ff9a90'
> vector = "table_format: parquet/none" | "protocol: hs2" |
> "exec_option: {'abort_on_error': 1, 'batch_size': 0, 'disable_codegen':
> False, 'disable_codegen_rows_threshold': 0,
> 'exec_single_node_rows_threshold': 0, 'num_nodes': 0, 'test_replan': 1}"
> /data/jenkins/workspace/impala-cdw-master-exhaustive/repos/Impala/tests/common/impala_test_suite.py:987:
> in run_test_case
> self.__verify_results_and_errors(vector, test_section, result, use_db)
> _ImpalaTestSuite__exec_in_hive = <function
> ImpalaTestSuite.run_test_case.<locals>.__exec_in_hive at 0x7f36a511a0d0>
> _ImpalaTestSuite__exec_in_impala = <function
> ImpalaTestSuite.run_test_case.<locals>.__exec_in_impala at 0x7f36a511a3a0>
> current_error = None
> encoding = None
> exec_fn = <function
> ImpalaTestSuite.run_test_case.<locals>.__exec_in_impala at 0x7f36a511a3a0>
> exec_options = {'abort_on_error': 1, 'batch_size': 0,
> 'disable_codegen': False, 'disable_codegen_rows_threshold': 0, ...}
> failed_count = 0
> impalad_client = <tests.common.impala_connection.ImpylaHS2Connection
> object at 0x7f36a4cab250>
> impalad_clients =
> [<tests.common.impala_connection.ImpylaHS2Connection object at
> 0x7f36a4cab250>]
> lineage_log_dir = ''
> multiple_impalad = False
> protocol = 'hs2'
> query = "set RUNTIME_FILTER_WAIT_TIME_MS=10000;\nset
> MT_DOP=12;\nset RUNTIME_FILTER_MIN_SIZE=8192;\nset
> RUNTIME_FILTER_MAX_SIZ...>='2024-06-01'\n AND re.send_account_sk not in
> (43)\n GROUP BY ecc.letter_mission_name, re.`date`, c.war_group"
> query_section = "set RUNTIME_FILTER_WAIT_TIME_MS=10000;\nset
> MT_DOP=12;\nset RUNTIME_FILTER_MIN_SIZE=8192;\nset
> RUNTIME_FILTER_MAX_SIZ...2024-06-01'\n AND re.send_account_sk not in
> (43)\n GROUP BY ecc.letter_mission_name, re.`date`, c.war_group;\n"
> result = <tests.common.impala_connection.ImpylaHS2ResultSet
> object at 0x7f36a4db4fd0>
> result_list = []
> sections = [defaultdict(<class 'str'>, {'QUERY': "set
> RUNTIME_FILTER_WAIT_TIME_MS=10000;\nset MT_DOP=12;\nset
> RUNTIME_FILTER_MIN_...roup;\n", 'VERIFIER': 'VERIFY_IS_SUBSET', 'RESULTS':
> "row_regex:,'2024-06-07',\n", 'TYPES': 'STRING,STRING,STRING\n'})]
> self = <test_join_queries.TestSpillingHashJoin object at
> 0x7f36a4cab9a0>
> table_format_info = <tests.common.test_dimensions.TableFormatInfo
> object at 0x7f36a922f460>
> target_feng_real_impalad_clients = []
> target_impalad_clients =
> [<tests.common.impala_connection.ImpylaHS2Connection object at
> 0x7f36a4cab250>]
> test_file_name = 'QueryTest/query-impala-13138'
> test_file_vars = None
> test_section = defaultdict(<class 'str'>, {'QUERY': "set
> RUNTIME_FILTER_WAIT_TIME_MS=10000;\nset MT_DOP=12;\nset
> RUNTIME_FILTER_MIN_S...group;\n", 'VERIFIER': 'VERIFY_IS_SUBSET', 'RESULTS':
> "row_regex:,'2024-06-07',\n", 'TYPES': 'STRING,STRING,STRING\n'})
> total_count = 1
> use_db = 'test_spilling_hash_join_28ff9a90'
> vector = "table_format: parquet/none" | "protocol: hs2" |
> "exec_option: {'abort_on_error': 1, 'batch_size': 0, 'disable_codegen':
> False, 'disable_codegen_rows_threshold': 0,
> 'exec_single_node_rows_threshold': 0, 'num_nodes': 0, 'test_replan': 1}"
> /data/jenkins/workspace/impala-cdw-master-exhaustive/repos/Impala/tests/common/impala_test_suite.py:782:
> in __verify_results_and_errors
> verify_raw_results(test_section, result, vector,
> replace_filenames_with_placeholder = True
> result = <tests.common.impala_connection.ImpylaHS2ResultSet
> object at 0x7f36a4db4fd0>
> result_section = 'RESULTS'
> section_name = 'ERRORS'
> self = <test_join_queries.TestSpillingHashJoin object at
> 0x7f36a4cab9a0>
> test_section = defaultdict(<class 'str'>, {'QUERY': "set
> RUNTIME_FILTER_WAIT_TIME_MS=10000;\nset MT_DOP=12;\nset
> RUNTIME_FILTER_MIN_S...group;\n", 'VERIFIER': 'VERIFY_IS_SUBSET', 'RESULTS':
> "row_regex:,'2024-06-07',\n", 'TYPES': 'STRING,STRING,STRING\n'})
> type_section = 'TYPES'
> use_db = 'test_spilling_hash_join_28ff9a90'
> vector = "table_format: parquet/none" | "protocol: hs2" |
> "exec_option: {'abort_on_error': 1, 'batch_size': 0, 'disable_codegen':
> False, 'disable_codegen_rows_threshold': 0,
> 'exec_single_node_rows_threshold': 0, 'num_nodes': 0, 'test_replan': 1}"
> /data/jenkins/workspace/impala-cdw-master-exhaustive/repos/Impala/tests/common/test_result_verifier.py:540:
> in verify_raw_results
> VERIFIER_MAP[verifier](expected, actual)
> actual = <tests.common.test_result_verifier.QueryTestResult
> object at 0x7f36a4db4be0>
> actual_labels = ['LETTER_MISSION_NAME', 'DATE_', 'WAR_GROUP']
> actual_types = ['STRING', 'STRING', 'STRING']
> exec_result = <tests.common.impala_connection.ImpylaHS2ResultSet
> object at 0x7f36a4db4fd0>
> expected = <tests.common.test_result_verifier.QueryTestResult
> object at 0x7f36a4db4b20>
> expected_results = "row_regex:,'2024-06-07',\n"
> expected_results_list = ["row_regex:,'2024-06-07',"]
> expected_types = ['STRING', 'STRING', 'STRING']
> file_format = 'parquet'
> is_raw_string = False
> order_matters = True
> protocol = 'hs2'
> replace_filenames = True
> result_section = 'RESULTS'
> section = 'STRING,STRING,STRING\n'
> test_section = defaultdict(<class 'str'>, {'QUERY': "set
> RUNTIME_FILTER_WAIT_TIME_MS=10000;\nset MT_DOP=12;\nset
> RUNTIME_FILTER_MIN_S...group;\n", 'VERIFIER': 'VERIFY_IS_SUBSET', 'RESULTS':
> "row_regex:,'2024-06-07',\n", 'TYPES': 'STRING,STRING,STRING\n'})
> type_section = 'TYPES'
> update_section = False
> vector = "table_format: parquet/none" | "protocol: hs2" |
> "exec_option: {'abort_on_error': 1, 'batch_size': 0, 'disable_codegen':
> False, 'disable_codegen_rows_threshold': 0,
> 'exec_single_node_rows_threshold': 0, 'num_nodes': 0, 'test_replan': 1}"
> verifier = 'VERIFY_IS_SUBSET'
> /data/jenkins/workspace/impala-cdw-master-exhaustive/repos/Impala/tests/common/test_result_verifier.py:298:
> in verify_query_result_is_subset
> assert matched, u"Could not find expected row {0} in actual
> rows:\n{1}".format(
> E AssertionError: Could not find expected row row_regex:,'2024-06-07', in
> actual rows:
> E 'NULL','2024-06-07','47'
> E 'NULL','2024-06-07','42'
> E 'NULL','2024-06-07','11'
> E 'name','2024-06-07','20'
> E 'NULL','2024-06-07','7'
> E 'name','2024-06-07','5'
> E 'NULL','2024-06-07','20'
> E 'NULL','2024-06-07','NULL'
> E 'name','2024-06-07','31'
> E 'NULL','2024-06-07','25'
> E 'name','2024-06-07','48'
> E 'name','2024-06-07','34'
> E 'NULL','2024-06-07','2'
> E 'NULL','2024-06-07','8'
> E 'name','2024-06-07','25'
> E 'NULL','2024-06-07','48'
> E 'name','2024-06-07','16'
> E 'name','2024-06-07','45'
> E 'NULL','2024-06-07','14'
> E 'NULL','2024-06-07','34'
> E 'name','2024-06-07','2'
> E 'name','2024-06-07','7'
> E 'NULL','2024-06-07','war_group'
> E 'name','2024-06-07','42'
> E 'name','2024-06-07','11'
> E 'name','2024-06-07','14'
> E 'name','2024-06-07','0'
> E 'name','2024-06-07','47'
> E 'NULL','2024-06-07','39'
> E 'NULL','2024-06-07','19'
> E 'name','2024-06-07','39'
> E 'NULL','2024-06-07','31'
> E 'NULL','2024-06-07','33'
> E 'NULL','2024-06-07','22'
> E 'NULL','2024-06-07','10'
> E 'NULL','2024-06-07','13'
> E 'name','2024-06-07','36'
> E 'NULL','2024-06-07','45'
> E 'NULL','2024-06-07','27'
> E 'name','2024-06-07','13'
> E 'name','2024-06-07','28'
> E 'name','2024-06-07','40'
> E 'NULL','2024-06-07','40'
> E 'name','2024-06-07','19'
> E 'NULL','2024-06-07','3'
> E 'NULL','2024-06-07','6'
> E 'NULL','2024-06-07','43'
> E 'NULL','2024-06-07','36'
> E 'name','2024-06-07','35'
> E 'NULL','2024-06-07','0'
> E 'NULL','2024-06-07','16'
> E 'name','2024-06-07','8'
> E 'name','2024-06-07','33'
> E 'NULL','2024-06-07','32'
> E 'name','2024-06-07','24'
> E 'NULL','2024-06-07','46'
> E 'NULL','2024-06-07','15'
> E 'name','2024-06-07','43'
> E 'name','2024-06-07','27'
> E 'NULL','2024-06-07','21'
> E 'NULL','2024-06-07','35'
> E 'NULL','2024-06-07','49'
> E 'name','2024-06-07','10'
> E 'name','2024-06-07','21'
> E 'name','2024-06-07','9'
> E 'name','2024-06-07','26'
> E 'NULL','2024-06-07','44'
> E 'NULL','2024-06-07','26'
> E 'name','2024-06-07','3'
> E 'NULL','2024-06-07','30'
> E 'NULL','2024-06-07','37'
> E 'name','2024-06-07','6'
> E 'NULL','2024-06-07','5'
> E 'NULL','2024-06-07','28'
> E 'name','2024-06-07','22'
> E 'name','2024-06-07','30'
> E 'name','2024-06-07','41'
> E 'name','2024-06-07','29'
> E 'name','2024-06-07','38'
> E 'name','2024-06-07','17'
> E 'NULL','2024-06-07','1'
> E 'name','2024-06-07','49'
> E 'NULL','2024-06-07','24'
> E 'name','2024-06-07','15'
> E 'name','2024-06-07','1'
> E 'name','2024-06-07','war_group'
> E 'name','2024-06-07','32'
> E 'name','2024-06-07','12'
> E 'name','2024-06-07','37'
> E 'NULL','2024-06-07','12'
> E 'name','2024-06-07','4'
> E 'name','2024-06-07','23'
> E 'NULL','2024-06-07','29'
> E 'NULL','2024-06-07','18'
> E 'NULL','2024-06-07','17'
> E 'name','2024-06-07','46'
> E 'NULL','2024-06-07','9'
> E 'NULL','2024-06-07','50'
> E 'NULL','2024-06-07','38'
> E 'name','2024-06-07','50'
> E 'name','2024-06-07','44'
> E 'NULL','2024-06-07','41'
> E 'name','2024-06-07','18'
> E 'NULL','2024-06-07','4'
> E 'NULL','2024-06-07','23'
> actual_literal_strings = {"'NULL','2024-06-07','0'",
> "'NULL','2024-06-07','1'", "'NULL','2024-06-07','10'",
> "'NULL','2024-06-07','11'", "'NULL','2024-06-07','12'",
> "'NULL','2024-06-07','13'", ...}
> actual_results = <tests.common.test_result_verifier.QueryTestResult
> object at 0x7f36a4db4be0>
> actual_row = <tests.common.test_result_verifier.ResultRow object at
> 0x7f36a4cb4070>
> expected_literal_strings = set()
> expected_literals = []
> expected_non_literals = [<tests.common.test_result_verifier.ResultRow
> object at 0x7f36a4db4b80>]
> expected_results = <tests.common.test_result_verifier.QueryTestResult
> object at 0x7f36a4db4b20>
> expected_row = <tests.common.test_result_verifier.ResultRow object at
> 0x7f36a4db4b80>
> matched = False{noformat}
--
This message was sent by Atlassian Jira
(v8.20.10#820010)
---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]