Dániel Gábor Vankó created IMPALA-14692:
-------------------------------------------

             Summary: test_spilling_hash_join is failing without greedy regex
                 Key: IMPALA-14692
                 URL: https://issues.apache.org/jira/browse/IMPALA-14692
             Project: IMPALA
          Issue Type: Bug
            Reporter: Dániel Gábor Vankó
            Assignee: Dániel Gábor Vankó


query_test/test_join_queries.py::TestSpillingHashJoin::test_spilling_hash_join 
has been failing since IMPALA-14680, seemingly for no reason. However, other 
row_regex lines have a space between the "row_regex:" prefix and the pattern, 
and that space is missing here.
 
This test runs only in exhaustive mode.
 
h4. Stacktrace:
{noformat}
query_test/test_join_queries.py:247: in test_spilling_hash_join
    self.run_test_case('QueryTest/query-impala-13138', vector, unique_database)
        i          = 0
        self       = <test_join_queries.TestSpillingHashJoin object at 
0x7f36a4cab9a0>
        unique_database = 'test_spilling_hash_join_28ff9a90'
        vector     = "table_format: parquet/none" | "protocol: hs2" | 
"exec_option: {'abort_on_error': 1, 'batch_size': 0, 'disable_codegen': False, 
'disable_codegen_rows_threshold': 0, 'exec_single_node_rows_threshold': 0, 
'num_nodes': 0, 'test_replan': 1}"
/data/jenkins/workspace/impala-cdw-master-exhaustive/repos/Impala/tests/common/impala_test_suite.py:987:
 in run_test_case
    self.__verify_results_and_errors(vector, test_section, result, use_db)
        _ImpalaTestSuite__exec_in_hive = <function 
ImpalaTestSuite.run_test_case.<locals>.__exec_in_hive at 0x7f36a511a0d0>
        _ImpalaTestSuite__exec_in_impala = <function 
ImpalaTestSuite.run_test_case.<locals>.__exec_in_impala at 0x7f36a511a3a0>
        current_error = None
        encoding   = None
        exec_fn    = <function 
ImpalaTestSuite.run_test_case.<locals>.__exec_in_impala at 0x7f36a511a3a0>
        exec_options = {'abort_on_error': 1, 'batch_size': 0, 
'disable_codegen': False, 'disable_codegen_rows_threshold': 0, ...}
        failed_count = 0
        impalad_client = <tests.common.impala_connection.ImpylaHS2Connection 
object at 0x7f36a4cab250>
        impalad_clients = [<tests.common.impala_connection.ImpylaHS2Connection 
object at 0x7f36a4cab250>]
        lineage_log_dir = ''
        multiple_impalad = False
        protocol   = 'hs2'
        query      = "set RUNTIME_FILTER_WAIT_TIME_MS=10000;\nset 
MT_DOP=12;\nset RUNTIME_FILTER_MIN_SIZE=8192;\nset 
RUNTIME_FILTER_MAX_SIZ...>='2024-06-01'\n      AND re.send_account_sk not in 
(43)\n    GROUP BY ecc.letter_mission_name, re.`date`, c.war_group"
        query_section = "set RUNTIME_FILTER_WAIT_TIME_MS=10000;\nset 
MT_DOP=12;\nset RUNTIME_FILTER_MIN_SIZE=8192;\nset 
RUNTIME_FILTER_MAX_SIZ...2024-06-01'\n      AND re.send_account_sk not in 
(43)\n    GROUP BY ecc.letter_mission_name, re.`date`, c.war_group;\n"
        result     = <tests.common.impala_connection.ImpylaHS2ResultSet object 
at 0x7f36a4db4fd0>
        result_list = []
        sections   = [defaultdict(<class 'str'>, {'QUERY': "set 
RUNTIME_FILTER_WAIT_TIME_MS=10000;\nset MT_DOP=12;\nset 
RUNTIME_FILTER_MIN_...roup;\n", 'VERIFIER': 'VERIFY_IS_SUBSET', 'RESULTS': 
"row_regex:,'2024-06-07',\n", 'TYPES': 'STRING,STRING,STRING\n'})]
        self       = <test_join_queries.TestSpillingHashJoin object at 
0x7f36a4cab9a0>
        table_format_info = <tests.common.test_dimensions.TableFormatInfo 
object at 0x7f36a922f460>
        target_feng_real_impalad_clients = []
        target_impalad_clients = 
[<tests.common.impala_connection.ImpylaHS2Connection object at 0x7f36a4cab250>]
        test_file_name = 'QueryTest/query-impala-13138'
        test_file_vars = None
        test_section = defaultdict(<class 'str'>, {'QUERY': "set 
RUNTIME_FILTER_WAIT_TIME_MS=10000;\nset MT_DOP=12;\nset 
RUNTIME_FILTER_MIN_S...group;\n", 'VERIFIER': 'VERIFY_IS_SUBSET', 'RESULTS': 
"row_regex:,'2024-06-07',\n", 'TYPES': 'STRING,STRING,STRING\n'})
        total_count = 1
        use_db     = 'test_spilling_hash_join_28ff9a90'
        vector     = "table_format: parquet/none" | "protocol: hs2" | 
"exec_option: {'abort_on_error': 1, 'batch_size': 0, 'disable_codegen': False, 
'disable_codegen_rows_threshold': 0, 'exec_single_node_rows_threshold': 0, 
'num_nodes': 0, 'test_replan': 1}"
/data/jenkins/workspace/impala-cdw-master-exhaustive/repos/Impala/tests/common/impala_test_suite.py:782:
 in __verify_results_and_errors
    verify_raw_results(test_section, result, vector,
        replace_filenames_with_placeholder = True
        result     = <tests.common.impala_connection.ImpylaHS2ResultSet object 
at 0x7f36a4db4fd0>
        result_section = 'RESULTS'
        section_name = 'ERRORS'
        self       = <test_join_queries.TestSpillingHashJoin object at 
0x7f36a4cab9a0>
        test_section = defaultdict(<class 'str'>, {'QUERY': "set 
RUNTIME_FILTER_WAIT_TIME_MS=10000;\nset MT_DOP=12;\nset 
RUNTIME_FILTER_MIN_S...group;\n", 'VERIFIER': 'VERIFY_IS_SUBSET', 'RESULTS': 
"row_regex:,'2024-06-07',\n", 'TYPES': 'STRING,STRING,STRING\n'})
        type_section = 'TYPES'
        use_db     = 'test_spilling_hash_join_28ff9a90'
        vector     = "table_format: parquet/none" | "protocol: hs2" | 
"exec_option: {'abort_on_error': 1, 'batch_size': 0, 'disable_codegen': False, 
'disable_codegen_rows_threshold': 0, 'exec_single_node_rows_threshold': 0, 
'num_nodes': 0, 'test_replan': 1}"
/data/jenkins/workspace/impala-cdw-master-exhaustive/repos/Impala/tests/common/test_result_verifier.py:540:
 in verify_raw_results
    VERIFIER_MAP[verifier](expected, actual)
        actual     = <tests.common.test_result_verifier.QueryTestResult object 
at 0x7f36a4db4be0>
        actual_labels = ['LETTER_MISSION_NAME', 'DATE_', 'WAR_GROUP']
        actual_types = ['STRING', 'STRING', 'STRING']
        exec_result = <tests.common.impala_connection.ImpylaHS2ResultSet object 
at 0x7f36a4db4fd0>
        expected   = <tests.common.test_result_verifier.QueryTestResult object 
at 0x7f36a4db4b20>
        expected_results = "row_regex:,'2024-06-07',\n"
        expected_results_list = ["row_regex:,'2024-06-07',"]
        expected_types = ['STRING', 'STRING', 'STRING']
        file_format = 'parquet'
        is_raw_string = False
        order_matters = True
        protocol   = 'hs2'
        replace_filenames = True
        result_section = 'RESULTS'
        section    = 'STRING,STRING,STRING\n'
        test_section = defaultdict(<class 'str'>, {'QUERY': "set 
RUNTIME_FILTER_WAIT_TIME_MS=10000;\nset MT_DOP=12;\nset 
RUNTIME_FILTER_MIN_S...group;\n", 'VERIFIER': 'VERIFY_IS_SUBSET', 'RESULTS': 
"row_regex:,'2024-06-07',\n", 'TYPES': 'STRING,STRING,STRING\n'})
        type_section = 'TYPES'
        update_section = False
        vector     = "table_format: parquet/none" | "protocol: hs2" | 
"exec_option: {'abort_on_error': 1, 'batch_size': 0, 'disable_codegen': False, 
'disable_codegen_rows_threshold': 0, 'exec_single_node_rows_threshold': 0, 
'num_nodes': 0, 'test_replan': 1}"
        verifier   = 'VERIFY_IS_SUBSET'
/data/jenkins/workspace/impala-cdw-master-exhaustive/repos/Impala/tests/common/test_result_verifier.py:298:
 in verify_query_result_is_subset
    assert matched, u"Could not find expected row {0} in actual 
rows:\n{1}".format(
E   AssertionError: Could not find expected row row_regex:,'2024-06-07', in 
actual rows:
E   'NULL','2024-06-07','47'
E   'NULL','2024-06-07','42'
E   'NULL','2024-06-07','11'
E   'name','2024-06-07','20'
E   'NULL','2024-06-07','7'
E   'name','2024-06-07','5'
E   'NULL','2024-06-07','20'
E   'NULL','2024-06-07','NULL'
E   'name','2024-06-07','31'
E   'NULL','2024-06-07','25'
E   'name','2024-06-07','48'
E   'name','2024-06-07','34'
E   'NULL','2024-06-07','2'
E   'NULL','2024-06-07','8'
E   'name','2024-06-07','25'
E   'NULL','2024-06-07','48'
E   'name','2024-06-07','16'
E   'name','2024-06-07','45'
E   'NULL','2024-06-07','14'
E   'NULL','2024-06-07','34'
E   'name','2024-06-07','2'
E   'name','2024-06-07','7'
E   'NULL','2024-06-07','war_group'
E   'name','2024-06-07','42'
E   'name','2024-06-07','11'
E   'name','2024-06-07','14'
E   'name','2024-06-07','0'
E   'name','2024-06-07','47'
E   'NULL','2024-06-07','39'
E   'NULL','2024-06-07','19'
E   'name','2024-06-07','39'
E   'NULL','2024-06-07','31'
E   'NULL','2024-06-07','33'
E   'NULL','2024-06-07','22'
E   'NULL','2024-06-07','10'
E   'NULL','2024-06-07','13'
E   'name','2024-06-07','36'
E   'NULL','2024-06-07','45'
E   'NULL','2024-06-07','27'
E   'name','2024-06-07','13'
E   'name','2024-06-07','28'
E   'name','2024-06-07','40'
E   'NULL','2024-06-07','40'
E   'name','2024-06-07','19'
E   'NULL','2024-06-07','3'
E   'NULL','2024-06-07','6'
E   'NULL','2024-06-07','43'
E   'NULL','2024-06-07','36'
E   'name','2024-06-07','35'
E   'NULL','2024-06-07','0'
E   'NULL','2024-06-07','16'
E   'name','2024-06-07','8'
E   'name','2024-06-07','33'
E   'NULL','2024-06-07','32'
E   'name','2024-06-07','24'
E   'NULL','2024-06-07','46'
E   'NULL','2024-06-07','15'
E   'name','2024-06-07','43'
E   'name','2024-06-07','27'
E   'NULL','2024-06-07','21'
E   'NULL','2024-06-07','35'
E   'NULL','2024-06-07','49'
E   'name','2024-06-07','10'
E   'name','2024-06-07','21'
E   'name','2024-06-07','9'
E   'name','2024-06-07','26'
E   'NULL','2024-06-07','44'
E   'NULL','2024-06-07','26'
E   'name','2024-06-07','3'
E   'NULL','2024-06-07','30'
E   'NULL','2024-06-07','37'
E   'name','2024-06-07','6'
E   'NULL','2024-06-07','5'
E   'NULL','2024-06-07','28'
E   'name','2024-06-07','22'
E   'name','2024-06-07','30'
E   'name','2024-06-07','41'
E   'name','2024-06-07','29'
E   'name','2024-06-07','38'
E   'name','2024-06-07','17'
E   'NULL','2024-06-07','1'
E   'name','2024-06-07','49'
E   'NULL','2024-06-07','24'
E   'name','2024-06-07','15'
E   'name','2024-06-07','1'
E   'name','2024-06-07','war_group'
E   'name','2024-06-07','32'
E   'name','2024-06-07','12'
E   'name','2024-06-07','37'
E   'NULL','2024-06-07','12'
E   'name','2024-06-07','4'
E   'name','2024-06-07','23'
E   'NULL','2024-06-07','29'
E   'NULL','2024-06-07','18'
E   'NULL','2024-06-07','17'
E   'name','2024-06-07','46'
E   'NULL','2024-06-07','9'
E   'NULL','2024-06-07','50'
E   'NULL','2024-06-07','38'
E   'name','2024-06-07','50'
E   'name','2024-06-07','44'
E   'NULL','2024-06-07','41'
E   'name','2024-06-07','18'
E   'NULL','2024-06-07','4'
E   'NULL','2024-06-07','23'
        actual_literal_strings = {"'NULL','2024-06-07','0'", 
"'NULL','2024-06-07','1'", "'NULL','2024-06-07','10'", 
"'NULL','2024-06-07','11'", "'NULL','2024-06-07','12'", 
"'NULL','2024-06-07','13'", ...}
        actual_results = <tests.common.test_result_verifier.QueryTestResult 
object at 0x7f36a4db4be0>
        actual_row = <tests.common.test_result_verifier.ResultRow object at 
0x7f36a4cb4070>
        expected_literal_strings = set()
        expected_literals = []
        expected_non_literals = [<tests.common.test_result_verifier.ResultRow 
object at 0x7f36a4db4b80>]
        expected_results = <tests.common.test_result_verifier.QueryTestResult 
object at 0x7f36a4db4b20>
        expected_row = <tests.common.test_result_verifier.ResultRow object at 
0x7f36a4db4b80>
        matched    = False{noformat}



--
This message was sent by Atlassian Jira
(v8.20.10#820010)

Reply via email to