[ 
https://issues.apache.org/jira/browse/IMPALA-14692?page=com.atlassian.jira.plugin.system.issuetabpanels:all-tabpanel
 ]

Dániel Gábor Vankó updated IMPALA-14692:
----------------------------------------
    Labels: broken-build  (was: )

> test_spilling_hash_join is failing without greedy regex
> -------------------------------------------------------
>
>                 Key: IMPALA-14692
>                 URL: https://issues.apache.org/jira/browse/IMPALA-14692
>             Project: IMPALA
>          Issue Type: Bug
>            Reporter: Dániel Gábor Vankó
>            Assignee: Dániel Gábor Vankó
>            Priority: Major
>              Labels: broken-build
>
> query_test/test_join_queries.py::TestSpillingHashJoin::test_spilling_hash_join
>  has been failing since IMPALA-14680, seemingly for no reason. However, in 
> other row_regex lines there is a space between "row_regex:" and the pattern, 
> and that space is missing here.
>  
> This test runs only in exhaustive mode.
>  
> h4. Stacktrace:
> {noformat}
> query_test/test_join_queries.py:247: in test_spilling_hash_join
>     self.run_test_case('QueryTest/query-impala-13138', vector, 
> unique_database)
>         i          = 0
>         self       = <test_join_queries.TestSpillingHashJoin object at 
> 0x7f36a4cab9a0>
>         unique_database = 'test_spilling_hash_join_28ff9a90'
>         vector     = "table_format: parquet/none" | "protocol: hs2" | 
> "exec_option: {'abort_on_error': 1, 'batch_size': 0, 'disable_codegen': 
> False, 'disable_codegen_rows_threshold': 0, 
> 'exec_single_node_rows_threshold': 0, 'num_nodes': 0, 'test_replan': 1}"
> /data/jenkins/workspace/impala-cdw-master-exhaustive/repos/Impala/tests/common/impala_test_suite.py:987:
>  in run_test_case
>     self.__verify_results_and_errors(vector, test_section, result, use_db)
>         _ImpalaTestSuite__exec_in_hive = <function 
> ImpalaTestSuite.run_test_case.<locals>.__exec_in_hive at 0x7f36a511a0d0>
>         _ImpalaTestSuite__exec_in_impala = <function 
> ImpalaTestSuite.run_test_case.<locals>.__exec_in_impala at 0x7f36a511a3a0>
>         current_error = None
>         encoding   = None
>         exec_fn    = <function 
> ImpalaTestSuite.run_test_case.<locals>.__exec_in_impala at 0x7f36a511a3a0>
>         exec_options = {'abort_on_error': 1, 'batch_size': 0, 
> 'disable_codegen': False, 'disable_codegen_rows_threshold': 0, ...}
>         failed_count = 0
>         impalad_client = <tests.common.impala_connection.ImpylaHS2Connection 
> object at 0x7f36a4cab250>
>         impalad_clients = 
> [<tests.common.impala_connection.ImpylaHS2Connection object at 
> 0x7f36a4cab250>]
>         lineage_log_dir = ''
>         multiple_impalad = False
>         protocol   = 'hs2'
>         query      = "set RUNTIME_FILTER_WAIT_TIME_MS=10000;\nset 
> MT_DOP=12;\nset RUNTIME_FILTER_MIN_SIZE=8192;\nset 
> RUNTIME_FILTER_MAX_SIZ...>='2024-06-01'\n      AND re.send_account_sk not in 
> (43)\n    GROUP BY ecc.letter_mission_name, re.`date`, c.war_group"
>         query_section = "set RUNTIME_FILTER_WAIT_TIME_MS=10000;\nset 
> MT_DOP=12;\nset RUNTIME_FILTER_MIN_SIZE=8192;\nset 
> RUNTIME_FILTER_MAX_SIZ...2024-06-01'\n      AND re.send_account_sk not in 
> (43)\n    GROUP BY ecc.letter_mission_name, re.`date`, c.war_group;\n"
>         result     = <tests.common.impala_connection.ImpylaHS2ResultSet 
> object at 0x7f36a4db4fd0>
>         result_list = []
>         sections   = [defaultdict(<class 'str'>, {'QUERY': "set 
> RUNTIME_FILTER_WAIT_TIME_MS=10000;\nset MT_DOP=12;\nset 
> RUNTIME_FILTER_MIN_...roup;\n", 'VERIFIER': 'VERIFY_IS_SUBSET', 'RESULTS': 
> "row_regex:,'2024-06-07',\n", 'TYPES': 'STRING,STRING,STRING\n'})]
>         self       = <test_join_queries.TestSpillingHashJoin object at 
> 0x7f36a4cab9a0>
>         table_format_info = <tests.common.test_dimensions.TableFormatInfo 
> object at 0x7f36a922f460>
>         target_feng_real_impalad_clients = []
>         target_impalad_clients = 
> [<tests.common.impala_connection.ImpylaHS2Connection object at 
> 0x7f36a4cab250>]
>         test_file_name = 'QueryTest/query-impala-13138'
>         test_file_vars = None
>         test_section = defaultdict(<class 'str'>, {'QUERY': "set 
> RUNTIME_FILTER_WAIT_TIME_MS=10000;\nset MT_DOP=12;\nset 
> RUNTIME_FILTER_MIN_S...group;\n", 'VERIFIER': 'VERIFY_IS_SUBSET', 'RESULTS': 
> "row_regex:,'2024-06-07',\n", 'TYPES': 'STRING,STRING,STRING\n'})
>         total_count = 1
>         use_db     = 'test_spilling_hash_join_28ff9a90'
>         vector     = "table_format: parquet/none" | "protocol: hs2" | 
> "exec_option: {'abort_on_error': 1, 'batch_size': 0, 'disable_codegen': 
> False, 'disable_codegen_rows_threshold': 0, 
> 'exec_single_node_rows_threshold': 0, 'num_nodes': 0, 'test_replan': 1}"
> /data/jenkins/workspace/impala-cdw-master-exhaustive/repos/Impala/tests/common/impala_test_suite.py:782:
>  in __verify_results_and_errors
>     verify_raw_results(test_section, result, vector,
>         replace_filenames_with_placeholder = True
>         result     = <tests.common.impala_connection.ImpylaHS2ResultSet 
> object at 0x7f36a4db4fd0>
>         result_section = 'RESULTS'
>         section_name = 'ERRORS'
>         self       = <test_join_queries.TestSpillingHashJoin object at 
> 0x7f36a4cab9a0>
>         test_section = defaultdict(<class 'str'>, {'QUERY': "set 
> RUNTIME_FILTER_WAIT_TIME_MS=10000;\nset MT_DOP=12;\nset 
> RUNTIME_FILTER_MIN_S...group;\n", 'VERIFIER': 'VERIFY_IS_SUBSET', 'RESULTS': 
> "row_regex:,'2024-06-07',\n", 'TYPES': 'STRING,STRING,STRING\n'})
>         type_section = 'TYPES'
>         use_db     = 'test_spilling_hash_join_28ff9a90'
>         vector     = "table_format: parquet/none" | "protocol: hs2" | 
> "exec_option: {'abort_on_error': 1, 'batch_size': 0, 'disable_codegen': 
> False, 'disable_codegen_rows_threshold': 0, 
> 'exec_single_node_rows_threshold': 0, 'num_nodes': 0, 'test_replan': 1}"
> /data/jenkins/workspace/impala-cdw-master-exhaustive/repos/Impala/tests/common/test_result_verifier.py:540:
>  in verify_raw_results
>     VERIFIER_MAP[verifier](expected, actual)
>         actual     = <tests.common.test_result_verifier.QueryTestResult 
> object at 0x7f36a4db4be0>
>         actual_labels = ['LETTER_MISSION_NAME', 'DATE_', 'WAR_GROUP']
>         actual_types = ['STRING', 'STRING', 'STRING']
>         exec_result = <tests.common.impala_connection.ImpylaHS2ResultSet 
> object at 0x7f36a4db4fd0>
>         expected   = <tests.common.test_result_verifier.QueryTestResult 
> object at 0x7f36a4db4b20>
>         expected_results = "row_regex:,'2024-06-07',\n"
>         expected_results_list = ["row_regex:,'2024-06-07',"]
>         expected_types = ['STRING', 'STRING', 'STRING']
>         file_format = 'parquet'
>         is_raw_string = False
>         order_matters = True
>         protocol   = 'hs2'
>         replace_filenames = True
>         result_section = 'RESULTS'
>         section    = 'STRING,STRING,STRING\n'
>         test_section = defaultdict(<class 'str'>, {'QUERY': "set 
> RUNTIME_FILTER_WAIT_TIME_MS=10000;\nset MT_DOP=12;\nset 
> RUNTIME_FILTER_MIN_S...group;\n", 'VERIFIER': 'VERIFY_IS_SUBSET', 'RESULTS': 
> "row_regex:,'2024-06-07',\n", 'TYPES': 'STRING,STRING,STRING\n'})
>         type_section = 'TYPES'
>         update_section = False
>         vector     = "table_format: parquet/none" | "protocol: hs2" | 
> "exec_option: {'abort_on_error': 1, 'batch_size': 0, 'disable_codegen': 
> False, 'disable_codegen_rows_threshold': 0, 
> 'exec_single_node_rows_threshold': 0, 'num_nodes': 0, 'test_replan': 1}"
>         verifier   = 'VERIFY_IS_SUBSET'
> /data/jenkins/workspace/impala-cdw-master-exhaustive/repos/Impala/tests/common/test_result_verifier.py:298:
>  in verify_query_result_is_subset
>     assert matched, u"Could not find expected row {0} in actual 
> rows:\n{1}".format(
> E   AssertionError: Could not find expected row row_regex:,'2024-06-07', in 
> actual rows:
> E   'NULL','2024-06-07','47'
> E   'NULL','2024-06-07','42'
> E   'NULL','2024-06-07','11'
> E   'name','2024-06-07','20'
> E   'NULL','2024-06-07','7'
> E   'name','2024-06-07','5'
> E   'NULL','2024-06-07','20'
> E   'NULL','2024-06-07','NULL'
> E   'name','2024-06-07','31'
> E   'NULL','2024-06-07','25'
> E   'name','2024-06-07','48'
> E   'name','2024-06-07','34'
> E   'NULL','2024-06-07','2'
> E   'NULL','2024-06-07','8'
> E   'name','2024-06-07','25'
> E   'NULL','2024-06-07','48'
> E   'name','2024-06-07','16'
> E   'name','2024-06-07','45'
> E   'NULL','2024-06-07','14'
> E   'NULL','2024-06-07','34'
> E   'name','2024-06-07','2'
> E   'name','2024-06-07','7'
> E   'NULL','2024-06-07','war_group'
> E   'name','2024-06-07','42'
> E   'name','2024-06-07','11'
> E   'name','2024-06-07','14'
> E   'name','2024-06-07','0'
> E   'name','2024-06-07','47'
> E   'NULL','2024-06-07','39'
> E   'NULL','2024-06-07','19'
> E   'name','2024-06-07','39'
> E   'NULL','2024-06-07','31'
> E   'NULL','2024-06-07','33'
> E   'NULL','2024-06-07','22'
> E   'NULL','2024-06-07','10'
> E   'NULL','2024-06-07','13'
> E   'name','2024-06-07','36'
> E   'NULL','2024-06-07','45'
> E   'NULL','2024-06-07','27'
> E   'name','2024-06-07','13'
> E   'name','2024-06-07','28'
> E   'name','2024-06-07','40'
> E   'NULL','2024-06-07','40'
> E   'name','2024-06-07','19'
> E   'NULL','2024-06-07','3'
> E   'NULL','2024-06-07','6'
> E   'NULL','2024-06-07','43'
> E   'NULL','2024-06-07','36'
> E   'name','2024-06-07','35'
> E   'NULL','2024-06-07','0'
> E   'NULL','2024-06-07','16'
> E   'name','2024-06-07','8'
> E   'name','2024-06-07','33'
> E   'NULL','2024-06-07','32'
> E   'name','2024-06-07','24'
> E   'NULL','2024-06-07','46'
> E   'NULL','2024-06-07','15'
> E   'name','2024-06-07','43'
> E   'name','2024-06-07','27'
> E   'NULL','2024-06-07','21'
> E   'NULL','2024-06-07','35'
> E   'NULL','2024-06-07','49'
> E   'name','2024-06-07','10'
> E   'name','2024-06-07','21'
> E   'name','2024-06-07','9'
> E   'name','2024-06-07','26'
> E   'NULL','2024-06-07','44'
> E   'NULL','2024-06-07','26'
> E   'name','2024-06-07','3'
> E   'NULL','2024-06-07','30'
> E   'NULL','2024-06-07','37'
> E   'name','2024-06-07','6'
> E   'NULL','2024-06-07','5'
> E   'NULL','2024-06-07','28'
> E   'name','2024-06-07','22'
> E   'name','2024-06-07','30'
> E   'name','2024-06-07','41'
> E   'name','2024-06-07','29'
> E   'name','2024-06-07','38'
> E   'name','2024-06-07','17'
> E   'NULL','2024-06-07','1'
> E   'name','2024-06-07','49'
> E   'NULL','2024-06-07','24'
> E   'name','2024-06-07','15'
> E   'name','2024-06-07','1'
> E   'name','2024-06-07','war_group'
> E   'name','2024-06-07','32'
> E   'name','2024-06-07','12'
> E   'name','2024-06-07','37'
> E   'NULL','2024-06-07','12'
> E   'name','2024-06-07','4'
> E   'name','2024-06-07','23'
> E   'NULL','2024-06-07','29'
> E   'NULL','2024-06-07','18'
> E   'NULL','2024-06-07','17'
> E   'name','2024-06-07','46'
> E   'NULL','2024-06-07','9'
> E   'NULL','2024-06-07','50'
> E   'NULL','2024-06-07','38'
> E   'name','2024-06-07','50'
> E   'name','2024-06-07','44'
> E   'NULL','2024-06-07','41'
> E   'name','2024-06-07','18'
> E   'NULL','2024-06-07','4'
> E   'NULL','2024-06-07','23'
>         actual_literal_strings = {"'NULL','2024-06-07','0'", 
> "'NULL','2024-06-07','1'", "'NULL','2024-06-07','10'", 
> "'NULL','2024-06-07','11'", "'NULL','2024-06-07','12'", 
> "'NULL','2024-06-07','13'", ...}
>         actual_results = <tests.common.test_result_verifier.QueryTestResult 
> object at 0x7f36a4db4be0>
>         actual_row = <tests.common.test_result_verifier.ResultRow object at 
> 0x7f36a4cb4070>
>         expected_literal_strings = set()
>         expected_literals = []
>         expected_non_literals = [<tests.common.test_result_verifier.ResultRow 
> object at 0x7f36a4db4b80>]
>         expected_results = <tests.common.test_result_verifier.QueryTestResult 
> object at 0x7f36a4db4b20>
>         expected_row = <tests.common.test_result_verifier.ResultRow object at 
> 0x7f36a4db4b80>
>         matched    = False{noformat}



--
This message was sent by Atlassian Jira
(v8.20.10#820010)

---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]

Reply via email to