Tim Armstrong created IMPALA-7119:
-------------------------------------

             Summary: HBase tests failing with RetriesExhausted and "RuntimeException: couldn't retrieve HBase table"
                 Key: IMPALA-7119
                 URL: https://issues.apache.org/jira/browse/IMPALA-7119
             Project: IMPALA
          Issue Type: Bug
    Affects Versions: Impala 2.13.0
            Reporter: Tim Armstrong
            Assignee: Joe McDonnell


64820211a2d30238093f1c4cd03bc268e3a01638

{noformat}
    
metadata.test_compute_stats.TestHbaseComputeStats.test_hbase_compute_stats_incremental[exec_option:
 {'batch_size': 0, 'num_nodes': 0, 'disable_codegen_rows_threshold': 5000, 
'disable_codegen': False, 'abort_on_error': 1, 'debug_action': None, 
'exec_single_node_rows_threshold': 0} | table_format: hbase/none]
    
metadata.test_compute_stats.TestHbaseComputeStats.test_hbase_compute_stats[exec_option:
 {'batch_size': 0, 'num_nodes': 0, 'disable_codegen_rows_threshold': 5000, 
'disable_codegen': False, 'abort_on_error': 1, 'debug_action': None, 
'exec_single_node_rows_threshold': 0} | table_format: hbase/none]
    query_test.test_mt_dop.TestMtDop.test_mt_dop[mt_dop: 1 | exec_option: 
{'batch_size': 0, 'num_nodes': 0, 'disable_codegen_rows_threshold': 0, 
'disable_codegen': False, 'abort_on_error': 1, 'debug_action': None, 
'exec_single_node_rows_threshold': 0} | table_format: hbase/none]
    query_test.test_mt_dop.TestMtDop.test_compute_stats[mt_dop: 1 | 
exec_option: {'batch_size': 0, 'num_nodes': 0, 
'disable_codegen_rows_threshold': 0, 'disable_codegen': False, 
'abort_on_error': 1, 'debug_action': None, 'exec_single_node_rows_threshold': 
0} | table_format: hbase/none]
    
query_test.test_hbase_queries.TestHBaseQueries.test_hbase_scan_node[exec_option:
 {'batch_size': 0, 'num_nodes': 0, 'disable_codegen_rows_threshold': 0, 
'disable_codegen': False, 'abort_on_error': 1, 'debug_action': None, 
'exec_single_node_rows_threshold': 0} | table_format: hbase/none]
    query_test.test_queries.TestHdfsQueries.test_file_partitions[exec_option: 
{'batch_size': 0, 'num_nodes': 0, 'disable_codegen_rows_threshold': 0, 
'disable_codegen': False, 'abort_on_error': 1, 'debug_action': None, 
'exec_single_node_rows_threshold': 0} | table_format: hbase/none]
    query_test.test_mt_dop.TestMtDop.test_mt_dop[mt_dop: 0 | exec_option: 
{'batch_size': 0, 'num_nodes': 0, 'disable_codegen_rows_threshold': 0, 
'disable_codegen': False, 'abort_on_error': 1, 'debug_action': None, 
'exec_single_node_rows_threshold': 0} | table_format: hbase/none]
    query_test.test_observability.TestObservability.test_scan_summary
    query_test.test_mt_dop.TestMtDop.test_compute_stats[mt_dop: 0 | 
exec_option: {'batch_size': 0, 'num_nodes': 0, 
'disable_codegen_rows_threshold': 0, 'disable_codegen': False, 
'abort_on_error': 1, 'debug_action': None, 'exec_single_node_rows_threshold': 
0} | table_format: hbase/none]
    failure.test_failpoints.TestFailpoints.test_failpoints[table_format: 
hbase/none | exec_option: {'batch_size': 0, 'num_nodes': 0, 
'disable_codegen_rows_threshold': 0, 'disable_codegen': False, 
'abort_on_error': 1, 'debug_action': None, 'exec_single_node_rows_threshold': 
0} | mt_dop: 4 | location: GETNEXT_SCANNER | action: FAIL | query: select 1 
from alltypessmall order by id limit 100]
    failure.test_failpoints.TestFailpoints.test_failpoints[table_format: 
hbase/none | exec_option: {'batch_size': 0, 'num_nodes': 0, 
'disable_codegen_rows_threshold': 0, 'disable_codegen': False, 
'abort_on_error': 1, 'debug_action': None, 'exec_single_node_rows_threshold': 
0} | mt_dop: 0 | location: OPEN | action: CANCEL | query: select c from (select 
id c from alltypessmall order by id limit 10) v where c = 1]
    failure.test_failpoints.TestFailpoints.test_failpoints[table_format: 
hbase/none | exec_option: {'batch_size': 0, 'num_nodes': 0, 
'disable_codegen_rows_threshold': 0, 'disable_codegen': False, 
'abort_on_error': 1, 'debug_action': None, 'exec_single_node_rows_threshold': 
0} | mt_dop: 0 | location: CLOSE | action: MEM_LIMIT_EXCEEDED | query: select 
count(*) from alltypessmall]
    failure.test_failpoints.TestFailpoints.test_failpoints[table_format: 
hbase/none | exec_option: {'batch_size': 0, 'num_nodes': 0, 
'disable_codegen_rows_threshold': 0, 'disable_codegen': False, 
'abort_on_error': 1, 'debug_action': None, 'exec_single_node_rows_threshold': 
0} | mt_dop: 4 | location: PREPARE | action: MEM_LIMIT_EXCEEDED | query: select 
count(int_col) from alltypessmall group by id]
    failure.test_failpoints.TestFailpoints.test_failpoints[table_format: 
hbase/none | exec_option: {'batch_size': 0, 'num_nodes': 0, 
'disable_codegen_rows_threshold': 0, 'disable_codegen': False, 
'abort_on_error': 1, 'debug_action': None, 'exec_single_node_rows_threshold': 
0} | mt_dop: 4 | location: OPEN | action: MEM_LIMIT_EXCEEDED | query: select * 
from alltypessmall union all select * from alltypessmall]
    failure.test_failpoints.TestFailpoints.test_failpoints[table_format: 
hbase/none | exec_option: {'batch_size': 0, 'num_nodes': 0, 
'disable_codegen_rows_threshold': 0, 'disable_codegen': False, 
'abort_on_error': 1, 'debug_action': None, 'exec_single_node_rows_threshold': 
0} | mt_dop: 4 | location: CLOSE | action: MEM_LIMIT_EXCEEDED | query: select 
row_number() over (partition by int_col order by id) from alltypessmall]
    failure.test_failpoints.TestFailpoints.test_failpoints[table_format: 
hbase/none | exec_option: {'batch_size': 0, 'num_nodes': 0, 
'disable_codegen_rows_threshold': 0, 'disable_codegen': False, 
'abort_on_error': 1, 'debug_action': None, 'exec_single_node_rows_threshold': 
0} | mt_dop: 4 | location: CLOSE | action: MEM_LIMIT_EXCEEDED | query: select 1 
from alltypessmall order by id]
    failure.test_failpoints.TestFailpoints.test_failpoints[table_format: 
hbase/none | exec_option: {'batch_size': 0, 'num_nodes': 0, 
'disable_codegen_rows_threshold': 0, 'disable_codegen': False, 
'abort_on_error': 1, 'debug_action': None, 'exec_single_node_rows_threshold': 
0} | mt_dop: 4 | location: CLOSE | action: MEM_LIMIT_EXCEEDED | query: select * 
from alltypes]
    verifiers.test_verify_metrics.TestValidateMetrics.test_metrics_are_zero
    org.apache.impala.planner.PlannerTest.org.apache.impala.planner.PlannerTest
    
org.apache.impala.planner.S3PlannerTest.org.apache.impala.planner.S3PlannerTest
    failure.test_failpoints.TestFailpoints.test_failpoints[table_format: 
hbase/none | exec_option: {'batch_size': 0, 'num_nodes': 0, 
'disable_codegen_rows_threshold': 0, 'disable_codegen': False, 
'abort_on_error': 1, 'debug_action': None, 'exec_single_node_rows_threshold': 
0} | mt_dop: 4 | location: GETNEXT | action: FAIL | query: select 1 from 
alltypessmall a join alltypessmall b on a.id != b.id]
    failure.test_failpoints.TestFailpoints.test_failpoints[table_format: 
hbase/none | exec_option: {'batch_size': 0, 'num_nodes': 0, 
'disable_codegen_rows_threshold': 0, 'disable_codegen': False, 
'abort_on_error': 1, 'debug_action': None, 'exec_single_node_rows_threshold': 
0} | mt_dop: 4 | location: PREPARE_SCANNER | action: MEM_LIMIT_EXCEEDED | 
query: select 1 from alltypessmall a join alltypessmall b on a.id = b.id]
{noformat}

{noformat}

21:22:44 Running org.apache.impala.planner.S3PlannerTest
21:22:44 Tests run: 1, Failures: 0, Errors: 1, Skipped: 0, Time elapsed: 450.328 sec <<< FAILURE! - in org.apache.impala.planner.S3PlannerTest
21:22:44 org.apache.impala.planner.S3PlannerTest  Time elapsed: 450.328 sec  <<< ERROR!
21:22:44        at 
org.apache.impala.datagenerator.HBaseTestDataRegionAssignment.<init>(HBaseTestDataRegionAssignment.java:68)
21:22:44        at 
org.apache.impala.planner.PlannerTestBase.setUp(PlannerTestBase.java:120)
21:22:44        at 
org.apache.maven.surefire.junit4.JUnit4Provider.executeTestSet(JUnit4Provider.java:153)
21:22:44        at 
org.apache.impala.datagenerator.HBaseTestDataRegionAssignment.<init>(HBaseTestDataRegionAssignment.java:68)
21:22:44        at 
org.apache.impala.planner.PlannerTestBase.setUp(PlannerTestBase.java:120)
21:22:44        at 
org.apache.maven.surefire.junit4.JUnit4Provider.executeTestSet(JUnit4Provider.java:153)
21:22:44        at 
org.apache.impala.datagenerator.HBaseTestDataRegionAssignment.<init>(HBaseTestDataRegionAssignment.java:68)
21:22:44        at 
org.apache.impala.planner.PlannerTestBase.setUp(PlannerTestBase.java:120)
21:22:44        at 
org.apache.maven.surefire.junit4.JUnit4Provider.executeTestSet(JUnit4Provider.java:153)
21:22:44 Running org.apache.impala.planner.PlannerTest
21:22:44 Tests run: 1, Failures: 0, Errors: 1, Skipped: 0, Time elapsed: 450.602 sec <<< FAILURE! - in org.apache.impala.planner.PlannerTest
21:22:44 org.apache.impala.planner.PlannerTest  Time elapsed: 450.602 sec  <<< ERROR!
21:22:44        at 
org.apache.impala.datagenerator.HBaseTestDataRegionAssignment.<init>(HBaseTestDataRegionAssignment.java:68)
21:22:44        at 
org.apache.impala.planner.PlannerTestBase.setUp(PlannerTestBase.java:120)
21:22:44        at 
org.apache.maven.surefire.junit4.JUnit4Provider.executeTestSet(JUnit4Provider.java:153)
21:22:44        at 
org.apache.impala.datagenerator.HBaseTestDataRegionAssignment.<init>(HBaseTestDataRegionAssignment.java:68)
21:22:44        at 
org.apache.impala.planner.PlannerTestBase.setUp(PlannerTestBase.java:120)
21:22:44        at 
org.apache.maven.surefire.junit4.JUnit4Provider.executeTestSet(JUnit4Provider.java:153)
21:22:44        at 
org.apache.impala.datagenerator.HBaseTestDataRegionAssignment.<init>(HBaseTestDataRegionAssignment.java:68)
21:22:44        at 
org.apache.impala.planner.PlannerTestBase.setUp(PlannerTestBase.java:120)
21:22:44        at 
org.apache.maven.surefire.junit4.JUnit4Provider.executeTestSet(JUnit4Provider.java:153)
{noformat}

{noformat}
22:53:05 =================================== FAILURES ===================================
22:53:05  TestFailpoints.test_failpoints[table_format: hbase/none | 
exec_option: {'batch_size': 0, 'num_nodes': 0, 
'disable_codegen_rows_threshold': 0, 'disable_codegen': False, 
'abort_on_error': 1, 'debug_action': None, 'exec_single_node_rows_threshold': 
0} | mt_dop: 4 | location: GETNEXT_SCANNER | action: FAIL | query: select 1 
from alltypessmall order by id limit 100] 
22:53:05 failure/test_failpoints.py:102: in test_failpoints
22:53:05     raise e
22:53:05 E   ImpalaBeeswaxException: ImpalaBeeswaxException:
22:53:05 E    INNER EXCEPTION: <class 'beeswaxd.ttypes.BeeswaxException'>
22:53:05 E    MESSAGE: RuntimeException: couldn't retrieve HBase table (functional_hbase.alltypessmall) info:
22:53:05 E   Connection refused
22:53:05 E   CAUSED BY: ConnectException: Connection refused
22:53:05  TestFailpoints.test_failpoints[table_format: hbase/none | 
exec_option: {'batch_size': 0, 'num_nodes': 0, 
'disable_codegen_rows_threshold': 0, 'disable_codegen': False, 
'abort_on_error': 1, 'debug_action': None, 'exec_single_node_rows_threshold': 
0} | mt_dop: 0 | location: OPEN | action: CANCEL | query: select c from (select 
id c from alltypessmall order by id limit 10) v where c = 1] 
22:53:05 failure/test_failpoints.py:102: in test_failpoints
22:53:05     raise e
22:53:05 E   ImpalaBeeswaxException: ImpalaBeeswaxException:
22:53:05 E    INNER EXCEPTION: <class 'beeswaxd.ttypes.BeeswaxException'>
22:53:05 E    MESSAGE: RuntimeException: couldn't retrieve HBase table (functional_hbase.alltypessmall) info:
22:53:05 E   Connection refused
22:53:05 E   CAUSED BY: ConnectException: Connection refused
{noformat}

{noformat}
23:21:02  
TestHbaseComputeStats.test_hbase_compute_stats_incremental[exec_option: 
{'batch_size': 0, 'num_nodes': 0, 'disable_codegen_rows_threshold': 5000, 
'disable_codegen': False, 'abort_on_error': 1, 'debug_action': None, 
'exec_single_node_rows_threshold': 0} | table_format: hbase/none] 
23:21:02 [gw3] linux2 -- Python 2.7.5 
/data/jenkins/workspace/impala-asf-2.x-core/repos/Impala/bin/../infra/python/env/bin/python
23:21:02 metadata/test_compute_stats.py:147: in 
test_hbase_compute_stats_incremental
23:21:02     unique_database)
23:21:02 common/impala_test_suite.py:405: in run_test_case
23:21:02     result = self.__execute_query(target_impalad_client, query, 
user=user)
23:21:02 common/impala_test_suite.py:620: in __execute_query
23:21:02     return impalad_client.execute(query, user=user)
23:21:02 common/impala_connection.py:160: in execute
23:21:02     return self.__beeswax_client.execute(sql_stmt, user=user)
23:21:02 beeswax/impala_beeswax.py:173: in execute
23:21:02     handle = self.__execute_query(query_string.strip(), user=user)
23:21:02 beeswax/impala_beeswax.py:341: in __execute_query
23:21:02     self.wait_for_completion(handle)
23:21:02 beeswax/impala_beeswax.py:361: in wait_for_completion
23:21:02     raise ImpalaBeeswaxException("Query aborted:" + error_log, None)
23:21:02 E   ImpalaBeeswaxException: ImpalaBeeswaxException:
23:21:02 E    Query aborted:RuntimeException: couldn't retrieve HBase table (functional_hbase.alltypessmall) info:
23:21:02 E   This server is in the failed servers list: localhost/127.0.0.1:16202
23:21:02 E   CAUSED BY: FailedServerException: This server is in the failed servers list: localhost/127.0.0.1:16202
{noformat}



--
This message was sent by Atlassian JIRA
(v7.6.3#76005)

---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]

Reply via email to