[ 
https://issues.apache.org/jira/browse/IMPALA-11806?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=17681821#comment-17681821
 ] 

Quanlong Huang edited comment on IMPALA-11806 at 1/30/23 1:12 AM:
------------------------------------------------------------------

Reopening this since it still fails in Ozone builds. The error message is 
different, but that might be due to the recent fix:
{code:java}
F query_test/test_iceberg.py::TestIcebergTable::()::test_load[protocol: beeswax 
| exec_option: {'test_replan': 1, 'batch_size': 0, 'num_nodes': 0, 
'disable_codegen_rows_threshold': 0, 'disable_codegen': False, 
'abort_on_error': 1, 'exec_single_node_rows_threshold': 0} | table_format: 
parquet/none]
 query_test/test_iceberg.py:842: in test_load
     self.run_test_case('QueryTest/iceberg-load', vector, 
use_db=unique_database)
 common/impala_test_suite.py:773: in run_test_case
     self.__verify_exceptions(test_section['CATCH'], str(e), use_db)
 common/impala_test_suite.py:557: in __verify_exceptions
     (expected_str, actual_str)
 E   AssertionError: Unexpected exception string. Expected: minimum memory 
reservation is greater than memory available to the query for buffer 
reservations
 E   Not found in actual: ImpalaBeeswaxException: INNER EXCEPTION: <class 
'beeswaxd.ttypes.BeeswaxException'> MESSAGE: AnalysisException: INPATH location 
'ofs://localhost:9862/tmp/test_load_a61184e9/parquet/00000-0-data-gfurnstahl_20220906113044_157fc172-f5d3-4c70-8653-fff150b6136a-job_16619542960420_0002-1-00001.parquet'
 does not exist.{code}
Could you take a look again? [~tmate] 

Also added the logs:
{noformat}
---------------------------- Captured stderr setup -----------------------------
SET 
client_identifier=query_test/test_iceberg.py::TestIcebergTable::()::test_load[protocol:beeswax|exec_option:{'test_replan':1;'batch_size':0;'num_nodes':0;'disable_codegen_rows_threshold':0;'disable_codegen':False;'abort_on_error':1;'exec_single_node_rows_threshold':0}|table;
SET sync_ddl=False;
-- executing against localhost:21000

DROP DATABASE IF EXISTS `test_load_a61184e9` CASCADE;

-- 2023-01-28 02:50:33,868 INFO     MainThread: Started query 
58461c91b3d336a7:2432b82e00000000
SET 
client_identifier=query_test/test_iceberg.py::TestIcebergTable::()::test_load[protocol:beeswax|exec_option:{'test_replan':1;'batch_size':0;'num_nodes':0;'disable_codegen_rows_threshold':0;'disable_codegen':False;'abort_on_error':1;'exec_single_node_rows_threshold':0}|table;
SET sync_ddl=False;
-- executing against localhost:21000

CREATE DATABASE `test_load_a61184e9`;

-- 2023-01-28 02:50:40,221 INFO     MainThread: Started query 
c24370b426b545c3:6fa8231500000000
-- 2023-01-28 02:50:40,272 INFO     MainThread: Created database 
"test_load_a61184e9" for test ID 
"query_test/test_iceberg.py::TestIcebergTable::()::test_load[protocol: beeswax 
| exec_option: {'test_replan': 1, 'batch_size': 0, 'num_nodes': 0, 
'disable_codegen_rows_threshold': 0, 'disable_codegen': False, 
'abort_on_error': 1, 'exec_single_node_rows_threshold': 0} | table_format: 
parquet/none]"
----------------------------- Captured stderr call -----------------------------
/data/jenkins/workspace/impala-cdwh-2023.0.13.0-core-ozone/repos/Impala/infra/python/env-gcc10.4.0/lib/python2.7/site-packages/avro/schema.py:1048:
 IgnoredLogicalType: Unknown map, using array.
  warnings.warn(IgnoredLogicalType("Unknown {}, using {}.".format(logical_type, 
type_)))
23/01/28 02:51:05 WARN impl.MetricsConfig: Cannot locate configuration: tried 
hadoop-metrics2-xceiverclientmetrics.properties,hadoop-metrics2.properties
23/01/28 02:51:05 INFO impl.MetricsSystemImpl: Scheduled Metric snapshot period 
at 10 second(s).
23/01/28 02:51:05 INFO impl.MetricsSystemImpl: XceiverClientMetrics metrics 
system started
23/01/28 02:51:06 INFO metrics.MetricRegistries: Loaded MetricRegistries class 
org.apache.ratis.metrics.impl.MetricRegistriesImpl
-- executing against localhost:21000

create external table test_load_a61184e9.iceberg_mixed_file_format_test stored 
as iceberg location 
'ofs://localhost:9862/impala/test-warehouse/iceberg_mixed_file_format_test'
                        tblproperties('write.format.default'='parquet', 
'iceberg.catalog'=
                        'hadoop.tables');

-- 2023-01-28 02:51:07,100 INFO     MainThread: Started query 
3d461f30b9331806:dbe7ea7000000000
-- executing against localhost:21000

alter table test_load_a61184e9.iceberg_mixed_file_format_test set tblproperties 
('external.table.purge'=
                        'True');;

-- 2023-01-28 02:51:12,916 INFO     MainThread: Started query 
8c4c9685cc4512fd:51b2417c00000000
SET 
client_identifier=query_test/test_iceberg.py::TestIcebergTable::()::test_load[protocol:beeswax|exec_option:{'test_replan':1;'batch_size':0;'num_nodes':0;'disable_codegen_rows_threshold':0;'disable_codegen':False;'abort_on_error':1;'exec_single_node_rows_threshold':0}|table;
-- executing against localhost:21000

use test_load_a61184e9;

-- 2023-01-28 02:51:13,120 INFO     MainThread: Started query 
3c4a5bba881f8c96:f7ff062c00000000
SET 
client_identifier=query_test/test_iceberg.py::TestIcebergTable::()::test_load[protocol:beeswax|exec_option:{'test_replan':1;'batch_size':0;'num_nodes':0;'disable_codegen_rows_threshold':0;'disable_codegen':False;'abort_on_error':1;'exec_single_node_rows_threshold':0}|table;
SET test_replan=1;
SET batch_size=0;
SET num_nodes=0;
SET disable_codegen_rows_threshold=0;
SET disable_codegen=False;
SET abort_on_error=1;
SET exec_single_node_rows_threshold=0;
-- 2023-01-28 02:51:13,120 INFO     MainThread: Loading query test file: 
/data/jenkins/workspace/impala-cdwh-2023.0.13.0-core-ozone/repos/Impala/testdata/workloads/functional-query/queries/QueryTest/iceberg-load.test
-- executing against localhost:21000

create table test_iceberg_load_parquet like iceberg_mixed_file_format_test
stored as iceberg;

-- 2023-01-28 02:51:14,684 INFO     MainThread: Started query 
3d4a0a7f0c3ccdec:2d9fe5cf00000000
-- executing against localhost:21000

set mem_limit=1;

-- 2023-01-28 02:51:14,938 INFO     MainThread: Started query 
2f459d894fb8f77b:ce500c1a00000000
-- executing against localhost:21000


load data inpath 
'/tmp/test_load_a61184e9/parquet/00000-0-data-gfurnstahl_20220906113044_157fc172-f5d3-4c70-8653-fff150b6136a-job_16619542960420_0002-1-00001.parquet'
into table test_iceberg_load_parquet;

-- executing against localhost:21000

SET MEM_LIMIT="0";

-- 2023-01-28 02:51:18,992 INFO     MainThread: Started query 
ae44d82bd603ffcd:90040d3a00000000 {noformat}


was (Author: stiga-huang):
Reopening this since it still fails in Ozone builds. The error message is 
different, but that might be due to the recent fix:
{code:java}
F query_test/test_iceberg.py::TestIcebergTable::()::test_load[protocol: beeswax 
| exec_option: {'test_replan': 1, 'batch_size': 0, 'num_nodes': 0, 
'disable_codegen_rows_threshold': 0, 'disable_codegen': False, 
'abort_on_error': 1, 'exec_single_node_rows_threshold': 0} | table_format: 
parquet/none]
 query_test/test_iceberg.py:842: in test_load
     self.run_test_case('QueryTest/iceberg-load', vector, 
use_db=unique_database)
 common/impala_test_suite.py:773: in run_test_case
     self.__verify_exceptions(test_section['CATCH'], str(e), use_db)
 common/impala_test_suite.py:557: in __verify_exceptions
     (expected_str, actual_str)
 E   AssertionError: Unexpected exception string. Expected: minimum memory 
reservation is greater than memory available to the query for buffer 
reservations
 E   Not found in actual: ImpalaBeeswaxException: INNER EXCEPTION: <class 
'beeswaxd.ttypes.BeeswaxException'> MESSAGE: AnalysisException: INPATH location 
'ofs://localhost:9862/tmp/test_load_a61184e9/parquet/00000-0-data-gfurnstahl_20220906113044_157fc172-f5d3-4c70-8653-fff150b6136a-job_16619542960420_0002-1-00001.parquet'
 does not exist.{code}
Could you take a look again? [~tmate] 

> TestIcebergTable.test_load failed
> ---------------------------------
>
>                 Key: IMPALA-11806
>                 URL: https://issues.apache.org/jira/browse/IMPALA-11806
>             Project: IMPALA
>          Issue Type: Bug
>          Components: Backend
>    Affects Versions: Impala 4.3.0
>            Reporter: Wenzhe Zhou
>            Assignee: Tamas Mate
>            Priority: Critical
>             Fix For: Impala 4.3.0
>
>
> TestIcebergTable.test_load was added by IMPALA-11339 (Add Iceberg LOAD DATA 
> INPATH statement). It failed in the core-ozone build.
> *Error Message*
> query_test/test_iceberg.py:805: in test_load     
> self.hdfs_client.make_dir(DST_DIR, permission=777) E   AttributeError: 
> 'TestIcebergTable' object has no attribute 'hdfs_client'
> *Stacktrace*
> query_test/test_iceberg.py:805: in test_load
>     self.hdfs_client.make_dir(DST_DIR, permission=777)
> E   AttributeError: 'TestIcebergTable' object has no attribute 'hdfs_client'
> Standard Error
> SET 
> client_identifier=query_test/test_iceberg.py::TestIcebergTable::()::test_load[protocol:beeswax|exec_option:{'test_replan':1;'batch_size':0;'num_nodes':0;'disable_codegen_rows_threshold':0;'disable_codegen':False;'abort_on_error':1;'exec_single_node_rows_threshold':0}|table;
> SET sync_ddl=False;
> -- executing against localhost:21000
> DROP DATABASE IF EXISTS `test_load_a61184e9` CASCADE;
> -- 2022-12-16 09:11:10,345 INFO     MainThread: Started query 
> 7748bb1822e271fa:9bada05000000000
> SET 
> client_identifier=query_test/test_iceberg.py::TestIcebergTable::()::test_load[protocol:beeswax|exec_option:{'test_replan':1;'batch_size':0;'num_nodes':0;'disable_codegen_rows_threshold':0;'disable_codegen':False;'abort_on_error':1;'exec_single_node_rows_threshold':0}|table;
> SET sync_ddl=False;
> -- executing against localhost:21000
> CREATE DATABASE `test_load_a61184e9`;
> -- 2022-12-16 09:11:14,357 INFO     MainThread: Started query 
> 2649fc95833f8f75:cafcfec300000000
> -- 2022-12-16 09:11:14,408 INFO     MainThread: Created database 
> "test_load_a61184e9" for test ID 
> "query_test/test_iceberg.py::TestIcebergTable::()::test_load[protocol: 
> beeswax | exec_option: {'test_replan': 1, 'batch_size': 0, 'num_nodes': 0, 
> 'disable_codegen_rows_threshold': 0, 'disable_codegen': False, 
> 'abort_on_error': 1, 'exec_single_node_rows_threshold': 0} | table_format: 
> parquet/none]"



--
This message was sent by Atlassian Jira
(v8.20.10#820010)

---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]

Reply via email to