[
https://issues.apache.org/jira/browse/IMPALA-11806?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=17681821#comment-17681821
]
Quanlong Huang edited comment on IMPALA-11806 at 1/30/23 1:12 AM:
------------------------------------------------------------------
Reopening this since I still see it failing in Ozone builds. The error message
is different, but that might be due to the recent fix:
{code:java}
F query_test/test_iceberg.py::TestIcebergTable::()::test_load[protocol: beeswax
| exec_option: {'test_replan': 1, 'batch_size': 0, 'num_nodes': 0,
'disable_codegen_rows_threshold': 0, 'disable_codegen': False,
'abort_on_error': 1, 'exec_single_node_rows_threshold': 0} | table_format:
parquet/none]
query_test/test_iceberg.py:842: in test_load
self.run_test_case('QueryTest/iceberg-load', vector,
use_db=unique_database)
common/impala_test_suite.py:773: in run_test_case
self.__verify_exceptions(test_section['CATCH'], str(e), use_db)
common/impala_test_suite.py:557: in __verify_exceptions
(expected_str, actual_str)
E AssertionError: Unexpected exception string. Expected: minimum memory
reservation is greater than memory available to the query for buffer
reservations
E Not found in actual: ImpalaBeeswaxException: INNER EXCEPTION: <class
'beeswaxd.ttypes.BeeswaxException'> MESSAGE: AnalysisException: INPATH location
'ofs://localhost:9862/tmp/test_load_a61184e9/parquet/00000-0-data-gfurnstahl_20220906113044_157fc172-f5d3-4c70-8653-fff150b6136a-job_16619542960420_0002-1-00001.parquet'
does not exist.{code}
Could you take a look again? [~tmate]
I have also added the logs:
{noformat}
---------------------------- Captured stderr setup -----------------------------
SET
client_identifier=query_test/test_iceberg.py::TestIcebergTable::()::test_load[protocol:beeswax|exec_option:{'test_replan':1;'batch_size':0;'num_nodes':0;'disable_codegen_rows_threshold':0;'disable_codegen':False;'abort_on_error':1;'exec_single_node_rows_threshold':0}|table;
SET sync_ddl=False;
-- executing against localhost:21000
DROP DATABASE IF EXISTS `test_load_a61184e9` CASCADE;
-- 2023-01-28 02:50:33,868 INFO MainThread: Started query
58461c91b3d336a7:2432b82e00000000
SET
client_identifier=query_test/test_iceberg.py::TestIcebergTable::()::test_load[protocol:beeswax|exec_option:{'test_replan':1;'batch_size':0;'num_nodes':0;'disable_codegen_rows_threshold':0;'disable_codegen':False;'abort_on_error':1;'exec_single_node_rows_threshold':0}|table;
SET sync_ddl=False;
-- executing against localhost:21000
CREATE DATABASE `test_load_a61184e9`;
-- 2023-01-28 02:50:40,221 INFO MainThread: Started query
c24370b426b545c3:6fa8231500000000
-- 2023-01-28 02:50:40,272 INFO MainThread: Created database
"test_load_a61184e9" for test ID
"query_test/test_iceberg.py::TestIcebergTable::()::test_load[protocol: beeswax
| exec_option: {'test_replan': 1, 'batch_size': 0, 'num_nodes': 0,
'disable_codegen_rows_threshold': 0, 'disable_codegen': False,
'abort_on_error': 1, 'exec_single_node_rows_threshold': 0} | table_format:
parquet/none]"
----------------------------- Captured stderr call -----------------------------
/data/jenkins/workspace/impala-cdwh-2023.0.13.0-core-ozone/repos/Impala/infra/python/env-gcc10.4.0/lib/python2.7/site-packages/avro/schema.py:1048:
IgnoredLogicalType: Unknown map, using array.
warnings.warn(IgnoredLogicalType("Unknown {}, using {}.".format(logical_type,
type_)))
23/01/28 02:51:05 WARN impl.MetricsConfig: Cannot locate configuration: tried
hadoop-metrics2-xceiverclientmetrics.properties,hadoop-metrics2.properties
23/01/28 02:51:05 INFO impl.MetricsSystemImpl: Scheduled Metric snapshot period
at 10 second(s).
23/01/28 02:51:05 INFO impl.MetricsSystemImpl: XceiverClientMetrics metrics
system started
23/01/28 02:51:06 INFO metrics.MetricRegistries: Loaded MetricRegistries class
org.apache.ratis.metrics.impl.MetricRegistriesImpl
-- executing against localhost:21000
create external table test_load_a61184e9.iceberg_mixed_file_format_test stored
as iceberg location
'ofs://localhost:9862/impala/test-warehouse/iceberg_mixed_file_format_test'
tblproperties('write.format.default'='parquet',
'iceberg.catalog'=
'hadoop.tables');
-- 2023-01-28 02:51:07,100 INFO MainThread: Started query
3d461f30b9331806:dbe7ea7000000000
-- executing against localhost:21000
alter table test_load_a61184e9.iceberg_mixed_file_format_test set tblproperties
('external.table.purge'=
'True');;
-- 2023-01-28 02:51:12,916 INFO MainThread: Started query
8c4c9685cc4512fd:51b2417c00000000
SET
client_identifier=query_test/test_iceberg.py::TestIcebergTable::()::test_load[protocol:beeswax|exec_option:{'test_replan':1;'batch_size':0;'num_nodes':0;'disable_codegen_rows_threshold':0;'disable_codegen':False;'abort_on_error':1;'exec_single_node_rows_threshold':0}|table;
-- executing against localhost:21000
use test_load_a61184e9;
-- 2023-01-28 02:51:13,120 INFO MainThread: Started query
3c4a5bba881f8c96:f7ff062c00000000
SET
client_identifier=query_test/test_iceberg.py::TestIcebergTable::()::test_load[protocol:beeswax|exec_option:{'test_replan':1;'batch_size':0;'num_nodes':0;'disable_codegen_rows_threshold':0;'disable_codegen':False;'abort_on_error':1;'exec_single_node_rows_threshold':0}|table;
SET test_replan=1;
SET batch_size=0;
SET num_nodes=0;
SET disable_codegen_rows_threshold=0;
SET disable_codegen=False;
SET abort_on_error=1;
SET exec_single_node_rows_threshold=0;
-- 2023-01-28 02:51:13,120 INFO MainThread: Loading query test file:
/data/jenkins/workspace/impala-cdwh-2023.0.13.0-core-ozone/repos/Impala/testdata/workloads/functional-query/queries/QueryTest/iceberg-load.test
-- executing against localhost:21000
create table test_iceberg_load_parquet like iceberg_mixed_file_format_test
stored as iceberg;
-- 2023-01-28 02:51:14,684 INFO MainThread: Started query
3d4a0a7f0c3ccdec:2d9fe5cf00000000
-- executing against localhost:21000
set mem_limit=1;
-- 2023-01-28 02:51:14,938 INFO MainThread: Started query
2f459d894fb8f77b:ce500c1a00000000
-- executing against localhost:21000
load data inpath
'/tmp/test_load_a61184e9/parquet/00000-0-data-gfurnstahl_20220906113044_157fc172-f5d3-4c70-8653-fff150b6136a-job_16619542960420_0002-1-00001.parquet'
into table test_iceberg_load_parquet;
-- executing against localhost:21000
SET MEM_LIMIT="0";
-- 2023-01-28 02:51:18,992 INFO MainThread: Started query
ae44d82bd603ffcd:90040d3a00000000 {noformat}
was (Author: stiga-huang):
Reopening this since I still see it failing in Ozone builds. The error message
is different, but that might be due to the recent fix:
{code:java}
F query_test/test_iceberg.py::TestIcebergTable::()::test_load[protocol: beeswax
| exec_option: {'test_replan': 1, 'batch_size': 0, 'num_nodes': 0,
'disable_codegen_rows_threshold': 0, 'disable_codegen': False,
'abort_on_error': 1, 'exec_single_node_rows_threshold': 0} | table_format:
parquet/none]
query_test/test_iceberg.py:842: in test_load
self.run_test_case('QueryTest/iceberg-load', vector,
use_db=unique_database)
common/impala_test_suite.py:773: in run_test_case
self.__verify_exceptions(test_section['CATCH'], str(e), use_db)
common/impala_test_suite.py:557: in __verify_exceptions
(expected_str, actual_str)
E AssertionError: Unexpected exception string. Expected: minimum memory
reservation is greater than memory available to the query for buffer
reservations
E Not found in actual: ImpalaBeeswaxException: INNER EXCEPTION: <class
'beeswaxd.ttypes.BeeswaxException'> MESSAGE: AnalysisException: INPATH location
'ofs://localhost:9862/tmp/test_load_a61184e9/parquet/00000-0-data-gfurnstahl_20220906113044_157fc172-f5d3-4c70-8653-fff150b6136a-job_16619542960420_0002-1-00001.parquet'
does not exist.{code}
Could you take a look again? [~tmate]
> TestIcebergTable.test_load failed
> ---------------------------------
>
> Key: IMPALA-11806
> URL: https://issues.apache.org/jira/browse/IMPALA-11806
> Project: IMPALA
> Issue Type: Bug
> Components: Backend
> Affects Versions: Impala 4.3.0
> Reporter: Wenzhe Zhou
> Assignee: Tamas Mate
> Priority: Critical
> Fix For: Impala 4.3.0
>
>
> TestIcebergTable.test_load was added by IMPALA-11339 (Add Iceberg LOAD DATA
> INPATH statement). It failed in core-ozone build.
> *Error Message*
> query_test/test_iceberg.py:805: in test_load
> self.hdfs_client.make_dir(DST_DIR, permission=777) E AttributeError:
> 'TestIcebergTable' object has no attribute 'hdfs_client'
> *Stacktrace*
> query_test/test_iceberg.py:805: in test_load
> self.hdfs_client.make_dir(DST_DIR, permission=777)
> E AttributeError: 'TestIcebergTable' object has no attribute 'hdfs_client'
> Standard Error
> SET
> client_identifier=query_test/test_iceberg.py::TestIcebergTable::()::test_load[protocol:beeswax|exec_option:{'test_replan':1;'batch_size':0;'num_nodes':0;'disable_codegen_rows_threshold':0;'disable_codegen':False;'abort_on_error':1;'exec_single_node_rows_threshold':0}|table;
> SET sync_ddl=False;
> -- executing against localhost:21000
> DROP DATABASE IF EXISTS `test_load_a61184e9` CASCADE;
> -- 2022-12-16 09:11:10,345 INFO MainThread: Started query
> 7748bb1822e271fa:9bada05000000000
> SET
> client_identifier=query_test/test_iceberg.py::TestIcebergTable::()::test_load[protocol:beeswax|exec_option:{'test_replan':1;'batch_size':0;'num_nodes':0;'disable_codegen_rows_threshold':0;'disable_codegen':False;'abort_on_error':1;'exec_single_node_rows_threshold':0}|table;
> SET sync_ddl=False;
> -- executing against localhost:21000
> CREATE DATABASE `test_load_a61184e9`;
> -- 2022-12-16 09:11:14,357 INFO MainThread: Started query
> 2649fc95833f8f75:cafcfec300000000
> -- 2022-12-16 09:11:14,408 INFO MainThread: Created database
> "test_load_a61184e9" for test ID
> "query_test/test_iceberg.py::TestIcebergTable::()::test_load[protocol:
> beeswax | exec_option: {'test_replan': 1, 'batch_size': 0, 'num_nodes': 0,
> 'disable_codegen_rows_threshold': 0, 'disable_codegen': False,
> 'abort_on_error': 1, 'exec_single_node_rows_threshold': 0} | table_format:
> parquet/none]"
--
This message was sent by Atlassian Jira
(v8.20.10#820010)
---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]