Vikram Ahuja created HIVE-29099:
-----------------------------------

             Summary: Select query result mismatch between Iceberg table and Hive table for the same inserted data
                 Key: HIVE-29099
                 URL: https://issues.apache.org/jira/browse/HIVE-29099
             Project: Hive
          Issue Type: Bug
            Reporter: Vikram Ahuja
            Assignee: Vikram Ahuja


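The same three rows (one with an empty-string partition value and two with a NULL partition value) are inserted into a Hive table and an Iceberg table, but the two tables return different counts for the same predicates on the partition column.

Hive Table: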
 
drop table tbl_parquet;
create external table tbl_parquet(a int) partitioned by (b string) stored as 
parquet;
insert into tbl_parquet values(1,'');
insert into tbl_parquet values(2,null);
insert into tbl_parquet values(3, NULL);
select count(*) from tbl_parquet where b = ''; -> Returns 0
select count(*) from tbl_parquet where b != ''; -> Returns 3
 
Iceberg Table:
drop table tbl_parquet_iceberg;
create external table tbl_parquet_iceberg(a int) partitioned by (b string) 
stored by iceberg stored as parquet;
insert into tbl_parquet_iceberg values(1,'');
insert into tbl_parquet_iceberg values(2,null);
insert into tbl_parquet_iceberg values(3, NULL);
select count(*) from tbl_parquet_iceberg where b = ''; -> Returns 1
select count(*) from tbl_parquet_iceberg where b != ''; -> Returns 2
 



--
This message was sent by Atlassian Jira
(v8.20.10#820010)

Reply via email to