Vikram Ahuja created HIVE-29099:
-----------------------------------
Summary: Select query result mismatch between an Iceberg table and a Hive
table for the same inserted data
Key: HIVE-29099
URL: https://issues.apache.org/jira/browse/HIVE-29099
Project: Hive
Issue Type: Bug
Reporter: Vikram Ahuja
Assignee: Vikram Ahuja
Hive Table:
drop table tbl_parquet;
create external table tbl_parquet(a int) partitioned by (b string) stored as
parquet;
insert into tbl_parquet values(1,'');
insert into tbl_parquet values(2,null);
insert into tbl_parquet values(3, NULL);
select count(*) from tbl_parquet where b = ''; -> Returns 0
select count(*) from tbl_parquet where b != ''; -> Returns 3
Iceberg Table:
drop table tbl_parquet_iceberg;
create external table tbl_parquet_iceberg(a int) partitioned by (b string)
stored by iceberg stored as parquet;
insert into tbl_parquet_iceberg values(1,'');
insert into tbl_parquet_iceberg values(2,null);
insert into tbl_parquet_iceberg values(3, NULL);
select count(*) from tbl_parquet_iceberg where b = ''; -> Returns 1
select count(*) from tbl_parquet_iceberg where b != ''; -> Returns 2
--
This message was sent by Atlassian Jira
(v8.20.10#820010)