zhaolong created HIVE-25523:
-------------------------------

             Summary: data loss when a non-bucketed table is converted to a 
bucket map join in Tez
                 Key: HIVE-25523
                 URL: https://issues.apache.org/jira/browse/HIVE-25523
             Project: Hive
          Issue Type: Bug
    Affects Versions: 3.1.0
            Reporter: zhaolong
         Attachments: image-2021-09-15-10-44-43-366.png, 
image-2021-09-15-10-46-57-668.png

-- Reproduction schema: two tables with identical column definitions, both
-- stored as comma-delimited text files. Neither definition has a
-- CLUSTERED BY clause, i.e. both tables are non-bucketed.
create table wtest (equi_type varchar(765), ym string, trade_typ_code string, 
cons_no string, t_settle_pq decimal(38,0), fl string)
 row format delimited fields terminated by ',' stored as textfile ;

create table wtest2 (equi_type varchar(765), ym string, trade_typ_code string, 
cons_no string, t_settle_pq decimal(38,0), fl string)
 row format delimited fields terminated by ',' stored as textfile ;

-- Both tables are loaded from the same local file, so they contain the same
-- rows. The data file itself is not included in this report.
load data local inpath '/opt/000000_0' into table wtest;

load data local inpath '/opt/000000_0' into table wtest2;

-- Run the reproduction on the Tez execution engine.
set hive.execution.engine=tez;

-- Each subquery groups one table by (equi_type, ym, fl) and counts the
-- distinct cons_no values per group as z. The two aggregates are then
-- joined on equi_type, fl and ym via equality predicates in the WHERE clause.
-- Only x1's count (x1.z) is selected; x2.z is computed but not returned.
-- According to this report, the query returns a wrong result on Tez.
select x1.equi_type, x1.ym, x1.fl, x1.z,x2.fl
 from
 (
 select equi_type,ym,count(distinct cons_no) z,fl
 from wtest 
 group by equi_type,ym,fl
 ) x1,
 (
 select equi_type,ym,count(distinct cons_no) z,fl
 from wtest2 
 group by equi_type,ym,fl
 ) x2
 where
 x1.equi_type = x2.equi_type and x1.fl = x2.fl and x1.ym = x2.ym;

 

The query returns a wrong result:

!image-2021-09-15-10-44-43-366.png!

 

When map join is disabled, or hive.convert.join.bucket.mapjoin.tez is set to 
false, the result is correct.

!image-2021-09-15-10-46-57-668.png!



--
This message was sent by Atlassian Jira
(v8.3.4#803005)

Reply via email to