[ 
https://issues.apache.org/jira/browse/HIVE-15870?page=com.atlassian.jira.plugin.system.issuetabpanels:all-tabpanel
 ]

Sergey Shelukhin updated HIVE-15870:
------------------------------------
    Description: 
Both single-join queries produce results, but the last (two-join) query does not.
Judging by the MM logs, the inputs appear to be read correctly, so the cause must be
something Parquet-specific with respect to multiple files in a table.
{noformat}
set hive.optimize.index.filter = true;
set hive.auto.convert.join=false;

CREATE TABLE tbl1(id INT) STORED AS PARQUET;
INSERT INTO tbl1 VALUES(1), (2);

CREATE TABLE tbl2(id INT, value STRING) STORED AS PARQUET;
INSERT INTO tbl2 VALUES(1, 'value1');
INSERT INTO tbl2 VALUES(1, 'value2');

select tbl1.id, t1.value
FROM tbl1
JOIN (SELECT * FROM tbl2 WHERE value='value2') t1 ON tbl1.id=t1.id;
select tbl1.id, t1.value
FROM tbl1
JOIN (SELECT * FROM tbl2 WHERE value='value1') t1 ON tbl1.id=t1.id;

select tbl1.id, t1.value, t2.value
FROM tbl1
JOIN (SELECT * FROM tbl2 WHERE value='value1') t1 ON tbl1.id=t1.id
JOIN (SELECT * FROM tbl2 WHERE value='value2') t2 ON tbl1.id=t2.id;
{noformat}

  was:
Either of the single-join queries produces results, but not the last query.
Looking at MM logs, it looks like the inputs are read correctly. Must be 
something parquet-specific w.r.t. multiple files in a table.
{noformat}
set hive.optimize.index.filter = true;
set hive.auto.convert.join=false;

CREATE TABLE tbl1(id INT) STORED AS PARQUET;
INSERT INTO tbl1 VALUES(1), (2);

CREATE TABLE tbl2(id INT, value STRING) STORED AS PARQUET;
INSERT INTO tbl2 VALUES(1, 'value1');
INSERT INTO tbl2 VALUES(1, 'value2');

select tbl1.id, t1.value
FROM tbl1
JOIN (SELECT * FROM tbl2 WHERE value='value2') t1 ON tbl1.id=t1.id;
select tbl1.id, t1.value
FROM tbl1
JOIN (SELECT * FROM tbl2 WHERE value='value1') t1 ON tbl1.id=t1.id;

select tbl1.id, t1.value, t2.value
FROM tbl1
JOIN (SELECT * FROM tbl2 WHERE value='value1') t1 ON tbl1.id=t1.id
JOIN (SELECT * FROM tbl2 WHERE value='value2') t2 ON tbl1.id=t2.id;
{noformat}


> MM tables - parquet_join test fails
> -----------------------------------
>
>                 Key: HIVE-15870
>                 URL: https://issues.apache.org/jira/browse/HIVE-15870
>             Project: Hive
>          Issue Type: Sub-task
>            Reporter: Sergey Shelukhin
>
> Both single-join queries produce results, but the last (two-join) query does not.
> Judging by the MM logs, the inputs appear to be read correctly, so the cause must be
> something Parquet-specific with respect to multiple files in a table.
> {noformat}
> set hive.optimize.index.filter = true;
> set hive.auto.convert.join=false;
> CREATE TABLE tbl1(id INT) STORED AS PARQUET;
> INSERT INTO tbl1 VALUES(1), (2);
> CREATE TABLE tbl2(id INT, value STRING) STORED AS PARQUET;
> INSERT INTO tbl2 VALUES(1, 'value1');
> INSERT INTO tbl2 VALUES(1, 'value2');
> select tbl1.id, t1.value
> FROM tbl1
> JOIN (SELECT * FROM tbl2 WHERE value='value2') t1 ON tbl1.id=t1.id;
> select tbl1.id, t1.value
> FROM tbl1
> JOIN (SELECT * FROM tbl2 WHERE value='value1') t1 ON tbl1.id=t1.id;
> select tbl1.id, t1.value, t2.value
> FROM tbl1
> JOIN (SELECT * FROM tbl2 WHERE value='value1') t1 ON tbl1.id=t1.id
> JOIN (SELECT * FROM tbl2 WHERE value='value2') t2 ON tbl1.id=t2.id;
> {noformat}



--
This message was sent by Atlassian JIRA
(v6.3.15#6346)

Reply via email to