dongjoon-hyun commented on a change in pull request #24860: [SPARK-28034][SQL] 
Port with.sql
URL: https://github.com/apache/spark/pull/24860#discussion_r300815838
 
 

 ##########
 File path: sql/core/src/test/resources/sql-tests/inputs/pgSQL/with.sql
 ##########
 @@ -0,0 +1,1222 @@
+--
+-- Portions Copyright (c) 1996-2019, PostgreSQL Global Development Group
+--
+--
+-- WITH
+-- 
https://github.com/postgres/postgres/blob/REL_12_BETA2/src/test/regress/sql/with.sql
+--
+-- This test suite contains two Cartesian products without using explicit 
CROSS JOIN syntax.
+-- Thus, we set spark.sql.crossJoin.enabled to true.
+set spark.sql.crossJoin.enabled=true;
+
+--
+-- Tests for common table expressions (WITH query, ... SELECT ...)
+--
+
+-- Basic WITH
+WITH q1(x,y) AS (SELECT 1,2)
+SELECT * FROM q1, q1 AS q2;
+
+-- Multiple uses are evaluated only once
+-- [SPARK-19799] Support recursive SQL query
+--SELECT count(*) FROM (
+--  WITH q1(x) AS (SELECT random() FROM generate_series(1, 5))
+--    SELECT * FROM q1
+--  UNION
+--    SELECT * FROM q1
+--) ss;
+
+-- WITH RECURSIVE
+
+-- sum of 1..100
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE t(n) AS (
+--    VALUES (1)
+--UNION ALL
+--    SELECT n+1 FROM t WHERE n < 100
+--)
+--SELECT sum(n) FROM t;
+
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE t(n) AS (
+--    SELECT (VALUES(1))
+--UNION ALL
+--    SELECT n+1 FROM t WHERE n < 5
+--)
+--SELECT * FROM t;
+
+-- recursive view
+-- [SPARK-24497] Support recursive SQL query
+--CREATE RECURSIVE VIEW nums (n) AS
+--    VALUES (1)
+--UNION ALL
+--    SELECT n+1 FROM nums WHERE n < 5;
+--
+--SELECT * FROM nums;
+
+-- [SPARK-24497] Support recursive SQL query
+--CREATE OR REPLACE RECURSIVE VIEW nums (n) AS
+--    VALUES (1)
+--UNION ALL
+--    SELECT n+1 FROM nums WHERE n < 6;
+--
+--SELECT * FROM nums;
+
+-- This is an infinite loop with UNION ALL, but not with UNION
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE t(n) AS (
+--    SELECT 1
+--UNION
+--    SELECT 10-n FROM t)
+--SELECT * FROM t;
+
+-- This'd be an infinite loop, but outside query reads only as much as needed
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE t(n) AS (
+--    VALUES (1)
+--UNION ALL
+--    SELECT n+1 FROM t)
+--SELECT * FROM t LIMIT 10;
+
+-- UNION case should have same property
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE t(n) AS (
+--    SELECT 1
+--UNION
+--    SELECT n+1 FROM t)
+--SELECT * FROM t LIMIT 10;
+
+-- Test behavior with an unknown-type literal in the WITH
+-- [SPARK-28146] Support IS OF type predicate
+--WITH q AS (SELECT 'foo' AS x)
+--SELECT x, x IS OF (text) AS is_text FROM q;
+
+-- [SPARK-24497] Support recursive SQL query
+-- [SPARK-28146] Support IS OF type predicate
+--WITH RECURSIVE t(n) AS (
+--    SELECT 'foo'
+--UNION ALL
+--    SELECT n || ' bar' FROM t WHERE length(n) < 20
+--)
+--SELECT n, n IS OF (text) AS is_text FROM t;
+
+-- In a perfect world, this would work and resolve the literal as int ...
+-- but for now, we have to be content with resolving to text too soon.
+-- [SPARK-24497] Support recursive SQL query
+-- [SPARK-28146] Support IS OF type predicate
+--WITH RECURSIVE t(n) AS (
+--    SELECT '7'
+--UNION ALL
+--    SELECT n+1 FROM t WHERE n < 10
+--)
+--SELECT n, n IS OF (int) AS is_int FROM t;
+
+--
+-- Some examples with a tree
+--
+-- department structure represented here is as follows:
+--
+-- ROOT-+->A-+->B-+->C
+--      |         |
+--      |         +->D-+->F
+--      +->E-+->G
+
+
+-- [ORIGINAL SQL]
+--CREATE TEMP TABLE department (
+--     id INTEGER PRIMARY KEY,  -- department ID
+--     parent_department INTEGER REFERENCES department, -- upper department ID
+--     name string -- department name
+--);
+CREATE TABLE department (
+       id INTEGER,  -- department ID
+       parent_department INTEGER, -- upper department ID
+       name string -- department name
+) USING parquet;
+
+INSERT INTO department VALUES (0, NULL, 'ROOT');
+INSERT INTO department VALUES (1, 0, 'A');
+INSERT INTO department VALUES (2, 1, 'B');
+INSERT INTO department VALUES (3, 2, 'C');
+INSERT INTO department VALUES (4, 2, 'D');
+INSERT INTO department VALUES (5, 0, 'E');
+INSERT INTO department VALUES (6, 4, 'F');
+INSERT INTO department VALUES (7, 5, 'G');
+
+
+-- extract all departments under 'A'. Result should be A, B, C, D and F
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE subdepartment AS
+--(
+--     -- non recursive term
+--     SELECT name as root_name, * FROM department WHERE name = 'A'
+--
+--     UNION ALL
+--
+--     -- recursive term
+--     SELECT sd.root_name, d.* FROM department AS d, subdepartment AS sd
+--             WHERE d.parent_department = sd.id
+--)
+--SELECT * FROM subdepartment ORDER BY name;
+
+-- extract all departments under 'A' with "level" number
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE subdepartment(level, id, parent_department, name) AS
+--(
+--     -- non recursive term
+--     SELECT 1, * FROM department WHERE name = 'A'
+--
+--     UNION ALL
+--
+--     -- recursive term
+--     SELECT sd.level + 1, d.* FROM department AS d, subdepartment AS sd
+--             WHERE d.parent_department = sd.id
+--)
+--SELECT * FROM subdepartment ORDER BY name;
+
+-- extract all departments under 'A' with "level" number.
+-- Only shows level 2 or more
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE subdepartment(level, id, parent_department, name) AS
+--(
+--     -- non recursive term
+--     SELECT 1, * FROM department WHERE name = 'A'
+--
+--     UNION ALL
+--
+--     -- recursive term
+--     SELECT sd.level + 1, d.* FROM department AS d, subdepartment AS sd
+--             WHERE d.parent_department = sd.id
+--)
+--SELECT * FROM subdepartment WHERE level >= 2 ORDER BY name;
+
+-- "RECURSIVE" is ignored if the query has no self-reference
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE subdepartment AS
+--(
+--     -- note lack of recursive UNION structure
+--     SELECT * FROM department WHERE name = 'A'
+--)
+--SELECT * FROM subdepartment ORDER BY name;
+
+-- inside subqueries
+-- [SPARK-19799] Support WITH clause in subqueries
+-- [SPARK-24497] Support recursive SQL query
+--SELECT count(*) FROM (
+--    WITH RECURSIVE t(n) AS (
+--        SELECT 1 UNION ALL SELECT n + 1 FROM t WHERE n < 500
+--    )
+--    SELECT * FROM t) AS t WHERE n < (
+--        SELECT count(*) FROM (
+--            WITH RECURSIVE t(n) AS (
+--                   SELECT 1 UNION ALL SELECT n + 1 FROM t WHERE n < 100
+--                )
+--            SELECT * FROM t WHERE n < 50000
+--         ) AS t WHERE n < 100);
+
+-- use same CTE twice at different subquery levels
+-- [SPARK-24497] Support recursive SQL query
+--WITH q1(x,y) AS (
+--    SELECT hundred, sum(ten) FROM tenk1 GROUP BY hundred
+--  )
+--SELECT count(*) FROM q1 WHERE y > (SELECT sum(y)/100 FROM q1 qsub);
+
+-- via a VIEW
+-- [SPARK-24497] Support recursive SQL query
+--CREATE TEMPORARY VIEW vsubdepartment AS
+--     WITH RECURSIVE subdepartment AS
+--     (
+--              -- non recursive term
+--             SELECT * FROM department WHERE name = 'A'
+--             UNION ALL
+--             -- recursive term
+--             SELECT d.* FROM department AS d, subdepartment AS sd
+--                     WHERE d.parent_department = sd.id
+--     )
+--     SELECT * FROM subdepartment;
+--
+--SELECT * FROM vsubdepartment ORDER BY name;
+
+-- Check reverse listing
+-- [TODO] is there a way to show DDL of a view?
+--SELECT pg_get_viewdef('vsubdepartment'::regclass);
+--SELECT pg_get_viewdef('vsubdepartment'::regclass, true);
+
+-- Another reverse-listing example
+-- [SPARK-24497] Support recursive SQL query
+--CREATE VIEW sums_1_100 AS
+--WITH RECURSIVE t(n) AS (
+--    VALUES (1)
+--UNION ALL
+--    SELECT n+1 FROM t WHERE n < 100
+--)
+--SELECT sum(n) FROM t;
+
+-- [TODO] is there a way to show DDL of a view?
+--\d+ sums_1_100
+
+-- corner case in which sub-WITH gets initialized first
+-- [SPARK-24497] Support recursive SQL query
+--with recursive q as (
+--      select * from department
+--    union all
+--      (with x as (select * from q)
+--       select * from x)
+--    )
+--select * from q limit 24;
+
+-- [SPARK-24497] Support recursive SQL query
+--with recursive q as (
+--      select * from department
+--    union all
+--      (with recursive x as (
+--           select * from department
+--         union all
+--           (select * from q union all select * from x)
+--        )
+--       select * from x)
+--    )
+--select * from q limit 32;
+
+-- recursive term has sub-UNION
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE t(i,j) AS (
+--     VALUES (1,2)
+--     UNION ALL
+--     SELECT t2.i, t.j+1 FROM
+--             (SELECT 2 AS i UNION ALL SELECT 3 AS i) AS t2
+--             JOIN t ON (t2.i = t.i+1))
+--
+--     SELECT * FROM t;
+
+--
+-- different tree example
+--
+-- [ORIGINAL SQL]
+--CREATE TEMPORARY TABLE tree(
+--    id INTEGER PRIMARY KEY,
+--    parent_id INTEGER REFERENCES tree(id)
+--);
+CREATE TABLE tree(
+    id INTEGER,
+    parent_id INTEGER
+) USING parquet;
+
+INSERT INTO tree
+VALUES (1, NULL), (2, 1), (3,1), (4,2), (5,2), (6,2), (7,3), (8,3),
+       (9,4), (10,4), (11,7), (12,7), (13,7), (14, 9), (15,11), (16,11);
+
+--
+-- get all paths from "second level" nodes to leaf nodes
+--
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE t(id, path) AS (
+--    VALUES(1,ARRAY[]::integer[])
+--UNION ALL
+--    SELECT tree.id, t.path || tree.id
+--    FROM tree JOIN t ON (tree.parent_id = t.id)
+--)
+--SELECT t1.*, t2.* FROM t AS t1 JOIN t AS t2 ON
+--     (t1.path[1] = t2.path[1] AND
+--     array_upper(t1.path,1) = 1 AND
+--     array_upper(t2.path,1) > 1)
+--     ORDER BY t1.id, t2.id;
+
+-- just count 'em
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE t(id, path) AS (
+--    VALUES(1,ARRAY[]::integer[])
+--UNION ALL
+--    SELECT tree.id, t.path || tree.id
+--    FROM tree JOIN t ON (tree.parent_id = t.id)
+--)
+--SELECT t1.id, count(t2.*) FROM t AS t1 JOIN t AS t2 ON
+--     (t1.path[1] = t2.path[1] AND
+--     array_upper(t1.path,1) = 1 AND
+--     array_upper(t2.path,1) > 1)
+--     GROUP BY t1.id
+--     ORDER BY t1.id;
+
+-- this variant tickled a whole-row-variable bug in 8.4devel
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE t(id, path) AS (
+--    VALUES(1,ARRAY[]::integer[])
+--UNION ALL
+--    SELECT tree.id, t.path || tree.id
+--    FROM tree JOIN t ON (tree.parent_id = t.id)
+--)
+--SELECT t1.id, t2.path, t2 FROM t AS t1 JOIN t AS t2 ON
+--(t1.id=t2.id);
+
+--
+-- test cycle detection
+--
+-- [ORIGINAL SQL]
+--create temp table graph( f int, t int, label text );
+create table graph( f int, t int, label string ) USING parquet;
+
+insert into graph values
+       (1, 2, 'arc 1 -> 2'),
+       (1, 3, 'arc 1 -> 3'),
+       (2, 3, 'arc 2 -> 3'),
+       (1, 4, 'arc 1 -> 4'),
+       (4, 5, 'arc 4 -> 5'),
+       (5, 1, 'arc 5 -> 1');
+
+-- [SPARK-24497] Support recursive SQL query
+--with recursive search_graph(f, t, label, path, cycle) as (
+--     select *, array[row(g.f, g.t)], false from graph g
+--     union all
+--     select g.*, path || row(g.f, g.t), row(g.f, g.t) = any(path)
+--     from graph g, search_graph sg
+--     where g.f = sg.t and not cycle
+--)
+--select * from search_graph;
+
+-- ordering by the path column has same effect as SEARCH DEPTH FIRST
+-- [SPARK-24497] Support recursive SQL query
+--with recursive search_graph(f, t, label, path, cycle) as (
+--     select *, array[row(g.f, g.t)], false from graph g
+--     union all
+--     select g.*, path || row(g.f, g.t), row(g.f, g.t) = any(path)
+--     from graph g, search_graph sg
+--     where g.f = sg.t and not cycle
+--)
+--select * from search_graph order by path;
+
+--
+-- test multiple WITH queries
+--
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE
+--  y (id) AS (VALUES (1)),
+--  x (id) AS (SELECT * FROM y UNION ALL SELECT id+1 FROM x WHERE id < 5)
+--SELECT * FROM x;
+
+-- forward reference OK
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE
+--    x(id) AS (SELECT * FROM y UNION ALL SELECT id+1 FROM x WHERE id < 5),
+--    y(id) AS (values (1))
+-- SELECT * FROM x;
+
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE
+--   x(id) AS
+--     (VALUES (1) UNION ALL SELECT id+1 FROM x WHERE id < 5),
+--   y(id) AS
+--     (VALUES (1) UNION ALL SELECT id+1 FROM y WHERE id < 10)
+-- SELECT y.*, x.* FROM y LEFT JOIN x USING (id);
+
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE
+--   x(id) AS
+--     (VALUES (1) UNION ALL SELECT id+1 FROM x WHERE id < 5),
+--   y(id) AS
+--     (VALUES (1) UNION ALL SELECT id+1 FROM x WHERE id < 10)
+-- SELECT y.*, x.* FROM y LEFT JOIN x USING (id);
+
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE
+--   x(id) AS
+--     (SELECT 1 UNION ALL SELECT id+1 FROM x WHERE id < 3 ),
+--   y(id) AS
+--     (SELECT * FROM x UNION ALL SELECT * FROM x),
+--   z(id) AS
+--     (SELECT * FROM x UNION ALL SELECT id+1 FROM z WHERE id < 10)
+-- SELECT * FROM z;
+
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE
+--   x(id) AS
+--     (SELECT 1 UNION ALL SELECT id+1 FROM x WHERE id < 3 ),
+--   y(id) AS
+--     (SELECT * FROM x UNION ALL SELECT * FROM x),
+--   z(id) AS
+--     (SELECT * FROM y UNION ALL SELECT id+1 FROM z WHERE id < 10)
+-- SELECT * FROM z;
+
+--
+-- Test WITH attached to a data-modifying statement
+--
+
+-- [ORIGINAL SQL]
+--CREATE TEMPORARY TABLE y (a INTEGER) USING parquet;
+CREATE TABLE y (a INTEGER) USING parquet;
+-- [ORIGINAL SQL]
+--INSERT INTO y SELECT generate_series(1, 10);
+INSERT INTO y SELECT EXPLODE(SEQUENCE(1, 10));
+
+-- [SPARK-28147] Support RETURNING clause
+--WITH t AS (
+--     SELECT a FROM y
+--)
+--INSERT INTO y
+--SELECT a+20 FROM t RETURNING *;
+--
+--SELECT * FROM y;
+
+-- [NOTE] Spark SQL doesn't support UPDATE statement
+----WITH t AS (
+----   SELECT a FROM y
+----)
+----UPDATE y SET a = y.a-10 FROM t WHERE y.a > 20 AND t.a = y.a RETURNING y.a;
+--
+--SELECT * FROM y;
+
+-- [NOTE] Spark SQL doesn't support DELETE statement
+--WITH RECURSIVE t(a) AS (
+--     SELECT 11
+--     UNION ALL
+--     SELECT a+1 FROM t WHERE a < 50
+--)
+--DELETE FROM y USING t WHERE t.a = y.a RETURNING y.a;
+--
+--SELECT * FROM y;
+
+DROP TABLE y;
+
+--
+-- error cases
+--
+
+-- INTERSECT
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE x(n) AS (SELECT 1 INTERSECT SELECT n+1 FROM x)
+--     SELECT * FROM x;
+
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE x(n) AS (SELECT 1 INTERSECT ALL SELECT n+1 FROM x)
+--     SELECT * FROM x;
+
+-- EXCEPT
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE x(n) AS (SELECT 1 EXCEPT SELECT n+1 FROM x)
+--     SELECT * FROM x;
+
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE x(n) AS (SELECT 1 EXCEPT ALL SELECT n+1 FROM x)
+--     SELECT * FROM x;
+
+-- no non-recursive term
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE x(n) AS (SELECT n FROM x)
+--     SELECT * FROM x;
+
+-- recursive term in the left hand side (strictly speaking, should allow this)
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE x(n) AS (SELECT n FROM x UNION ALL SELECT 1)
+--     SELECT * FROM x;
+
+-- [ORIGINAL SQL]
+--CREATE TEMPORARY TABLE y (a INTEGER);
+CREATE TABLE y (a INTEGER) USING parquet;
+-- [ORIGINAL SQL]
+--INSERT INTO y SELECT generate_series(1, 10);
+INSERT INTO y SELECT EXPLODE(SEQUENCE(1, 10));
+
+-- LEFT JOIN
+
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE x(n) AS (SELECT a FROM y WHERE a = 1
+--     UNION ALL
+--     SELECT x.n+1 FROM y LEFT JOIN x ON x.n = y.a WHERE n < 10)
+--SELECT * FROM x;
+
+-- RIGHT JOIN
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE x(n) AS (SELECT a FROM y WHERE a = 1
+--     UNION ALL
+--     SELECT x.n+1 FROM x RIGHT JOIN y ON x.n = y.a WHERE n < 10)
+--SELECT * FROM x;
+
+-- FULL JOIN
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE x(n) AS (SELECT a FROM y WHERE a = 1
+--     UNION ALL
+--     SELECT x.n+1 FROM x FULL JOIN y ON x.n = y.a WHERE n < 10)
+--SELECT * FROM x;
+
+-- subquery
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE x(n) AS (SELECT 1 UNION ALL SELECT n+1 FROM x
+--                          WHERE n IN (SELECT * FROM x))
+--  SELECT * FROM x;
+
+-- aggregate functions
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE x(n) AS (SELECT 1 UNION ALL SELECT count(*) FROM x)
+--  SELECT * FROM x;
+
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE x(n) AS (SELECT 1 UNION ALL SELECT sum(n) FROM x)
+--  SELECT * FROM x;
+
+-- ORDER BY
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE x(n) AS (SELECT 1 UNION ALL SELECT n+1 FROM x ORDER BY 1)
+--  SELECT * FROM x;
+
+-- LIMIT/OFFSET
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE x(n) AS (SELECT 1 UNION ALL SELECT n+1 FROM x LIMIT 10 OFFSET 
1)
+--  SELECT * FROM x;
+
+-- FOR UPDATE
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE x(n) AS (SELECT 1 UNION ALL SELECT n+1 FROM x FOR UPDATE)
+--  SELECT * FROM x;
+
+-- target list has a recursive query name
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE x(id) AS (values (1)
+--    UNION ALL
+--    SELECT (SELECT * FROM x) FROM x WHERE id < 5
+--) SELECT * FROM x;
+
+-- mutual recursive query (not implemented)
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE
+--  x (id) AS (SELECT 1 UNION ALL SELECT id+1 FROM y WHERE id < 5),
+--  y (id) AS (SELECT 1 UNION ALL SELECT id+1 FROM x WHERE id < 5)
+--SELECT * FROM x;
+
+-- non-linear recursion is not allowed
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE foo(i) AS
+--    (values (1)
+--    UNION ALL
+--       (SELECT i+1 FROM foo WHERE i < 10
+--          UNION ALL
+--       SELECT i+1 FROM foo WHERE i < 5)
+--) SELECT * FROM foo;
+
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE foo(i) AS
+--    (values (1)
+--    UNION ALL
+--        SELECT * FROM
+--       (SELECT i+1 FROM foo WHERE i < 10
+--          UNION ALL
+--       SELECT i+1 FROM foo WHERE i < 5) AS t
+--) SELECT * FROM foo;
+
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE foo(i) AS
+--    (values (1)
+--    UNION ALL
+--       (SELECT i+1 FROM foo WHERE i < 10
+--          EXCEPT
+--       SELECT i+1 FROM foo WHERE i < 5)
+--) SELECT * FROM foo;
+
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE foo(i) AS
+--    (values (1)
+--    UNION ALL
+--       (SELECT i+1 FROM foo WHERE i < 10
+--          INTERSECT
+--       SELECT i+1 FROM foo WHERE i < 5)
+--) SELECT * FROM foo;
+
+-- Wrong type induced from non-recursive term
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE foo(i) AS
+--   (SELECT i FROM (VALUES(1),(2)) t(i)
+--   UNION ALL
+--   SELECT (i+1)::numeric(10,0) FROM foo WHERE i < 10)
+--SELECT * FROM foo;
+
+-- rejects different typmod, too (should we allow this?)
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE foo(i) AS
+--   (SELECT i::numeric(3,0) FROM (VALUES(1),(2)) t(i)
+--   UNION ALL
+--   SELECT (i+1)::numeric(10,0) FROM foo WHERE i < 10)
+--SELECT * FROM foo;
+
+-- [NOTE] Spark SQL doesn't support RULEs
+-- disallow OLD/NEW reference in CTE
+--CREATE TABLE x (n integer) USING parquet;
+--CREATE RULE r2 AS ON UPDATE TO x DO INSTEAD
+--    WITH t AS (SELECT OLD.*) UPDATE y SET a = t.n FROM t;
+
+--
+-- test for bug #4902
+--
+-- [SPARK-19799] Support recursive SQL query
+--with cte(foo) as ( values(42) ) values((select foo from cte));
+with cte(foo) as ( select 42 ) select * from ((select foo from cte)) q;
+
+-- test CTE referencing an outer-level variable (to see that changed-parameter
+-- signaling still works properly after fixing this bug)
+-- [SPARK-19799] Support WITH clause in subqueries
+--select ( with cte(foo) as ( values(f1) )
+--         select (select foo from cte) )
+--from int4_tbl;
+
+-- [SPARK-19799] Support WITH clause in subqueries
+--select ( with cte(foo) as ( values(f1) )
+--          values((select foo from cte)) )
+--from int4_tbl;
+
+--
+-- test for nested-recursive-WITH bug
+--
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE t(j) AS (
+--    WITH RECURSIVE s(i) AS (
+--        VALUES (1)
+--        UNION ALL
+--        SELECT i+1 FROM s WHERE i < 10
+--    )
+--    SELECT i FROM s
+--    UNION ALL
+--    SELECT j+1 FROM t WHERE j < 10
+--)
+--SELECT * FROM t;
+
+--
+-- test WITH attached to intermediate-level set operation
+--
+
+-- [SPARK-19799] Support recursive SQL query
+--WITH outermost(x) AS (
+--  SELECT 1
+--  UNION (WITH innermost as (SELECT 2)
+--         SELECT * FROM innermost
+--         UNION SELECT 3)
+--)
+--SELECT * FROM outermost ORDER BY 1;
+
+-- [SPARK-19799] Support recursive SQL query
+--WITH outermost(x) AS (
+--  SELECT 1
+--  UNION (WITH innermost as (SELECT 2)
+--         SELECT * FROM outermost  -- fail
+--         UNION SELECT * FROM innermost)
+--)
+--SELECT * FROM outermost ORDER BY 1;
+
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE outermost(x) AS (
+--  SELECT 1
+--  UNION (WITH innermost as (SELECT 2)
+--         SELECT * FROM outermost
+--         UNION SELECT * FROM innermost)
+--)
+--SELECT * FROM outermost ORDER BY 1;
+
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE outermost(x) AS (
+--  WITH innermost as (SELECT 2 FROM outermost) -- fail
+--    SELECT * FROM innermost
+--    UNION SELECT * from outermost
+--)
+--SELECT * FROM outermost ORDER BY 1;
+
+--
+-- This test will fail with the old implementation of PARAM_EXEC parameter
+-- assignment, because the "q1" Var passed down to A's targetlist subselect
+-- looks exactly like the "A.id" Var passed down to C's subselect, causing
+-- the old code to give them the same runtime PARAM_EXEC slot.  But the
+-- lifespans of the two parameters overlap, thanks to B also reading A.
+--
+
+-- [NOTE] INT8_TBL is created in int8.sql originally
+--CREATE TABLE INT8_TBL(q1 bigint, q2 bigint) USING parquet;
+--INSERT INTO INT8_TBL VALUES(trim('  123   '),trim('  456'));
+--INSERT INTO INT8_TBL VALUES(trim('123   '),'4567890123456789');
+--INSERT INTO INT8_TBL VALUES('4567890123456789','123');
+--INSERT INTO INT8_TBL VALUES(+4567890123456789,'4567890123456789');
+--INSERT INTO INT8_TBL VALUES('+4567890123456789','-4567890123456789');
+
+-- [SPARK-27878] Support ARRAY(sub-SELECT) expressions
+--with
+--A as ( select q2 as id, (select q1) as x from int8_tbl ),
+--B as ( select id, row_number() over (partition by id) as r from A ),
+--C as ( select A.id, array(select B.id from B where B.id = A.id) from A )
+--select * from C;
+
+--DROP TABLE INT8_TBL;
+
+--
+-- Test CTEs read in non-initialization orders
+--
+
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE
+--  tab(id_key,link) AS (VALUES (1,17), (2,17), (3,17), (4,17), (6,17), 
(5,17)),
+--  iter (id_key, row_type, link) AS (
+--      SELECT 0, 'base', 17
+--    UNION ALL (
+--      WITH remaining(id_key, row_type, link, min) AS (
+--        SELECT tab.id_key, 'true'::text, iter.link, MIN(tab.id_key) OVER ()
+--        FROM tab INNER JOIN iter USING (link)
+--        WHERE tab.id_key > iter.id_key
+--      ),
+--      first_remaining AS (
+--        SELECT id_key, row_type, link
+--        FROM remaining
+--        WHERE id_key=min
+--      ),
+--      effect AS (
+--        SELECT tab.id_key, 'new'::text, tab.link
+--        FROM first_remaining e INNER JOIN tab ON e.id_key=tab.id_key
+--        WHERE e.row_type = 'false'
+--      )
+--      SELECT * FROM first_remaining
+--      UNION ALL SELECT * FROM effect
+--    )
+--  )
+--SELECT * FROM iter;
+
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE
+--  tab(id_key,link) AS (VALUES (1,17), (2,17), (3,17), (4,17), (6,17), 
(5,17)),
+--  iter (id_key, row_type, link) AS (
+--      SELECT 0, 'base', 17
+--    UNION (
+--      WITH remaining(id_key, row_type, link, min) AS (
+--        SELECT tab.id_key, 'true'::text, iter.link, MIN(tab.id_key) OVER ()
+--        FROM tab INNER JOIN iter USING (link)
+--        WHERE tab.id_key > iter.id_key
+--      ),
+--      first_remaining AS (
+--        SELECT id_key, row_type, link
+--        FROM remaining
+--        WHERE id_key=min
+--      ),
+--      effect AS (
+--        SELECT tab.id_key, 'new'::text, tab.link
+--        FROM first_remaining e INNER JOIN tab ON e.id_key=tab.id_key
+--        WHERE e.row_type = 'false'
+--      )
+--      SELECT * FROM first_remaining
+--      UNION ALL SELECT * FROM effect
+--    )
+--  )
+--SELECT * FROM iter;
+
+--
+-- Data-modifying statements in WITH
+--
+
+-- INSERT ... RETURNING
+-- [SPARK-28147] Support RETURNING clause
+--WITH t AS (
+--    INSERT INTO y
+--    VALUES
+--        (11),
+--        (12),
+--        (13),
+--        (14),
+--        (15),
+--        (16),
+--        (17),
+--        (18),
+--        (19),
+--        (20)
+--    RETURNING *
+--)
+--SELECT * FROM t;
+--
+--SELECT * FROM y;
+
+-- UPDATE ... RETURNING
+-- [NOTE] Spark SQL doesn't support UPDATE statement
+--WITH t AS (
+--    UPDATE y
+--    SET a=a+1
+--    RETURNING *
+--)
+--SELECT * FROM t;
+--
+--SELECT * FROM y;
+
+-- DELETE ... RETURNING
+-- [NOTE] Spark SQL doesn't support DELETE statement
+--WITH t AS (
+--    DELETE FROM y
+--    WHERE a <= 10
+--    RETURNING *
+--)
+--SELECT * FROM t;
+--
+--SELECT * FROM y;
+
+-- forward reference
+-- [NOTE] Spark SQL doesn't support UPDATE statement
+--WITH RECURSIVE t AS (
+--     INSERT INTO y
+--             SELECT a+5 FROM t2 WHERE a > 5
+--     RETURNING *
+--), t2 AS (
+--     UPDATE y SET a=a-11 RETURNING *
+--)
+--SELECT * FROM t
+--UNION ALL
+--SELECT * FROM t2;
+--
+--SELECT * FROM y;
+
+-- unconditional DO INSTEAD rule
+-- [NOTE] Spark SQL doesn't support RULEs
+--CREATE RULE y_rule AS ON DELETE TO y DO INSTEAD
+--  INSERT INTO y VALUES(42) RETURNING *;
+
+-- [NOTE] Spark SQL doesn't support DELETE statement
+--WITH t AS (
+--     DELETE FROM y RETURNING *
+--)
+--SELECT * FROM t;
+--
+--SELECT * FROM y;
+
+--DROP RULE y_rule ON y;
+
+-- check merging of outer CTE with CTE in a rule action
+-- [ORIGINAL SQL]
+--CREATE TEMP TABLE bug6051 AS
+--  select i from generate_series(1,3) as t(i);
+CREATE TABLE bug6051 USING parquet AS
+  SELECT EXPLODE(SEQUENCE(1,3)) AS i;
+
+SELECT * FROM bug6051;
+
+-- [NOTE] Spark SQL doesn't support DELETE statement
+--WITH t1 AS ( DELETE FROM bug6051 RETURNING * )
+--INSERT INTO bug6051 SELECT * FROM t1;
+--
+--SELECT * FROM bug6051;
+
+-- [ORIGINAL SQL]
+--CREATE TEMP TABLE bug6051_2 (i int);
+CREATE TABLE bug6051_2 (i int) USING parquet;
+
+--CREATE RULE bug6051_ins AS ON INSERT TO bug6051 DO INSTEAD
+-- INSERT INTO bug6051_2
+-- SELECT NEW.i;
+
+-- [NOTE] Spark SQL doesn't support DELETE statement
+--WITH t1 AS ( DELETE FROM bug6051 RETURNING * )
+--INSERT INTO bug6051 SELECT * FROM t1;
+--
+--SELECT * FROM bug6051;
+--SELECT * FROM bug6051_2;
+
+-- a truly recursive CTE in the same list
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE t(a) AS (
+--     SELECT 0
+--             UNION ALL
+--     SELECT a+1 FROM t WHERE a+1 < 5
+--), t2 as (
+--     INSERT INTO y
+--             SELECT * FROM t RETURNING *
+--)
+--SELECT * FROM t2 JOIN y USING (a) ORDER BY a;
+--
+--SELECT * FROM y;
+
+-- data-modifying WITH in a modifying statement
+-- [NOTE] Spark SQL doesn't support DELETE statement
+--WITH t AS (
+--    DELETE FROM y
+--    WHERE a <= 10
+--    RETURNING *
+--)
+--INSERT INTO y SELECT -a FROM t RETURNING *;
+--
+--SELECT * FROM y;
+
+-- check that WITH query is run to completion even if outer query isn't
+-- [NOTE] Spark SQL doesn't support UPDATE statement
+--WITH t AS (
+--    UPDATE y SET a = a * 100 RETURNING *
+--)
+--SELECT * FROM t LIMIT 10;
+--
+--SELECT * FROM y;
+
+-- data-modifying WITH containing INSERT...ON CONFLICT DO UPDATE
+-- [ORIGINAL SQL]
+--CREATE TABLE withz AS SELECT i AS k, (i || ' v')::text v FROM 
generate_series(1, 16, 3) i;
+CREATE TABLE withz USING parquet AS SELECT i AS k, CAST(i || ' v' AS string) v 
FROM (SELECT EXPLODE(SEQUENCE(1, 16, 3)) i);
+-- [NOTE] Spark SQL doesn't support UNIQUE constraints
+--ALTER TABLE withz ADD UNIQUE (k);
+
+-- [NOTE] Spark SQL doesn't support UPDATE statement
+--WITH t AS (
+--    INSERT INTO withz SELECT i, 'insert'
+--    FROM generate_series(0, 16) i
+--    ON CONFLICT (k) DO UPDATE SET v = withz.v || ', now update'
+--    RETURNING *
+--)
+--SELECT * FROM t JOIN y ON t.k = y.a ORDER BY a, k;
+
+-- Test EXCLUDED.* reference within CTE
+-- [NOTE] Spark SQL doesn't support ON CONFLICT clause
+--WITH aa AS (
+--    INSERT INTO withz VALUES(1, 5) ON CONFLICT (k) DO UPDATE SET v = 
EXCLUDED.v
+--    WHERE withz.k != EXCLUDED.k
+--    RETURNING *
+--)
+--SELECT * FROM aa;
+
+-- New query/snapshot demonstrates side-effects of previous query.
+SELECT * FROM withz ORDER BY k;
+
+--
+-- Ensure subqueries within the update clause work, even if they
+-- reference outside values
+--
+-- [NOTE] Spark SQL doesn't support ON CONFLICT clause
+--WITH aa AS (SELECT 1 a, 2 b)
+--INSERT INTO withz VALUES(1, 'insert')
+--ON CONFLICT (k) DO UPDATE SET v = (SELECT b || ' update' FROM aa WHERE a = 1 
LIMIT 1);
+--WITH aa AS (SELECT 1 a, 2 b)
+--INSERT INTO withz VALUES(1, 'insert')
+--ON CONFLICT (k) DO UPDATE SET v = ' update' WHERE withz.k = (SELECT a FROM 
aa);
+--WITH aa AS (SELECT 1 a, 2 b)
+--INSERT INTO withz VALUES(1, 'insert')
+--ON CONFLICT (k) DO UPDATE SET v = (SELECT b || ' update' FROM aa WHERE a = 1 
LIMIT 1);
+--WITH aa AS (SELECT 'a' a, 'b' b UNION ALL SELECT 'a' a, 'b' b)
+--INSERT INTO withz VALUES(1, 'insert')
+--ON CONFLICT (k) DO UPDATE SET v = (SELECT b || ' update' FROM aa WHERE a = 
'a' LIMIT 1);
+--WITH aa AS (SELECT 1 a, 2 b)
+--INSERT INTO withz VALUES(1, (SELECT b || ' insert' FROM aa WHERE a = 1 ))
+--ON CONFLICT (k) DO UPDATE SET v = (SELECT b || ' update' FROM aa WHERE a = 1 
LIMIT 1);
+
+-- Update a row more than once, in different parts of a wCTE. That is
+-- an allowed, presumably very rare, edge case, but since it was
+-- broken in the past, having a test seems worthwhile.
+-- [NOTE] Spark SQL doesn't support ON CONFLICT clause
+--WITH simpletup AS (
+--  SELECT 2 k, 'Green' v),
+--upsert_cte AS (
+--  INSERT INTO withz VALUES(2, 'Blue') ON CONFLICT (k) DO
+--    UPDATE SET (k, v) = (SELECT k, v FROM simpletup WHERE simpletup.k = 
withz.k)
+--    RETURNING k, v)
+--INSERT INTO withz VALUES(2, 'Red') ON CONFLICT (k) DO
+--UPDATE SET (k, v) = (SELECT k, v FROM upsert_cte WHERE upsert_cte.k = 
withz.k)
+--RETURNING k, v;
+
+DROP TABLE withz;
+
+-- check that run to completion happens in proper ordering
+
+TRUNCATE TABLE y;
+-- [ORIGINAL SQL]
+--INSERT INTO y SELECT generate_series(1, 3);
+INSERT INTO y SELECT EXPLODE(SEQUENCE(1, 3));
+-- [ORIGINAL SQL]
+--CREATE TEMPORARY TABLE yy (a INTEGER);
+CREATE TABLE yy (a INTEGER) USING parquet;
+
+-- [SPARK-24497] Support recursive SQL query
+-- [SPARK-28147] Support RETURNING clause
+--WITH RECURSIVE t1 AS (
+--  INSERT INTO y SELECT * FROM y RETURNING *
+--), t2 AS (
+--  INSERT INTO yy SELECT * FROM t1 RETURNING *
+--)
+--SELECT 1;
+
+SELECT * FROM y;
+SELECT * FROM yy;
+
+-- [SPARK-24497] Support recursive SQL query
+-- [SPARK-28147] Support RETURNING clause
+--WITH RECURSIVE t1 AS (
+--  INSERT INTO yy SELECT * FROM t2 RETURNING *
+--), t2 AS (
+--  INSERT INTO y SELECT * FROM y RETURNING *
+--)
+--SELECT 1;
+
+SELECT * FROM y;
+SELECT * FROM yy;
+
+-- [NOTE] Spark SQL doesn't support TRIGGERs
+-- triggers
+--
+--TRUNCATE TABLE y;
+--INSERT INTO y SELECT generate_series(1, 10);
+--
+--CREATE FUNCTION y_trigger() RETURNS trigger AS $$
+--begin
+--  raise notice 'y_trigger: a = %', new.a;
+--  return new;
+--end;
+--$$ LANGUAGE plpgsql;
+--
+--
+--CREATE TRIGGER y_trig BEFORE INSERT ON y FOR EACH ROW
+--    EXECUTE PROCEDURE y_trigger();
+--
+--WITH t AS (
+--    INSERT INTO y
+--    VALUES
+--        (21),
+--        (22),
+--        (23)
+--    RETURNING *
+--)
+--SELECT * FROM t;
+--
+--SELECT * FROM y;
+--
+--DROP TRIGGER y_trig ON y;
+--
+--CREATE TRIGGER y_trig AFTER INSERT ON y FOR EACH ROW
+--    EXECUTE PROCEDURE y_trigger();
+--
+--WITH t AS (
+--    INSERT INTO y
+--    VALUES
+--        (31),
+--        (32),
+--        (33)
+--    RETURNING *
+--)
+--SELECT * FROM t LIMIT 1;
+--
+--SELECT * FROM y;
+--
+--DROP TRIGGER y_trig ON y;
+--
+--CREATE OR REPLACE FUNCTION y_trigger() RETURNS trigger AS $$
+--begin
+--  raise notice 'y_trigger';
+--  return null;
+--end;
+--$$ LANGUAGE plpgsql;
+--
+--CREATE TRIGGER y_trig AFTER INSERT ON y FOR EACH STATEMENT
+--    EXECUTE PROCEDURE y_trigger();
+--
+--WITH t AS (
+--    INSERT INTO y
+--    VALUES
+--        (41),
+--        (42),
+--        (43)
+--    RETURNING *
+--)
+--SELECT * FROM t;
+--
+--SELECT * FROM y;
+--
+--DROP TRIGGER y_trig ON y;
+--DROP FUNCTION y_trigger();
+
+-- WITH attached to inherited UPDATE or DELETE
+
+-- [ORIGINAL SQL]
+--CREATE TEMP TABLE parent ( id int, val text );
+CREATE TABLE parent ( id int, val string ) USING parquet;
+-- [NOTE] Spark SQL doesn't support INHERITS clause
+--CREATE TEMP TABLE child1 ( ) INHERITS ( parent );
+-- [NOTE] Spark SQL doesn't support INHERITS clause
+--CREATE TEMP TABLE child2 ( ) INHERITS ( parent );
+
+INSERT INTO parent VALUES ( 1, 'p1' );
+--INSERT INTO child1 VALUES ( 11, 'c11' ),( 12, 'c12' );
+--INSERT INTO child2 VALUES ( 23, 'c21' ),( 24, 'c22' );
+
+-- [NOTE] Spark SQL doesn't support UPDATE statement
+--WITH rcte AS ( SELECT sum(id) AS totalid FROM parent )
+--UPDATE parent SET id = id + totalid FROM rcte;
+
+SELECT * FROM parent;
+
+-- [SPARK-28147] Support RETURNING clause
+--WITH wcte AS ( INSERT INTO child1 VALUES ( 42, 'new' ) RETURNING id AS newid 
)
+--UPDATE parent SET id = id + newid FROM wcte;
+--
+--SELECT * FROM parent;
+
+-- [NOTE] Spark SQL doesn't support DELETE statement
+--WITH rcte AS ( SELECT max(id) AS maxid FROM parent )
+--DELETE FROM parent USING rcte WHERE id = maxid;
+
+SELECT * FROM parent;
+
+-- [NOTE] Spark SQL doesn't support DELETE statement
+--WITH wcte AS ( INSERT INTO child2 VALUES ( 42, 'new2' ) RETURNING id AS 
newid )
+--DELETE FROM parent USING wcte WHERE id = newid;
+--
+--SELECT * FROM parent;
+
+-- check EXPLAIN VERBOSE for a wCTE with RETURNING
+
+-- [NOTE] Spark SQL doesn't support DELETE statement
+--EXPLAIN (VERBOSE, COSTS OFF)
+--WITH wcte AS ( INSERT INTO int8_tbl VALUES ( 42, 47 ) RETURNING q2 )
+--DELETE FROM a USING wcte WHERE aa = q2;
+
+-- error cases
+
+-- data-modifying WITH tries to use its own output
+-- [SPARK-24497] Support recursive SQL query
+--WITH RECURSIVE t AS (
+--     INSERT INTO y
+--             SELECT * FROM t
+--)
+--VALUES(FALSE);
+
+-- no RETURNING in a referenced data-modifying WITH
+-- [SPARK-24497] Support recursive SQL query
+--WITH t AS (
+--     INSERT INTO y VALUES(0)
+--)
+--SELECT * FROM t;
+
+-- data-modifying WITH allowed only at the top level
+-- [SPARK-28147] Support RETURNING clause
+--SELECT * FROM (
+--     WITH t AS (UPDATE y SET a=a+1 RETURNING *)
+--     SELECT * FROM t
+--) ss;
+
+-- most variants of rules aren't allowed
+-- [NOTE] Spark SQL doesn't support RULEs
+--CREATE RULE y_rule AS ON INSERT TO y WHERE a=0 DO INSTEAD DELETE FROM y;
+--WITH t AS (
+--     INSERT INTO y VALUES(0)
+--)
+--VALUES(FALSE);
+--DROP RULE y_rule ON y;
+
+-- check that parser lookahead for WITH doesn't cause any odd behavior
+create table foo (with baz);  -- fail, WITH is a reserved word
+create table foo (with ordinality);  -- fail, WITH is a reserved word
+with ordinality as (select 1 as x) select * from ordinality;
+
+-- check sane response to attempt to modify CTE relation
+WITH test AS (SELECT 42) INSERT INTO test VALUES (1);
+
+-- check response to attempt to modify table with same name as a CTE (perhaps
+-- surprisingly it works, because CTEs don't hide tables from data-modifying
+-- statements)
+-- [ORIGINAL SQL]
+--create temp table test (i int);
+create table test (i int) USING parquet;
 
 Review comment:
   ~ditto. `create temp table test`.~ Oops. Please ignore this. This table is 
used for `insert into`.

----------------------------------------------------------------
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.
 
For queries about this service, please contact Infrastructure at:
us...@infra.apache.org


With regards,
Apache Git Services

---------------------------------------------------------------------
To unsubscribe, e-mail: reviews-unsubscr...@spark.apache.org
For additional commands, e-mail: reviews-h...@spark.apache.org

Reply via email to