Ingest data for cte_inline tests

pull/3397/head
Onder Kalaci 2020-01-17 11:58:54 +01:00
parent 3833a7e686
commit 016f561e45
3 changed files with 800 additions and 448 deletions

File diff suppressed because it is too large Load Diff

File diff suppressed because it is too large Load Diff

View File

@ -4,6 +4,8 @@ SET citus.next_shard_id TO 1960000;
CREATE TABLE test_table (key int, value text, other_value jsonb);
SELECT create_distributed_table ('test_table', 'key');
INSERT INTO test_table SELECT i % 10, 'test' || i, row_to_json(row(i, i*18, 'test' || i)) FROM generate_series (0, 100) i;
-- server version because CTE inlining might produce
-- different debug messages in PG 11 vs PG 12
SHOW server_version \gset
@ -17,14 +19,16 @@ WITH cte_1 AS (SELECT * FROM test_table)
SELECT
*, (SELECT 1)
FROM
cte_1;
cte_1
ORDER BY 1 DESC LIMIT 3;
-- Should still not be inlined even if NOT MATERIALIZED is passed
WITH cte_1 AS NOT MATERIALIZED (SELECT * FROM test_table)
SELECT
*, (SELECT 1)
FROM
cte_1;
cte_1
ORDER BY 2 DESC LIMIT 1;
-- the cte can be inlined because the unsupported
-- part of the query (subquery in WHERE clause)
@ -68,7 +72,8 @@ WITH cte_1 AS
SELECT *, (SELECT 1)
FROM
(SELECT *
FROM cte_1) AS foo;
FROM cte_1) AS foo
ORDER BY 2 DESC LIMIT 1;
-- a little more complicated query tree
-- Citus does the inlining, the planning fails
@ -76,7 +81,7 @@ FROM
WITH top_cte AS
(SELECT *
FROM test_table)
SELECT *
SELECT count(*)
FROM top_cte,
(WITH cte_1 AS
(SELECT *
@ -114,7 +119,7 @@ WITH cte_1 AS
SELECT (SELECT 1) AS KEY FROM (
WITH cte_2 AS (SELECT *, random()
FROM (SELECT *,random() FROM cte_1) as foo)
SELECT *, random() FROM cte_2) as bar;
SELECT *, random() FROM cte_2) as bar ORDER BY 1 DESC LIMIT 3;
-- in this example, cte_2 can be inlined, because it is not used
-- on any query that Citus cannot plan. However, cte_1 should not be
@ -122,7 +127,7 @@ SELECT *, random() FROM cte_2) as bar;
WITH cte_1 AS (SELECT * FROM test_table),
cte_2 AS (select * from test_table)
SELECT
*
count(*)
FROM
(SELECT *, (SELECT 1) FROM cte_1) as foo
JOIN
@ -137,7 +142,9 @@ SELECT
FROM
test_table
WHERE
key = 1;
key = 1
ORDER BY 3 DESC
LIMIT 5;
-- router queries are affected by the distributed
-- cte inlining
@ -147,7 +154,9 @@ SELECT
FROM
a
WHERE
key = 1;
key = 1
ORDER BY 1 DESC
LIMIT 5;
-- non router queries are affected by the distributed
-- cte inlining as well
@ -240,14 +249,15 @@ FROM
-- inlined
WITH cte_1 AS (SELECT *, random() FROM test_table)
SELECT
*
key, value
FROM
cte_1;
cte_1
ORDER BY 2 DESC LIMIT 1;
-- even with NOT MATERIALIZED volatile functions should not be inlined
WITH cte_1 AS NOT MATERIALIZED (SELECT *, random() FROM test_table)
SELECT
*
count(*)
FROM
cte_1;
@ -256,7 +266,7 @@ FROM
-- it is used one level below
WITH cte_1 AS (SELECT * FROM test_table)
SELECT
*
count(*)
FROM
(
WITH ct2 AS (SELECT * FROM cte_1)
@ -268,7 +278,7 @@ FROM
-- CTE
WITH cte_1 AS (SELECT * FROM test_table)
SELECT
*
count(DISTINCT key)
FROM
(
WITH cte_2 AS (SELECT * FROM cte_1),
@ -279,7 +289,7 @@ FROM
-- inlined CTE contains a reference to outer query
-- should be fine (because we pushdown the whole query)
SELECT *
SELECT count(*)
FROM
(SELECT *
FROM test_table) AS test_table_cte
@ -295,7 +305,7 @@ SELECT *
-- inlined CTE contains a reference to outer query
-- should be fine (even if the recursive planning fails
-- to recursively plan the query)
SELECT *
SELECT count(*)
FROM
(SELECT *
FROM test_table) AS test_table_cte
@ -317,9 +327,9 @@ SELECT
*
FROM
(
WITH ct2 AS (SELECT * FROM cte_1 LIMIT 5)
WITH ct2 AS (SELECT * FROM cte_1 ORDER BY 1, 2, 3 LIMIT 5)
SELECT * FROM ct2
) as foo;
) as foo ORDER BY 1 DESC, 2 DESC, 3 DESC LIMIT 5;
-- all nested CTEs can be inlinied
WITH cte_1 AS (
@ -343,13 +353,14 @@ SELECT * FROM cte_1 WHERE key = 6;
-- in set operations
WITH cte_1 AS (SELECT * FROM test_table),
cte_2 AS (SELECT * FROM test_table)
SELECT count(*) FROM (
(SELECT * FROM cte_1 EXCEPT SELECT * FROM test_table)
UNION
(SELECT * FROM cte_2);
(SELECT * FROM cte_2)) as foo;
-- cte_1 is going to be inlined even inside another set operation
WITH cte_1 AS (SELECT * FROM test_table),
cte_2 AS (SELECT * FROM test_table)
cte_2 AS (SELECT * FROM test_table ORDER BY 1 DESC LIMIT 3)
(SELECT *, (SELECT 1) FROM cte_1 EXCEPT SELECT *, 1 FROM test_table)
UNION
(SELECT *, 1 FROM cte_2);
@ -369,7 +380,7 @@ UNION
-- subquery pushdown with set operations
WITH cte_1 AS (SELECT * FROM test_table),
cte_2 AS (SELECT * FROM test_table)
SELECT * FROM
SELECT max(key) FROM
(
SELECT * FROM cte_1
UNION
@ -435,19 +446,21 @@ WITH cte_1 AS NOT MATERIALIZED (SELECT * FROM test_table)
DELETE FROM test_table WHERE key NOT IN (SELECT key FROM cte_1);
-- we don't inline CTEs if they are modifying CTEs
WITH cte_1 AS (DELETE FROM test_table RETURNING key)
SELECT * FROM cte_1;
WITH cte_1 AS (DELETE FROM test_table WHERE key % 3 = 1 RETURNING key)
SELECT * FROM cte_1 ORDER BY 1 DESC LIMIT 3;
-- NOT MATERIALIZED should not affect modifying CTEs
WITH cte_1 AS NOT MATERIALIZED (DELETE FROM test_table RETURNING key)
SELECT * FROM cte_1;
WITH cte_1 AS NOT MATERIALIZED (DELETE FROM test_table WHERE key % 3 = 0 RETURNING key)
SELECT count(*) FROM cte_1;
-- cte with column aliases
SELECT * FROM test_table,
(WITH cte_1 (x,y) AS (SELECT * FROM test_table),
cte_2 (z,y) AS (SELECT value, other_value, key FROM test_table),
cte_3 (t,m) AS (SELECT z, y, key as cte_2_key FROM cte_2)
SELECT * FROM cte_2, cte_3) as bar;
SELECT * FROM cte_2, cte_3) as bar
ORDER BY value, other_value, z, y, t, m, cte_2_key
LIMIT 5;
-- cte used in HAVING subquery just works fine
-- even if it is inlined
@ -459,7 +472,9 @@ FROM
GROUP BY
key
HAVING
(count(*) > (SELECT max FROM cte_1));
(count(*) > (SELECT max FROM cte_1))
ORDER BY 2 DESC
LIMIT 5;
-- cte used in ORDER BY just works fine
-- even if it is inlined
@ -469,32 +484,33 @@ SELECT
FROM
test_table JOIN cte_1 ON (key = max)
ORDER BY
cte_1.max;
cte_1.max
LIMIT 3;
PREPARE inlined_cte_without_params AS
WITH cte_1 AS (SELECT count(*) FROM test_table GROUP BY key)
SELECT * FROM cte_1;
SELECT * FROM cte_1 ORDER BY 1 DESC LIMIT 3;
PREPARE non_inlined_cte_without_params AS
WITH cte_1 AS (SELECT * FROM test_table)
SELECT
*, (SELECT 1)
FROM
cte_1;
PREPARE inlined_cte_has_parameter_on_non_dist_key(int) AS
WITH cte_1 AS (SELECT count(*) FROM test_table WHERE value::int = $1 GROUP BY key)
SELECT * FROM cte_1;
cte_1 ORDER BY 1 DESC LIMIT 3;
PREPARE inlined_cte_has_parameter_on_non_dist_key(text) AS
WITH cte_1 AS (SELECT count(*) FROM test_table WHERE value = $1 GROUP BY key)
SELECT * FROM cte_1 ORDER BY 1 DESC LIMIT 3;
PREPARE inlined_cte_has_parameter_on_dist_key(int) AS
WITH cte_1 AS (SELECT count(*) FROM test_table WHERE key > $1 GROUP BY key)
SELECT * FROM cte_1;
SELECT * FROM cte_1 ORDER BY 1 DESC LIMIT 3;
PREPARE non_inlined_cte_has_parameter_on_dist_key(int) AS
WITH cte_1 AS (SELECT * FROM test_table where key > $1)
SELECT
*, (SELECT 1)
FROM
cte_1;
cte_1 ORDER BY 1 DESC, 2 DESC, 3 DESC LIMIT 3;
PREPARE retry_planning(int) AS
WITH cte_1 AS (SELECT * FROM test_table WHERE key > $1)
SELECT json_object_agg(DISTINCT key, value) FROM cte_1;
SELECT json_object_agg(DISTINCT key, value) FROM cte_1 ORDER BY max(key), min(value) DESC LIMIT 3;
EXECUTE inlined_cte_without_params;
@ -511,12 +527,12 @@ EXECUTE non_inlined_cte_without_params;
EXECUTE non_inlined_cte_without_params;
EXECUTE non_inlined_cte_without_params;
EXECUTE inlined_cte_has_parameter_on_non_dist_key(1);
EXECUTE inlined_cte_has_parameter_on_non_dist_key(2);
EXECUTE inlined_cte_has_parameter_on_non_dist_key(3);
EXECUTE inlined_cte_has_parameter_on_non_dist_key(4);
EXECUTE inlined_cte_has_parameter_on_non_dist_key(5);
EXECUTE inlined_cte_has_parameter_on_non_dist_key(6);
EXECUTE inlined_cte_has_parameter_on_non_dist_key('test1');
EXECUTE inlined_cte_has_parameter_on_non_dist_key('test2');
EXECUTE inlined_cte_has_parameter_on_non_dist_key('test3');
EXECUTE inlined_cte_has_parameter_on_non_dist_key('test4');
EXECUTE inlined_cte_has_parameter_on_non_dist_key('test5');
EXECUTE inlined_cte_has_parameter_on_non_dist_key('test6');
EXECUTE inlined_cte_has_parameter_on_dist_key(1);
EXECUTE inlined_cte_has_parameter_on_dist_key(2);
@ -542,31 +558,31 @@ EXECUTE retry_planning(6);
-- this test can only work if the CTE is recursively
-- planned
WITH b AS (SELECT * FROM test_table)
SELECT * FROM (SELECT key as x FROM test_table OFFSET 0) as ref LEFT JOIN b ON (ref.x = b.key);
SELECT count(*) FROM (SELECT key as x FROM test_table OFFSET 0) as ref LEFT JOIN b ON (ref.x = b.key);
-- this becomes a non-colocated subquery join
-- because after the CTEs are inlined the joins
-- become a non-colocated subquery join
WITH a AS (SELECT * FROM test_table),
b AS (SELECT * FROM test_table)
SELECT * FROM a LEFT JOIN b ON (a.value = b.value);
SELECT count(*) FROM a LEFT JOIN b ON (a.value = b.value);
-- cte a has to be recursively planned because of OFFSET 0
-- after that, cte b also requires recursive planning
WITH a AS (SELECT * FROM test_table OFFSET 0),
b AS (SELECT * FROM test_table)
SELECT * FROM a LEFT JOIN b ON (a.value = b.value);
SELECT min(a.key) FROM a LEFT JOIN b ON (a.value = b.value);
-- after both CTEs are inlined, this becomes non-colocated subquery join
WITH cte_1 AS (SELECT * FROM test_table),
cte_2 AS (SELECT * FROM test_table)
SELECT * FROM cte_1 JOIN cte_2 ON (cte_1.value > cte_2.value);
SELECT * FROM cte_1 JOIN cte_2 ON (cte_1.value > cte_2.value) ORDER BY 1,2,3,4,5,6 DESC LIMIT 3;;
-- full join is only supported when both sides are
-- recursively planned
WITH cte_1 AS (SELECT value FROM test_table WHERE key > 1),
cte_2 AS (SELECT value FROM test_table WHERE key > 3)
SELECT * FROM cte_1 FULL JOIN cte_2 USING (value);
SELECT * FROM cte_1 FULL JOIN cte_2 USING (value) ORDER BY 1 DESC LIMIT 3;;
-- an unsupported agg. for multi-shard queries
-- so CTE has to be recursively planned
@ -580,7 +596,7 @@ SELECT json_object_agg(DISTINCT key, value) FROM cte_1;
-- "some" of the CTEs
WITH cte_1 AS (SELECT value FROM test_table WHERE key > 1),
cte_2 AS (SELECT max(value) as value FROM test_table WHERE key > 3)
SELECT * FROM cte_1 JOIN cte_2 USING (value);
SELECT count(*) FROM cte_1 JOIN cte_2 USING (value);
-- prevent DROP CASCADE to give notices