-- -- CTE_INLINE -- -- This test file has an alternative output because of the change in the -- display of SQL-standard function's arguments in INSERT/SELECT in PG15. -- The alternative output can be deleted when we drop support for PG14 -- SHOW server_version \gset SELECT substring(:'server_version', '\d+')::int >= 15 AS server_version_ge_15; server_version_ge_15 --------------------------------------------------------------------- f (1 row) CREATE SCHEMA cte_inline; SET search_path TO cte_inline; SET citus.next_shard_id TO 1960000; CREATE TABLE test_table (key int, value text, other_value jsonb); SELECT create_distributed_table ('test_table', 'key'); create_distributed_table --------------------------------------------------------------------- (1 row) INSERT INTO test_table SELECT i % 10, 'test' || i, row_to_json(row(i, i*18, 'test' || i)) FROM generate_series (0, 100) i; SET client_min_messages TO DEBUG; -- Citus should not inline this CTE because otherwise it cannot -- plan the query WITH cte_1 AS (SELECT * FROM test_table) SELECT * FROM test_table LEFT JOIN cte_1 USING (value) ORDER BY 1 DESC LIMIT 3; DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for subquery SELECT key, value, other_value FROM cte_inline.test_table DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT test_table.value, test_table.key, test_table.other_value, cte_1.key, cte_1.other_value FROM (cte_inline.test_table LEFT JOIN (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb)) cte_1 USING (value)) ORDER BY test_table.value DESC LIMIT 3 DEBUG: Router planner cannot handle multi-shard select queries DEBUG: push down of limit count: 3 value | key | other_value | key | other_value --------------------------------------------------------------------- test99 | 9 | {"f1": 99, "f2": 1782, "f3": "test99"} | 9 | {"f1": 99, "f2": 1782, "f3": "test99"} test98 | 8 | {"f1": 98, "f2": 1764, "f3": "test98"} | 8 | {"f1": 98, "f2": 1764, "f3": "test98"} test97 | 7 | {"f1": 97, "f2": 1746, "f3": "test97"} | 7 | {"f1": 97, "f2": 1746, "f3": "test97"} (3 rows) -- Should still not be inlined even if NOT MATERIALIZED is passed WITH cte_1 AS NOT MATERIALIZED (SELECT * FROM test_table) SELECT * FROM test_table LEFT JOIN cte_1 USING (value) ORDER BY 2 DESC LIMIT 1; DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for subquery SELECT key, value, other_value FROM cte_inline.test_table DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT test_table.value, test_table.key, test_table.other_value, cte_1.key, cte_1.other_value FROM (cte_inline.test_table LEFT JOIN (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb)) cte_1 USING (value)) ORDER BY test_table.key DESC LIMIT 1 DEBUG: Router planner cannot handle multi-shard select queries DEBUG: push down of limit count: 1 value | key | other_value | key | other_value --------------------------------------------------------------------- test9 | 9 | {"f1": 9, "f2": 162, "f3": "test9"} | 9 | {"f1": 9, "f2": 162, "f3": "test9"} (1 row) -- the cte can be inlined because the unsupported -- part of the query (subquery in WHERE clause) -- doesn't access the cte WITH cte_1 AS (SELECT * FROM test_table) SELECT count(*) FROM cte_1 WHERE key IN ( SELECT (SELECT 1) FROM test_table WHERE key = 1 ); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Creating router plan DEBUG: query has a single distribution column value: 1 DEBUG: generating subplan XXX_1 for subquery SELECT (SELECT 1) FROM cte_inline.test_table WHERE (key OPERATOR(pg_catalog.=) 1) DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT count(*) AS count FROM (SELECT test_table.key, test_table.value, test_table.other_value FROM cte_inline.test_table) cte_1 WHERE (key OPERATOR(pg_catalog.=) ANY (SELECT intermediate_result."?column?" FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result("?column?" integer))) DEBUG: Router planner cannot handle multi-shard select queries count --------------------------------------------------------------------- 10 (1 row) -- a similar query as the above, and this time the planning -- fails, but it fails because the subquery in WHERE clause -- cannot be planned by Citus WITH cte_1 AS (SELECT * FROM test_table) SELECT count(*) FROM cte_1 WHERE key IN ( SELECT key FROM test_table FOR UPDATE ); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: SELECT FOR UPDATE with table replication factor > 1 not supported for non-reference tables. DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for CTE cte_1: SELECT key, value, other_value FROM cte_inline.test_table DEBUG: Router planner cannot handle multi-shard select queries DEBUG: SELECT FOR UPDATE with table replication factor > 1 not supported for non-reference tables. ERROR: could not run distributed query with FOR UPDATE/SHARE commands HINT: Consider using an equality filter on the distributed table's partition column. -- Citus does the inlining, the planning fails -- and retries without inlining, which works -- fine later via recursive planning WITH cte_1 AS (SELECT * FROM test_table) SELECT *, (SELECT 1) FROM (SELECT * FROM cte_1) AS foo ORDER BY 2 DESC LIMIT 1; DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: push down of limit count: 1 key | value | other_value | ?column? --------------------------------------------------------------------- 9 | test99 | {"f1": 99, "f2": 1782, "f3": "test99"} | 1 (1 row) -- a little more complicated query tree -- Citus does the inlining, the planning fails -- and retries without inlining, which works WITH top_cte AS (SELECT * FROM test_table) SELECT count(*) FROM top_cte, (WITH cte_1 AS (SELECT * FROM test_table) SELECT *, (SELECT 1) FROM (SELECT * FROM cte_1) AS foo) AS bar; DEBUG: CTE top_cte is going to be inlined via distributed planning DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for subquery SELECT key, value, other_value, (SELECT 1) FROM (SELECT cte_1.key, cte_1.value, cte_1.other_value FROM (SELECT test_table.key, test_table.value, test_table.other_value FROM cte_inline.test_table) cte_1) foo DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT count(*) AS count FROM (SELECT test_table.key, test_table.value, test_table.other_value FROM cte_inline.test_table) top_cte, (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value, intermediate_result."?column?" FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb, "?column?" integer)) bar(key, value, other_value, "?column?") DEBUG: Router planner cannot handle multi-shard select queries count --------------------------------------------------------------------- 10201 (1 row) -- CTE is used inside a subquery in WHERE clause -- the query wouldn't work by inlining, so Citus -- retries again via recursive planning, which -- works fine WITH cte_1 AS (SELECT * FROM test_table) SELECT count(*) FROM test_table WHERE KEY IN (SELECT (SELECT 1) FROM (SELECT *, random() FROM (SELECT * FROM cte_1) AS foo) AS bar); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for subquery SELECT (SELECT 1) FROM (SELECT foo.key, foo.value, foo.other_value, random() AS random FROM (SELECT cte_1.key, cte_1.value, cte_1.other_value FROM (SELECT test_table.key, test_table.value, test_table.other_value FROM cte_inline.test_table) cte_1) foo) bar DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT count(*) AS count FROM cte_inline.test_table WHERE (key OPERATOR(pg_catalog.=) ANY (SELECT intermediate_result."?column?" FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result("?column?" integer))) DEBUG: Router planner cannot handle multi-shard select queries count --------------------------------------------------------------------- 10 (1 row) -- cte_1 is used inside another CTE, but still -- doesn't work when inlined because it is finally -- used in an unsupported query -- but still works fine because recursive planning -- kicks in WITH cte_1 AS (SELECT * FROM test_table) SELECT (SELECT 1) AS KEY FROM ( WITH cte_2 AS (SELECT *, random() FROM (SELECT *,random() FROM cte_1) as foo) SELECT *, random() FROM cte_2) as bar ORDER BY 1 DESC LIMIT 3; DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for CTE cte_2: SELECT key, value, other_value, random, random() AS random FROM (SELECT cte_1.key, cte_1.value, cte_1.other_value, random() AS random FROM (SELECT test_table.key, test_table.value, test_table.other_value FROM cte_inline.test_table) cte_1) foo DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT (SELECT 1) AS key FROM (SELECT cte_2.key, cte_2.value, cte_2.other_value, cte_2.random, cte_2.random_1 AS random, random() AS random FROM (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value, intermediate_result.random, intermediate_result.random_1 AS random FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb, random double precision, random_1 double precision)) cte_2(key, value, other_value, random, random_1)) bar(key, value, other_value, random, random_1, random_2) ORDER BY (SELECT 1) DESC LIMIT 3 DEBUG: Creating router plan key --------------------------------------------------------------------- 1 1 1 (3 rows) -- in this example, cte_2 can be inlined, because it is not used -- on any query that Citus cannot plan. However, cte_1 should not be -- inlined, because it is used with a subquery in target list WITH cte_1 AS (SELECT * FROM test_table), cte_2 AS (select * from test_table) SELECT count(*) FROM (SELECT *, (SELECT 1) FROM cte_1) as foo JOIN cte_2 ON (true); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: CTE cte_2 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for subquery SELECT key, value, other_value FROM cte_inline.test_table DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT count(*) AS count FROM ((SELECT cte_1.key, cte_1.value, cte_1.other_value, (SELECT 1) FROM (SELECT test_table.key, test_table.value, test_table.other_value FROM cte_inline.test_table) cte_1) foo(key, value, other_value, "?column?") JOIN (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb)) cte_2 ON (true)) DEBUG: Router planner cannot handle multi-shard select queries count --------------------------------------------------------------------- 10201 (1 row) -- unreferenced CTEs are just ignored -- by Citus/Postgres WITH a AS (SELECT * FROM test_table) SELECT *, row_number() OVER () FROM test_table WHERE key = 1 ORDER BY 3 DESC LIMIT 5; DEBUG: Creating router plan DEBUG: query has a single distribution column value: 1 key | value | other_value | row_number --------------------------------------------------------------------- 1 | test91 | {"f1": 91, "f2": 1638, "f3": "test91"} | 10 1 | test81 | {"f1": 81, "f2": 1458, "f3": "test81"} | 9 1 | test71 | {"f1": 71, "f2": 1278, "f3": "test71"} | 8 1 | test61 | {"f1": 61, "f2": 1098, "f3": "test61"} | 7 1 | test51 | {"f1": 51, "f2": 918, "f3": "test51"} | 6 (5 rows) -- router queries are affected by the distributed -- cte inlining WITH a AS (SELECT * FROM test_table WHERE key = 1) SELECT *, (SELECT 1) FROM a WHERE key = 1 ORDER BY 1 DESC LIMIT 5; DEBUG: CTE a is going to be inlined via distributed planning DEBUG: Creating router plan DEBUG: query has a single distribution column value: 1 key | value | other_value | ?column? --------------------------------------------------------------------- 1 | test1 | {"f1": 1, "f2": 18, "f3": "test1"} | 1 1 | test11 | {"f1": 11, "f2": 198, "f3": "test11"} | 1 1 | test21 | {"f1": 21, "f2": 378, "f3": "test21"} | 1 1 | test31 | {"f1": 31, "f2": 558, "f3": "test31"} | 1 1 | test41 | {"f1": 41, "f2": 738, "f3": "test41"} | 1 (5 rows) -- non router queries are affected by the distributed -- cte inlining as well WITH a AS (SELECT * FROM test_table) SELECT count(*) FROM a WHERE key = 1; DEBUG: CTE a is going to be inlined via distributed planning DEBUG: Creating router plan DEBUG: query has a single distribution column value: 1 count --------------------------------------------------------------------- 10 (1 row) -- explicitely using NOT MATERIALIZED should result in the same WITH a AS NOT MATERIALIZED (SELECT * FROM test_table) SELECT count(*) FROM a WHERE key = 1; DEBUG: CTE a is going to be inlined via distributed planning DEBUG: Creating router plan DEBUG: query has a single distribution column value: 1 count --------------------------------------------------------------------- 10 (1 row) -- using MATERIALIZED should cause inlining not to happen WITH a AS MATERIALIZED (SELECT * FROM test_table) SELECT count(*) FROM a WHERE key = 1; DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for CTE a: SELECT key, value, other_value FROM cte_inline.test_table DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT count(*) AS count FROM (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb)) a WHERE (key OPERATOR(pg_catalog.=) 1) DEBUG: Creating router plan count --------------------------------------------------------------------- 10 (1 row) -- EXPLAIN should show the difference between materialized an not materialized EXPLAIN (COSTS OFF) WITH a AS (SELECT * FROM test_table) SELECT count(*) FROM a WHERE key = 1; DEBUG: CTE a is going to be inlined via distributed planning DEBUG: Creating router plan DEBUG: query has a single distribution column value: 1 QUERY PLAN --------------------------------------------------------------------- Custom Scan (Citus Adaptive) Task Count: 1 Tasks Shown: All -> Task Node: host=localhost port=xxxxx dbname=regression -> Aggregate -> Seq Scan on test_table_1960000 test_table Filter: (key = 1) (8 rows) EXPLAIN (COSTS OFF) WITH a AS MATERIALIZED (SELECT * FROM test_table) SELECT count(*) FROM a WHERE key = 1; DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for CTE a: SELECT key, value, other_value FROM cte_inline.test_table DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT count(*) AS count FROM (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb)) a WHERE (key OPERATOR(pg_catalog.=) 1) DEBUG: Creating router plan QUERY PLAN --------------------------------------------------------------------- Custom Scan (Citus Adaptive) -> Distributed Subplan XXX_1 -> Custom Scan (Citus Adaptive) Task Count: 4 Tasks Shown: One of 4 -> Task Node: host=localhost port=xxxxx dbname=regression -> Seq Scan on test_table_1960000 test_table Task Count: 1 Tasks Shown: All -> Task Node: host=localhost port=xxxxx dbname=regression -> Aggregate -> Function Scan on read_intermediate_result intermediate_result Filter: (key = 1) (15 rows) -- citus should not inline the CTE because it is used multiple times WITH cte_1 AS (SELECT * FROM test_table) SELECT count(*) FROM cte_1 as first_entry JOIN cte_1 as second_entry USING (key); DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for CTE cte_1: SELECT key, value, other_value FROM cte_inline.test_table DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT count(*) AS count FROM ((SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb)) first_entry JOIN (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb)) second_entry USING (key)) DEBUG: Creating router plan count --------------------------------------------------------------------- 1021 (1 row) -- NOT MATERIALIZED should cause the query to be inlined twice WITH cte_1 AS NOT MATERIALIZED (SELECT * FROM test_table) SELECT count(*) FROM cte_1 as first_entry JOIN cte_1 as second_entry USING (key); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: join prunable for intervals [-2147483648,-1073741825] and [-1073741824,-1] DEBUG: join prunable for intervals [-2147483648,-1073741825] and [0,1073741823] DEBUG: join prunable for intervals [-2147483648,-1073741825] and [1073741824,2147483647] DEBUG: join prunable for intervals [-1073741824,-1] and [-2147483648,-1073741825] DEBUG: join prunable for intervals [-1073741824,-1] and [0,1073741823] DEBUG: join prunable for intervals [-1073741824,-1] and [1073741824,2147483647] DEBUG: join prunable for intervals [0,1073741823] and [-2147483648,-1073741825] DEBUG: join prunable for intervals [0,1073741823] and [-1073741824,-1] DEBUG: join prunable for intervals [0,1073741823] and [1073741824,2147483647] DEBUG: join prunable for intervals [1073741824,2147483647] and [-2147483648,-1073741825] DEBUG: join prunable for intervals [1073741824,2147483647] and [-1073741824,-1] DEBUG: join prunable for intervals [1073741824,2147483647] and [0,1073741823] count --------------------------------------------------------------------- 1021 (1 row) -- EXPLAIN should show the differences between MATERIALIZED and NOT MATERIALIZED \set VERBOSITY terse SELECT public.coordinator_plan_with_subplans($Q$ EXPLAIN (COSTS OFF) WITH cte_1 AS (SELECT * FROM test_table) SELECT count(*) FROM cte_1 as first_entry JOIN cte_1 as second_entry USING (key); $Q$); DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for CTE cte_1: SELECT key, value, other_value FROM cte_inline.test_table DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT count(*) AS count FROM ((SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb)) first_entry JOIN (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb)) second_entry USING (key)) DEBUG: Creating router plan coordinator_plan_with_subplans --------------------------------------------------------------------- Custom Scan (Citus Adaptive) -> Distributed Subplan XXX_1 -> Custom Scan (Citus Adaptive) Task Count: 4 Task Count: 1 (5 rows) \set VERBOSITY default EXPLAIN (COSTS OFF) WITH cte_1 AS NOT MATERIALIZED (SELECT * FROM test_table) SELECT count(*) FROM cte_1 as first_entry JOIN cte_1 as second_entry USING (key); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: join prunable for intervals [-2147483648,-1073741825] and [-1073741824,-1] DEBUG: join prunable for intervals [-2147483648,-1073741825] and [0,1073741823] DEBUG: join prunable for intervals [-2147483648,-1073741825] and [1073741824,2147483647] DEBUG: join prunable for intervals [-1073741824,-1] and [-2147483648,-1073741825] DEBUG: join prunable for intervals [-1073741824,-1] and [0,1073741823] DEBUG: join prunable for intervals [-1073741824,-1] and [1073741824,2147483647] DEBUG: join prunable for intervals [0,1073741823] and [-2147483648,-1073741825] DEBUG: join prunable for intervals [0,1073741823] and [-1073741824,-1] DEBUG: join prunable for intervals [0,1073741823] and [1073741824,2147483647] DEBUG: join prunable for intervals [1073741824,2147483647] and [-2147483648,-1073741825] DEBUG: join prunable for intervals [1073741824,2147483647] and [-1073741824,-1] DEBUG: join prunable for intervals [1073741824,2147483647] and [0,1073741823] QUERY PLAN --------------------------------------------------------------------- Aggregate -> Custom Scan (Citus Adaptive) Task Count: 4 Tasks Shown: One of 4 -> Task Node: host=localhost port=xxxxx dbname=regression -> Aggregate -> Hash Join Hash Cond: (test_table.key = test_table_1.key) -> Seq Scan on test_table_1960000 test_table -> Hash -> Seq Scan on test_table_1960000 test_table_1 (12 rows) -- ctes with volatile functions are not -- inlined WITH cte_1 AS (SELECT *, random() FROM test_table) SELECT key, value FROM cte_1 ORDER BY 2 DESC LIMIT 1; DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for CTE cte_1: SELECT key, value, other_value, random() AS random FROM cte_inline.test_table DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT key, value FROM (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value, intermediate_result.random FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb, random double precision)) cte_1 ORDER BY value DESC LIMIT 1 DEBUG: Creating router plan key | value --------------------------------------------------------------------- 9 | test99 (1 row) -- even with NOT MATERIALIZED volatile functions should not be inlined WITH cte_1 AS NOT MATERIALIZED (SELECT *, random() FROM test_table) SELECT count(*) FROM cte_1; DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for CTE cte_1: SELECT key, value, other_value, random() AS random FROM cte_inline.test_table DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT count(*) AS count FROM (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value, intermediate_result.random FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb, random double precision)) cte_1 DEBUG: Creating router plan count --------------------------------------------------------------------- 101 (1 row) -- cte_1 should be able to inlined even if -- it is used one level below WITH cte_1 AS (SELECT * FROM test_table) SELECT count(*) FROM ( WITH ct2 AS (SELECT * FROM cte_1) SELECT * FROM ct2 ) as foo; DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: CTE ct2 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries count --------------------------------------------------------------------- 101 (1 row) -- a similar query, but there is also -- one more cte, which relies on the previous -- CTE WITH cte_1 AS (SELECT * FROM test_table) SELECT count(DISTINCT key) FROM ( WITH cte_2 AS (SELECT * FROM cte_1), cte_3 AS (SELECT * FROM cte_2) SELECT * FROM cte_3 ) as foo; DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: CTE cte_2 is going to be inlined via distributed planning DEBUG: CTE cte_3 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries count --------------------------------------------------------------------- 10 (1 row) -- inlined CTE contains a reference to outer query -- should be fine (because we pushdown the whole query) SELECT count(*) FROM (SELECT * FROM test_table) AS test_table_cte JOIN LATERAL (WITH bar AS (SELECT * FROM test_table WHERE key = test_table_cte.key) SELECT * FROM bar LEFT JOIN test_table u2 ON u2.key = bar.key) AS foo ON TRUE; DEBUG: CTE bar is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries count --------------------------------------------------------------------- 10331 (1 row) -- inlined CTE contains a reference to outer query -- should be fine (even if the recursive planning fails -- to recursively plan the query) SELECT count(*) FROM (SELECT * FROM test_table) AS test_table_cte JOIN LATERAL (WITH bar AS (SELECT * FROM test_table WHERE key = test_table_cte.key) SELECT * FROM bar LEFT JOIN test_table u2 ON u2.key = bar.value::int) AS foo ON TRUE; DEBUG: CTE bar is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: skipping recursive planning for the subquery since it contains references to outer queries DEBUG: skipping recursive planning for the subquery since it contains references to outer queries DEBUG: skipping recursive planning for the subquery since it contains references to outer queries DEBUG: Router planner cannot handle multi-shard select queries ERROR: CTEs that refer to other subqueries are not supported in multi-shard queries -- inlined CTE can recursively planned later, that's the decision -- recursive planning makes -- LIMIT 5 in cte2 triggers recusrive planning, after cte inlining WITH cte_1 AS (SELECT * FROM test_table) SELECT * FROM ( WITH ct2 AS (SELECT * FROM cte_1 ORDER BY 1, 2, 3 LIMIT 5) SELECT * FROM ct2 ) as foo ORDER BY 1 DESC, 2 DESC, 3 DESC LIMIT 5; DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: CTE ct2 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Router planner cannot handle multi-shard select queries DEBUG: push down of limit count: 5 DEBUG: generating subplan XXX_1 for subquery SELECT key, value, other_value FROM (SELECT test_table.key, test_table.value, test_table.other_value FROM cte_inline.test_table) cte_1 ORDER BY key, value, other_value LIMIT 5 DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT key, value, other_value FROM (SELECT ct2.key, ct2.value, ct2.other_value FROM (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb)) ct2) foo ORDER BY key DESC, value DESC, other_value DESC LIMIT 5 DEBUG: Creating router plan key | value | other_value --------------------------------------------------------------------- 0 | test30 | {"f1": 30, "f2": 540, "f3": "test30"} 0 | test20 | {"f1": 20, "f2": 360, "f3": "test20"} 0 | test100 | {"f1": 100, "f2": 1800, "f3": "test100"} 0 | test10 | {"f1": 10, "f2": 180, "f3": "test10"} 0 | test0 | {"f1": 0, "f2": 0, "f3": "test0"} (5 rows) -- all nested CTEs can be inlinied WITH cte_1 AS ( WITH cte_1 AS ( WITH cte_1 AS ( WITH cte_1 AS ( WITH cte_1 AS ( WITH cte_1 AS ( WITH cte_1 AS (SELECT count(*), key FROM test_table GROUP BY key) SELECT * FROM cte_1) SELECT * FROM cte_1 WHERE key = 1) SELECT * FROM cte_1 WHERE key = 2) SELECT * FROM cte_1 WHERE key = 3) SELECT * FROM cte_1 WHERE key = 4) SELECT * FROM cte_1 WHERE key = 5) SELECT * FROM cte_1 WHERE key = 6; DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Creating router plan DEBUG: query has a single distribution column value: 1 count | key --------------------------------------------------------------------- (0 rows) -- ctes can be inlined even if they are used -- in set operations WITH cte_1 AS (SELECT * FROM test_table), cte_2 AS (SELECT * FROM test_table) SELECT count(*) FROM ( (SELECT * FROM cte_1 EXCEPT SELECT * FROM test_table) UNION (SELECT * FROM cte_2)) as foo; DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: CTE cte_2 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for subquery SELECT key, value, other_value FROM (SELECT test_table.key, test_table.value, test_table.other_value FROM cte_inline.test_table) cte_1 DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_2 for subquery SELECT key, value, other_value FROM cte_inline.test_table DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_3 for subquery SELECT key, value, other_value FROM (SELECT test_table.key, test_table.value, test_table.other_value FROM cte_inline.test_table) cte_2 DEBUG: Creating router plan DEBUG: generating subplan XXX_4 for subquery (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb) EXCEPT SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_2'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb)) UNION SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_3'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb) DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT count(*) AS count FROM (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_4'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb)) foo DEBUG: Creating router plan count --------------------------------------------------------------------- 101 (1 row) -- cte_1 is going to be inlined even inside another set operation WITH cte_1 AS (SELECT * FROM test_table), cte_2 AS (SELECT * FROM test_table ORDER BY 1 DESC LIMIT 3) (SELECT *, (SELECT 1) FROM cte_1 EXCEPT SELECT *, 1 FROM test_table) UNION (SELECT *, 1 FROM cte_2) ORDER BY 1,2; DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: CTE cte_2 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Router planner cannot handle multi-shard select queries DEBUG: push down of limit count: 3 DEBUG: generating subplan XXX_1 for subquery SELECT key, value, other_value FROM cte_inline.test_table ORDER BY key DESC LIMIT 3 DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_2 for subquery SELECT key, value, other_value, (SELECT 1) FROM (SELECT test_table.key, test_table.value, test_table.other_value FROM cte_inline.test_table) cte_1 DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_3 for subquery SELECT key, value, other_value, 1 FROM cte_inline.test_table DEBUG: Plan XXX query after replacing subqueries and CTEs: (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value, intermediate_result."?column?" FROM read_intermediate_result('XXX_2'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb, "?column?" integer) EXCEPT SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value, intermediate_result."?column?" FROM read_intermediate_result('XXX_3'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb, "?column?" integer)) UNION SELECT cte_2.key, cte_2.value, cte_2.other_value, 1 FROM (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb)) cte_2 ORDER BY 1, 2 DEBUG: Creating router plan key | value | other_value | ?column? --------------------------------------------------------------------- 9 | test19 | {"f1": 19, "f2": 342, "f3": "test19"} | 1 9 | test29 | {"f1": 29, "f2": 522, "f3": "test29"} | 1 9 | test9 | {"f1": 9, "f2": 162, "f3": "test9"} | 1 (3 rows) -- cte_1 is safe to inline, even if because after inlining -- it'd be in a query tree where there is a query that is -- not supported by Citus unless recursively planned -- cte_2 is on another queryTree, should be fine WITH cte_1 AS (SELECT * FROM test_table), cte_2 AS (SELECT * FROM test_table) (SELECT *, (SELECT key FROM cte_1) FROM test_table) UNION (SELECT *, 1 FROM cte_2); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: CTE cte_2 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for CTE cte_1: SELECT key, value, other_value FROM cte_inline.test_table DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_2 for CTE cte_2: SELECT key, value, other_value FROM cte_inline.test_table DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_3 for subquery SELECT key, value, other_value, (SELECT cte_1.key FROM (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb)) cte_1) AS key FROM cte_inline.test_table DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value, intermediate_result.key_1 AS key FROM read_intermediate_result('XXX_3'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb, key_1 integer) UNION SELECT cte_2.key, cte_2.value, cte_2.other_value, 1 FROM (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_2'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb)) cte_2 DEBUG: Creating router plan ERROR: more than one row returned by a subquery used as an expression CONTEXT: while executing command on localhost:xxxxx -- after inlining CTEs, the query becomes -- subquery pushdown with set operations WITH cte_1 AS (SELECT * FROM test_table), cte_2 AS (SELECT * FROM test_table) SELECT max(key) FROM ( SELECT * FROM cte_1 UNION SELECT * FROM cte_2 ) as bar; DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: CTE cte_2 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries max --------------------------------------------------------------------- 9 (1 row) -- cte LEFT JOIN subquery should only work -- when CTE is inlined, as Citus currently -- doesn't know how to handle intermediate -- results in the outer parts of outer -- queries WITH cte AS (SELECT * FROM test_table) SELECT count(*) FROM cte LEFT JOIN test_table USING (key); DEBUG: CTE cte is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries count --------------------------------------------------------------------- 1021 (1 row) -- the CTEs are very simple, so postgres -- can pull-up the subqueries after inlining -- the CTEs, and the query that we send to workers -- becomes a join between two tables WITH cte_1 AS (SELECT key FROM test_table), cte_2 AS (SELECT key FROM test_table) SELECT count(*) FROM cte_1 JOIN cte_2 USING (key); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: CTE cte_2 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: join prunable for intervals [-2147483648,-1073741825] and [-1073741824,-1] DEBUG: join prunable for intervals [-2147483648,-1073741825] and [0,1073741823] DEBUG: join prunable for intervals [-2147483648,-1073741825] and [1073741824,2147483647] DEBUG: join prunable for intervals [-1073741824,-1] and [-2147483648,-1073741825] DEBUG: join prunable for intervals [-1073741824,-1] and [0,1073741823] DEBUG: join prunable for intervals [-1073741824,-1] and [1073741824,2147483647] DEBUG: join prunable for intervals [0,1073741823] and [-2147483648,-1073741825] DEBUG: join prunable for intervals [0,1073741823] and [-1073741824,-1] DEBUG: join prunable for intervals [0,1073741823] and [1073741824,2147483647] DEBUG: join prunable for intervals [1073741824,2147483647] and [-2147483648,-1073741825] DEBUG: join prunable for intervals [1073741824,2147483647] and [-1073741824,-1] DEBUG: join prunable for intervals [1073741824,2147483647] and [0,1073741823] count --------------------------------------------------------------------- 1021 (1 row) -- the following query is kind of interesting -- During INSERT .. SELECT via coordinator, -- Citus moves the CTEs into SELECT part, and plans/execute -- the SELECT separately. Thus, fist_table_cte can be inlined -- by Citus -- but not by Postgres WITH fist_table_cte AS (SELECT * FROM test_table) INSERT INTO test_table (key, value) SELECT key, value FROM fist_table_cte; DEBUG: distributed INSERT ... SELECT can only select from distributed tables DEBUG: CTE fist_table_cte is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: performing repartitioned INSERT ... SELECT DEBUG: partitioning SELECT query by column index 0 with name 'key' DEBUG: distributed statement: INSERT INTO cte_inline.test_table_1960000 AS citus_table_alias (key, value) SELECT key, value FROM read_intermediate_results('{repartitioned_results_xxxxx_from_1960000_to_0}'::text[], 'binary'::citus_copy_format) intermediate_result(key integer, value text) DEBUG: distributed statement: INSERT INTO cte_inline.test_table_1960001 AS citus_table_alias (key, value) SELECT key, value FROM read_intermediate_results('{repartitioned_results_xxxxx_from_1960001_to_1}'::text[], 'binary'::citus_copy_format) intermediate_result(key integer, value text) DEBUG: distributed statement: INSERT INTO cte_inline.test_table_1960002 AS citus_table_alias (key, value) SELECT key, value FROM read_intermediate_results('{repartitioned_results_xxxxx_from_1960002_to_2}'::text[], 'binary'::citus_copy_format) intermediate_result(key integer, value text) DEBUG: distributed statement: INSERT INTO cte_inline.test_table_1960003 AS citus_table_alias (key, value) SELECT key, value FROM read_intermediate_results('{repartitioned_results_xxxxx_from_1960003_to_3}'::text[], 'binary'::citus_copy_format) intermediate_result(key integer, value text) -- the following INSERT..SELECT is even more interesting -- the CTE becomes pushdownable INSERT INTO test_table WITH fist_table_cte AS (SELECT * FROM test_table) SELECT key, value FROM fist_table_cte; DEBUG: CTE fist_table_cte is going to be inlined via distributed planning DEBUG: distributed statement: INSERT INTO cte_inline.test_table_1960000 AS citus_table_alias (key, value) SELECT key, value FROM (SELECT test_table.key, test_table.value, test_table.other_value FROM cte_inline.test_table_1960000 test_table) fist_table_cte WHERE (key IS NOT NULL) DEBUG: distributed statement: INSERT INTO cte_inline.test_table_1960001 AS citus_table_alias (key, value) SELECT key, value FROM (SELECT test_table.key, test_table.value, test_table.other_value FROM cte_inline.test_table_1960001 test_table) fist_table_cte WHERE (key IS NOT NULL) DEBUG: distributed statement: INSERT INTO cte_inline.test_table_1960002 AS citus_table_alias (key, value) SELECT key, value FROM (SELECT test_table.key, test_table.value, test_table.other_value FROM cte_inline.test_table_1960002 test_table) fist_table_cte WHERE (key IS NOT NULL) DEBUG: distributed statement: INSERT INTO cte_inline.test_table_1960003 AS citus_table_alias (key, value) SELECT key, value FROM (SELECT test_table.key, test_table.value, test_table.other_value FROM cte_inline.test_table_1960003 test_table) fist_table_cte WHERE (key IS NOT NULL) -- update/delete/modifying ctes -- we don't support any cte inlining in modifications -- queries and modifying CTEs WITH cte_1 AS (SELECT * FROM test_table) DELETE FROM test_table WHERE key NOT IN (SELECT key FROM cte_1); DEBUG: complex joins are only supported when all distributed tables are co-located and joined on their distribution columns DEBUG: generating subplan XXX_1 for CTE cte_1: SELECT key, value, other_value FROM cte_inline.test_table DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Plan XXX query after replacing subqueries and CTEs: DELETE FROM cte_inline.test_table WHERE (NOT (key OPERATOR(pg_catalog.=) ANY (SELECT cte_1.key FROM (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb)) cte_1))) DEBUG: Creating router plan -- NOT MATERIALIZED should not CTEs that are used in a modifying query, because -- we de still don't support it WITH cte_1 AS NOT MATERIALIZED (SELECT * FROM test_table) DELETE FROM test_table WHERE key NOT IN (SELECT key FROM cte_1); DEBUG: complex joins are only supported when all distributed tables are co-located and joined on their distribution columns DEBUG: generating subplan XXX_1 for CTE cte_1: SELECT key, value, other_value FROM cte_inline.test_table DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Plan XXX query after replacing subqueries and CTEs: DELETE FROM cte_inline.test_table WHERE (NOT (key OPERATOR(pg_catalog.=) ANY (SELECT cte_1.key FROM (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb)) cte_1))) DEBUG: Creating router plan -- we don't inline CTEs if they are modifying CTEs WITH cte_1 AS (DELETE FROM test_table WHERE key % 3 = 1 RETURNING key) SELECT * FROM cte_1 ORDER BY 1 DESC LIMIT 3; DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for CTE cte_1: DELETE FROM cte_inline.test_table WHERE ((key OPERATOR(pg_catalog.%) 3) OPERATOR(pg_catalog.=) 1) RETURNING key DEBUG: Creating router plan DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT key FROM (SELECT intermediate_result.key FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer)) cte_1 ORDER BY key DESC LIMIT 3 DEBUG: Creating router plan key --------------------------------------------------------------------- 7 7 7 (3 rows) -- NOT MATERIALIZED should not affect modifying CTEs WITH cte_1 AS NOT MATERIALIZED (DELETE FROM test_table WHERE key % 3 = 0 RETURNING key) SELECT count(*) FROM cte_1; DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for CTE cte_1: DELETE FROM cte_inline.test_table WHERE ((key OPERATOR(pg_catalog.%) 3) OPERATOR(pg_catalog.=) 0) RETURNING key DEBUG: Creating router plan DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT count(*) AS count FROM (SELECT intermediate_result.key FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer)) cte_1 DEBUG: Creating router plan count --------------------------------------------------------------------- 164 (1 row) -- cte with column aliases SELECT * FROM test_table, (WITH cte_1 (x,y) AS (SELECT * FROM test_table), cte_2 (z,y) AS (SELECT value, other_value, key FROM test_table), cte_3 (t,m) AS (SELECT z, y, key as cte_2_key FROM cte_2) SELECT * FROM cte_2, cte_3) as bar ORDER BY value, other_value, z, y, t, m, cte_2_key LIMIT 5; DEBUG: CTE cte_3 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for CTE cte_2: SELECT value, other_value, key FROM cte_inline.test_table DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT test_table.key, test_table.value, test_table.other_value, bar.z, bar.y, bar.key, bar.t, bar.m, bar.cte_2_key FROM cte_inline.test_table, (SELECT cte_2.z, cte_2.y, cte_2.key, cte_3.t, cte_3.m, cte_3.cte_2_key FROM (SELECT intermediate_result.value AS z, intermediate_result.other_value AS y, intermediate_result.key FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(value text, other_value jsonb, key integer)) cte_2, (SELECT cte_2_1.z AS t, cte_2_1.y AS m, cte_2_1.key AS cte_2_key FROM (SELECT intermediate_result.value AS z, intermediate_result.other_value AS y, intermediate_result.key FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(value text, other_value jsonb, key integer)) cte_2_1) cte_3) bar ORDER BY test_table.value, test_table.other_value, bar.z, bar.y, bar.t, bar.m, bar.cte_2_key LIMIT 5 DEBUG: Router planner cannot handle multi-shard select queries DEBUG: push down of limit count: 5 key | value | other_value | z | y | key | t | m | cte_2_key --------------------------------------------------------------------- 2 | test12 | {"f1": 12, "f2": 216, "f3": "test12"} | test12 | {"f1": 12, "f2": 216, "f3": "test12"} | 2 | test12 | {"f1": 12, "f2": 216, "f3": "test12"} | 2 2 | test12 | {"f1": 12, "f2": 216, "f3": "test12"} | test12 | {"f1": 12, "f2": 216, "f3": "test12"} | 2 | test12 | | 2 2 | test12 | {"f1": 12, "f2": 216, "f3": "test12"} | test12 | {"f1": 12, "f2": 216, "f3": "test12"} | 2 | test12 | | 2 2 | test12 | {"f1": 12, "f2": 216, "f3": "test12"} | test12 | {"f1": 12, "f2": 216, "f3": "test12"} | 2 | test12 | | 2 2 | test12 | {"f1": 12, "f2": 216, "f3": "test12"} | test12 | {"f1": 12, "f2": 216, "f3": "test12"} | 2 | test15 | {"f1": 15, "f2": 270, "f3": "test15"} | 5 (5 rows) -- cte used in HAVING subquery just works fine -- even if it is inlined WITH cte_1 AS (SELECT max(key) as max FROM test_table) SELECT key, count(*) FROM test_table GROUP BY key HAVING (count(*) > (SELECT max FROM cte_1)) ORDER BY 2 DESC, 1 DESC LIMIT 5; DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for subquery SELECT max(key) AS max FROM cte_inline.test_table DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT key, count(*) AS count FROM cte_inline.test_table GROUP BY key HAVING (count(*) OPERATOR(pg_catalog.>) (SELECT cte_1.max FROM (SELECT intermediate_result.max FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(max integer)) cte_1)) ORDER BY (count(*)) DESC, key DESC LIMIT 5 DEBUG: Router planner cannot handle multi-shard select queries DEBUG: push down of limit count: 5 key | count --------------------------------------------------------------------- 8 | 40 5 | 40 2 | 40 (3 rows) -- cte used in ORDER BY just works fine -- even if it is inlined WITH cte_1 AS (SELECT max(key) as max FROM test_table) SELECT key FROM test_table JOIN cte_1 ON (key = max) ORDER BY cte_1.max LIMIT 3; DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for subquery SELECT max(key) AS max FROM cte_inline.test_table DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT test_table.key FROM (cte_inline.test_table JOIN (SELECT intermediate_result.max FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(max integer)) cte_1 ON ((test_table.key OPERATOR(pg_catalog.=) cte_1.max))) ORDER BY cte_1.max LIMIT 3 DEBUG: Router planner cannot handle multi-shard select queries DEBUG: push down of limit count: 3 key --------------------------------------------------------------------- 8 8 8 (3 rows) PREPARE inlined_cte_without_params AS WITH cte_1 AS (SELECT count(*) FROM test_table GROUP BY key) SELECT * FROM cte_1 ORDER BY 1 DESC LIMIT 3; PREPARE non_inlined_cte_without_params AS WITH cte_1 AS (SELECT * FROM test_table) SELECT * FROM test_table LEFT JOIN cte_1 USING (value) ORDER BY 1 DESC, 2 DESC, 3 DESC LIMIT 3; PREPARE inlined_cte_has_parameter_on_non_dist_key(text) AS WITH cte_1 AS (SELECT count(*) FROM test_table WHERE value = $1 GROUP BY key) SELECT * FROM cte_1 ORDER BY 1 DESC LIMIT 3; PREPARE inlined_cte_has_parameter_on_dist_key(int) AS WITH cte_1 AS (SELECT count(*) FROM test_table WHERE key > $1 GROUP BY key) SELECT * FROM cte_1 ORDER BY 1 DESC LIMIT 3; PREPARE non_inlined_cte_has_parameter_on_dist_key(int) AS WITH cte_1 AS (SELECT * FROM test_table where key > $1) SELECT * FROM test_table LEFT JOIN cte_1 USING (value) ORDER BY 1 DESC, 2 DESC, 3 DESC LIMIT 3; PREPARE retry_planning(int) AS WITH cte_1 AS (SELECT * FROM test_table WHERE key > $1) SELECT json_object_agg(DISTINCT key, value) FROM cte_1 ORDER BY max(key), min(value) DESC LIMIT 3; EXECUTE inlined_cte_without_params; DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: push down of limit count: 3 count --------------------------------------------------------------------- 40 40 40 (3 rows) EXECUTE inlined_cte_without_params; count --------------------------------------------------------------------- 40 40 40 (3 rows) EXECUTE inlined_cte_without_params; count --------------------------------------------------------------------- 40 40 40 (3 rows) EXECUTE inlined_cte_without_params; count --------------------------------------------------------------------- 40 40 40 (3 rows) EXECUTE inlined_cte_without_params; count --------------------------------------------------------------------- 40 40 40 (3 rows) EXECUTE inlined_cte_without_params; count --------------------------------------------------------------------- 40 40 40 (3 rows) EXECUTE non_inlined_cte_without_params; DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for subquery SELECT key, value, other_value FROM cte_inline.test_table DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT test_table.value, test_table.key, test_table.other_value, cte_1.key, cte_1.other_value FROM (cte_inline.test_table LEFT JOIN (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb)) cte_1 USING (value)) ORDER BY test_table.value DESC, test_table.key DESC, test_table.other_value DESC LIMIT 3 DEBUG: Router planner cannot handle multi-shard select queries DEBUG: push down of limit count: 3 value | key | other_value | key | other_value --------------------------------------------------------------------- test98 | 8 | | 8 | test98 | 8 | | 8 | test98 | 8 | | 8 | (3 rows) EXECUTE non_inlined_cte_without_params; value | key | other_value | key | other_value --------------------------------------------------------------------- test98 | 8 | | 8 | test98 | 8 | | 8 | test98 | 8 | | 8 | (3 rows) EXECUTE non_inlined_cte_without_params; value | key | other_value | key | other_value --------------------------------------------------------------------- test98 | 8 | | 8 | test98 | 8 | | 8 | test98 | 8 | | 8 | (3 rows) EXECUTE non_inlined_cte_without_params; value | key | other_value | key | other_value --------------------------------------------------------------------- test98 | 8 | | 8 | test98 | 8 | | 8 | test98 | 8 | | 8 | (3 rows) EXECUTE non_inlined_cte_without_params; value | key | other_value | key | other_value --------------------------------------------------------------------- test98 | 8 | | 8 | test98 | 8 | | 8 | test98 | 8 | | 8 | (3 rows) EXECUTE non_inlined_cte_without_params; value | key | other_value | key | other_value --------------------------------------------------------------------- test98 | 8 | | 8 | test98 | 8 | | 8 | test98 | 8 | | 8 | (3 rows) EXECUTE inlined_cte_has_parameter_on_non_dist_key('test1'); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: push down of limit count: 3 count --------------------------------------------------------------------- (0 rows) EXECUTE inlined_cte_has_parameter_on_non_dist_key('test2'); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: push down of limit count: 3 count --------------------------------------------------------------------- 4 (1 row) EXECUTE inlined_cte_has_parameter_on_non_dist_key('test3'); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: push down of limit count: 3 count --------------------------------------------------------------------- (0 rows) EXECUTE inlined_cte_has_parameter_on_non_dist_key('test4'); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: push down of limit count: 3 count --------------------------------------------------------------------- (0 rows) EXECUTE inlined_cte_has_parameter_on_non_dist_key('test5'); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: push down of limit count: 3 count --------------------------------------------------------------------- 4 (1 row) EXECUTE inlined_cte_has_parameter_on_non_dist_key('test6'); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: push down of limit count: 3 count --------------------------------------------------------------------- (0 rows) EXECUTE inlined_cte_has_parameter_on_dist_key(1); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: push down of limit count: 3 count --------------------------------------------------------------------- 40 40 40 (3 rows) EXECUTE inlined_cte_has_parameter_on_dist_key(2); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: push down of limit count: 3 count --------------------------------------------------------------------- 40 40 (2 rows) EXECUTE inlined_cte_has_parameter_on_dist_key(3); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: push down of limit count: 3 count --------------------------------------------------------------------- 40 40 (2 rows) EXECUTE inlined_cte_has_parameter_on_dist_key(4); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: push down of limit count: 3 count --------------------------------------------------------------------- 40 40 (2 rows) EXECUTE inlined_cte_has_parameter_on_dist_key(5); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: push down of limit count: 3 count --------------------------------------------------------------------- 40 (1 row) EXECUTE inlined_cte_has_parameter_on_dist_key(6); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: push down of limit count: 3 count --------------------------------------------------------------------- 40 (1 row) EXECUTE non_inlined_cte_has_parameter_on_dist_key(1); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for subquery SELECT key, value, other_value FROM cte_inline.test_table WHERE (key OPERATOR(pg_catalog.>) 1) DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT test_table.value, test_table.key, test_table.other_value, cte_1.key, cte_1.other_value FROM (cte_inline.test_table LEFT JOIN (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb)) cte_1 USING (value)) ORDER BY test_table.value DESC, test_table.key DESC, test_table.other_value DESC LIMIT 3 DEBUG: Router planner cannot handle multi-shard select queries DEBUG: push down of limit count: 3 value | key | other_value | key | other_value --------------------------------------------------------------------- test98 | 8 | | 8 | test98 | 8 | | 8 | test98 | 8 | | 8 | (3 rows) EXECUTE non_inlined_cte_has_parameter_on_dist_key(2); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for subquery SELECT key, value, other_value FROM cte_inline.test_table WHERE (key OPERATOR(pg_catalog.>) 2) DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT test_table.value, test_table.key, test_table.other_value, cte_1.key, cte_1.other_value FROM (cte_inline.test_table LEFT JOIN (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb)) cte_1 USING (value)) ORDER BY test_table.value DESC, test_table.key DESC, test_table.other_value DESC LIMIT 3 DEBUG: Router planner cannot handle multi-shard select queries DEBUG: push down of limit count: 3 value | key | other_value | key | other_value --------------------------------------------------------------------- test98 | 8 | | 8 | test98 | 8 | | 8 | test98 | 8 | | 8 | (3 rows) EXECUTE non_inlined_cte_has_parameter_on_dist_key(3); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for subquery SELECT key, value, other_value FROM cte_inline.test_table WHERE (key OPERATOR(pg_catalog.>) 3) DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT test_table.value, test_table.key, test_table.other_value, cte_1.key, cte_1.other_value FROM (cte_inline.test_table LEFT JOIN (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb)) cte_1 USING (value)) ORDER BY test_table.value DESC, test_table.key DESC, test_table.other_value DESC LIMIT 3 DEBUG: Router planner cannot handle multi-shard select queries DEBUG: push down of limit count: 3 value | key | other_value | key | other_value --------------------------------------------------------------------- test98 | 8 | | 8 | test98 | 8 | | 8 | test98 | 8 | | 8 | (3 rows) EXECUTE non_inlined_cte_has_parameter_on_dist_key(4); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for subquery SELECT key, value, other_value FROM cte_inline.test_table WHERE (key OPERATOR(pg_catalog.>) 4) DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT test_table.value, test_table.key, test_table.other_value, cte_1.key, cte_1.other_value FROM (cte_inline.test_table LEFT JOIN (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb)) cte_1 USING (value)) ORDER BY test_table.value DESC, test_table.key DESC, test_table.other_value DESC LIMIT 3 DEBUG: Router planner cannot handle multi-shard select queries DEBUG: push down of limit count: 3 value | key | other_value | key | other_value --------------------------------------------------------------------- test98 | 8 | | 8 | test98 | 8 | | 8 | test98 | 8 | | 8 | (3 rows) EXECUTE non_inlined_cte_has_parameter_on_dist_key(5); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for subquery SELECT key, value, other_value FROM cte_inline.test_table WHERE (key OPERATOR(pg_catalog.>) 5) DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT test_table.value, test_table.key, test_table.other_value, cte_1.key, cte_1.other_value FROM (cte_inline.test_table LEFT JOIN (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb)) cte_1 USING (value)) ORDER BY test_table.value DESC, test_table.key DESC, test_table.other_value DESC LIMIT 3 DEBUG: Router planner cannot handle multi-shard select queries DEBUG: push down of limit count: 3 value | key | other_value | key | other_value --------------------------------------------------------------------- test98 | 8 | | 8 | test98 | 8 | | 8 | test98 | 8 | | 8 | (3 rows) EXECUTE non_inlined_cte_has_parameter_on_dist_key(6); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for subquery SELECT key, value, other_value FROM cte_inline.test_table WHERE (key OPERATOR(pg_catalog.>) 6) DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT test_table.value, test_table.key, test_table.other_value, cte_1.key, cte_1.other_value FROM (cte_inline.test_table LEFT JOIN (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb)) cte_1 USING (value)) ORDER BY test_table.value DESC, test_table.key DESC, test_table.other_value DESC LIMIT 3 DEBUG: Router planner cannot handle multi-shard select queries DEBUG: push down of limit count: 3 value | key | other_value | key | other_value --------------------------------------------------------------------- test98 | 8 | | 8 | test98 | 8 | | 8 | test98 | 8 | | 8 | (3 rows) EXECUTE retry_planning(1); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries json_object_agg --------------------------------------------------------------------- { "2" : "test12", "2" : "test2", "2" : "test22", "2" : "test32", "2" : "test42", "2" : "test52", "2" : "test62", "2" : "test72", "2" : "test82", "2" : "test92", "5" : "test15", "5" : "test25", "5" : "test35", "5" : "test45", "5" : "test5", "5" : "test55", "5" : "test65", "5" : "test75", "5" : "test85", "5" : "test95", "8" : "test18", "8" : "test28", "8" : "test38", "8" : "test48", "8" : "test58", "8" : "test68", "8" : "test78", "8" : "test8", "8" : "test88", "8" : "test98" } (1 row) EXECUTE retry_planning(2); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries json_object_agg --------------------------------------------------------------------- { "5" : "test15", "5" : "test25", "5" : "test35", "5" : "test45", "5" : "test5", "5" : "test55", "5" : "test65", "5" : "test75", "5" : "test85", "5" : "test95", "8" : "test18", "8" : "test28", "8" : "test38", "8" : "test48", "8" : "test58", "8" : "test68", "8" : "test78", "8" : "test8", "8" : "test88", "8" : "test98" } (1 row) EXECUTE retry_planning(3); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries json_object_agg --------------------------------------------------------------------- { "5" : "test15", "5" : "test25", "5" : "test35", "5" : "test45", "5" : "test5", "5" : "test55", "5" : "test65", "5" : "test75", "5" : "test85", "5" : "test95", "8" : "test18", "8" : "test28", "8" : "test38", "8" : "test48", "8" : "test58", "8" : "test68", "8" : "test78", "8" : "test8", "8" : "test88", "8" : "test98" } (1 row) EXECUTE retry_planning(4); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries json_object_agg --------------------------------------------------------------------- { "5" : "test15", "5" : "test25", "5" : "test35", "5" : "test45", "5" : "test5", "5" : "test55", "5" : "test65", "5" : "test75", "5" : "test85", "5" : "test95", "8" : "test18", "8" : "test28", "8" : "test38", "8" : "test48", "8" : "test58", "8" : "test68", "8" : "test78", "8" : "test8", "8" : "test88", "8" : "test98" } (1 row) EXECUTE retry_planning(5); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries json_object_agg --------------------------------------------------------------------- { "8" : "test18", "8" : "test28", "8" : "test38", "8" : "test48", "8" : "test58", "8" : "test68", "8" : "test78", "8" : "test8", "8" : "test88", "8" : "test98" } (1 row) EXECUTE retry_planning(6); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries json_object_agg --------------------------------------------------------------------- { "8" : "test18", "8" : "test28", "8" : "test38", "8" : "test48", "8" : "test58", "8" : "test68", "8" : "test78", "8" : "test8", "8" : "test88", "8" : "test98" } (1 row) WITH b AS (SELECT * FROM test_table) SELECT count(*) FROM (SELECT key as x FROM test_table OFFSET 0) as ref LEFT JOIN b ON (ref.x = b.key); DEBUG: CTE b is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for subquery SELECT key AS x FROM cte_inline.test_table OFFSET 0 DEBUG: recursively planning right side of the left join since the outer side is a recurring rel DEBUG: recursively planning the distributed subquery since it is part of a distributed join node that is outer joined with a recurring rel DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_2 for subquery SELECT key, value, other_value FROM cte_inline.test_table DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT count(*) AS count FROM ((SELECT intermediate_result.x FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(x integer)) ref LEFT JOIN (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_2'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb)) b ON ((ref.x OPERATOR(pg_catalog.=) b.key))) DEBUG: Creating router plan count --------------------------------------------------------------------- 4800 (1 row) -- this becomes a non-colocated subquery join -- because after the CTEs are inlined the joins -- become a non-colocated subquery join WITH a AS (SELECT * FROM test_table), b AS (SELECT * FROM test_table) SELECT count(*) FROM a LEFT JOIN b ON (a.value = b.value); DEBUG: CTE a is going to be inlined via distributed planning DEBUG: CTE b is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for subquery SELECT key, value, other_value FROM cte_inline.test_table DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT count(*) AS count FROM ((SELECT test_table.key, test_table.value, test_table.other_value FROM cte_inline.test_table) a LEFT JOIN (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb)) b ON ((a.value OPERATOR(pg_catalog.=) b.value))) DEBUG: Router planner cannot handle multi-shard select queries count --------------------------------------------------------------------- 480 (1 row) WITH a AS (SELECT * FROM test_table OFFSET 0), b AS (SELECT * FROM test_table) SELECT min(a.key) FROM a LEFT JOIN b ON (a.value = b.value); DEBUG: CTE a is going to be inlined via distributed planning DEBUG: CTE b is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for subquery SELECT key, value, other_value FROM cte_inline.test_table OFFSET 0 DEBUG: recursively planning right side of the left join since the outer side is a recurring rel DEBUG: recursively planning the distributed subquery since it is part of a distributed join node that is outer joined with a recurring rel DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_2 for subquery SELECT key, value, other_value FROM cte_inline.test_table DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT min(a.key) AS min FROM ((SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb)) a LEFT JOIN (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_2'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb)) b ON ((a.value OPERATOR(pg_catalog.=) b.value))) DEBUG: Creating router plan min --------------------------------------------------------------------- 2 (1 row) -- after both CTEs are inlined, this becomes non-colocated subquery join WITH cte_1 AS (SELECT * FROM test_table), cte_2 AS (SELECT * FROM test_table) SELECT * FROM cte_1 JOIN cte_2 ON (cte_1.value > cte_2.value) ORDER BY 1,2,3,4,5,6 DESC LIMIT 3;; DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: CTE cte_2 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for subquery SELECT key, value, other_value FROM cte_inline.test_table DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT cte_1.key, cte_1.value, cte_1.other_value, cte_2.key, cte_2.value, cte_2.other_value FROM ((SELECT test_table.key, test_table.value, test_table.other_value FROM cte_inline.test_table) cte_1 JOIN (SELECT intermediate_result.key, intermediate_result.value, intermediate_result.other_value FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(key integer, value text, other_value jsonb)) cte_2 ON ((cte_1.value OPERATOR(pg_catalog.>) cte_2.value))) ORDER BY cte_1.key, cte_1.value, cte_1.other_value, cte_2.key, cte_2.value, cte_2.other_value DESC LIMIT 3 DEBUG: Router planner cannot handle multi-shard select queries DEBUG: push down of limit count: 3 key | value | other_value | key | value | other_value --------------------------------------------------------------------- 2 | test2 | {"f1": 2, "f2": 36, "f3": "test2"} | 2 | test12 | 2 | test2 | {"f1": 2, "f2": 36, "f3": "test2"} | 2 | test12 | 2 | test2 | {"f1": 2, "f2": 36, "f3": "test2"} | 2 | test12 | (3 rows) -- full join is only supported when both sides are -- recursively planned WITH cte_1 AS (SELECT value FROM test_table WHERE key > 1), cte_2 AS (SELECT value FROM test_table WHERE key > 3) SELECT * FROM cte_1 FULL JOIN cte_2 USING (value) ORDER BY 1 DESC LIMIT 3;; DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: CTE cte_2 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for subquery SELECT value FROM cte_inline.test_table WHERE (key OPERATOR(pg_catalog.>) 3) DEBUG: recursively planning left side of the full join since the other side is a recurring rel DEBUG: recursively planning the distributed subquery since it is part of a distributed join node that is outer joined with a recurring rel DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_2 for subquery SELECT value FROM cte_inline.test_table WHERE (key OPERATOR(pg_catalog.>) 1) DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT value FROM ((SELECT intermediate_result.value FROM read_intermediate_result('XXX_2'::text, 'binary'::citus_copy_format) intermediate_result(value text)) cte_1 FULL JOIN (SELECT intermediate_result.value FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(value text)) cte_2 USING (value)) ORDER BY value DESC LIMIT 3 DEBUG: Creating router plan value --------------------------------------------------------------------- test98 test98 test98 (3 rows) -- an unsupported agg. for multi-shard queries -- so CTE has to be recursively planned WITH cte_1 AS (SELECT * FROM test_table WHERE key > 1) SELECT json_object_agg(DISTINCT key, value) FROM cte_1; DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries json_object_agg --------------------------------------------------------------------- { "2" : "test12", "2" : "test2", "2" : "test22", "2" : "test32", "2" : "test42", "2" : "test52", "2" : "test62", "2" : "test72", "2" : "test82", "2" : "test92", "5" : "test15", "5" : "test25", "5" : "test35", "5" : "test45", "5" : "test5", "5" : "test55", "5" : "test65", "5" : "test75", "5" : "test85", "5" : "test95", "8" : "test18", "8" : "test28", "8" : "test38", "8" : "test48", "8" : "test58", "8" : "test68", "8" : "test78", "8" : "test8", "8" : "test88", "8" : "test98" } (1 row) -- both cte_1 and cte_2 are going to be inlined. -- later, cte_2 is recursively planned since it doesn't have -- GROUP BY but aggragate in a subquery. -- this is an important example of being able to recursively plan -- "some" of the CTEs WITH cte_1 AS (SELECT value FROM test_table WHERE key > 1), cte_2 AS (SELECT max(value) as value FROM test_table WHERE key > 3) SELECT count(*) FROM cte_1 JOIN cte_2 USING (value); DEBUG: CTE cte_1 is going to be inlined via distributed planning DEBUG: CTE cte_2 is going to be inlined via distributed planning DEBUG: Router planner cannot handle multi-shard select queries DEBUG: Router planner cannot handle multi-shard select queries DEBUG: generating subplan XXX_1 for subquery SELECT max(value) AS value FROM cte_inline.test_table WHERE (key OPERATOR(pg_catalog.>) 3) DEBUG: Plan XXX query after replacing subqueries and CTEs: SELECT count(*) AS count FROM ((SELECT test_table.value FROM cte_inline.test_table WHERE (test_table.key OPERATOR(pg_catalog.>) 1)) cte_1 JOIN (SELECT intermediate_result.value FROM read_intermediate_result('XXX_1'::text, 'binary'::citus_copy_format) intermediate_result(value text)) cte_2 USING (value)) DEBUG: Router planner cannot handle multi-shard select queries count --------------------------------------------------------------------- 4 (1 row) -- prevent DROP CASCADE to give notices SET client_min_messages TO ERROR; DROP SCHEMA cte_inline CASCADE;