-- -- MULTI_CREATE_TABLE -- -- Create new table definitions for use in testing in distributed planning and -- execution functionality. Also create indexes to boost performance. Since we -- need to cover both reference join and partitioned join, we have created -- reference and hash-distributed version of orders, customer and part tables. SET citus.next_shard_id TO 360000; CREATE TABLE lineitem ( l_orderkey bigint not null, l_partkey integer not null, l_suppkey integer not null, l_linenumber integer not null, l_quantity decimal(15, 2) not null, l_extendedprice decimal(15, 2) not null, l_discount decimal(15, 2) not null, l_tax decimal(15, 2) not null, l_returnflag char(1) not null, l_linestatus char(1) not null, l_shipdate date not null, l_commitdate date not null, l_receiptdate date not null, l_shipinstruct char(25) not null, l_shipmode char(10) not null, l_comment varchar(44) not null, PRIMARY KEY(l_orderkey, l_linenumber) ); SELECT create_distributed_table('lineitem', 'l_orderkey', 'hash', shard_count := 2); CREATE INDEX lineitem_time_index ON lineitem (l_shipdate); CREATE TABLE orders ( o_orderkey bigint not null, o_custkey integer not null, o_orderstatus char(1) not null, o_totalprice decimal(15,2) not null, o_orderdate date not null, o_orderpriority char(15) not null, o_clerk char(15) not null, o_shippriority integer not null, o_comment varchar(79) not null, PRIMARY KEY(o_orderkey) ); SELECT create_distributed_table('orders', 'o_orderkey', 'hash', colocate_with := 'lineitem'); CREATE TABLE orders_reference ( o_orderkey bigint not null, o_custkey integer not null, o_orderstatus char(1) not null, o_totalprice decimal(15,2) not null, o_orderdate date not null, o_orderpriority char(15) not null, o_clerk char(15) not null, o_shippriority integer not null, o_comment varchar(79) not null, PRIMARY KEY(o_orderkey) ); SELECT create_reference_table('orders_reference'); CREATE TABLE customer ( c_custkey integer not null, c_name varchar(25) not null, c_address varchar(40) not null, c_nationkey integer not null, c_phone char(15) not null, c_acctbal decimal(15,2) not null, c_mktsegment char(10) not null, c_comment varchar(117) not null); SELECT create_reference_table('customer'); CREATE TABLE customer_append ( c_custkey integer not null, c_name varchar(25) not null, c_address varchar(40) not null, c_nationkey integer not null, c_phone char(15) not null, c_acctbal decimal(15,2) not null, c_mktsegment char(10) not null, c_comment varchar(117) not null); SELECT create_distributed_table('customer_append', 'c_custkey', 'append'); SELECT master_create_empty_shard('customer_append'); CREATE TABLE nation ( n_nationkey integer not null, n_name char(25) not null, n_regionkey integer not null, n_comment varchar(152)); SELECT create_reference_table('nation'); CREATE TABLE part ( p_partkey integer not null, p_name varchar(55) not null, p_mfgr char(25) not null, p_brand char(10) not null, p_type varchar(25) not null, p_size integer not null, p_container char(10) not null, p_retailprice decimal(15,2) not null, p_comment varchar(23) not null); SELECT create_reference_table('part'); CREATE TABLE part_append ( p_partkey integer not null, p_name varchar(55) not null, p_mfgr char(25) not null, p_brand char(10) not null, p_type varchar(25) not null, p_size integer not null, p_container char(10) not null, p_retailprice decimal(15,2) not null, p_comment varchar(23) not null); SELECT create_distributed_table('part_append', 'p_partkey', 'append'); SELECT master_create_empty_shard('part_append'); CREATE TABLE supplier ( s_suppkey integer not null, s_name char(25) not null, s_address varchar(40) not null, s_nationkey integer, s_phone char(15) not null, s_acctbal decimal(15,2) not null, s_comment varchar(101) not null ); SELECT create_reference_table('supplier'); -- create a single shard supplier table which is not -- a reference table CREATE TABLE supplier_single_shard ( s_suppkey integer not null, s_name char(25) not null, s_address varchar(40) not null, s_nationkey integer, s_phone char(15) not null, s_acctbal decimal(15,2) not null, s_comment varchar(101) not null ); SELECT create_distributed_table('supplier_single_shard', 's_suppkey', 'hash', shard_count := 1); CREATE TABLE mx_table_test (col1 int, col2 text); SET citus.next_shard_id TO 360013; -- Test initial data loading CREATE TABLE data_load_test (col1 int, col2 text, col3 serial); INSERT INTO data_load_test VALUES (132, 'hello'); INSERT INTO data_load_test VALUES (243, 'world'); -- table must be empty when using append- or range-partitioning SELECT create_distributed_table('data_load_test', 'col1', 'append'); SELECT create_distributed_table('data_load_test', 'col1', 'range'); -- create_distributed_table creates shards and copies data into the distributed table SELECT create_distributed_table('data_load_test', 'col1'); SELECT * FROM data_load_test ORDER BY col1; DROP TABLE data_load_test; -- test queries on distributed tables with no shards CREATE TABLE no_shard_test (col1 int, col2 text); SELECT create_distributed_table('no_shard_test', 'col1', 'append'); SELECT * FROM no_shard_test WHERE col1 > 1; DROP TABLE no_shard_test; CREATE TABLE no_shard_test (col1 int, col2 text); SELECT create_distributed_table('no_shard_test', 'col1', 'range'); SELECT * FROM no_shard_test WHERE col1 > 1; DROP TABLE no_shard_test; -- ensure writes in the same transaction as create_distributed_table are visible BEGIN; CREATE TABLE data_load_test (col1 int, col2 text, col3 serial); INSERT INTO data_load_test VALUES (132, 'hello'); SELECT create_distributed_table('data_load_test', 'col1'); INSERT INTO data_load_test VALUES (243, 'world'); END; SELECT * FROM data_load_test ORDER BY col1; DROP TABLE data_load_test; -- creating co-located distributed tables in the same transaction works BEGIN; CREATE TABLE data_load_test1 (col1 int, col2 text, col3 serial); INSERT INTO data_load_test1 VALUES (132, 'hello'); SELECT create_distributed_table('data_load_test1', 'col1'); CREATE TABLE data_load_test2 (col1 int, col2 text, col3 serial); INSERT INTO data_load_test2 VALUES (132, 'world'); SELECT create_distributed_table('data_load_test2', 'col1'); SELECT a.col2 ||' '|| b.col2 FROM data_load_test1 a JOIN data_load_test2 b USING (col1) WHERE col1 = 132; DROP TABLE data_load_test1, data_load_test2; END; -- distributing catalog tables is not supported SELECT create_distributed_table('pg_class', 'relname'); SELECT create_reference_table('pg_class'); -- test shard_count parameter -- first set citus.shard_count so we know the parameter works SET citus.shard_count TO 10; CREATE TABLE shard_count_table (a INT, b TEXT); CREATE TABLE shard_count_table_2 (a INT, b TEXT); SELECT create_distributed_table('shard_count_table', 'a', shard_count:=5); SELECT shard_count FROM citus_tables WHERE table_name::text = 'shard_count_table'; SELECT create_distributed_table('shard_count_table_2', 'a', shard_count:=0); SELECT create_distributed_table('shard_count_table_2', 'a', shard_count:=-100); SELECT create_distributed_table('shard_count_table_2', 'a', shard_count:=64001); -- shard count with colocate with table should error SELECT create_distributed_table('shard_count_table_2', 'a', shard_count:=12, colocate_with:='shard_count'); -- none should not error SELECT create_distributed_table('shard_count_table_2', 'a', shard_count:=12, colocate_with:='none'); DROP TABLE shard_count_table, shard_count_table_2; -- test shard splitting doesn't break shard_count parameter -- when shard count is given table needs to have exactly that -- many shards, regardless of shard splitting on other tables -- ensure there is no colocation group with 9 shards SELECT count(*) FROM pg_dist_colocation WHERE shardcount = 9; SET citus.shard_count TO 9; SET citus.shard_replication_factor TO 1; CREATE TABLE shard_split_table (a int, b int); SELECT create_distributed_table ('shard_split_table', 'a'); SELECT 1 FROM isolate_tenant_to_new_shard('shard_split_table', 5, shard_transfer_mode => 'block_writes'); -- show the difference in pg_dist_colocation and citus_tables shard counts SELECT ( SELECT shardcount FROM pg_dist_colocation WHERE colocationid IN ( SELECT colocation_id FROM citus_tables WHERE table_name = 'shard_split_table'::regclass ) ) AS "pg_dist_colocation", (SELECT shard_count FROM citus_tables WHERE table_name = 'shard_split_table'::regclass) AS "citus_tables"; CREATE TABLE shard_split_table_2 (a int, b int); SELECT create_distributed_table ('shard_split_table_2', 'a', shard_count:=9); SELECT a.colocation_id = b.colocation_id FROM citus_tables a, citus_tables b WHERE a.table_name = 'shard_split_table'::regclass AND b.table_name = 'shard_split_table_2'::regclass; SELECT shard_count FROM citus_tables WHERE table_name = 'shard_split_table_2'::regclass; -- also check we don't break regular behaviour CREATE TABLE shard_split_table_3 (a int, b int); SELECT create_distributed_table ('shard_split_table_3', 'a'); SELECT a.colocation_id = b.colocation_id FROM citus_tables a, citus_tables b WHERE a.table_name = 'shard_split_table'::regclass AND b.table_name = 'shard_split_table_3'::regclass; SELECT shard_count FROM citus_tables WHERE table_name = 'shard_split_table_3'::regclass; DROP TABLE shard_split_table, shard_split_table_2, shard_split_table_3; -- test a shard count with an empty default colocation group -- ensure there is no colocation group with 13 shards SELECT count(*) FROM pg_dist_colocation WHERE shardcount = 13; SET citus.shard_count TO 13; CREATE TABLE shard_count_drop_table (a int); SELECT create_distributed_table('shard_count_drop_table', 'a'); DROP TABLE shard_count_drop_table; CREATE TABLE shard_count_table_3 (a int); SELECT create_distributed_table('shard_count_table_3', 'a', shard_count:=13); SELECT shardcount FROM pg_dist_colocation WHERE colocationid IN ( SELECT colocation_id FROM citus_tables WHERE table_name = 'shard_count_table_3'::regclass ); CREATE TEMP TABLE temp_table(a int); -- make sure temp table cannot be distributed and we give a good error select create_distributed_table('temp_table', 'a'); select create_reference_table('temp_table'); DROP TABLE temp_table; DROP TABLE shard_count_table_3; -- test shard count 1 placement with colocate none. -- create a base table instance set citus.enable_single_shard_table_multi_node_placement to on; CREATE TABLE shard_count_table_1_inst_1 (a int); SELECT create_distributed_table('shard_count_table_1_inst_1', 'a', shard_count:=1, colocate_with:='none'); -- create another table with similar requirements CREATE TABLE shard_count_table_1_inst_2 (a int); SELECT create_distributed_table('shard_count_table_1_inst_2', 'a', shard_count:=1, colocate_with:='none'); -- Now check placement: SELECT (SELECT colocation_id FROM citus_tables WHERE table_name = 'shard_count_table_1_inst_1'::regclass) != (SELECT colocation_id FROM citus_tables WHERE table_name = 'shard_count_table_1_inst_2'::regclass); -- double check shard counts SELECT (SELECT shard_count FROM citus_tables WHERE table_name = 'shard_count_table_1_inst_1'::regclass) = (SELECT shard_count FROM citus_tables WHERE table_name = 'shard_count_table_1_inst_2'::regclass); SELECT shard_count = 1 FROM citus_tables WHERE table_name = 'shard_count_table_1_inst_1'::regclass; -- check placement: These should be placed on different workers. SELECT nodename || ':' || nodeport AS inst_1_node_endpoint FROM citus_shards WHERE table_name = 'shard_count_table_1_inst_1'::regclass \gset SELECT nodename || ':' || nodeport AS inst_2_node_endpoint FROM citus_shards WHERE table_name = 'shard_count_table_1_inst_2'::regclass \gset SELECT :'inst_1_node_endpoint', :'inst_2_node_endpoint', :'inst_1_node_endpoint' = :'inst_2_node_endpoint'; DROP TABLE shard_count_table_1_inst_1; DROP TABLE shard_count_table_1_inst_2;