citus/src/test/regress/expected/tdigest_aggregate_support_0...

235 lines
13 KiB
Plaintext

--
-- TDIGEST_AGGREGATE_SUPPORT
-- test the integration of github.com/tvondra/tdigest aggregates into the citus planner
-- for push down parts of the aggregate to use parallelized execution and reduced data
-- transfer sizes for aggregates not grouped by the distribution column
--
SET citus.next_shard_id TO 20070000;
CREATE SCHEMA tdigest_aggregate_support;
SET search_path TO tdigest_aggregate_support, public;
-- create the tdigest extension when installed
SELECT CASE WHEN COUNT(*) > 0
THEN 'CREATE EXTENSION tdigest WITH SCHEMA public'
ELSE 'SELECT false AS tdigest_present' END
AS create_cmd FROM pg_available_extensions()
WHERE name = 'tdigest'
\gset
:create_cmd;
tdigest_present
---------------------------------------------------------------------
f
(1 row)
SET citus.shard_count TO 4;
SET citus.coordinator_aggregation_strategy TO 'disabled'; -- prevent aggregate execution when the aggregate can't be pushed down
CREATE TABLE latencies (a int, b int, latency double precision);
SELECT create_distributed_table('latencies', 'a');
create_distributed_table
---------------------------------------------------------------------
(1 row)
SELECT setseed(0.42); -- make the random data inserted deterministic
setseed
---------------------------------------------------------------------
(1 row)
INSERT INTO latencies
SELECT (random()*20)::int AS a,
(random()*20)::int AS b,
random()*10000.0 AS latency
FROM generate_series(1, 10000);
-- explain no grouping to verify partially pushed down for tdigest(value, compression)
EXPLAIN (COSTS OFF, VERBOSE)
SELECT tdigest(latency, 100)
FROM latencies;
ERROR: function tdigest(double precision, integer) does not exist
HINT: No function matches the given name and argument types. You might need to add explicit type casts.
-- explain grouping by distribution column is completely pushed down for tdigest(value, compression)
EXPLAIN (COSTS OFF, VERBOSE)
SELECT a, tdigest(latency, 100)
FROM latencies
GROUP BY a;
ERROR: function tdigest(double precision, integer) does not exist
HINT: No function matches the given name and argument types. You might need to add explicit type casts.
-- explain grouping by non-distribution column is partially pushed down for tdigest(value, compression)
EXPLAIN (COSTS OFF, VERBOSE)
SELECT b, tdigest(latency, 100)
FROM latencies
GROUP BY b;
ERROR: function tdigest(double precision, integer) does not exist
HINT: No function matches the given name and argument types. You might need to add explicit type casts.
-- explain no grouping to verify partially pushed down for tdigest_precentile(value, compression, quantile)
EXPLAIN (COSTS OFF, VERBOSE)
SELECT tdigest_percentile(latency, 100, 0.99)
FROM latencies;
ERROR: function tdigest_percentile(double precision, integer, numeric) does not exist
HINT: No function matches the given name and argument types. You might need to add explicit type casts.
-- explain grouping by distribution column is completely pushed down for tdigest_precentile(value, compression, quantile)
EXPLAIN (COSTS OFF, VERBOSE)
SELECT a, tdigest_percentile(latency, 100, 0.99)
FROM latencies
GROUP BY a;
ERROR: function tdigest_percentile(double precision, integer, numeric) does not exist
HINT: No function matches the given name and argument types. You might need to add explicit type casts.
-- explain grouping by non-distribution column is partially pushed down for tdigest_precentile(value, compression, quantile)
EXPLAIN (COSTS OFF, VERBOSE)
SELECT b, tdigest_percentile(latency, 100, 0.99)
FROM latencies
GROUP BY b;
ERROR: function tdigest_percentile(double precision, integer, numeric) does not exist
HINT: No function matches the given name and argument types. You might need to add explicit type casts.
-- explain no grouping to verify partially pushed down for tdigest_precentile(value, compression, quantiles[])
EXPLAIN (COSTS OFF, VERBOSE)
SELECT tdigest_percentile(latency, 100, ARRAY[0.99, 0.95])
FROM latencies;
ERROR: function tdigest_percentile(double precision, integer, numeric[]) does not exist
HINT: No function matches the given name and argument types. You might need to add explicit type casts.
-- explain grouping by distribution column is completely pushed down for tdigest_precentile(value, compression, quantiles[])
EXPLAIN (COSTS OFF, VERBOSE)
SELECT a, tdigest_percentile(latency, 100, ARRAY[0.99, 0.95])
FROM latencies
GROUP BY a;
ERROR: function tdigest_percentile(double precision, integer, numeric[]) does not exist
HINT: No function matches the given name and argument types. You might need to add explicit type casts.
-- explain grouping by non-distribution column is partially pushed down for tdigest_precentile(value, compression, quantiles[])
EXPLAIN (COSTS OFF, VERBOSE)
SELECT b, tdigest_percentile(latency, 100, ARRAY[0.99, 0.95])
FROM latencies
GROUP BY b;
ERROR: function tdigest_percentile(double precision, integer, numeric[]) does not exist
HINT: No function matches the given name and argument types. You might need to add explicit type casts.
-- explain no grouping to verify partially pushed down for tdigest_precentile_of(value, compression, hypotetical_value)
EXPLAIN (COSTS OFF, VERBOSE)
SELECT tdigest_percentile_of(latency, 100, 9000)
FROM latencies;
ERROR: function tdigest_percentile_of(double precision, integer, integer) does not exist
HINT: No function matches the given name and argument types. You might need to add explicit type casts.
-- explain grouping by distribution column is completely pushed down for tdigest_precentile_of(value, compression, hypotetical_value)
EXPLAIN (COSTS OFF, VERBOSE)
SELECT a, tdigest_percentile_of(latency, 100, 9000)
FROM latencies
GROUP BY a;
ERROR: function tdigest_percentile_of(double precision, integer, integer) does not exist
HINT: No function matches the given name and argument types. You might need to add explicit type casts.
-- explain grouping by non-distribution column is partially pushed down for tdigest_precentile_of(value, compression, hypotetical_value)
EXPLAIN (COSTS OFF, VERBOSE)
SELECT b, tdigest_percentile_of(latency, 100, 9000)
FROM latencies
GROUP BY b;
ERROR: function tdigest_percentile_of(double precision, integer, integer) does not exist
HINT: No function matches the given name and argument types. You might need to add explicit type casts.
-- explain no grouping to verify partially pushed down for tdigest_precentile_of(value, compression, hypotetical_values[])
EXPLAIN (COSTS OFF, VERBOSE)
SELECT tdigest_percentile_of(latency, 100, ARRAY[9000, 9500])
FROM latencies;
ERROR: function tdigest_percentile_of(double precision, integer, integer[]) does not exist
HINT: No function matches the given name and argument types. You might need to add explicit type casts.
-- explain grouping by distribution column is completely pushed down for tdigest_precentile_of(value, compression, hypotetical_values[])
EXPLAIN (COSTS OFF, VERBOSE)
SELECT a, tdigest_percentile_of(latency, 100, ARRAY[9000, 9500])
FROM latencies
GROUP BY a;
ERROR: function tdigest_percentile_of(double precision, integer, integer[]) does not exist
HINT: No function matches the given name and argument types. You might need to add explicit type casts.
-- explain grouping by non-distribution column is partially pushed down for tdigest_precentile_of(value, compression, hypotetical_values[])
EXPLAIN (COSTS OFF, VERBOSE)
SELECT b, tdigest_percentile_of(latency, 100, ARRAY[9000, 9500])
FROM latencies
GROUP BY b;
ERROR: function tdigest_percentile_of(double precision, integer, integer[]) does not exist
HINT: No function matches the given name and argument types. You might need to add explicit type casts.
-- verifying results - should be stable due to seed while inserting the data, if failure due to data these queries could be removed or check for certain ranges
SELECT tdigest(latency, 100) FROM latencies;
ERROR: function tdigest(double precision, integer) does not exist
HINT: No function matches the given name and argument types. You might need to add explicit type casts.
SELECT tdigest_percentile(latency, 100, 0.99) FROM latencies;
ERROR: function tdigest_percentile(double precision, integer, numeric) does not exist
HINT: No function matches the given name and argument types. You might need to add explicit type casts.
SELECT tdigest_percentile(latency, 100, ARRAY[0.99, 0.95]) FROM latencies;
ERROR: function tdigest_percentile(double precision, integer, numeric[]) does not exist
HINT: No function matches the given name and argument types. You might need to add explicit type casts.
SELECT tdigest_percentile_of(latency, 100, 9000) FROM latencies;
ERROR: function tdigest_percentile_of(double precision, integer, integer) does not exist
HINT: No function matches the given name and argument types. You might need to add explicit type casts.
SELECT tdigest_percentile_of(latency, 100, ARRAY[9000, 9500]) FROM latencies;
ERROR: function tdigest_percentile_of(double precision, integer, integer[]) does not exist
HINT: No function matches the given name and argument types. You might need to add explicit type casts.
CREATE TABLE latencies_rollup (a int, tdigest tdigest);
ERROR: type "tdigest" does not exist
SELECT create_distributed_table('latencies_rollup', 'a', colocate_with => 'latencies');
ERROR: relation "latencies_rollup" does not exist
INSERT INTO latencies_rollup
SELECT a, tdigest(latency, 100)
FROM latencies
GROUP BY a;
ERROR: relation "latencies_rollup" does not exist
EXPLAIN (COSTS OFF, VERBOSE)
SELECT tdigest(tdigest)
FROM latencies_rollup;
ERROR: relation "latencies_rollup" does not exist
-- explain grouping by distribution column is completely pushed down for tdigest(tdigest)
EXPLAIN (COSTS OFF, VERBOSE)
SELECT a, tdigest(tdigest)
FROM latencies_rollup
GROUP BY a;
ERROR: relation "latencies_rollup" does not exist
-- explain no grouping to verify partially pushed down for tdigest_precentile(tdigest, quantile)
EXPLAIN (COSTS OFF, VERBOSE)
SELECT tdigest_percentile(tdigest, 0.99)
FROM latencies_rollup;
ERROR: relation "latencies_rollup" does not exist
-- explain grouping by distribution column is completely pushed down for tdigest_precentile(tdigest, quantile)
EXPLAIN (COSTS OFF, VERBOSE)
SELECT a, tdigest_percentile(tdigest, 0.99)
FROM latencies_rollup
GROUP BY a;
ERROR: relation "latencies_rollup" does not exist
-- explain no grouping to verify partially pushed down for tdigest_precentile(value, compression, quantiles[])
EXPLAIN (COSTS OFF, VERBOSE)
SELECT tdigest_percentile(tdigest, ARRAY[0.99, 0.95])
FROM latencies_rollup;
ERROR: relation "latencies_rollup" does not exist
-- explain grouping by distribution column is completely pushed down for tdigest_precentile(value, compression, quantiles[])
EXPLAIN (COSTS OFF, VERBOSE)
SELECT a, tdigest_percentile(tdigest, ARRAY[0.99, 0.95])
FROM latencies_rollup
GROUP BY a;
ERROR: relation "latencies_rollup" does not exist
-- explain no grouping to verify partially pushed down for tdigest_precentile_of(value, compression, hypotetical_value)
EXPLAIN (COSTS OFF, VERBOSE)
SELECT tdigest_percentile_of(tdigest, 9000)
FROM latencies_rollup;
ERROR: relation "latencies_rollup" does not exist
-- explain grouping by distribution column is completely pushed down for tdigest_precentile_of(value, compression, hypotetical_value)
EXPLAIN (COSTS OFF, VERBOSE)
SELECT a, tdigest_percentile_of(tdigest, 9000)
FROM latencies_rollup
GROUP BY a;
ERROR: relation "latencies_rollup" does not exist
-- explain no grouping to verify partially pushed down for tdigest_precentile_of(value, compression, hypotetical_values[])
EXPLAIN (COSTS OFF, VERBOSE)
SELECT tdigest_percentile_of(tdigest, ARRAY[9000, 9500])
FROM latencies_rollup;
ERROR: relation "latencies_rollup" does not exist
-- explain grouping by distribution column is completely pushed down for tdigest_precentile_of(value, compression, hypotetical_values[])
EXPLAIN (COSTS OFF, VERBOSE)
SELECT a, tdigest_percentile_of(tdigest, ARRAY[9000, 9500])
FROM latencies_rollup
GROUP BY a;
ERROR: relation "latencies_rollup" does not exist
-- verifying results - should be stable due to seed while inserting the data, if failure due to data these queries could be removed or check for certain ranges
SELECT tdigest(tdigest) FROM latencies_rollup;
ERROR: relation "latencies_rollup" does not exist
SELECT tdigest_percentile(tdigest, 0.99) FROM latencies_rollup;
ERROR: relation "latencies_rollup" does not exist
SELECT tdigest_percentile(tdigest, ARRAY[0.99, 0.95]) FROM latencies_rollup;
ERROR: relation "latencies_rollup" does not exist
SELECT tdigest_percentile_of(tdigest, 9000) FROM latencies_rollup;
ERROR: relation "latencies_rollup" does not exist
SELECT tdigest_percentile_of(tdigest, ARRAY[9000, 9500]) FROM latencies_rollup;
ERROR: relation "latencies_rollup" does not exist
SET client_min_messages TO WARNING; -- suppress cascade messages
DROP SCHEMA tdigest_aggregate_support CASCADE;