-- Test passing off function call to mx workers CREATE SCHEMA multi_mx_function_call_delegation; SET search_path TO multi_mx_function_call_delegation, public; \set VERBOSITY terse SET citus.shard_replication_factor TO 2; -- This table requires specific settings, create before getting into things create table mx_call_dist_table_replica(id int, val int); select create_distributed_table('mx_call_dist_table_replica', 'id'); insert into mx_call_dist_table_replica values (9,1),(8,2),(7,3),(6,4),(5,5); SET citus.shard_replication_factor TO 1; -- -- Create tables and functions we want to use in tests -- create table mx_call_dist_table_1(id int, val int); select create_distributed_table('mx_call_dist_table_1', 'id'); insert into mx_call_dist_table_1 values (3,1),(4,5),(9,2),(6,5),(3,5); create table mx_call_dist_table_2(id int, val int); select create_distributed_table('mx_call_dist_table_2', 'id'); insert into mx_call_dist_table_2 values (1,1),(1,2),(2,2),(3,3),(3,4); create table mx_call_dist_table_bigint(id bigint, val bigint); select create_distributed_table('mx_call_dist_table_bigint', 'id'); insert into mx_call_dist_table_bigint values (1,1),(1,2),(2,2),(3,3),(3,4); create table mx_call_dist_table_single_shard(id int, val int); select create_distributed_table('mx_call_dist_table_single_shard', null); insert into mx_call_dist_table_single_shard values (2,7),(1,8),(2,8),(1,8),(2,8); create table mx_call_dist_table_ref(id int, val int); select create_reference_table('mx_call_dist_table_ref'); insert into mx_call_dist_table_ref values (2,7),(1,8),(2,8),(1,8),(2,8); create type mx_call_enum as enum ('A', 'S', 'D', 'F'); create table mx_call_dist_table_enum(id int, key mx_call_enum); select create_distributed_table('mx_call_dist_table_enum', 'key'); insert into mx_call_dist_table_enum values (1,'S'),(2,'A'),(3,'D'),(4,'F'); CREATE FUNCTION squares(int) RETURNS SETOF RECORD AS $$ SELECT i, i * i FROM generate_series(1, $1) i $$ LANGUAGE SQL; CREATE FUNCTION mx_call_func(x int, INOUT y int) LANGUAGE plpgsql AS $$ BEGIN -- groupid is 0 in coordinator and non-zero in workers, so by using it here -- we make sure the function is being executed in the worker. y := x + (select case groupid when 0 then 1 else 0 end from pg_dist_local_group); -- we also make sure that we can run distributed queries in the functions -- that are routed to the workers. y := y + (select sum(t1.val + t2.val) from multi_mx_function_call_delegation.mx_call_dist_table_1 t1 join multi_mx_function_call_delegation.mx_call_dist_table_2 t2 on t1.id = t2.id); END;$$; CREATE FUNCTION mx_call_func_bigint(x bigint, INOUT y bigint) LANGUAGE plpgsql AS $$ BEGIN y := x + y * 2; END;$$; CREATE FUNCTION mx_call_func_bigint_force(x bigint, INOUT y bigint) LANGUAGE plpgsql AS $$ BEGIN PERFORM multi_mx_function_call_delegation.mx_call_func_bigint(x, y); END;$$; -- create another function which verifies: -- 1. we work fine with multiple return columns -- 2. we work fine in combination with custom types CREATE FUNCTION mx_call_func_custom_types(INOUT x mx_call_enum, INOUT y mx_call_enum) LANGUAGE plpgsql AS $$ BEGIN y := x; x := (select case groupid when 0 then 'F' else 'S' end from pg_dist_local_group); END;$$; -- function which internally uses COPY protocol without remote execution CREATE FUNCTION mx_call_func_copy(x int) RETURNS bool LANGUAGE plpgsql AS $$ BEGIN INSERT INTO multi_mx_function_call_delegation.mx_call_dist_table_1 SELECT s,s FROM generate_series(100, 110) s; RETURN true; END;$$; -- Test that undistributed functions have no issue executing select multi_mx_function_call_delegation.mx_call_func(2, 0); select multi_mx_function_call_delegation.mx_call_func_custom_types('S', 'A'); select multi_mx_function_call_delegation.mx_call_copy(2); select squares(4); -- Same for unqualified name select mx_call_func(2, 0); -- Mark both functions as distributed ... select create_distributed_function('mx_call_func(int,int)'); select create_distributed_function('mx_call_func_bigint(bigint,bigint)'); select create_distributed_function('mx_call_func_custom_types(mx_call_enum,mx_call_enum)'); select create_distributed_function('mx_call_func_copy(int)'); select create_distributed_function('squares(int)'); -- We still don't route them to the workers, because they aren't -- colocated with any distributed tables. SET client_min_messages TO DEBUG1; select mx_call_func(2, 0); select multi_mx_function_call_delegation.mx_call_func_bigint(4, 2); select mx_call_func_custom_types('S', 'A'); -- Mark them as colocated with a table. Now we should route them to workers. select colocate_proc_with_table('mx_call_func', 'mx_call_dist_table_1'::regclass, 1); select colocate_proc_with_table('mx_call_func_custom_types', 'mx_call_dist_table_enum'::regclass, 1); select colocate_proc_with_table('squares', 'mx_call_dist_table_2'::regclass, 0); select create_distributed_function('mx_call_func_bigint(bigint,bigint)', 'x', colocate_with := 'mx_call_dist_table_bigint'); -- set up a force_delegation function select create_distributed_function('mx_call_func_bigint_force(bigint,bigint)', 'x', colocate_with := 'mx_call_dist_table_2', force_delegation := true); select mx_call_func(2, 0); select mx_call_func_bigint(4, 2); select mx_call_func_custom_types('S', 'A'); select squares(4); select multi_mx_function_call_delegation.mx_call_func(2, 0); select multi_mx_function_call_delegation.mx_call_func_custom_types('S', 'A'); SET citus.enable_binary_protocol = TRUE; select mx_call_func_custom_types('S', 'A'); select multi_mx_function_call_delegation.mx_call_func_custom_types('S', 'A'); RESET citus.enable_binary_protocol; -- We don't allow distributing calls inside transactions begin; select mx_call_func(2, 0); commit; -- Drop the table colocated with mx_call_func_custom_types. Now it shouldn't -- be routed to workers anymore. SET client_min_messages TO NOTICE; drop table mx_call_dist_table_enum; SET client_min_messages TO DEBUG1; select mx_call_func_custom_types('S', 'A'); -- Make sure we do bounds checking on distributed argument index -- This also tests that we have cache invalidation for pg_dist_object updates select colocate_proc_with_table('mx_call_func', 'mx_call_dist_table_1'::regclass, -1); select mx_call_func(2, 0); select colocate_proc_with_table('mx_call_func', 'mx_call_dist_table_1'::regclass, 2); select mx_call_func(2, 0); -- We don't currently support colocating with reference tables select colocate_proc_with_table('mx_call_func', 'mx_call_dist_table_ref'::regclass, 1); select mx_call_func(2, 0); -- We support colocating with single shard tables select colocate_proc_with_table('mx_call_func', 'mx_call_dist_table_single_shard'::regclass, 1); select mx_call_func(2, 0); -- We don't currently support colocating with replicated tables select colocate_proc_with_table('mx_call_func', 'mx_call_dist_table_replica'::regclass, 1); select mx_call_func(2, 0); SET client_min_messages TO NOTICE; drop table mx_call_dist_table_replica; SET client_min_messages TO DEBUG1; select colocate_proc_with_table('mx_call_func', 'mx_call_dist_table_1'::regclass, 1); -- Test table returning functions. CREATE FUNCTION mx_call_func_tbl(x int) RETURNS TABLE (p0 int, p1 int) LANGUAGE plpgsql AS $$ BEGIN INSERT INTO multi_mx_function_call_delegation.mx_call_dist_table_1 VALUES (x, -1), (x+1, 4); UPDATE multi_mx_function_call_delegation.mx_call_dist_table_1 SET val = val+1 WHERE id >= x; UPDATE multi_mx_function_call_delegation.mx_call_dist_table_1 SET val = val-1 WHERE id >= x; RETURN QUERY SELECT id, val FROM multi_mx_function_call_delegation.mx_call_dist_table_1 t WHERE id >= x ORDER BY 1, 2; END;$$; -- before distribution ... select mx_call_func_tbl(10); -- after distribution ... select create_distributed_function('mx_call_func_tbl(int)', '$1', 'mx_call_dist_table_1'); select mx_call_func_tbl(20); -- Test that we properly propagate errors raised from procedures. CREATE FUNCTION mx_call_func_raise(x int) RETURNS void LANGUAGE plpgsql AS $$ BEGIN RAISE WARNING 'warning'; RAISE EXCEPTION 'error'; END;$$; select create_distributed_function('mx_call_func_raise(int)', '$1', 'mx_call_dist_table_1'); \set VERBOSITY terse select mx_call_func_raise(2); \set VERBOSITY default -- Don't push-down when doing INSERT INTO ... SELECT func(); SET client_min_messages TO ERROR; CREATE TABLE test (x int primary key); SELECT create_distributed_table('test','x'); CREATE OR REPLACE FUNCTION delegated_function(a int) RETURNS int LANGUAGE plpgsql AS $function$ DECLARE BEGIN INSERT INTO multi_mx_function_call_delegation.test VALUES (a); INSERT INTO multi_mx_function_call_delegation.test VALUES (a + 1); RETURN a+2; END; $function$; SELECT create_distributed_function('delegated_function(int)', 'a'); SET client_min_messages TO DEBUG1; INSERT INTO test SELECT delegated_function(1); -- Don't push down in subqueries or CTEs. SELECT * FROM test WHERE not exists( SELECT delegated_function(4) ); WITH r AS ( SELECT delegated_function(7) ) SELECT * FROM test WHERE (SELECT count(*)=0 FROM r); WITH r AS ( SELECT delegated_function(10) ), t AS ( SELECT count(*) c FROM r ) SELECT * FROM test, t WHERE t.c=0; WITH r AS ( SELECT count(*) FROM test ), s AS ( SELECT delegated_function(13) ), t AS ( SELECT count(*) c FROM s ) SELECT * FROM test, r, t WHERE t.c=0; -- Test that we don't propagate to non-metadata worker nodes SET client_min_messages TO WARNING; select stop_metadata_sync_to_node('localhost', :worker_1_port); select stop_metadata_sync_to_node('localhost', :worker_2_port); SET client_min_messages TO DEBUG1; select mx_call_func(2, 0); SET client_min_messages TO NOTICE; select start_metadata_sync_to_node('localhost', :worker_1_port); select start_metadata_sync_to_node('localhost', :worker_2_port); -- stop_metadata_sync_to_node()/start_metadata_sync_to_node() might make -- worker backend caches inconsistent. Reconnect to coordinator to use -- new worker connections, hence new backends. \c - - - :master_port \set VERBOSITY terse SET search_path to multi_mx_function_call_delegation, public; SET client_min_messages TO DEBUG1; SET citus.shard_replication_factor = 1; -- -- Test non-const parameter values -- CREATE FUNCTION mx_call_add(int, int) RETURNS int AS 'select $1 + $2;' LANGUAGE SQL IMMUTABLE; SELECT create_distributed_function('mx_call_add(int,int)', '$1'); -- subquery parameters cannot be pushed down select mx_call_func((select x + 1 from mx_call_add(3, 4) x), 2); -- volatile parameter cannot be pushed down select mx_call_func(floor(random())::int, 2); -- test forms we don't distribute select mx_call_func(2, 0) where mx_call_func(0, 2) = 0; select mx_call_func(2, 0), mx_call_func(0, 2); -- regular call in FROM can be pushed down select * from mx_call_func(2, 0); -- prepared statement with 6 invocations to trigger generic plan prepare call_func(int, int) as select $1 from mx_call_func($1, $2); execute call_func(2, 0); execute call_func(2, 0); execute call_func(2, 0); execute call_func(2, 0); execute call_func(2, 0); execute call_func(2, 0); -- we do not delegate the call, but do push down the query -- that result in remote execution from workers select mx_call_func(id, 0) from mx_call_dist_table_1; select mx_call_func(2, 0) from mx_call_dist_table_1 where id = 3; select mx_call_func_copy(2) from mx_call_dist_table_1 where id = 3; DO $$ BEGIN perform mx_call_func_tbl(40); END; $$; SELECT * FROM mx_call_dist_table_1 WHERE id >= 40 ORDER BY id, val; -- Prepared statements. Repeat 8 times to test for generic plans PREPARE call_plan (int, int) AS SELECT mx_call_func($1, $2); EXECUTE call_plan(2, 0); EXECUTE call_plan(2, 0); EXECUTE call_plan(2, 0); EXECUTE call_plan(2, 0); EXECUTE call_plan(2, 0); EXECUTE call_plan(2, 0); EXECUTE call_plan(2, 0); EXECUTE call_plan(2, 0); \c - - - :worker_1_port \set VERBOSITY terse SET search_path TO multi_mx_function_call_delegation, public; -- create_distributed_function is disallowed from worker nodes select create_distributed_function('mx_call_func(int,int)'); -- show that functions can be delegated from worker nodes SET client_min_messages TO DEBUG1; SELECT mx_call_func(2, 0); -- not delegated in a transaction block BEGIN; SELECT mx_call_func(2, 0); END; -- not delegated in a DO block DO $$ BEGIN PERFORM mx_call_func(2, 0); END; $$ LANGUAGE plpgsql; -- forced calls are delegated in a transaction block BEGIN; SELECT mx_call_func_bigint_force(4, 2); END; -- forced calls are delegated in a DO block DO $$ BEGIN PERFORM * FROM mx_call_func_bigint_force(4, 2); END; $$ LANGUAGE plpgsql; \c - - - :master_port \set VERBOSITY terse SET search_path TO multi_mx_function_call_delegation, public; RESET client_min_messages; \set VERBOSITY terse DROP SCHEMA multi_mx_function_call_delegation CASCADE;