Mark partialize_agg as parallel safe

Postgres knows whether a given aggregate is parallel-safe, and creates parallel aggregation plans based on that. The `partialize_agg` is a wrapper we use to perform partial aggregation on data nodes. It is a pure function that produces serialized aggregation state as a result. Being pure, it doesn't influence parallel safety. This means we don't need to mark it parallel-unsafe to artificially disable the parallel plans for partial aggregation. They will be chosen as usual based on the parallel-safety of the underlying aggregate function.
2025-05-16 18:43:18 +08:00 · 2022-05-06 14:14:48 +03:00 · 2022-05-06 14:14:48 +03:00 · 5c0110cbbf
commit 5c0110cbbf
parent 1d0670e703
5 changed files with 159 additions and 6 deletions
--- a/sql/partialize_finalize.sql
+++ b/sql/partialize_finalize.sql
@ -2,24 +2,30 @@
 -- Please see the included NOTICE for copyright information and
 -- LICENSE-APACHE for a copy of the license.
 -- These wrapper functions are used to push down aggregation to data nodes.
 -- They can be marked parallel-safe, and the parallel plan will be chosen
 -- depending on whether the underlying aggregate function itself is
 -- parallel-safe.
 CREATE OR REPLACE FUNCTION _timescaledb_internal.partialize_agg(arg ANYELEMENT)
-RETURNS BYTEA AS '@MODULE_PATHNAME@', 'ts_partialize_agg' LANGUAGE C VOLATILE;
+RETURNS BYTEA AS '@MODULE_PATHNAME@', 'ts_partialize_agg' LANGUAGE C STABLE PARALLEL SAFE;
 CREATE OR REPLACE FUNCTION _timescaledb_internal.finalize_agg_sfunc(
 tstate internal, aggfn TEXT, inner_agg_collation_schema NAME, inner_agg_collation_name NAME, inner_agg_input_types NAME[][], inner_agg_serialized_state BYTEA, return_type_dummy_val ANYELEMENT)
 RETURNS internal
 AS '@MODULE_PATHNAME@', 'ts_finalize_agg_sfunc'
-LANGUAGE C IMMUTABLE ;
+LANGUAGE C IMMUTABLE PARALLEL SAFE;
 CREATE OR REPLACE FUNCTION _timescaledb_internal.finalize_agg_ffunc(
 tstate internal, aggfn TEXT, inner_agg_collation_schema NAME, inner_agg_collation_name NAME, inner_agg_input_types NAME[][], inner_agg_serialized_state BYTEA, return_type_dummy_val ANYELEMENT)
 RETURNS anyelement
 AS '@MODULE_PATHNAME@', 'ts_finalize_agg_ffunc'
-LANGUAGE C IMMUTABLE ;
+LANGUAGE C IMMUTABLE PARALLEL SAFE;
 CREATE OR REPLACE AGGREGATE _timescaledb_internal.finalize_agg(agg_name TEXT,  inner_agg_collation_schema NAME,  inner_agg_collation_name NAME, inner_agg_input_types NAME[][], inner_agg_serialized_state BYTEA, return_type_dummy_val anyelement) (
    SFUNC = _timescaledb_internal.finalize_agg_sfunc,
    STYPE = internal,
    FINALFUNC = _timescaledb_internal.finalize_agg_ffunc,
-    FINALFUNC_EXTRA
+    FINALFUNC_EXTRA,
    PARALLEL = SAFE
 );
--- a/test/runner_shared.sh
+++ b/test/runner_shared.sh
@ -81,6 +81,7 @@ ${PSQL} -U ${TEST_PGUSER} \
          sed  -e '/<exclude_from_test>/,/<\/exclude_from_test>/d' \
               -e 's!_[0-9]\{1,\}_[0-9]\{1,\}_chunk!_X_X_chunk!g' \
               -e 's!^ \{1,\}QUERY PLAN \{1,\}$!QUERY PLAN!' \
               -e 's!:  actual rows!: actual rows!' \
               -e '/^-\{1,\}$/d' \
               -e 's!\(_timescaledb_internal.chunks_in([^,]\{1,\}, ARRAY\[\)[^]]\{1,\}\]!\1..]!' \
               -e 's! Memory: [0-9]\{1,\}kB!!' \
--- a/tsl/test/shared/expected/dist_parallel_agg.out
+++ b/tsl/test/shared/expected/dist_parallel_agg.out
@ -0,0 +1,104 @@
 -- This file and its contents are licensed under the Timescale License.
 -- Please see the included NOTICE for copyright information and
 -- LICENSE-TIMESCALE for a copy of the license.
 -- Test that for parallel-safe aggregate function a parallel plan is generated
 -- on data nodes, and for unsafe it is not. We use a manually created safe
 -- function and not a builtin one, to check that we can in fact create a
 -- function that is parallelized, to prevent a false negative (i.e. it's not
 -- parallelized, but for a different reason, not because it's unsafe).
 -- Create a relatively big table on one data node to test parallel plans and
 -- avoid flakiness.
 create table metrics_dist1(like metrics_dist);
 select table_name from create_distributed_hypertable('metrics_dist1', 'time', 'device_id',
    data_nodes => '{"data_node_1"}');
 WARNING:  only one data node was assigned to the hypertable
  table_name   
 metrics_dist1
 (1 row)
 insert into metrics_dist1 select * from metrics_dist order by metrics_dist limit 20000;
 \set safe 'create or replace aggregate ts_debug_shippable_safe_count(*) (sfunc = int8inc, combinefunc=int8pl, stype = bigint, initcond = 0, parallel = safe);'
 \set unsafe 'create or replace aggregate ts_debug_shippable_unsafe_count(*) (sfunc = int8inc, combinefunc=int8pl, stype = bigint, initcond = 0, parallel = unsafe);'
 :safe
 call distributed_exec(:'safe');
 :unsafe
 call distributed_exec(:'unsafe');
 call distributed_exec($$ set parallel_tuple_cost = 0; $$);
 call distributed_exec($$ set parallel_setup_cost = 0; $$);
 call distributed_exec($$ set max_parallel_workers_per_gather = 1; $$);
 set timescaledb.enable_remote_explain = 1;
 set enable_partitionwise_aggregate = 1;
 \set analyze 'explain (analyze, verbose, costs off, timing off, summary off)'
 :analyze
 select count(*) from metrics_dist1;
 QUERY PLAN
 Custom Scan (DataNodeScan) (actual rows=1 loops=1)
   Output: (count(*))
   Relations: Aggregate on (public.metrics_dist1)
   Data node: data_node_1
   Fetcher Type: Row by row
   Chunks: _dist_hyper_X_X_chunk, _dist_hyper_X_X_chunk
   Remote SQL: SELECT count(*) FROM public.metrics_dist1 WHERE _timescaledb_internal.chunks_in(public.metrics_dist1.*, ARRAY[..])
   Remote EXPLAIN: 
     Finalize Aggregate (actual rows=1 loops=1)
       Output: count(*)
       ->  Gather (actual rows=2 loops=1)
             Output: (PARTIAL count(*))
             Workers Planned: 1
             Workers Launched: 1
             ->  Partial Aggregate (actual rows=1 loops=2)
                   Output: PARTIAL count(*)
                   Worker 0: actual rows=1 loops=1
                   ->  Parallel Append (actual rows=10000 loops=2)
                         Worker 0: actual rows=0 loops=1
                         ->  Parallel Seq Scan on _timescaledb_internal._dist_hyper_X_X_chunk (actual rows=17990 loops=1)
                         ->  Parallel Seq Scan on _timescaledb_internal._dist_hyper_X_X_chunk (actual rows=2010 loops=1)
 (22 rows)
 :analyze
 select ts_debug_shippable_safe_count(*) from metrics_dist1;
 QUERY PLAN
 Custom Scan (DataNodeScan) (actual rows=1 loops=1)
   Output: (ts_debug_shippable_safe_count(*))
   Relations: Aggregate on (public.metrics_dist1)
   Data node: data_node_1
   Fetcher Type: Row by row
   Chunks: _dist_hyper_X_X_chunk, _dist_hyper_X_X_chunk
   Remote SQL: SELECT public.ts_debug_shippable_safe_count(*) FROM public.metrics_dist1 WHERE _timescaledb_internal.chunks_in(public.metrics_dist1.*, ARRAY[..])
   Remote EXPLAIN: 
     Finalize Aggregate (actual rows=1 loops=1)
       Output: public.ts_debug_shippable_safe_count(*)
       ->  Gather (actual rows=2 loops=1)
             Output: (PARTIAL public.ts_debug_shippable_safe_count(*))
             Workers Planned: 1
             Workers Launched: 1
             ->  Partial Aggregate (actual rows=1 loops=2)
                   Output: PARTIAL public.ts_debug_shippable_safe_count(*)
                   Worker 0: actual rows=1 loops=1
                   ->  Parallel Append (actual rows=10000 loops=2)
                         Worker 0: actual rows=0 loops=1
                         ->  Parallel Seq Scan on _timescaledb_internal._dist_hyper_X_X_chunk (actual rows=17990 loops=1)
                         ->  Parallel Seq Scan on _timescaledb_internal._dist_hyper_X_X_chunk (actual rows=2010 loops=1)
 (22 rows)
 :analyze
 select ts_debug_shippable_unsafe_count(*) from metrics_dist1;
 QUERY PLAN
 Custom Scan (DataNodeScan) (actual rows=1 loops=1)
   Output: (ts_debug_shippable_unsafe_count(*))
   Relations: Aggregate on (public.metrics_dist1)
   Data node: data_node_1
   Fetcher Type: Row by row
   Chunks: _dist_hyper_X_X_chunk, _dist_hyper_X_X_chunk
   Remote SQL: SELECT public.ts_debug_shippable_unsafe_count(*) FROM public.metrics_dist1 WHERE _timescaledb_internal.chunks_in(public.metrics_dist1.*, ARRAY[..])
   Remote EXPLAIN: 
     Aggregate (actual rows=1 loops=1)
       Output: public.ts_debug_shippable_unsafe_count(*)
       ->  Append (actual rows=20000 loops=1)
             ->  Seq Scan on _timescaledb_internal._dist_hyper_X_X_chunk (actual rows=17990 loops=1)
             ->  Seq Scan on _timescaledb_internal._dist_hyper_X_X_chunk (actual rows=2010 loops=1)
 (14 rows)
--- a/tsl/test/shared/sql/CMakeLists.txt
+++ b/tsl/test/shared/sql/CMakeLists.txt
@ -22,8 +22,8 @@ if((${PG_VERSION_MAJOR} GREATER_EQUAL "14"))
 endif()
 if(CMAKE_BUILD_TYPE MATCHES Debug)
-  list(APPEND TEST_FILES_SHARED dist_remote_error.sql timestamp_limits.sql
+  list(APPEND TEST_FILES_SHARED dist_parallel_agg.sql dist_remote_error.sql
-       with_clause_parser.sql)
+       timestamp_limits.sql with_clause_parser.sql)
  list(APPEND TEST_TEMPLATES_SHARED constify_now.sql.in)
 endif(CMAKE_BUILD_TYPE MATCHES Debug)
--- a/tsl/test/shared/sql/dist_parallel_agg.sql
+++ b/tsl/test/shared/sql/dist_parallel_agg.sql
@ -0,0 +1,42 @@
 -- This file and its contents are licensed under the Timescale License.
 -- Please see the included NOTICE for copyright information and
 -- LICENSE-TIMESCALE for a copy of the license.
 -- Test that for parallel-safe aggregate function a parallel plan is generated
 -- on data nodes, and for unsafe it is not. We use a manually created safe
 -- function and not a builtin one, to check that we can in fact create a
 -- function that is parallelized, to prevent a false negative (i.e. it's not
 -- parallelized, but for a different reason, not because it's unsafe).
 -- Create a relatively big table on one data node to test parallel plans and
 -- avoid flakiness.
 create table metrics_dist1(like metrics_dist);
 select table_name from create_distributed_hypertable('metrics_dist1', 'time', 'device_id',
    data_nodes => '{"data_node_1"}');
 insert into metrics_dist1 select * from metrics_dist order by metrics_dist limit 20000;
 \set safe 'create or replace aggregate ts_debug_shippable_safe_count(*) (sfunc = int8inc, combinefunc=int8pl, stype = bigint, initcond = 0, parallel = safe);'
 \set unsafe 'create or replace aggregate ts_debug_shippable_unsafe_count(*) (sfunc = int8inc, combinefunc=int8pl, stype = bigint, initcond = 0, parallel = unsafe);'
 :safe
 call distributed_exec(:'safe');
 :unsafe
 call distributed_exec(:'unsafe');
 call distributed_exec($$ set parallel_tuple_cost = 0; $$);
 call distributed_exec($$ set parallel_setup_cost = 0; $$);
 call distributed_exec($$ set max_parallel_workers_per_gather = 1; $$);
 set timescaledb.enable_remote_explain = 1;
 set enable_partitionwise_aggregate = 1;
 \set analyze 'explain (analyze, verbose, costs off, timing off, summary off)'
 :analyze
 select count(*) from metrics_dist1;
 :analyze
 select ts_debug_shippable_safe_count(*) from metrics_dist1;
 :analyze
 select ts_debug_shippable_unsafe_count(*) from metrics_dist1;