Allow negative aggtransspace to indicate unbounded state size

author Richard Guo <rguo@postgresql.org>

Wed, 8 Oct 2025 08:01:48 +0000 (17:01 +0900)

committer Richard Guo <rguo@postgresql.org>

Wed, 8 Oct 2025 08:01:48 +0000 (17:01 +0900)
author Richard Guo <rguo@postgresql.org>
Wed, 8 Oct 2025 08:01:48 +0000 (17:01 +0900)
committer Richard Guo <rguo@postgresql.org>
Wed, 8 Oct 2025 08:01:48 +0000 (17:01 +0900)
diff --git a/doc/src/sgml/catalogs.sgml b/doc/src/sgml/catalogs.sgml

index e9095bedf21e0ad6c839f1d5f13ad05cc0e96bbb..3acc2222a87306365b9b7f02b3b4506d26e2e89f 100644 (file)
--- a/doc/src/sgml/catalogs.sgml
+++ b/doc/src/sgml/catalogs.sgml
@@ -596,7 +596,10 @@
        </para>
        <para>
         Approximate average size (in bytes) of the transition state
-       data, or zero to use a default estimate
+       data. A positive value provides an estimate; zero means to
+       use a default estimate. A negative value indicates the state
+       data can grow unboundedly in size, such as when the aggregate
+       accumulates input rows (e.g., array_agg, string_agg).
        </para></entry>
       </row>
  
diff --git a/doc/src/sgml/ref/create_aggregate.sgml b/doc/src/sgml/ref/create_aggregate.sgml

index 222e0aa5c9d08bf7223664438af0c9525e655581..0472ac2e874590aac38c2176ef8959d76077a016 100644 (file)
--- a/doc/src/sgml/ref/create_aggregate.sgml
+++ b/doc/src/sgml/ref/create_aggregate.sgml
@@ -384,9 +384,13 @@ SELECT col FROM tab ORDER BY col USING sortop LIMIT 1;
       <para>
        The approximate average size (in bytes) of the aggregate's state value.
        If this parameter is omitted or is zero, a default estimate is used
-      based on the <replaceable>state_data_type</replaceable>.
+      based on the <replaceable>state_data_type</replaceable>. If set to a
+      negative value, it indicates the state data can grow unboundedly in
+      size, such as when the aggregate accumulates input rows (e.g.,
+      array_agg, string_agg).
        The planner uses this value to estimate the memory required for a
-      grouped aggregate query.
+      grouped aggregate query and to avoid optimizations that may cause
+      excessive memory usage.
       </para>
      </listitem>
     </varlistentry>
@@ -568,7 +572,8 @@ SELECT col FROM tab ORDER BY col USING sortop LIMIT 1;
       <para>
        The approximate average size (in bytes) of the aggregate's state
        value, when using moving-aggregate mode.  This works the same as
-      <replaceable>state_data_size</replaceable>.
+      <replaceable>state_data_size</replaceable>, except that negative
+      values are not used to indicate unbounded state size.
       </para>
      </listitem>
     </varlistentry>
diff --git a/src/include/catalog/catversion.h b/src/include/catalog/catversion.h

index 00b3bce1e120835d38ac80f729e3435d380a7d4f..af54211f330f17a25ad266b8e6aff52ae4d664a9 100644 (file)
--- a/src/include/catalog/catversion.h
+++ b/src/include/catalog/catversion.h
@@ -57,6 +57,6 @@
   */
  
  /*                                                     yyyymmddN */
-#define CATALOG_VERSION_NO     202510081
+#define CATALOG_VERSION_NO     202510082
  
  #endif
diff --git a/src/include/catalog/pg_aggregate.dat b/src/include/catalog/pg_aggregate.dat

index d6aa1f6ec478709b9cf34461355f86719b219750..870769e8f14cc501c9ef143b61831f5d3808c97a 100644 (file)
--- a/src/include/catalog/pg_aggregate.dat
+++ b/src/include/catalog/pg_aggregate.dat
@@ -558,26 +558,28 @@
    aggfinalfn => 'array_agg_finalfn', aggcombinefn => 'array_agg_combine',
    aggserialfn => 'array_agg_serialize',
    aggdeserialfn => 'array_agg_deserialize', aggfinalextra => 't',
-  aggtranstype => 'internal' },
+  aggtranstype => 'internal', aggtransspace => '-1' },
  { aggfnoid => 'array_agg(anyarray)', aggtransfn => 'array_agg_array_transfn',
    aggfinalfn => 'array_agg_array_finalfn',
    aggcombinefn => 'array_agg_array_combine',
    aggserialfn => 'array_agg_array_serialize',
    aggdeserialfn => 'array_agg_array_deserialize', aggfinalextra => 't',
-  aggtranstype => 'internal' },
+  aggtranstype => 'internal', aggtransspace => '-1' },
  
  # text
  { aggfnoid => 'string_agg(text,text)', aggtransfn => 'string_agg_transfn',
    aggfinalfn => 'string_agg_finalfn', aggcombinefn => 'string_agg_combine',
    aggserialfn => 'string_agg_serialize',
-  aggdeserialfn => 'string_agg_deserialize', aggtranstype => 'internal' },
+  aggdeserialfn => 'string_agg_deserialize',
+  aggtranstype => 'internal', aggtransspace => '-1' },
  
  # bytea
  { aggfnoid => 'string_agg(bytea,bytea)',
    aggtransfn => 'bytea_string_agg_transfn',
    aggfinalfn => 'bytea_string_agg_finalfn',
    aggcombinefn => 'string_agg_combine', aggserialfn => 'string_agg_serialize',
-  aggdeserialfn => 'string_agg_deserialize', aggtranstype => 'internal' },
+  aggdeserialfn => 'string_agg_deserialize',
+  aggtranstype => 'internal', aggtransspace => '-1' },
  
  # range
  { aggfnoid => 'range_intersect_agg(anyrange)',
diff --git a/src/test/regress/expected/opr_sanity.out b/src/test/regress/expected/opr_sanity.out

index 20bf9ea9cdf766c8245b5b56874efaeae9a4f15a..a357e1d0c0e1842f95974a6ab26d063d80174d69 100644 (file)
--- a/src/test/regress/expected/opr_sanity.out
+++ b/src/test/regress/expected/opr_sanity.out
@@ -1470,7 +1470,7 @@ WHERE aggfnoid = 0 OR aggtransfn = 0 OR
      (aggkind = 'n' AND aggnumdirectargs > 0) OR
      aggfinalmodify NOT IN ('r', 's', 'w') OR
      aggmfinalmodify NOT IN ('r', 's', 'w') OR
-    aggtranstype = 0 OR aggtransspace < 0 OR aggmtransspace < 0;
+    aggtranstype = 0 OR aggmtransspace < 0;
   ctid | aggfnoid 
  ------+----------
  (0 rows)
diff --git a/src/test/regress/sql/opr_sanity.sql b/src/test/regress/sql/opr_sanity.sql

index 2fb3a85287816f00fca60038150426083598fa38..cd674d7dbca388db27317bddd4cbddbb4e22c81b 100644 (file)
--- a/src/test/regress/sql/opr_sanity.sql
+++ b/src/test/regress/sql/opr_sanity.sql
@@ -847,7 +847,7 @@ WHERE aggfnoid = 0 OR aggtransfn = 0 OR
      (aggkind = 'n' AND aggnumdirectargs > 0) OR
      aggfinalmodify NOT IN ('r', 's', 'w') OR
      aggmfinalmodify NOT IN ('r', 's', 'w') OR
-    aggtranstype = 0 OR aggtransspace < 0 OR aggmtransspace < 0;
+    aggtranstype = 0 OR aggmtransspace < 0;
  
  -- Make sure the matching pg_proc entry is sensible, too.
author	Richard Guo <rguo@postgresql.org>
	Wed, 8 Oct 2025 08:01:48 +0000 (17:01 +0900)
committer	Richard Guo <rguo@postgresql.org>
	Wed, 8 Oct 2025 08:01:48 +0000 (17:01 +0900)
doc/src/sgml/catalogs.sgml		patch \| blob \| blame \| history
doc/src/sgml/ref/create_aggregate.sgml		patch \| blob \| blame \| history
src/include/catalog/catversion.h		patch \| blob \| blame \| history
src/include/catalog/pg_aggregate.dat		patch \| blob \| blame \| history
src/test/regress/expected/opr_sanity.out		patch \| blob \| blame \| history
src/test/regress/sql/opr_sanity.sql		patch \| blob \| blame \| history