1
0
mirror of https://github.com/postgres/postgres.git synced 2025-10-24 01:29:19 +03:00

Allow extension functions to participate in in-place updates.

Commit 1dc5ebc90 allowed PL/pgSQL to perform in-place updates
of expanded-object variables that are being updated with
assignments like "x := f(x, ...)".  However this was allowed
only for a hard-wired list of functions f(), since we need to
be sure that f() will not modify the variable if it fails.
It was always envisioned that we should make that extensible,
but at the time we didn't have a good way to do so.  Since
then we've invented the idea of "support functions" to allow
attaching specialized optimization knowledge to functions,
and that is a perfect mechanism for doing this.

Hence, adjust PL/pgSQL to use a support function request instead
of hard-wired logic to decide if in-place update is safe.
Preserve the previous optimizations by creating support functions
for the three functions that were previously hard-wired.

Author: Tom Lane <tgl@sss.pgh.pa.us>
Reviewed-by: Andrey Borodin <x4mmm@yandex-team.ru>
Reviewed-by: Pavel Borisov <pashkin.elfe@gmail.com>
Discussion: https://postgr.es/m/CACxu=vJaKFNsYxooSnW1wEgsAO5u_v1XYBacfVJ14wgJV_PYeg@mail.gmail.com
This commit is contained in:
Tom Lane
2025-02-11 12:49:34 -05:00
parent 6c7251db0c
commit c366d2bdba
9 changed files with 203 additions and 60 deletions

View File

@@ -16,6 +16,7 @@
#include "common/int.h" #include "common/int.h"
#include "common/pg_prng.h" #include "common/pg_prng.h"
#include "libpq/pqformat.h" #include "libpq/pqformat.h"
#include "nodes/supportnodes.h"
#include "port/pg_bitutils.h" #include "port/pg_bitutils.h"
#include "utils/array.h" #include "utils/array.h"
#include "utils/builtins.h" #include "utils/builtins.h"
@@ -167,6 +168,36 @@ array_append(PG_FUNCTION_ARGS)
PG_RETURN_DATUM(result); PG_RETURN_DATUM(result);
} }
/*
* array_append_support()
*
* Planner support function for array_append()
*/
Datum
array_append_support(PG_FUNCTION_ARGS)
{
Node *rawreq = (Node *) PG_GETARG_POINTER(0);
Node *ret = NULL;
if (IsA(rawreq, SupportRequestModifyInPlace))
{
/*
* We can optimize in-place appends if the function's array argument
* is the array being assigned to. We don't need to worry about array
* references within the other argument.
*/
SupportRequestModifyInPlace *req = (SupportRequestModifyInPlace *) rawreq;
Param *arg = (Param *) linitial(req->args);
if (arg && IsA(arg, Param) &&
arg->paramkind == PARAM_EXTERN &&
arg->paramid == req->paramid)
ret = (Node *) arg;
}
PG_RETURN_POINTER(ret);
}
/*----------------------------------------------------------------------------- /*-----------------------------------------------------------------------------
* array_prepend : * array_prepend :
* push an element onto the front of a one-dimensional array * push an element onto the front of a one-dimensional array
@@ -230,6 +261,36 @@ array_prepend(PG_FUNCTION_ARGS)
PG_RETURN_DATUM(result); PG_RETURN_DATUM(result);
} }
/*
* array_prepend_support()
*
* Planner support function for array_prepend()
*/
Datum
array_prepend_support(PG_FUNCTION_ARGS)
{
Node *rawreq = (Node *) PG_GETARG_POINTER(0);
Node *ret = NULL;
if (IsA(rawreq, SupportRequestModifyInPlace))
{
/*
* We can optimize in-place prepends if the function's array argument
* is the array being assigned to. We don't need to worry about array
* references within the other argument.
*/
SupportRequestModifyInPlace *req = (SupportRequestModifyInPlace *) rawreq;
Param *arg = (Param *) lsecond(req->args);
if (arg && IsA(arg, Param) &&
arg->paramkind == PARAM_EXTERN &&
arg->paramid == req->paramid)
ret = (Node *) arg;
}
PG_RETURN_POINTER(ret);
}
/*----------------------------------------------------------------------------- /*-----------------------------------------------------------------------------
* array_cat : * array_cat :
* concatenate two nD arrays to form an nD array, or * concatenate two nD arrays to form an nD array, or

View File

@@ -18,6 +18,7 @@
#include "nodes/makefuncs.h" #include "nodes/makefuncs.h"
#include "nodes/nodeFuncs.h" #include "nodes/nodeFuncs.h"
#include "nodes/subscripting.h" #include "nodes/subscripting.h"
#include "nodes/supportnodes.h"
#include "parser/parse_coerce.h" #include "parser/parse_coerce.h"
#include "parser/parse_expr.h" #include "parser/parse_expr.h"
#include "utils/array.h" #include "utils/array.h"
@@ -575,3 +576,36 @@ raw_array_subscript_handler(PG_FUNCTION_ARGS)
PG_RETURN_POINTER(&sbsroutines); PG_RETURN_POINTER(&sbsroutines);
} }
/*
* array_subscript_handler_support()
*
* Planner support function for array_subscript_handler()
*/
Datum
array_subscript_handler_support(PG_FUNCTION_ARGS)
{
Node *rawreq = (Node *) PG_GETARG_POINTER(0);
Node *ret = NULL;
if (IsA(rawreq, SupportRequestModifyInPlace))
{
/*
* We can optimize in-place subscripted assignment if the refexpr is
* the array being assigned to. We don't need to worry about array
* references within the refassgnexpr or the subscripts; however, if
* there's no refassgnexpr then it's a fetch which there's no need to
* optimize.
*/
SupportRequestModifyInPlace *req = (SupportRequestModifyInPlace *) rawreq;
Param *refexpr = (Param *) linitial(req->args);
if (refexpr && IsA(refexpr, Param) &&
refexpr->paramkind == PARAM_EXTERN &&
refexpr->paramid == req->paramid &&
lsecond(req->args) != NULL)
ret = (Node *) refexpr;
}
PG_RETURN_POINTER(ret);
}

View File

@@ -57,6 +57,6 @@
*/ */
/* yyyymmddN */ /* yyyymmddN */
#define CATALOG_VERSION_NO 202502071 #define CATALOG_VERSION_NO 202502111
#endif #endif

View File

@@ -1598,14 +1598,20 @@
proname => 'cardinality', prorettype => 'int4', proargtypes => 'anyarray', proname => 'cardinality', prorettype => 'int4', proargtypes => 'anyarray',
prosrc => 'array_cardinality' }, prosrc => 'array_cardinality' },
{ oid => '378', descr => 'append element onto end of array', { oid => '378', descr => 'append element onto end of array',
proname => 'array_append', proisstrict => 'f', proname => 'array_append', prosupport => 'array_append_support',
prorettype => 'anycompatiblearray', proisstrict => 'f', prorettype => 'anycompatiblearray',
proargtypes => 'anycompatiblearray anycompatible', prosrc => 'array_append' }, proargtypes => 'anycompatiblearray anycompatible', prosrc => 'array_append' },
{ oid => '8680', descr => 'planner support for array_append',
proname => 'array_append_support', prorettype => 'internal',
proargtypes => 'internal', prosrc => 'array_append_support' },
{ oid => '379', descr => 'prepend element onto front of array', { oid => '379', descr => 'prepend element onto front of array',
proname => 'array_prepend', proisstrict => 'f', proname => 'array_prepend', prosupport => 'array_prepend_support',
prorettype => 'anycompatiblearray', proisstrict => 'f', prorettype => 'anycompatiblearray',
proargtypes => 'anycompatible anycompatiblearray', proargtypes => 'anycompatible anycompatiblearray',
prosrc => 'array_prepend' }, prosrc => 'array_prepend' },
{ oid => '8681', descr => 'planner support for array_prepend',
proname => 'array_prepend_support', prorettype => 'internal',
proargtypes => 'internal', prosrc => 'array_prepend_support' },
{ oid => '383', { oid => '383',
proname => 'array_cat', proisstrict => 'f', proname => 'array_cat', proisstrict => 'f',
prorettype => 'anycompatiblearray', prorettype => 'anycompatiblearray',
@@ -12207,8 +12213,12 @@
# subscripting support for built-in types # subscripting support for built-in types
{ oid => '6179', descr => 'standard array subscripting support', { oid => '6179', descr => 'standard array subscripting support',
proname => 'array_subscript_handler', prorettype => 'internal', proname => 'array_subscript_handler',
prosupport => 'array_subscript_handler_support', prorettype => 'internal',
proargtypes => 'internal', prosrc => 'array_subscript_handler' }, proargtypes => 'internal', prosrc => 'array_subscript_handler' },
{ oid => '8682', descr => 'planner support for array_subscript_handler',
proname => 'array_subscript_handler_support', prorettype => 'internal',
proargtypes => 'internal', prosrc => 'array_subscript_handler_support' },
{ oid => '6180', descr => 'raw array subscripting support', { oid => '6180', descr => 'raw array subscripting support',
proname => 'raw_array_subscript_handler', prorettype => 'internal', proname => 'raw_array_subscript_handler', prorettype => 'internal',
proargtypes => 'internal', prosrc => 'raw_array_subscript_handler' }, proargtypes => 'internal', prosrc => 'raw_array_subscript_handler' },

View File

@@ -6,10 +6,10 @@
* This file defines the API for "planner support functions", which * This file defines the API for "planner support functions", which
* are SQL functions (normally written in C) that can be attached to * are SQL functions (normally written in C) that can be attached to
* another "target" function to give the system additional knowledge * another "target" function to give the system additional knowledge
* about the target function. All the current capabilities have to do * about the target function. The name is now something of a misnomer,
* with planning queries that use the target function, though it is * since some of the call sites are in the executor not the planner,
* possible that future extensions will add functionality to be invoked * but "function support function" would be a confusing name so we
* by the parser or executor. * stick with "planner support function".
* *
* A support function must have the SQL signature * A support function must have the SQL signature
* supportfn(internal) returns internal * supportfn(internal) returns internal
@@ -343,4 +343,51 @@ typedef struct SupportRequestOptimizeWindowClause
* optimizations are possible. */ * optimizations are possible. */
} SupportRequestOptimizeWindowClause; } SupportRequestOptimizeWindowClause;
/*
* The ModifyInPlace request allows the support function to detect whether
* a call to its target function can be allowed to modify a read/write
* expanded object in-place. The context is that we are considering a
* PL/pgSQL (or similar PL) assignment of the form "x := f(x, ...)" where
* the variable x is of a type that can be represented as an expanded object
* (see utils/expandeddatum.h). If f() can usefully optimize by modifying
* the passed-in object in-place, then this request can be implemented to
* instruct PL/pgSQL to pass a read-write expanded pointer to the variable's
* value. (Note that there is no guarantee that later calls to f() will
* actually do so. If f() receives a read-only pointer, or a pointer to a
* non-expanded object, it must follow the usual convention of not modifying
* the pointed-to object.) There are two requirements that must be met
* to make this safe:
* 1. f() must guarantee that it will not have modified the object if it
* fails. Otherwise the variable's value might change unexpectedly.
* 2. If the other arguments to f() ("..." in the above example) contain
* references to x, f() must be able to cope with that; or if that's not
* safe, the support function must scan the other arguments to verify that
* there are no other references to x. An example of the concern here is
* that in "arr := array_append(arr, arr[1])", if the array element type
* is pass-by-reference then array_append would receive a second argument
* that points into the array object it intends to modify. array_append is
* coded to make that safe, but other functions might not be able to cope.
*
* "args" is a node tree list representing the function's arguments.
* One or more nodes within the node tree will be PARAM_EXTERN Params
* with ID "paramid", which represent the assignment target variable.
* (Note that such references are not necessarily at top level in the list,
* for example we might have "x := f(x, g(x))". Generally it's only safe
* to optimize a reference that is at top level, else we're making promises
* about the behavior of g() as well as f().)
*
* If modify-in-place is safe, the support function should return the
* address of the Param node that is to return a read-write pointer.
* (At most one of the references is allowed to do so.) Otherwise,
* return NULL.
*/
typedef struct SupportRequestModifyInPlace
{
NodeTag type;
Oid funcid; /* PG_PROC OID of the target function */
List *args; /* Arguments to the function */
int paramid; /* ID of Param(s) representing variable */
} SupportRequestModifyInPlace;
#endif /* SUPPORTNODES_H */ #endif /* SUPPORTNODES_H */

View File

@@ -57,10 +57,11 @@ begin
-- test scenarios for optimization of updates of R/W expanded objects -- test scenarios for optimization of updates of R/W expanded objects
a := array_append(a, 42); -- optimizable using "transfer" method a := array_append(a, 42); -- optimizable using "transfer" method
a := a || a[3]; -- optimizable using "inplace" method a := a || a[3]; -- optimizable using "inplace" method
a := a[1] || a; -- ditto, but let's test array_prepend
a := a || a; -- not optimizable a := a || a; -- not optimizable
raise notice 'a = %', a; raise notice 'a = %', a;
end$$; end$$;
NOTICE: a = {1,2,3,42,3,1,2,3,42,3} NOTICE: a = {1,1,2,3,42,3,1,1,2,3,42,3}
create temp table onecol as select array[1,2] as f1; create temp table onecol as select array[1,2] as f1;
do $$ declare a int[]; do $$ declare a int[];
begin a := f1 from onecol; raise notice 'a = %', a; end$$; begin a := f1 from onecol; raise notice 'a = %', a; end$$;

View File

@@ -29,6 +29,7 @@
#include "mb/stringinfo_mb.h" #include "mb/stringinfo_mb.h"
#include "miscadmin.h" #include "miscadmin.h"
#include "nodes/nodeFuncs.h" #include "nodes/nodeFuncs.h"
#include "nodes/supportnodes.h"
#include "optimizer/optimizer.h" #include "optimizer/optimizer.h"
#include "parser/parse_coerce.h" #include "parser/parse_coerce.h"
#include "parser/parse_type.h" #include "parser/parse_type.h"
@@ -8411,7 +8412,7 @@ exec_check_rw_parameter(PLpgSQL_expr *expr, int paramid)
Expr *sexpr = expr->expr_simple_expr; Expr *sexpr = expr->expr_simple_expr;
Oid funcid; Oid funcid;
List *fargs; List *fargs;
ListCell *lc; Oid prosupport;
/* Assume unsafe */ /* Assume unsafe */
expr->expr_rwopt = PLPGSQL_RWOPT_NOPE; expr->expr_rwopt = PLPGSQL_RWOPT_NOPE;
@@ -8480,66 +8481,53 @@ exec_check_rw_parameter(PLpgSQL_expr *expr, int paramid)
{ {
SubscriptingRef *sbsref = (SubscriptingRef *) sexpr; SubscriptingRef *sbsref = (SubscriptingRef *) sexpr;
/* We only trust standard varlena arrays to be safe */ funcid = get_typsubscript(sbsref->refcontainertype, NULL);
/* TODO: install some extensibility here */
if (get_typsubscript(sbsref->refcontainertype, NULL) !=
F_ARRAY_SUBSCRIPT_HANDLER)
return;
/* We can optimize the refexpr if it's the target, otherwise not */ /*
if (sbsref->refexpr && IsA(sbsref->refexpr, Param)) * We assume that only the refexpr and refassgnexpr (if any) are
{ * relevant to the support function's decision. If that turns out to
Param *param = (Param *) sbsref->refexpr; * be a bad idea, we could incorporate the subscript expressions into
* the fargs list somehow.
if (param->paramkind == PARAM_EXTERN && */
param->paramid == paramid) fargs = list_make2(sbsref->refexpr, sbsref->refassgnexpr);
{
/* Found the Param we want to pass as read/write */
expr->expr_rwopt = PLPGSQL_RWOPT_INPLACE;
expr->expr_rw_param = param;
return;
}
}
return;
} }
else else
return; return;
/* /*
* The top-level function must be one that we trust to be "safe". * The top-level function must be one that can handle in-place update
* Currently we hard-wire the list, but it would be very desirable to * safely. We allow functions to declare their ability to do that via a
* allow extensions to mark their functions as safe ... * support function request.
*/ */
if (!(funcid == F_ARRAY_APPEND || prosupport = get_func_support(funcid);
funcid == F_ARRAY_PREPEND)) if (OidIsValid(prosupport))
return;
/*
* The target variable (in the form of a Param) must appear as a direct
* argument of the top-level function. References further down in the
* tree can't be optimized; but on the other hand, they don't invalidate
* optimizing the top-level call, since that will be executed last.
*/
foreach(lc, fargs)
{ {
Node *arg = (Node *) lfirst(lc); SupportRequestModifyInPlace req;
Param *param;
if (arg && IsA(arg, Param)) req.type = T_SupportRequestModifyInPlace;
{ req.funcid = funcid;
Param *param = (Param *) arg; req.args = fargs;
req.paramid = paramid;
param = (Param *)
DatumGetPointer(OidFunctionCall1(prosupport,
PointerGetDatum(&req)));
if (param == NULL)
return; /* support function fails */
/* Verify support function followed the API */
Assert(IsA(param, Param));
Assert(param->paramkind == PARAM_EXTERN);
Assert(param->paramid == paramid);
if (param->paramkind == PARAM_EXTERN &&
param->paramid == paramid)
{
/* Found the Param we want to pass as read/write */ /* Found the Param we want to pass as read/write */
expr->expr_rwopt = PLPGSQL_RWOPT_INPLACE; expr->expr_rwopt = PLPGSQL_RWOPT_INPLACE;
expr->expr_rw_param = param; expr->expr_rw_param = param;
return; return;
} }
} }
}
}
/* /*
* Count Params referencing the specified paramid, and return one of them * Count Params referencing the specified paramid, and return one of them

View File

@@ -53,6 +53,7 @@ begin
-- test scenarios for optimization of updates of R/W expanded objects -- test scenarios for optimization of updates of R/W expanded objects
a := array_append(a, 42); -- optimizable using "transfer" method a := array_append(a, 42); -- optimizable using "transfer" method
a := a || a[3]; -- optimizable using "inplace" method a := a || a[3]; -- optimizable using "inplace" method
a := a[1] || a; -- ditto, but let's test array_prepend
a := a || a; -- not optimizable a := a || a; -- not optimizable
raise notice 'a = %', a; raise notice 'a = %', a;
end$$; end$$;

View File

@@ -2804,6 +2804,7 @@ SubscriptionRelState
SummarizerReadLocalXLogPrivate SummarizerReadLocalXLogPrivate
SupportRequestCost SupportRequestCost
SupportRequestIndexCondition SupportRequestIndexCondition
SupportRequestModifyInPlace
SupportRequestOptimizeWindowClause SupportRequestOptimizeWindowClause
SupportRequestRows SupportRequestRows
SupportRequestSelectivity SupportRequestSelectivity