mirror of
https://github.com/postgres/postgres.git
synced 2025-07-28 23:42:10 +03:00
Still another try at fixing scanjoin_target insertion into parallel plans.
The previous code neglected the fact that the scanjoin_target might carry sortgroupref labelings that we need to absorb. Instead, do create_projection_path() unconditionally, and tweak the path's cost estimate after the fact. (I'm now convinced that we ought to refactor the way we account for sometimes not needing a separate projection step, but right now is not the time for that sort of cleanup.) Problem identified by Amit Kapila, patch by me.
This commit is contained in:
@ -1788,36 +1788,39 @@ grouping_planner(PlannerInfo *root, bool inheritance_update,
|
|||||||
Path *subpath = (Path *) lfirst(lc);
|
Path *subpath = (Path *) lfirst(lc);
|
||||||
Path *newpath;
|
Path *newpath;
|
||||||
|
|
||||||
|
/* Shouldn't have any parameterized paths anymore */
|
||||||
|
Assert(subpath->param_info == NULL);
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* We can't use apply_projection_to_path() here, because there
|
* We can't use apply_projection_to_path() here, because there
|
||||||
* could already be pointers to these paths, and therefore we
|
* could already be pointers to these paths, and therefore we
|
||||||
* cannot modify them in place. Instead, we must use
|
* dare not modify them in place. Instead, we must use
|
||||||
* create_projection_path(). The good news is this won't
|
* create_projection_path() unconditionally.
|
||||||
* actually insert a Result node into the final plan unless
|
|
||||||
* it's needed, but the bad news is that it will charge for
|
|
||||||
* the node whether it's needed or not. Therefore, if the
|
|
||||||
* target list is already what we need it to be, just leave
|
|
||||||
* this partial path alone.
|
|
||||||
*/
|
*/
|
||||||
if (equal(scanjoin_target->exprs, subpath->pathtarget->exprs))
|
|
||||||
continue;
|
|
||||||
|
|
||||||
Assert(subpath->param_info == NULL);
|
|
||||||
newpath = (Path *) create_projection_path(root,
|
newpath = (Path *) create_projection_path(root,
|
||||||
current_rel,
|
current_rel,
|
||||||
subpath,
|
subpath,
|
||||||
scanjoin_target);
|
scanjoin_target);
|
||||||
if (is_projection_capable_path(subpath))
|
|
||||||
|
/*
|
||||||
|
* Although create_projection_path() inserts a ProjectionPath
|
||||||
|
* unconditionally, create_projection_plan() will only insert
|
||||||
|
* a Result node if the subpath is not projection-capable, so
|
||||||
|
* we should discount the cost of that node if it will not
|
||||||
|
* actually get inserted. (This is pretty grotty but we can
|
||||||
|
* improve it later if it seems important.)
|
||||||
|
*/
|
||||||
|
if (equal(scanjoin_target->exprs, subpath->pathtarget->exprs))
|
||||||
{
|
{
|
||||||
/*
|
/* at most we need a relabeling of the subpath */
|
||||||
* Since the target lists differ, a projection path is
|
|
||||||
* essential, but it will disappear at plan creation time
|
|
||||||
* because the subpath is projection-capable. So avoid
|
|
||||||
* charging anything for the disappearing node.
|
|
||||||
*/
|
|
||||||
newpath->startup_cost = subpath->startup_cost;
|
newpath->startup_cost = subpath->startup_cost;
|
||||||
newpath->total_cost = subpath->total_cost;
|
newpath->total_cost = subpath->total_cost;
|
||||||
}
|
}
|
||||||
|
else if (is_projection_capable_path(subpath))
|
||||||
|
{
|
||||||
|
/* need to project, but we don't need a Result */
|
||||||
|
newpath->total_cost -= cpu_tuple_cost * subpath->rows;
|
||||||
|
}
|
||||||
|
|
||||||
lfirst(lc) = newpath;
|
lfirst(lc) = newpath;
|
||||||
}
|
}
|
||||||
|
@ -6,9 +6,10 @@ create or replace function parallel_restricted(int) returns int as
|
|||||||
-- Serializable isolation would disable parallel query, so explicitly use an
|
-- Serializable isolation would disable parallel query, so explicitly use an
|
||||||
-- arbitrary other level.
|
-- arbitrary other level.
|
||||||
begin isolation level repeatable read;
|
begin isolation level repeatable read;
|
||||||
-- setup parallel test
|
-- encourage use of parallel plans
|
||||||
set parallel_setup_cost=0;
|
set parallel_setup_cost=0;
|
||||||
set parallel_tuple_cost=0;
|
set parallel_tuple_cost=0;
|
||||||
|
set min_parallel_relation_size=0;
|
||||||
set max_parallel_workers_per_gather=4;
|
set max_parallel_workers_per_gather=4;
|
||||||
explain (costs off)
|
explain (costs off)
|
||||||
select count(*) from a_star;
|
select count(*) from a_star;
|
||||||
@ -71,6 +72,21 @@ select length(stringu1) from tenk1 group by length(stringu1);
|
|||||||
6
|
6
|
||||||
(1 row)
|
(1 row)
|
||||||
|
|
||||||
|
explain (costs off)
|
||||||
|
select stringu1, count(*) from tenk1 group by stringu1 order by stringu1;
|
||||||
|
QUERY PLAN
|
||||||
|
----------------------------------------------------
|
||||||
|
Sort
|
||||||
|
Sort Key: stringu1
|
||||||
|
-> Finalize HashAggregate
|
||||||
|
Group Key: stringu1
|
||||||
|
-> Gather
|
||||||
|
Workers Planned: 4
|
||||||
|
-> Partial HashAggregate
|
||||||
|
Group Key: stringu1
|
||||||
|
-> Parallel Seq Scan on tenk1
|
||||||
|
(9 rows)
|
||||||
|
|
||||||
-- test that parallel plan for aggregates is not selected when
|
-- test that parallel plan for aggregates is not selected when
|
||||||
-- target list contains parallel restricted clause.
|
-- target list contains parallel restricted clause.
|
||||||
explain (costs off)
|
explain (costs off)
|
||||||
|
@ -9,9 +9,10 @@ create or replace function parallel_restricted(int) returns int as
|
|||||||
-- arbitrary other level.
|
-- arbitrary other level.
|
||||||
begin isolation level repeatable read;
|
begin isolation level repeatable read;
|
||||||
|
|
||||||
-- setup parallel test
|
-- encourage use of parallel plans
|
||||||
set parallel_setup_cost=0;
|
set parallel_setup_cost=0;
|
||||||
set parallel_tuple_cost=0;
|
set parallel_tuple_cost=0;
|
||||||
|
set min_parallel_relation_size=0;
|
||||||
set max_parallel_workers_per_gather=4;
|
set max_parallel_workers_per_gather=4;
|
||||||
|
|
||||||
explain (costs off)
|
explain (costs off)
|
||||||
@ -29,6 +30,9 @@ explain (costs off)
|
|||||||
select length(stringu1) from tenk1 group by length(stringu1);
|
select length(stringu1) from tenk1 group by length(stringu1);
|
||||||
select length(stringu1) from tenk1 group by length(stringu1);
|
select length(stringu1) from tenk1 group by length(stringu1);
|
||||||
|
|
||||||
|
explain (costs off)
|
||||||
|
select stringu1, count(*) from tenk1 group by stringu1 order by stringu1;
|
||||||
|
|
||||||
-- test that parallel plan for aggregates is not selected when
|
-- test that parallel plan for aggregates is not selected when
|
||||||
-- target list contains parallel restricted clause.
|
-- target list contains parallel restricted clause.
|
||||||
explain (costs off)
|
explain (costs off)
|
||||||
|
Reference in New Issue
Block a user