Commit 75f9c4ca authored by Amit Kapila's avatar Amit Kapila

Don't allow LIMIT/OFFSET clause within sub-selects to be pushed to workers.

Allowing sub-select containing LIMIT/OFFSET in workers can lead to
inconsistent results at the top-level as there is no guarantee that the
row order will be fully deterministic.  The fix is to prohibit pushing
LIMIT/OFFSET within sub-selects to workers.

Reported-by: Andrew Fletcher
Bug: 15324
Author: Amit Kapila
Reviewed-by: Dilip Kumar
Backpatch-through: 9.6
Discussion: https://postgr.es/m/153417684333.10284.11356259990921828616@wrigleys.postgresql.org
parent 0ba06e0b
...@@ -620,7 +620,20 @@ set_rel_consider_parallel(PlannerInfo *root, RelOptInfo *rel, ...@@ -620,7 +620,20 @@ set_rel_consider_parallel(PlannerInfo *root, RelOptInfo *rel,
* the SubqueryScanPath as not parallel-safe. (Note that * the SubqueryScanPath as not parallel-safe. (Note that
* set_subquery_pathlist() might push some of these quals down * set_subquery_pathlist() might push some of these quals down
* into the subquery itself, but that doesn't change anything.) * into the subquery itself, but that doesn't change anything.)
*
* We can't push sub-select containing LIMIT/OFFSET to workers as
* there is no guarantee that the row order will be fully
* deterministic, and applying LIMIT/OFFSET will lead to
* inconsistent results at the top-level. (In some cases, where
* the result is ordered, we could relax this restriction. But it
* doesn't currently seem worth expending extra effort to do so.)
*/ */
{
Query *subquery = castNode(Query, rte->subquery);
if (limit_needed(subquery))
return;
}
break; break;
case RTE_JOIN: case RTE_JOIN:
......
...@@ -123,7 +123,6 @@ static void preprocess_rowmarks(PlannerInfo *root); ...@@ -123,7 +123,6 @@ static void preprocess_rowmarks(PlannerInfo *root);
static double preprocess_limit(PlannerInfo *root, static double preprocess_limit(PlannerInfo *root,
double tuple_fraction, double tuple_fraction,
int64 *offset_est, int64 *count_est); int64 *offset_est, int64 *count_est);
static bool limit_needed(Query *parse);
static void remove_useless_groupby_columns(PlannerInfo *root); static void remove_useless_groupby_columns(PlannerInfo *root);
static List *preprocess_groupclause(PlannerInfo *root, List *force); static List *preprocess_groupclause(PlannerInfo *root, List *force);
static List *extract_rollup_sets(List *groupingSets); static List *extract_rollup_sets(List *groupingSets);
...@@ -2870,7 +2869,7 @@ preprocess_limit(PlannerInfo *root, double tuple_fraction, ...@@ -2870,7 +2869,7 @@ preprocess_limit(PlannerInfo *root, double tuple_fraction,
* a key distinction: here we need hard constants in OFFSET/LIMIT, whereas * a key distinction: here we need hard constants in OFFSET/LIMIT, whereas
* in preprocess_limit it's good enough to consider estimated values. * in preprocess_limit it's good enough to consider estimated values.
*/ */
static bool bool
limit_needed(Query *parse) limit_needed(Query *parse)
{ {
Node *node; Node *node;
......
...@@ -47,6 +47,8 @@ extern bool is_dummy_plan(Plan *plan); ...@@ -47,6 +47,8 @@ extern bool is_dummy_plan(Plan *plan);
extern RowMarkType select_rowmark_type(RangeTblEntry *rte, extern RowMarkType select_rowmark_type(RangeTblEntry *rte,
LockClauseStrength strength); LockClauseStrength strength);
extern bool limit_needed(Query *parse);
extern void mark_partial_aggref(Aggref *agg, AggSplit aggsplit); extern void mark_partial_aggref(Aggref *agg, AggSplit aggsplit);
extern Path *get_cheapest_fractional_path(RelOptInfo *rel, extern Path *get_cheapest_fractional_path(RelOptInfo *rel,
......
...@@ -984,6 +984,25 @@ explain (costs off, verbose) ...@@ -984,6 +984,25 @@ explain (costs off, verbose)
Output: b.unique1 Output: b.unique1
(18 rows) (18 rows)
-- LIMIT/OFFSET within sub-selects can't be pushed to workers.
explain (costs off)
select * from tenk1 a where two in
(select two from tenk1 b where stringu1 like '%AAAA' limit 3);
QUERY PLAN
---------------------------------------------------------------
Hash Semi Join
Hash Cond: (a.two = b.two)
-> Gather
Workers Planned: 4
-> Parallel Seq Scan on tenk1 a
-> Hash
-> Limit
-> Gather
Workers Planned: 4
-> Parallel Seq Scan on tenk1 b
Filter: (stringu1 ~~ '%AAAA'::text)
(11 rows)
-- to increase the parallel query test coverage -- to increase the parallel query test coverage
SAVEPOINT settings; SAVEPOINT settings;
SET LOCAL force_parallel_mode = 1; SET LOCAL force_parallel_mode = 1;
......
...@@ -368,6 +368,11 @@ explain (costs off, verbose) ...@@ -368,6 +368,11 @@ explain (costs off, verbose)
(select unique1, row_number() over() from tenk1 b); (select unique1, row_number() over() from tenk1 b);
-- LIMIT/OFFSET within sub-selects can't be pushed to workers.
explain (costs off)
select * from tenk1 a where two in
(select two from tenk1 b where stringu1 like '%AAAA' limit 3);
-- to increase the parallel query test coverage -- to increase the parallel query test coverage
SAVEPOINT settings; SAVEPOINT settings;
SET LOCAL force_parallel_mode = 1; SET LOCAL force_parallel_mode = 1;
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment