Commit 624e440a authored by Tom Lane

Improve the heuristic for ordering child paths of a parallel append.

Commit ab727167 introduced code that attempts to order the child
scans of a Parallel Append node in a way that will minimize execution
time, based on total cost and startup cost.  However, it failed to
think hard about what to do when estimated costs are exactly equal;
a case that's particularly likely to occur when comparing on startup
cost.  In such a case the ordering of the child paths would be left
to the whims of qsort, an algorithm that isn't even stable.

We can improve matters by applying the rule used elsewhere in the
planner: if total costs are equal, sort on startup cost, and
vice versa.  When both cost estimates are exactly equal, rather
than letting qsort do something unpredictable, sort based on the
child paths' relids, which should typically result in sorting in
inheritance order.  (The latter provision requires inventing a
qsort-style comparator for bitmapsets, but maybe we'll have use
for that for other reasons in future.)

This results in a few plan changes in the select_parallel test,
but those all look more reasonable than before, when the actual
underlying cost numbers are taken into account.

Discussion: https://postgr.es/m/4944.1515446989@sss.pgh.pa.us
parent 80259d4d
...@@ -172,6 +172,50 @@ bms_equal(const Bitmapset *a, const Bitmapset *b) ...@@ -172,6 +172,50 @@ bms_equal(const Bitmapset *a, const Bitmapset *b)
return true; return true;
} }
/*
 * bms_compare - three-way ordering of two bitmapsets, for use with qsort
 *
 * The result is 0 exactly when bms_equal would consider the inputs equal.
 * In every other case the sign of the result is decided by the
 * highest-numbered bit that is a member of one set but not the other: the
 * set containing that bit sorts higher.  (So, for instance, {6} sorts
 * after {5}.)
 *
 * Returns -1 if a sorts before b, +1 if a sorts after b, and 0 on a tie.
 */
int
bms_compare(const Bitmapset *a, const Bitmapset *b)
{
	int			ncommon;
	int			wordnum;

	/*
	 * A NULL input compares equal to any input that bms_is_empty accepts,
	 * and sorts on the low side of everything else.
	 */
	if (a == NULL)
	{
		if (bms_is_empty(b))
			return 0;
		return -1;
	}
	if (b == NULL)
	{
		if (bms_is_empty(a))
			return 0;
		return +1;
	}

	ncommon = Min(a->nwords, b->nwords);

	/*
	 * At most one input has words past the common length.  Any nonzero word
	 * found there settles the comparison at once, in favor of the longer
	 * input.
	 */
	wordnum = ncommon;
	while (wordnum < a->nwords)
	{
		if (a->words[wordnum] != 0)
			return +1;
		wordnum++;
	}
	wordnum = ncommon;
	while (wordnum < b->nwords)
	{
		if (b->words[wordnum] != 0)
			return -1;
		wordnum++;
	}

	/* Walk the shared words from the highest index down to the lowest */
	for (wordnum = ncommon - 1; wordnum >= 0; wordnum--)
	{
		const bitmapword aw = a->words[wordnum];
		const bitmapword bw = b->words[wordnum];

		if (aw == bw)
			continue;
		return (aw < bw) ? -1 : +1;
	}

	/* No differing word anywhere: the sets are equal */
	return 0;
}
/* /*
* bms_make_singleton - build a bitmapset containing a single member * bms_make_singleton - build a bitmapset containing a single member
*/ */
...@@ -838,7 +882,7 @@ bms_add_range(Bitmapset *a, int lower, int upper) ...@@ -838,7 +882,7 @@ bms_add_range(Bitmapset *a, int lower, int upper)
if (lwordnum == uwordnum) if (lwordnum == uwordnum)
{ {
a->words[lwordnum] |= ~(bitmapword) (((bitmapword) 1 << lbitnum) - 1) a->words[lwordnum] |= ~(bitmapword) (((bitmapword) 1 << lbitnum) - 1)
& (~(bitmapword) 0) >> ushiftbits; & (~(bitmapword) 0) >> ushiftbits;
} }
else else
{ {
......
...@@ -1274,38 +1274,44 @@ create_append_path(RelOptInfo *rel, ...@@ -1274,38 +1274,44 @@ create_append_path(RelOptInfo *rel,
/* /*
* append_total_cost_compare * append_total_cost_compare
* list_qsort comparator for sorting append child paths by total_cost * qsort comparator for sorting append child paths by total_cost descending
*
* For equal total costs, we fall back to comparing startup costs; if those
* are equal too, break ties using bms_compare on the paths' relids.
* (This is to avoid getting unpredictable results from qsort.)
*/ */
static int static int
append_total_cost_compare(const void *a, const void *b) append_total_cost_compare(const void *a, const void *b)
{ {
Path *path1 = (Path *) lfirst(*(ListCell **) a); Path *path1 = (Path *) lfirst(*(ListCell **) a);
Path *path2 = (Path *) lfirst(*(ListCell **) b); Path *path2 = (Path *) lfirst(*(ListCell **) b);
int cmp;
if (path1->total_cost > path2->total_cost) cmp = compare_path_costs(path1, path2, TOTAL_COST);
return -1; if (cmp != 0)
if (path1->total_cost < path2->total_cost) return -cmp;
return 1; return bms_compare(path1->parent->relids, path2->parent->relids);
return 0;
} }
/* /*
* append_startup_cost_compare * append_startup_cost_compare
* list_qsort comparator for sorting append child paths by startup_cost * qsort comparator for sorting append child paths by startup_cost descending
*
* For equal startup costs, we fall back to comparing total costs; if those
* are equal too, break ties using bms_compare on the paths' relids.
* (This is to avoid getting unpredictable results from qsort.)
*/ */
static int static int
append_startup_cost_compare(const void *a, const void *b) append_startup_cost_compare(const void *a, const void *b)
{ {
Path *path1 = (Path *) lfirst(*(ListCell **) a); Path *path1 = (Path *) lfirst(*(ListCell **) a);
Path *path2 = (Path *) lfirst(*(ListCell **) b); Path *path2 = (Path *) lfirst(*(ListCell **) b);
int cmp;
if (path1->startup_cost > path2->startup_cost) cmp = compare_path_costs(path1, path2, STARTUP_COST);
return -1; if (cmp != 0)
if (path1->startup_cost < path2->startup_cost) return -cmp;
return 1; return bms_compare(path1->parent->relids, path2->parent->relids);
return 0;
} }
/* /*
......
...@@ -65,6 +65,7 @@ typedef enum ...@@ -65,6 +65,7 @@ typedef enum
extern Bitmapset *bms_copy(const Bitmapset *a); extern Bitmapset *bms_copy(const Bitmapset *a);
extern bool bms_equal(const Bitmapset *a, const Bitmapset *b); extern bool bms_equal(const Bitmapset *a, const Bitmapset *b);
extern int bms_compare(const Bitmapset *a, const Bitmapset *b);
extern Bitmapset *bms_make_singleton(int x); extern Bitmapset *bms_make_singleton(int x);
extern void bms_free(Bitmapset *a); extern void bms_free(Bitmapset *a);
......
...@@ -21,12 +21,12 @@ explain (costs off) ...@@ -21,12 +21,12 @@ explain (costs off)
Workers Planned: 3 Workers Planned: 3
-> Partial Aggregate -> Partial Aggregate
-> Parallel Append -> Parallel Append
-> Parallel Seq Scan on a_star
-> Parallel Seq Scan on b_star
-> Parallel Seq Scan on c_star
-> Parallel Seq Scan on d_star -> Parallel Seq Scan on d_star
-> Parallel Seq Scan on e_star
-> Parallel Seq Scan on f_star -> Parallel Seq Scan on f_star
-> Parallel Seq Scan on e_star
-> Parallel Seq Scan on b_star
-> Parallel Seq Scan on c_star
-> Parallel Seq Scan on a_star
(11 rows) (11 rows)
select round(avg(aa)), sum(aa) from a_star a1; select round(avg(aa)), sum(aa) from a_star a1;
...@@ -49,10 +49,10 @@ explain (costs off) ...@@ -49,10 +49,10 @@ explain (costs off)
-> Parallel Append -> Parallel Append
-> Seq Scan on d_star -> Seq Scan on d_star
-> Seq Scan on c_star -> Seq Scan on c_star
-> Parallel Seq Scan on a_star
-> Parallel Seq Scan on b_star
-> Parallel Seq Scan on e_star
-> Parallel Seq Scan on f_star -> Parallel Seq Scan on f_star
-> Parallel Seq Scan on e_star
-> Parallel Seq Scan on b_star
-> Parallel Seq Scan on a_star
(11 rows) (11 rows)
select round(avg(aa)), sum(aa) from a_star a2; select round(avg(aa)), sum(aa) from a_star a2;
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment