Commit 728202b6 authored by Andrew Gierth

Order active window clauses for greater reuse of Sort nodes.

By sorting the active window list lexicographically by the sort clause
list but putting longer clauses before shorter prefixes, we generate
more chances to elide Sort nodes when building the path.

Author: Daniel Gustafsson (with some editorialization by me)
Reviewed-by: Alexander Kuzmenkov, Masahiko Sawada, Tom Lane
Discussion: https://postgr.es/m/124A7F69-84CD-435B-BA0E-2695BE21E5C2%40yesql.se
parent 75f9c4ca
...@@ -1011,8 +1011,11 @@ list_append_unique_oid(List *list, Oid datum) ...@@ -1011,8 +1011,11 @@ list_append_unique_oid(List *list, Oid datum)
* via equal(). * via equal().
* *
* This is almost the same functionality as list_union(), but list1 is * This is almost the same functionality as list_union(), but list1 is
* modified in-place rather than being copied. Note also that list2's cells * modified in-place rather than being copied. However, callers of this
* are not inserted in list1, so the analogy to list_concat() isn't perfect. * function may have strict ordering expectations -- i.e. that the relative
* order of those list2 elements that are not duplicates is preserved. Note
* also that list2's cells are not inserted in list1, so the analogy to
* list_concat() isn't perfect.
*/ */
List * List *
list_concat_unique(List *list1, List *list2) list_concat_unique(List *list1, List *list2)
......
...@@ -110,6 +110,17 @@ typedef struct ...@@ -110,6 +110,17 @@ typedef struct
int *tleref_to_colnum_map; int *tleref_to_colnum_map;
} grouping_sets_data; } grouping_sets_data;
/*
* Temporary structure for use during WindowClause reordering, so that
* WindowClauses can be sorted on their partitioning/ordering prefix.
*
* One entry is built per active window; an array of these entries is what
* gets sorted, and the original clauses are then read back out in the new
* order.
*/
typedef struct
{
WindowClause *wc; /* the original WindowClause this entry stands for */
List *uniqueOrder; /* A List of unique ordering/partitioning
* clauses per Window */
} WindowClauseSortData;
/* Local functions */ /* Local functions */
static Node *preprocess_expression(PlannerInfo *root, Node *expr, int kind); static Node *preprocess_expression(PlannerInfo *root, Node *expr, int kind);
static void preprocess_qual_conditions(PlannerInfo *root, Node *jtnode); static void preprocess_qual_conditions(PlannerInfo *root, Node *jtnode);
...@@ -236,6 +247,7 @@ static void create_partitionwise_grouping_paths(PlannerInfo *root, ...@@ -236,6 +247,7 @@ static void create_partitionwise_grouping_paths(PlannerInfo *root,
static bool group_by_has_partkey(RelOptInfo *input_rel, static bool group_by_has_partkey(RelOptInfo *input_rel,
List *targetList, List *targetList,
List *groupClause); List *groupClause);
static int common_prefix_cmp(const void *a, const void *b);
/***************************************************************************** /*****************************************************************************
...@@ -5259,67 +5271,119 @@ postprocess_setop_tlist(List *new_tlist, List *orig_tlist) ...@@ -5259,67 +5271,119 @@ postprocess_setop_tlist(List *new_tlist, List *orig_tlist)
static List * static List *
select_active_windows(PlannerInfo *root, WindowFuncLists *wflists) select_active_windows(PlannerInfo *root, WindowFuncLists *wflists)
{ {
List *result; List *windowClause = root->parse->windowClause;
List *actives; List *result = NIL;
ListCell *lc; ListCell *lc;
int nActive = 0;
WindowClauseSortData *actives = palloc(sizeof(WindowClauseSortData)
* list_length(windowClause));
/* First, make a list of the active windows */ /* First, construct an array of the active windows */
actives = NIL; foreach(lc, windowClause)
foreach(lc, root->parse->windowClause)
{ {
WindowClause *wc = lfirst_node(WindowClause, lc); WindowClause *wc = lfirst_node(WindowClause, lc);
/* It's only active if wflists shows some related WindowFuncs */ /* It's only active if wflists shows some related WindowFuncs */
Assert(wc->winref <= wflists->maxWinRef); Assert(wc->winref <= wflists->maxWinRef);
if (wflists->windowFuncs[wc->winref] != NIL) if (wflists->windowFuncs[wc->winref] == NIL)
actives = lappend(actives, wc); continue;
actives[nActive].wc = wc; /* original clause */
/*
* For sorting, we want the list of partition keys followed by the
* list of sort keys. But pathkeys construction will remove duplicates
* between the two, so we can as well (even though we can't detect all
* of the duplicates, since some may come from ECs - that might mean
* we miss optimization chances here). We must, however, ensure that
* the order of entries is preserved with respect to the ones we do
* keep.
*
* partitionClause and orderClause had their own duplicates removed in
* parse analysis, so we're only concerned here with removing
* orderClause entries that also appear in partitionClause.
*/
actives[nActive].uniqueOrder =
list_concat_unique(list_copy(wc->partitionClause),
wc->orderClause);
nActive++;
} }
/* /*
* Now, ensure that windows with identical partitioning/ordering clauses * Sort active windows by their partitioning/ordering clauses, ignoring
* are adjacent in the list. This is required by the SQL standard, which * any framing clauses, so that the windows that need the same sorting are
* says that only one sort is to be used for such windows, even if they * adjacent in the list. When we come to generate paths, this will avoid
* are otherwise distinct (eg, different names or framing clauses). * inserting additional Sort nodes.
* *
* There is room to be much smarter here, for example detecting whether * This is how we implement a specific requirement from the SQL standard,
* one window's sort keys are a prefix of another's (so that sorting for * which says that when two or more windows are order-equivalent (i.e.
* the latter would do for the former), or putting windows first that * have matching partition and order clauses, even if their names or
* match a sort order available for the underlying query. For the moment * framing clauses differ), then all peer rows must be presented in the
* we are content with meeting the spec. * same order in all of them. If we allowed multiple sort nodes for such
*/ * cases, we'd risk having the peer rows end up in different orders in
result = NIL; * equivalent windows due to sort instability. (See General Rule 4 of
while (actives != NIL) * <window clause> in SQL2008 - SQL2016.)
{ *
WindowClause *wc = linitial_node(WindowClause, actives); * Additionally, if the entire list of clauses of one window is a prefix
ListCell *prev; * of another, put first the window with stronger sorting requirements.
ListCell *next; * This way we will first sort for stronger window, and won't have to sort
* again for the weaker one.
/* Move wc from actives to result */ */
actives = list_delete_first(actives); qsort(actives, nActive, sizeof(WindowClauseSortData), common_prefix_cmp);
result = lappend(result, wc);
/* Now move any matching windows from actives to result */
prev = NULL;
for (lc = list_head(actives); lc; lc = next)
{
WindowClause *wc2 = lfirst_node(WindowClause, lc);
next = lnext(lc); /* build ordered list of the original WindowClause nodes */
/* framing options are NOT to be compared here! */ for (int i = 0; i < nActive; i++)
if (equal(wc->partitionClause, wc2->partitionClause) && result = lappend(result, actives[i].wc);
equal(wc->orderClause, wc2->orderClause))
{ pfree(actives);
actives = list_delete_cell(actives, lc, prev);
result = lappend(result, wc2);
}
else
prev = lc;
}
}
return result; return result;
} }
/*
 * common_prefix_cmp
 *	  qsort() comparator over WindowClauseSortData entries.
 *
 * The two uniqueOrder lists are walked in parallel and the first pair of
 * SortGroupClauses that differs decides the result.  Within a pair the
 * fields are examined in the order tleSortGroupRef, sortop, nulls_first;
 * the entry holding the larger value (or having nulls_first set when the
 * other does not) is ordered first.
 *
 * If every compared pair matches, the shorter list is a prefix of the
 * longer one (or the lists are the same length).  In that case the entry
 * with the longer list is ordered first; equal lengths compare as equal.
 */
static int
common_prefix_cmp(const void *a, const void *b)
{
	const WindowClauseSortData *lhs = a;
	const WindowClauseSortData *rhs = b;
	ListCell   *lcell;
	ListCell   *rcell;
	int			llen;
	int			rlen;

	forboth(lcell, lhs->uniqueOrder, rcell, rhs->uniqueOrder)
	{
		SortGroupClause *lsc = lfirst_node(SortGroupClause, lcell);
		SortGroupClause *rsc = lfirst_node(SortGroupClause, rcell);

		/* Target-list reference is the most significant key. */
		if (lsc->tleSortGroupRef != rsc->tleSortGroupRef)
			return (lsc->tleSortGroupRef > rsc->tleSortGroupRef) ? -1 : 1;

		/* Then the ordering operator. */
		if (lsc->sortop != rsc->sortop)
			return (lsc->sortop > rsc->sortop) ? -1 : 1;

		/* Then NULLS FIRST ahead of NULLS LAST. */
		if (lsc->nulls_first && !rsc->nulls_first)
			return -1;
		if (!lsc->nulls_first && rsc->nulls_first)
			return 1;

		/* eqop is not compared: it is fully determined by sortop */
	}

	/* All shared positions matched; the longer clause list goes first. */
	llen = list_length(lhs->uniqueOrder);
	rlen = list_length(rhs->uniqueOrder);

	if (llen > rlen)
		return -1;
	if (llen < rlen)
		return 1;

	return 0;
}
/* /*
* make_window_input_target * make_window_input_target
* Generate appropriate PathTarget for initial input to WindowAgg nodes. * Generate appropriate PathTarget for initial input to WindowAgg nodes.
......
...@@ -504,9 +504,9 @@ SELECT sum(salary), ...@@ -504,9 +504,9 @@ SELECT sum(salary),
FROM empsalary GROUP BY depname; FROM empsalary GROUP BY depname;
sum | row_number | sum sum | row_number | sum
-------+------------+------- -------+------------+-------
14600 | 3 | 14600
7400 | 2 | 22000
25100 | 1 | 47100 25100 | 1 | 47100
7400 | 2 | 22000
14600 | 3 | 14600
(3 rows) (3 rows)
-- identical windows with different names -- identical windows with different names
...@@ -2994,9 +2994,9 @@ SELECT sum(salary), row_number() OVER (ORDER BY depname), sum( ...@@ -2994,9 +2994,9 @@ SELECT sum(salary), row_number() OVER (ORDER BY depname), sum(
FROM empsalary GROUP BY depname; FROM empsalary GROUP BY depname;
sum | row_number | filtered_sum | depname sum | row_number | filtered_sum | depname
-------+------------+--------------+----------- -------+------------+--------------+-----------
14600 | 3 | | sales
7400 | 2 | 3500 | personnel
25100 | 1 | 22600 | develop 25100 | 1 | 22600 | develop
7400 | 2 | 3500 | personnel
14600 | 3 | | sales
(3 rows) (3 rows)
-- Test pushdown of quals into a subquery containing window functions -- Test pushdown of quals into a subquery containing window functions
...@@ -3008,13 +3008,13 @@ SELECT * FROM ...@@ -3008,13 +3008,13 @@ SELECT * FROM
min(salary) OVER (PARTITION BY depname || 'A', depname) depminsalary min(salary) OVER (PARTITION BY depname || 'A', depname) depminsalary
FROM empsalary) emp FROM empsalary) emp
WHERE depname = 'sales'; WHERE depname = 'sales';
QUERY PLAN QUERY PLAN
--------------------------------------------------------------------- --------------------------------------------------------------------------
Subquery Scan on emp Subquery Scan on emp
-> WindowAgg -> WindowAgg
-> Sort -> WindowAgg
Sort Key: (((empsalary.depname)::text || 'A'::text)) -> Sort
-> WindowAgg Sort Key: (((empsalary.depname)::text || 'A'::text))
-> Seq Scan on empsalary -> Seq Scan on empsalary
Filter: ((depname)::text = 'sales'::text) Filter: ((depname)::text = 'sales'::text)
(7 rows) (7 rows)
...@@ -3027,19 +3027,53 @@ SELECT * FROM ...@@ -3027,19 +3027,53 @@ SELECT * FROM
min(salary) OVER (PARTITION BY depname) depminsalary min(salary) OVER (PARTITION BY depname) depminsalary
FROM empsalary) emp FROM empsalary) emp
WHERE depname = 'sales'; WHERE depname = 'sales';
QUERY PLAN QUERY PLAN
----------------------------------------------------------- -------------------------------------------------------
Subquery Scan on emp Subquery Scan on emp
Filter: ((emp.depname)::text = 'sales'::text) Filter: ((emp.depname)::text = 'sales'::text)
-> WindowAgg -> WindowAgg
-> Sort -> Sort
Sort Key: empsalary.depname Sort Key: empsalary.enroll_date
-> WindowAgg -> WindowAgg
-> Sort -> Sort
Sort Key: empsalary.enroll_date Sort Key: empsalary.depname
-> Seq Scan on empsalary -> Seq Scan on empsalary
(9 rows) (9 rows)
-- Test Sort node collapsing
EXPLAIN (COSTS OFF)
SELECT * FROM
(SELECT depname,
sum(salary) OVER (PARTITION BY depname order by empno) depsalary,
min(salary) OVER (PARTITION BY depname, empno order by enroll_date) depminsalary
FROM empsalary) emp
WHERE depname = 'sales';
QUERY PLAN
----------------------------------------------------------------------
Subquery Scan on emp
-> WindowAgg
-> WindowAgg
-> Sort
Sort Key: empsalary.empno, empsalary.enroll_date
-> Seq Scan on empsalary
Filter: ((depname)::text = 'sales'::text)
(7 rows)
-- Test Sort node reordering
EXPLAIN (COSTS OFF)
SELECT
lead(1) OVER (PARTITION BY depname ORDER BY salary, enroll_date),
lag(1) OVER (PARTITION BY depname ORDER BY salary,enroll_date,empno)
FROM empsalary;
QUERY PLAN
-------------------------------------------------------------
WindowAgg
-> WindowAgg
-> Sort
Sort Key: depname, salary, enroll_date, empno
-> Seq Scan on empsalary
(5 rows)
-- cleanup -- cleanup
DROP TABLE empsalary; DROP TABLE empsalary;
-- test user-defined window function with named args and default args -- test user-defined window function with named args and default args
......
...@@ -892,6 +892,22 @@ SELECT * FROM ...@@ -892,6 +892,22 @@ SELECT * FROM
FROM empsalary) emp FROM empsalary) emp
WHERE depname = 'sales'; WHERE depname = 'sales';
-- Test Sort node collapsing
EXPLAIN (COSTS OFF)
SELECT * FROM
(SELECT depname,
sum(salary) OVER (PARTITION BY depname order by empno) depsalary,
min(salary) OVER (PARTITION BY depname, empno order by enroll_date) depminsalary
FROM empsalary) emp
WHERE depname = 'sales';
-- Test Sort node reordering
EXPLAIN (COSTS OFF)
SELECT
lead(1) OVER (PARTITION BY depname ORDER BY salary, enroll_date),
lag(1) OVER (PARTITION BY depname ORDER BY salary,enroll_date,empno)
FROM empsalary;
-- cleanup -- cleanup
DROP TABLE empsalary; DROP TABLE empsalary;
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment