Commit 3373c715 authored by David Rowley's avatar David Rowley

Speed up finding EquivalenceClasses for a given set of rels

Previously in order to determine which ECs a relation had members in, we
had to loop over all ECs stored in PlannerInfo's eq_classes and check if
ec_relids mentioned the relation.  For the most part, this was fine, as
generally, unless queries were fairly complex, the overhead of performing
the lookup would have not been that significant.  However, when queries
contained large numbers of joins and ECs, the overhead to find the set of
classes matching a given set of relations could become a significant
portion of the overall planning effort.

Here we allow a much more efficient method to access the ECs which match a
given relation or set of relations.  A new Bitmapset field in RelOptInfo
now exists to store the indexes into PlannerInfo's eq_classes list which
each relation is mentioned in.  This allows very fast lookups to find all
ECs belonging to a single relation.  When we need to lookup ECs belonging
to a given pair of relations, we can simply bitwise-AND the Bitmapsets from
each relation and use the result to perform the lookup.

We also take the opportunity to write a new implementation of
generate_join_implied_equalities which makes use of the new indexes.
generate_join_implied_equalities_for_ecs must remain as is as it can be
given a custom list of ECs, which we can't easily determine the indexes of.

This was originally intended to fix the performance penalty of looking up
foreign keys matching a join condition which was introduced by 100340e2.
However, we're speeding up much more than just that here.

Author: David Rowley, Tom Lane
Reviewed-by: Tom Lane, Tomas Vondra
Discussion: https://postgr.es/m/6970.1545327857@sss.pgh.pa.us
parent 894af78f
...@@ -2195,6 +2195,7 @@ _outPlannerInfo(StringInfo str, const PlannerInfo *node) ...@@ -2195,6 +2195,7 @@ _outPlannerInfo(StringInfo str, const PlannerInfo *node)
WRITE_NODE_FIELD(cte_plan_ids); WRITE_NODE_FIELD(cte_plan_ids);
WRITE_NODE_FIELD(multiexpr_params); WRITE_NODE_FIELD(multiexpr_params);
WRITE_NODE_FIELD(eq_classes); WRITE_NODE_FIELD(eq_classes);
WRITE_BOOL_FIELD(ec_merging_done);
WRITE_NODE_FIELD(canon_pathkeys); WRITE_NODE_FIELD(canon_pathkeys);
WRITE_NODE_FIELD(left_join_clauses); WRITE_NODE_FIELD(left_join_clauses);
WRITE_NODE_FIELD(right_join_clauses); WRITE_NODE_FIELD(right_join_clauses);
...@@ -2261,6 +2262,7 @@ _outRelOptInfo(StringInfo str, const RelOptInfo *node) ...@@ -2261,6 +2262,7 @@ _outRelOptInfo(StringInfo str, const RelOptInfo *node)
WRITE_UINT_FIELD(pages); WRITE_UINT_FIELD(pages);
WRITE_FLOAT_FIELD(tuples, "%.0f"); WRITE_FLOAT_FIELD(tuples, "%.0f");
WRITE_FLOAT_FIELD(allvisfrac, "%.6f"); WRITE_FLOAT_FIELD(allvisfrac, "%.6f");
WRITE_BITMAPSET_FIELD(eclass_indexes);
WRITE_NODE_FIELD(subroot); WRITE_NODE_FIELD(subroot);
WRITE_NODE_FIELD(subplan_params); WRITE_NODE_FIELD(subplan_params);
WRITE_INT_FIELD(rel_parallel_workers); WRITE_INT_FIELD(rel_parallel_workers);
......
This diff is collapsed.
...@@ -48,9 +48,7 @@ static bool right_merge_direction(PlannerInfo *root, PathKey *pathkey); ...@@ -48,9 +48,7 @@ static bool right_merge_direction(PlannerInfo *root, PathKey *pathkey);
* entry if there's not one already. * entry if there's not one already.
* *
* Note that this function must not be used until after we have completed * Note that this function must not be used until after we have completed
* merging EquivalenceClasses. (We don't try to enforce that here; instead, * merging EquivalenceClasses.
* equivclass.c will complain if a merge occurs after root->canon_pathkeys
* has become nonempty.)
*/ */
PathKey * PathKey *
make_canonical_pathkey(PlannerInfo *root, make_canonical_pathkey(PlannerInfo *root,
...@@ -61,6 +59,10 @@ make_canonical_pathkey(PlannerInfo *root, ...@@ -61,6 +59,10 @@ make_canonical_pathkey(PlannerInfo *root,
ListCell *lc; ListCell *lc;
MemoryContext oldcontext; MemoryContext oldcontext;
/* Can't make canonical pathkeys if the set of ECs might still change */
if (!root->ec_merging_done)
elog(ERROR, "too soon to build canonical pathkeys");
/* The passed eclass might be non-canonical, so chase up to the top */ /* The passed eclass might be non-canonical, so chase up to the top */
while (eclass->ec_merged) while (eclass->ec_merged)
eclass = eclass->ec_merged; eclass = eclass->ec_merged;
......
...@@ -139,6 +139,12 @@ query_planner(PlannerInfo *root, ...@@ -139,6 +139,12 @@ query_planner(PlannerInfo *root,
/* Select cheapest path (pretty easy in this case...) */ /* Select cheapest path (pretty easy in this case...) */
set_cheapest(final_rel); set_cheapest(final_rel);
/*
* We don't need to run generate_base_implied_equalities, but
* we do need to pretend that EC merging is complete.
*/
root->ec_merging_done = true;
/* /*
* We still are required to call qp_callback, in case it's * We still are required to call qp_callback, in case it's
* something like "SELECT 2+2 ORDER BY 1". * something like "SELECT 2+2 ORDER BY 1".
......
...@@ -618,6 +618,7 @@ subquery_planner(PlannerGlobal *glob, Query *parse, ...@@ -618,6 +618,7 @@ subquery_planner(PlannerGlobal *glob, Query *parse,
root->cte_plan_ids = NIL; root->cte_plan_ids = NIL;
root->multiexpr_params = NIL; root->multiexpr_params = NIL;
root->eq_classes = NIL; root->eq_classes = NIL;
root->ec_merging_done = false;
root->append_rel_list = NIL; root->append_rel_list = NIL;
root->rowMarks = NIL; root->rowMarks = NIL;
memset(root->upper_rels, 0, sizeof(root->upper_rels)); memset(root->upper_rels, 0, sizeof(root->upper_rels));
......
...@@ -886,6 +886,7 @@ pull_up_simple_subquery(PlannerInfo *root, Node *jtnode, RangeTblEntry *rte, ...@@ -886,6 +886,7 @@ pull_up_simple_subquery(PlannerInfo *root, Node *jtnode, RangeTblEntry *rte,
subroot->cte_plan_ids = NIL; subroot->cte_plan_ids = NIL;
subroot->multiexpr_params = NIL; subroot->multiexpr_params = NIL;
subroot->eq_classes = NIL; subroot->eq_classes = NIL;
subroot->ec_merging_done = false;
subroot->append_rel_list = NIL; subroot->append_rel_list = NIL;
subroot->rowMarks = NIL; subroot->rowMarks = NIL;
memset(subroot->upper_rels, 0, sizeof(subroot->upper_rels)); memset(subroot->upper_rels, 0, sizeof(subroot->upper_rels));
......
...@@ -120,6 +120,15 @@ plan_set_operations(PlannerInfo *root) ...@@ -120,6 +120,15 @@ plan_set_operations(PlannerInfo *root)
Assert(parse->windowClause == NIL); Assert(parse->windowClause == NIL);
Assert(parse->distinctClause == NIL); Assert(parse->distinctClause == NIL);
/*
* In the outer query level, we won't have any true equivalences to deal
* with; but we do want to be able to make pathkeys, which will require
* single-member EquivalenceClasses. Indicate that EC merging is complete
* so that pathkeys.c won't complain.
*/
Assert(root->eq_classes == NIL);
root->ec_merging_done = true;
/* /*
* We'll need to build RelOptInfos for each of the leaf subqueries, which * We'll need to build RelOptInfos for each of the leaf subqueries, which
* are RTE_SUBQUERY rangetable entries in this Query. Prepare the index * are RTE_SUBQUERY rangetable entries in this Query. Prepare the index
......
...@@ -218,6 +218,7 @@ build_simple_rel(PlannerInfo *root, int relid, RelOptInfo *parent) ...@@ -218,6 +218,7 @@ build_simple_rel(PlannerInfo *root, int relid, RelOptInfo *parent)
rel->pages = 0; rel->pages = 0;
rel->tuples = 0; rel->tuples = 0;
rel->allvisfrac = 0; rel->allvisfrac = 0;
rel->eclass_indexes = NULL;
rel->subroot = NULL; rel->subroot = NULL;
rel->subplan_params = NIL; rel->subplan_params = NIL;
rel->rel_parallel_workers = -1; /* set up in get_relation_info */ rel->rel_parallel_workers = -1; /* set up in get_relation_info */
...@@ -629,6 +630,7 @@ build_join_rel(PlannerInfo *root, ...@@ -629,6 +630,7 @@ build_join_rel(PlannerInfo *root,
joinrel->pages = 0; joinrel->pages = 0;
joinrel->tuples = 0; joinrel->tuples = 0;
joinrel->allvisfrac = 0; joinrel->allvisfrac = 0;
joinrel->eclass_indexes = NULL;
joinrel->subroot = NULL; joinrel->subroot = NULL;
joinrel->subplan_params = NIL; joinrel->subplan_params = NIL;
joinrel->rel_parallel_workers = -1; joinrel->rel_parallel_workers = -1;
...@@ -808,6 +810,7 @@ build_child_join_rel(PlannerInfo *root, RelOptInfo *outer_rel, ...@@ -808,6 +810,7 @@ build_child_join_rel(PlannerInfo *root, RelOptInfo *outer_rel,
joinrel->pages = 0; joinrel->pages = 0;
joinrel->tuples = 0; joinrel->tuples = 0;
joinrel->allvisfrac = 0; joinrel->allvisfrac = 0;
joinrel->eclass_indexes = NULL;
joinrel->subroot = NULL; joinrel->subroot = NULL;
joinrel->subplan_params = NIL; joinrel->subplan_params = NIL;
joinrel->serverid = InvalidOid; joinrel->serverid = InvalidOid;
......
...@@ -265,6 +265,8 @@ struct PlannerInfo ...@@ -265,6 +265,8 @@ struct PlannerInfo
List *eq_classes; /* list of active EquivalenceClasses */ List *eq_classes; /* list of active EquivalenceClasses */
bool ec_merging_done; /* set true once ECs are canonical */
List *canon_pathkeys; /* list of "canonical" PathKeys */ List *canon_pathkeys; /* list of "canonical" PathKeys */
List *left_join_clauses; /* list of RestrictInfos for mergejoinable List *left_join_clauses; /* list of RestrictInfos for mergejoinable
...@@ -505,6 +507,8 @@ typedef struct PartitionSchemeData *PartitionScheme; ...@@ -505,6 +507,8 @@ typedef struct PartitionSchemeData *PartitionScheme;
* pages - number of disk pages in relation (zero if not a table) * pages - number of disk pages in relation (zero if not a table)
* tuples - number of tuples in relation (not considering restrictions) * tuples - number of tuples in relation (not considering restrictions)
* allvisfrac - fraction of disk pages that are marked all-visible * allvisfrac - fraction of disk pages that are marked all-visible
* eclass_indexes - EquivalenceClasses that mention this rel (filled
* only after EC merging is complete)
* subroot - PlannerInfo for subquery (NULL if it's not a subquery) * subroot - PlannerInfo for subquery (NULL if it's not a subquery)
* subplan_params - list of PlannerParamItems to be passed to subquery * subplan_params - list of PlannerParamItems to be passed to subquery
* *
...@@ -678,6 +682,8 @@ typedef struct RelOptInfo ...@@ -678,6 +682,8 @@ typedef struct RelOptInfo
BlockNumber pages; /* size estimates derived from pg_class */ BlockNumber pages; /* size estimates derived from pg_class */
double tuples; double tuples;
double allvisfrac; double allvisfrac;
Bitmapset *eclass_indexes; /* Indexes in PlannerInfo's eq_classes list of
* ECs that mention this rel */
PlannerInfo *subroot; /* if subquery */ PlannerInfo *subroot; /* if subquery */
List *subplan_params; /* if subquery */ List *subplan_params; /* if subquery */
int rel_parallel_workers; /* wanted number of parallel workers */ int rel_parallel_workers; /* wanted number of parallel workers */
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment