Commit 7c944bd9 authored by Robert Haas's avatar Robert Haas

Introduce a new GUC force_parallel_mode for testing purposes.

When force_parallel_mode = true, we enable the parallel mode restrictions
for all queries for which this is believed to be safe.  For the subset of
those queries believed to be safe to run entirely within a worker, we spin
up a worker and run the query there instead of running it in the
original process.  When force_parallel_mode = regress, make additional
changes to allow the regression tests to run cleanly even though parallel
workers have been injected under the hood.

Taken together, this facilitates both better user testing and better
regression testing of the parallelism code.

Robert Haas, with help from Amit Kapila and Rushabh Lathia.
parent a1c1af2a
...@@ -3802,6 +3802,51 @@ SELECT * FROM parent WHERE key = 2400; ...@@ -3802,6 +3802,51 @@ SELECT * FROM parent WHERE key = 2400;
</listitem> </listitem>
</varlistentry> </varlistentry>
<varlistentry id="guc-force-parallel-mode" xreflabel="force_parallel_mode">
<term><varname>force_parallel_mode</varname> (<type>enum</type>)
<indexterm>
<primary><varname>force_parallel_mode</> configuration parameter</primary>
</indexterm>
</term>
<listitem>
<para>
Allows the use of parallel queries for testing purposes even in cases
where no performance benefit is expected.
The allowed values of <varname>force_parallel_mode</> are
<literal>off</> (use parallel mode only when it is expected to improve
performance), <literal>on</> (force parallel query for all queries
for which it is thought to be safe), and <literal>regress</> (like
on, but with additional behavior changes to facilitate automated
regression testing).
</para>
<para>
More specifically, setting this value to <literal>on</> will add
a <literal>Gather</> node to the top of any query plan for which this
appears to be safe, so that the query runs inside of a parallel worker.
Even when a parallel worker is not available or cannot be used,
operations such as starting a subtransaction that would be prohibited
in a parallel query context will be prohibited unless the planner
believes that this will cause the query to fail. If failures or
unexpected results occur when this option is set, some functions used
by the query may need to be marked <literal>PARALLEL UNSAFE</literal>
(or, possibly, <literal>PARALLEL RESTRICTED</literal>).
</para>
<para>
Setting this value to <literal>regress</> has all of the same effects
as setting it to <literal>on</> plus some additional effect that are
intended to facilitate automated regression testing. Normally,
messages from a parallel worker are prefixed with a context line,
but a setting of <literal>regress</> suppresses this to guarantee
reproducible results. Also, the <literal>Gather</> nodes added to
plans by this setting are hidden from the <literal>EXPLAIN</> output
so that the output matches what would be obtained if this setting
were turned <literal>off</>.
</para>
</listitem>
</varlistentry>
</variablelist> </variablelist>
</sect2> </sect2>
</sect1> </sect1>
......
...@@ -22,6 +22,7 @@ ...@@ -22,6 +22,7 @@
#include "libpq/pqformat.h" #include "libpq/pqformat.h"
#include "libpq/pqmq.h" #include "libpq/pqmq.h"
#include "miscadmin.h" #include "miscadmin.h"
#include "optimizer/planmain.h"
#include "storage/ipc.h" #include "storage/ipc.h"
#include "storage/sinval.h" #include "storage/sinval.h"
#include "storage/spin.h" #include "storage/spin.h"
...@@ -1079,6 +1080,7 @@ ParallelExtensionTrampoline(dsm_segment *seg, shm_toc *toc) ...@@ -1079,6 +1080,7 @@ ParallelExtensionTrampoline(dsm_segment *seg, shm_toc *toc)
static void static void
ParallelErrorContext(void *arg) ParallelErrorContext(void *arg)
{ {
if (force_parallel_mode != FORCE_PARALLEL_REGRESS)
errcontext("parallel worker, PID %d", *(int32 *) arg); errcontext("parallel worker, PID %d", *(int32 *) arg);
} }
......
...@@ -23,6 +23,7 @@ ...@@ -23,6 +23,7 @@
#include "foreign/fdwapi.h" #include "foreign/fdwapi.h"
#include "nodes/nodeFuncs.h" #include "nodes/nodeFuncs.h"
#include "optimizer/clauses.h" #include "optimizer/clauses.h"
#include "optimizer/planmain.h"
#include "parser/parsetree.h" #include "parser/parsetree.h"
#include "rewrite/rewriteHandler.h" #include "rewrite/rewriteHandler.h"
#include "tcop/tcopprot.h" #include "tcop/tcopprot.h"
...@@ -572,6 +573,7 @@ void ...@@ -572,6 +573,7 @@ void
ExplainPrintPlan(ExplainState *es, QueryDesc *queryDesc) ExplainPrintPlan(ExplainState *es, QueryDesc *queryDesc)
{ {
Bitmapset *rels_used = NULL; Bitmapset *rels_used = NULL;
PlanState *ps;
Assert(queryDesc->plannedstmt != NULL); Assert(queryDesc->plannedstmt != NULL);
es->pstmt = queryDesc->plannedstmt; es->pstmt = queryDesc->plannedstmt;
...@@ -580,7 +582,17 @@ ExplainPrintPlan(ExplainState *es, QueryDesc *queryDesc) ...@@ -580,7 +582,17 @@ ExplainPrintPlan(ExplainState *es, QueryDesc *queryDesc)
es->rtable_names = select_rtable_names_for_explain(es->rtable, rels_used); es->rtable_names = select_rtable_names_for_explain(es->rtable, rels_used);
es->deparse_cxt = deparse_context_for_plan_rtable(es->rtable, es->deparse_cxt = deparse_context_for_plan_rtable(es->rtable,
es->rtable_names); es->rtable_names);
ExplainNode(queryDesc->planstate, NIL, NULL, NULL, es);
/*
* Sometimes we mark a Gather node as "invisible", which means that it's
* not displayed in EXPLAIN output. The purpose of this is to allow
* running regression tests with force_parallel_mode=regress to get the
* same results as running the same tests with force_parallel_mode=off.
*/
ps = queryDesc->planstate;
if (IsA(ps, GatherState) &&((Gather *) ps->plan)->invisible)
ps = outerPlanState(ps);
ExplainNode(ps, NIL, NULL, NULL, es);
} }
/* /*
......
...@@ -334,6 +334,7 @@ _copyGather(const Gather *from) ...@@ -334,6 +334,7 @@ _copyGather(const Gather *from)
*/ */
COPY_SCALAR_FIELD(num_workers); COPY_SCALAR_FIELD(num_workers);
COPY_SCALAR_FIELD(single_copy); COPY_SCALAR_FIELD(single_copy);
COPY_SCALAR_FIELD(invisible);
return newnode; return newnode;
} }
......
...@@ -443,6 +443,7 @@ _outGather(StringInfo str, const Gather *node) ...@@ -443,6 +443,7 @@ _outGather(StringInfo str, const Gather *node)
WRITE_INT_FIELD(num_workers); WRITE_INT_FIELD(num_workers);
WRITE_BOOL_FIELD(single_copy); WRITE_BOOL_FIELD(single_copy);
WRITE_BOOL_FIELD(invisible);
} }
static void static void
...@@ -1824,6 +1825,7 @@ _outPlannerGlobal(StringInfo str, const PlannerGlobal *node) ...@@ -1824,6 +1825,7 @@ _outPlannerGlobal(StringInfo str, const PlannerGlobal *node)
WRITE_BOOL_FIELD(hasRowSecurity); WRITE_BOOL_FIELD(hasRowSecurity);
WRITE_BOOL_FIELD(parallelModeOK); WRITE_BOOL_FIELD(parallelModeOK);
WRITE_BOOL_FIELD(parallelModeNeeded); WRITE_BOOL_FIELD(parallelModeNeeded);
WRITE_BOOL_FIELD(wholePlanParallelSafe);
WRITE_BOOL_FIELD(hasForeignJoin); WRITE_BOOL_FIELD(hasForeignJoin);
} }
......
...@@ -2053,6 +2053,7 @@ _readGather(void) ...@@ -2053,6 +2053,7 @@ _readGather(void)
READ_INT_FIELD(num_workers); READ_INT_FIELD(num_workers);
READ_BOOL_FIELD(single_copy); READ_BOOL_FIELD(single_copy);
READ_BOOL_FIELD(invisible);
READ_DONE(); READ_DONE();
} }
......
...@@ -212,6 +212,10 @@ create_plan(PlannerInfo *root, Path *best_path) ...@@ -212,6 +212,10 @@ create_plan(PlannerInfo *root, Path *best_path)
/* Recursively process the path tree */ /* Recursively process the path tree */
plan = create_plan_recurse(root, best_path); plan = create_plan_recurse(root, best_path);
/* Update parallel safety information if needed. */
if (!best_path->parallel_safe)
root->glob->wholePlanParallelSafe = false;
/* Check we successfully assigned all NestLoopParams to plan nodes */ /* Check we successfully assigned all NestLoopParams to plan nodes */
if (root->curOuterParams != NIL) if (root->curOuterParams != NIL)
elog(ERROR, "failed to assign all NestLoopParams to plan nodes"); elog(ERROR, "failed to assign all NestLoopParams to plan nodes");
...@@ -4829,6 +4833,7 @@ make_gather(List *qptlist, ...@@ -4829,6 +4833,7 @@ make_gather(List *qptlist,
plan->righttree = NULL; plan->righttree = NULL;
node->num_workers = nworkers; node->num_workers = nworkers;
node->single_copy = single_copy; node->single_copy = single_copy;
node->invisible = false;
return node; return node;
} }
......
...@@ -48,10 +48,12 @@ ...@@ -48,10 +48,12 @@
#include "storage/dsm_impl.h" #include "storage/dsm_impl.h"
#include "utils/rel.h" #include "utils/rel.h"
#include "utils/selfuncs.h" #include "utils/selfuncs.h"
#include "utils/syscache.h"
/* GUC parameter */ /* GUC parameters */
double cursor_tuple_fraction = DEFAULT_CURSOR_TUPLE_FRACTION; double cursor_tuple_fraction = DEFAULT_CURSOR_TUPLE_FRACTION;
int force_parallel_mode = FORCE_PARALLEL_OFF;
/* Hook for plugins to get control in planner() */ /* Hook for plugins to get control in planner() */
planner_hook_type planner_hook = NULL; planner_hook_type planner_hook = NULL;
...@@ -230,25 +232,31 @@ standard_planner(Query *parse, int cursorOptions, ParamListInfo boundParams) ...@@ -230,25 +232,31 @@ standard_planner(Query *parse, int cursorOptions, ParamListInfo boundParams)
!has_parallel_hazard((Node *) parse, true); !has_parallel_hazard((Node *) parse, true);
/* /*
* glob->parallelModeOK should tell us whether it's necessary to impose * glob->parallelModeNeeded should tell us whether it's necessary to
* the parallel mode restrictions, but we don't actually want to impose * impose the parallel mode restrictions, but we don't actually want to
* them unless we choose a parallel plan, so that people who mislabel * impose them unless we choose a parallel plan, so that people who
* their functions but don't use parallelism anyway aren't harmed. * mislabel their functions but don't use parallelism anyway aren't
* However, it's useful for testing purposes to be able to force the * harmed. But when force_parallel_mode is set, we enable the restrictions
* restrictions to be imposed whenever a parallel plan is actually chosen * whenever possible for testing purposes.
* or not.
* *
* (It's been suggested that we should always impose these restrictions * glob->wholePlanParallelSafe should tell us whether it's OK to stick a
* whenever glob->parallelModeOK is true, so that it's easier to notice * Gather node on top of the entire plan. However, it only needs to be
* incorrectly-labeled functions sooner. That might be the right thing to * accurate when force_parallel_mode is 'on' or 'regress', so we don't
* do, but for now I've taken this approach. We could also control this * bother doing the work otherwise. The value we set here is just a
* with a GUC.) * preliminary guess; it may get changed from true to false later, but
*/ * not visca versa.
#ifdef FORCE_PARALLEL_MODE */
glob->parallelModeNeeded = glob->parallelModeOK; if (force_parallel_mode == FORCE_PARALLEL_OFF || !glob->parallelModeOK)
#else {
glob->parallelModeNeeded = false; glob->parallelModeNeeded = false;
#endif glob->wholePlanParallelSafe = false; /* either false or don't care */
}
else
{
glob->parallelModeNeeded = true;
glob->wholePlanParallelSafe =
!has_parallel_hazard((Node *) parse, false);
}
/* Determine what fraction of the plan is likely to be scanned */ /* Determine what fraction of the plan is likely to be scanned */
if (cursorOptions & CURSOR_OPT_FAST_PLAN) if (cursorOptions & CURSOR_OPT_FAST_PLAN)
...@@ -292,6 +300,35 @@ standard_planner(Query *parse, int cursorOptions, ParamListInfo boundParams) ...@@ -292,6 +300,35 @@ standard_planner(Query *parse, int cursorOptions, ParamListInfo boundParams)
top_plan = materialize_finished_plan(top_plan); top_plan = materialize_finished_plan(top_plan);
} }
/*
* At present, we don't copy subplans to workers. The presence of a
* subplan in one part of the plan doesn't preclude the use of parallelism
* in some other part of the plan, but it does preclude the possibility of
* regarding the entire plan parallel-safe.
*/
if (glob->subplans != NULL)
glob->wholePlanParallelSafe = false;
/*
* Optionally add a Gather node for testing purposes, provided this is
* actually a safe thing to do.
*/
if (glob->wholePlanParallelSafe &&
force_parallel_mode != FORCE_PARALLEL_OFF)
{
Gather *gather = makeNode(Gather);
gather->plan.targetlist = top_plan->targetlist;
gather->plan.qual = NIL;
gather->plan.lefttree = top_plan;
gather->plan.righttree = NULL;
gather->num_workers = 1;
gather->single_copy = true;
gather->invisible = (force_parallel_mode == FORCE_PARALLEL_REGRESS);
root->glob->parallelModeNeeded = true;
top_plan = &gather->plan;
}
/* /*
* If any Params were generated, run through the plan tree and compute * If any Params were generated, run through the plan tree and compute
* each plan node's extParam/allParam sets. Ideally we'd merge this into * each plan node's extParam/allParam sets. Ideally we'd merge this into
......
...@@ -379,6 +379,19 @@ static const struct config_enum_entry huge_pages_options[] = { ...@@ -379,6 +379,19 @@ static const struct config_enum_entry huge_pages_options[] = {
{NULL, 0, false} {NULL, 0, false}
}; };
static const struct config_enum_entry force_parallel_mode_options[] = {
{"off", FORCE_PARALLEL_OFF, false},
{"on", FORCE_PARALLEL_ON, false},
{"regress", FORCE_PARALLEL_REGRESS, false},
{"true", FORCE_PARALLEL_ON, true},
{"false", FORCE_PARALLEL_OFF, true},
{"yes", FORCE_PARALLEL_ON, true},
{"no", FORCE_PARALLEL_OFF, true},
{"1", FORCE_PARALLEL_ON, true},
{"0", FORCE_PARALLEL_OFF, true},
{NULL, 0, false}
};
/* /*
* Options for enum values stored in other modules * Options for enum values stored in other modules
*/ */
...@@ -863,6 +876,7 @@ static struct config_bool ConfigureNamesBool[] = ...@@ -863,6 +876,7 @@ static struct config_bool ConfigureNamesBool[] =
true, true,
NULL, NULL, NULL NULL, NULL, NULL
}, },
{ {
{"geqo", PGC_USERSET, QUERY_TUNING_GEQO, {"geqo", PGC_USERSET, QUERY_TUNING_GEQO,
gettext_noop("Enables genetic query optimization."), gettext_noop("Enables genetic query optimization."),
...@@ -3672,6 +3686,16 @@ static struct config_enum ConfigureNamesEnum[] = ...@@ -3672,6 +3686,16 @@ static struct config_enum ConfigureNamesEnum[] =
NULL, NULL, NULL NULL, NULL, NULL
}, },
{
{"force_parallel_mode", PGC_USERSET, QUERY_TUNING_OTHER,
gettext_noop("Forces use of parallel query facilities."),
gettext_noop("If possible, run query using a parallel worker and with parallel restrictions.")
},
&force_parallel_mode,
FORCE_PARALLEL_OFF, force_parallel_mode_options,
NULL, NULL, NULL
},
/* End-of-list marker */ /* End-of-list marker */
{ {
{NULL, 0, 0, NULL, NULL}, NULL, 0, NULL, NULL, NULL, NULL {NULL, 0, 0, NULL, NULL}, NULL, 0, NULL, NULL, NULL, NULL
......
...@@ -313,6 +313,7 @@ ...@@ -313,6 +313,7 @@
#from_collapse_limit = 8 #from_collapse_limit = 8
#join_collapse_limit = 8 # 1 disables collapsing of explicit #join_collapse_limit = 8 # 1 disables collapsing of explicit
# JOIN clauses # JOIN clauses
#force_parallel_mode = off
#------------------------------------------------------------------------------ #------------------------------------------------------------------------------
......
...@@ -775,6 +775,7 @@ typedef struct Gather ...@@ -775,6 +775,7 @@ typedef struct Gather
Plan plan; Plan plan;
int num_workers; int num_workers;
bool single_copy; bool single_copy;
bool invisible; /* suppress EXPLAIN display (for testing)? */
} Gather; } Gather;
/* ---------------- /* ----------------
......
...@@ -108,6 +108,9 @@ typedef struct PlannerGlobal ...@@ -108,6 +108,9 @@ typedef struct PlannerGlobal
bool parallelModeOK; /* parallel mode potentially OK? */ bool parallelModeOK; /* parallel mode potentially OK? */
bool parallelModeNeeded; /* parallel mode actually required? */ bool parallelModeNeeded; /* parallel mode actually required? */
bool wholePlanParallelSafe; /* is the entire plan parallel safe? */
bool hasForeignJoin; /* does have a pushed down foreign join */ bool hasForeignJoin; /* does have a pushed down foreign join */
} PlannerGlobal; } PlannerGlobal;
......
...@@ -17,9 +17,18 @@ ...@@ -17,9 +17,18 @@
#include "nodes/plannodes.h" #include "nodes/plannodes.h"
#include "nodes/relation.h" #include "nodes/relation.h"
/* possible values for force_parallel_mode */
typedef enum
{
FORCE_PARALLEL_OFF,
FORCE_PARALLEL_ON,
FORCE_PARALLEL_REGRESS
} ForceParallelMode;
/* GUC parameters */ /* GUC parameters */
#define DEFAULT_CURSOR_TUPLE_FRACTION 0.1 #define DEFAULT_CURSOR_TUPLE_FRACTION 0.1
extern double cursor_tuple_fraction; extern double cursor_tuple_fraction;
extern int force_parallel_mode;
/* query_planner callback to compute query_pathkeys */ /* query_planner callback to compute query_pathkeys */
typedef void (*query_pathkeys_callback) (PlannerInfo *root, void *extra); typedef void (*query_pathkeys_callback) (PlannerInfo *root, void *extra);
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment