Commit b1495393 authored by Tom Lane

Revise FDW planning API, again.

Further reflection shows that a single callback isn't very workable if we
desire to let FDWs generate multiple Paths, because that forces the FDW to
do all work necessary to generate a valid Plan node for each Path.  Instead
split the former PlanForeignScan API into three steps: GetForeignRelSize,
GetForeignPaths, GetForeignPlan.  We had already bitten the bullet of breaking
the 9.1 FDW API for 9.2, so this shouldn't cause very much additional pain,
and it's substantially more flexible for complex FDWs.

Add an fdw_private field to RelOptInfo so that the new functions can save
state there rather than possibly having to recalculate information two or
three times.

In addition, we'd not thought through what would be needed to allow an FDW
to set up subexpressions of its choice for runtime execution.  We could
treat ForeignScan.fdw_private as an executable expression but that seems
likely to break existing FDWs unnecessarily (in particular, it would
restrict the set of node types allowable in fdw_private to those supported
by expression_tree_walker).  Instead, invent a separate field fdw_exprs
which will receive the postprocessing appropriate for expression trees.
(One field is enough since it can be a list of expressions; also, we assume
the corresponding expression state tree(s) will be held within fdw_state,
so we don't need to add anything to ForeignScanState.)

Per review of Hanada Shigeru's pgsql_fdw patch.  We may need to tweak this
further as we continue to work on that patch, but to me it feels a lot
closer to being right now.
parent 342baf4c
...@@ -26,6 +26,8 @@ ...@@ -26,6 +26,8 @@
#include "nodes/makefuncs.h" #include "nodes/makefuncs.h"
#include "optimizer/cost.h" #include "optimizer/cost.h"
#include "optimizer/pathnode.h" #include "optimizer/pathnode.h"
#include "optimizer/planmain.h"
#include "optimizer/restrictinfo.h"
#include "utils/rel.h" #include "utils/rel.h"
PG_MODULE_MAGIC; PG_MODULE_MAGIC;
...@@ -48,7 +50,7 @@ struct FileFdwOption ...@@ -48,7 +50,7 @@ struct FileFdwOption
* Note: If you are adding new option for user mapping, you need to modify * Note: If you are adding new option for user mapping, you need to modify
* fileGetOptions(), which currently doesn't bother to look at user mappings. * fileGetOptions(), which currently doesn't bother to look at user mappings.
*/ */
static struct FileFdwOption valid_options[] = { static const struct FileFdwOption valid_options[] = {
/* File options */ /* File options */
{"filename", ForeignTableRelationId}, {"filename", ForeignTableRelationId},
...@@ -71,6 +73,17 @@ static struct FileFdwOption valid_options[] = { ...@@ -71,6 +73,17 @@ static struct FileFdwOption valid_options[] = {
{NULL, InvalidOid} {NULL, InvalidOid}
}; };
/*
 * FDW-specific planning state, hung off RelOptInfo.fdw_private.
 *
 * One of these is palloc'd by fileGetForeignRelSize() and stored in
 * baserel->fdw_private.  filename and options are filled in there via
 * fileGetOptions(); pages and ntuples are filled in by estimate_size() and
 * read back by estimate_costs(), so the file does not have to be examined
 * again when paths are costed.
 */
typedef struct FileFdwPlanState
{
char *filename; /* file to read */
List *options; /* merged COPY options, excluding filename */
BlockNumber pages; /* estimate of file's physical size, in BLCKSZ-sized
					 * pages; estimate_size() never sets this below 1 */
double ntuples; /* estimate of number of rows in file, before any
				 * restriction quals are applied */
} FileFdwPlanState;
/* /*
* FDW-specific information for ForeignScanState.fdw_state. * FDW-specific information for ForeignScanState.fdw_state.
*/ */
...@@ -93,9 +106,18 @@ PG_FUNCTION_INFO_V1(file_fdw_validator); ...@@ -93,9 +106,18 @@ PG_FUNCTION_INFO_V1(file_fdw_validator);
/* /*
* FDW callback routines * FDW callback routines
*/ */
static void filePlanForeignScan(Oid foreigntableid, static void fileGetForeignRelSize(PlannerInfo *root,
PlannerInfo *root, RelOptInfo *baserel,
RelOptInfo *baserel); Oid foreigntableid);
static void fileGetForeignPaths(PlannerInfo *root,
RelOptInfo *baserel,
Oid foreigntableid);
static ForeignScan *fileGetForeignPlan(PlannerInfo *root,
RelOptInfo *baserel,
Oid foreigntableid,
ForeignPath *best_path,
List *tlist,
List *scan_clauses);
static void fileExplainForeignScan(ForeignScanState *node, ExplainState *es); static void fileExplainForeignScan(ForeignScanState *node, ExplainState *es);
static void fileBeginForeignScan(ForeignScanState *node, int eflags); static void fileBeginForeignScan(ForeignScanState *node, int eflags);
static TupleTableSlot *fileIterateForeignScan(ForeignScanState *node); static TupleTableSlot *fileIterateForeignScan(ForeignScanState *node);
...@@ -109,8 +131,10 @@ static bool is_valid_option(const char *option, Oid context); ...@@ -109,8 +131,10 @@ static bool is_valid_option(const char *option, Oid context);
static void fileGetOptions(Oid foreigntableid, static void fileGetOptions(Oid foreigntableid,
char **filename, List **other_options); char **filename, List **other_options);
static List *get_file_fdw_attribute_options(Oid relid); static List *get_file_fdw_attribute_options(Oid relid);
static void estimate_size(PlannerInfo *root, RelOptInfo *baserel,
FileFdwPlanState *fdw_private);
static void estimate_costs(PlannerInfo *root, RelOptInfo *baserel, static void estimate_costs(PlannerInfo *root, RelOptInfo *baserel,
const char *filename, FileFdwPlanState *fdw_private,
Cost *startup_cost, Cost *total_cost); Cost *startup_cost, Cost *total_cost);
...@@ -123,7 +147,9 @@ file_fdw_handler(PG_FUNCTION_ARGS) ...@@ -123,7 +147,9 @@ file_fdw_handler(PG_FUNCTION_ARGS)
{ {
FdwRoutine *fdwroutine = makeNode(FdwRoutine); FdwRoutine *fdwroutine = makeNode(FdwRoutine);
fdwroutine->PlanForeignScan = filePlanForeignScan; fdwroutine->GetForeignRelSize = fileGetForeignRelSize;
fdwroutine->GetForeignPaths = fileGetForeignPaths;
fdwroutine->GetForeignPlan = fileGetForeignPlan;
fdwroutine->ExplainForeignScan = fileExplainForeignScan; fdwroutine->ExplainForeignScan = fileExplainForeignScan;
fdwroutine->BeginForeignScan = fileBeginForeignScan; fdwroutine->BeginForeignScan = fileBeginForeignScan;
fdwroutine->IterateForeignScan = fileIterateForeignScan; fdwroutine->IterateForeignScan = fileIterateForeignScan;
...@@ -177,7 +203,7 @@ file_fdw_validator(PG_FUNCTION_ARGS) ...@@ -177,7 +203,7 @@ file_fdw_validator(PG_FUNCTION_ARGS)
if (!is_valid_option(def->defname, catalog)) if (!is_valid_option(def->defname, catalog))
{ {
struct FileFdwOption *opt; const struct FileFdwOption *opt;
StringInfoData buf; StringInfoData buf;
/* /*
...@@ -249,7 +275,7 @@ file_fdw_validator(PG_FUNCTION_ARGS) ...@@ -249,7 +275,7 @@ file_fdw_validator(PG_FUNCTION_ARGS)
static bool static bool
is_valid_option(const char *option, Oid context) is_valid_option(const char *option, Oid context)
{ {
struct FileFdwOption *opt; const struct FileFdwOption *opt;
for (opt = valid_options; opt->optname; opt++) for (opt = valid_options; opt->optname; opt++)
{ {
...@@ -381,7 +407,31 @@ get_file_fdw_attribute_options(Oid relid) ...@@ -381,7 +407,31 @@ get_file_fdw_attribute_options(Oid relid)
} }
/* /*
* filePlanForeignScan * fileGetForeignRelSize
* Obtain relation size estimates for a foreign table
*/
static void
fileGetForeignRelSize(PlannerInfo *root,
					  RelOptInfo *baserel,
					  Oid foreigntableid)
{
	/* Per-relation planning state; later planning steps find it via baserel */
	FileFdwPlanState *plan_state =
		(FileFdwPlanState *) palloc(sizeof(*plan_state));

	/*
	 * Only the filename is needed for the size estimate, but look up the
	 * complete option set now so that it need not be fetched again later in
	 * planning.
	 */
	fileGetOptions(foreigntableid,
				   &plan_state->filename,
				   &plan_state->options);

	/* Attach the state to the relation */
	baserel->fdw_private = plan_state;

	/* Compute the size estimates for this relation */
	estimate_size(root, baserel, plan_state);
}
/*
* fileGetForeignPaths
* Create possible access paths for a scan on the foreign table * Create possible access paths for a scan on the foreign table
* *
* Currently we don't support any push-down feature, so there is only one * Currently we don't support any push-down feature, so there is only one
...@@ -389,20 +439,16 @@ get_file_fdw_attribute_options(Oid relid) ...@@ -389,20 +439,16 @@ get_file_fdw_attribute_options(Oid relid)
* the data file. * the data file.
*/ */
static void static void
filePlanForeignScan(Oid foreigntableid, fileGetForeignPaths(PlannerInfo *root,
PlannerInfo *root, RelOptInfo *baserel,
RelOptInfo *baserel) Oid foreigntableid)
{ {
char *filename; FileFdwPlanState *fdw_private = (FileFdwPlanState *) baserel->fdw_private;
List *options;
Cost startup_cost; Cost startup_cost;
Cost total_cost; Cost total_cost;
/* Fetch options --- we only need filename at this point */ /* Estimate costs */
fileGetOptions(foreigntableid, &filename, &options); estimate_costs(root, baserel, fdw_private,
/* Estimate costs and update baserel->rows */
estimate_costs(root, baserel, filename,
&startup_cost, &total_cost); &startup_cost, &total_cost);
/* Create a ForeignPath node and add it as only possible path */ /* Create a ForeignPath node and add it as only possible path */
...@@ -422,6 +468,37 @@ filePlanForeignScan(Oid foreigntableid, ...@@ -422,6 +468,37 @@ filePlanForeignScan(Oid foreigntableid,
*/ */
} }
/*
 * fileGetForeignPlan
 *		Build the ForeignScan plan node used to scan the foreign table
 *
 * root, foreigntableid and best_path are not consulted here; the node is
 * built from baserel->relid, tlist and scan_clauses alone.
 */
static ForeignScan *
fileGetForeignPlan(PlannerInfo *root,
				   RelOptInfo *baserel,
				   Oid foreigntableid,
				   ForeignPath *best_path,
				   List *tlist,
				   List *scan_clauses)
{
	List	   *executor_quals;

	/*
	 * file_fdw cannot evaluate restriction clauses itself, so every scan
	 * clause goes into the plan node's qual list for the executor to check.
	 * The only work needed is to unwrap the RestrictInfo nodes, skipping
	 * pseudoconstant clauses (those are handled elsewhere).
	 */
	executor_quals = extract_actual_clauses(scan_clauses, false);

	/* Assemble and return the ForeignScan node */
	return make_foreignscan(tlist,
							executor_quals,
							baserel->relid,
							NIL,	/* no expressions to evaluate */
							NIL);	/* no private state either */
}
/* /*
* fileExplainForeignScan * fileExplainForeignScan
* Produce extra output for EXPLAIN * Produce extra output for EXPLAIN
...@@ -568,38 +645,38 @@ fileReScanForeignScan(ForeignScanState *node) ...@@ -568,38 +645,38 @@ fileReScanForeignScan(ForeignScanState *node)
} }
/* /*
* Estimate costs of scanning a foreign table. * Estimate size of a foreign table.
* *
* In addition to setting *startup_cost and *total_cost, this should * The main result is returned in baserel->rows. We also set
* update baserel->rows. * fdw_private->pages and fdw_private->ntuples for later use in the cost
* calculation.
*/ */
static void static void
estimate_costs(PlannerInfo *root, RelOptInfo *baserel, estimate_size(PlannerInfo *root, RelOptInfo *baserel,
const char *filename, FileFdwPlanState *fdw_private)
Cost *startup_cost, Cost *total_cost)
{ {
struct stat stat_buf; struct stat stat_buf;
BlockNumber pages; BlockNumber pages;
int tuple_width; int tuple_width;
double ntuples; double ntuples;
double nrows; double nrows;
Cost run_cost = 0;
Cost cpu_per_tuple;
/* /*
* Get size of the file. It might not be there at plan time, though, in * Get size of the file. It might not be there at plan time, though, in
* which case we have to use a default estimate. * which case we have to use a default estimate.
*/ */
if (stat(filename, &stat_buf) < 0) if (stat(fdw_private->filename, &stat_buf) < 0)
stat_buf.st_size = 10 * BLCKSZ; stat_buf.st_size = 10 * BLCKSZ;
/* /*
* Convert size to pages for use in I/O cost estimate below. * Convert size to pages for use in I/O cost estimate later.
*/ */
pages = (stat_buf.st_size + (BLCKSZ - 1)) / BLCKSZ; pages = (stat_buf.st_size + (BLCKSZ - 1)) / BLCKSZ;
if (pages < 1) if (pages < 1)
pages = 1; pages = 1;
fdw_private->pages = pages;
/* /*
* Estimate the number of tuples in the file. We back into this estimate * Estimate the number of tuples in the file. We back into this estimate
* using the planner's idea of the relation width; which is bogus if not * using the planner's idea of the relation width; which is bogus if not
...@@ -611,6 +688,8 @@ estimate_costs(PlannerInfo *root, RelOptInfo *baserel, ...@@ -611,6 +688,8 @@ estimate_costs(PlannerInfo *root, RelOptInfo *baserel,
ntuples = clamp_row_est((double) stat_buf.st_size / (double) tuple_width); ntuples = clamp_row_est((double) stat_buf.st_size / (double) tuple_width);
fdw_private->ntuples = ntuples;
/* /*
* Now estimate the number of rows returned by the scan after applying the * Now estimate the number of rows returned by the scan after applying the
* baserestrictinfo quals. This is pretty bogus too, since the planner * baserestrictinfo quals. This is pretty bogus too, since the planner
...@@ -627,12 +706,28 @@ estimate_costs(PlannerInfo *root, RelOptInfo *baserel, ...@@ -627,12 +706,28 @@ estimate_costs(PlannerInfo *root, RelOptInfo *baserel,
/* Save the output-rows estimate for the planner */ /* Save the output-rows estimate for the planner */
baserel->rows = nrows; baserel->rows = nrows;
}
/*
* Estimate costs of scanning a foreign table.
*
* Results are returned in *startup_cost and *total_cost.
*/
static void
estimate_costs(PlannerInfo *root, RelOptInfo *baserel,
FileFdwPlanState *fdw_private,
Cost *startup_cost, Cost *total_cost)
{
BlockNumber pages = fdw_private->pages;
double ntuples = fdw_private->ntuples;
Cost run_cost = 0;
Cost cpu_per_tuple;
/* /*
* Now estimate costs. We estimate costs almost the same way as * We estimate costs almost the same way as cost_seqscan(), thus assuming
* cost_seqscan(), thus assuming that I/O costs are equivalent to a * that I/O costs are equivalent to a regular table file of the same size.
* regular table file of the same size. However, we take per-tuple CPU * However, we take per-tuple CPU costs as 10x of a seqscan, to account
* costs as 10x of a seqscan, to account for the cost of parsing records. * for the cost of parsing records.
*/ */
run_cost += seq_page_cost * pages; run_cost += seq_page_cost * pages;
......
...@@ -89,52 +89,92 @@ ...@@ -89,52 +89,92 @@
<para> <para>
<programlisting> <programlisting>
void void
PlanForeignScan (Oid foreigntableid, GetForeignRelSize (PlannerInfo *root,
PlannerInfo *root, RelOptInfo *baserel,
RelOptInfo *baserel); Oid foreigntableid);
</programlisting> </programlisting>
Create possible access paths for a scan on a foreign table. This is Obtain relation size estimates for a foreign table. This is called
called when a query is planned. at the beginning of planning for a query involving a foreign table.
<literal>root</> is the planner's global information about the query;
<literal>baserel</> is the planner's information about this table; and
<literal>foreigntableid</> is the <structname>pg_class</> OID of the <literal>foreigntableid</> is the <structname>pg_class</> OID of the
foreign table. <literal>root</> is the planner's global information foreign table. (<literal>foreigntableid</> could be obtained from the
about the query, and <literal>baserel</> is the planner's information planner data structures, but it's passed explicitly to save effort.)
about this table.
</para> </para>
<para> <para>
The function must generate at least one access path (ForeignPath node) This function should update <literal>baserel-&gt;rows</> to be the
for a scan on the foreign table and must call <function>add_path</> to expected number of rows returned by the table scan, after accounting for
add the path to <literal>baserel-&gt;pathlist</>. It's recommended to the filtering done by the restriction quals. The initial value of
use <function>create_foreignscan_path</> to build the ForeignPath node. <literal>baserel-&gt;rows</> is just a constant default estimate, which
The function may generate multiple access paths, e.g., a path which has should be replaced if at all possible. The function may also choose to
valid <literal>pathkeys</> to represent a pre-sorted result. Each access update <literal>baserel-&gt;width</> if it can compute a better estimate
path must contain cost estimates, and can contain any FDW-private of the average result row width.
information that is needed to execute the foreign scan at a later time.
(Note that the private information must be represented in a form that
<function>copyObject</> knows how to copy.)
</para> </para>
<para> <para>
The information in <literal>root</> and <literal>baserel</> can be used See <xref linkend="fdw-planning"> for additional information.
to reduce the amount of information that has to be fetched from the </para>
foreign table (and therefore reduce the cost estimate).
<literal>baserel-&gt;baserestrictinfo</> is particularly interesting, as <para>
it contains restriction quals (<literal>WHERE</> clauses) that can be <programlisting>
used to filter the rows to be fetched. (The FDW is not required to void
enforce these quals, as the finished plan will recheck them anyway.) GetForeignPaths (PlannerInfo *root,
<literal>baserel-&gt;reltargetlist</> can be used to determine which RelOptInfo *baserel,
columns need to be fetched. Oid foreigntableid);
</programlisting>
Create possible access paths for a scan on a foreign table.
This is called during query planning.
The parameters are the same as for <function>GetForeignRelSize</>,
which has already been called.
</para>
<para>
This function must generate at least one access path
(<structname>ForeignPath</> node) for a scan on the foreign table and
must call <function>add_path</> to add each such path to
<literal>baserel-&gt;pathlist</>. It's recommended to use
<function>create_foreignscan_path</> to build the
<structname>ForeignPath</> nodes. The function can generate multiple
access paths, e.g., a path which has valid <literal>pathkeys</> to
represent a pre-sorted result. Each access path must contain cost
estimates, and can contain any FDW-private information that is needed to
identify the specific scan method intended.
</para>
<para>
See <xref linkend="fdw-planning"> for additional information.
</para>
<para>
<programlisting>
ForeignScan *
GetForeignPlan (PlannerInfo *root,
RelOptInfo *baserel,
Oid foreigntableid,
ForeignPath *best_path,
List *tlist,
List *scan_clauses);
</programlisting>
Create a <structname>ForeignScan</> plan node from the selected foreign
access path. This is called at the end of query planning.
The parameters are as for <function>GetForeignRelSize</>, plus
the selected <structname>ForeignPath</> (previously produced by
<function>GetForeignPaths</>), the target list to be emitted by the
plan node, and the restriction clauses to be enforced by the plan node.
</para> </para>
<para> <para>
In addition to returning cost estimates, the function should update This function must create and return a <structname>ForeignScan</> plan
<literal>baserel-&gt;rows</> to be the expected number of rows returned node; it's recommended to use <function>make_foreignscan</> to build the
by the scan, after accounting for the filtering done by the restriction <structname>ForeignScan</> node.
quals. The initial value of <literal>baserel-&gt;rows</> is just a </para>
constant default estimate, which should be replaced if at all possible.
The function may also choose to update <literal>baserel-&gt;width</> if <para>
it can compute a better estimate of the average result row width. See <xref linkend="fdw-planning"> for additional information.
</para> </para>
<para> <para>
...@@ -170,7 +210,7 @@ BeginForeignScan (ForeignScanState *node, ...@@ -170,7 +210,7 @@ BeginForeignScan (ForeignScanState *node,
the table to scan is accessible through the the table to scan is accessible through the
<structname>ForeignScanState</> node (in particular, from the underlying <structname>ForeignScanState</> node (in particular, from the underlying
<structname>ForeignScan</> plan node, which contains any FDW-private <structname>ForeignScan</> plan node, which contains any FDW-private
information provided by <function>PlanForeignScan</>). information provided by <function>GetForeignPlan</>).
</para> </para>
<para> <para>
...@@ -347,6 +387,126 @@ GetForeignServerByName(const char *name, bool missing_ok); ...@@ -347,6 +387,126 @@ GetForeignServerByName(const char *name, bool missing_ok);
return NULL if missing_ok is true, otherwise raise an error. return NULL if missing_ok is true, otherwise raise an error.
</para> </para>
</sect1>
<sect1 id="fdw-planning">
<title>Foreign Data Wrapper Query Planning</title>
<para>
The FDW callback functions <function>GetForeignRelSize</>,
<function>GetForeignPaths</>, and <function>GetForeignPlan</> must fit
into the workings of the <productname>PostgreSQL</> planner. Here are
some notes about what they must do.
</para>
<para>
The information in <literal>root</> and <literal>baserel</> can be used
to reduce the amount of information that has to be fetched from the
foreign table (and therefore reduce the cost).
<literal>baserel-&gt;baserestrictinfo</> is particularly interesting, as
it contains restriction quals (<literal>WHERE</> clauses) that should be
used to filter the rows to be fetched. (The FDW itself is not required
to enforce these quals, as the core executor can check them instead.)
<literal>baserel-&gt;reltargetlist</> can be used to determine which
columns need to be fetched; but note that it only lists columns that
have to be emitted by the <structname>ForeignScan</> plan node, not
columns that are used in qual evaluation but not output by the query.
</para>
<para>
Various private fields are available for the FDW planning functions to
keep information in. Generally, whatever you store in FDW private fields
should be palloc'd, so that it will be reclaimed at the end of planning.
</para>
<para>
<literal>baserel-&gt;fdw_private</> is a <type>void</> pointer that is
available for FDW planning functions to store information relevant to
the particular foreign table. The core planner does not touch it except
to initialize it to NULL when the <literal>baserel</> node is created.
It is useful for passing information forward from
<function>GetForeignRelSize</> to <function>GetForeignPaths</> and/or
from <function>GetForeignPaths</> to <function>GetForeignPlan</>, thereby
avoiding recalculation.
</para>
<para>
<function>GetForeignPaths</> can identify the meaning of different
access paths by storing private information in the
<structfield>fdw_private</> field of <structname>ForeignPath</> nodes.
<structfield>fdw_private</> is declared as a <type>List</> pointer, but
could actually contain anything since the core planner does not touch
it. However, best practice is to use a representation that's dumpable
by <function>nodeToString</>, for use with debugging support available
in the backend.
</para>
<para>
<function>GetForeignPlan</> can examine the <structfield>fdw_private</>
field of the selected <structname>ForeignPath</> node, and can generate
<structfield>fdw_exprs</> and <structfield>fdw_private</> lists to be
placed in the <structname>ForeignScan</> plan node, where they will be
available at execution time. Both of these lists must be
represented in a form that <function>copyObject</> knows how to copy.
The <structfield>fdw_private</> list has no other restrictions and is
not interpreted by the core backend in any way. The
<structfield>fdw_exprs</> list, if not NIL, is expected to contain
expression trees that are intended to be executed at runtime. These
trees will undergo post-processing by the planner to make them fully
executable.
</para>
<para>
In <function>GetForeignPlan</>, generally the passed-in targetlist can
be copied into the plan node as-is. The passed <literal>scan_clauses</> list
contains the same clauses as <literal>baserel-&gt;baserestrictinfo</>,
but may be re-ordered for better execution efficiency. In simple cases
the FDW can just strip <structname>RestrictInfo</> nodes from the
<literal>scan_clauses</> list (using <function>extract_actual_clauses</>) and put
all the clauses into the plan node's qual list, which means that all the
clauses will be checked by the executor at runtime. More complex FDWs
may be able to check some of the clauses internally, in which case those
clauses can be removed from the plan node's qual list so that the
executor doesn't waste time rechecking them.
</para>
<para>
As an example, the FDW might identify some restriction clauses of the
form <replaceable>foreign_variable</> <literal>=</>
<replaceable>sub_expression</>, which it determines can be executed on
the remote server given the locally-evaluated value of the
<replaceable>sub_expression</>. The actual identification of such a
clause should happen during <function>GetForeignPaths</>, since it would
affect the cost estimate for the path. The path's
<structfield>fdw_private</> field would probably include a pointer to
the identified clause's <structname>RestrictInfo</> node. Then
<function>GetForeignPlan</> would remove that clause from <literal>scan_clauses</>,
but add the <replaceable>sub_expression</> to <structfield>fdw_exprs</>
to ensure that it gets massaged into executable form. It would probably
also put control information into the plan node's
<structfield>fdw_private</> field to tell the execution functions what
to do at runtime. The query transmitted to the remote server would
involve something like <literal>WHERE <replaceable>foreign_variable</> =
$1</literal>, with the parameter value obtained at runtime from
evaluation of the <structfield>fdw_exprs</> expression tree.
</para>
<para>
The FDW should always construct at least one path that depends only on
the table's restriction clauses. In join queries, it might also choose
to construct path(s) that depend on join clauses, for example
<replaceable>foreign_variable</> <literal>=</>
<replaceable>local_variable</>. Such clauses will not be found in
<literal>baserel-&gt;baserestrictinfo</> but must be sought in the
relation's join lists. A path using such a clause is called a
<quote>parameterized path</>. It must show the other relation(s) as
<literal>required_outer</> and list the specific join clause(s) in
<literal>param_clauses</>. In <function>GetForeignPlan</>, the
<replaceable>local_variable</> portion of the join clause would be added
to <structfield>fdw_exprs</>, and then at runtime the case works the
same as for an ordinary restriction clause.
</para>
</sect1> </sect1>
</chapter> </chapter>
...@@ -591,8 +591,9 @@ _copyForeignScan(const ForeignScan *from) ...@@ -591,8 +591,9 @@ _copyForeignScan(const ForeignScan *from)
/* /*
* copy remainder of node * copy remainder of node
*/ */
COPY_SCALAR_FIELD(fsSystemCol); COPY_NODE_FIELD(fdw_exprs);
COPY_NODE_FIELD(fdw_private); COPY_NODE_FIELD(fdw_private);
COPY_SCALAR_FIELD(fsSystemCol);
return newnode; return newnode;
} }
......
...@@ -559,8 +559,9 @@ _outForeignScan(StringInfo str, const ForeignScan *node) ...@@ -559,8 +559,9 @@ _outForeignScan(StringInfo str, const ForeignScan *node)
_outScanInfo(str, (const Scan *) node); _outScanInfo(str, (const Scan *) node);
WRITE_BOOL_FIELD(fsSystemCol); WRITE_NODE_FIELD(fdw_exprs);
WRITE_NODE_FIELD(fdw_private); WRITE_NODE_FIELD(fdw_private);
WRITE_BOOL_FIELD(fsSystemCol);
} }
static void static void
...@@ -1741,6 +1742,7 @@ _outRelOptInfo(StringInfo str, const RelOptInfo *node) ...@@ -1741,6 +1742,7 @@ _outRelOptInfo(StringInfo str, const RelOptInfo *node)
WRITE_FLOAT_FIELD(allvisfrac, "%.6f"); WRITE_FLOAT_FIELD(allvisfrac, "%.6f");
WRITE_NODE_FIELD(subplan); WRITE_NODE_FIELD(subplan);
WRITE_NODE_FIELD(subroot); WRITE_NODE_FIELD(subroot);
/* we don't try to print fdwroutine or fdw_private */
WRITE_NODE_FIELD(baserestrictinfo); WRITE_NODE_FIELD(baserestrictinfo);
WRITE_NODE_FIELD(joininfo); WRITE_NODE_FIELD(joininfo);
WRITE_BOOL_FIELD(has_eclass_joins); WRITE_BOOL_FIELD(has_eclass_joins);
......
...@@ -396,6 +396,12 @@ set_foreign_size(PlannerInfo *root, RelOptInfo *rel, RangeTblEntry *rte) ...@@ -396,6 +396,12 @@ set_foreign_size(PlannerInfo *root, RelOptInfo *rel, RangeTblEntry *rte)
{ {
/* Mark rel with estimated output rows, width, etc */ /* Mark rel with estimated output rows, width, etc */
set_foreign_size_estimates(root, rel); set_foreign_size_estimates(root, rel);
/* Get FDW routine pointers for the rel */
rel->fdwroutine = GetFdwRoutineByRelId(rte->relid);
/* Let FDW adjust the size estimates, if it can */
rel->fdwroutine->GetForeignRelSize(root, rel, rte->relid);
} }
/* /*
...@@ -405,11 +411,8 @@ set_foreign_size(PlannerInfo *root, RelOptInfo *rel, RangeTblEntry *rte) ...@@ -405,11 +411,8 @@ set_foreign_size(PlannerInfo *root, RelOptInfo *rel, RangeTblEntry *rte)
static void static void
set_foreign_pathlist(PlannerInfo *root, RelOptInfo *rel, RangeTblEntry *rte) set_foreign_pathlist(PlannerInfo *root, RelOptInfo *rel, RangeTblEntry *rte)
{ {
FdwRoutine *fdwroutine; /* Call the FDW's GetForeignPaths function to generate path(s) */
rel->fdwroutine->GetForeignPaths(root, rel, rte->relid);
/* Call the FDW's PlanForeignScan function to generate path(s) */
fdwroutine = GetFdwRoutineByRelId(rte->relid);
fdwroutine->PlanForeignScan(rte->relid, root, rel);
/* Select cheapest path */ /* Select cheapest path */
set_cheapest(rel); set_cheapest(rel);
......
...@@ -3745,7 +3745,7 @@ set_cte_size_estimates(PlannerInfo *root, RelOptInfo *rel, Plan *cteplan) ...@@ -3745,7 +3745,7 @@ set_cte_size_estimates(PlannerInfo *root, RelOptInfo *rel, Plan *cteplan)
* using what will be purely datatype-driven estimates from the targetlist. * using what will be purely datatype-driven estimates from the targetlist.
* There is no way to do anything sane with the rows value, so we just put * There is no way to do anything sane with the rows value, so we just put
* a default estimate and hope that the wrapper can improve on it. The * a default estimate and hope that the wrapper can improve on it. The
* wrapper's PlanForeignScan function will be called momentarily. * wrapper's GetForeignRelSize function will be called momentarily.
* *
* The rel's targetlist and restrictinfo list must have been constructed * The rel's targetlist and restrictinfo list must have been constructed
* already. * already.
......
...@@ -20,6 +20,7 @@ ...@@ -20,6 +20,7 @@
#include <math.h> #include <math.h>
#include "access/skey.h" #include "access/skey.h"
#include "foreign/fdwapi.h"
#include "miscadmin.h" #include "miscadmin.h"
#include "nodes/makefuncs.h" #include "nodes/makefuncs.h"
#include "nodes/nodeFuncs.h" #include "nodes/nodeFuncs.h"
...@@ -119,8 +120,6 @@ static CteScan *make_ctescan(List *qptlist, List *qpqual, ...@@ -119,8 +120,6 @@ static CteScan *make_ctescan(List *qptlist, List *qpqual,
Index scanrelid, int ctePlanId, int cteParam); Index scanrelid, int ctePlanId, int cteParam);
static WorkTableScan *make_worktablescan(List *qptlist, List *qpqual, static WorkTableScan *make_worktablescan(List *qptlist, List *qpqual,
Index scanrelid, int wtParam); Index scanrelid, int wtParam);
static ForeignScan *make_foreignscan(List *qptlist, List *qpqual,
Index scanrelid, bool fsSystemCol, List *fdw_private);
static BitmapAnd *make_bitmap_and(List *bitmapplans); static BitmapAnd *make_bitmap_and(List *bitmapplans);
static BitmapOr *make_bitmap_or(List *bitmapplans); static BitmapOr *make_bitmap_or(List *bitmapplans);
static NestLoop *make_nestloop(List *tlist, static NestLoop *make_nestloop(List *tlist,
...@@ -1816,7 +1815,6 @@ create_foreignscan_plan(PlannerInfo *root, ForeignPath *best_path, ...@@ -1816,7 +1815,6 @@ create_foreignscan_plan(PlannerInfo *root, ForeignPath *best_path,
RelOptInfo *rel = best_path->path.parent; RelOptInfo *rel = best_path->path.parent;
Index scan_relid = rel->relid; Index scan_relid = rel->relid;
RangeTblEntry *rte; RangeTblEntry *rte;
bool fsSystemCol;
int i; int i;
/* it should be a base rel... */ /* it should be a base rel... */
...@@ -1825,31 +1823,56 @@ create_foreignscan_plan(PlannerInfo *root, ForeignPath *best_path, ...@@ -1825,31 +1823,56 @@ create_foreignscan_plan(PlannerInfo *root, ForeignPath *best_path,
rte = planner_rt_fetch(scan_relid, root); rte = planner_rt_fetch(scan_relid, root);
Assert(rte->rtekind == RTE_RELATION); Assert(rte->rtekind == RTE_RELATION);
/* Sort clauses into best execution order */ /*
* Sort clauses into best execution order. We do this first since the
* FDW might have more info than we do and wish to adjust the ordering.
*/
scan_clauses = order_qual_clauses(root, scan_clauses); scan_clauses = order_qual_clauses(root, scan_clauses);
/* Reduce RestrictInfo list to bare expressions; ignore pseudoconstants */ /*
scan_clauses = extract_actual_clauses(scan_clauses, false); * Let the FDW perform its processing on the restriction clauses and
* generate the plan node. Note that the FDW might remove restriction
* clauses that it intends to execute remotely, or even add more (if it
* has selected some join clauses for remote use but also wants them
* rechecked locally).
*/
scan_plan = rel->fdwroutine->GetForeignPlan(root, rel, rte->relid,
best_path,
tlist, scan_clauses);
/* Copy cost data from Path to Plan; no need to make FDW do this */
copy_path_costsize(&scan_plan->scan.plan, &best_path->path);
/* Detect whether any system columns are requested from rel */ /*
fsSystemCol = false; * Replace any outer-relation variables with nestloop params in the qual
* and fdw_exprs expressions. We do this last so that the FDW doesn't
* have to be involved. (Note that parts of fdw_exprs could have come
* from join clauses, so doing this beforehand on the scan_clauses
* wouldn't work.)
*/
if (best_path->path.required_outer)
{
scan_plan->scan.plan.qual = (List *)
replace_nestloop_params(root, (Node *) scan_plan->scan.plan.qual);
scan_plan->fdw_exprs = (List *)
replace_nestloop_params(root, (Node *) scan_plan->fdw_exprs);
}
/*
* Detect whether any system columns are requested from rel. This is a
* bit of a kluge and might go away someday, so we intentionally leave it
* out of the API presented to FDWs.
*/
scan_plan->fsSystemCol = false;
for (i = rel->min_attr; i < 0; i++) for (i = rel->min_attr; i < 0; i++)
{ {
if (!bms_is_empty(rel->attr_needed[i - rel->min_attr])) if (!bms_is_empty(rel->attr_needed[i - rel->min_attr]))
{ {
fsSystemCol = true; scan_plan->fsSystemCol = true;
break; break;
} }
} }
scan_plan = make_foreignscan(tlist,
scan_clauses,
scan_relid,
fsSystemCol,
best_path->fdw_private);
copy_path_costsize(&scan_plan->scan.plan, &best_path->path);
return scan_plan; return scan_plan;
} }
...@@ -3183,24 +3206,26 @@ make_worktablescan(List *qptlist, ...@@ -3183,24 +3206,26 @@ make_worktablescan(List *qptlist,
return node; return node;
} }
static ForeignScan * ForeignScan *
make_foreignscan(List *qptlist, make_foreignscan(List *qptlist,
List *qpqual, List *qpqual,
Index scanrelid, Index scanrelid,
bool fsSystemCol, List *fdw_exprs,
List *fdw_private) List *fdw_private)
{ {
ForeignScan *node = makeNode(ForeignScan); ForeignScan *node = makeNode(ForeignScan);
Plan *plan = &node->scan.plan; Plan *plan = &node->scan.plan;
/* cost should be inserted by caller */ /* cost will be filled in by create_foreignscan_plan */
plan->targetlist = qptlist; plan->targetlist = qptlist;
plan->qual = qpqual; plan->qual = qpqual;
plan->lefttree = NULL; plan->lefttree = NULL;
plan->righttree = NULL; plan->righttree = NULL;
node->scan.scanrelid = scanrelid; node->scan.scanrelid = scanrelid;
node->fsSystemCol = fsSystemCol; node->fdw_exprs = fdw_exprs;
node->fdw_private = fdw_private; node->fdw_private = fdw_private;
/* fsSystemCol will be filled in by create_foreignscan_plan */
node->fsSystemCol = false;
return node; return node;
} }
......
...@@ -428,6 +428,8 @@ set_plan_refs(PlannerInfo *root, Plan *plan, int rtoffset) ...@@ -428,6 +428,8 @@ set_plan_refs(PlannerInfo *root, Plan *plan, int rtoffset)
fix_scan_list(root, splan->scan.plan.targetlist, rtoffset); fix_scan_list(root, splan->scan.plan.targetlist, rtoffset);
splan->scan.plan.qual = splan->scan.plan.qual =
fix_scan_list(root, splan->scan.plan.qual, rtoffset); fix_scan_list(root, splan->scan.plan.qual, rtoffset);
splan->fdw_exprs =
fix_scan_list(root, splan->fdw_exprs, rtoffset);
} }
break; break;
......
...@@ -2137,6 +2137,8 @@ finalize_plan(PlannerInfo *root, Plan *plan, Bitmapset *valid_params, ...@@ -2137,6 +2137,8 @@ finalize_plan(PlannerInfo *root, Plan *plan, Bitmapset *valid_params,
break; break;
case T_ForeignScan: case T_ForeignScan:
finalize_primnode((Node *) ((ForeignScan *) plan)->fdw_exprs,
&context);
context.paramids = bms_add_members(context.paramids, scan_params); context.paramids = bms_add_members(context.paramids, scan_params);
break; break;
......
...@@ -1767,7 +1767,7 @@ create_worktablescan_path(PlannerInfo *root, RelOptInfo *rel) ...@@ -1767,7 +1767,7 @@ create_worktablescan_path(PlannerInfo *root, RelOptInfo *rel)
* returning the pathnode. * returning the pathnode.
* *
* This function is never called from core Postgres; rather, it's expected * This function is never called from core Postgres; rather, it's expected
* to be called by the PlanForeignScan function of a foreign data wrapper. * to be called by the GetForeignPaths function of a foreign data wrapper.
* We make the FDW supply all fields of the path, since we do not have any * We make the FDW supply all fields of the path, since we do not have any
* way to calculate them in core. * way to calculate them in core.
*/ */
......
...@@ -113,6 +113,8 @@ build_simple_rel(PlannerInfo *root, int relid, RelOptKind reloptkind) ...@@ -113,6 +113,8 @@ build_simple_rel(PlannerInfo *root, int relid, RelOptKind reloptkind)
rel->allvisfrac = 0; rel->allvisfrac = 0;
rel->subplan = NULL; rel->subplan = NULL;
rel->subroot = NULL; rel->subroot = NULL;
rel->fdwroutine = NULL;
rel->fdw_private = NULL;
rel->baserestrictinfo = NIL; rel->baserestrictinfo = NIL;
rel->baserestrictcost.startup = 0; rel->baserestrictcost.startup = 0;
rel->baserestrictcost.per_tuple = 0; rel->baserestrictcost.per_tuple = 0;
...@@ -366,6 +368,8 @@ build_join_rel(PlannerInfo *root, ...@@ -366,6 +368,8 @@ build_join_rel(PlannerInfo *root,
joinrel->allvisfrac = 0; joinrel->allvisfrac = 0;
joinrel->subplan = NULL; joinrel->subplan = NULL;
joinrel->subroot = NULL; joinrel->subroot = NULL;
joinrel->fdwroutine = NULL;
joinrel->fdw_private = NULL;
joinrel->baserestrictinfo = NIL; joinrel->baserestrictinfo = NIL;
joinrel->baserestrictcost.startup = 0; joinrel->baserestrictcost.startup = 0;
joinrel->baserestrictcost.per_tuple = 0; joinrel->baserestrictcost.per_tuple = 0;
......
...@@ -23,9 +23,20 @@ struct ExplainState; ...@@ -23,9 +23,20 @@ struct ExplainState;
* Callback function signatures --- see fdwhandler.sgml for more info. * Callback function signatures --- see fdwhandler.sgml for more info.
*/ */
typedef void (*PlanForeignScan_function) (Oid foreigntableid, typedef void (*GetForeignRelSize_function) (PlannerInfo *root,
PlannerInfo *root, RelOptInfo *baserel,
RelOptInfo *baserel); Oid foreigntableid);
typedef void (*GetForeignPaths_function) (PlannerInfo *root,
RelOptInfo *baserel,
Oid foreigntableid);
typedef ForeignScan *(*GetForeignPlan_function) (PlannerInfo *root,
RelOptInfo *baserel,
Oid foreigntableid,
ForeignPath *best_path,
List *tlist,
List *scan_clauses);
typedef void (*ExplainForeignScan_function) (ForeignScanState *node, typedef void (*ExplainForeignScan_function) (ForeignScanState *node,
struct ExplainState *es); struct ExplainState *es);
...@@ -53,7 +64,9 @@ typedef struct FdwRoutine ...@@ -53,7 +64,9 @@ typedef struct FdwRoutine
{ {
NodeTag type; NodeTag type;
PlanForeignScan_function PlanForeignScan; GetForeignRelSize_function GetForeignRelSize;
GetForeignPaths_function GetForeignPaths;
GetForeignPlan_function GetForeignPlan;
ExplainForeignScan_function ExplainForeignScan; ExplainForeignScan_function ExplainForeignScan;
BeginForeignScan_function BeginForeignScan; BeginForeignScan_function BeginForeignScan;
IterateForeignScan_function IterateForeignScan; IterateForeignScan_function IterateForeignScan;
......
...@@ -462,13 +462,22 @@ typedef struct WorkTableScan ...@@ -462,13 +462,22 @@ typedef struct WorkTableScan
/* ---------------- /* ----------------
* ForeignScan node * ForeignScan node
*
* fdw_exprs and fdw_private are both under the control of the foreign-data
* wrapper, but fdw_exprs is presumed to contain expression trees and will
* be post-processed accordingly by the planner; fdw_private won't be.
* Note that everything in both lists must be copiable by copyObject().
* One way to store an arbitrary blob of bytes is to represent it as a bytea
* Const. Usually, though, you'll be better off choosing a representation
* that can be dumped usefully by nodeToString().
* ---------------- * ----------------
*/ */
typedef struct ForeignScan typedef struct ForeignScan
{ {
Scan scan; Scan scan;
bool fsSystemCol; /* true if any "system column" is needed */ List *fdw_exprs; /* expressions that FDW may evaluate */
List *fdw_private; /* private data for FDW */ List *fdw_private; /* private data for FDW */
bool fsSystemCol; /* true if any "system column" is needed */
} ForeignScan; } ForeignScan;
......
...@@ -334,10 +334,13 @@ typedef struct PlannerInfo ...@@ -334,10 +334,13 @@ typedef struct PlannerInfo
* allvisfrac - fraction of disk pages that are marked all-visible * allvisfrac - fraction of disk pages that are marked all-visible
* subplan - plan for subquery (NULL if it's not a subquery) * subplan - plan for subquery (NULL if it's not a subquery)
* subroot - PlannerInfo for subquery (NULL if it's not a subquery) * subroot - PlannerInfo for subquery (NULL if it's not a subquery)
* fdwroutine - function hooks for FDW, if foreign table (else NULL)
* fdw_private - private state for FDW, if foreign table (else NULL)
* *
* Note: for a subquery, tuples, subplan, subroot are not set immediately * Note: for a subquery, tuples, subplan, subroot are not set immediately
* upon creation of the RelOptInfo object; they are filled in when * upon creation of the RelOptInfo object; they are filled in when
* set_base_rel_pathlist processes the object. * set_subquery_pathlist processes the object. Likewise, fdwroutine
* and fdw_private are filled during initial path creation.
* *
* For otherrels that are appendrel members, these fields are filled * For otherrels that are appendrel members, these fields are filled
* in just as for a baserel. * in just as for a baserel.
...@@ -414,8 +417,12 @@ typedef struct RelOptInfo ...@@ -414,8 +417,12 @@ typedef struct RelOptInfo
BlockNumber pages; /* size estimates derived from pg_class */ BlockNumber pages; /* size estimates derived from pg_class */
double tuples; double tuples;
double allvisfrac; double allvisfrac;
/* use "struct Plan" to avoid including plannodes.h here */
struct Plan *subplan; /* if subquery */ struct Plan *subplan; /* if subquery */
PlannerInfo *subroot; /* if subquery */ PlannerInfo *subroot; /* if subquery */
/* use "struct FdwRoutine" to avoid including fdwapi.h here */
struct FdwRoutine *fdwroutine; /* if foreign table */
void *fdw_private; /* if foreign table */
/* used by various scans and joins: */ /* used by various scans and joins: */
List *baserestrictinfo; /* RestrictInfo structures (if base List *baserestrictinfo; /* RestrictInfo structures (if base
...@@ -793,14 +800,13 @@ typedef struct TidPath ...@@ -793,14 +800,13 @@ typedef struct TidPath
} TidPath; } TidPath;
/* /*
* ForeignPath represents a scan of a foreign table * ForeignPath represents a potential scan of a foreign table
* *
* fdw_private contains FDW private data about the scan, which will be copied * fdw_private stores FDW private data about the scan. While fdw_private is
* to the final ForeignScan plan node so that it is available at execution * not actually touched by the core code during normal operations, it's
* time. Note that everything in this list must be copiable by copyObject(). * generally a good idea to use a representation that can be dumped by
* One way to store an arbitrary blob of bytes is to represent it as a bytea * nodeToString(), so that you can examine the structure during debugging
* Const. Usually, though, you'll be better off choosing a representation * with tools like pprint().
* that can be dumped usefully by nodeToString().
*/ */
typedef struct ForeignPath typedef struct ForeignPath
{ {
......
...@@ -42,6 +42,8 @@ extern Plan *optimize_minmax_aggregates(PlannerInfo *root, List *tlist, ...@@ -42,6 +42,8 @@ extern Plan *optimize_minmax_aggregates(PlannerInfo *root, List *tlist,
extern Plan *create_plan(PlannerInfo *root, Path *best_path); extern Plan *create_plan(PlannerInfo *root, Path *best_path);
extern SubqueryScan *make_subqueryscan(List *qptlist, List *qpqual, extern SubqueryScan *make_subqueryscan(List *qptlist, List *qpqual,
Index scanrelid, Plan *subplan); Index scanrelid, Plan *subplan);
extern ForeignScan *make_foreignscan(List *qptlist, List *qpqual,
Index scanrelid, List *fdw_exprs, List *fdw_private);
extern Append *make_append(List *appendplans, List *tlist); extern Append *make_append(List *appendplans, List *tlist);
extern RecursiveUnion *make_recursive_union(List *tlist, extern RecursiveUnion *make_recursive_union(List *tlist,
Plan *lefttree, Plan *righttree, int wtParam, Plan *lefttree, Plan *righttree, int wtParam,
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment