Commit 5b931237 authored by Tom Lane's avatar Tom Lane

Load relcache entries' partitioning data on-demand, not immediately.

Formerly the rd_partkey and rd_partdesc data structures were always
populated immediately when a relcache entry was built or rebuilt.
This patch changes things so that they are populated only when they
are first requested.  (Hence, callers *must* now always use
RelationGetPartitionKey or RelationGetPartitionDesc; just fetching
the pointer directly is no longer acceptable.)

This seems to have some performance benefits, but the main reason to do
it is that it eliminates a recursive-reload failure that occurs if the
partkey or partdesc expressions contain any references to the relation's
rowtype (as discovered by Amit Langote).  In retrospect, since loading
these data structures might result in execution of nearly-arbitrary code
via eval_const_expressions, it was a dumb idea to require that to happen
during relcache entry rebuild.

Also, fix things so that old copies of a relcache partition descriptor
will be dropped when the cache entry's refcount goes to zero.  In the
previous coding it was possible for such copies to survive for the
lifetime of the session, as I'd complained of in a previous discussion.
(This management technique still isn't perfect, but it's better than
before.)  Improve the commentary explaining how that works and why
it's safe to hand out direct pointers to these relcache substructures.

In passing, improve RelationBuildPartitionDesc by using the same
memory-context-parent-swap approach used by RelationBuildPartitionKey,
thereby making it less dependent on strong assumptions about what
partition_bounds_copy does.  Avoid doing get_rel_relkind in the
critical section, too.

Patch by Amit Langote and Tom Lane; Robert Haas deserves some credit
for prior work in the area, too.  Although this is a pre-existing
problem, no back-patch: the patch seems too invasive to be safe to
back-patch, and the bug it fixes is a corner case that seems
relatively unlikely to cause problems in the field.

Discussion: https://postgr.es/m/CA+HiwqFUzjfj9HEsJtYWcr1SgQ_=iCAvQ=O2Sx6aQxoDu4OiHw@mail.gmail.com
Discussion: https://postgr.es/m/CA+TgmoY3bRmGB6-DUnoVy5fJoreiBJ43rwMrQRCdPXuKt4Ykaw@mail.gmail.com
parent 8ce3aa9b
...@@ -83,7 +83,6 @@ ...@@ -83,7 +83,6 @@
#include "utils/inval.h" #include "utils/inval.h"
#include "utils/lsyscache.h" #include "utils/lsyscache.h"
#include "utils/partcache.h" #include "utils/partcache.h"
#include "utils/rel.h"
#include "utils/ruleutils.h" #include "utils/ruleutils.h"
#include "utils/snapmgr.h" #include "utils/snapmgr.h"
#include "utils/syscache.h" #include "utils/syscache.h"
......
...@@ -812,7 +812,7 @@ DefineIndex(Oid relationId, ...@@ -812,7 +812,7 @@ DefineIndex(Oid relationId,
*/ */
if (partitioned && (stmt->unique || stmt->primary)) if (partitioned && (stmt->unique || stmt->primary))
{ {
PartitionKey key = rel->rd_partkey; PartitionKey key = RelationGetPartitionKey(rel);
int i; int i;
/* /*
......
...@@ -30,7 +30,6 @@ ...@@ -30,7 +30,6 @@
#include "rewrite/rewriteManip.h" #include "rewrite/rewriteManip.h"
#include "utils/lsyscache.h" #include "utils/lsyscache.h"
#include "utils/partcache.h" #include "utils/partcache.h"
#include "utils/rel.h"
#include "utils/rls.h" #include "utils/rls.h"
#include "utils/ruleutils.h" #include "utils/ruleutils.h"
......
...@@ -35,7 +35,6 @@ ...@@ -35,7 +35,6 @@
#include "utils/hashutils.h" #include "utils/hashutils.h"
#include "utils/lsyscache.h" #include "utils/lsyscache.h"
#include "utils/partcache.h" #include "utils/partcache.h"
#include "utils/rel.h"
#include "utils/ruleutils.h" #include "utils/ruleutils.h"
#include "utils/snapmgr.h" #include "utils/snapmgr.h"
#include "utils/syscache.h" #include "utils/syscache.h"
...@@ -775,6 +774,11 @@ partition_bounds_equal(int partnatts, int16 *parttyplen, bool *parttypbyval, ...@@ -775,6 +774,11 @@ partition_bounds_equal(int partnatts, int16 *parttyplen, bool *parttypbyval,
/* /*
* Return a copy of given PartitionBoundInfo structure. The data types of bounds * Return a copy of given PartitionBoundInfo structure. The data types of bounds
* are described by given partition key specification. * are described by given partition key specification.
*
* Note: it's important that this function and its callees not do any catalog
* access, nor anything else that would result in allocating memory other than
* the returned data structure. Since this is called in a long-lived context,
* that would result in unwanted memory leaks.
*/ */
PartitionBoundInfo PartitionBoundInfo
partition_bounds_copy(PartitionBoundInfo src, partition_bounds_copy(PartitionBoundInfo src,
......
...@@ -47,17 +47,48 @@ typedef struct PartitionDirectoryEntry ...@@ -47,17 +47,48 @@ typedef struct PartitionDirectoryEntry
PartitionDesc pd; PartitionDesc pd;
} PartitionDirectoryEntry; } PartitionDirectoryEntry;
static void RelationBuildPartitionDesc(Relation rel);
/*
* RelationGetPartitionDesc -- get partition descriptor, if relation is partitioned
*
* Note: we arrange for partition descriptors to not get freed until the
* relcache entry's refcount goes to zero (see hacks in RelationClose,
* RelationClearRelation, and RelationBuildPartitionDesc). Therefore, even
* though we hand back a direct pointer into the relcache entry, it's safe
* for callers to continue to use that pointer as long as (a) they hold the
* relation open, and (b) they hold a relation lock strong enough to ensure
* that the data doesn't become stale.
*/
PartitionDesc
RelationGetPartitionDesc(Relation rel)
{
if (rel->rd_rel->relkind != RELKIND_PARTITIONED_TABLE)
return NULL;
if (unlikely(rel->rd_partdesc == NULL))
RelationBuildPartitionDesc(rel);
return rel->rd_partdesc;
}
/* /*
* RelationBuildPartitionDesc * RelationBuildPartitionDesc
* Form rel's partition descriptor, and store in relcache entry * Form rel's partition descriptor, and store in relcache entry
* *
* Note: the descriptor won't be flushed from the cache by * Partition descriptor is a complex structure; to avoid complicated logic to
* RelationClearRelation() unless it's changed because of * free individual elements whenever the relcache entry is flushed, we give it
* addition or removal of a partition. Hence, code holding a lock * its own memory context, a child of CacheMemoryContext, which can easily be
* that's sufficient to prevent that can assume that rd_partdesc * deleted on its own. To avoid leaking memory in that context in case of an
* won't change underneath it. * error partway through this function, the context is initially created as a
* child of CurTransactionContext and only re-parented to CacheMemoryContext
* at the end, when no further errors are possible. Also, we don't make this
* context the current context except in very brief code sections, out of fear
* that some of our callees allocate memory on their own which would be leaked
* permanently.
*/ */
void static void
RelationBuildPartitionDesc(Relation rel) RelationBuildPartitionDesc(Relation rel)
{ {
PartitionDesc partdesc; PartitionDesc partdesc;
...@@ -65,10 +96,12 @@ RelationBuildPartitionDesc(Relation rel) ...@@ -65,10 +96,12 @@ RelationBuildPartitionDesc(Relation rel)
List *inhoids; List *inhoids;
PartitionBoundSpec **boundspecs = NULL; PartitionBoundSpec **boundspecs = NULL;
Oid *oids = NULL; Oid *oids = NULL;
bool *is_leaf = NULL;
ListCell *cell; ListCell *cell;
int i, int i,
nparts; nparts;
PartitionKey key = RelationGetPartitionKey(rel); PartitionKey key = RelationGetPartitionKey(rel);
MemoryContext new_pdcxt;
MemoryContext oldcxt; MemoryContext oldcxt;
int *mapping; int *mapping;
...@@ -81,10 +114,11 @@ RelationBuildPartitionDesc(Relation rel) ...@@ -81,10 +114,11 @@ RelationBuildPartitionDesc(Relation rel)
inhoids = find_inheritance_children(RelationGetRelid(rel), NoLock); inhoids = find_inheritance_children(RelationGetRelid(rel), NoLock);
nparts = list_length(inhoids); nparts = list_length(inhoids);
/* Allocate arrays for OIDs and boundspecs. */ /* Allocate working arrays for OIDs, leaf flags, and boundspecs. */
if (nparts > 0) if (nparts > 0)
{ {
oids = palloc(nparts * sizeof(Oid)); oids = (Oid *) palloc(nparts * sizeof(Oid));
is_leaf = (bool *) palloc(nparts * sizeof(bool));
boundspecs = palloc(nparts * sizeof(PartitionBoundSpec *)); boundspecs = palloc(nparts * sizeof(PartitionBoundSpec *));
} }
...@@ -172,65 +206,73 @@ RelationBuildPartitionDesc(Relation rel) ...@@ -172,65 +206,73 @@ RelationBuildPartitionDesc(Relation rel)
/* Save results. */ /* Save results. */
oids[i] = inhrelid; oids[i] = inhrelid;
is_leaf[i] = (get_rel_relkind(inhrelid) != RELKIND_PARTITIONED_TABLE);
boundspecs[i] = boundspec; boundspecs[i] = boundspec;
++i; ++i;
} }
/* Assert we aren't about to leak any old data structure */ /*
Assert(rel->rd_pdcxt == NULL); * Create PartitionBoundInfo and mapping, working in the caller's context.
Assert(rel->rd_partdesc == NULL); * This could fail, but we haven't done any damage if so.
*/
if (nparts > 0)
boundinfo = partition_bounds_create(boundspecs, nparts, key, &mapping);
/* /*
* Now build the actual relcache partition descriptor. Note that the * Now build the actual relcache partition descriptor, copying all the
* order of operations here is fairly critical. If we fail partway * data into a new, small context. As per above comment, we don't make
* through this code, we won't have leaked memory because the rd_pdcxt is * this a long-lived context until it's finished.
* attached to the relcache entry immediately, so it'll be freed whenever
* the entry is rebuilt or destroyed. However, we don't assign to
* rd_partdesc until the cached data structure is fully complete and
* valid, so that no other code might try to use it.
*/ */
rel->rd_pdcxt = AllocSetContextCreate(CacheMemoryContext, new_pdcxt = AllocSetContextCreate(CurTransactionContext,
"partition descriptor", "partition descriptor",
ALLOCSET_SMALL_SIZES); ALLOCSET_SMALL_SIZES);
MemoryContextCopyAndSetIdentifier(rel->rd_pdcxt, MemoryContextCopyAndSetIdentifier(new_pdcxt,
RelationGetRelationName(rel)); RelationGetRelationName(rel));
partdesc = (PartitionDescData *) partdesc = (PartitionDescData *)
MemoryContextAllocZero(rel->rd_pdcxt, sizeof(PartitionDescData)); MemoryContextAllocZero(new_pdcxt, sizeof(PartitionDescData));
partdesc->nparts = nparts; partdesc->nparts = nparts;
/* If there are no partitions, the rest of the partdesc can stay zero */ /* If there are no partitions, the rest of the partdesc can stay zero */
if (nparts > 0) if (nparts > 0)
{ {
/* Create PartitionBoundInfo, using the caller's context. */ oldcxt = MemoryContextSwitchTo(new_pdcxt);
boundinfo = partition_bounds_create(boundspecs, nparts, key, &mapping);
/* Now copy all info into relcache's partdesc. */
oldcxt = MemoryContextSwitchTo(rel->rd_pdcxt);
partdesc->boundinfo = partition_bounds_copy(boundinfo, key); partdesc->boundinfo = partition_bounds_copy(boundinfo, key);
partdesc->oids = (Oid *) palloc(nparts * sizeof(Oid)); partdesc->oids = (Oid *) palloc(nparts * sizeof(Oid));
partdesc->is_leaf = (bool *) palloc(nparts * sizeof(bool)); partdesc->is_leaf = (bool *) palloc(nparts * sizeof(bool));
MemoryContextSwitchTo(oldcxt);
/* /*
* Assign OIDs from the original array into mapped indexes of the * Assign OIDs from the original array into mapped indexes of the
* result array. The order of OIDs in the former is defined by the * result array. The order of OIDs in the former is defined by the
* catalog scan that retrieved them, whereas that in the latter is * catalog scan that retrieved them, whereas that in the latter is
* defined by canonicalized representation of the partition bounds. * defined by canonicalized representation of the partition bounds.
* * Also save leaf-ness of each partition.
* Also record leaf-ness of each partition. For this we use
* get_rel_relkind() which may leak memory, so be sure to run it in
* the caller's context.
*/ */
for (i = 0; i < nparts; i++) for (i = 0; i < nparts; i++)
{ {
int index = mapping[i]; int index = mapping[i];
partdesc->oids[index] = oids[i]; partdesc->oids[index] = oids[i];
partdesc->is_leaf[index] = partdesc->is_leaf[index] = is_leaf[i];
(get_rel_relkind(oids[i]) != RELKIND_PARTITIONED_TABLE);
} }
MemoryContextSwitchTo(oldcxt);
} }
/*
* We have a fully valid partdesc ready to store into the relcache.
* Reparent it so it has the right lifespan.
*/
MemoryContextSetParent(new_pdcxt, CacheMemoryContext);
/*
* But first, a kluge: if there's an old rd_pdcxt, it contains an old
* partition descriptor that may still be referenced somewhere. Preserve
* it, while not leaking it, by reattaching it as a child context of the
* new rd_pdcxt. Eventually it will get dropped by either RelationClose
* or RelationClearRelation.
*/
if (rel->rd_pdcxt != NULL)
MemoryContextSetParent(rel->rd_pdcxt, new_pdcxt);
rel->rd_pdcxt = new_pdcxt;
rel->rd_partdesc = partdesc; rel->rd_partdesc = partdesc;
} }
......
...@@ -37,8 +37,31 @@ ...@@ -37,8 +37,31 @@
#include "utils/syscache.h" #include "utils/syscache.h"
static void RelationBuildPartitionKey(Relation relation);
static List *generate_partition_qual(Relation rel); static List *generate_partition_qual(Relation rel);
/*
* RelationGetPartitionKey -- get partition key, if relation is partitioned
*
* Note: partition keys are not allowed to change after the partitioned rel
* is created. RelationClearRelation knows this and preserves rd_partkey
* across relcache rebuilds, as long as the relation is open. Therefore,
* even though we hand back a direct pointer into the relcache entry, it's
* safe for callers to continue to use that pointer as long as they hold
* the relation open.
*/
PartitionKey
RelationGetPartitionKey(Relation rel)
{
if (rel->rd_rel->relkind != RELKIND_PARTITIONED_TABLE)
return NULL;
if (unlikely(rel->rd_partkey == NULL))
RelationBuildPartitionKey(rel);
return rel->rd_partkey;
}
/* /*
* RelationBuildPartitionKey * RelationBuildPartitionKey
* Build partition key data of relation, and attach to relcache * Build partition key data of relation, and attach to relcache
...@@ -54,7 +77,7 @@ static List *generate_partition_qual(Relation rel); ...@@ -54,7 +77,7 @@ static List *generate_partition_qual(Relation rel);
* that some of our callees allocate memory on their own which would be leaked * that some of our callees allocate memory on their own which would be leaked
* permanently. * permanently.
*/ */
void static void
RelationBuildPartitionKey(Relation relation) RelationBuildPartitionKey(Relation relation)
{ {
Form_pg_partitioned_table form; Form_pg_partitioned_table form;
...@@ -74,12 +97,9 @@ RelationBuildPartitionKey(Relation relation) ...@@ -74,12 +97,9 @@ RelationBuildPartitionKey(Relation relation)
tuple = SearchSysCache1(PARTRELID, tuple = SearchSysCache1(PARTRELID,
ObjectIdGetDatum(RelationGetRelid(relation))); ObjectIdGetDatum(RelationGetRelid(relation)));
/*
* The following happens when we have created our pg_class entry but not
* the pg_partitioned_table entry yet.
*/
if (!HeapTupleIsValid(tuple)) if (!HeapTupleIsValid(tuple))
return; elog(ERROR, "cache lookup failed for partition key of relation %u",
RelationGetRelid(relation));
partkeycxt = AllocSetContextCreate(CurTransactionContext, partkeycxt = AllocSetContextCreate(CurTransactionContext,
"partition key", "partition key",
......
...@@ -43,7 +43,6 @@ ...@@ -43,7 +43,6 @@
#include "catalog/catalog.h" #include "catalog/catalog.h"
#include "catalog/indexing.h" #include "catalog/indexing.h"
#include "catalog/namespace.h" #include "catalog/namespace.h"
#include "catalog/partition.h"
#include "catalog/pg_am.h" #include "catalog/pg_am.h"
#include "catalog/pg_amproc.h" #include "catalog/pg_amproc.h"
#include "catalog/pg_attrdef.h" #include "catalog/pg_attrdef.h"
...@@ -53,7 +52,6 @@ ...@@ -53,7 +52,6 @@
#include "catalog/pg_database.h" #include "catalog/pg_database.h"
#include "catalog/pg_namespace.h" #include "catalog/pg_namespace.h"
#include "catalog/pg_opclass.h" #include "catalog/pg_opclass.h"
#include "catalog/pg_partitioned_table.h"
#include "catalog/pg_proc.h" #include "catalog/pg_proc.h"
#include "catalog/pg_publication.h" #include "catalog/pg_publication.h"
#include "catalog/pg_rewrite.h" #include "catalog/pg_rewrite.h"
...@@ -71,8 +69,6 @@ ...@@ -71,8 +69,6 @@
#include "nodes/makefuncs.h" #include "nodes/makefuncs.h"
#include "nodes/nodeFuncs.h" #include "nodes/nodeFuncs.h"
#include "optimizer/optimizer.h" #include "optimizer/optimizer.h"
#include "partitioning/partbounds.h"
#include "partitioning/partdesc.h"
#include "rewrite/rewriteDefine.h" #include "rewrite/rewriteDefine.h"
#include "rewrite/rowsecurity.h" #include "rewrite/rowsecurity.h"
#include "storage/lmgr.h" #include "storage/lmgr.h"
...@@ -84,7 +80,6 @@ ...@@ -84,7 +80,6 @@
#include "utils/inval.h" #include "utils/inval.h"
#include "utils/lsyscache.h" #include "utils/lsyscache.h"
#include "utils/memutils.h" #include "utils/memutils.h"
#include "utils/partcache.h"
#include "utils/relmapper.h" #include "utils/relmapper.h"
#include "utils/resowner_private.h" #include "utils/resowner_private.h"
#include "utils/snapmgr.h" #include "utils/snapmgr.h"
...@@ -1165,20 +1160,11 @@ RelationBuildDesc(Oid targetRelId, bool insertIt) ...@@ -1165,20 +1160,11 @@ RelationBuildDesc(Oid targetRelId, bool insertIt)
relation->rd_fkeylist = NIL; relation->rd_fkeylist = NIL;
relation->rd_fkeyvalid = false; relation->rd_fkeyvalid = false;
/* if a partitioned table, initialize key and partition descriptor info */ /* partitioning data is not loaded till asked for */
if (relation->rd_rel->relkind == RELKIND_PARTITIONED_TABLE) relation->rd_partkey = NULL;
{ relation->rd_partkeycxt = NULL;
RelationBuildPartitionKey(relation); relation->rd_partdesc = NULL;
RelationBuildPartitionDesc(relation); relation->rd_pdcxt = NULL;
}
else
{
relation->rd_partkey = NULL;
relation->rd_partkeycxt = NULL;
relation->rd_partdesc = NULL;
relation->rd_pdcxt = NULL;
}
/* ... but partcheck is not loaded till asked for */
relation->rd_partcheck = NIL; relation->rd_partcheck = NIL;
relation->rd_partcheckvalid = false; relation->rd_partcheckvalid = false;
relation->rd_partcheckcxt = NULL; relation->rd_partcheckcxt = NULL;
...@@ -2090,6 +2076,16 @@ RelationClose(Relation relation) ...@@ -2090,6 +2076,16 @@ RelationClose(Relation relation)
/* Note: no locking manipulations needed */ /* Note: no locking manipulations needed */
RelationDecrementReferenceCount(relation); RelationDecrementReferenceCount(relation);
/*
* If the relation is no longer open in this session, we can clean up any
* stale partition descriptors it has. This is unlikely, so check to see
* if there are child contexts before expending a call to mcxt.c.
*/
if (RelationHasReferenceCountZero(relation) &&
relation->rd_pdcxt != NULL &&
relation->rd_pdcxt->firstchild != NULL)
MemoryContextDeleteChildren(relation->rd_pdcxt);
#ifdef RELCACHE_FORCE_RELEASE #ifdef RELCACHE_FORCE_RELEASE
if (RelationHasReferenceCountZero(relation) && if (RelationHasReferenceCountZero(relation) &&
relation->rd_createSubid == InvalidSubTransactionId && relation->rd_createSubid == InvalidSubTransactionId &&
...@@ -2527,7 +2523,6 @@ RelationClearRelation(Relation relation, bool rebuild) ...@@ -2527,7 +2523,6 @@ RelationClearRelation(Relation relation, bool rebuild)
bool keep_rules; bool keep_rules;
bool keep_policies; bool keep_policies;
bool keep_partkey; bool keep_partkey;
bool keep_partdesc;
/* Build temporary entry, but don't link it into hashtable */ /* Build temporary entry, but don't link it into hashtable */
newrel = RelationBuildDesc(save_relid, false); newrel = RelationBuildDesc(save_relid, false);
...@@ -2560,9 +2555,6 @@ RelationClearRelation(Relation relation, bool rebuild) ...@@ -2560,9 +2555,6 @@ RelationClearRelation(Relation relation, bool rebuild)
keep_policies = equalRSDesc(relation->rd_rsdesc, newrel->rd_rsdesc); keep_policies = equalRSDesc(relation->rd_rsdesc, newrel->rd_rsdesc);
/* partkey is immutable once set up, so we can always keep it */ /* partkey is immutable once set up, so we can always keep it */
keep_partkey = (relation->rd_partkey != NULL); keep_partkey = (relation->rd_partkey != NULL);
keep_partdesc = equalPartitionDescs(relation->rd_partkey,
relation->rd_partdesc,
newrel->rd_partdesc);
/* /*
* Perform swapping of the relcache entry contents. Within this * Perform swapping of the relcache entry contents. Within this
...@@ -2617,34 +2609,45 @@ RelationClearRelation(Relation relation, bool rebuild) ...@@ -2617,34 +2609,45 @@ RelationClearRelation(Relation relation, bool rebuild)
SWAPFIELD(Oid, rd_toastoid); SWAPFIELD(Oid, rd_toastoid);
/* pgstat_info must be preserved */ /* pgstat_info must be preserved */
SWAPFIELD(struct PgStat_TableStatus *, pgstat_info); SWAPFIELD(struct PgStat_TableStatus *, pgstat_info);
/* preserve old partitioning info if no logical change */ /* preserve old partition key if we have one */
if (keep_partkey) if (keep_partkey)
{ {
SWAPFIELD(PartitionKey, rd_partkey); SWAPFIELD(PartitionKey, rd_partkey);
SWAPFIELD(MemoryContext, rd_partkeycxt); SWAPFIELD(MemoryContext, rd_partkeycxt);
} }
if (keep_partdesc) if (newrel->rd_pdcxt != NULL)
{
SWAPFIELD(PartitionDesc, rd_partdesc);
SWAPFIELD(MemoryContext, rd_pdcxt);
}
else if (rebuild && newrel->rd_pdcxt != NULL)
{ {
/* /*
* We are rebuilding a partitioned relation with a non-zero * We are rebuilding a partitioned relation with a non-zero
* reference count, so keep the old partition descriptor around, * reference count, so we must keep the old partition descriptor
* in case there's a PartitionDirectory with a pointer to it. * around, in case there's a PartitionDirectory with a pointer to
* Attach it to the new rd_pdcxt so that it gets cleaned up * it. This means we can't free the old rd_pdcxt yet. (This is
* eventually. In the case where the reference count is 0, this * necessary because RelationGetPartitionDesc hands out direct
* code is not reached, which should be OK because in that case * pointers to the relcache's data structure, unlike our usual
* there should be no PartitionDirectory with a pointer to the old * practice which is to hand out copies. We'd have the same
* entry. * problem with rd_partkey, except that we always preserve that
* once created.)
*
* To ensure that it's not leaked completely, re-attach it to the
* new reldesc, or make it a child of the new reldesc's rd_pdcxt
* in the unlikely event that there is one already. (Compare hack
* in RelationBuildPartitionDesc.) RelationClose will clean up
* any such contexts once the reference count reaches zero.
*
* In the case where the reference count is zero, this code is not
* reached, which should be OK because in that case there should
* be no PartitionDirectory with a pointer to the old entry.
* *
* Note that newrel and relation have already been swapped, so the * Note that newrel and relation have already been swapped, so the
* "old" partition descriptor is actually the one hanging off of * "old" partition descriptor is actually the one hanging off of
* newrel. * newrel.
*/ */
MemoryContextSetParent(newrel->rd_pdcxt, relation->rd_pdcxt); relation->rd_partdesc = NULL; /* ensure rd_partdesc is invalid */
if (relation->rd_pdcxt != NULL) /* probably never happens */
MemoryContextSetParent(newrel->rd_pdcxt, relation->rd_pdcxt);
else
relation->rd_pdcxt = newrel->rd_pdcxt;
/* drop newrel's pointers so we don't destroy it below */
newrel->rd_partdesc = NULL; newrel->rd_partdesc = NULL;
newrel->rd_pdcxt = NULL; newrel->rd_pdcxt = NULL;
} }
...@@ -3907,27 +3910,7 @@ RelationCacheInitializePhase3(void) ...@@ -3907,27 +3910,7 @@ RelationCacheInitializePhase3(void)
restart = true; restart = true;
} }
/* /* Reload tableam data if needed */
* Reload the partition key and descriptor for a partitioned table.
*/
if (relation->rd_rel->relkind == RELKIND_PARTITIONED_TABLE &&
relation->rd_partkey == NULL)
{
RelationBuildPartitionKey(relation);
Assert(relation->rd_partkey != NULL);
restart = true;
}
if (relation->rd_rel->relkind == RELKIND_PARTITIONED_TABLE &&
relation->rd_partdesc == NULL)
{
RelationBuildPartitionDesc(relation);
Assert(relation->rd_partdesc != NULL);
restart = true;
}
if (relation->rd_tableam == NULL && if (relation->rd_tableam == NULL &&
(relation->rd_rel->relkind == RELKIND_RELATION || (relation->rd_rel->relkind == RELKIND_RELATION ||
relation->rd_rel->relkind == RELKIND_SEQUENCE || relation->rd_rel->relkind == RELKIND_SEQUENCE ||
......
...@@ -29,7 +29,8 @@ typedef struct PartitionDescData ...@@ -29,7 +29,8 @@ typedef struct PartitionDescData
PartitionBoundInfo boundinfo; /* collection of partition bounds */ PartitionBoundInfo boundinfo; /* collection of partition bounds */
} PartitionDescData; } PartitionDescData;
extern void RelationBuildPartitionDesc(Relation rel);
extern PartitionDesc RelationGetPartitionDesc(Relation rel);
extern PartitionDirectory CreatePartitionDirectory(MemoryContext mcxt); extern PartitionDirectory CreatePartitionDirectory(MemoryContext mcxt);
extern PartitionDesc PartitionDirectoryLookup(PartitionDirectory, Relation); extern PartitionDesc PartitionDirectoryLookup(PartitionDirectory, Relation);
......
...@@ -46,7 +46,8 @@ typedef struct PartitionKeyData ...@@ -46,7 +46,8 @@ typedef struct PartitionKeyData
Oid *parttypcoll; Oid *parttypcoll;
} PartitionKeyData; } PartitionKeyData;
extern void RelationBuildPartitionKey(Relation relation);
extern PartitionKey RelationGetPartitionKey(Relation rel);
extern List *RelationGetPartitionQual(Relation rel); extern List *RelationGetPartitionQual(Relation rel);
extern Expr *get_partition_qual_relid(Oid relid); extern Expr *get_partition_qual_relid(Oid relid);
......
...@@ -20,6 +20,7 @@ ...@@ -20,6 +20,7 @@
#include "catalog/pg_index.h" #include "catalog/pg_index.h"
#include "catalog/pg_publication.h" #include "catalog/pg_publication.h"
#include "nodes/bitmapset.h" #include "nodes/bitmapset.h"
#include "partitioning/partdefs.h"
#include "rewrite/prs2lock.h" #include "rewrite/prs2lock.h"
#include "storage/block.h" #include "storage/block.h"
#include "storage/relfilenode.h" #include "storage/relfilenode.h"
...@@ -94,9 +95,9 @@ typedef struct RelationData ...@@ -94,9 +95,9 @@ typedef struct RelationData
List *rd_fkeylist; /* list of ForeignKeyCacheInfo (see below) */ List *rd_fkeylist; /* list of ForeignKeyCacheInfo (see below) */
bool rd_fkeyvalid; /* true if list has been computed */ bool rd_fkeyvalid; /* true if list has been computed */
struct PartitionKeyData *rd_partkey; /* partition key, or NULL */ PartitionKey rd_partkey; /* partition key, or NULL */
MemoryContext rd_partkeycxt; /* private context for rd_partkey, if any */ MemoryContext rd_partkeycxt; /* private context for rd_partkey, if any */
struct PartitionDescData *rd_partdesc; /* partitions, or NULL */ PartitionDesc rd_partdesc; /* partition descriptor, or NULL */
MemoryContext rd_pdcxt; /* private context for rd_partdesc, if any */ MemoryContext rd_pdcxt; /* private context for rd_partdesc, if any */
List *rd_partcheck; /* partition CHECK quals */ List *rd_partcheck; /* partition CHECK quals */
bool rd_partcheckvalid; /* true if list has been computed */ bool rd_partcheckvalid; /* true if list has been computed */
...@@ -158,7 +159,7 @@ typedef struct RelationData ...@@ -158,7 +159,7 @@ typedef struct RelationData
Oid *rd_opfamily; /* OIDs of op families for each index col */ Oid *rd_opfamily; /* OIDs of op families for each index col */
Oid *rd_opcintype; /* OIDs of opclass declared input data types */ Oid *rd_opcintype; /* OIDs of opclass declared input data types */
RegProcedure *rd_support; /* OIDs of support procedures */ RegProcedure *rd_support; /* OIDs of support procedures */
struct FmgrInfo *rd_supportinfo; /* lookup info for support procedures */ struct FmgrInfo *rd_supportinfo; /* lookup info for support procedures */
int16 *rd_indoption; /* per-column AM-specific flags */ int16 *rd_indoption; /* per-column AM-specific flags */
List *rd_indexprs; /* index expression trees, if any */ List *rd_indexprs; /* index expression trees, if any */
List *rd_indpred; /* index predicate tree, if any */ List *rd_indpred; /* index predicate tree, if any */
...@@ -596,18 +597,6 @@ typedef struct ViewOptions ...@@ -596,18 +597,6 @@ typedef struct ViewOptions
RelationNeedsWAL(relation) && \ RelationNeedsWAL(relation) && \
!IsCatalogRelation(relation)) !IsCatalogRelation(relation))
/*
* RelationGetPartitionKey
* Returns the PartitionKey of a relation
*/
#define RelationGetPartitionKey(relation) ((relation)->rd_partkey)
/*
* RelationGetPartitionDesc
* Returns partition descriptor for a relation.
*/
#define RelationGetPartitionDesc(relation) ((relation)->rd_partdesc)
/* routines in utils/cache/relcache.c */ /* routines in utils/cache/relcache.c */
extern void RelationIncrementReferenceCount(Relation rel); extern void RelationIncrementReferenceCount(Relation rel);
extern void RelationDecrementReferenceCount(Relation rel); extern void RelationDecrementReferenceCount(Relation rel);
......
...@@ -512,6 +512,22 @@ Partition of: partitioned2 FOR VALUES FROM ('-1', 'aaaaa') TO (100, 'ccccc') ...@@ -512,6 +512,22 @@ Partition of: partitioned2 FOR VALUES FROM ('-1', 'aaaaa') TO (100, 'ccccc')
Partition constraint: (((a + 1) IS NOT NULL) AND (substr(b, 1, 5) IS NOT NULL) AND (((a + 1) > '-1'::integer) OR (((a + 1) = '-1'::integer) AND (substr(b, 1, 5) >= 'aaaaa'::text))) AND (((a + 1) < 100) OR (((a + 1) = 100) AND (substr(b, 1, 5) < 'ccccc'::text)))) Partition constraint: (((a + 1) IS NOT NULL) AND (substr(b, 1, 5) IS NOT NULL) AND (((a + 1) > '-1'::integer) OR (((a + 1) = '-1'::integer) AND (substr(b, 1, 5) >= 'aaaaa'::text))) AND (((a + 1) < 100) OR (((a + 1) = 100) AND (substr(b, 1, 5) < 'ccccc'::text))))
DROP TABLE partitioned, partitioned2; DROP TABLE partitioned, partitioned2;
-- check reference to partitioned table's rowtype in partition descriptor
create table partitioned (a int, b int)
partition by list ((row(a, b)::partitioned));
create table partitioned1
partition of partitioned for values in ('(1,2)'::partitioned);
create table partitioned2
partition of partitioned for values in ('(2,4)'::partitioned);
explain (costs off)
select * from partitioned where row(a,b)::partitioned = '(1,2)'::partitioned;
QUERY PLAN
-----------------------------------------------------------
Seq Scan on partitioned1 partitioned
Filter: (ROW(a, b)::partitioned = '(1,2)'::partitioned)
(2 rows)
drop table partitioned;
-- check that dependencies of partition columns are handled correctly -- check that dependencies of partition columns are handled correctly
create domain intdom1 as int; create domain intdom1 as int;
create table partitioned ( create table partitioned (
......
...@@ -459,6 +459,17 @@ CREATE TABLE part2_1 PARTITION OF partitioned2 FOR VALUES FROM (-1, 'aaaaa') TO ...@@ -459,6 +459,17 @@ CREATE TABLE part2_1 PARTITION OF partitioned2 FOR VALUES FROM (-1, 'aaaaa') TO
DROP TABLE partitioned, partitioned2; DROP TABLE partitioned, partitioned2;
-- check reference to partitioned table's rowtype in partition descriptor
create table partitioned (a int, b int)
partition by list ((row(a, b)::partitioned));
create table partitioned1
partition of partitioned for values in ('(1,2)'::partitioned);
create table partitioned2
partition of partitioned for values in ('(2,4)'::partitioned);
explain (costs off)
select * from partitioned where row(a,b)::partitioned = '(1,2)'::partitioned;
drop table partitioned;
-- check that dependencies of partition columns are handled correctly -- check that dependencies of partition columns are handled correctly
create domain intdom1 as int; create domain intdom1 as int;
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment