Commit 1bf3d615 authored by Tom Lane's avatar Tom Lane

Fix subtransaction behavior for large objects, temp namespace, files,

password/group files.  Also allow read-only subtransactions of a read-write
parent, but not vice versa.  These are the reasonably noncontroversial
parts of Alvaro's recent mop-up patch, plus further work on large objects
to minimize use of the TopTransactionResourceOwner.
parent cc813fc2
...@@ -8,7 +8,7 @@ ...@@ -8,7 +8,7 @@
* *
* *
* IDENTIFICATION * IDENTIFICATION
* $PostgreSQL: pgsql/src/backend/access/transam/xact.c,v 1.172 2004/07/27 05:10:49 tgl Exp $ * $PostgreSQL: pgsql/src/backend/access/transam/xact.c,v 1.173 2004/07/28 14:23:27 tgl Exp $
* *
* NOTES * NOTES
* Transaction aborts can now occur two ways: * Transaction aborts can now occur two ways:
...@@ -224,6 +224,7 @@ typedef struct TransactionStateData ...@@ -224,6 +224,7 @@ typedef struct TransactionStateData
ResourceOwner curTransactionOwner; /* my query resources */ ResourceOwner curTransactionOwner; /* my query resources */
List *childXids; /* subcommitted child XIDs */ List *childXids; /* subcommitted child XIDs */
AclId currentUser; /* subxact start current_user */ AclId currentUser; /* subxact start current_user */
bool prevXactReadOnly; /* entry-time xact r/o state */
struct TransactionStateData *parent; /* back link to parent */ struct TransactionStateData *parent; /* back link to parent */
} TransactionStateData; } TransactionStateData;
...@@ -284,6 +285,7 @@ static TransactionStateData TopTransactionStateData = { ...@@ -284,6 +285,7 @@ static TransactionStateData TopTransactionStateData = {
NULL, /* cur transaction resource owner */ NULL, /* cur transaction resource owner */
NIL, /* subcommitted child Xids */ NIL, /* subcommitted child Xids */
0, /* entry-time current userid */ 0, /* entry-time current userid */
false, /* entry-time xact r/o state */
NULL /* link to parent state block */ NULL /* link to parent state block */
}; };
...@@ -1242,7 +1244,8 @@ StartTransaction(void) ...@@ -1242,7 +1244,8 @@ StartTransaction(void)
* check the current transaction state * check the current transaction state
*/ */
if (s->state != TRANS_DEFAULT) if (s->state != TRANS_DEFAULT)
elog(WARNING, "StartTransaction and not in default state"); elog(WARNING, "StartTransaction while in %s state",
TransStateAsString(s->state));
/* /*
* set the current transaction state information appropriately during * set the current transaction state information appropriately during
...@@ -1287,6 +1290,8 @@ StartTransaction(void) ...@@ -1287,6 +1290,8 @@ StartTransaction(void)
* you won't because it doesn't work during startup; the userid isn't * you won't because it doesn't work during startup; the userid isn't
* set yet during a backend's first transaction start. We only use * set yet during a backend's first transaction start. We only use
* the currentUser field in sub-transaction state structs. * the currentUser field in sub-transaction state structs.
*
* prevXactReadOnly is also valid only in sub-transactions.
*/ */
/* /*
...@@ -1319,7 +1324,8 @@ CommitTransaction(void) ...@@ -1319,7 +1324,8 @@ CommitTransaction(void)
* check the current transaction state * check the current transaction state
*/ */
if (s->state != TRANS_INPROGRESS) if (s->state != TRANS_INPROGRESS)
elog(WARNING, "CommitTransaction and not in in-progress state"); elog(WARNING, "CommitTransaction while in %s state",
TransStateAsString(s->state));
Assert(s->parent == NULL); Assert(s->parent == NULL);
/* /*
...@@ -1351,14 +1357,14 @@ CommitTransaction(void) ...@@ -1351,14 +1357,14 @@ CommitTransaction(void)
AtCommit_Portals(); AtCommit_Portals();
/* handle commit for large objects [ PA, 7/17/98 ] */ /* close large objects before lower-level cleanup */
/* XXX probably this does not belong here */ AtEOXact_LargeObject(true);
lo_commit(true);
/* NOTIFY commit must come before lower-level cleanup */ /* NOTIFY commit must come before lower-level cleanup */
AtCommit_Notify(); AtCommit_Notify();
/* Update the flat password file if we changed pg_shadow or pg_group */ /* Update the flat password file if we changed pg_shadow or pg_group */
/* This should be the last step before commit */
AtEOXact_UpdatePasswordFile(true); AtEOXact_UpdatePasswordFile(true);
/* /*
...@@ -1486,7 +1492,8 @@ AbortTransaction(void) ...@@ -1486,7 +1492,8 @@ AbortTransaction(void)
* check the current transaction state * check the current transaction state
*/ */
if (s->state != TRANS_INPROGRESS) if (s->state != TRANS_INPROGRESS)
elog(WARNING, "AbortTransaction and not in in-progress state"); elog(WARNING, "AbortTransaction while in %s state",
TransStateAsString(s->state));
Assert(s->parent == NULL); Assert(s->parent == NULL);
/* /*
...@@ -1515,7 +1522,7 @@ AbortTransaction(void) ...@@ -1515,7 +1522,7 @@ AbortTransaction(void)
*/ */
DeferredTriggerAbortXact(); DeferredTriggerAbortXact();
AtAbort_Portals(); AtAbort_Portals();
lo_commit(false); /* 'false' means it's abort */ AtEOXact_LargeObject(false); /* 'false' means it's abort */
AtAbort_Notify(); AtAbort_Notify();
AtEOXact_UpdatePasswordFile(false); AtEOXact_UpdatePasswordFile(false);
...@@ -1870,6 +1877,9 @@ CleanupAbortedSubTransactions(bool returnName) ...@@ -1870,6 +1877,9 @@ CleanupAbortedSubTransactions(bool returnName)
s = CurrentTransactionState; s = CurrentTransactionState;
} }
AssertState(s->blockState == TBLOCK_SUBINPROGRESS ||
s->blockState == TBLOCK_INPROGRESS);
return name; return name;
} }
...@@ -2866,7 +2876,8 @@ StartSubTransaction(void) ...@@ -2866,7 +2876,8 @@ StartSubTransaction(void)
TransactionState s = CurrentTransactionState; TransactionState s = CurrentTransactionState;
if (s->state != TRANS_DEFAULT) if (s->state != TRANS_DEFAULT)
elog(WARNING, "StartSubTransaction and not in default state"); elog(WARNING, "StartSubTransaction while in %s state",
TransStateAsString(s->state));
s->state = TRANS_START; s->state = TRANS_START;
...@@ -2889,6 +2900,7 @@ StartSubTransaction(void) ...@@ -2889,6 +2900,7 @@ StartSubTransaction(void)
* Finish setup of other transaction state fields. * Finish setup of other transaction state fields.
*/ */
s->currentUser = GetUserId(); s->currentUser = GetUserId();
s->prevXactReadOnly = XactReadOnly;
/* /*
* Initialize other subsystems for new subtransaction * Initialize other subsystems for new subtransaction
...@@ -2913,7 +2925,8 @@ CommitSubTransaction(void) ...@@ -2913,7 +2925,8 @@ CommitSubTransaction(void)
ShowTransactionState("CommitSubTransaction"); ShowTransactionState("CommitSubTransaction");
if (s->state != TRANS_INPROGRESS) if (s->state != TRANS_INPROGRESS)
elog(WARNING, "CommitSubTransaction and not in in-progress state"); elog(WARNING, "CommitSubTransaction while in %s state",
TransStateAsString(s->state));
/* Pre-commit processing */ /* Pre-commit processing */
AtSubCommit_Portals(s->parent->transactionIdData, AtSubCommit_Portals(s->parent->transactionIdData,
...@@ -2930,9 +2943,18 @@ CommitSubTransaction(void) ...@@ -2930,9 +2943,18 @@ CommitSubTransaction(void)
/* Post-commit cleanup */ /* Post-commit cleanup */
AtSubCommit_smgr(); AtSubCommit_smgr();
AtSubEOXact_Inval(true); AtEOSubXact_Inval(true);
AtEOSubXact_SPI(true, s->transactionIdData); AtEOSubXact_SPI(true, s->transactionIdData);
AtEOSubXact_LargeObject(true, s->transactionIdData,
s->parent->transactionIdData);
AtEOSubXact_UpdatePasswordFile(true, s->transactionIdData,
s->parent->transactionIdData);
AtEOSubXact_Files(true, s->transactionIdData,
s->parent->transactionIdData);
AtEOSubXact_Namespace(true, s->transactionIdData,
s->parent->transactionIdData);
/* /*
* Note that we just release the resource owner's resources and don't * Note that we just release the resource owner's resources and don't
* delete it. This is because locks are not actually released here. * delete it. This is because locks are not actually released here.
...@@ -2953,6 +2975,13 @@ CommitSubTransaction(void) ...@@ -2953,6 +2975,13 @@ CommitSubTransaction(void)
AtEOSubXact_on_commit_actions(true, s->transactionIdData, AtEOSubXact_on_commit_actions(true, s->transactionIdData,
s->parent->transactionIdData); s->parent->transactionIdData);
/*
* We need to restore the upper transaction's read-only state,
* in case the upper is read-write while the child is read-only;
* GUC will incorrectly think it should leave the child state in place.
*/
XactReadOnly = s->prevXactReadOnly;
CurrentResourceOwner = s->parent->curTransactionOwner; CurrentResourceOwner = s->parent->curTransactionOwner;
CurTransactionResourceOwner = s->parent->curTransactionOwner; CurTransactionResourceOwner = s->parent->curTransactionOwner;
s->curTransactionOwner = NULL; s->curTransactionOwner = NULL;
...@@ -2973,7 +3002,8 @@ AbortSubTransaction(void) ...@@ -2973,7 +3002,8 @@ AbortSubTransaction(void)
ShowTransactionState("AbortSubTransaction"); ShowTransactionState("AbortSubTransaction");
if (s->state != TRANS_INPROGRESS) if (s->state != TRANS_INPROGRESS)
elog(WARNING, "AbortSubTransaction and not in in-progress state"); elog(WARNING, "AbortSubTransaction while in %s state",
TransStateAsString(s->state));
HOLD_INTERRUPTS(); HOLD_INTERRUPTS();
...@@ -3010,7 +3040,16 @@ AbortSubTransaction(void) ...@@ -3010,7 +3040,16 @@ AbortSubTransaction(void)
AtEOSubXact_SPI(false, s->transactionIdData); AtEOSubXact_SPI(false, s->transactionIdData);
AtSubAbort_Portals(s->parent->transactionIdData, AtSubAbort_Portals(s->parent->transactionIdData,
s->parent->curTransactionOwner); s->parent->curTransactionOwner);
AtSubEOXact_Inval(false); AtEOSubXact_Inval(false);
AtEOSubXact_LargeObject(false, s->transactionIdData,
s->parent->transactionIdData);
AtEOSubXact_UpdatePasswordFile(false, s->transactionIdData,
s->parent->transactionIdData);
AtEOSubXact_Files(false, s->transactionIdData,
s->parent->transactionIdData);
AtEOSubXact_Namespace(false, s->transactionIdData,
s->parent->transactionIdData);
ResourceOwnerRelease(s->curTransactionOwner, ResourceOwnerRelease(s->curTransactionOwner,
RESOURCE_RELEASE_BEFORE_LOCKS, RESOURCE_RELEASE_BEFORE_LOCKS,
...@@ -3041,6 +3080,13 @@ AbortSubTransaction(void) ...@@ -3041,6 +3080,13 @@ AbortSubTransaction(void)
*/ */
SetUserId(s->currentUser); SetUserId(s->currentUser);
/*
* Restore the upper transaction's read-only state, too. This should
* be redundant with GUC's cleanup but we may as well do it for
* consistency with the commit case.
*/
XactReadOnly = s->prevXactReadOnly;
CommandCounterIncrement(); CommandCounterIncrement();
RESUME_INTERRUPTS(); RESUME_INTERRUPTS();
...@@ -3057,7 +3103,8 @@ CleanupSubTransaction(void) ...@@ -3057,7 +3103,8 @@ CleanupSubTransaction(void)
ShowTransactionState("CleanupSubTransaction"); ShowTransactionState("CleanupSubTransaction");
if (s->state != TRANS_ABORT) if (s->state != TRANS_ABORT)
elog(WARNING, "CleanupSubTransaction and not in aborted state"); elog(WARNING, "CleanupSubTransaction while in %s state",
TransStateAsString(s->state));
AtSubCleanup_Portals(); AtSubCleanup_Portals();
...@@ -3088,7 +3135,8 @@ StartAbortedSubTransaction(void) ...@@ -3088,7 +3135,8 @@ StartAbortedSubTransaction(void)
TransactionState s = CurrentTransactionState; TransactionState s = CurrentTransactionState;
if (s->state != TRANS_DEFAULT) if (s->state != TRANS_DEFAULT)
elog(WARNING, "StartAbortedSubTransaction and not in default state"); elog(WARNING, "StartAbortedSubTransaction while in %s state",
TransStateAsString(s->state));
s->state = TRANS_START; s->state = TRANS_START;
...@@ -3168,7 +3216,8 @@ PopTransaction(void) ...@@ -3168,7 +3216,8 @@ PopTransaction(void)
TransactionState s = CurrentTransactionState; TransactionState s = CurrentTransactionState;
if (s->state != TRANS_DEFAULT) if (s->state != TRANS_DEFAULT)
elog(WARNING, "PopTransaction and not in default state"); elog(WARNING, "PopTransaction while in %s state",
TransStateAsString(s->state));
if (s->parent == NULL) if (s->parent == NULL)
elog(FATAL, "PopTransaction with no parent"); elog(FATAL, "PopTransaction with no parent");
......
...@@ -13,7 +13,7 @@ ...@@ -13,7 +13,7 @@
* Portions Copyright (c) 1994, Regents of the University of California * Portions Copyright (c) 1994, Regents of the University of California
* *
* IDENTIFICATION * IDENTIFICATION
* $PostgreSQL: pgsql/src/backend/catalog/namespace.c,v 1.67 2004/06/18 06:13:19 tgl Exp $ * $PostgreSQL: pgsql/src/backend/catalog/namespace.c,v 1.68 2004/07/28 14:23:27 tgl Exp $
* *
*------------------------------------------------------------------------- *-------------------------------------------------------------------------
*/ */
...@@ -107,12 +107,17 @@ static bool namespaceSearchPathValid = true; ...@@ -107,12 +107,17 @@ static bool namespaceSearchPathValid = true;
* myTempNamespace is InvalidOid until and unless a TEMP namespace is set up * myTempNamespace is InvalidOid until and unless a TEMP namespace is set up
* in a particular backend session (this happens when a CREATE TEMP TABLE * in a particular backend session (this happens when a CREATE TEMP TABLE
* command is first executed). Thereafter it's the OID of the temp namespace. * command is first executed). Thereafter it's the OID of the temp namespace.
* firstTempTransaction flags whether we've committed creation of the TEMP *
* namespace or not. * myTempNamespaceXID shows whether we've created the TEMP namespace in the
* current transaction. The TransactionId propagates up the transaction tree,
* so the main transaction will correctly recognize the flag if all
* intermediate subtransactions commit. When it is InvalidTransactionId,
* we either haven't made the TEMP namespace yet, or have successfully
* committed its creation, depending on whether myTempNamespace is valid.
*/ */
static Oid myTempNamespace = InvalidOid; static Oid myTempNamespace = InvalidOid;
static bool firstTempTransaction = false; static TransactionId myTempNamespaceXID = InvalidTransactionId;
/* /*
* "Special" namespace for CREATE SCHEMA. If set, it's the first search * "Special" namespace for CREATE SCHEMA. If set, it's the first search
...@@ -1688,7 +1693,9 @@ InitTempTableNamespace(void) ...@@ -1688,7 +1693,9 @@ InitTempTableNamespace(void)
*/ */
myTempNamespace = namespaceId; myTempNamespace = namespaceId;
firstTempTransaction = true; /* It should not be done already. */
AssertState(myTempNamespaceXID == InvalidTransactionId);
myTempNamespaceXID = GetCurrentTransactionId();
namespaceSearchPathValid = false; /* need to rebuild list */ namespaceSearchPathValid = false; /* need to rebuild list */
} }
...@@ -1707,7 +1714,7 @@ AtEOXact_Namespace(bool isCommit) ...@@ -1707,7 +1714,7 @@ AtEOXact_Namespace(bool isCommit)
* temp tables at backend shutdown. (We only want to register the * temp tables at backend shutdown. (We only want to register the
* callback once per session, so this is a good place to do it.) * callback once per session, so this is a good place to do it.)
*/ */
if (firstTempTransaction) if (myTempNamespaceXID == GetCurrentTransactionId())
{ {
if (isCommit) if (isCommit)
on_shmem_exit(RemoveTempRelationsCallback, 0); on_shmem_exit(RemoveTempRelationsCallback, 0);
...@@ -1716,7 +1723,7 @@ AtEOXact_Namespace(bool isCommit) ...@@ -1716,7 +1723,7 @@ AtEOXact_Namespace(bool isCommit)
myTempNamespace = InvalidOid; myTempNamespace = InvalidOid;
namespaceSearchPathValid = false; /* need to rebuild list */ namespaceSearchPathValid = false; /* need to rebuild list */
} }
firstTempTransaction = false; myTempNamespaceXID = InvalidTransactionId;
} }
/* /*
...@@ -1729,6 +1736,32 @@ AtEOXact_Namespace(bool isCommit) ...@@ -1729,6 +1736,32 @@ AtEOXact_Namespace(bool isCommit)
} }
} }
/*
* AtEOSubXact_Namespace
*
* At subtransaction commit, propagate the temp-namespace-creation
* flag to the parent transaction.
*
* At subtransaction abort, forget the flag if we set it up.
*/
void
AtEOSubXact_Namespace(bool isCommit, TransactionId myXid,
TransactionId parentXid)
{
if (myTempNamespaceXID == myXid)
{
if (isCommit)
myTempNamespaceXID = parentXid;
else
{
myTempNamespaceXID = InvalidTransactionId;
/* TEMP namespace creation failed, so reset state */
myTempNamespace = InvalidOid;
namespaceSearchPathValid = false; /* need to rebuild list */
}
}
}
/* /*
* Remove all relations in the specified temp namespace. * Remove all relations in the specified temp namespace.
* *
......
...@@ -6,7 +6,7 @@ ...@@ -6,7 +6,7 @@
* Portions Copyright (c) 1996-2003, PostgreSQL Global Development Group * Portions Copyright (c) 1996-2003, PostgreSQL Global Development Group
* Portions Copyright (c) 1994, Regents of the University of California * Portions Copyright (c) 1994, Regents of the University of California
* *
* $PostgreSQL: pgsql/src/backend/commands/user.c,v 1.141 2004/05/26 04:41:12 neilc Exp $ * $PostgreSQL: pgsql/src/backend/commands/user.c,v 1.142 2004/07/28 14:23:28 tgl Exp $
* *
*------------------------------------------------------------------------- *-------------------------------------------------------------------------
*/ */
...@@ -44,8 +44,30 @@ ...@@ -44,8 +44,30 @@
extern bool Password_encryption; extern bool Password_encryption;
static bool user_file_update_needed = false; /*
static bool group_file_update_needed = false; * The need-to-update-files flags are a pair of TransactionIds that show what
* level of the transaction tree requested the update. To register an update,
* the transaction saves its own TransactionId in the flag, unless the value
* was already set to a valid TransactionId. If it aborts and the value is its
* TransactionId, it resets the value to InvalidTransactionId. If it commits,
* it changes the value to its parent's TransactionId. This way the value is
* propagated up to the topmost transaction, which will update the files if a
* valid TransactionId is detected.
*/
static TransactionId user_file_update_xid = InvalidTransactionId;
static TransactionId group_file_update_xid = InvalidTransactionId;
#define user_file_update_needed() \
do { \
if (user_file_update_xid == InvalidTransactionId) \
user_file_update_xid = GetCurrentTransactionId(); \
} while (0)
#define group_file_update_needed() \
do { \
if (group_file_update_xid == InvalidTransactionId) \
group_file_update_xid = GetCurrentTransactionId(); \
} while (0)
static void CheckPgUserAclNotNull(void); static void CheckPgUserAclNotNull(void);
...@@ -402,8 +424,8 @@ write_user_file(Relation urel) ...@@ -402,8 +424,8 @@ write_user_file(Relation urel)
Datum Datum
update_pg_pwd_and_pg_group(PG_FUNCTION_ARGS) update_pg_pwd_and_pg_group(PG_FUNCTION_ARGS)
{ {
user_file_update_needed = true; user_file_update_needed();
group_file_update_needed = true; group_file_update_needed();
return PointerGetDatum(NULL); return PointerGetDatum(NULL);
} }
...@@ -429,13 +451,14 @@ AtEOXact_UpdatePasswordFile(bool isCommit) ...@@ -429,13 +451,14 @@ AtEOXact_UpdatePasswordFile(bool isCommit)
Relation urel = NULL; Relation urel = NULL;
Relation grel = NULL; Relation grel = NULL;
if (!(user_file_update_needed || group_file_update_needed)) if (user_file_update_xid == InvalidTransactionId &&
group_file_update_xid == InvalidTransactionId)
return; return;
if (!isCommit) if (!isCommit)
{ {
user_file_update_needed = false; user_file_update_xid = InvalidTransactionId;
group_file_update_needed = false; group_file_update_xid = InvalidTransactionId;
return; return;
} }
...@@ -447,22 +470,22 @@ AtEOXact_UpdatePasswordFile(bool isCommit) ...@@ -447,22 +470,22 @@ AtEOXact_UpdatePasswordFile(bool isCommit)
* pg_shadow or pg_group, which likely won't have gotten a strong * pg_shadow or pg_group, which likely won't have gotten a strong
* enough lock), so get the locks we need before writing anything. * enough lock), so get the locks we need before writing anything.
*/ */
if (user_file_update_needed) if (user_file_update_xid != InvalidTransactionId)
urel = heap_openr(ShadowRelationName, ExclusiveLock); urel = heap_openr(ShadowRelationName, ExclusiveLock);
if (group_file_update_needed) if (group_file_update_xid != InvalidTransactionId)
grel = heap_openr(GroupRelationName, ExclusiveLock); grel = heap_openr(GroupRelationName, ExclusiveLock);
/* Okay to write the files */ /* Okay to write the files */
if (user_file_update_needed) if (user_file_update_xid != InvalidTransactionId)
{ {
user_file_update_needed = false; user_file_update_xid = InvalidTransactionId;
write_user_file(urel); write_user_file(urel);
heap_close(urel, NoLock); heap_close(urel, NoLock);
} }
if (group_file_update_needed) if (group_file_update_xid != InvalidTransactionId)
{ {
group_file_update_needed = false; group_file_update_xid = InvalidTransactionId;
write_group_file(grel); write_group_file(grel);
heap_close(grel, NoLock); heap_close(grel, NoLock);
} }
...@@ -473,7 +496,33 @@ AtEOXact_UpdatePasswordFile(bool isCommit) ...@@ -473,7 +496,33 @@ AtEOXact_UpdatePasswordFile(bool isCommit)
SendPostmasterSignal(PMSIGNAL_PASSWORD_CHANGE); SendPostmasterSignal(PMSIGNAL_PASSWORD_CHANGE);
} }
/*
* AtEOSubXact_UpdatePasswordFile
*
* Called at subtransaction end, this routine resets or updates the
* need-to-update-files flags.
*/
void
AtEOSubXact_UpdatePasswordFile(bool isCommit, TransactionId myXid,
TransactionId parentXid)
{
if (isCommit)
{
if (user_file_update_xid == myXid)
user_file_update_xid = parentXid;
if (group_file_update_xid == myXid)
group_file_update_xid = parentXid;
}
else
{
if (user_file_update_xid == myXid)
user_file_update_xid = InvalidTransactionId;
if (group_file_update_xid == myXid)
group_file_update_xid = InvalidTransactionId;
}
}
/* /*
* CREATE USER * CREATE USER
...@@ -728,7 +777,7 @@ CreateUser(CreateUserStmt *stmt) ...@@ -728,7 +777,7 @@ CreateUser(CreateUserStmt *stmt)
/* /*
* Set flag to update flat password file at commit. * Set flag to update flat password file at commit.
*/ */
user_file_update_needed = true; user_file_update_needed();
} }
...@@ -925,7 +974,7 @@ AlterUser(AlterUserStmt *stmt) ...@@ -925,7 +974,7 @@ AlterUser(AlterUserStmt *stmt)
/* /*
* Set flag to update flat password file at commit. * Set flag to update flat password file at commit.
*/ */
user_file_update_needed = true; user_file_update_needed();
} }
...@@ -1147,7 +1196,7 @@ DropUser(DropUserStmt *stmt) ...@@ -1147,7 +1196,7 @@ DropUser(DropUserStmt *stmt)
/* /*
* Set flag to update flat password file at commit. * Set flag to update flat password file at commit.
*/ */
user_file_update_needed = true; user_file_update_needed();
} }
...@@ -1233,7 +1282,7 @@ RenameUser(const char *oldname, const char *newname) ...@@ -1233,7 +1282,7 @@ RenameUser(const char *oldname, const char *newname)
ReleaseSysCache(oldtuple); ReleaseSysCache(oldtuple);
heap_close(rel, NoLock); heap_close(rel, NoLock);
user_file_update_needed = true; user_file_update_needed();
} }
...@@ -1438,7 +1487,7 @@ CreateGroup(CreateGroupStmt *stmt) ...@@ -1438,7 +1487,7 @@ CreateGroup(CreateGroupStmt *stmt)
/* /*
* Set flag to update flat group file at commit. * Set flag to update flat group file at commit.
*/ */
group_file_update_needed = true; group_file_update_needed();
} }
...@@ -1590,7 +1639,7 @@ AlterGroup(AlterGroupStmt *stmt, const char *tag) ...@@ -1590,7 +1639,7 @@ AlterGroup(AlterGroupStmt *stmt, const char *tag)
/* /*
* Set flag to update flat group file at commit. * Set flag to update flat group file at commit.
*/ */
group_file_update_needed = true; group_file_update_needed();
} }
/* /*
...@@ -1730,7 +1779,7 @@ DropGroup(DropGroupStmt *stmt) ...@@ -1730,7 +1779,7 @@ DropGroup(DropGroupStmt *stmt)
/* /*
* Set flag to update flat group file at commit. * Set flag to update flat group file at commit.
*/ */
group_file_update_needed = true; group_file_update_needed();
} }
...@@ -1776,5 +1825,5 @@ RenameGroup(const char *oldname, const char *newname) ...@@ -1776,5 +1825,5 @@ RenameGroup(const char *oldname, const char *newname)
heap_close(rel, NoLock); heap_close(rel, NoLock);
heap_freetuple(tup); heap_freetuple(tup);
group_file_update_needed = true; group_file_update_needed();
} }
/*------------------------------------------------------------------------- /*-------------------------------------------------------------------------
* *
* be-fsstubs.c * be-fsstubs.c
* support for filesystem operations on large objects * Builtin functions for open/close/read/write operations on large objects
* *
* Portions Copyright (c) 1996-2003, PostgreSQL Global Development Group * Portions Copyright (c) 1996-2003, PostgreSQL Global Development Group
* Portions Copyright (c) 1994, Regents of the University of California * Portions Copyright (c) 1994, Regents of the University of California
* *
* *
* IDENTIFICATION * IDENTIFICATION
* $PostgreSQL: pgsql/src/backend/libpq/be-fsstubs.c,v 1.70 2004/02/10 01:55:25 tgl Exp $ * $PostgreSQL: pgsql/src/backend/libpq/be-fsstubs.c,v 1.71 2004/07/28 14:23:28 tgl Exp $
* *
* NOTES * NOTES
* This should be moved to a more appropriate place. It is here * This should be moved to a more appropriate place. It is here
* for lack of a better place. * for lack of a better place.
* *
* Builtin functions for open/close/read/write operations on large objects.
*
* These functions operate in a private MemoryContext, which means * These functions operate in a private MemoryContext, which means
* that large object descriptors hang around until we destroy the context. * that large object descriptors hang around until we destroy the context
* That happens in lo_commit(). It'd be possible to prolong the lifetime * at transaction end. It'd be possible to prolong the lifetime
* of the context so that LO FDs are good across transactions (for example, * of the context so that LO FDs are good across transactions (for example,
* we could release the context only if we see that no FDs remain open). * we could release the context only if we see that no FDs remain open).
* But we'd need additional state in order to do the right thing at the * But we'd need additional state in order to do the right thing at the
...@@ -29,6 +27,11 @@ ...@@ -29,6 +27,11 @@
* existing documented semantics of LO FDs: they're only good within a * existing documented semantics of LO FDs: they're only good within a
* transaction. * transaction.
* *
* As of PostgreSQL 7.5, much of the angst expressed above is no longer
* relevant, and in fact it'd be pretty easy to allow LO FDs to stay
* open across transactions. However backwards compatibility suggests
* that we should stick to the status quo.
*
*------------------------------------------------------------------------- *-------------------------------------------------------------------------
*/ */
...@@ -46,8 +49,6 @@ ...@@ -46,8 +49,6 @@
#include "utils/memutils.h" #include "utils/memutils.h"
/* [PA] is Pascal Andr <andre@via.ecp.fr> */
/*#define FSDB 1*/ /*#define FSDB 1*/
#define BUFSIZE 8192 #define BUFSIZE 8192
...@@ -68,6 +69,7 @@ static MemoryContext fscxt = NULL; ...@@ -68,6 +69,7 @@ static MemoryContext fscxt = NULL;
static int newLOfd(LargeObjectDesc *lobjCookie); static int newLOfd(LargeObjectDesc *lobjCookie);
static void deleteLOfd(int fd); static void deleteLOfd(int fd);
/***************************************************************************** /*****************************************************************************
* File Interfaces for Large Objects * File Interfaces for Large Objects
*****************************************************************************/ *****************************************************************************/
...@@ -399,7 +401,7 @@ lo_import(PG_FUNCTION_ARGS) ...@@ -399,7 +401,7 @@ lo_import(PG_FUNCTION_ARGS)
lobjOid = lobj->id; lobjOid = lobj->id;
/* /*
* read in from the Unix file and write to the inversion file * read in from the filesystem and write to the inversion file
*/ */
while ((nbytes = FileRead(fd, buf, BUFSIZE)) > 0) while ((nbytes = FileRead(fd, buf, BUFSIZE)) > 0)
{ {
...@@ -471,7 +473,7 @@ lo_export(PG_FUNCTION_ARGS) ...@@ -471,7 +473,7 @@ lo_export(PG_FUNCTION_ARGS)
fnamebuf))); fnamebuf)));
/* /*
* read in from the inversion file and write to the Unix file * read in from the inversion file and write to the filesystem
*/ */
while ((nbytes = inv_read(lobj, buf, BUFSIZE)) > 0) while ((nbytes = inv_read(lobj, buf, BUFSIZE)) > 0)
{ {
...@@ -490,11 +492,11 @@ lo_export(PG_FUNCTION_ARGS) ...@@ -490,11 +492,11 @@ lo_export(PG_FUNCTION_ARGS)
} }
/* /*
* lo_commit - * AtEOXact_LargeObject -
* prepares large objects for transaction commit [PA, 7/17/98] * prepares large objects for transaction commit
*/ */
void void
lo_commit(bool isCommit) AtEOXact_LargeObject(bool isCommit)
{ {
int i; int i;
MemoryContext currentContext; MemoryContext currentContext;
...@@ -505,8 +507,8 @@ lo_commit(bool isCommit) ...@@ -505,8 +507,8 @@ lo_commit(bool isCommit)
currentContext = MemoryContextSwitchTo(fscxt); currentContext = MemoryContextSwitchTo(fscxt);
/* /*
* Clean out still-open index scans (not necessary if aborting) and * Close LO fds and clear cookies array so that LO fds are no longer good.
* clear cookies array so that LO fds are no longer good. * On abort we skip the close step.
*/ */
for (i = 0; i < cookies_size; i++) for (i = 0; i < cookies_size; i++)
{ {
...@@ -514,7 +516,7 @@ lo_commit(bool isCommit) ...@@ -514,7 +516,7 @@ lo_commit(bool isCommit)
{ {
if (isCommit) if (isCommit)
inv_close(cookies[i]); inv_close(cookies[i]);
cookies[i] = NULL; deleteLOfd(i);
} }
} }
...@@ -527,8 +529,47 @@ lo_commit(bool isCommit) ...@@ -527,8 +529,47 @@ lo_commit(bool isCommit)
/* Release the LO memory context to prevent permanent memory leaks. */ /* Release the LO memory context to prevent permanent memory leaks. */
MemoryContextDelete(fscxt); MemoryContextDelete(fscxt);
fscxt = NULL; fscxt = NULL;
/* Give inv_api.c a chance to clean up, too */
close_lo_relation(isCommit);
} }
/*
* AtEOSubXact_LargeObject
* Take care of large objects at subtransaction commit/abort
*
* Reassign LOs created/opened during a committing subtransaction
* to the parent transaction. On abort, just close them.
*/
void
AtEOSubXact_LargeObject(bool isCommit, TransactionId myXid,
TransactionId parentXid)
{
int i;
if (fscxt == NULL) /* no LO operations in this xact */
return;
for (i = 0; i < cookies_size; i++)
{
LargeObjectDesc *lo = cookies[i];
if (lo != NULL && lo->xid == myXid)
{
if (isCommit)
lo->xid = parentXid;
else
{
/*
* Make sure we do not call inv_close twice if it errors out
* for some reason. Better a leak than a crash.
*/
deleteLOfd(i);
inv_close(lo);
}
}
}
}
/***************************************************************************** /*****************************************************************************
* Support routines for this file * Support routines for this file
......
...@@ -7,7 +7,7 @@ ...@@ -7,7 +7,7 @@
* Portions Copyright (c) 1994, Regents of the University of California * Portions Copyright (c) 1994, Regents of the University of California
* *
* IDENTIFICATION * IDENTIFICATION
* $PostgreSQL: pgsql/src/backend/storage/file/fd.c,v 1.109 2004/05/31 03:48:04 tgl Exp $ * $PostgreSQL: pgsql/src/backend/storage/file/fd.c,v 1.110 2004/07/28 14:23:28 tgl Exp $
* *
* NOTES: * NOTES:
* *
...@@ -47,6 +47,7 @@ ...@@ -47,6 +47,7 @@
#include <fcntl.h> #include <fcntl.h>
#include "miscadmin.h" #include "miscadmin.h"
#include "access/xact.h"
#include "storage/fd.h" #include "storage/fd.h"
#include "storage/ipc.h" #include "storage/ipc.h"
...@@ -122,6 +123,7 @@ typedef struct vfd ...@@ -122,6 +123,7 @@ typedef struct vfd
{ {
signed short fd; /* current FD, or VFD_CLOSED if none */ signed short fd; /* current FD, or VFD_CLOSED if none */
unsigned short fdstate; /* bitflags for VFD's state */ unsigned short fdstate; /* bitflags for VFD's state */
TransactionId create_xid; /* for XACT_TEMPORARY fds, creating Xid */
File nextFree; /* link to next free VFD, if in freelist */ File nextFree; /* link to next free VFD, if in freelist */
File lruMoreRecently; /* doubly linked recency-of-use list */ File lruMoreRecently; /* doubly linked recency-of-use list */
File lruLessRecently; File lruLessRecently;
...@@ -146,27 +148,31 @@ static Size SizeVfdCache = 0; ...@@ -146,27 +148,31 @@ static Size SizeVfdCache = 0;
static int nfile = 0; static int nfile = 0;
/* /*
* List of stdio FILEs opened with AllocateFile. * List of stdio FILEs and <dirent.h> DIRs opened with AllocateFile
* and AllocateDir.
* *
* Since we don't want to encourage heavy use of AllocateFile, it seems * Since we don't want to encourage heavy use of AllocateFile or AllocateDir,
* OK to put a pretty small maximum limit on the number of simultaneously * it seems OK to put a pretty small maximum limit on the number of
* allocated files. * simultaneously allocated descs.
*/ */
#define MAX_ALLOCATED_FILES 32 #define MAX_ALLOCATED_DESCS 32
static int numAllocatedFiles = 0; typedef enum {
static FILE *allocatedFiles[MAX_ALLOCATED_FILES]; AllocateDescFile,
AllocateDescDir
} AllocateDescKind;
/* typedef struct {
* List of <dirent.h> DIRs opened with AllocateDir. AllocateDescKind kind;
* union {
* Since we don't have heavy use of AllocateDir, it seems OK to put a pretty FILE *file;
* small maximum limit on the number of simultaneously allocated dirs. DIR *dir;
*/ } desc;
#define MAX_ALLOCATED_DIRS 10 TransactionId create_xid;
} AllocateDesc;
static int numAllocatedDirs = 0; static int numAllocatedDescs = 0;
static DIR *allocatedDirs[MAX_ALLOCATED_DIRS]; static AllocateDesc allocatedDescs[MAX_ALLOCATED_DESCS];
/* /*
* Number of temporary files opened during the current session; * Number of temporary files opened during the current session;
...@@ -499,7 +505,7 @@ LruInsert(File file) ...@@ -499,7 +505,7 @@ LruInsert(File file)
if (FileIsNotOpen(file)) if (FileIsNotOpen(file))
{ {
while (nfile + numAllocatedFiles + numAllocatedDirs >= max_safe_fds) while (nfile + numAllocatedDescs >= max_safe_fds)
{ {
if (!ReleaseLruFile()) if (!ReleaseLruFile())
break; break;
...@@ -759,7 +765,7 @@ fileNameOpenFile(FileName fileName, ...@@ -759,7 +765,7 @@ fileNameOpenFile(FileName fileName,
file = AllocateVfd(); file = AllocateVfd();
vfdP = &VfdCache[file]; vfdP = &VfdCache[file];
while (nfile + numAllocatedFiles + numAllocatedDirs >= max_safe_fds) while (nfile + numAllocatedDescs >= max_safe_fds)
{ {
if (!ReleaseLruFile()) if (!ReleaseLruFile())
break; break;
...@@ -876,7 +882,10 @@ OpenTemporaryFile(bool interXact) ...@@ -876,7 +882,10 @@ OpenTemporaryFile(bool interXact)
/* Mark it for deletion at EOXact */ /* Mark it for deletion at EOXact */
if (!interXact) if (!interXact)
{
VfdCache[file].fdstate |= FD_XACT_TEMPORARY; VfdCache[file].fdstate |= FD_XACT_TEMPORARY;
VfdCache[file].create_xid = GetCurrentTransactionId();
}
return file; return file;
} }
...@@ -1134,24 +1143,29 @@ AllocateFile(char *name, char *mode) ...@@ -1134,24 +1143,29 @@ AllocateFile(char *name, char *mode)
{ {
FILE *file; FILE *file;
DO_DB(elog(LOG, "AllocateFile: Allocated %d", numAllocatedFiles)); DO_DB(elog(LOG, "AllocateFile: Allocated %d (%s)",
numAllocatedDescs, name));
/* /*
* The test against MAX_ALLOCATED_FILES prevents us from overflowing * The test against MAX_ALLOCATED_DESCS prevents us from overflowing
* allocatedFiles[]; the test against max_safe_fds prevents AllocateFile * allocatedFiles[]; the test against max_safe_fds prevents AllocateFile
* from hogging every one of the available FDs, which'd lead to infinite * from hogging every one of the available FDs, which'd lead to infinite
* looping. * looping.
*/ */
if (numAllocatedFiles >= MAX_ALLOCATED_FILES || if (numAllocatedDescs >= MAX_ALLOCATED_DESCS ||
numAllocatedFiles + numAllocatedDirs >= max_safe_fds - 1) numAllocatedDescs >= max_safe_fds - 1)
elog(ERROR, "too many private files demanded"); elog(ERROR, "too many private files demanded");
TryAgain: TryAgain:
if ((file = fopen(name, mode)) != NULL) if ((file = fopen(name, mode)) != NULL)
{ {
allocatedFiles[numAllocatedFiles] = file; AllocateDesc *desc = &allocatedDescs[numAllocatedDescs];
numAllocatedFiles++;
return file; desc->kind = AllocateDescFile;
desc->desc.file = file;
desc->create_xid = GetCurrentTransactionId();
numAllocatedDescs++;
return desc->desc.file;
} }
if (errno == EMFILE || errno == ENFILE) if (errno == EMFILE || errno == ENFILE)
...@@ -1170,6 +1184,38 @@ TryAgain: ...@@ -1170,6 +1184,38 @@ TryAgain:
return NULL; return NULL;
} }
/*
* Free an AllocateDesc of either type.
*
* The argument *must* point into the allocatedDescs[] array.
*/
static int
FreeDesc(AllocateDesc *desc)
{
int result;
/* Close the underlying object */
switch (desc->kind)
{
case AllocateDescFile:
result = fclose(desc->desc.file);
break;
case AllocateDescDir:
result = closedir(desc->desc.dir);
break;
default:
elog(ERROR, "AllocateDesc kind not recognized");
result = 0; /* keep compiler quiet */
break;
}
/* Compact storage in the allocatedDescs array */
numAllocatedDescs--;
*desc = allocatedDescs[numAllocatedDescs];
return result;
}
/* /*
* Close a file returned by AllocateFile. * Close a file returned by AllocateFile.
* *
...@@ -1181,19 +1227,18 @@ FreeFile(FILE *file) ...@@ -1181,19 +1227,18 @@ FreeFile(FILE *file)
{ {
int i; int i;
DO_DB(elog(LOG, "FreeFile: Allocated %d", numAllocatedFiles)); DO_DB(elog(LOG, "FreeFile: Allocated %d", numAllocatedDescs));
/* Remove file from list of allocated files, if it's present */ /* Remove file from list of allocated files, if it's present */
for (i = numAllocatedFiles; --i >= 0;) for (i = numAllocatedDescs; --i >= 0;)
{ {
if (allocatedFiles[i] == file) AllocateDesc *desc = &allocatedDescs[i];
{
numAllocatedFiles--; if (desc->kind == AllocateDescFile && desc->desc.file == file)
allocatedFiles[i] = allocatedFiles[numAllocatedFiles]; return FreeDesc(desc);
break;
}
} }
if (i < 0)
/* Only get here if someone passes us a file not in allocatedDescs */
elog(WARNING, "file passed to FreeFile was not obtained from AllocateFile"); elog(WARNING, "file passed to FreeFile was not obtained from AllocateFile");
return fclose(file); return fclose(file);
...@@ -1213,24 +1258,29 @@ AllocateDir(const char *dirname) ...@@ -1213,24 +1258,29 @@ AllocateDir(const char *dirname)
{ {
DIR *dir; DIR *dir;
DO_DB(elog(LOG, "AllocateDir: Allocated %d", numAllocatedDirs)); DO_DB(elog(LOG, "AllocateDir: Allocated %d (%s)",
numAllocatedDescs, dirname));
/* /*
* The test against MAX_ALLOCATED_DIRS prevents us from overflowing * The test against MAX_ALLOCATED_DESCS prevents us from overflowing
* allocatedDirs[]; the test against max_safe_fds prevents AllocateDir * allocatedDescs[]; the test against max_safe_fds prevents AllocateDir
* from hogging every one of the available FDs, which'd lead to infinite * from hogging every one of the available FDs, which'd lead to infinite
* looping. * looping.
*/ */
if (numAllocatedDirs >= MAX_ALLOCATED_DIRS || if (numAllocatedDescs >= MAX_ALLOCATED_DESCS ||
numAllocatedDirs + numAllocatedFiles >= max_safe_fds - 1) numAllocatedDescs >= max_safe_fds - 1)
elog(ERROR, "too many private dirs demanded"); elog(ERROR, "too many private dirs demanded");
TryAgain: TryAgain:
if ((dir = opendir(dirname)) != NULL) if ((dir = opendir(dirname)) != NULL)
{ {
allocatedDirs[numAllocatedDirs] = dir; AllocateDesc *desc = &allocatedDescs[numAllocatedDescs];
numAllocatedDirs++;
return dir; desc->kind = AllocateDescDir;
desc->desc.dir = dir;
desc->create_xid = GetCurrentTransactionId();
numAllocatedDescs++;
return desc->desc.dir;
} }
if (errno == EMFILE || errno == ENFILE) if (errno == EMFILE || errno == ENFILE)
...@@ -1260,19 +1310,18 @@ FreeDir(DIR *dir) ...@@ -1260,19 +1310,18 @@ FreeDir(DIR *dir)
{ {
int i; int i;
DO_DB(elog(LOG, "FreeDir: Allocated %d", numAllocatedDirs)); DO_DB(elog(LOG, "FreeDir: Allocated %d", numAllocatedDescs));
/* Remove dir from list of allocated dirs, if it's present */ /* Remove dir from list of allocated dirs, if it's present */
for (i = numAllocatedDirs; --i >= 0;) for (i = numAllocatedDescs; --i >= 0;)
{ {
if (allocatedDirs[i] == dir) AllocateDesc *desc = &allocatedDescs[i];
{
numAllocatedDirs--; if (desc->kind == AllocateDescDir && desc->desc.dir == dir)
allocatedDirs[i] = allocatedDirs[numAllocatedDirs]; return FreeDesc(desc);
break;
}
} }
if (i < 0)
/* Only get here if someone passes us a dir not in allocatedDescs */
elog(WARNING, "dir passed to FreeDir was not obtained from AllocateDir"); elog(WARNING, "dir passed to FreeDir was not obtained from AllocateDir");
return closedir(dir); return closedir(dir);
...@@ -1302,6 +1351,51 @@ closeAllVfds(void) ...@@ -1302,6 +1351,51 @@ closeAllVfds(void)
} }
} }
/*
* AtEOSubXact_Files
*
* Take care of subtransaction commit/abort. At abort, we close temp files
* that the subtransaction may have opened. At commit, we reassign the
* files that were opened to the parent transaction.
*/
void
AtEOSubXact_Files(bool isCommit, TransactionId myXid, TransactionId parentXid)
{
Index i;
if (SizeVfdCache > 0)
{
Assert(FileIsNotOpen(0)); /* Make sure ring not corrupted */
for (i = 1; i < SizeVfdCache; i++)
{
unsigned short fdstate = VfdCache[i].fdstate;
if ((fdstate & FD_XACT_TEMPORARY) &&
VfdCache[i].create_xid == myXid)
{
if (isCommit)
VfdCache[i].create_xid = parentXid;
else if (VfdCache[i].fileName != NULL)
FileClose(i);
}
}
}
for (i = 0; i < numAllocatedDescs; i++)
{
if (allocatedDescs[i].create_xid == myXid)
{
if (isCommit)
allocatedDescs[i].create_xid = parentXid;
else
{
/* have to recheck the item after FreeDesc (ugly) */
FreeDesc(&allocatedDescs[i--]);
}
}
}
}
/* /*
* AtEOXact_Files * AtEOXact_Files
* *
...@@ -1362,11 +1456,8 @@ CleanupTempFiles(bool isProcExit) ...@@ -1362,11 +1456,8 @@ CleanupTempFiles(bool isProcExit)
} }
} }
while (numAllocatedFiles > 0) while (numAllocatedDescs > 0)
FreeFile(allocatedFiles[0]); FreeDesc(&allocatedDescs[0]);
while (numAllocatedDirs > 0)
FreeDir(allocatedDirs[0]);
} }
......
...@@ -9,36 +9,92 @@ ...@@ -9,36 +9,92 @@
* *
* *
* IDENTIFICATION * IDENTIFICATION
* $PostgreSQL: pgsql/src/backend/storage/large_object/inv_api.c,v 1.102 2003/11/29 19:51:56 pgsql Exp $ * $PostgreSQL: pgsql/src/backend/storage/large_object/inv_api.c,v 1.103 2004/07/28 14:23:29 tgl Exp $
* *
*------------------------------------------------------------------------- *-------------------------------------------------------------------------
*/ */
#include "postgres.h" #include "postgres.h"
#include <errno.h>
#include <sys/file.h>
#include <sys/stat.h>
#include "access/genam.h" #include "access/genam.h"
#include "access/heapam.h" #include "access/heapam.h"
#include "access/htup.h"
#include "access/tuptoaster.h" #include "access/tuptoaster.h"
#include "catalog/catalog.h" #include "catalog/catalog.h"
#include "catalog/catname.h" #include "catalog/catname.h"
#include "catalog/heap.h"
#include "catalog/index.h"
#include "catalog/indexing.h" #include "catalog/indexing.h"
#include "catalog/pg_opclass.h"
#include "catalog/pg_largeobject.h" #include "catalog/pg_largeobject.h"
#include "catalog/pg_type.h"
#include "commands/comment.h" #include "commands/comment.h"
#include "libpq/libpq-fs.h" #include "libpq/libpq-fs.h"
#include "miscadmin.h"
#include "storage/large_object.h" #include "storage/large_object.h"
#include "storage/smgr.h"
#include "utils/builtins.h"
#include "utils/fmgroids.h" #include "utils/fmgroids.h"
#include "utils/lsyscache.h" #include "utils/lsyscache.h"
#include "utils/resowner.h"
/*
* All accesses to pg_largeobject and its index make use of a single Relation
* reference, so that we only need to open pg_relation once per transaction.
* To avoid problems when the first such reference occurs inside a
* subtransaction, we execute a slightly klugy maneuver to assign ownership of
* the Relation reference to TopTransactionResourceOwner.
*/
static Relation lo_heap_r = NULL;
static Relation lo_index_r = NULL;
/*
* Open pg_largeobject and its index, if not already done in current xact
*/
static void
open_lo_relation(void)
{
ResourceOwner currentOwner;
if (lo_heap_r && lo_index_r)
return; /* already open in current xact */
/* Arrange for the top xact to own these relation references */
currentOwner = CurrentResourceOwner;
CurrentResourceOwner = TopTransactionResourceOwner;
/* Use RowExclusiveLock since we might either read or write */
if (lo_heap_r == NULL)
lo_heap_r = heap_openr(LargeObjectRelationName, RowExclusiveLock);
if (lo_index_r == NULL)
lo_index_r = index_openr(LargeObjectLOidPNIndex);
CurrentResourceOwner = currentOwner;
}
/*
* Clean up at main transaction end
*/
void
close_lo_relation(bool isCommit)
{
if (lo_heap_r || lo_index_r)
{
/*
* Only bother to close if committing; else abort cleanup will
* handle it
*/
if (isCommit)
{
ResourceOwner currentOwner;
currentOwner = CurrentResourceOwner;
CurrentResourceOwner = TopTransactionResourceOwner;
if (lo_index_r)
index_close(lo_index_r);
if (lo_heap_r)
heap_close(lo_heap_r, NoLock);
CurrentResourceOwner = currentOwner;
}
lo_heap_r = NULL;
lo_index_r = NULL;
}
}
static int32 static int32
...@@ -50,6 +106,7 @@ getbytealen(bytea *data) ...@@ -50,6 +106,7 @@ getbytealen(bytea *data)
return (VARSIZE(data) - VARHDRSZ); return (VARSIZE(data) - VARHDRSZ);
} }
/* /*
* inv_create -- create a new large object. * inv_create -- create a new large object.
* *
...@@ -92,23 +149,20 @@ inv_create(int flags) ...@@ -92,23 +149,20 @@ inv_create(int flags)
retval = (LargeObjectDesc *) palloc(sizeof(LargeObjectDesc)); retval = (LargeObjectDesc *) palloc(sizeof(LargeObjectDesc));
retval->id = file_oid; retval->id = file_oid;
retval->xid = GetCurrentTransactionId();
retval->offset = 0; retval->offset = 0;
if (flags & INV_WRITE) if (flags & INV_WRITE)
{ {
retval->flags = IFS_WRLOCK | IFS_RDLOCK; retval->flags = IFS_WRLOCK | IFS_RDLOCK;
retval->heap_r = heap_openr(LargeObjectRelationName, RowExclusiveLock);
} }
else if (flags & INV_READ) else if (flags & INV_READ)
{ {
retval->flags = IFS_RDLOCK; retval->flags = IFS_RDLOCK;
retval->heap_r = heap_openr(LargeObjectRelationName, AccessShareLock);
} }
else else
elog(ERROR, "invalid flags: %d", flags); elog(ERROR, "invalid flags: %d", flags);
retval->index_r = index_openr(LargeObjectLOidPNIndex);
return retval; return retval;
} }
...@@ -131,23 +185,20 @@ inv_open(Oid lobjId, int flags) ...@@ -131,23 +185,20 @@ inv_open(Oid lobjId, int flags)
retval = (LargeObjectDesc *) palloc(sizeof(LargeObjectDesc)); retval = (LargeObjectDesc *) palloc(sizeof(LargeObjectDesc));
retval->id = lobjId; retval->id = lobjId;
retval->xid = GetCurrentTransactionId();
retval->offset = 0; retval->offset = 0;
if (flags & INV_WRITE) if (flags & INV_WRITE)
{ {
retval->flags = IFS_WRLOCK | IFS_RDLOCK; retval->flags = IFS_WRLOCK | IFS_RDLOCK;
retval->heap_r = heap_openr(LargeObjectRelationName, RowExclusiveLock);
} }
else if (flags & INV_READ) else if (flags & INV_READ)
{ {
retval->flags = IFS_RDLOCK; retval->flags = IFS_RDLOCK;
retval->heap_r = heap_openr(LargeObjectRelationName, AccessShareLock);
} }
else else
elog(ERROR, "invalid flags: %d", flags); elog(ERROR, "invalid flags: %d", flags);
retval->index_r = index_openr(LargeObjectLOidPNIndex);
return retval; return retval;
} }
...@@ -158,13 +209,6 @@ void ...@@ -158,13 +209,6 @@ void
inv_close(LargeObjectDesc *obj_desc) inv_close(LargeObjectDesc *obj_desc)
{ {
Assert(PointerIsValid(obj_desc)); Assert(PointerIsValid(obj_desc));
if (obj_desc->flags & IFS_WRLOCK)
heap_close(obj_desc->heap_r, RowExclusiveLock);
else if (obj_desc->flags & IFS_RDLOCK)
heap_close(obj_desc->heap_r, AccessShareLock);
index_close(obj_desc->index_r);
pfree(obj_desc); pfree(obj_desc);
} }
...@@ -212,12 +256,14 @@ inv_getsize(LargeObjectDesc *obj_desc) ...@@ -212,12 +256,14 @@ inv_getsize(LargeObjectDesc *obj_desc)
Assert(PointerIsValid(obj_desc)); Assert(PointerIsValid(obj_desc));
open_lo_relation();
ScanKeyInit(&skey[0], ScanKeyInit(&skey[0],
Anum_pg_largeobject_loid, Anum_pg_largeobject_loid,
BTEqualStrategyNumber, F_OIDEQ, BTEqualStrategyNumber, F_OIDEQ,
ObjectIdGetDatum(obj_desc->id)); ObjectIdGetDatum(obj_desc->id));
sd = index_beginscan(obj_desc->heap_r, obj_desc->index_r, sd = index_beginscan(lo_heap_r, lo_index_r,
SnapshotNow, 1, skey); SnapshotNow, 1, skey);
/* /*
...@@ -316,6 +362,8 @@ inv_read(LargeObjectDesc *obj_desc, char *buf, int nbytes) ...@@ -316,6 +362,8 @@ inv_read(LargeObjectDesc *obj_desc, char *buf, int nbytes)
if (nbytes <= 0) if (nbytes <= 0)
return 0; return 0;
open_lo_relation();
ScanKeyInit(&skey[0], ScanKeyInit(&skey[0],
Anum_pg_largeobject_loid, Anum_pg_largeobject_loid,
BTEqualStrategyNumber, F_OIDEQ, BTEqualStrategyNumber, F_OIDEQ,
...@@ -326,7 +374,7 @@ inv_read(LargeObjectDesc *obj_desc, char *buf, int nbytes) ...@@ -326,7 +374,7 @@ inv_read(LargeObjectDesc *obj_desc, char *buf, int nbytes)
BTGreaterEqualStrategyNumber, F_INT4GE, BTGreaterEqualStrategyNumber, F_INT4GE,
Int32GetDatum(pageno)); Int32GetDatum(pageno));
sd = index_beginscan(obj_desc->heap_r, obj_desc->index_r, sd = index_beginscan(lo_heap_r, lo_index_r,
SnapshotNow, 2, skey); SnapshotNow, 2, skey);
while ((tuple = index_getnext(sd, ForwardScanDirection)) != NULL) while ((tuple = index_getnext(sd, ForwardScanDirection)) != NULL)
...@@ -421,7 +469,9 @@ inv_write(LargeObjectDesc *obj_desc, char *buf, int nbytes) ...@@ -421,7 +469,9 @@ inv_write(LargeObjectDesc *obj_desc, char *buf, int nbytes)
if (nbytes <= 0) if (nbytes <= 0)
return 0; return 0;
indstate = CatalogOpenIndexes(obj_desc->heap_r); open_lo_relation();
indstate = CatalogOpenIndexes(lo_heap_r);
ScanKeyInit(&skey[0], ScanKeyInit(&skey[0],
Anum_pg_largeobject_loid, Anum_pg_largeobject_loid,
...@@ -433,7 +483,7 @@ inv_write(LargeObjectDesc *obj_desc, char *buf, int nbytes) ...@@ -433,7 +483,7 @@ inv_write(LargeObjectDesc *obj_desc, char *buf, int nbytes)
BTGreaterEqualStrategyNumber, F_INT4GE, BTGreaterEqualStrategyNumber, F_INT4GE,
Int32GetDatum(pageno)); Int32GetDatum(pageno));
sd = index_beginscan(obj_desc->heap_r, obj_desc->index_r, sd = index_beginscan(lo_heap_r, lo_index_r,
SnapshotNow, 2, skey); SnapshotNow, 2, skey);
oldtuple = NULL; oldtuple = NULL;
...@@ -510,9 +560,9 @@ inv_write(LargeObjectDesc *obj_desc, char *buf, int nbytes) ...@@ -510,9 +560,9 @@ inv_write(LargeObjectDesc *obj_desc, char *buf, int nbytes)
memset(replace, ' ', sizeof(replace)); memset(replace, ' ', sizeof(replace));
values[Anum_pg_largeobject_data - 1] = PointerGetDatum(&workbuf); values[Anum_pg_largeobject_data - 1] = PointerGetDatum(&workbuf);
replace[Anum_pg_largeobject_data - 1] = 'r'; replace[Anum_pg_largeobject_data - 1] = 'r';
newtup = heap_modifytuple(oldtuple, obj_desc->heap_r, newtup = heap_modifytuple(oldtuple, lo_heap_r,
values, nulls, replace); values, nulls, replace);
simple_heap_update(obj_desc->heap_r, &newtup->t_self, newtup); simple_heap_update(lo_heap_r, &newtup->t_self, newtup);
CatalogIndexInsert(indstate, newtup); CatalogIndexInsert(indstate, newtup);
heap_freetuple(newtup); heap_freetuple(newtup);
...@@ -554,8 +604,8 @@ inv_write(LargeObjectDesc *obj_desc, char *buf, int nbytes) ...@@ -554,8 +604,8 @@ inv_write(LargeObjectDesc *obj_desc, char *buf, int nbytes)
values[Anum_pg_largeobject_loid - 1] = ObjectIdGetDatum(obj_desc->id); values[Anum_pg_largeobject_loid - 1] = ObjectIdGetDatum(obj_desc->id);
values[Anum_pg_largeobject_pageno - 1] = Int32GetDatum(pageno); values[Anum_pg_largeobject_pageno - 1] = Int32GetDatum(pageno);
values[Anum_pg_largeobject_data - 1] = PointerGetDatum(&workbuf); values[Anum_pg_largeobject_data - 1] = PointerGetDatum(&workbuf);
newtup = heap_formtuple(obj_desc->heap_r->rd_att, values, nulls); newtup = heap_formtuple(lo_heap_r->rd_att, values, nulls);
simple_heap_insert(obj_desc->heap_r, newtup); simple_heap_insert(lo_heap_r, newtup);
CatalogIndexInsert(indstate, newtup); CatalogIndexInsert(indstate, newtup);
heap_freetuple(newtup); heap_freetuple(newtup);
} }
......
...@@ -8,7 +8,7 @@ ...@@ -8,7 +8,7 @@
* *
* *
* IDENTIFICATION * IDENTIFICATION
* $PostgreSQL: pgsql/src/backend/storage/lmgr/lmgr.c,v 1.65 2004/07/27 05:10:58 tgl Exp $ * $PostgreSQL: pgsql/src/backend/storage/lmgr/lmgr.c,v 1.66 2004/07/28 14:23:29 tgl Exp $
* *
*------------------------------------------------------------------------- *-------------------------------------------------------------------------
*/ */
...@@ -137,7 +137,7 @@ LockRelation(Relation relation, LOCKMODE lockmode) ...@@ -137,7 +137,7 @@ LockRelation(Relation relation, LOCKMODE lockmode)
tag.dbId = relation->rd_lockInfo.lockRelId.dbId; tag.dbId = relation->rd_lockInfo.lockRelId.dbId;
tag.objId.blkno = InvalidBlockNumber; tag.objId.blkno = InvalidBlockNumber;
if (!LockAcquire(LockTableId, &tag, GetCurrentTransactionId(), if (!LockAcquire(LockTableId, &tag, GetTopTransactionId(),
lockmode, false)) lockmode, false))
elog(ERROR, "LockAcquire failed"); elog(ERROR, "LockAcquire failed");
...@@ -171,7 +171,7 @@ ConditionalLockRelation(Relation relation, LOCKMODE lockmode) ...@@ -171,7 +171,7 @@ ConditionalLockRelation(Relation relation, LOCKMODE lockmode)
tag.dbId = relation->rd_lockInfo.lockRelId.dbId; tag.dbId = relation->rd_lockInfo.lockRelId.dbId;
tag.objId.blkno = InvalidBlockNumber; tag.objId.blkno = InvalidBlockNumber;
if (!LockAcquire(LockTableId, &tag, GetCurrentTransactionId(), if (!LockAcquire(LockTableId, &tag, GetTopTransactionId(),
lockmode, true)) lockmode, true))
return false; return false;
...@@ -201,7 +201,7 @@ UnlockRelation(Relation relation, LOCKMODE lockmode) ...@@ -201,7 +201,7 @@ UnlockRelation(Relation relation, LOCKMODE lockmode)
tag.dbId = relation->rd_lockInfo.lockRelId.dbId; tag.dbId = relation->rd_lockInfo.lockRelId.dbId;
tag.objId.blkno = InvalidBlockNumber; tag.objId.blkno = InvalidBlockNumber;
LockRelease(LockTableId, &tag, GetCurrentTransactionId(), lockmode); LockRelease(LockTableId, &tag, GetTopTransactionId(), lockmode);
} }
/* /*
...@@ -264,7 +264,7 @@ LockPage(Relation relation, BlockNumber blkno, LOCKMODE lockmode) ...@@ -264,7 +264,7 @@ LockPage(Relation relation, BlockNumber blkno, LOCKMODE lockmode)
tag.dbId = relation->rd_lockInfo.lockRelId.dbId; tag.dbId = relation->rd_lockInfo.lockRelId.dbId;
tag.objId.blkno = blkno; tag.objId.blkno = blkno;
if (!LockAcquire(LockTableId, &tag, GetCurrentTransactionId(), if (!LockAcquire(LockTableId, &tag, GetTopTransactionId(),
lockmode, false)) lockmode, false))
elog(ERROR, "LockAcquire failed"); elog(ERROR, "LockAcquire failed");
} }
...@@ -285,7 +285,7 @@ ConditionalLockPage(Relation relation, BlockNumber blkno, LOCKMODE lockmode) ...@@ -285,7 +285,7 @@ ConditionalLockPage(Relation relation, BlockNumber blkno, LOCKMODE lockmode)
tag.dbId = relation->rd_lockInfo.lockRelId.dbId; tag.dbId = relation->rd_lockInfo.lockRelId.dbId;
tag.objId.blkno = blkno; tag.objId.blkno = blkno;
return LockAcquire(LockTableId, &tag, GetCurrentTransactionId(), return LockAcquire(LockTableId, &tag, GetTopTransactionId(),
lockmode, true); lockmode, true);
} }
...@@ -302,7 +302,7 @@ UnlockPage(Relation relation, BlockNumber blkno, LOCKMODE lockmode) ...@@ -302,7 +302,7 @@ UnlockPage(Relation relation, BlockNumber blkno, LOCKMODE lockmode)
tag.dbId = relation->rd_lockInfo.lockRelId.dbId; tag.dbId = relation->rd_lockInfo.lockRelId.dbId;
tag.objId.blkno = blkno; tag.objId.blkno = blkno;
LockRelease(LockTableId, &tag, GetCurrentTransactionId(), lockmode); LockRelease(LockTableId, &tag, GetTopTransactionId(), lockmode);
} }
/* /*
...@@ -343,7 +343,7 @@ void ...@@ -343,7 +343,7 @@ void
XactLockTableWait(TransactionId xid) XactLockTableWait(TransactionId xid)
{ {
LOCKTAG tag; LOCKTAG tag;
TransactionId myxid = GetCurrentTransactionId(); TransactionId myxid = GetTopTransactionId();
Assert(!SubTransXidsHaveCommonAncestor(xid, myxid)); Assert(!SubTransXidsHaveCommonAncestor(xid, myxid));
......
...@@ -80,7 +80,7 @@ ...@@ -80,7 +80,7 @@
* Portions Copyright (c) 1994, Regents of the University of California * Portions Copyright (c) 1994, Regents of the University of California
* *
* IDENTIFICATION * IDENTIFICATION
* $PostgreSQL: pgsql/src/backend/utils/cache/inval.c,v 1.63 2004/07/01 00:51:17 tgl Exp $ * $PostgreSQL: pgsql/src/backend/utils/cache/inval.c,v 1.64 2004/07/28 14:23:29 tgl Exp $
* *
*------------------------------------------------------------------------- *-------------------------------------------------------------------------
*/ */
...@@ -678,7 +678,7 @@ AtEOXact_Inval(bool isCommit) ...@@ -678,7 +678,7 @@ AtEOXact_Inval(bool isCommit)
} }
/* /*
* AtSubEOXact_Inval * AtEOSubXact_Inval
* Process queued-up invalidation messages at end of subtransaction. * Process queued-up invalidation messages at end of subtransaction.
* *
* If isCommit, process CurrentCmdInvalidMsgs if any (there probably aren't), * If isCommit, process CurrentCmdInvalidMsgs if any (there probably aren't),
...@@ -695,7 +695,7 @@ AtEOXact_Inval(bool isCommit) ...@@ -695,7 +695,7 @@ AtEOXact_Inval(bool isCommit)
* (if aborting). * (if aborting).
*/ */
void void
AtSubEOXact_Inval(bool isCommit) AtEOSubXact_Inval(bool isCommit)
{ {
TransInvalidationInfo *myInfo = transInvalInfo; TransInvalidationInfo *myInfo = transInvalInfo;
......
...@@ -10,7 +10,7 @@ ...@@ -10,7 +10,7 @@
* Written by Peter Eisentraut <peter_e@gmx.net>. * Written by Peter Eisentraut <peter_e@gmx.net>.
* *
* IDENTIFICATION * IDENTIFICATION
* $PostgreSQL: pgsql/src/backend/utils/misc/guc.c,v 1.224 2004/07/24 19:51:23 tgl Exp $ * $PostgreSQL: pgsql/src/backend/utils/misc/guc.c,v 1.225 2004/07/28 14:23:29 tgl Exp $
* *
*-------------------------------------------------------------------- *--------------------------------------------------------------------
*/ */
...@@ -5436,10 +5436,15 @@ assign_log_stats(bool newval, bool doit, GucSource source) ...@@ -5436,10 +5436,15 @@ assign_log_stats(bool newval, bool doit, GucSource source)
static bool static bool
assign_transaction_read_only(bool newval, bool doit, GucSource source) assign_transaction_read_only(bool newval, bool doit, GucSource source)
{ {
if (doit && source >= PGC_S_INTERACTIVE && IsSubTransaction()) /* Can't go to r/w mode inside a r/o transaction */
if (newval == false && XactReadOnly && IsSubTransaction())
{
if (source >= PGC_S_INTERACTIVE)
ereport(ERROR, ereport(ERROR,
(errcode(ERRCODE_INVALID_PARAMETER_VALUE), (errcode(ERRCODE_INVALID_PARAMETER_VALUE),
errmsg("cannot set transaction read only mode inside a subtransaction"))); errmsg("cannot set transaction read-write mode inside a read-only transaction")));
return false;
}
return true; return true;
} }
......
...@@ -16,7 +16,7 @@ ...@@ -16,7 +16,7 @@
* Portions Copyright (c) 1994, Regents of the University of California * Portions Copyright (c) 1994, Regents of the University of California
* *
* IDENTIFICATION * IDENTIFICATION
* $PostgreSQL: pgsql/src/backend/utils/time/tqual.c,v 1.73 2004/07/01 00:51:33 tgl Exp $ * $PostgreSQL: pgsql/src/backend/utils/time/tqual.c,v 1.74 2004/07/28 14:23:30 tgl Exp $
* *
*------------------------------------------------------------------------- *-------------------------------------------------------------------------
*/ */
...@@ -118,7 +118,10 @@ HeapTupleSatisfiesItself(HeapTupleHeader tuple) ...@@ -118,7 +118,10 @@ HeapTupleSatisfiesItself(HeapTupleHeader tuple)
/* deleting subtransaction aborted */ /* deleting subtransaction aborted */
if (TransactionIdDidAbort(HeapTupleHeaderGetXmax(tuple))) if (TransactionIdDidAbort(HeapTupleHeaderGetXmax(tuple)))
{
tuple->t_infomask |= HEAP_XMAX_INVALID;
return true; return true;
}
Assert(TransactionIdIsCurrentTransactionId(HeapTupleHeaderGetXmax(tuple))); Assert(TransactionIdIsCurrentTransactionId(HeapTupleHeaderGetXmax(tuple)));
...@@ -268,7 +271,10 @@ HeapTupleSatisfiesNow(HeapTupleHeader tuple) ...@@ -268,7 +271,10 @@ HeapTupleSatisfiesNow(HeapTupleHeader tuple)
/* deleting subtransaction aborted */ /* deleting subtransaction aborted */
if (TransactionIdDidAbort(HeapTupleHeaderGetXmax(tuple))) if (TransactionIdDidAbort(HeapTupleHeaderGetXmax(tuple)))
{
tuple->t_infomask |= HEAP_XMAX_INVALID;
return true; return true;
}
Assert(TransactionIdIsCurrentTransactionId(HeapTupleHeaderGetXmax(tuple))); Assert(TransactionIdIsCurrentTransactionId(HeapTupleHeaderGetXmax(tuple)));
...@@ -452,7 +458,10 @@ HeapTupleSatisfiesUpdate(HeapTupleHeader tuple, CommandId curcid) ...@@ -452,7 +458,10 @@ HeapTupleSatisfiesUpdate(HeapTupleHeader tuple, CommandId curcid)
/* deleting subtransaction aborted */ /* deleting subtransaction aborted */
if (TransactionIdDidAbort(HeapTupleHeaderGetXmax(tuple))) if (TransactionIdDidAbort(HeapTupleHeaderGetXmax(tuple)))
{
tuple->t_infomask |= HEAP_XMAX_INVALID;
return HeapTupleMayBeUpdated; return HeapTupleMayBeUpdated;
}
Assert(TransactionIdIsCurrentTransactionId(HeapTupleHeaderGetXmax(tuple))); Assert(TransactionIdIsCurrentTransactionId(HeapTupleHeaderGetXmax(tuple)));
...@@ -590,7 +599,10 @@ HeapTupleSatisfiesDirty(HeapTupleHeader tuple) ...@@ -590,7 +599,10 @@ HeapTupleSatisfiesDirty(HeapTupleHeader tuple)
/* deleting subtransaction aborted */ /* deleting subtransaction aborted */
if (TransactionIdDidAbort(HeapTupleHeaderGetXmax(tuple))) if (TransactionIdDidAbort(HeapTupleHeaderGetXmax(tuple)))
{
tuple->t_infomask |= HEAP_XMAX_INVALID;
return true; return true;
}
Assert(TransactionIdIsCurrentTransactionId(HeapTupleHeaderGetXmax(tuple))); Assert(TransactionIdIsCurrentTransactionId(HeapTupleHeaderGetXmax(tuple)));
...@@ -732,7 +744,10 @@ HeapTupleSatisfiesSnapshot(HeapTupleHeader tuple, Snapshot snapshot) ...@@ -732,7 +744,10 @@ HeapTupleSatisfiesSnapshot(HeapTupleHeader tuple, Snapshot snapshot)
/* deleting subtransaction aborted */ /* deleting subtransaction aborted */
/* FIXME -- is this correct w.r.t. the cmax of the tuple? */ /* FIXME -- is this correct w.r.t. the cmax of the tuple? */
if (TransactionIdDidAbort(HeapTupleHeaderGetXmax(tuple))) if (TransactionIdDidAbort(HeapTupleHeaderGetXmax(tuple)))
{
tuple->t_infomask |= HEAP_XMAX_INVALID;
return true; return true;
}
Assert(TransactionIdIsCurrentTransactionId(HeapTupleHeaderGetXmax(tuple))); Assert(TransactionIdIsCurrentTransactionId(HeapTupleHeaderGetXmax(tuple)));
...@@ -757,23 +772,38 @@ HeapTupleSatisfiesSnapshot(HeapTupleHeader tuple, Snapshot snapshot) ...@@ -757,23 +772,38 @@ HeapTupleSatisfiesSnapshot(HeapTupleHeader tuple, Snapshot snapshot)
/* /*
* By here, the inserting transaction has committed - have to check * By here, the inserting transaction has committed - have to check
* when... * when...
*
* Note that the provided snapshot contains only top-level XIDs, so
* we have to convert a subxact XID to its parent for comparison.
* However, we can make first-pass range checks with the given XID,
* because a subxact with XID < xmin has surely also got a parent with
* XID < xmin, while one with XID >= xmax must belong to a parent that
* was not yet committed at the time of this snapshot.
*/ */
if (TransactionIdFollowsOrEquals(HeapTupleHeaderGetXmin(tuple), if (TransactionIdFollowsOrEquals(HeapTupleHeaderGetXmin(tuple),
snapshot->xmin)) snapshot->xmin))
{ {
uint32 i; TransactionId parentXid;
if (TransactionIdFollowsOrEquals(HeapTupleHeaderGetXmin(tuple), if (TransactionIdFollowsOrEquals(HeapTupleHeaderGetXmin(tuple),
snapshot->xmax)) snapshot->xmax))
return false; return false;
parentXid = SubTransGetTopmostTransaction(HeapTupleHeaderGetXmin(tuple));
if (TransactionIdFollowsOrEquals(parentXid, snapshot->xmin))
{
uint32 i;
/* no point in checking parentXid against xmax here */
for (i = 0; i < snapshot->xcnt; i++) for (i = 0; i < snapshot->xcnt; i++)
{ {
if (SubTransXidsHaveCommonAncestor(HeapTupleHeaderGetXmin(tuple), if (TransactionIdEquals(parentXid, snapshot->xip[i]))
snapshot->xip[i]))
return false; return false;
} }
} }
}
if (tuple->t_infomask & HEAP_XMAX_INVALID) /* xid invalid or aborted */ if (tuple->t_infomask & HEAP_XMAX_INVALID) /* xid invalid or aborted */
return true; return true;
...@@ -804,20 +834,33 @@ HeapTupleSatisfiesSnapshot(HeapTupleHeader tuple, Snapshot snapshot) ...@@ -804,20 +834,33 @@ HeapTupleSatisfiesSnapshot(HeapTupleHeader tuple, Snapshot snapshot)
/* /*
* OK, the deleting transaction committed too ... but when? * OK, the deleting transaction committed too ... but when?
*
* See notes for the similar tests on tuple xmin, above.
*/ */
if (TransactionIdFollowsOrEquals(HeapTupleHeaderGetXmax(tuple), snapshot->xmin)) if (TransactionIdFollowsOrEquals(HeapTupleHeaderGetXmax(tuple),
snapshot->xmin))
{ {
uint32 i; TransactionId parentXid;
if (TransactionIdFollowsOrEquals(HeapTupleHeaderGetXmax(tuple), if (TransactionIdFollowsOrEquals(HeapTupleHeaderGetXmax(tuple),
snapshot->xmax)) snapshot->xmax))
return true; return true;
parentXid = SubTransGetTopmostTransaction(HeapTupleHeaderGetXmax(tuple));
if (TransactionIdFollowsOrEquals(parentXid, snapshot->xmin))
{
uint32 i;
/* no point in checking parentXid against xmax here */
for (i = 0; i < snapshot->xcnt; i++) for (i = 0; i < snapshot->xcnt; i++)
{ {
if (SubTransXidsHaveCommonAncestor(HeapTupleHeaderGetXmax(tuple), snapshot->xip[i])) if (TransactionIdEquals(parentXid, snapshot->xip[i]))
return true; return true;
} }
} }
}
return false; return false;
} }
......
...@@ -3,7 +3,7 @@ ...@@ -3,7 +3,7 @@
* *
* Copyright (c) 2000-2003, PostgreSQL Global Development Group * Copyright (c) 2000-2003, PostgreSQL Global Development Group
* *
* $PostgreSQL: pgsql/src/bin/psql/tab-complete.c,v 1.108 2004/07/27 05:11:11 tgl Exp $ * $PostgreSQL: pgsql/src/bin/psql/tab-complete.c,v 1.109 2004/07/28 14:23:30 tgl Exp $
*/ */
/*---------------------------------------------------------------------- /*----------------------------------------------------------------------
...@@ -722,7 +722,7 @@ psql_completion(char *text, int start, int end) ...@@ -722,7 +722,7 @@ psql_completion(char *text, int start, int end)
else if (pg_strcasecmp(prev2_wd, "ANALYZE") == 0) else if (pg_strcasecmp(prev2_wd, "ANALYZE") == 0)
COMPLETE_WITH_CONST(";"); COMPLETE_WITH_CONST(";");
/* BEGIN, COMMIT, ABORT */ /* BEGIN, END, COMMIT, ABORT */
else if (pg_strcasecmp(prev_wd, "BEGIN") == 0 || else if (pg_strcasecmp(prev_wd, "BEGIN") == 0 ||
pg_strcasecmp(prev_wd, "END") == 0 || pg_strcasecmp(prev_wd, "END") == 0 ||
pg_strcasecmp(prev_wd, "COMMIT") == 0 || pg_strcasecmp(prev_wd, "COMMIT") == 0 ||
......
...@@ -7,7 +7,7 @@ ...@@ -7,7 +7,7 @@
* Portions Copyright (c) 1996-2003, PostgreSQL Global Development Group * Portions Copyright (c) 1996-2003, PostgreSQL Global Development Group
* Portions Copyright (c) 1994, Regents of the University of California * Portions Copyright (c) 1994, Regents of the University of California
* *
* $PostgreSQL: pgsql/src/include/catalog/namespace.h,v 1.30 2004/01/19 19:04:40 tgl Exp $ * $PostgreSQL: pgsql/src/include/catalog/namespace.h,v 1.31 2004/07/28 14:23:30 tgl Exp $
* *
*------------------------------------------------------------------------- *-------------------------------------------------------------------------
*/ */
...@@ -91,6 +91,8 @@ extern Oid FindDefaultConversionProc(int4 for_encoding, int4 to_encoding); ...@@ -91,6 +91,8 @@ extern Oid FindDefaultConversionProc(int4 for_encoding, int4 to_encoding);
/* initialization & transaction cleanup code */ /* initialization & transaction cleanup code */
extern void InitializeSearchPath(void); extern void InitializeSearchPath(void);
extern void AtEOXact_Namespace(bool isCommit); extern void AtEOXact_Namespace(bool isCommit);
extern void AtEOSubXact_Namespace(bool isCommit, TransactionId myXid,
TransactionId parentXid);
/* stuff for search_path GUC variable */ /* stuff for search_path GUC variable */
extern char *namespace_search_path; extern char *namespace_search_path;
......
...@@ -4,7 +4,7 @@ ...@@ -4,7 +4,7 @@
* Commands for manipulating users and groups. * Commands for manipulating users and groups.
* *
* *
* $PostgreSQL: pgsql/src/include/commands/user.h,v 1.22 2003/11/29 22:40:59 pgsql Exp $ * $PostgreSQL: pgsql/src/include/commands/user.h,v 1.23 2004/07/28 14:23:31 tgl Exp $
* *
*------------------------------------------------------------------------- *-------------------------------------------------------------------------
*/ */
...@@ -32,5 +32,7 @@ extern void RenameGroup(const char *oldname, const char *newname); ...@@ -32,5 +32,7 @@ extern void RenameGroup(const char *oldname, const char *newname);
extern Datum update_pg_pwd_and_pg_group(PG_FUNCTION_ARGS); extern Datum update_pg_pwd_and_pg_group(PG_FUNCTION_ARGS);
extern void AtEOXact_UpdatePasswordFile(bool isCommit); extern void AtEOXact_UpdatePasswordFile(bool isCommit);
extern void AtEOSubXact_UpdatePasswordFile(bool isCommit, TransactionId myXid,
TransactionId parentXid);
#endif /* USER_H */ #endif /* USER_H */
...@@ -7,7 +7,7 @@ ...@@ -7,7 +7,7 @@
* Portions Copyright (c) 1996-2003, PostgreSQL Global Development Group * Portions Copyright (c) 1996-2003, PostgreSQL Global Development Group
* Portions Copyright (c) 1994, Regents of the University of California * Portions Copyright (c) 1994, Regents of the University of California
* *
* $PostgreSQL: pgsql/src/include/libpq/be-fsstubs.h,v 1.18 2003/11/29 22:41:03 pgsql Exp $ * $PostgreSQL: pgsql/src/include/libpq/be-fsstubs.h,v 1.19 2004/07/28 14:23:31 tgl Exp $
* *
*------------------------------------------------------------------------- *-------------------------------------------------------------------------
*/ */
...@@ -43,8 +43,10 @@ extern int lo_read(int fd, char *buf, int len); ...@@ -43,8 +43,10 @@ extern int lo_read(int fd, char *buf, int len);
extern int lo_write(int fd, char *buf, int len); extern int lo_write(int fd, char *buf, int len);
/* /*
* Cleanup LOs at xact commit/abort [ Pascal Andr <andre@via.ecp.fr> ] * Cleanup LOs at xact commit/abort
*/ */
extern void lo_commit(bool isCommit); extern void AtEOXact_LargeObject(bool isCommit);
extern void AtEOSubXact_LargeObject(bool isCommit, TransactionId myXid,
TransactionId parentXid);
#endif /* BE_FSSTUBS_H */ #endif /* BE_FSSTUBS_H */
...@@ -7,7 +7,7 @@ ...@@ -7,7 +7,7 @@
* Portions Copyright (c) 1996-2003, PostgreSQL Global Development Group * Portions Copyright (c) 1996-2003, PostgreSQL Global Development Group
* Portions Copyright (c) 1994, Regents of the University of California * Portions Copyright (c) 1994, Regents of the University of California
* *
* $PostgreSQL: pgsql/src/include/storage/fd.h,v 1.45 2004/05/31 03:48:10 tgl Exp $ * $PostgreSQL: pgsql/src/include/storage/fd.h,v 1.46 2004/07/28 14:23:31 tgl Exp $
* *
*------------------------------------------------------------------------- *-------------------------------------------------------------------------
*/ */
...@@ -85,6 +85,8 @@ extern int BasicOpenFile(FileName fileName, int fileFlags, int fileMode); ...@@ -85,6 +85,8 @@ extern int BasicOpenFile(FileName fileName, int fileFlags, int fileMode);
extern void set_max_safe_fds(void); extern void set_max_safe_fds(void);
extern void closeAllVfds(void); extern void closeAllVfds(void);
extern void AtEOXact_Files(void); extern void AtEOXact_Files(void);
extern void AtEOSubXact_Files(bool isCommit, TransactionId myXid,
TransactionId parentXid);
extern void RemovePgTempFiles(void); extern void RemovePgTempFiles(void);
extern int pg_fsync(int fd); extern int pg_fsync(int fd);
extern int pg_fdatasync(int fd); extern int pg_fdatasync(int fd);
......
/*------------------------------------------------------------------------- /*-------------------------------------------------------------------------
* *
* large_object.h * large_object.h
* file of info for Postgres large objects. POSTGRES 4.2 supports * Declarations for PostgreSQL large objects. POSTGRES 4.2 supported
* zillions of large objects (internal, external, jaquith, inversion). * zillions of large objects (internal, external, jaquith, inversion).
* Now we only support inversion. * Now we only support inversion.
* *
* Portions Copyright (c) 1996-2003, PostgreSQL Global Development Group * Portions Copyright (c) 1996-2003, PostgreSQL Global Development Group
* Portions Copyright (c) 1994, Regents of the University of California * Portions Copyright (c) 1994, Regents of the University of California
* *
* $PostgreSQL: pgsql/src/include/storage/large_object.h,v 1.27 2003/11/29 22:41:13 pgsql Exp $ * $PostgreSQL: pgsql/src/include/storage/large_object.h,v 1.28 2004/07/28 14:23:31 tgl Exp $
* *
*------------------------------------------------------------------------- *-------------------------------------------------------------------------
*/ */
#ifndef LARGE_OBJECT_H #ifndef LARGE_OBJECT_H
#define LARGE_OBJECT_H #define LARGE_OBJECT_H
#include "utils/rel.h"
/*---------- /*----------
* Data about a currently-open large object. * Data about a currently-open large object.
* *
* id is the logical OID of the large object * id is the logical OID of the large object
* xid is the transaction Id that opened the LO (or currently owns it)
* offset is the current seek offset within the LO * offset is the current seek offset within the LO
* heap_r holds an open-relation reference to pg_largeobject * flags contains some flag bits
* index_r holds an open-relation reference to pg_largeobject_loid_pn_index
* *
* NOTE: before 7.1, heap_r and index_r held references to the separate * NOTE: before 7.1, we also had to store references to the separate table
* table and index of a specific large object. Now they all live in one rel. * and index of a specific large object. Now they all live in pg_largeobject
* and are accessed via a common relation descriptor.
*---------- *----------
*/ */
typedef struct LargeObjectDesc typedef struct LargeObjectDesc
{ {
Oid id; Oid id; /* LO's identifier */
TransactionId xid; /* owning XID */
uint32 offset; /* current seek pointer */ uint32 offset; /* current seek pointer */
int flags; /* locking info, etc */ int flags; /* locking info, etc */
/* flag bits: */ /* flag bits: */
#define IFS_RDLOCK (1 << 0) #define IFS_RDLOCK (1 << 0)
#define IFS_WRLOCK (1 << 1) #define IFS_WRLOCK (1 << 1)
Relation heap_r;
Relation index_r;
} LargeObjectDesc; } LargeObjectDesc;
...@@ -67,6 +64,7 @@ typedef struct LargeObjectDesc ...@@ -67,6 +64,7 @@ typedef struct LargeObjectDesc
*/ */
/* inversion stuff in inv_api.c */ /* inversion stuff in inv_api.c */
extern void close_lo_relation(bool isCommit);
extern LargeObjectDesc *inv_create(int flags); extern LargeObjectDesc *inv_create(int flags);
extern LargeObjectDesc *inv_open(Oid lobjId, int flags); extern LargeObjectDesc *inv_open(Oid lobjId, int flags);
extern void inv_close(LargeObjectDesc *obj_desc); extern void inv_close(LargeObjectDesc *obj_desc);
......
...@@ -7,7 +7,7 @@ ...@@ -7,7 +7,7 @@
* Portions Copyright (c) 1996-2003, PostgreSQL Global Development Group * Portions Copyright (c) 1996-2003, PostgreSQL Global Development Group
* Portions Copyright (c) 1994, Regents of the University of California * Portions Copyright (c) 1994, Regents of the University of California
* *
* $PostgreSQL: pgsql/src/include/utils/inval.h,v 1.32 2004/07/01 00:51:44 tgl Exp $ * $PostgreSQL: pgsql/src/include/utils/inval.h,v 1.33 2004/07/28 14:23:31 tgl Exp $
* *
*------------------------------------------------------------------------- *-------------------------------------------------------------------------
*/ */
...@@ -28,7 +28,7 @@ extern void AtSubStart_Inval(void); ...@@ -28,7 +28,7 @@ extern void AtSubStart_Inval(void);
extern void AtEOXact_Inval(bool isCommit); extern void AtEOXact_Inval(bool isCommit);
extern void AtSubEOXact_Inval(bool isCommit); extern void AtEOSubXact_Inval(bool isCommit);
extern void CommandEndInvalidationMessages(void); extern void CommandEndInvalidationMessages(void);
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment