Commit 7e3da1c4 authored by Kevin Grittner's avatar Kevin Grittner

Mitigate "snapshot too old" performance regression on NUMA

Limit maintenance of time to xid mapping to once per minute.  At
least in the tested case this brings performance within 5% of when
the feature is off, compared to several times slower without this
patch.

While there, fix comments and whitespace.

Ants Aasma, with cosmetic adjustments suggested by Andres Freund
Reviewed by Kevin Grittner and Andres Freund
parent eb7de00a
...@@ -78,10 +78,13 @@ typedef struct OldSnapshotControlData ...@@ -78,10 +78,13 @@ typedef struct OldSnapshotControlData
* Variables for old snapshot handling are shared among processes and are * Variables for old snapshot handling are shared among processes and are
* only allowed to move forward. * only allowed to move forward.
*/ */
slock_t mutex_current; /* protect current timestamp */ slock_t mutex_current; /* protect current_timestamp */
int64 current_timestamp; /* latest snapshot timestamp */ int64 current_timestamp; /* latest snapshot timestamp */
slock_t mutex_latest_xmin; /* protect latest snapshot xmin */ slock_t mutex_latest_xmin; /* protect latest_xmin
* and next_map_update
*/
TransactionId latest_xmin; /* latest snapshot xmin */ TransactionId latest_xmin; /* latest snapshot xmin */
int64 next_map_update; /* latest snapshot valid up to */
slock_t mutex_threshold; /* protect threshold fields */ slock_t mutex_threshold; /* protect threshold fields */
int64 threshold_timestamp; /* earlier snapshot is old */ int64 threshold_timestamp; /* earlier snapshot is old */
TransactionId threshold_xid; /* earlier xid may be gone */ TransactionId threshold_xid; /* earlier xid may be gone */
...@@ -95,7 +98,10 @@ typedef struct OldSnapshotControlData ...@@ -95,7 +98,10 @@ typedef struct OldSnapshotControlData
* count_used value of OLD_SNAPSHOT_TIME_MAP_ENTRIES means that the buffer * count_used value of OLD_SNAPSHOT_TIME_MAP_ENTRIES means that the buffer
* is full and the head must be advanced to add new entries. Use * is full and the head must be advanced to add new entries. Use
* timestamps aligned to minute boundaries, since that seems less * timestamps aligned to minute boundaries, since that seems less
* surprising than aligning based on the first usage timestamp. * surprising than aligning based on the first usage timestamp. The
* latest bucket is effectively stored within latest_xmin. The circular
* buffer is updated when we get a new xmin value that doesn't fall into
* the same interval.
* *
* It is OK if the xid for a given time slot is from earlier than * It is OK if the xid for a given time slot is from earlier than
* calculated by adding the number of minutes corresponding to the * calculated by adding the number of minutes corresponding to the
...@@ -269,6 +275,7 @@ SnapMgrInit(void) ...@@ -269,6 +275,7 @@ SnapMgrInit(void)
oldSnapshotControl->current_timestamp = 0; oldSnapshotControl->current_timestamp = 0;
SpinLockInit(&oldSnapshotControl->mutex_latest_xmin); SpinLockInit(&oldSnapshotControl->mutex_latest_xmin);
oldSnapshotControl->latest_xmin = InvalidTransactionId; oldSnapshotControl->latest_xmin = InvalidTransactionId;
oldSnapshotControl->next_map_update = 0;
SpinLockInit(&oldSnapshotControl->mutex_threshold); SpinLockInit(&oldSnapshotControl->mutex_threshold);
oldSnapshotControl->threshold_timestamp = 0; oldSnapshotControl->threshold_timestamp = 0;
oldSnapshotControl->threshold_xid = InvalidTransactionId; oldSnapshotControl->threshold_xid = InvalidTransactionId;
...@@ -1595,9 +1602,15 @@ TransactionIdLimitedForOldSnapshots(TransactionId recentXmin, ...@@ -1595,9 +1602,15 @@ TransactionIdLimitedForOldSnapshots(TransactionId recentXmin,
{ {
int64 ts = GetSnapshotCurrentTimestamp(); int64 ts = GetSnapshotCurrentTimestamp();
TransactionId xlimit = recentXmin; TransactionId xlimit = recentXmin;
TransactionId latest_xmin = oldSnapshotControl->latest_xmin; TransactionId latest_xmin;
int64 update_ts;
bool same_ts_as_threshold = false; bool same_ts_as_threshold = false;
SpinLockAcquire(&oldSnapshotControl->mutex_latest_xmin);
latest_xmin = oldSnapshotControl->latest_xmin;
update_ts = oldSnapshotControl->next_map_update;
SpinLockRelease(&oldSnapshotControl->mutex_latest_xmin);
/* /*
* Zero threshold always overrides to latest xmin, if valid. Without * Zero threshold always overrides to latest xmin, if valid. Without
* some heuristic it will find its own snapshot too old on, for * some heuristic it will find its own snapshot too old on, for
...@@ -1631,6 +1644,14 @@ TransactionIdLimitedForOldSnapshots(TransactionId recentXmin, ...@@ -1631,6 +1644,14 @@ TransactionIdLimitedForOldSnapshots(TransactionId recentXmin,
SpinLockRelease(&oldSnapshotControl->mutex_threshold); SpinLockRelease(&oldSnapshotControl->mutex_threshold);
if (!same_ts_as_threshold) if (!same_ts_as_threshold)
{
if (ts == update_ts)
{
xlimit = latest_xmin;
if (NormalTransactionIdFollows(xlimit, recentXmin))
SetOldSnapshotThresholdTimestamp(ts, xlimit);
}
else
{ {
LWLockAcquire(OldSnapshotTimeMapLock, LW_SHARED); LWLockAcquire(OldSnapshotTimeMapLock, LW_SHARED);
...@@ -1653,6 +1674,7 @@ TransactionIdLimitedForOldSnapshots(TransactionId recentXmin, ...@@ -1653,6 +1674,7 @@ TransactionIdLimitedForOldSnapshots(TransactionId recentXmin,
LWLockRelease(OldSnapshotTimeMapLock); LWLockRelease(OldSnapshotTimeMapLock);
} }
}
/* /*
* Failsafe protection against vacuuming work of active transaction. * Failsafe protection against vacuuming work of active transaction.
...@@ -1681,16 +1703,35 @@ void ...@@ -1681,16 +1703,35 @@ void
MaintainOldSnapshotTimeMapping(int64 whenTaken, TransactionId xmin) MaintainOldSnapshotTimeMapping(int64 whenTaken, TransactionId xmin)
{ {
int64 ts; int64 ts;
TransactionId latest_xmin;
int64 update_ts;
bool map_update_required = false;
/* Never call this function when old snapshot checking is disabled. */ /* Never call this function when old snapshot checking is disabled. */
Assert(old_snapshot_threshold >= 0); Assert(old_snapshot_threshold >= 0);
/* Keep track of the latest xmin seen by any process. */ ts = AlignTimestampToMinuteBoundary(whenTaken);
/*
* Keep track of the latest xmin seen by any process. Update mapping
* with a new value when we have crossed a bucket boundary.
*/
SpinLockAcquire(&oldSnapshotControl->mutex_latest_xmin); SpinLockAcquire(&oldSnapshotControl->mutex_latest_xmin);
if (TransactionIdFollows(xmin, oldSnapshotControl->latest_xmin)) latest_xmin = oldSnapshotControl->latest_xmin;
update_ts = oldSnapshotControl->next_map_update;
if (ts > update_ts)
{
oldSnapshotControl->next_map_update = ts;
map_update_required = true;
}
if (TransactionIdFollows(xmin, latest_xmin))
oldSnapshotControl->latest_xmin = xmin; oldSnapshotControl->latest_xmin = xmin;
SpinLockRelease(&oldSnapshotControl->mutex_latest_xmin); SpinLockRelease(&oldSnapshotControl->mutex_latest_xmin);
/* We only needed to update the most recent xmin value. */
if (!map_update_required)
return;
/* No further tracking needed for 0 (used for testing). */ /* No further tracking needed for 0 (used for testing). */
if (old_snapshot_threshold == 0) if (old_snapshot_threshold == 0)
return; return;
...@@ -1716,8 +1757,6 @@ MaintainOldSnapshotTimeMapping(int64 whenTaken, TransactionId xmin) ...@@ -1716,8 +1757,6 @@ MaintainOldSnapshotTimeMapping(int64 whenTaken, TransactionId xmin)
return; return;
} }
ts = AlignTimestampToMinuteBoundary(whenTaken);
LWLockAcquire(OldSnapshotTimeMapLock, LW_EXCLUSIVE); LWLockAcquire(OldSnapshotTimeMapLock, LW_EXCLUSIVE);
Assert(oldSnapshotControl->head_offset >= 0); Assert(oldSnapshotControl->head_offset >= 0);
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment