Commit 496ee647 authored by Fujii Masao's avatar Fujii Masao

Prefer standby promotion over recovery pause.

Previously if a promotion was triggered while recovery was paused,
the paused state continued. Also recovery could be paused by executing
pg_wal_replay_pause() even while a promotion was ongoing. That is,
recovery pause had higher priority than a standby promotion.
But this behavior was not desirable because most users basically wanted
the recovery to complete as soon as possible and the server to become
the master when they requested a promotion.

This commit changes recovery so that it prefers a promotion over
recovery pause. That is, if a promotion is triggered while recovery
is paused, the paused state ends and a promotion continues. Also
this commit makes recovery pause functions like pg_wal_replay_pause()
throw an error if they are executed while a promotion is ongoing.

Internally, this commit adds a new internal function PromoteIsTriggered()
that returns true if a promotion is triggered. Since the name of
this function and the existing function IsPromoteTriggered() are
confusingly similar, the commit changes the name of IsPromoteTriggered()
to IsPromoteSignaled(), as a more appropriate name.

Author: Fujii Masao
Reviewed-by: Atsushi Torikoshi, Sergei Kornilov
Discussion: https://postgr.es/m/00c194b2-dbbb-2e8a-5b39-13f14048ef0a@oss.nttdata.com
parent e09ad07b
...@@ -3590,6 +3590,9 @@ restore_command = 'copy "C:\\server\\archivedir\\%f" "%p"' # Windows ...@@ -3590,6 +3590,9 @@ restore_command = 'copy "C:\\server\\archivedir\\%f" "%p"' # Windows
This setting has no effect if no recovery target is set. This setting has no effect if no recovery target is set.
If <xref linkend="guc-hot-standby"/> is not enabled, a setting of If <xref linkend="guc-hot-standby"/> is not enabled, a setting of
<literal>pause</literal> will act the same as <literal>shutdown</literal>. <literal>pause</literal> will act the same as <literal>shutdown</literal>.
If the recovery target is reached while a promotion is ongoing,
a setting of <literal>pause</literal> will act the same as
<literal>promote</literal>.
</para> </para>
<para> <para>
In any case, if a recovery target is configured but the archive In any case, if a recovery target is configured but the archive
......
...@@ -20177,6 +20177,13 @@ postgres=# SELECT * FROM pg_walfile_name_offset(pg_stop_backup()); ...@@ -20177,6 +20177,13 @@ postgres=# SELECT * FROM pg_walfile_name_offset(pg_stop_backup());
recovery is resumed. recovery is resumed.
</para> </para>
<para>
<function>pg_wal_replay_pause</function> and
<function>pg_wal_replay_resume</function> cannot be executed while
a promotion is ongoing. If a promotion is triggered while recovery
is paused, the paused state ends and a promotion continues.
</para>
<para> <para>
If streaming replication is disabled, the paused state may continue If streaming replication is disabled, the paused state may continue
indefinitely without problem. While streaming replication is in indefinitely without problem. While streaming replication is in
......
...@@ -229,6 +229,12 @@ static bool LocalRecoveryInProgress = true; ...@@ -229,6 +229,12 @@ static bool LocalRecoveryInProgress = true;
*/ */
static bool LocalHotStandbyActive = false; static bool LocalHotStandbyActive = false;
/*
* Local copy of SharedPromoteIsTriggered variable. False actually means "not
* known, need to check the shared state".
*/
static bool LocalPromoteIsTriggered = false;
/* /*
* Local state for XLogInsertAllowed(): * Local state for XLogInsertAllowed():
* 1: unconditionally allowed to insert XLOG * 1: unconditionally allowed to insert XLOG
...@@ -654,6 +660,12 @@ typedef struct XLogCtlData ...@@ -654,6 +660,12 @@ typedef struct XLogCtlData
*/ */
bool SharedHotStandbyActive; bool SharedHotStandbyActive;
/*
* SharedPromoteIsTriggered indicates if a standby promotion has been
* triggered. Protected by info_lck.
*/
bool SharedPromoteIsTriggered;
/* /*
* WalWriterSleeping indicates whether the WAL writer is currently in * WalWriterSleeping indicates whether the WAL writer is currently in
* low-power mode (and hence should be nudged if an async commit occurs). * low-power mode (and hence should be nudged if an async commit occurs).
...@@ -912,6 +924,7 @@ static void InitControlFile(uint64 sysidentifier); ...@@ -912,6 +924,7 @@ static void InitControlFile(uint64 sysidentifier);
static void WriteControlFile(void); static void WriteControlFile(void);
static void ReadControlFile(void); static void ReadControlFile(void);
static char *str_time(pg_time_t tnow); static char *str_time(pg_time_t tnow);
static void SetPromoteIsTriggered(void);
static bool CheckForStandbyTrigger(void); static bool CheckForStandbyTrigger(void);
#ifdef WAL_DEBUG #ifdef WAL_DEBUG
...@@ -5112,6 +5125,7 @@ XLOGShmemInit(void) ...@@ -5112,6 +5125,7 @@ XLOGShmemInit(void)
XLogCtl->XLogCacheBlck = XLOGbuffers - 1; XLogCtl->XLogCacheBlck = XLOGbuffers - 1;
XLogCtl->SharedRecoveryInProgress = true; XLogCtl->SharedRecoveryInProgress = true;
XLogCtl->SharedHotStandbyActive = false; XLogCtl->SharedHotStandbyActive = false;
XLogCtl->SharedPromoteIsTriggered = false;
XLogCtl->WalWriterSleeping = false; XLogCtl->WalWriterSleeping = false;
SpinLockInit(&XLogCtl->Insert.insertpos_lck); SpinLockInit(&XLogCtl->Insert.insertpos_lck);
...@@ -5940,16 +5954,22 @@ recoveryPausesHere(void) ...@@ -5940,16 +5954,22 @@ recoveryPausesHere(void)
if (!LocalHotStandbyActive) if (!LocalHotStandbyActive)
return; return;
/* Don't pause after standby promotion has been triggered */
if (LocalPromoteIsTriggered)
return;
ereport(LOG, ereport(LOG,
(errmsg("recovery has paused"), (errmsg("recovery has paused"),
errhint("Execute pg_wal_replay_resume() to continue."))); errhint("Execute pg_wal_replay_resume() to continue.")));
while (RecoveryIsPaused()) while (RecoveryIsPaused())
{ {
HandleStartupProcInterrupts();
if (CheckForStandbyTrigger())
return;
pgstat_report_wait_start(WAIT_EVENT_RECOVERY_PAUSE); pgstat_report_wait_start(WAIT_EVENT_RECOVERY_PAUSE);
pg_usleep(1000000L); /* 1000 ms */ pg_usleep(1000000L); /* 1000 ms */
pgstat_report_wait_end(); pgstat_report_wait_end();
HandleStartupProcInterrupts();
} }
} }
...@@ -12277,6 +12297,40 @@ emode_for_corrupt_record(int emode, XLogRecPtr RecPtr) ...@@ -12277,6 +12297,40 @@ emode_for_corrupt_record(int emode, XLogRecPtr RecPtr)
return emode; return emode;
} }
/*
 * PromoteIsTriggered -- report whether a standby promotion has been triggered.
 *
 * Callable from any process that is connected to shared memory, in contrast
 * to CheckForStandbyTrigger().
 */
bool
PromoteIsTriggered(void)
{
	/*
	 * A promotion cannot be triggered a second time, so once this process
	 * has seen the shared flag set there is nothing more to learn.  Only
	 * consult shared memory while the local copy is still false.
	 */
	if (!LocalPromoteIsTriggered)
	{
		SpinLockAcquire(&XLogCtl->info_lck);
		LocalPromoteIsTriggered = XLogCtl->SharedPromoteIsTriggered;
		SpinLockRelease(&XLogCtl->info_lck);
	}

	return LocalPromoteIsTriggered;
}
/*
 * SetPromoteIsTriggered -- mark that a standby promotion has been triggered.
 *
 * Sets the shared flag while holding info_lck, then sets this process's
 * local copy as well.
 */
static void
SetPromoteIsTriggered(void)
{
	SpinLockAcquire(&XLogCtl->info_lck);
	XLogCtl->SharedPromoteIsTriggered = true;
	SpinLockRelease(&XLogCtl->info_lck);

	LocalPromoteIsTriggered = true;
}
/* /*
* Check to see whether the user-specified trigger file exists and whether a * Check to see whether the user-specified trigger file exists and whether a
* promote request has arrived. If either condition holds, return true. * promote request has arrived. If either condition holds, return true.
...@@ -12285,12 +12339,11 @@ static bool ...@@ -12285,12 +12339,11 @@ static bool
CheckForStandbyTrigger(void) CheckForStandbyTrigger(void)
{ {
struct stat stat_buf; struct stat stat_buf;
static bool triggered = false;
if (triggered) if (LocalPromoteIsTriggered)
return true; return true;
if (IsPromoteTriggered()) if (IsPromoteSignaled())
{ {
/* /*
* In 9.1 and 9.2 the postmaster unlinked the promote file inside the * In 9.1 and 9.2 the postmaster unlinked the promote file inside the
...@@ -12313,8 +12366,8 @@ CheckForStandbyTrigger(void) ...@@ -12313,8 +12366,8 @@ CheckForStandbyTrigger(void)
ereport(LOG, (errmsg("received promote request"))); ereport(LOG, (errmsg("received promote request")));
ResetPromoteTriggered(); ResetPromoteSignaled();
triggered = true; SetPromoteIsTriggered();
return true; return true;
} }
...@@ -12326,7 +12379,7 @@ CheckForStandbyTrigger(void) ...@@ -12326,7 +12379,7 @@ CheckForStandbyTrigger(void)
ereport(LOG, ereport(LOG,
(errmsg("promote trigger file found: %s", PromoteTriggerFile))); (errmsg("promote trigger file found: %s", PromoteTriggerFile)));
unlink(PromoteTriggerFile); unlink(PromoteTriggerFile);
triggered = true; SetPromoteIsTriggered();
fast_promote = true; fast_promote = true;
return true; return true;
} }
......
...@@ -531,6 +531,13 @@ pg_wal_replay_pause(PG_FUNCTION_ARGS) ...@@ -531,6 +531,13 @@ pg_wal_replay_pause(PG_FUNCTION_ARGS)
errmsg("recovery is not in progress"), errmsg("recovery is not in progress"),
errhint("Recovery control functions can only be executed during recovery."))); errhint("Recovery control functions can only be executed during recovery.")));
if (PromoteIsTriggered())
ereport(ERROR,
(errcode(ERRCODE_OBJECT_NOT_IN_PREREQUISITE_STATE),
errmsg("standby promotion is ongoing"),
errhint("%s cannot be executed after promotion is triggered.",
"pg_wal_replay_pause()")));
SetRecoveryPause(true); SetRecoveryPause(true);
PG_RETURN_VOID(); PG_RETURN_VOID();
...@@ -551,6 +558,13 @@ pg_wal_replay_resume(PG_FUNCTION_ARGS) ...@@ -551,6 +558,13 @@ pg_wal_replay_resume(PG_FUNCTION_ARGS)
errmsg("recovery is not in progress"), errmsg("recovery is not in progress"),
errhint("Recovery control functions can only be executed during recovery."))); errhint("Recovery control functions can only be executed during recovery.")));
if (PromoteIsTriggered())
ereport(ERROR,
(errcode(ERRCODE_OBJECT_NOT_IN_PREREQUISITE_STATE),
errmsg("standby promotion is ongoing"),
errhint("%s cannot be executed after promotion is triggered.",
"pg_wal_replay_resume()")));
SetRecoveryPause(false); SetRecoveryPause(false);
PG_RETURN_VOID(); PG_RETURN_VOID();
......
...@@ -39,7 +39,7 @@ ...@@ -39,7 +39,7 @@
*/ */
static volatile sig_atomic_t got_SIGHUP = false; static volatile sig_atomic_t got_SIGHUP = false;
static volatile sig_atomic_t shutdown_requested = false; static volatile sig_atomic_t shutdown_requested = false;
static volatile sig_atomic_t promote_triggered = false; static volatile sig_atomic_t promote_signaled = false;
/* /*
* Flag set when executing a restore command, to tell SIGTERM signal handler * Flag set when executing a restore command, to tell SIGTERM signal handler
...@@ -63,7 +63,7 @@ StartupProcTriggerHandler(SIGNAL_ARGS) ...@@ -63,7 +63,7 @@ StartupProcTriggerHandler(SIGNAL_ARGS)
{ {
int save_errno = errno; int save_errno = errno;
promote_triggered = true; promote_signaled = true;
WakeupRecovery(); WakeupRecovery();
errno = save_errno; errno = save_errno;
...@@ -197,13 +197,13 @@ PostRestoreCommand(void) ...@@ -197,13 +197,13 @@ PostRestoreCommand(void)
} }
bool bool
IsPromoteTriggered(void) IsPromoteSignaled(void)
{ {
return promote_triggered; return promote_signaled;
} }
void void
ResetPromoteTriggered(void) ResetPromoteSignaled(void)
{ {
promote_triggered = false; promote_signaled = false;
} }
...@@ -313,6 +313,7 @@ extern XLogRecPtr GetFlushRecPtr(void); ...@@ -313,6 +313,7 @@ extern XLogRecPtr GetFlushRecPtr(void);
extern XLogRecPtr GetLastImportantRecPtr(void); extern XLogRecPtr GetLastImportantRecPtr(void);
extern void RemovePromoteSignalFiles(void); extern void RemovePromoteSignalFiles(void);
extern bool PromoteIsTriggered(void);
extern bool CheckPromoteSignal(void); extern bool CheckPromoteSignal(void);
extern void WakeupRecovery(void); extern void WakeupRecovery(void);
extern void SetWalWriterSleeping(bool sleeping); extern void SetWalWriterSleeping(bool sleeping);
......
...@@ -16,7 +16,7 @@ extern void HandleStartupProcInterrupts(void); ...@@ -16,7 +16,7 @@ extern void HandleStartupProcInterrupts(void);
extern void StartupProcessMain(void) pg_attribute_noreturn(); extern void StartupProcessMain(void) pg_attribute_noreturn();
extern void PreRestoreCommand(void); extern void PreRestoreCommand(void);
extern void PostRestoreCommand(void); extern void PostRestoreCommand(void);
extern bool IsPromoteTriggered(void); extern bool IsPromoteSignaled(void);
extern void ResetPromoteTriggered(void); extern void ResetPromoteSignaled(void);
#endif /* _STARTUP_H */ #endif /* _STARTUP_H */
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment