Commit 6d90eaaa authored by Heikki Linnakangas's avatar Heikki Linnakangas

Make bgwriter sleep longer when it has no work to do, to save electricity.

To make it wake up promptly when activity starts again, backends nudge it
by setting a latch in MarkBufferDirty(). The latch is kept set while
bgwriter is active, so there is very little overhead from that when the
system is busy. It is only armed before going into longer sleep.

Peter Geoghegan, with some changes by me.
parent 467ff207
...@@ -51,6 +51,7 @@ ...@@ -51,6 +51,7 @@
#include "storage/ipc.h" #include "storage/ipc.h"
#include "storage/lwlock.h" #include "storage/lwlock.h"
#include "storage/pmsignal.h" #include "storage/pmsignal.h"
#include "storage/proc.h"
#include "storage/shmem.h" #include "storage/shmem.h"
#include "storage/smgr.h" #include "storage/smgr.h"
#include "storage/spin.h" #include "storage/spin.h"
...@@ -64,6 +65,11 @@ ...@@ -64,6 +65,11 @@
*/ */
int BgWriterDelay = 200; int BgWriterDelay = 200;
/*
* Time to sleep between bgwriter rounds, when it has no work to do.
*/
#define BGWRITER_HIBERNATE_MS 10000
/* /*
* Flags set by interrupt handlers for later service in the main loop. * Flags set by interrupt handlers for later service in the main loop.
*/ */
...@@ -77,13 +83,14 @@ static bool am_bg_writer = false; ...@@ -77,13 +83,14 @@ static bool am_bg_writer = false;
/* Prototypes for private functions */ /* Prototypes for private functions */
static void BgWriterNap(void); static void BgWriterNap(bool hibernating);
/* Signal handlers */ /* Signal handlers */
static void bg_quickdie(SIGNAL_ARGS); static void bg_quickdie(SIGNAL_ARGS);
static void BgSigHupHandler(SIGNAL_ARGS); static void BgSigHupHandler(SIGNAL_ARGS);
static void ReqShutdownHandler(SIGNAL_ARGS); static void ReqShutdownHandler(SIGNAL_ARGS);
static void bgwriter_sigusr1_handler(SIGNAL_ARGS);
/* /*
...@@ -97,6 +104,7 @@ BackgroundWriterMain(void) ...@@ -97,6 +104,7 @@ BackgroundWriterMain(void)
{ {
sigjmp_buf local_sigjmp_buf; sigjmp_buf local_sigjmp_buf;
MemoryContext bgwriter_context; MemoryContext bgwriter_context;
bool hibernating;
am_bg_writer = true; am_bg_writer = true;
...@@ -112,10 +120,10 @@ BackgroundWriterMain(void) ...@@ -112,10 +120,10 @@ BackgroundWriterMain(void)
#endif #endif
/* /*
* Properly accept or ignore signals the postmaster might send us * Properly accept or ignore signals the postmaster might send us.
* *
* SIGUSR1 is presently unused; keep it spare in case someday we want this * bgwriter doesn't participate in ProcSignal signalling, but a SIGUSR1
* process to participate in ProcSignal signalling. * handler is still needed for latch wakeups.
*/ */
pqsignal(SIGHUP, BgSigHupHandler); /* set flag to read config file */ pqsignal(SIGHUP, BgSigHupHandler); /* set flag to read config file */
pqsignal(SIGINT, SIG_IGN); /* as of 9.2 no longer requests checkpoint */ pqsignal(SIGINT, SIG_IGN); /* as of 9.2 no longer requests checkpoint */
...@@ -123,7 +131,7 @@ BackgroundWriterMain(void) ...@@ -123,7 +131,7 @@ BackgroundWriterMain(void)
pqsignal(SIGQUIT, bg_quickdie); /* hard crash time */ pqsignal(SIGQUIT, bg_quickdie); /* hard crash time */
pqsignal(SIGALRM, SIG_IGN); pqsignal(SIGALRM, SIG_IGN);
pqsignal(SIGPIPE, SIG_IGN); pqsignal(SIGPIPE, SIG_IGN);
pqsignal(SIGUSR1, SIG_IGN); /* reserve for ProcSignal */ pqsignal(SIGUSR1, bgwriter_sigusr1_handler);
pqsignal(SIGUSR2, SIG_IGN); pqsignal(SIGUSR2, SIG_IGN);
/* /*
...@@ -138,6 +146,12 @@ BackgroundWriterMain(void) ...@@ -138,6 +146,12 @@ BackgroundWriterMain(void)
/* We allow SIGQUIT (quickdie) at all times */ /* We allow SIGQUIT (quickdie) at all times */
sigdelset(&BlockSig, SIGQUIT); sigdelset(&BlockSig, SIGQUIT);
/*
* Advertise our latch that backends can use to wake us up while we're
* sleeping.
*/
ProcGlobal->bgwriterLatch = &MyProc->procLatch;
/* /*
* Create a resource owner to keep track of our resources (currently only * Create a resource owner to keep track of our resources (currently only
* buffer pins). * buffer pins).
...@@ -235,8 +249,11 @@ BackgroundWriterMain(void) ...@@ -235,8 +249,11 @@ BackgroundWriterMain(void)
/* /*
* Loop forever * Loop forever
*/ */
hibernating = false;
for (;;) for (;;)
{ {
bool lapped;
/* /*
* Emergency bailout if postmaster has died. This is to avoid the * Emergency bailout if postmaster has died. This is to avoid the
* necessity for manual cleanup of all postmaster children. * necessity for manual cleanup of all postmaster children.
...@@ -264,18 +281,66 @@ BackgroundWriterMain(void) ...@@ -264,18 +281,66 @@ BackgroundWriterMain(void)
/* /*
* Do one cycle of dirty-buffer writing. * Do one cycle of dirty-buffer writing.
*/ */
BgBufferSync(); if (hibernating && bgwriter_lru_maxpages > 0)
ResetLatch(&MyProc->procLatch);
lapped = BgBufferSync();
if (lapped && !hibernating)
{
/*
* BgBufferSync did nothing. Since there doesn't seem to be any
* work for the bgwriter to do, go into slower-paced
* "hibernation" mode, where we sleep for much longer times than
* bgwriter_delay says. Fewer wakeups saves electricity. If a
* backend starts dirtying pages again, it will wake us up by
* setting our latch.
*
* The latch is kept set during productive cycles where buffers
* are written, and only reset before going into a longer sleep.
* That ensures that when there's a constant trickle of activity,
* the SetLatch() calls that backends have to do will see the
* latch as already set, and are not slowed down by having to
* actually set the latch and signal us.
*/
hibernating = true;
/* Nap for the configured time. */ /*
BgWriterNap(); * Take one more short nap and perform one more bgwriter cycle -
* someone might've dirtied a buffer just after we finished the
* previous bgwriter cycle, while the latch was still set. If
* we still find nothing to do after this cycle, the next sleep
* will be longer.
*/
BgWriterNap(false);
continue;
}
else if (!lapped && hibernating)
{
/*
* Woken up from hibernation. Set the latch just in case it's
* not set yet (usually we wake up from hibernation because a
* backend already set the latch, but not necessarily).
*/
SetLatch(&MyProc->procLatch);
hibernating = false;
}
/*
* Take a short or long nap, depending on whether there was any work
* to do.
*/
BgWriterNap(hibernating);
} }
} }
/* /*
* BgWriterNap -- Nap for the configured time or until a signal is received. * BgWriterNap -- Nap for the configured time or until a signal is received.
*
* If 'hibernating' is false, sleeps for bgwriter_delay milliseconds.
* Otherwise sleeps longer, but also wakes up if the process latch is set.
*/ */
static void static void
BgWriterNap(void) BgWriterNap(bool hibernating)
{ {
long udelay; long udelay;
...@@ -285,18 +350,44 @@ BgWriterNap(void) ...@@ -285,18 +350,44 @@ BgWriterNap(void)
pgstat_send_bgwriter(); pgstat_send_bgwriter();
/* /*
* Nap for the configured time, or sleep for 10 seconds if there is no * If there was no work to do in the previous bgwriter cycle, take a
* bgwriter activity configured. * longer nap.
*/
if (hibernating)
{
/*
* We wake on a buffer being dirtied. It's possible that some
* useful work will become available for the bgwriter to do without
* a buffer actually being dirtied, like when a dirty buffer's usage
* count is decremented to zero or it's unpinned. This corner case
* is judged as too marginal to justify adding additional SetLatch()
* calls in very hot code paths, cheap though those calls may be.
*
* We still wake up periodically, so that BufferAlloc stats are
* updated reasonably promptly.
*/
int res = WaitLatch(&MyProc->procLatch,
WL_LATCH_SET | WL_TIMEOUT | WL_POSTMASTER_DEATH,
BGWRITER_HIBERNATE_MS);
/*
* Only do a quick return if timeout was reached (or postmaster died)
* to ensure that no less than BgWriterDelay ms has passed between
* BgBufferSyncs - WaitLatch() might have returned instantaneously.
*/
if (res & (WL_TIMEOUT | WL_POSTMASTER_DEATH))
return;
}
/*
* Nap for the configured time.
* *
* On some platforms, signals won't interrupt the sleep. To ensure we * On some platforms, signals won't interrupt the sleep. To ensure we
* respond reasonably promptly when someone signals us, break down the * respond reasonably promptly when someone signals us, break down the
* sleep into 1-second increments, and check for interrupts after each * sleep into 1-second increments, and check for interrupts after each
* nap. * nap.
*/ */
if (bgwriter_lru_maxpages > 0) udelay = BgWriterDelay * 1000L;
udelay = BgWriterDelay * 1000L;
else
udelay = 10000000L; /* Ten seconds */
while (udelay > 999999L) while (udelay > 999999L)
{ {
...@@ -351,12 +442,35 @@ bg_quickdie(SIGNAL_ARGS) ...@@ -351,12 +442,35 @@ bg_quickdie(SIGNAL_ARGS)
static void static void
BgSigHupHandler(SIGNAL_ARGS) BgSigHupHandler(SIGNAL_ARGS)
{ {
int save_errno = errno;
got_SIGHUP = true; got_SIGHUP = true;
if (MyProc)
SetLatch(&MyProc->procLatch);
errno = save_errno;
} }
/* SIGTERM: set flag to shutdown and exit */ /* SIGTERM: set flag to shutdown and exit */
static void static void
ReqShutdownHandler(SIGNAL_ARGS) ReqShutdownHandler(SIGNAL_ARGS)
{ {
int save_errno = errno;
shutdown_requested = true; shutdown_requested = true;
if (MyProc)
SetLatch(&MyProc->procLatch);
errno = save_errno;
}
/* SIGUSR1: used for latch wakeups */
static void
bgwriter_sigusr1_handler(SIGNAL_ARGS)
{
int save_errno = errno;
latch_sigusr1_handler();
errno = save_errno;
} }
...@@ -953,6 +953,7 @@ void ...@@ -953,6 +953,7 @@ void
MarkBufferDirty(Buffer buffer) MarkBufferDirty(Buffer buffer)
{ {
volatile BufferDesc *bufHdr; volatile BufferDesc *bufHdr;
bool dirtied = false;
if (!BufferIsValid(buffer)) if (!BufferIsValid(buffer))
elog(ERROR, "bad buffer ID: %d", buffer); elog(ERROR, "bad buffer ID: %d", buffer);
...@@ -973,19 +974,25 @@ MarkBufferDirty(Buffer buffer) ...@@ -973,19 +974,25 @@ MarkBufferDirty(Buffer buffer)
Assert(bufHdr->refcount > 0); Assert(bufHdr->refcount > 0);
if (!(bufHdr->flags & BM_DIRTY))
dirtied = true;
bufHdr->flags |= (BM_DIRTY | BM_JUST_DIRTIED);
UnlockBufHdr(bufHdr);
/* /*
* If the buffer was not dirty already, do vacuum accounting. * If the buffer was not dirty already, do vacuum accounting, and
* nudge bgwriter.
*/ */
if (!(bufHdr->flags & BM_DIRTY)) if (dirtied)
{ {
VacuumPageDirty++; VacuumPageDirty++;
if (VacuumCostActive) if (VacuumCostActive)
VacuumCostBalance += VacuumCostPageDirty; VacuumCostBalance += VacuumCostPageDirty;
if (ProcGlobal->bgwriterLatch)
SetLatch(ProcGlobal->bgwriterLatch);
} }
bufHdr->flags |= (BM_DIRTY | BM_JUST_DIRTIED);
UnlockBufHdr(bufHdr);
} }
/* /*
...@@ -1307,8 +1314,12 @@ BufferSync(int flags) ...@@ -1307,8 +1314,12 @@ BufferSync(int flags)
* BgBufferSync -- Write out some dirty buffers in the pool. * BgBufferSync -- Write out some dirty buffers in the pool.
* *
* This is called periodically by the background writer process. * This is called periodically by the background writer process.
*
* Returns true if the clocksweep has been "lapped", so that there's nothing
* to do. Also returns true if there's nothing to do because bgwriter was
* effectively disabled by setting bgwriter_lru_maxpages to 0.
*/ */
void bool
BgBufferSync(void) BgBufferSync(void)
{ {
/* info obtained from freelist.c */ /* info obtained from freelist.c */
...@@ -1365,7 +1376,7 @@ BgBufferSync(void) ...@@ -1365,7 +1376,7 @@ BgBufferSync(void)
if (bgwriter_lru_maxpages <= 0) if (bgwriter_lru_maxpages <= 0)
{ {
saved_info_valid = false; saved_info_valid = false;
return; return true;
} }
/* /*
...@@ -1584,6 +1595,8 @@ BgBufferSync(void) ...@@ -1584,6 +1595,8 @@ BgBufferSync(void)
recent_alloc, strategy_delta, scans_per_alloc, smoothed_density); recent_alloc, strategy_delta, scans_per_alloc, smoothed_density);
#endif #endif
} }
return (bufs_to_lap == 0);
} }
/* /*
...@@ -2341,16 +2354,24 @@ SetBufferCommitInfoNeedsSave(Buffer buffer) ...@@ -2341,16 +2354,24 @@ SetBufferCommitInfoNeedsSave(Buffer buffer)
if ((bufHdr->flags & (BM_DIRTY | BM_JUST_DIRTIED)) != if ((bufHdr->flags & (BM_DIRTY | BM_JUST_DIRTIED)) !=
(BM_DIRTY | BM_JUST_DIRTIED)) (BM_DIRTY | BM_JUST_DIRTIED))
{ {
bool dirtied = false;
LockBufHdr(bufHdr); LockBufHdr(bufHdr);
Assert(bufHdr->refcount > 0); Assert(bufHdr->refcount > 0);
if (!(bufHdr->flags & BM_DIRTY)) if (!(bufHdr->flags & BM_DIRTY))
dirtied = true;
bufHdr->flags |= (BM_DIRTY | BM_JUST_DIRTIED);
UnlockBufHdr(bufHdr);
if (dirtied)
{ {
VacuumPageDirty++; VacuumPageDirty++;
if (VacuumCostActive) if (VacuumCostActive)
VacuumCostBalance += VacuumCostPageDirty; VacuumCostBalance += VacuumCostPageDirty;
/* The bgwriter may need to be woken. */
if (ProcGlobal->bgwriterLatch)
SetLatch(ProcGlobal->bgwriterLatch);
} }
bufHdr->flags |= (BM_DIRTY | BM_JUST_DIRTIED);
UnlockBufHdr(bufHdr);
} }
} }
......
...@@ -213,7 +213,7 @@ extern bool HoldingBufferPinThatDelaysRecovery(void); ...@@ -213,7 +213,7 @@ extern bool HoldingBufferPinThatDelaysRecovery(void);
extern void AbortBufferIO(void); extern void AbortBufferIO(void);
extern void BufmgrCommit(void); extern void BufmgrCommit(void);
extern void BgBufferSync(void); extern bool BgBufferSync(void);
extern void AtProcExit_LocalBuffers(void); extern void AtProcExit_LocalBuffers(void);
......
...@@ -188,6 +188,8 @@ typedef struct PROC_HDR ...@@ -188,6 +188,8 @@ typedef struct PROC_HDR
PGPROC *freeProcs; PGPROC *freeProcs;
/* Head of list of autovacuum's free PGPROC structures */ /* Head of list of autovacuum's free PGPROC structures */
PGPROC *autovacFreeProcs; PGPROC *autovacFreeProcs;
/* BGWriter process latch */
Latch *bgwriterLatch;
/* Current shared estimate of appropriate spins_per_delay value */ /* Current shared estimate of appropriate spins_per_delay value */
int spins_per_delay; int spins_per_delay;
/* The proc of the Startup process, since not in ProcArray */ /* The proc of the Startup process, since not in ProcArray */
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment