Commit 50e54709 authored by Heikki Linnakangas's avatar Heikki Linnakangas

Add GUC to enable WAL-logging of hint bits, even with checksums disabled.

WAL records of hint bit updates is useful to tools that want to examine
which pages have been modified. In particular, this is required to make
the pg_rewind tool safe (without checksums).

This can also be used to test how much extra WAL-logging would occur if
you enabled checksums, without actually enabling them (which you can't
currently do without re-initdb'ing).

Sawada Masahiko, docs by Samrat Revagade. Reviewed by Dilip Kumar, with
further changes by me.
parent 56afe850
...@@ -1944,6 +1944,32 @@ include 'filename' ...@@ -1944,6 +1944,32 @@ include 'filename'
</listitem> </listitem>
</varlistentry> </varlistentry>
<varlistentry id="guc-wal-log-hintbits" xreflabel="wal_log_hintbits">
<term><varname>wal_log_hintbits</varname> (<type>boolean</type>)</term>
<indexterm>
<primary><varname>wal_log_hintbits</> configuration parameter</primary>
</indexterm>
<listitem>
<para>
When this parameter is <literal>on</>, the <productname>PostgreSQL</>
server writes the entire content of each disk page to WAL during the
first modification of that page after a checkpoint, even for
non-critical modifications of so-called hint bits.
</para>
<para>
If data checksums are enabled, hint bit updates are always WAL-logged
and this setting is ignored. You can use this setting to test how much
extra WAL-logging would occur if your database had data checksums
enabled.
</para>
<para>
This parameter can only be set at server start. The default value is <literal>off</>.
</para>
</listitem>
</varlistentry>
<varlistentry id="guc-wal-buffers" xreflabel="wal_buffers"> <varlistentry id="guc-wal-buffers" xreflabel="wal_buffers">
<term><varname>wal_buffers</varname> (<type>integer</type>)</term> <term><varname>wal_buffers</varname> (<type>integer</type>)</term>
<indexterm> <indexterm>
......
...@@ -6271,7 +6271,7 @@ log_heap_visible(RelFileNode rnode, Buffer heap_buffer, Buffer vm_buffer, ...@@ -6271,7 +6271,7 @@ log_heap_visible(RelFileNode rnode, Buffer heap_buffer, Buffer vm_buffer,
rdata[1].buffer_std = false; rdata[1].buffer_std = false;
rdata[1].next = NULL; rdata[1].next = NULL;
if (DataChecksumsEnabled()) if (XLogHintBitIsNeeded())
{ {
rdata[1].next = &(rdata[2]); rdata[1].next = &(rdata[2]);
......
...@@ -287,10 +287,10 @@ visibilitymap_set(Relation rel, BlockNumber heapBlk, Buffer heapBuf, ...@@ -287,10 +287,10 @@ visibilitymap_set(Relation rel, BlockNumber heapBlk, Buffer heapBuf,
cutoff_xid); cutoff_xid);
/* /*
* If data checksums are enabled, we need to protect the heap * If data checksums are enabled (or wal_log_hintbits=on), we
* page from being torn. * need to protect the heap page from being torn.
*/ */
if (DataChecksumsEnabled()) if (XLogHintBitIsNeeded())
{ {
Page heapPage = BufferGetPage(heapBuf); Page heapPage = BufferGetPage(heapBuf);
......
...@@ -79,6 +79,7 @@ bool XLogArchiveMode = false; ...@@ -79,6 +79,7 @@ bool XLogArchiveMode = false;
char *XLogArchiveCommand = NULL; char *XLogArchiveCommand = NULL;
bool EnableHotStandby = false; bool EnableHotStandby = false;
bool fullPageWrites = true; bool fullPageWrites = true;
bool walLogHintbits = false;
bool log_checkpoints = false; bool log_checkpoints = false;
int sync_method = DEFAULT_SYNC_METHOD; int sync_method = DEFAULT_SYNC_METHOD;
int wal_level = WAL_LEVEL_MINIMAL; int wal_level = WAL_LEVEL_MINIMAL;
...@@ -5270,6 +5271,7 @@ BootStrapXLOG(void) ...@@ -5270,6 +5271,7 @@ BootStrapXLOG(void)
ControlFile->max_prepared_xacts = max_prepared_xacts; ControlFile->max_prepared_xacts = max_prepared_xacts;
ControlFile->max_locks_per_xact = max_locks_per_xact; ControlFile->max_locks_per_xact = max_locks_per_xact;
ControlFile->wal_level = wal_level; ControlFile->wal_level = wal_level;
ControlFile->wal_log_hintbits = walLogHintbits;
ControlFile->data_checksum_version = bootstrap_data_checksum_version; ControlFile->data_checksum_version = bootstrap_data_checksum_version;
/* some additional ControlFile fields are set in WriteControlFile() */ /* some additional ControlFile fields are set in WriteControlFile() */
...@@ -9058,6 +9060,7 @@ static void ...@@ -9058,6 +9060,7 @@ static void
XLogReportParameters(void) XLogReportParameters(void)
{ {
if (wal_level != ControlFile->wal_level || if (wal_level != ControlFile->wal_level ||
walLogHintbits != ControlFile->wal_log_hintbits ||
MaxConnections != ControlFile->MaxConnections || MaxConnections != ControlFile->MaxConnections ||
max_worker_processes != ControlFile->max_worker_processes || max_worker_processes != ControlFile->max_worker_processes ||
max_prepared_xacts != ControlFile->max_prepared_xacts || max_prepared_xacts != ControlFile->max_prepared_xacts ||
...@@ -9080,6 +9083,7 @@ XLogReportParameters(void) ...@@ -9080,6 +9083,7 @@ XLogReportParameters(void)
xlrec.max_prepared_xacts = max_prepared_xacts; xlrec.max_prepared_xacts = max_prepared_xacts;
xlrec.max_locks_per_xact = max_locks_per_xact; xlrec.max_locks_per_xact = max_locks_per_xact;
xlrec.wal_level = wal_level; xlrec.wal_level = wal_level;
xlrec.wal_log_hintbits = walLogHintbits;
rdata.buffer = InvalidBuffer; rdata.buffer = InvalidBuffer;
rdata.data = (char *) &xlrec; rdata.data = (char *) &xlrec;
...@@ -9094,6 +9098,7 @@ XLogReportParameters(void) ...@@ -9094,6 +9098,7 @@ XLogReportParameters(void)
ControlFile->max_prepared_xacts = max_prepared_xacts; ControlFile->max_prepared_xacts = max_prepared_xacts;
ControlFile->max_locks_per_xact = max_locks_per_xact; ControlFile->max_locks_per_xact = max_locks_per_xact;
ControlFile->wal_level = wal_level; ControlFile->wal_level = wal_level;
ControlFile->wal_log_hintbits = walLogHintbits;
UpdateControlFile(); UpdateControlFile();
} }
} }
...@@ -9480,6 +9485,7 @@ xlog_redo(XLogRecPtr lsn, XLogRecord *record) ...@@ -9480,6 +9485,7 @@ xlog_redo(XLogRecPtr lsn, XLogRecord *record)
ControlFile->max_prepared_xacts = xlrec.max_prepared_xacts; ControlFile->max_prepared_xacts = xlrec.max_prepared_xacts;
ControlFile->max_locks_per_xact = xlrec.max_locks_per_xact; ControlFile->max_locks_per_xact = xlrec.max_locks_per_xact;
ControlFile->wal_level = xlrec.wal_level; ControlFile->wal_level = xlrec.wal_level;
ControlFile->wal_log_hintbits = walLogHintbits;
/* /*
* Update minRecoveryPoint to ensure that if recovery is aborted, we * Update minRecoveryPoint to ensure that if recovery is aborted, we
......
...@@ -2626,16 +2626,15 @@ MarkBufferDirtyHint(Buffer buffer, bool buffer_std) ...@@ -2626,16 +2626,15 @@ MarkBufferDirtyHint(Buffer buffer, bool buffer_std)
bool delayChkpt = false; bool delayChkpt = false;
/* /*
* If checksums are enabled, and the buffer is permanent, then a full * If we need to protect hint bit updates from torn writes, WAL-log a
* page image may be required even for some hint bit updates to * full page image of the page. This full page image is only necessary
* protect against torn pages. This full page image is only necessary
* if the hint bit update is the first change to the page since the * if the hint bit update is the first change to the page since the
* last checkpoint. * last checkpoint.
* *
* We don't check full_page_writes here because that logic is included * We don't check full_page_writes here because that logic is included
* when we call XLogInsert() since the value changes dynamically. * when we call XLogInsert() since the value changes dynamically.
*/ */
if (DataChecksumsEnabled() && (bufHdr->flags & BM_PERMANENT)) if (XLogHintBitIsNeeded() && (bufHdr->flags & BM_PERMANENT))
{ {
/* /*
* If we're in recovery we cannot dirty a page because of a hint. * If we're in recovery we cannot dirty a page because of a hint.
......
...@@ -866,6 +866,17 @@ static struct config_bool ConfigureNamesBool[] = ...@@ -866,6 +866,17 @@ static struct config_bool ConfigureNamesBool[] =
true, true,
NULL, NULL, NULL NULL, NULL, NULL
}, },
{
{"wal_log_hintbits", PGC_POSTMASTER, WAL_SETTINGS,
gettext_noop("Writes full pages to WAL when first modified after a checkpoint, even for a non-critical modifications"),
NULL
},
&walLogHintbits,
false,
NULL, NULL, NULL
},
{ {
{"log_checkpoints", PGC_SIGHUP, LOGGING_WHAT, {"log_checkpoints", PGC_SIGHUP, LOGGING_WHAT,
gettext_noop("Logs each checkpoint."), gettext_noop("Logs each checkpoint."),
......
...@@ -184,6 +184,7 @@ ...@@ -184,6 +184,7 @@
# fsync_writethrough # fsync_writethrough
# open_sync # open_sync
#full_page_writes = on # recover from partial page writes #full_page_writes = on # recover from partial page writes
#wal_log_hintbits = off # also do full pages writes of non-critical updates
#wal_buffers = -1 # min 32kB, -1 sets based on shared_buffers #wal_buffers = -1 # min 32kB, -1 sets based on shared_buffers
# (change requires restart) # (change requires restart)
#wal_writer_delay = 200ms # 1-10000 milliseconds #wal_writer_delay = 200ms # 1-10000 milliseconds
......
...@@ -260,6 +260,8 @@ main(int argc, char *argv[]) ...@@ -260,6 +260,8 @@ main(int argc, char *argv[])
ControlFile.backupEndRequired ? _("yes") : _("no")); ControlFile.backupEndRequired ? _("yes") : _("no"));
printf(_("Current wal_level setting: %s\n"), printf(_("Current wal_level setting: %s\n"),
wal_level_str(ControlFile.wal_level)); wal_level_str(ControlFile.wal_level));
printf(_("Current wal_log_hintbits setting: %s\n"),
ControlFile.wal_log_hintbits ? _("on") : _("off"));
printf(_("Current max_connections setting: %d\n"), printf(_("Current max_connections setting: %d\n"),
ControlFile.MaxConnections); ControlFile.MaxConnections);
printf(_("Current max_worker_processes setting: %d\n"), printf(_("Current max_worker_processes setting: %d\n"),
......
...@@ -525,6 +525,7 @@ GuessControlValues(void) ...@@ -525,6 +525,7 @@ GuessControlValues(void)
/* minRecoveryPoint, backupStartPoint and backupEndPoint can be left zero */ /* minRecoveryPoint, backupStartPoint and backupEndPoint can be left zero */
ControlFile.wal_level = WAL_LEVEL_MINIMAL; ControlFile.wal_level = WAL_LEVEL_MINIMAL;
ControlFile.wal_log_hintbits = false;
ControlFile.MaxConnections = 100; ControlFile.MaxConnections = 100;
ControlFile.max_worker_processes = 8; ControlFile.max_worker_processes = 8;
ControlFile.max_prepared_xacts = 0; ControlFile.max_prepared_xacts = 0;
...@@ -721,6 +722,7 @@ RewriteControlFile(void) ...@@ -721,6 +722,7 @@ RewriteControlFile(void)
* anyway at startup. * anyway at startup.
*/ */
ControlFile.wal_level = WAL_LEVEL_MINIMAL; ControlFile.wal_level = WAL_LEVEL_MINIMAL;
ControlFile.wal_log_hintbits = false;
ControlFile.MaxConnections = 100; ControlFile.MaxConnections = 100;
ControlFile.max_worker_processes = 8; ControlFile.max_worker_processes = 8;
ControlFile.max_prepared_xacts = 0; ControlFile.max_prepared_xacts = 0;
......
...@@ -189,6 +189,7 @@ extern bool XLogArchiveMode; ...@@ -189,6 +189,7 @@ extern bool XLogArchiveMode;
extern char *XLogArchiveCommand; extern char *XLogArchiveCommand;
extern bool EnableHotStandby; extern bool EnableHotStandby;
extern bool fullPageWrites; extern bool fullPageWrites;
extern bool walLogHintbits;
extern bool log_checkpoints; extern bool log_checkpoints;
extern int num_xloginsert_slots; extern int num_xloginsert_slots;
...@@ -211,6 +212,17 @@ extern int wal_level; ...@@ -211,6 +212,17 @@ extern int wal_level;
*/ */
#define XLogIsNeeded() (wal_level >= WAL_LEVEL_ARCHIVE) #define XLogIsNeeded() (wal_level >= WAL_LEVEL_ARCHIVE)
/*
* Is a full-page image needed for hint bit updates?
*
* Normally, we don't WAL-log hint bit updates, but if checksums are enabled,
* we have to protect them against torn page writes. When you only set
* individual bits on a page, it's still consistent no matter what combination
* of the bits make it to disk, but the checksum wouldn't match. Also WAL-log
* them if forced by wal_log_hintbits=on.
*/
#define XLogHintBitIsNeeded() (DataChecksumsEnabled() || walLogHintbits)
/* Do we need to WAL-log information required only for Hot Standby and logical replication? */ /* Do we need to WAL-log information required only for Hot Standby and logical replication? */
#define XLogStandbyInfoActive() (wal_level >= WAL_LEVEL_HOT_STANDBY) #define XLogStandbyInfoActive() (wal_level >= WAL_LEVEL_HOT_STANDBY)
......
...@@ -209,6 +209,7 @@ typedef struct xl_parameter_change ...@@ -209,6 +209,7 @@ typedef struct xl_parameter_change
int max_prepared_xacts; int max_prepared_xacts;
int max_locks_per_xact; int max_locks_per_xact;
int wal_level; int wal_level;
bool wal_log_hintbits;
} xl_parameter_change; } xl_parameter_change;
/* logs restore point */ /* logs restore point */
......
...@@ -53,6 +53,6 @@ ...@@ -53,6 +53,6 @@
*/ */
/* yyyymmddN */ /* yyyymmddN */
#define CATALOG_VERSION_NO 201311261 #define CATALOG_VERSION_NO 201312131
#endif #endif
...@@ -171,6 +171,7 @@ typedef struct ControlFileData ...@@ -171,6 +171,7 @@ typedef struct ControlFileData
* or hot standby. * or hot standby.
*/ */
int wal_level; int wal_level;
bool wal_log_hintbits;
int MaxConnections; int MaxConnections;
int max_worker_processes; int max_worker_processes;
int max_prepared_xacts; int max_prepared_xacts;
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment