Commit 7dbb6069 authored by Andres Freund's avatar Andres Freund

Flush unlogged table's buffers when copying or moving databases.

CREATE DATABASE and ALTER DATABASE .. SET TABLESPACE copy the source
database directory on the filesystem level. To ensure the on disk
state is consistent they block out users of the affected database and
force a checkpoint to flush out all data to disk. Unfortunately, up to
now, that checkpoint didn't flush out dirty buffers from unlogged
relations.

That bug means there could be leftover dirty buffers in either the
template database, or the database in its old location. Leading to
problems when accessing relations in an inconsistent state; and to
possible problems during shutdown in the SET TABLESPACE case because
buffers belonging files that don't exist anymore are flushed.

This was reported in bug #10675 by Maxim Boguk.

Fix by Pavan Deolasee, modified somewhat by me. Reviewed by MauMau and
Fujii Masao.

Backpatch to 9.1 where unlogged tables were introduced.
parent 83dc5908
...@@ -7771,9 +7771,9 @@ LogCheckpointStart(int flags, bool restartpoint) ...@@ -7771,9 +7771,9 @@ LogCheckpointStart(int flags, bool restartpoint)
* the main message, but what about all the flags? * the main message, but what about all the flags?
*/ */
if (restartpoint) if (restartpoint)
msg = "restartpoint starting:%s%s%s%s%s%s%s"; msg = "restartpoint starting:%s%s%s%s%s%s%s%s";
else else
msg = "checkpoint starting:%s%s%s%s%s%s%s"; msg = "checkpoint starting:%s%s%s%s%s%s%s%s";
elog(LOG, msg, elog(LOG, msg,
(flags & CHECKPOINT_IS_SHUTDOWN) ? " shutdown" : "", (flags & CHECKPOINT_IS_SHUTDOWN) ? " shutdown" : "",
...@@ -7782,7 +7782,8 @@ LogCheckpointStart(int flags, bool restartpoint) ...@@ -7782,7 +7782,8 @@ LogCheckpointStart(int flags, bool restartpoint)
(flags & CHECKPOINT_FORCE) ? " force" : "", (flags & CHECKPOINT_FORCE) ? " force" : "",
(flags & CHECKPOINT_WAIT) ? " wait" : "", (flags & CHECKPOINT_WAIT) ? " wait" : "",
(flags & CHECKPOINT_CAUSE_XLOG) ? " xlog" : "", (flags & CHECKPOINT_CAUSE_XLOG) ? " xlog" : "",
(flags & CHECKPOINT_CAUSE_TIME) ? " time" : ""); (flags & CHECKPOINT_CAUSE_TIME) ? " time" : "",
(flags & CHECKPOINT_FLUSH_ALL) ? " flush-all" :"");
} }
/* /*
......
...@@ -549,15 +549,17 @@ createdb(const CreatedbStmt *stmt) ...@@ -549,15 +549,17 @@ createdb(const CreatedbStmt *stmt)
InvokeObjectPostCreateHook(DatabaseRelationId, dboid, 0); InvokeObjectPostCreateHook(DatabaseRelationId, dboid, 0);
/* /*
* Force a checkpoint before starting the copy. This will force dirty * Force a checkpoint before starting the copy. This will force all dirty
* buffers out to disk, to ensure source database is up-to-date on disk * buffers, including those of unlogged tables, out to disk, to ensure
* for the copy. FlushDatabaseBuffers() would suffice for that, but we * source database is up-to-date on disk for the copy.
* also want to process any pending unlink requests. Otherwise, if a * FlushDatabaseBuffers() would suffice for that, but we also want
* checkpoint happened while we're copying files, a file might be deleted * to process any pending unlink requests. Otherwise, if a checkpoint
* just when we're about to copy it, causing the lstat() call in copydir() * happened while we're copying files, a file might be deleted just when
* to fail with ENOENT. * we're about to copy it, causing the lstat() call in copydir() to fail
* with ENOENT.
*/ */
RequestCheckpoint(CHECKPOINT_IMMEDIATE | CHECKPOINT_FORCE | CHECKPOINT_WAIT); RequestCheckpoint(CHECKPOINT_IMMEDIATE | CHECKPOINT_FORCE | CHECKPOINT_WAIT
| CHECKPOINT_FLUSH_ALL);
/* /*
* Once we start copying subdirectories, we need to be able to clean 'em * Once we start copying subdirectories, we need to be able to clean 'em
...@@ -1138,8 +1140,9 @@ movedb(const char *dbname, const char *tblspcname) ...@@ -1138,8 +1140,9 @@ movedb(const char *dbname, const char *tblspcname)
dst_dbpath = GetDatabasePath(db_id, dst_tblspcoid); dst_dbpath = GetDatabasePath(db_id, dst_tblspcoid);
/* /*
* Force a checkpoint before proceeding. This will force dirty buffers out * Force a checkpoint before proceeding. This will force all dirty
* to disk, to ensure source database is up-to-date on disk for the copy. * buffers, including those of unlogged tables, out to disk, to ensure
* source database is up-to-date on disk for the copy.
* FlushDatabaseBuffers() would suffice for that, but we also want to * FlushDatabaseBuffers() would suffice for that, but we also want to
* process any pending unlink requests. Otherwise, the check for existing * process any pending unlink requests. Otherwise, the check for existing
* files in the target directory might fail unnecessarily, not to mention * files in the target directory might fail unnecessarily, not to mention
...@@ -1147,7 +1150,8 @@ movedb(const char *dbname, const char *tblspcname) ...@@ -1147,7 +1150,8 @@ movedb(const char *dbname, const char *tblspcname)
* On Windows, this also ensures that background procs don't hold any open * On Windows, this also ensures that background procs don't hold any open
* files, which would cause rmdir() to fail. * files, which would cause rmdir() to fail.
*/ */
RequestCheckpoint(CHECKPOINT_IMMEDIATE | CHECKPOINT_FORCE | CHECKPOINT_WAIT); RequestCheckpoint(CHECKPOINT_IMMEDIATE | CHECKPOINT_FORCE | CHECKPOINT_WAIT
| CHECKPOINT_FLUSH_ALL);
/* /*
* Check for existence of files in the target directory, i.e., objects of * Check for existence of files in the target directory, i.e., objects of
......
...@@ -1493,9 +1493,10 @@ UnpinBuffer(volatile BufferDesc *buf, bool fixOwner) ...@@ -1493,9 +1493,10 @@ UnpinBuffer(volatile BufferDesc *buf, bool fixOwner)
* *
* This is called at checkpoint time to write out all dirty shared buffers. * This is called at checkpoint time to write out all dirty shared buffers.
* The checkpoint request flags should be passed in. If CHECKPOINT_IMMEDIATE * The checkpoint request flags should be passed in. If CHECKPOINT_IMMEDIATE
* is set, we disable delays between writes; if CHECKPOINT_IS_SHUTDOWN is * is set, we disable delays between writes; if CHECKPOINT_IS_SHUTDOWN,
* set, we write even unlogged buffers, which are otherwise skipped. The * CHECKPOINT_END_OF_RECOVERY or CHECKPOINT_FLUSH_ALL is set, we write even
* remaining flags currently have no effect here. * unlogged buffers, which are otherwise skipped. The remaining flags
* currently have no effect here.
*/ */
static void static void
BufferSync(int flags) BufferSync(int flags)
...@@ -1510,11 +1511,12 @@ BufferSync(int flags) ...@@ -1510,11 +1511,12 @@ BufferSync(int flags)
ResourceOwnerEnlargeBuffers(CurrentResourceOwner); ResourceOwnerEnlargeBuffers(CurrentResourceOwner);
/* /*
* Unless this is a shutdown checkpoint, we write only permanent, dirty * Unless this is a shutdown checkpoint or we have been explicitly told,
* buffers. But at shutdown or end of recovery, we write all dirty * we write only permanent, dirty buffers. But at shutdown or end of
* buffers. * recovery, we write all dirty buffers.
*/ */
if (!((flags & CHECKPOINT_IS_SHUTDOWN) || (flags & CHECKPOINT_END_OF_RECOVERY))) if (!((flags & (CHECKPOINT_IS_SHUTDOWN | CHECKPOINT_END_OF_RECOVERY |
CHECKPOINT_FLUSH_ALL))))
mask |= BM_PERMANENT; mask |= BM_PERMANENT;
/* /*
......
...@@ -253,6 +253,8 @@ extern bool XLOG_DEBUG; ...@@ -253,6 +253,8 @@ extern bool XLOG_DEBUG;
/* These indicate the cause of a checkpoint request */ /* These indicate the cause of a checkpoint request */
#define CHECKPOINT_CAUSE_XLOG 0x0020 /* XLOG consumption */ #define CHECKPOINT_CAUSE_XLOG 0x0020 /* XLOG consumption */
#define CHECKPOINT_CAUSE_TIME 0x0040 /* Elapsed time */ #define CHECKPOINT_CAUSE_TIME 0x0040 /* Elapsed time */
#define CHECKPOINT_FLUSH_ALL 0x0080 /* Flush all pages, including those
* belonging to unlogged tables */
/* Checkpoint statistics */ /* Checkpoint statistics */
typedef struct CheckpointStatsData typedef struct CheckpointStatsData
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment