Commit 04e298b8 authored by Heikki Linnakangas

Avoid palloc in critical section in GiST WAL-logging.

Memory allocation can fail if you run out of memory, and inside a critical
section that will lead to a PANIC. Use conservatively-sized arrays on the
stack instead.

There was previously no explicit limit on the number of pages a GiST split
can produce; it was only limited by the number of LWLocks that can be held
simultaneously (100 at the moment). This patch adds an explicit limit of 75
pages. That should be plenty; a typical split shouldn't produce more than
2-3 page halves.

The bug has been there forever, but only backpatch down to 9.1. The code
was changed significantly in 9.1, and it doesn't seem worth the risk or
trouble to adapt this for 9.0 and 8.4.
parent fc752505
...@@ -135,7 +135,7 @@ that didn't need to be split. ...@@ -135,7 +135,7 @@ that didn't need to be split.
This differs from the insertion algorithm in the original paper. In the This differs from the insertion algorithm in the original paper. In the
original paper, you first walk down the tree until you reach a leaf page, and original paper, you first walk down the tree until you reach a leaf page, and
then you adjust the downlink in the parent, and propagating the adjustment up, then you adjust the downlink in the parent, and propagate the adjustment up,
all the way up to the root in the worst case. But we adjust the downlinks to all the way up to the root in the worst case. But we adjust the downlinks to
cover the new key already when we walk down, so that when we reach the leaf cover the new key already when we walk down, so that when we reach the leaf
page, we don't need to update the parents anymore, except to insert the page, we don't need to update the parents anymore, except to insert the
......
...@@ -220,6 +220,7 @@ gistplacetopage(Relation rel, Size freespace, GISTSTATE *giststate, ...@@ -220,6 +220,7 @@ gistplacetopage(Relation rel, Size freespace, GISTSTATE *giststate,
GistNSN oldnsn = 0; GistNSN oldnsn = 0;
SplitedPageLayout rootpg; SplitedPageLayout rootpg;
bool is_rootsplit; bool is_rootsplit;
int npage;
is_rootsplit = (blkno == GIST_ROOT_BLKNO); is_rootsplit = (blkno == GIST_ROOT_BLKNO);
...@@ -240,6 +241,19 @@ gistplacetopage(Relation rel, Size freespace, GISTSTATE *giststate, ...@@ -240,6 +241,19 @@ gistplacetopage(Relation rel, Size freespace, GISTSTATE *giststate,
itvec = gistjoinvector(itvec, &tlen, itup, ntup); itvec = gistjoinvector(itvec, &tlen, itup, ntup);
dist = gistSplit(rel, page, itvec, tlen, giststate); dist = gistSplit(rel, page, itvec, tlen, giststate);
/*
* Check that split didn't produce too many pages.
*/
npage = 0;
for (ptr = dist; ptr; ptr = ptr->next)
npage++;
/* in a root split, we'll add one more page to the list below */
if (is_rootsplit)
npage++;
if (npage > GIST_MAX_SPLIT_PAGES)
elog(ERROR, "GiST page split into too many halves (%d, maximum %d)",
npage, GIST_MAX_SPLIT_PAGES);
/* /*
* Set up pages to work with. Allocate new buffers for all but the * Set up pages to work with. Allocate new buffers for all but the
* leftmost page. The original page becomes the new leftmost page, and * leftmost page. The original page becomes the new leftmost page, and
......
...@@ -379,7 +379,7 @@ gistXLogSplit(RelFileNode node, BlockNumber blkno, bool page_is_leaf, ...@@ -379,7 +379,7 @@ gistXLogSplit(RelFileNode node, BlockNumber blkno, bool page_is_leaf,
BlockNumber origrlink, GistNSN orignsn, BlockNumber origrlink, GistNSN orignsn,
Buffer leftchildbuf, bool markfollowright) Buffer leftchildbuf, bool markfollowright)
{ {
XLogRecData *rdata; XLogRecData rdata[GIST_MAX_SPLIT_PAGES * 2 + 2];
gistxlogPageSplit xlrec; gistxlogPageSplit xlrec;
SplitedPageLayout *ptr; SplitedPageLayout *ptr;
int npage = 0, int npage = 0,
...@@ -388,8 +388,12 @@ gistXLogSplit(RelFileNode node, BlockNumber blkno, bool page_is_leaf, ...@@ -388,8 +388,12 @@ gistXLogSplit(RelFileNode node, BlockNumber blkno, bool page_is_leaf,
for (ptr = dist; ptr; ptr = ptr->next) for (ptr = dist; ptr; ptr = ptr->next)
npage++; npage++;
/*
rdata = (XLogRecData *) palloc(sizeof(XLogRecData) * (npage * 2 + 2)); * the caller should've checked this already, but doesn't hurt to check
* again.
*/
if (npage > GIST_MAX_SPLIT_PAGES)
elog(ERROR, "GiST page split into too many halves");
xlrec.node = node; xlrec.node = node;
xlrec.origblkno = blkno; xlrec.origblkno = blkno;
...@@ -439,7 +443,6 @@ gistXLogSplit(RelFileNode node, BlockNumber blkno, bool page_is_leaf, ...@@ -439,7 +443,6 @@ gistXLogSplit(RelFileNode node, BlockNumber blkno, bool page_is_leaf,
recptr = XLogInsert(RM_GIST_ID, XLOG_GIST_PAGE_SPLIT, rdata); recptr = XLogInsert(RM_GIST_ID, XLOG_GIST_PAGE_SPLIT, rdata);
pfree(rdata);
return recptr; return recptr;
} }
...@@ -462,14 +465,12 @@ gistXLogUpdate(RelFileNode node, Buffer buffer, ...@@ -462,14 +465,12 @@ gistXLogUpdate(RelFileNode node, Buffer buffer,
IndexTuple *itup, int ituplen, IndexTuple *itup, int ituplen,
Buffer leftchildbuf) Buffer leftchildbuf)
{ {
XLogRecData *rdata; XLogRecData rdata[MaxIndexTuplesPerPage + 3];
gistxlogPageUpdate xlrec; gistxlogPageUpdate xlrec;
int cur, int cur,
i; i;
XLogRecPtr recptr; XLogRecPtr recptr;
rdata = (XLogRecData *) palloc(sizeof(XLogRecData) * (3 + ituplen));
xlrec.node = node; xlrec.node = node;
xlrec.blkno = BufferGetBlockNumber(buffer); xlrec.blkno = BufferGetBlockNumber(buffer);
xlrec.ntodelete = ntodelete; xlrec.ntodelete = ntodelete;
...@@ -516,6 +517,5 @@ gistXLogUpdate(RelFileNode node, Buffer buffer, ...@@ -516,6 +517,5 @@ gistXLogUpdate(RelFileNode node, Buffer buffer,
recptr = XLogInsert(RM_GIST_ID, XLOG_GIST_PAGE_UPDATE, rdata); recptr = XLogInsert(RM_GIST_ID, XLOG_GIST_PAGE_UPDATE, rdata);
pfree(rdata);
return recptr; return recptr;
} }
...@@ -22,6 +22,21 @@ ...@@ -22,6 +22,21 @@
#include "utils/rbtree.h" #include "utils/rbtree.h"
#include "utils/hsearch.h" #include "utils/hsearch.h"
/*
* Maximum number of "halves" a page can be split into in one operation.
* Typically a split produces 2 halves, but can be more if keys have very
* different lengths, or when inserting multiple keys in one operation (as
* when inserting downlinks to an internal node). There is no theoretical
* limit on this, but in practice if you get more than a handful of page halves
* in one split, there's something wrong with the opclass implementation.
* GIST_MAX_SPLIT_PAGES is an arbitrary limit on that, used to size some
* local arrays used during split. Note that there is also a limit on the
* number of buffers that can be held locked at a time, MAX_SIMUL_LWLOCKS,
* so if you raise this higher than that limit, you'll just get a different
* error.
*/
#define GIST_MAX_SPLIT_PAGES 75
/* Buffer lock modes */ /* Buffer lock modes */
#define GIST_SHARE BUFFER_LOCK_SHARE #define GIST_SHARE BUFFER_LOCK_SHARE
#define GIST_EXCLUSIVE BUFFER_LOCK_EXCLUSIVE #define GIST_EXCLUSIVE BUFFER_LOCK_EXCLUSIVE
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment