Commit 41f5e04a authored by Andres Freund

Fix a number of issues around modifying a previously updated row.

This commit fixes three, unfortunately related, issues:

1) Since 5db6df0c, the introduction of DML via tableam, it was
   possible to trigger "ERROR: unexpected table_lock_tuple status: 1"
   when updating a row that was previously updated in the same
   transaction - but only when that row had, before that, been
   updated in a concurrent transaction (and READ COMMITTED was
   used). The reason was that this case simply wasn't
   expected. Fixing that led to:

2) Even before the above commit, there were error checks (introduced
   in 6868ed74) preventing a row being updated by different
   commands within the same statement (say in a function called by an
   UPDATE) - but that check wasn't performed when the row was first
   updated in a concurrent transaction - instead the second update was
   silently skipped in that case. After this change we throw the same
   error as we would without the concurrent transaction.

3) The error messages (introduced in 6868ed74) preventing such
   updates emitted the same error message for both DELETE and
   UPDATE ("tuple to be updated was already modified by an operation
   triggered by the current command"). While that could be changed
   separately, it made it hard to write tests that verify the
   correct behavior of the code.

This commit changes heap's implementation of table_lock_tuple() to
return TM_SelfModified instead of TM_Invisible (previously loosely
modeled after EvalPlanQualFetch), and teaches nodeModifyTable.c to
handle that in response to table_lock_tuple() and not just in response
to table_(delete|update).

Additionally it fixes the wrong error message (see 3 above). The
comment for table_lock_tuple() is also adjusted to state that
TM_Deleted won't return information in TM_FailureData - it'll not
always be available.

This also adds tests to ensure that DELETE/UPDATE correctly error out
when affecting a row that concurrently was modified by another
transaction.

Author: Andres Freund
Reported-By: Tom Lane, when investigating a bug fix to another bug
    by Amit Langote
Discussion: https://postgr.es/m/19321.1554567786@sss.pgh.pa.us
parent 964bae4d
...@@ -463,8 +463,14 @@ tuple_lock_retry: ...@@ -463,8 +463,14 @@ tuple_lock_retry:
if (TransactionIdIsCurrentTransactionId(priorXmax) && if (TransactionIdIsCurrentTransactionId(priorXmax) &&
HeapTupleHeaderGetCmin(tuple->t_data) >= cid) HeapTupleHeaderGetCmin(tuple->t_data) >= cid)
{ {
tmfd->xmax = priorXmax;
/*
* Cmin is the problematic value, so store that. See
* above.
*/
tmfd->cmax = HeapTupleHeaderGetCmin(tuple->t_data);
ReleaseBuffer(buffer); ReleaseBuffer(buffer);
return TM_Invisible; return TM_SelfModified;
} }
/* /*
......
...@@ -799,7 +799,7 @@ ldelete:; ...@@ -799,7 +799,7 @@ ldelete:;
if (tmfd.cmax != estate->es_output_cid) if (tmfd.cmax != estate->es_output_cid)
ereport(ERROR, ereport(ERROR,
(errcode(ERRCODE_TRIGGERED_DATA_CHANGE_VIOLATION), (errcode(ERRCODE_TRIGGERED_DATA_CHANGE_VIOLATION),
errmsg("tuple to be updated was already modified by an operation triggered by the current command"), errmsg("tuple to be deleted was already modified by an operation triggered by the current command"),
errhint("Consider using an AFTER trigger instead of a BEFORE trigger to propagate changes to other rows."))); errhint("Consider using an AFTER trigger instead of a BEFORE trigger to propagate changes to other rows.")));
/* Else, already deleted by self; nothing to do */ /* Else, already deleted by self; nothing to do */
...@@ -858,6 +858,25 @@ ldelete:; ...@@ -858,6 +858,25 @@ ldelete:;
else else
goto ldelete; goto ldelete;
case TM_SelfModified:
/*
* This can be reached when following an update
* chain from a tuple updated by another session,
* reaching a tuple that was already updated in
* this transaction. If previously updated by this
* command, ignore the delete, otherwise error
* out.
*
* See also TM_SelfModified response to
* table_delete() above.
*/
if (tmfd.cmax != estate->es_output_cid)
ereport(ERROR,
(errcode(ERRCODE_TRIGGERED_DATA_CHANGE_VIOLATION),
errmsg("tuple to be deleted was already modified by an operation triggered by the current command"),
errhint("Consider using an AFTER trigger instead of a BEFORE trigger to propagate changes to other rows.")));
return NULL;
case TM_Deleted: case TM_Deleted:
/* tuple already deleted; nothing to do */ /* tuple already deleted; nothing to do */
return NULL; return NULL;
...@@ -870,10 +889,6 @@ ldelete:; ...@@ -870,10 +889,6 @@ ldelete:;
* already have errored out if the first version * already have errored out if the first version
* is invisible. * is invisible.
* *
* TM_SelfModified should be impossible, as we'd
* otherwise should have hit the TM_SelfModified
* case in response to table_delete above.
*
* TM_Updated should be impossible, because we're * TM_Updated should be impossible, because we're
* locking the latest version via * locking the latest version via
* TUPLE_LOCK_FLAG_FIND_LAST_VERSION. * TUPLE_LOCK_FLAG_FIND_LAST_VERSION.
...@@ -1379,6 +1394,25 @@ lreplace:; ...@@ -1379,6 +1394,25 @@ lreplace:;
/* tuple already deleted; nothing to do */ /* tuple already deleted; nothing to do */
return NULL; return NULL;
case TM_SelfModified:
/*
* This can be reached when following an update
* chain from a tuple updated by another session,
* reaching a tuple that was already updated in
* this transaction. If previously modified by
* this command, ignore the redundant update,
* otherwise error out.
*
* See also TM_SelfModified response to
* table_update() above.
*/
if (tmfd.cmax != estate->es_output_cid)
ereport(ERROR,
(errcode(ERRCODE_TRIGGERED_DATA_CHANGE_VIOLATION),
errmsg("tuple to be updated was already modified by an operation triggered by the current command"),
errhint("Consider using an AFTER trigger instead of a BEFORE trigger to propagate changes to other rows.")));
return NULL;
default: default:
/* see table_lock_tuple call in ExecDelete() */ /* see table_lock_tuple call in ExecDelete() */
elog(ERROR, "unexpected table_lock_tuple status: %u", elog(ERROR, "unexpected table_lock_tuple status: %u",
......
...@@ -1216,9 +1216,9 @@ table_update(Relation rel, ItemPointer otid, TupleTableSlot *slot, ...@@ -1216,9 +1216,9 @@ table_update(Relation rel, ItemPointer otid, TupleTableSlot *slot,
* TM_Deleted: lock failed because tuple deleted by other xact * TM_Deleted: lock failed because tuple deleted by other xact
* TM_WouldBlock: lock couldn't be acquired and wait_policy is skip * TM_WouldBlock: lock couldn't be acquired and wait_policy is skip
* *
* In the failure cases other than TM_Invisible, the routine fills *tmfd with * In the failure cases other than TM_Invisible and TM_Deleted, the routine
* the tuple's t_ctid, t_xmax, and, if possible, t_cmax. See comments for * fills *tmfd with the tuple's t_ctid, t_xmax, and, if possible, t_cmax. See
* struct TM_FailureData for additional info. * comments for struct TM_FailureData for additional info.
*/ */
static inline TM_Result static inline TM_Result
table_lock_tuple(Relation rel, ItemPointer tid, Snapshot snapshot, table_lock_tuple(Relation rel, ItemPointer tid, Snapshot snapshot,
......
...@@ -258,6 +258,73 @@ accountid balance ...@@ -258,6 +258,73 @@ accountid balance
checking 1050 checking 1050
savings 600 savings 600
starting permutation: wx1 updwcte c1 c2 read
step wx1: UPDATE accounts SET balance = balance - 200 WHERE accountid = 'checking' RETURNING balance;
balance
400
step updwcte: WITH doup AS (UPDATE accounts SET balance = balance + 1100 WHERE accountid = 'checking' RETURNING *) UPDATE accounts a SET balance = doup.balance + 100 FROM doup RETURNING *; <waiting ...>
step c1: COMMIT;
step updwcte: <... completed>
accountid balance accountid balance
savings 1600 checking 1500
step c2: COMMIT;
step read: SELECT * FROM accounts ORDER BY accountid;
accountid balance
checking 1500
savings 1600
starting permutation: wx1 updwctefail c1 c2 read
step wx1: UPDATE accounts SET balance = balance - 200 WHERE accountid = 'checking' RETURNING balance;
balance
400
step updwctefail: WITH doup AS (UPDATE accounts SET balance = balance + 1100 WHERE accountid = 'checking' RETURNING *, update_checking(999)) UPDATE accounts a SET balance = doup.balance + 100 FROM doup RETURNING *; <waiting ...>
step c1: COMMIT;
step updwctefail: <... completed>
error in steps c1 updwctefail: ERROR: tuple to be updated was already modified by an operation triggered by the current command
step c2: COMMIT;
step read: SELECT * FROM accounts ORDER BY accountid;
accountid balance
checking 400
savings 600
starting permutation: wx1 delwcte c1 c2 read
step wx1: UPDATE accounts SET balance = balance - 200 WHERE accountid = 'checking' RETURNING balance;
balance
400
step delwcte: WITH doup AS (UPDATE accounts SET balance = balance + 1100 WHERE accountid = 'checking' RETURNING *) DELETE FROM accounts a USING doup RETURNING *; <waiting ...>
step c1: COMMIT;
step delwcte: <... completed>
accountid balance accountid balance
savings 600 checking 1500
step c2: COMMIT;
step read: SELECT * FROM accounts ORDER BY accountid;
accountid balance
checking 1500
starting permutation: wx1 delwctefail c1 c2 read
step wx1: UPDATE accounts SET balance = balance - 200 WHERE accountid = 'checking' RETURNING balance;
balance
400
step delwctefail: WITH doup AS (UPDATE accounts SET balance = balance + 1100 WHERE accountid = 'checking' RETURNING *, update_checking(999)) DELETE FROM accounts a USING doup RETURNING *; <waiting ...>
step c1: COMMIT;
step delwctefail: <... completed>
error in steps c1 delwctefail: ERROR: tuple to be deleted was already modified by an operation triggered by the current command
step c2: COMMIT;
step read: SELECT * FROM accounts ORDER BY accountid;
accountid balance
checking 400
savings 600
starting permutation: upsert1 upsert2 c1 c2 read starting permutation: upsert1 upsert2 c1 c2 read
step upsert1: step upsert1:
WITH upsert AS WITH upsert AS
......
...@@ -9,6 +9,9 @@ setup ...@@ -9,6 +9,9 @@ setup
CREATE TABLE accounts (accountid text PRIMARY KEY, balance numeric not null); CREATE TABLE accounts (accountid text PRIMARY KEY, balance numeric not null);
INSERT INTO accounts VALUES ('checking', 600), ('savings', 600); INSERT INTO accounts VALUES ('checking', 600), ('savings', 600);
CREATE FUNCTION update_checking(int) RETURNS bool LANGUAGE sql AS $$
UPDATE accounts SET balance = balance + 1 WHERE accountid = 'checking'; SELECT true;$$;
CREATE TABLE accounts_ext (accountid text PRIMARY KEY, balance numeric not null, other text); CREATE TABLE accounts_ext (accountid text PRIMARY KEY, balance numeric not null, other text);
INSERT INTO accounts_ext VALUES ('checking', 600, 'other'), ('savings', 700, null); INSERT INTO accounts_ext VALUES ('checking', 600, 'other'), ('savings', 700, null);
ALTER TABLE accounts_ext ADD COLUMN newcol int DEFAULT 42; ALTER TABLE accounts_ext ADD COLUMN newcol int DEFAULT 42;
...@@ -34,6 +37,7 @@ setup ...@@ -34,6 +37,7 @@ setup
teardown teardown
{ {
DROP TABLE accounts; DROP TABLE accounts;
DROP FUNCTION update_checking(int);
DROP TABLE accounts_ext; DROP TABLE accounts_ext;
DROP TABLE p CASCADE; DROP TABLE p CASCADE;
DROP TABLE table_a, table_b, jointest; DROP TABLE table_a, table_b, jointest;
...@@ -170,6 +174,16 @@ step "updateforcip3" { ...@@ -170,6 +174,16 @@ step "updateforcip3" {
} }
step "wrtwcte" { UPDATE table_a SET value = 'tableAValue2' WHERE id = 1; } step "wrtwcte" { UPDATE table_a SET value = 'tableAValue2' WHERE id = 1; }
step "wrjt" { UPDATE jointest SET data = 42 WHERE id = 7; } step "wrjt" { UPDATE jointest SET data = 42 WHERE id = 7; }
# Use writable CTEs to create self-updated rows, that then are
# (updated|deleted). The *fail versions of the tests additionally
# perform an update, via a function, in a different command, to test
# behaviour relating to that.
step "updwcte" { WITH doup AS (UPDATE accounts SET balance = balance + 1100 WHERE accountid = 'checking' RETURNING *) UPDATE accounts a SET balance = doup.balance + 100 FROM doup RETURNING *; }
step "updwctefail" { WITH doup AS (UPDATE accounts SET balance = balance + 1100 WHERE accountid = 'checking' RETURNING *, update_checking(999)) UPDATE accounts a SET balance = doup.balance + 100 FROM doup RETURNING *; }
step "delwcte" { WITH doup AS (UPDATE accounts SET balance = balance + 1100 WHERE accountid = 'checking' RETURNING *) DELETE FROM accounts a USING doup RETURNING *; }
step "delwctefail" { WITH doup AS (UPDATE accounts SET balance = balance + 1100 WHERE accountid = 'checking' RETURNING *, update_checking(999)) DELETE FROM accounts a USING doup RETURNING *; }
step "c2" { COMMIT; } step "c2" { COMMIT; }
step "r2" { ROLLBACK; } step "r2" { ROLLBACK; }
...@@ -221,6 +235,19 @@ permutation "wx2" "d2" "d1" "r2" "c1" "read" ...@@ -221,6 +235,19 @@ permutation "wx2" "d2" "d1" "r2" "c1" "read"
permutation "d1" "wx2" "c1" "c2" "read" permutation "d1" "wx2" "c1" "c2" "read"
permutation "d1" "wx2" "r1" "c2" "read" permutation "d1" "wx2" "r1" "c2" "read"
# test that an update to a self-modified row is ignored when
# previously updated by the same cid
permutation "wx1" "updwcte" "c1" "c2" "read"
# test that an update to a self-modified row throws error when
# previously updated by a different cid
permutation "wx1" "updwctefail" "c1" "c2" "read"
# test that a delete to a self-modified row is ignored when
# previously updated by the same cid
permutation "wx1" "delwcte" "c1" "c2" "read"
# test that a delete to a self-modified row throws error when
# previously updated by a different cid
permutation "wx1" "delwctefail" "c1" "c2" "read"
permutation "upsert1" "upsert2" "c1" "c2" "read" permutation "upsert1" "upsert2" "c1" "c2" "read"
permutation "readp1" "writep1" "readp2" "c1" "c2" permutation "readp1" "writep1" "readp2" "c1" "c2"
permutation "writep2" "returningp1" "c1" "c2" permutation "writep2" "returningp1" "c1" "c2"
......
...@@ -1607,7 +1607,7 @@ select * from parent; select * from child; ...@@ -1607,7 +1607,7 @@ select * from parent; select * from child;
(1 row) (1 row)
delete from parent where aid = 1; -- should fail delete from parent where aid = 1; -- should fail
ERROR: tuple to be updated was already modified by an operation triggered by the current command ERROR: tuple to be deleted was already modified by an operation triggered by the current command
HINT: Consider using an AFTER trigger instead of a BEFORE trigger to propagate changes to other rows. HINT: Consider using an AFTER trigger instead of a BEFORE trigger to propagate changes to other rows.
select * from parent; select * from child; select * from parent; select * from child;
aid | val1 | val2 | val3 | val4 | bcnt aid | val1 | val2 | val3 | val4 | bcnt
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment