mirror of
https://github.com/postgres/postgres.git
synced 2025-08-28 18:48:04 +03:00
Fix data loss at inplace update after heap_update().
As previously-added tests demonstrated, heap_inplace_update() could instead update an unrelated tuple of the same catalog. It could lose the update. Losing relhasindex=t was a source of index corruption. Inplace-updating commands like VACUUM will now wait for heap_update() commands like GRANT TABLE and GRANT DATABASE. That isn't ideal, but a long-running GRANT already hurts VACUUM progress more just by keeping an XID running. The VACUUM will behave like a DELETE or UPDATE waiting for the uncommitted change. For implementation details, start at the systable_inplace_update_begin() header comment and README.tuplock. Back-patch to v12 (all supported versions). In back branches, retain a deprecated heap_inplace_update(), for extensions. Reported by Smolkin Grigory. Reviewed by Nitin Motiani, (in earlier versions) Heikki Linnakangas, and (in earlier versions) Alexander Lakhin. Discussion: https://postgr.es/m/CAMp+ueZQz3yDk7qg42hk6-9gxniYbp-=bG2mgqecErqR5gGGOA@mail.gmail.com
This commit is contained in:
@@ -1524,7 +1524,7 @@ dropdb(const char *dbname, bool missing_ok, bool force)
|
||||
Relation pgdbrel;
|
||||
HeapTuple tup;
|
||||
ScanKeyData scankey;
|
||||
SysScanDesc scan;
|
||||
void *inplace_state;
|
||||
Form_pg_database datform;
|
||||
int notherbackends;
|
||||
int npreparedxacts;
|
||||
@@ -1662,24 +1662,6 @@ dropdb(const char *dbname, bool missing_ok, bool force)
|
||||
*/
|
||||
pgstat_drop_database(db_id);
|
||||
|
||||
/*
|
||||
* Get the pg_database tuple to scribble on. Note that this does not
|
||||
* directly rely on the syscache to avoid issues with flattened toast
|
||||
* values for the in-place update.
|
||||
*/
|
||||
ScanKeyInit(&scankey,
|
||||
Anum_pg_database_datname,
|
||||
BTEqualStrategyNumber, F_NAMEEQ,
|
||||
CStringGetDatum(dbname));
|
||||
|
||||
scan = systable_beginscan(pgdbrel, DatabaseNameIndexId, true,
|
||||
NULL, 1, &scankey);
|
||||
|
||||
tup = systable_getnext(scan);
|
||||
if (!HeapTupleIsValid(tup))
|
||||
elog(ERROR, "cache lookup failed for database %u", db_id);
|
||||
datform = (Form_pg_database) GETSTRUCT(tup);
|
||||
|
||||
/*
|
||||
* Except for the deletion of the catalog row, subsequent actions are not
|
||||
* transactional (consider DropDatabaseBuffers() discarding modified
|
||||
@@ -1691,8 +1673,17 @@ dropdb(const char *dbname, bool missing_ok, bool force)
|
||||
* modification is durable before performing irreversible filesystem
|
||||
* operations.
|
||||
*/
|
||||
ScanKeyInit(&scankey,
|
||||
Anum_pg_database_datname,
|
||||
BTEqualStrategyNumber, F_NAMEEQ,
|
||||
CStringGetDatum(dbname));
|
||||
systable_inplace_update_begin(pgdbrel, DatabaseNameIndexId, true,
|
||||
NULL, 1, &scankey, &tup, &inplace_state);
|
||||
if (!HeapTupleIsValid(tup))
|
||||
elog(ERROR, "cache lookup failed for database %u", db_id);
|
||||
datform = (Form_pg_database) GETSTRUCT(tup);
|
||||
datform->datconnlimit = DATCONNLIMIT_INVALID_DB;
|
||||
heap_inplace_update(pgdbrel, tup);
|
||||
systable_inplace_update_finish(inplace_state, tup);
|
||||
XLogFlush(XactLastRecEnd);
|
||||
|
||||
/*
|
||||
@@ -1700,8 +1691,7 @@ dropdb(const char *dbname, bool missing_ok, bool force)
|
||||
* the row will be gone, but if we fail, dropdb() can be invoked again.
|
||||
*/
|
||||
CatalogTupleDelete(pgdbrel, &tup->t_self);
|
||||
|
||||
systable_endscan(scan);
|
||||
heap_freetuple(tup);
|
||||
|
||||
/*
|
||||
* Drop db-specific replication slots.
|
||||
|
@@ -1326,7 +1326,9 @@ vac_update_relstats(Relation relation,
|
||||
{
|
||||
Oid relid = RelationGetRelid(relation);
|
||||
Relation rd;
|
||||
ScanKeyData key[1];
|
||||
HeapTuple ctup;
|
||||
void *inplace_state;
|
||||
Form_pg_class pgcform;
|
||||
bool dirty,
|
||||
futurexid,
|
||||
@@ -1337,7 +1339,12 @@ vac_update_relstats(Relation relation,
|
||||
rd = table_open(RelationRelationId, RowExclusiveLock);
|
||||
|
||||
/* Fetch a copy of the tuple to scribble on */
|
||||
ctup = SearchSysCacheCopy1(RELOID, ObjectIdGetDatum(relid));
|
||||
ScanKeyInit(&key[0],
|
||||
Anum_pg_class_oid,
|
||||
BTEqualStrategyNumber, F_OIDEQ,
|
||||
ObjectIdGetDatum(relid));
|
||||
systable_inplace_update_begin(rd, ClassOidIndexId, true,
|
||||
NULL, 1, key, &ctup, &inplace_state);
|
||||
if (!HeapTupleIsValid(ctup))
|
||||
elog(ERROR, "pg_class entry for relid %u vanished during vacuuming",
|
||||
relid);
|
||||
@@ -1445,7 +1452,9 @@ vac_update_relstats(Relation relation,
|
||||
|
||||
/* If anything changed, write out the tuple. */
|
||||
if (dirty)
|
||||
heap_inplace_update(rd, ctup);
|
||||
systable_inplace_update_finish(inplace_state, ctup);
|
||||
else
|
||||
systable_inplace_update_cancel(inplace_state);
|
||||
|
||||
table_close(rd, RowExclusiveLock);
|
||||
|
||||
@@ -1497,6 +1506,7 @@ vac_update_datfrozenxid(void)
|
||||
bool bogus = false;
|
||||
bool dirty = false;
|
||||
ScanKeyData key[1];
|
||||
void *inplace_state;
|
||||
|
||||
/*
|
||||
* Restrict this task to one backend per database. This avoids race
|
||||
@@ -1620,20 +1630,18 @@ vac_update_datfrozenxid(void)
|
||||
relation = table_open(DatabaseRelationId, RowExclusiveLock);
|
||||
|
||||
/*
|
||||
* Get the pg_database tuple to scribble on. Note that this does not
|
||||
* directly rely on the syscache to avoid issues with flattened toast
|
||||
* values for the in-place update.
|
||||
* Fetch a copy of the tuple to scribble on. We could check the syscache
|
||||
* tuple first. If that concluded !dirty, we'd avoid waiting on
|
||||
* concurrent heap_update() and would avoid exclusive-locking the buffer.
|
||||
* For now, don't optimize that.
|
||||
*/
|
||||
ScanKeyInit(&key[0],
|
||||
Anum_pg_database_oid,
|
||||
BTEqualStrategyNumber, F_OIDEQ,
|
||||
ObjectIdGetDatum(MyDatabaseId));
|
||||
|
||||
scan = systable_beginscan(relation, DatabaseOidIndexId, true,
|
||||
NULL, 1, key);
|
||||
tuple = systable_getnext(scan);
|
||||
tuple = heap_copytuple(tuple);
|
||||
systable_endscan(scan);
|
||||
systable_inplace_update_begin(relation, DatabaseOidIndexId, true,
|
||||
NULL, 1, key, &tuple, &inplace_state);
|
||||
|
||||
if (!HeapTupleIsValid(tuple))
|
||||
elog(ERROR, "could not find tuple for database %u", MyDatabaseId);
|
||||
@@ -1667,7 +1675,9 @@ vac_update_datfrozenxid(void)
|
||||
newMinMulti = dbform->datminmxid;
|
||||
|
||||
if (dirty)
|
||||
heap_inplace_update(relation, tuple);
|
||||
systable_inplace_update_finish(inplace_state, tuple);
|
||||
else
|
||||
systable_inplace_update_cancel(inplace_state);
|
||||
|
||||
heap_freetuple(tuple);
|
||||
table_close(relation, RowExclusiveLock);
|
||||
|
Reference in New Issue
Block a user