1
0
mirror of https://github.com/postgres/postgres.git synced 2025-08-18 12:22:09 +03:00

It turns out that TablespaceCreateDbspace fails badly if a relcache flush
occurs when it tries to heap_open pg_tablespace.  When control returns to
smgrcreate, that routine will be holding a dangling pointer to a closed
SMgrRelation, resulting in mayhem.  This is of course a consequence of
the violation of proper module layering inherent in having smgr.c call
a tablespace command routine, but the simplest fix seems to be to change
the locking mechanism.  There's no real need for TablespaceCreateDbspace
to touch pg_tablespace at all --- it's only opening it as a way of locking
against a parallel DROP TABLESPACE command.  A much better answer is to
create a special-purpose LWLock to interlock these two operations.
This drops TablespaceCreateDbspace quite a few layers down the food chain
and makes it something reasonably safe for smgr to call.
This commit is contained in:
Tom Lane
2006-01-19 04:45:58 +00:00
parent 754da88e19
commit 9fad6e338b
2 changed files with 27 additions and 31 deletions

View File

@@ -37,7 +37,7 @@
* *
* *
* IDENTIFICATION * IDENTIFICATION
* $PostgreSQL: pgsql/src/backend/commands/tablespace.c,v 1.15 2004/12/31 21:59:41 pgsql Exp $ * $PostgreSQL: pgsql/src/backend/commands/tablespace.c,v 1.15.4.1 2006/01/19 04:45:57 tgl Exp $
* *
*------------------------------------------------------------------------- *-------------------------------------------------------------------------
*/ */
@@ -83,12 +83,9 @@ static void set_short_version(const char *path);
* If tablespaces are not supported, this is just a no-op; CREATE DATABASE * If tablespaces are not supported, this is just a no-op; CREATE DATABASE
* is expected to create the default subdirectory for the database. * is expected to create the default subdirectory for the database.
* *
* isRedo indicates that we are creating an object during WAL replay; * isRedo indicates that we are creating an object during WAL replay.
* we can skip doing locking in that case (and should do so to avoid * In this case we will cope with the possibility of the tablespace
* any possible problems with pg_tablespace not being valid). * directory not being there either --- this could happen if we are
*
* Also, when isRedo is true, we will cope with the possibility of the
* tablespace not being there either --- this could happen if we are
* replaying an operation on a table in a subsequently-dropped tablespace. * replaying an operation on a table in a subsequently-dropped tablespace.
* We handle this by making a directory in the place where the tablespace * We handle this by making a directory in the place where the tablespace
* symlink would normally be. This isn't an exact replay of course, but * symlink would normally be. This isn't an exact replay of course, but
@@ -118,16 +115,10 @@ TablespaceCreateDbspace(Oid spcNode, Oid dbNode, bool isRedo)
if (errno == ENOENT) if (errno == ENOENT)
{ {
/* /*
* Acquire ExclusiveLock on pg_tablespace to ensure that no * Acquire TablespaceCreateLock to ensure that no DROP TABLESPACE
* DROP TABLESPACE or TablespaceCreateDbspace is running * or TablespaceCreateDbspace is running concurrently.
* concurrently. Simple reads from pg_tablespace are OK.
*/ */
Relation rel; LWLockAcquire(TablespaceCreateLock, LW_EXCLUSIVE);
if (!isRedo)
rel = heap_openr(TableSpaceRelationName, ExclusiveLock);
else
rel = NULL;
/* /*
* Recheck to see if someone created the directory while we * Recheck to see if someone created the directory while we
@@ -166,9 +157,7 @@ TablespaceCreateDbspace(Oid spcNode, Oid dbNode, bool isRedo)
} }
} }
/* OK to drop the exclusive lock */ LWLockRelease(TablespaceCreateLock);
if (!isRedo)
heap_close(rel, ExclusiveLock);
} }
else else
{ {
@@ -402,16 +391,11 @@ DropTableSpace(DropTableSpaceStmt *stmt)
/* don't call this in a transaction block */ /* don't call this in a transaction block */
PreventTransactionChain((void *) stmt, "DROP TABLESPACE"); PreventTransactionChain((void *) stmt, "DROP TABLESPACE");
/*
* Acquire ExclusiveLock on pg_tablespace to ensure that no one else
* is trying to do DROP TABLESPACE or TablespaceCreateDbspace
* concurrently.
*/
rel = heap_openr(TableSpaceRelationName, ExclusiveLock);
/* /*
* Find the target tuple * Find the target tuple
*/ */
rel = heap_openr(TableSpaceRelationName, RowExclusiveLock);
ScanKeyInit(&entry[0], ScanKeyInit(&entry[0],
Anum_pg_tablespace_spcname, Anum_pg_tablespace_spcname,
BTEqualStrategyNumber, F_NAMEEQ, BTEqualStrategyNumber, F_NAMEEQ,
@@ -447,6 +431,12 @@ DropTableSpace(DropTableSpaceStmt *stmt)
heap_endscan(scandesc); heap_endscan(scandesc);
/*
* Acquire TablespaceCreateLock to ensure that no TablespaceCreateDbspace
* is running concurrently.
*/
LWLockAcquire(TablespaceCreateLock, LW_EXCLUSIVE);
/* /*
* Try to remove the physical infrastructure * Try to remove the physical infrastructure
*/ */
@@ -470,6 +460,11 @@ DropTableSpace(DropTableSpaceStmt *stmt)
(void) XLogInsert(RM_TBLSPC_ID, XLOG_TBLSPC_DROP, rdata); (void) XLogInsert(RM_TBLSPC_ID, XLOG_TBLSPC_DROP, rdata);
} }
/*
* Allow TablespaceCreateDbspace again.
*/
LWLockRelease(TablespaceCreateLock);
/* We keep the lock on pg_tablespace until commit */ /* We keep the lock on pg_tablespace until commit */
heap_close(rel, NoLock); heap_close(rel, NoLock);
@@ -507,10 +502,10 @@ remove_tablespace_directories(Oid tablespaceoid, bool redo)
* next attempt to use the tablespace from that database will simply * next attempt to use the tablespace from that database will simply
* recreate the subdirectory via TablespaceCreateDbspace.) * recreate the subdirectory via TablespaceCreateDbspace.)
* *
* Since we hold exclusive lock, no one else should be creating any fresh * Since we hold TablespaceCreateLock, no one else should be creating any
* subdirectories in parallel. It is possible that new files are * fresh subdirectories in parallel. It is possible that new files are
* being created within subdirectories, though, so the rmdir call * being created within subdirectories, though, so the rmdir call could
* could fail. Worst consequence is a less friendly error message. * fail. Worst consequence is a less friendly error message.
*/ */
dirdesc = AllocateDir(location); dirdesc = AllocateDir(location);
if (dirdesc == NULL) if (dirdesc == NULL)

View File

@@ -7,7 +7,7 @@
* Portions Copyright (c) 1996-2005, PostgreSQL Global Development Group * Portions Copyright (c) 1996-2005, PostgreSQL Global Development Group
* Portions Copyright (c) 1994, Regents of the University of California * Portions Copyright (c) 1994, Regents of the University of California
* *
* $PostgreSQL: pgsql/src/include/storage/lwlock.h,v 1.16 2004/12/31 22:03:42 pgsql Exp $ * $PostgreSQL: pgsql/src/include/storage/lwlock.h,v 1.16.4.1 2006/01/19 04:45:58 tgl Exp $
* *
*------------------------------------------------------------------------- *-------------------------------------------------------------------------
*/ */
@@ -41,6 +41,7 @@ typedef enum LWLockId
SubtransControlLock, SubtransControlLock,
RelCacheInitLock, RelCacheInitLock,
BgWriterCommLock, BgWriterCommLock,
TablespaceCreateLock,
NumFixedLWLocks, /* must be last except for NumFixedLWLocks, /* must be last except for
* MaxDynamicLWLock */ * MaxDynamicLWLock */