mirror of
https://github.com/postgres/postgres.git
synced 2025-09-02 04:21:28 +03:00
Include the backend ID in the relpath of temporary relations.
This allows us to reliably remove all leftover temporary relation files on cluster startup without reference to system catalogs or WAL; therefore, we no longer include temporary relations in XLOG_XACT_COMMIT and XLOG_XACT_ABORT WAL records. Since these changes require including a backend ID in each SharedInvalSmgrMsg, the size of the SharedInvalidationMessage.id field has been reduced from two bytes to one, and the maximum number of connections has been reduced from INT_MAX / 4 to 2^23-1. It would be possible to remove these restrictions by increasing the size of SharedInvalidationMessage by 4 bytes, but right now that doesn't seem like a good trade-off. Review by Jaime Casanova and Tom Lane.
This commit is contained in:
@@ -11,7 +11,7 @@
|
||||
*
|
||||
*
|
||||
* IDENTIFICATION
|
||||
* $PostgreSQL: pgsql/src/backend/storage/smgr/smgr.c,v 1.121 2010/02/26 02:01:01 momjian Exp $
|
||||
* $PostgreSQL: pgsql/src/backend/storage/smgr/smgr.c,v 1.122 2010/08/13 20:10:52 rhaas Exp $
|
||||
*
|
||||
*-------------------------------------------------------------------------
|
||||
*/
|
||||
@@ -45,19 +45,19 @@ typedef struct f_smgr
|
||||
void (*smgr_create) (SMgrRelation reln, ForkNumber forknum,
|
||||
bool isRedo);
|
||||
bool (*smgr_exists) (SMgrRelation reln, ForkNumber forknum);
|
||||
void (*smgr_unlink) (RelFileNode rnode, ForkNumber forknum,
|
||||
void (*smgr_unlink) (RelFileNodeBackend rnode, ForkNumber forknum,
|
||||
bool isRedo);
|
||||
void (*smgr_extend) (SMgrRelation reln, ForkNumber forknum,
|
||||
BlockNumber blocknum, char *buffer, bool isTemp);
|
||||
BlockNumber blocknum, char *buffer, bool skipFsync);
|
||||
void (*smgr_prefetch) (SMgrRelation reln, ForkNumber forknum,
|
||||
BlockNumber blocknum);
|
||||
void (*smgr_read) (SMgrRelation reln, ForkNumber forknum,
|
||||
BlockNumber blocknum, char *buffer);
|
||||
void (*smgr_write) (SMgrRelation reln, ForkNumber forknum,
|
||||
BlockNumber blocknum, char *buffer, bool isTemp);
|
||||
BlockNumber blocknum, char *buffer, bool skipFsync);
|
||||
BlockNumber (*smgr_nblocks) (SMgrRelation reln, ForkNumber forknum);
|
||||
void (*smgr_truncate) (SMgrRelation reln, ForkNumber forknum,
|
||||
BlockNumber nblocks, bool isTemp);
|
||||
BlockNumber nblocks);
|
||||
void (*smgr_immedsync) (SMgrRelation reln, ForkNumber forknum);
|
||||
void (*smgr_pre_ckpt) (void); /* may be NULL */
|
||||
void (*smgr_sync) (void); /* may be NULL */
|
||||
@@ -83,8 +83,6 @@ static HTAB *SMgrRelationHash = NULL;
|
||||
|
||||
/* local function prototypes */
|
||||
static void smgrshutdown(int code, Datum arg);
|
||||
static void smgr_internal_unlink(RelFileNode rnode, ForkNumber forknum,
|
||||
int which, bool isTemp, bool isRedo);
|
||||
|
||||
|
||||
/*
|
||||
@@ -131,8 +129,9 @@ smgrshutdown(int code, Datum arg)
|
||||
* This does not attempt to actually open the object.
|
||||
*/
|
||||
SMgrRelation
|
||||
smgropen(RelFileNode rnode)
|
||||
smgropen(RelFileNode rnode, BackendId backend)
|
||||
{
|
||||
RelFileNodeBackend brnode;
|
||||
SMgrRelation reln;
|
||||
bool found;
|
||||
|
||||
@@ -142,7 +141,7 @@ smgropen(RelFileNode rnode)
|
||||
HASHCTL ctl;
|
||||
|
||||
MemSet(&ctl, 0, sizeof(ctl));
|
||||
ctl.keysize = sizeof(RelFileNode);
|
||||
ctl.keysize = sizeof(RelFileNodeBackend);
|
||||
ctl.entrysize = sizeof(SMgrRelationData);
|
||||
ctl.hash = tag_hash;
|
||||
SMgrRelationHash = hash_create("smgr relation table", 400,
|
||||
@@ -150,8 +149,10 @@ smgropen(RelFileNode rnode)
|
||||
}
|
||||
|
||||
/* Look up or create an entry */
|
||||
brnode.node = rnode;
|
||||
brnode.backend = backend;
|
||||
reln = (SMgrRelation) hash_search(SMgrRelationHash,
|
||||
(void *) &rnode,
|
||||
(void *) &brnode,
|
||||
HASH_ENTER, &found);
|
||||
|
||||
/* Initialize it if not present before */
|
||||
@@ -261,7 +262,7 @@ smgrcloseall(void)
|
||||
* such entry exists already.
|
||||
*/
|
||||
void
|
||||
smgrclosenode(RelFileNode rnode)
|
||||
smgrclosenode(RelFileNodeBackend rnode)
|
||||
{
|
||||
SMgrRelation reln;
|
||||
|
||||
@@ -305,8 +306,8 @@ smgrcreate(SMgrRelation reln, ForkNumber forknum, bool isRedo)
|
||||
* should be here and not in commands/tablespace.c? But that would imply
|
||||
* importing a lot of stuff that smgr.c oughtn't know, either.
|
||||
*/
|
||||
TablespaceCreateDbspace(reln->smgr_rnode.spcNode,
|
||||
reln->smgr_rnode.dbNode,
|
||||
TablespaceCreateDbspace(reln->smgr_rnode.node.spcNode,
|
||||
reln->smgr_rnode.node.dbNode,
|
||||
isRedo);
|
||||
|
||||
(*(smgrsw[reln->smgr_which].smgr_create)) (reln, forknum, isRedo);
|
||||
@@ -323,29 +324,19 @@ smgrcreate(SMgrRelation reln, ForkNumber forknum, bool isRedo)
|
||||
* already.
|
||||
*/
|
||||
void
|
||||
smgrdounlink(SMgrRelation reln, ForkNumber forknum, bool isTemp, bool isRedo)
|
||||
smgrdounlink(SMgrRelation reln, ForkNumber forknum, bool isRedo)
|
||||
{
|
||||
RelFileNode rnode = reln->smgr_rnode;
|
||||
RelFileNodeBackend rnode = reln->smgr_rnode;
|
||||
int which = reln->smgr_which;
|
||||
|
||||
/* Close the fork */
|
||||
(*(smgrsw[which].smgr_close)) (reln, forknum);
|
||||
|
||||
smgr_internal_unlink(rnode, forknum, which, isTemp, isRedo);
|
||||
}
|
||||
|
||||
/*
|
||||
* Shared subroutine that actually does the unlink ...
|
||||
*/
|
||||
static void
|
||||
smgr_internal_unlink(RelFileNode rnode, ForkNumber forknum,
|
||||
int which, bool isTemp, bool isRedo)
|
||||
{
|
||||
/*
|
||||
* Get rid of any remaining buffers for the relation. bufmgr will just
|
||||
* drop them without bothering to write the contents.
|
||||
*/
|
||||
DropRelFileNodeBuffers(rnode, forknum, isTemp, 0);
|
||||
DropRelFileNodeBuffers(rnode, forknum, 0);
|
||||
|
||||
/*
|
||||
* It'd be nice to tell the stats collector to forget it immediately, too.
|
||||
@@ -385,10 +376,10 @@ smgr_internal_unlink(RelFileNode rnode, ForkNumber forknum,
|
||||
*/
|
||||
void
|
||||
smgrextend(SMgrRelation reln, ForkNumber forknum, BlockNumber blocknum,
|
||||
char *buffer, bool isTemp)
|
||||
char *buffer, bool skipFsync)
|
||||
{
|
||||
(*(smgrsw[reln->smgr_which].smgr_extend)) (reln, forknum, blocknum,
|
||||
buffer, isTemp);
|
||||
buffer, skipFsync);
|
||||
}
|
||||
|
||||
/*
|
||||
@@ -426,16 +417,16 @@ smgrread(SMgrRelation reln, ForkNumber forknum, BlockNumber blocknum,
|
||||
* on disk at return, only dumped out to the kernel. However,
|
||||
* provisions will be made to fsync the write before the next checkpoint.
|
||||
*
|
||||
* isTemp indicates that the relation is a temp table (ie, is managed
|
||||
* by the local-buffer manager). In this case no provisions need be
|
||||
* made to fsync the write before checkpointing.
|
||||
* skipFsync indicates that the caller will make other provisions to
|
||||
* fsync the relation, so we needn't bother. Temporary relations also
|
||||
* do not require fsync.
|
||||
*/
|
||||
void
|
||||
smgrwrite(SMgrRelation reln, ForkNumber forknum, BlockNumber blocknum,
|
||||
char *buffer, bool isTemp)
|
||||
char *buffer, bool skipFsync)
|
||||
{
|
||||
(*(smgrsw[reln->smgr_which].smgr_write)) (reln, forknum, blocknum,
|
||||
buffer, isTemp);
|
||||
buffer, skipFsync);
|
||||
}
|
||||
|
||||
/*
|
||||
@@ -455,14 +446,13 @@ smgrnblocks(SMgrRelation reln, ForkNumber forknum)
|
||||
* The truncation is done immediately, so this can't be rolled back.
|
||||
*/
|
||||
void
|
||||
smgrtruncate(SMgrRelation reln, ForkNumber forknum, BlockNumber nblocks,
|
||||
bool isTemp)
|
||||
smgrtruncate(SMgrRelation reln, ForkNumber forknum, BlockNumber nblocks)
|
||||
{
|
||||
/*
|
||||
* Get rid of any buffers for the about-to-be-deleted blocks. bufmgr will
|
||||
* just drop them without bothering to write the contents.
|
||||
*/
|
||||
DropRelFileNodeBuffers(reln->smgr_rnode, forknum, isTemp, nblocks);
|
||||
DropRelFileNodeBuffers(reln->smgr_rnode, forknum, nblocks);
|
||||
|
||||
/*
|
||||
* Send a shared-inval message to force other backends to close any smgr
|
||||
@@ -479,8 +469,7 @@ smgrtruncate(SMgrRelation reln, ForkNumber forknum, BlockNumber nblocks,
|
||||
/*
|
||||
* Do the truncation.
|
||||
*/
|
||||
(*(smgrsw[reln->smgr_which].smgr_truncate)) (reln, forknum, nblocks,
|
||||
isTemp);
|
||||
(*(smgrsw[reln->smgr_which].smgr_truncate)) (reln, forknum, nblocks);
|
||||
}
|
||||
|
||||
/*
|
||||
@@ -499,7 +488,7 @@ smgrtruncate(SMgrRelation reln, ForkNumber forknum, BlockNumber nblocks,
|
||||
* to use the WAL log for PITR or replication purposes: in that case
|
||||
* we have to make WAL entries as well.)
|
||||
*
|
||||
* The preceding writes should specify isTemp = true to avoid
|
||||
* The preceding writes should specify skipFsync = true to avoid
|
||||
* duplicative fsyncs.
|
||||
*
|
||||
* Note that you need to do FlushRelationBuffers() first if there is
|
||||
|
Reference in New Issue
Block a user