aboutsummaryrefslogtreecommitdiff
path: root/src/backend/storage/freespace/freespace.c
diff options
context:
space:
mode:
author Tom Lane <tgl@sss.pgh.pa.us> 2010-02-09 21:43:30 +0000
committer Tom Lane <tgl@sss.pgh.pa.us> 2010-02-09 21:43:30 +0000
commit cbe9d6beb4ae1cb20c08cab29b534be4923b6768 (patch)
tree a9476492cd8c7eda7718f95b0ad5a45d41e55a3a /src/backend/storage/freespace/freespace.c
parent 79647eed86cc972e80ea165dcb0b7f6fef876169 (diff)
download postgresql-cbe9d6beb4ae1cb20c08cab29b534be4923b6768.tar.gz
postgresql-cbe9d6beb4ae1cb20c08cab29b534be4923b6768.zip
Fix up rickety handling of relation-truncation interlocks.
Move rd_targblock, rd_fsm_nblocks, and rd_vm_nblocks from relcache to the smgr relation entries, so that they will get reset to InvalidBlockNumber whenever an smgr-level flush happens. Because we now send smgr invalidation messages immediately (not at end of transaction) when a relation truncation occurs, this ensures that other backends will reset their values before they next access the relation. We no longer need the unreliable assumption that a VACUUM that's doing a truncation will hold its AccessExclusive lock until commit --- in fact, we can intentionally release that lock as soon as we've completed the truncation. This patch therefore reverts (most of) Alvaro's patch of 2009-11-10, as well as my marginal hacking on it yesterday. We can also get rid of assorted no-longer-needed relcache flushes, which are far more expensive than an smgr flush because they kill a lot more state. In passing, this patch fixes smgr_redo's failure to perform visibility-map truncation, and cleans up some rather dubious assumptions in freespace.c and visibilitymap.c about when rd_fsm_nblocks and rd_vm_nblocks can be out of date.
Diffstat (limited to 'src/backend/storage/freespace/freespace.c')
-rw-r--r-- src/backend/storage/freespace/freespace.c 76
1 files changed, 43 insertions, 33 deletions
diff --git a/src/backend/storage/freespace/freespace.c b/src/backend/storage/freespace/freespace.c
index fb7bd7d83f8..b584c1fe380 100644
--- a/src/backend/storage/freespace/freespace.c
+++ b/src/backend/storage/freespace/freespace.c
@@ -8,7 +8,7 @@
* Portions Copyright (c) 1994, Regents of the University of California
*
* IDENTIFICATION
- * $PostgreSQL: pgsql/src/backend/storage/freespace/freespace.c,v 1.75 2010/02/09 00:28:57 tgl Exp $
+ * $PostgreSQL: pgsql/src/backend/storage/freespace/freespace.c,v 1.76 2010/02/09 21:43:30 tgl Exp $
*
*
* NOTES:
@@ -25,16 +25,16 @@
#include "access/htup.h"
#include "access/xlogutils.h"
-#include "storage/bufpage.h"
+#include "miscadmin.h"
#include "storage/bufmgr.h"
+#include "storage/bufpage.h"
#include "storage/freespace.h"
#include "storage/fsm_internals.h"
#include "storage/lmgr.h"
#include "storage/lwlock.h"
#include "storage/smgr.h"
#include "utils/rel.h"
-#include "utils/inval.h"
-#include "miscadmin.h"
+
/*
* We use just one byte to store the amount of free space on a page, so we
@@ -251,9 +251,9 @@ GetRecordedFreeSpace(Relation rel, BlockNumber heapBlk)
/*
* FreeSpaceMapTruncateRel - adjust for truncation of a relation.
*
- * The caller must hold AccessExclusiveLock on the relation, to ensure
- * that other backends receive the relcache invalidation event that this
- * function sends, before accessing the FSM again.
+ * The caller must hold AccessExclusiveLock on the relation, to ensure that
+ * other backends receive the smgr invalidation event that this function sends
+ * before they access the FSM again.
*
* nblocks is the new size of the heap.
*/
@@ -302,17 +302,18 @@ FreeSpaceMapTruncateRel(Relation rel, BlockNumber nblocks)
return; /* nothing to do; the FSM was already smaller */
}
- /* Truncate the unused FSM pages */
+ /* Truncate the unused FSM pages, and send smgr inval message */
smgrtruncate(rel->rd_smgr, FSM_FORKNUM, new_nfsmblocks, rel->rd_istemp);
/*
- * Need to invalidate the relcache entry, because rd_fsm_nblocks seen by
- * other backends is no longer valid.
+ * We might as well update the local smgr_fsm_nblocks setting.
+ * smgrtruncate sent an smgr cache inval message, which will cause
+ * other backends to invalidate their copy of smgr_fsm_nblocks, and
+ * this one too at the next command boundary. But this ensures it
+ * isn't outright wrong until then.
*/
- if (!InRecovery)
- CacheInvalidateRelcache(rel);
-
- rel->rd_fsm_nblocks = new_nfsmblocks;
+ if (rel->rd_smgr)
+ rel->rd_smgr->smgr_fsm_nblocks = new_nfsmblocks;
}
/*
@@ -506,17 +507,24 @@ fsm_readbuf(Relation rel, FSMAddress addr, bool extend)
RelationOpenSmgr(rel);
- /* If we haven't cached the size of the FSM yet, check it first */
- if (rel->rd_fsm_nblocks == InvalidBlockNumber)
+ /*
+ * If we haven't cached the size of the FSM yet, check it first. Also
+ * recheck if the requested block seems to be past end, since our
+ * cached value might be stale. (We send smgr inval messages on
+ * truncation, but not on extension.)
+ */
+ if (rel->rd_smgr->smgr_fsm_nblocks == InvalidBlockNumber ||
+ blkno >= rel->rd_smgr->smgr_fsm_nblocks)
{
if (smgrexists(rel->rd_smgr, FSM_FORKNUM))
- rel->rd_fsm_nblocks = smgrnblocks(rel->rd_smgr, FSM_FORKNUM);
+ rel->rd_smgr->smgr_fsm_nblocks = smgrnblocks(rel->rd_smgr,
+ FSM_FORKNUM);
else
- rel->rd_fsm_nblocks = 0;
+ rel->rd_smgr->smgr_fsm_nblocks = 0;
}
/* Handle requests beyond EOF */
- if (blkno >= rel->rd_fsm_nblocks)
+ if (blkno >= rel->rd_smgr->smgr_fsm_nblocks)
{
if (extend)
fsm_extend(rel, blkno + 1);
@@ -559,19 +567,23 @@ fsm_extend(Relation rel, BlockNumber fsm_nblocks)
* it.
*
* Note that another backend might have extended or created the relation
- * before we get the lock.
+ * by the time we get the lock.
*/
LockRelationForExtension(rel, ExclusiveLock);
- /* Create the FSM file first if it doesn't exist */
- if ((rel->rd_fsm_nblocks == 0 || rel->rd_fsm_nblocks == InvalidBlockNumber)
- && !smgrexists(rel->rd_smgr, FSM_FORKNUM))
- {
+ /* Might have to re-open if a cache flush happened */
+ RelationOpenSmgr(rel);
+
+ /*
+ * Create the FSM file first if it doesn't exist. If smgr_fsm_nblocks
+ * is positive then it must exist, no need for an smgrexists call.
+ */
+ if ((rel->rd_smgr->smgr_fsm_nblocks == 0 ||
+ rel->rd_smgr->smgr_fsm_nblocks == InvalidBlockNumber) &&
+ !smgrexists(rel->rd_smgr, FSM_FORKNUM))
smgrcreate(rel->rd_smgr, FSM_FORKNUM, false);
- fsm_nblocks_now = 0;
- }
- else
- fsm_nblocks_now = smgrnblocks(rel->rd_smgr, FSM_FORKNUM);
+
+ fsm_nblocks_now = smgrnblocks(rel->rd_smgr, FSM_FORKNUM);
while (fsm_nblocks_now < fsm_nblocks)
{
@@ -580,14 +592,12 @@ fsm_extend(Relation rel, BlockNumber fsm_nblocks)
fsm_nblocks_now++;
}
+ /* Update local cache with the up-to-date size */
+ rel->rd_smgr->smgr_fsm_nblocks = fsm_nblocks_now;
+
UnlockRelationForExtension(rel, ExclusiveLock);
pfree(pg);
-
- /* Update the relcache with the up-to-date size */
- if (!InRecovery)
- CacheInvalidateRelcache(rel);
- rel->rd_fsm_nblocks = fsm_nblocks_now;
}
/*