/*-------------------------------------------------------------------------
 *
 * smgr.c
 *	  public interface routines to storage manager switch.
 *
 *	  All file system operations in POSTGRES dispatch through these
 *	  routines.
 *
 * Portions Copyright (c) 1996-2003, PostgreSQL Global Development Group
 * Portions Copyright (c) 1994, Regents of the University of California
 *
 *
 * IDENTIFICATION
 *	  $PostgreSQL: pgsql/src/backend/storage/smgr/smgr.c,v 1.72 2004/05/31 20:31:33 tgl Exp $
 *
 *-------------------------------------------------------------------------
 */
#include "postgres.h"

20
#include "storage/bufmgr.h"
21
#include "storage/freespace.h"
22
#include "storage/ipc.h"
M
Marc G. Fournier 已提交
23
#include "storage/smgr.h"
24
#include "utils/hsearch.h"
25 26
#include "utils/memutils.h"

27

28 29 30 31 32 33 34
/*
 * This struct of function pointers defines the API between smgr.c and
 * any individual storage manager module.  Note that smgr subfunctions are
 * generally expected to return TRUE on success, FALSE on error.  (For
 * nblocks and truncate we instead say that returning InvalidBlockNumber
 * indicates an error.)
 */
35 36
typedef struct f_smgr
{
37 38 39 40 41 42
	bool		(*smgr_init) (void);			/* may be NULL */
	bool		(*smgr_shutdown) (void);		/* may be NULL */
	bool		(*smgr_close) (SMgrRelation reln);
	bool		(*smgr_create) (SMgrRelation reln, bool isRedo);
	bool		(*smgr_unlink) (RelFileNode rnode, bool isRedo);
	bool		(*smgr_extend) (SMgrRelation reln, BlockNumber blocknum,
43
								char *buffer, bool isTemp);
44
	bool		(*smgr_read) (SMgrRelation reln, BlockNumber blocknum,
45
							  char *buffer);
46
	bool		(*smgr_write) (SMgrRelation reln, BlockNumber blocknum,
47
							   char *buffer, bool isTemp);
48
	BlockNumber (*smgr_nblocks) (SMgrRelation reln);
49 50
	BlockNumber (*smgr_truncate) (SMgrRelation reln, BlockNumber nblocks,
								  bool isTemp);
51 52 53
	bool		(*smgr_commit) (void);			/* may be NULL */
	bool		(*smgr_abort) (void);			/* may be NULL */
	bool		(*smgr_sync) (void);			/* may be NULL */
54
} f_smgr;
55 56


57
static const f_smgr smgrsw[] = {
58
	/* magnetic disk */
59
	{mdinit, NULL, mdclose, mdcreate, mdunlink, mdextend,
60
	 mdread, mdwrite, mdnblocks, mdtruncate, NULL, NULL, mdsync
61
	}
62 63
};

64
static const int	NSmgr = lengthof(smgrsw);
65

66

67 68 69 70
/*
 * Each backend has a hashtable that stores all extant SMgrRelation objects.
 *
 * The pointer stays NULL until smgropen() builds the table on its first
 * call; smgrcloseall() and smgrclosenode() treat NULL as "nothing to do".
 */
static HTAB *SMgrRelationHash = NULL;
71

72 73 74 75 76
/*
 * We keep a list of all relations (represented as RelFileNode values)
 * that have been created or deleted in the current transaction.  When
 * a relation is created, we create the physical file immediately, but
 * remember it so that we can delete the file again if the current
B
Bruce Momjian 已提交
77
 * transaction is aborted.	Conversely, a deletion request is NOT
78 79 80 81 82 83 84 85 86 87 88
 * executed immediately, but is just entered in the list.  When and if
 * the transaction commits, we can delete the physical file.
 *
 * NOTE: the list is kept in TopMemoryContext to be sure it won't disappear
 * unbetimes.  It'd probably be OK to keep it in TopTransactionContext,
 * but I'm being paranoid.
 */

typedef struct PendingRelDelete
{
	RelFileNode relnode;		/* relation that may need to be deleted */
89
	int			which;			/* which storage manager? */
90
	bool		isTemp;			/* is it a temporary relation? */
B
Bruce Momjian 已提交
91 92
	bool		atCommit;		/* T=delete at commit; F=delete at abort */
	struct PendingRelDelete *next;		/* linked-list link */
93 94
} PendingRelDelete;

B
Bruce Momjian 已提交
95
static PendingRelDelete *pendingDeletes = NULL; /* head of linked list */
96 97


98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120
/*
 * Declarations for smgr-related XLOG records
 *
 * Note: we log file creation and truncation here, but logging of deletion
 * actions is handled by xact.c, because it is part of transaction commit.
 */

/* XLOG gives us high 4 bits */
#define XLOG_SMGR_CREATE	0x10
#define XLOG_SMGR_TRUNCATE	0x20

/* Payload of an XLOG_SMGR_CREATE record (written by smgrcreate) */
typedef struct xl_smgr_create
{
	RelFileNode		rnode;		/* relation whose storage was created */
} xl_smgr_create;

/* Payload of an XLOG_SMGR_TRUNCATE record (written by smgrtruncate) */
typedef struct xl_smgr_truncate
{
	BlockNumber		blkno;		/* block count reported by the truncation;
								 * replay truncates to this many blocks */
	RelFileNode		rnode;		/* relation that was truncated */
} xl_smgr_truncate;


121 122 123 124 125 126
/* local function prototypes */

/* exit-time callback that smgrinit() hands to on_proc_exit() */
static void smgrshutdown(int code, Datum arg);

/* common unlink path used by smgrdounlink() and smgrDoPendingDeletes() */
static void smgr_internal_unlink(RelFileNode rnode, int which,
								 bool isTemp, bool isRedo);


127
/*
128 129
 *	smgrinit(), smgrshutdown() -- Initialize or shut down all storage
 *								  managers.
130
 *
131 132
 * Note: in the normal multiprocess scenario with a postmaster, these are
 * called at postmaster start and stop, not per-backend.
133
 */
134
void
135
smgrinit(void)
136
{
137
	int			i;
138 139 140 141 142

	for (i = 0; i < NSmgr; i++)
	{
		if (smgrsw[i].smgr_init)
		{
143
			if (! (*(smgrsw[i].smgr_init)) ())
144
				elog(FATAL, "smgr initialization failed on %s: %m",
145
					 DatumGetCString(DirectFunctionCall1(smgrout,
B
Bruce Momjian 已提交
146
													 Int16GetDatum(i))));
147
		}
148 149
	}

150
	/* register the shutdown proc */
151
	on_proc_exit(smgrshutdown, 0);
152 153
}

154
static void
155
smgrshutdown(int code, Datum arg)
156
{
157
	int			i;
158 159 160 161 162

	for (i = 0; i < NSmgr; i++)
	{
		if (smgrsw[i].smgr_shutdown)
		{
163
			if (! (*(smgrsw[i].smgr_shutdown)) ())
164
				elog(FATAL, "smgr shutdown failed on %s: %m",
165
					 DatumGetCString(DirectFunctionCall1(smgrout,
B
Bruce Momjian 已提交
166
													 Int16GetDatum(i))));
167
		}
168 169 170
	}
}

171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286
/*
 *	smgropen() -- Return an SMgrRelation object, creating it if need be.
 *
 *		This does not attempt to actually open the object.
 *
 * The backend-local hashtable is built lazily on the first call.  A newly
 * made entry is set to storage manager 0 with md_fd = NULL (not open); an
 * entry that already existed is returned untouched.  Failure to build the
 * table or to add an entry is reported as an out-of-memory ERROR.
 */
SMgrRelation
smgropen(RelFileNode rnode)
{
	SMgrRelation	reln;
	bool		found;

	if (SMgrRelationHash == NULL)
	{
		/* First time through: initialize the hash table */
		HASHCTL		ctl;

		MemSet(&ctl, 0, sizeof(ctl));
		ctl.keysize = sizeof(RelFileNode);
		ctl.entrysize = sizeof(SMgrRelationData);
		ctl.hash = tag_hash;
		SMgrRelationHash = hash_create("smgr relation table", 400,
									   &ctl, HASH_ELEM | HASH_FUNCTION);

		/*
		 * Never hand a NULL table to hash_search below.  (This assumes
		 * hash_create signals failure by returning NULL, the same way
		 * hash_search does; the check is harmless if hash_create reports
		 * errors itself.)  SMgrRelationHash is still NULL in that case,
		 * so a later call simply retries the creation.
		 */
		if (SMgrRelationHash == NULL)
			ereport(ERROR,
					(errcode(ERRCODE_OUT_OF_MEMORY),
					 errmsg("out of memory")));
	}

	/* Look up or create an entry */
	reln = (SMgrRelation) hash_search(SMgrRelationHash,
									  (void *) &rnode,
									  HASH_ENTER, &found);
	if (reln == NULL)
		ereport(ERROR,
				(errcode(ERRCODE_OUT_OF_MEMORY),
				 errmsg("out of memory")));

	/* Initialize it if not present before */
	if (!found)
	{
		/* hash_search already filled in the lookup key */
		reln->smgr_which = 0;	/* we only have md.c at present */
		reln->md_fd = NULL;		/* mark it not open */
	}

	return reln;
}

/*
 *	smgrclose() -- Close and delete an SMgrRelation object.
 *
 * The owning storage manager is asked to close the relation first; only
 * if that succeeds is the object's hashtable entry removed.  Callers must
 * therefore drop their own pointers after a successful return, and must
 * expect the object to still exist if an error was raised instead.
 */
void
smgrclose(SMgrRelation reln)
{
	const f_smgr *mgr = &smgrsw[reln->smgr_which];
	void	   *removed;

	/* Step 1: let the storage manager close the relation */
	if (!mgr->smgr_close(reln))
		ereport(ERROR,
				(errcode_for_file_access(),
				 errmsg("could not close relation %u/%u: %m",
						reln->smgr_rnode.tblNode,
						reln->smgr_rnode.relNode)));

	/* Step 2: forget the object; its entry has to be in the table */
	removed = hash_search(SMgrRelationHash,
						  (void *) &(reln->smgr_rnode),
						  HASH_REMOVE, NULL);
	if (removed == NULL)
		elog(ERROR, "SMgrRelation hashtable corrupted");
}

/*
 *	smgrcloseall() -- Close all existing SMgrRelation objects.
 *
 * It is the caller's responsibility not to leave any dangling references.
 */
void
smgrcloseall(void)
{
	HASH_SEQ_STATUS status;
	SMgrRelation reln;

	/* Nothing to do if hashtable not set up */
	if (SMgrRelationHash == NULL)
		return;

	hash_seq_init(&status, SMgrRelationHash);

	while ((reln = (SMgrRelation) hash_seq_search(&status)) != NULL)
	{
		smgrclose(reln);
	}
}

/*
 *	smgrclosenode() -- Close SMgrRelation object for given RelFileNode,
 *					   if one exists.
 *
 * Equivalent in effect to smgrclose(smgropen(rnode)), except that a
 * lookup-only probe is used, so no hashtable entry is created merely to
 * be thrown away when the relation was not open in the first place.
 *
 * It is the caller's responsibility not to leave any dangling references.
 */
void
smgrclosenode(RelFileNode rnode)
{
	SMgrRelation	existing;

	/* Without a hashtable there cannot be a matching object */
	if (SMgrRelationHash == NULL)
		return;

	existing = (SMgrRelation) hash_search(SMgrRelationHash,
										  (void *) &rnode,
										  HASH_FIND, NULL);
	if (existing == NULL)
		return;					/* not open: nothing to close */

	smgrclose(existing);
}

287
/*
288
 *	smgrcreate() -- Create a new relation.
289
 *
290 291 292 293 294 295 296
 *		Given an already-created (but presumably unused) SMgrRelation,
 *		cause the underlying disk file or other storage to be created.
 *
 *		If isRedo is true, it is okay for the underlying file to exist
 *		already because we are in a WAL replay sequence.  In this case
 *		we should make no PendingRelDelete entry; the WAL sequence will
 *		tell whether to drop the file.
297
 */
298 299
void
smgrcreate(SMgrRelation reln, bool isTemp, bool isRedo)
300
{
301 302 303
	XLogRecPtr		lsn;
	XLogRecData		rdata;
	xl_smgr_create	xlrec;
304
	PendingRelDelete *pending;
305

306
	if (! (*(smgrsw[reln->smgr_which].smgr_create)) (reln, isRedo))
307 308
		ereport(ERROR,
				(errcode_for_file_access(),
309 310 311 312 313 314
				 errmsg("could not create relation %u/%u: %m",
						reln->smgr_rnode.tblNode,
						reln->smgr_rnode.relNode)));

	if (isRedo)
		return;
315

316 317 318 319 320 321 322 323 324 325 326 327 328 329
	/*
	 * Make a non-transactional XLOG entry showing the file creation.  It's
	 * non-transactional because we should replay it whether the transaction
	 * commits or not; if not, the file will be dropped at abort time.
	 */
	xlrec.rnode = reln->smgr_rnode;

	rdata.buffer = InvalidBuffer;
	rdata.data = (char *) &xlrec;
	rdata.len = sizeof(xlrec);
	rdata.next = NULL;

	lsn = XLogInsert(RM_SMGR_ID, XLOG_SMGR_CREATE | XLOG_NO_TRAN, &rdata);

330 331 332
	/* Add the relation to the list of stuff to delete at abort */
	pending = (PendingRelDelete *)
		MemoryContextAlloc(TopMemoryContext, sizeof(PendingRelDelete));
333 334 335
	pending->relnode = reln->smgr_rnode;
	pending->which = reln->smgr_which;
	pending->isTemp = isTemp;
336 337 338
	pending->atCommit = false;	/* delete if abort */
	pending->next = pendingDeletes;
	pendingDeletes = pending;
339 340 341
}

/*
342 343 344 345
 *	smgrscheduleunlink() -- Schedule unlinking a relation at xact commit.
 *
 *		The relation is marked to be removed from the store if we
 *		successfully commit the current transaction.
346
 *
347
 * This also implies smgrclose() on the SMgrRelation object.
348
 */
349 350
void
smgrscheduleunlink(SMgrRelation reln, bool isTemp)
351
{
352 353 354 355 356
	PendingRelDelete *pending;

	/* Add the relation to the list of stuff to delete at commit */
	pending = (PendingRelDelete *)
		MemoryContextAlloc(TopMemoryContext, sizeof(PendingRelDelete));
357 358 359
	pending->relnode = reln->smgr_rnode;
	pending->which = reln->smgr_which;
	pending->isTemp = isTemp;
360 361 362 363 364 365
	pending->atCommit = true;	/* delete if commit */
	pending->next = pendingDeletes;
	pendingDeletes = pending;

	/*
	 * NOTE: if the relation was created in this transaction, it will now
B
Bruce Momjian 已提交
366 367 368 369 370
	 * be present in the pending-delete list twice, once with atCommit
	 * true and once with atCommit false.  Hence, it will be physically
	 * deleted at end of xact in either case (and the other entry will be
	 * ignored by smgrDoPendingDeletes, so no error will occur).  We could
	 * instead remove the existing list entry and delete the physical file
371 372
	 * immediately, but for now I'll keep the logic simple.
	 */
373

374 375
	/* Now close the file and throw away the hashtable entry */
	smgrclose(reln);
376 377 378
}

/*
379
 *	smgrdounlink() -- Immediately unlink a relation.
380
 *
381 382
 *		The relation is removed from the store.  This should not be used
 *		during transactional operations, since it can't be undone.
383
 *
384 385 386 387
 *		If isRedo is true, it is okay for the underlying file to be gone
 *		already.  (In practice isRedo will always be true.)
 *
 * This also implies smgrclose() on the SMgrRelation object.
388
 */
389 390
void
smgrdounlink(SMgrRelation reln, bool isTemp, bool isRedo)
391
{
392 393
	RelFileNode	rnode = reln->smgr_rnode;
	int			which = reln->smgr_which;
394

395 396
	/* Close the file and throw away the hashtable entry */
	smgrclose(reln);
397

398
	smgr_internal_unlink(rnode, which, isTemp, isRedo);
399 400 401
}

/*
402
 * Shared subroutine that actually does the unlink ...
403
 */
404 405
static void
smgr_internal_unlink(RelFileNode rnode, int which, bool isTemp, bool isRedo)
406
{
407 408 409 410
	/*
	 * Get rid of any leftover buffers for the rel (shouldn't be any in the
	 * commit case, but there can be in the abort case).
	 */
411
	DropRelFileNodeBuffers(rnode, isTemp, 0);
412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430

	/*
	 * Tell the free space map to forget this relation.  It won't be accessed
	 * any more anyway, but we may as well recycle the map space quickly.
	 */
	FreeSpaceMapForgetRel(&rnode);

	/*
	 * And delete the physical files.
	 *
	 * Note: we treat deletion failure as a WARNING, not an error,
	 * because we've already decided to commit or abort the current xact.
	 */
	if (! (*(smgrsw[which].smgr_unlink)) (rnode, isRedo))
		ereport(WARNING,
				(errcode_for_file_access(),
				 errmsg("could not unlink relation %u/%u: %m",
						rnode.tblNode,
						rnode.relNode)));
431 432 433
}

/*
434
 *	smgrextend() -- Add a new block to a file.
435
 *
436 437 438 439
 *		The semantics are basically the same as smgrwrite(): write at the
 *		specified position.  However, we are expecting to extend the
 *		relation (ie, blocknum is the current EOF), and so in case of
 *		failure we clean up by truncating.
440
 */
441
void
442
smgrextend(SMgrRelation reln, BlockNumber blocknum, char *buffer, bool isTemp)
443
{
444 445
	if (! (*(smgrsw[reln->smgr_which].smgr_extend)) (reln, blocknum, buffer,
													 isTemp))
446 447
		ereport(ERROR,
				(errcode_for_file_access(),
448 449 450 451
				 errmsg("could not extend relation %u/%u: %m",
						reln->smgr_rnode.tblNode,
						reln->smgr_rnode.relNode),
				 errhint("Check free disk space.")));
452 453 454
}

/*
455 456
 *	smgrread() -- read a particular block from a relation into the supplied
 *				  buffer.
457
 *
458 459
 *		This routine is called from the buffer manager in order to
 *		instantiate pages in the shared buffer cache.  All storage managers
460
 *		return pages in the format that POSTGRES expects.
461
 */
462 463
void
smgrread(SMgrRelation reln, BlockNumber blocknum, char *buffer)
464
{
465
	if (! (*(smgrsw[reln->smgr_which].smgr_read)) (reln, blocknum, buffer))
466 467
		ereport(ERROR,
				(errcode_for_file_access(),
468 469 470 471
				 errmsg("could not read block %u of relation %u/%u: %m",
						blocknum,
						reln->smgr_rnode.tblNode,
						reln->smgr_rnode.relNode)));
472 473 474
}

/*
475
 *	smgrwrite() -- Write the supplied buffer out.
476
 *
477
 *		This is not a synchronous write -- the block is not necessarily
478 479 480 481 482 483
 *		on disk at return, only dumped out to the kernel.  However,
 *		provisions will be made to fsync the write before the next checkpoint.
 *
 *		isTemp indicates that the relation is a temp table (ie, is managed
 *		by the local-buffer manager).  In this case no provisions need be
 *		made to fsync the write before checkpointing.
484
 */
485
void
486
smgrwrite(SMgrRelation reln, BlockNumber blocknum, char *buffer, bool isTemp)
487
{
488 489
	if (! (*(smgrsw[reln->smgr_which].smgr_write)) (reln, blocknum, buffer,
													isTemp))
490 491
		ereport(ERROR,
				(errcode_for_file_access(),
492 493 494 495
				 errmsg("could not write block %u of relation %u/%u: %m",
						blocknum,
						reln->smgr_rnode.tblNode,
						reln->smgr_rnode.relNode)));
496 497
}

498
/*
N
Neil Conway 已提交
499
 *	smgrnblocks() -- Calculate the number of blocks in the
500
 *					 supplied relation.
501
 *
502 503
 *		Returns the number of blocks on success, aborts the current
 *		transaction on failure.
504
 */
505
BlockNumber
506
smgrnblocks(SMgrRelation reln)
507
{
508
	BlockNumber nblocks;
509

510
	nblocks = (*(smgrsw[reln->smgr_which].smgr_nblocks)) (reln);
511

512 513 514 515 516 517 518
	/*
	 * NOTE: if a relation ever did grow to 2^32-1 blocks, this code would
	 * fail --- but that's a good thing, because it would stop us from
	 * extending the rel another block and having a block whose number
	 * actually is InvalidBlockNumber.
	 */
	if (nblocks == InvalidBlockNumber)
519 520
		ereport(ERROR,
				(errcode_for_file_access(),
521 522 523
				 errmsg("could not count blocks of relation %u/%u: %m",
						reln->smgr_rnode.tblNode,
						reln->smgr_rnode.relNode)));
524 525

	return nblocks;
526 527
}

528
/*
N
Neil Conway 已提交
529 530
 *	smgrtruncate() -- Truncate supplied relation to the specified number
 *					  of blocks
531
 *
532 533
 *		Returns the number of blocks on success, aborts the current
 *		transaction on failure.
534
 */
535
BlockNumber
536
smgrtruncate(SMgrRelation reln, BlockNumber nblocks, bool isTemp)
537
{
538
	BlockNumber newblks;
539

540 541 542 543 544 545 546
	/*
	 * Tell the free space map to forget anything it may have stored
	 * for the about-to-be-deleted blocks.	We want to be sure it
	 * won't return bogus block numbers later on.
	 */
	FreeSpaceMapTruncateRel(&reln->smgr_rnode, nblocks);

547
	/* Do the truncation */
548 549
	newblks = (*(smgrsw[reln->smgr_which].smgr_truncate)) (reln, nblocks,
														   isTemp);
550 551 552 553 554 555 556
	if (newblks == InvalidBlockNumber)
		ereport(ERROR,
				(errcode_for_file_access(),
				 errmsg("could not truncate relation %u/%u to %u blocks: %m",
						reln->smgr_rnode.tblNode,
						reln->smgr_rnode.relNode,
						nblocks)));
557

558 559 560 561 562 563 564 565 566 567 568
	if (!isTemp)
	{
		/*
		 * Make a non-transactional XLOG entry showing the file truncation.
		 * It's non-transactional because we should replay it whether the
		 * transaction commits or not; the underlying file change is certainly
		 * not reversible.
		 */
		XLogRecPtr		lsn;
		XLogRecData		rdata;
		xl_smgr_truncate xlrec;
569

570 571
		xlrec.blkno = newblks;
		xlrec.rnode = reln->smgr_rnode;
572

573 574 575 576 577 578 579 580
		rdata.buffer = InvalidBuffer;
		rdata.data = (char *) &xlrec;
		rdata.len = sizeof(xlrec);
		rdata.next = NULL;

		lsn = XLogInsert(RM_SMGR_ID, XLOG_SMGR_TRUNCATE | XLOG_NO_TRAN,
						 &rdata);
	}
581

582
	return newblks;
583 584
}

585
/*
N
Neil Conway 已提交
586
 *	smgrDoPendingDeletes() -- Take care of relation deletes at end of xact.
587
 */
588
void
589 590 591 592 593 594 595 596
smgrDoPendingDeletes(bool isCommit)
{
	while (pendingDeletes != NULL)
	{
		PendingRelDelete *pending = pendingDeletes;

		pendingDeletes = pending->next;
		if (pending->atCommit == isCommit)
597 598 599 600
			smgr_internal_unlink(pending->relnode,
								 pending->which,
								 pending->isTemp,
								 false);
601 602 603 604
		pfree(pending);
	}
}

605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637 638 639
/*
 * smgrGetPendingDeletes() -- Get a list of relations to be deleted.
 *
 * Collects the RelFileNodes of all pending-delete entries whose atCommit
 * flag equals forCommit.  The count of such entries is returned, and *ptr
 * receives a freshly palloc'd array holding them in list order.  When
 * nothing matches, *ptr is set to NULL and zero is returned.  The pending
 * list itself is left unchanged.
 */
int
smgrGetPendingDeletes(bool forCommit, RelFileNode **ptr)
{
	PendingRelDelete *item;
	RelFileNode *result;
	int			count = 0;
	int			filled = 0;

	/* First pass: find out how many entries qualify */
	for (item = pendingDeletes; item != NULL; item = item->next)
	{
		if (item->atCommit == forCommit)
			count++;
	}

	if (count == 0)
	{
		*ptr = NULL;
		return 0;
	}

	/* Second pass: copy the qualifying entries into the output array */
	result = (RelFileNode *) palloc(count * sizeof(RelFileNode));
	*ptr = result;
	for (item = pendingDeletes; item != NULL; item = item->next)
	{
		if (item->atCommit == forCommit)
			result[filled++] = item->relnode;
	}

	return count;
}

640
/*
641 642 643
 *	smgrcommit() -- Prepare to commit changes made during the current
 *					transaction.
 *
N
Neil Conway 已提交
644
 *		This is called before we actually commit.
645
 */
646
void
647
smgrcommit(void)
648
{
649
	int			i;
650 651 652 653 654

	for (i = 0; i < NSmgr; i++)
	{
		if (smgrsw[i].smgr_commit)
		{
655
			if (! (*(smgrsw[i].smgr_commit)) ())
656
				elog(ERROR, "transaction commit failed on %s: %m",
657
					 DatumGetCString(DirectFunctionCall1(smgrout,
B
Bruce Momjian 已提交
658
													 Int16GetDatum(i))));
659
		}
660 661 662
	}
}

663 664 665
/*
 *	smgrabort() -- Abort changes made during the current transaction.
 */
666
void
667
smgrabort(void)
668
{
669
	int			i;
670 671 672 673 674

	for (i = 0; i < NSmgr; i++)
	{
		if (smgrsw[i].smgr_abort)
		{
675
			if (! (*(smgrsw[i].smgr_abort)) ())
676
				elog(ERROR, "transaction abort failed on %s: %m",
677
					 DatumGetCString(DirectFunctionCall1(smgrout,
B
Bruce Momjian 已提交
678
													 Int16GetDatum(i))));
679
		}
680 681
	}
}
682

683
/*
N
Neil Conway 已提交
684
 *	smgrsync() -- Sync files to disk at checkpoint time.
685
 */
686
void
687
smgrsync(void)
V
WAL  
Vadim B. Mikheev 已提交
688 689 690 691 692 693 694
{
	int			i;

	for (i = 0; i < NSmgr; i++)
	{
		if (smgrsw[i].smgr_sync)
		{
695
			if (! (*(smgrsw[i].smgr_sync)) ())
696
				elog(ERROR, "storage sync failed on %s: %m",
V
WAL  
Vadim B. Mikheev 已提交
697
					 DatumGetCString(DirectFunctionCall1(smgrout,
B
Bruce Momjian 已提交
698
													 Int16GetDatum(i))));
V
WAL  
Vadim B. Mikheev 已提交
699 700 701 702
		}
	}
}

V
WAL  
Vadim B. Mikheev 已提交
703 704 705 706

/*
 *	smgr_redo() -- Replay an smgr XLOG record.
 *
 * XLOG_SMGR_CREATE records re-create the relation's storage through
 * smgrcreate() in redo mode.  XLOG_SMGR_TRUNCATE records repeat the
 * truncation; a failure there is only a WARNING.  Any other op code is
 * a PANIC.  The "lsn" argument is not used.
 */
void
smgr_redo(XLogRecPtr lsn, XLogRecord *record)
{
	uint8		info = record->xl_info & ~XLR_INFO_MASK;

	if (info == XLOG_SMGR_CREATE)
	{
		xl_smgr_create *xlrec = (xl_smgr_create *) XLogRecGetData(record);
		SMgrRelation reln;

		reln = smgropen(xlrec->rnode);
		smgrcreate(reln, false, true);
	}
	else if (info == XLOG_SMGR_TRUNCATE)
	{
		xl_smgr_truncate *xlrec = (xl_smgr_truncate *) XLogRecGetData(record);
		SMgrRelation reln;
		BlockNumber newblks;

		reln = smgropen(xlrec->rnode);

		/*
		 * First, force bufmgr to drop any buffers it has for the to-be-
		 * truncated blocks.  We must do this, else subsequent XLogReadBuffer
		 * operations will not re-extend the file properly.
		 */
		DropRelFileNodeBuffers(xlrec->rnode, false, xlrec->blkno);

		/* Can't use smgrtruncate because it would try to xlog */

		/*
		 * Tell the free space map to forget anything it may have stored
		 * for the about-to-be-deleted blocks.  We want to be sure it
		 * won't return bogus block numbers later on.
		 */
		FreeSpaceMapTruncateRel(&reln->smgr_rnode, xlrec->blkno);

		/* Do the truncation */
		newblks = (*(smgrsw[reln->smgr_which].smgr_truncate)) (reln,
															   xlrec->blkno,
															   false);
		if (newblks == InvalidBlockNumber)
			ereport(WARNING,
					(errcode_for_file_access(),
					 errmsg("could not truncate relation %u/%u to %u blocks: %m",
							reln->smgr_rnode.tblNode,
							reln->smgr_rnode.relNode,
							xlrec->blkno)));
	}
	else
		elog(PANIC, "smgr_redo: unknown op code %u", info);
}

/*
 *	smgr_undo() -- Undo an smgr XLOG record.
 *
 * Always PANICs: both record types written by this file are flagged
 * XLOG_NO_TRAN, so there is never anything to undo.  Neither argument
 * is examined.
 */
void
smgr_undo(XLogRecPtr lsn, XLogRecord *record)
{
	/* Since we have no transactional WAL entries, should never undo */
	elog(PANIC, "smgr_undo: cannot undo");
}
B
Bruce Momjian 已提交
763

V
WAL  
Vadim B. Mikheev 已提交
764
void
B
Bruce Momjian 已提交
765
smgr_desc(char *buf, uint8 xl_info, char *rec)
V
WAL  
Vadim B. Mikheev 已提交
766
{
767 768 769 770 771 772 773 774 775 776 777 778 779 780 781 782 783 784 785
	uint8		info = xl_info & ~XLR_INFO_MASK;

	if (info == XLOG_SMGR_CREATE)
	{
		xl_smgr_create *xlrec = (xl_smgr_create *) rec;

		sprintf(buf + strlen(buf), "file create: %u/%u",
				xlrec->rnode.tblNode, xlrec->rnode.relNode);
	}
	else if (info == XLOG_SMGR_TRUNCATE)
	{
		xl_smgr_truncate *xlrec = (xl_smgr_truncate *) rec;

		sprintf(buf + strlen(buf), "file truncate: %u/%u to %u blocks",
				xlrec->rnode.tblNode, xlrec->rnode.relNode,
				xlrec->blkno);
	}
	else
		strcat(buf, "UNKNOWN");
V
WAL  
Vadim B. Mikheev 已提交
786
}