pg_backup_tar.c 28.5 KB
Newer Older
P
Philip Warner 已提交
1 2 3 4 5 6 7 8 9 10
/*-------------------------------------------------------------------------
 *
 * pg_backup_tar.c
 *
 *	This file is copied from the 'files' format file, but dumps data into
 *	one temp file then sends it to the output TAR archive.
 *
 *	See the headers to pg_backup_files & pg_restore for more details.
 *
 * Copyright (c) 2000, Philip Warner
B
Bruce Momjian 已提交
11 12
 *		Rights are granted to use this software in any way so long
 *		as this notice is not removed.
P
Philip Warner 已提交
13 14 15 16 17 18
 *
 *	The author is not responsible for loss or damages that may
 *	result from it's use.
 *
 *
 * IDENTIFICATION
19
 *		$PostgreSQL: pgsql/src/bin/pg_dump/pg_backup_tar.c,v 1.48 2005/06/22 02:00:47 neilc Exp $
20
 *
P
Philip Warner 已提交
21 22 23
 *-------------------------------------------------------------------------
 */

24 25 26 27
#include "pg_backup.h"
#include "pg_backup_archiver.h"
#include "pg_backup_tar.h"

P
Philip Warner 已提交
28
#include <ctype.h>
29
#include <limits.h>
P
Philip Warner 已提交
30 31
#include <unistd.h>

B
Bruce Momjian 已提交
32 33
static void _ArchiveEntry(ArchiveHandle *AH, TocEntry *te);
static void _StartData(ArchiveHandle *AH, TocEntry *te);
B
Bruce Momjian 已提交
34
static size_t _WriteData(ArchiveHandle *AH, const void *data, size_t dLen);
B
Bruce Momjian 已提交
35 36 37
static void _EndData(ArchiveHandle *AH, TocEntry *te);
static int	_WriteByte(ArchiveHandle *AH, const int i);
static int	_ReadByte(ArchiveHandle *);
B
Bruce Momjian 已提交
38 39
static size_t _WriteBuf(ArchiveHandle *AH, const void *buf, size_t len);
static size_t _ReadBuf(ArchiveHandle *AH, void *buf, size_t len);
B
Bruce Momjian 已提交
40 41 42 43 44 45 46
static void _CloseArchive(ArchiveHandle *AH);
static void _PrintTocData(ArchiveHandle *AH, TocEntry *te, RestoreOptions *ropt);
static void _WriteExtraToc(ArchiveHandle *AH, TocEntry *te);
static void _ReadExtraToc(ArchiveHandle *AH, TocEntry *te);
static void _PrintExtraToc(ArchiveHandle *AH, TocEntry *te);

static void _StartBlobs(ArchiveHandle *AH, TocEntry *te);
47 48
static void _StartBlob(ArchiveHandle *AH, TocEntry *te, Oid oid);
static void _EndBlob(ArchiveHandle *AH, TocEntry *te, Oid oid);
B
Bruce Momjian 已提交
49
static void _EndBlobs(ArchiveHandle *AH, TocEntry *te);
P
Philip Warner 已提交
50 51 52 53 54

#define K_STD_BUF_SIZE 1024


#ifdef HAVE_LIBZ
B
Bruce Momjian 已提交
55 56 57
 /* typedef gzFile	 ThingFile; */
typedef FILE ThingFile;

P
Philip Warner 已提交
58
#else
B
Bruce Momjian 已提交
59
typedef FILE ThingFile;
P
Philip Warner 已提交
60 61
#endif

B
Bruce Momjian 已提交
62 63 64 65 66 67 68 69
typedef struct
{
	ThingFile  *zFH;
	FILE	   *nFH;
	FILE	   *tarFH;
	FILE	   *tmpFH;
	char	   *targetFile;
	char		mode;
P
Peter Eisentraut 已提交
70 71
	off_t		pos;
	off_t		fileLen;
B
Bruce Momjian 已提交
72
	ArchiveHandle *AH;
P
Philip Warner 已提交
73 74
} TAR_MEMBER;

75 76 77 78 79 80 81 82 83 84 85
/*
 * Maximum file size for a tar member: The limit inherent in the
 * format is 2^33-1 bytes (nearly 8 GB).  But we don't want to exceed
 * what we can represent by an off_t.
 */
#ifdef INT64_IS_BUSTED
#define MAX_TAR_MEMBER_FILELEN INT_MAX
#else
#define MAX_TAR_MEMBER_FILELEN (((int64) 1 << Min(33, sizeof(off_t)*8 - 1)) - 1)
#endif

B
Bruce Momjian 已提交
86 87
typedef struct
{
P
Philip Warner 已提交
88
	int			hasSeek;
P
Peter Eisentraut 已提交
89
	off_t		filePos;
B
Bruce Momjian 已提交
90 91
	TAR_MEMBER *blobToc;
	FILE	   *tarFH;
P
Peter Eisentraut 已提交
92 93
	off_t		tarFHpos;
	off_t		tarNextMember;
B
Bruce Momjian 已提交
94
	TAR_MEMBER *FH;
P
Philip Warner 已提交
95
	int			isSpecialScript;
B
Bruce Momjian 已提交
96
	TAR_MEMBER *scriptTH;
P
Philip Warner 已提交
97 98
} lclContext;

B
Bruce Momjian 已提交
99 100 101 102
typedef struct
{
	TAR_MEMBER *TH;
	char	   *filename;
P
Philip Warner 已提交
103 104
} lclTocEntry;

105
static char *modulename = gettext_noop("tar archiver");
B
Bruce Momjian 已提交
106 107

static void _LoadBlobs(ArchiveHandle *AH, RestoreOptions *ropt);
P
Philip Warner 已提交
108

B
Bruce Momjian 已提交
109 110
static TAR_MEMBER *tarOpen(ArchiveHandle *AH, const char *filename, char mode);
static void tarClose(ArchiveHandle *AH, TAR_MEMBER *TH);
P
Philip Warner 已提交
111 112

#ifdef __NOT_USED__
P
Peter Eisentraut 已提交
113
static char *tarGets(char *buf, size_t len, TAR_MEMBER *th);
P
Philip Warner 已提交
114
#endif
B
Bruce Momjian 已提交
115
static int	tarPrintf(ArchiveHandle *AH, TAR_MEMBER *th, const char *fmt,...);
P
Philip Warner 已提交
116

B
Bruce Momjian 已提交
117 118 119
static void _tarAddFile(ArchiveHandle *AH, TAR_MEMBER *th);
static int	_tarChecksum(char *th);
static TAR_MEMBER *_tarPositionTo(ArchiveHandle *AH, const char *filename);
B
Bruce Momjian 已提交
120 121
static size_t tarRead(void *buf, size_t len, TAR_MEMBER *th);
static size_t tarWrite(const void *buf, size_t len, TAR_MEMBER *th);
B
Bruce Momjian 已提交
122 123
static void _tarWriteHeader(TAR_MEMBER *th);
static int	_tarGetHeader(ArchiveHandle *AH, TAR_MEMBER *th);
B
Bruce Momjian 已提交
124
static size_t _tarReadRaw(ArchiveHandle *AH, void *buf, size_t len, TAR_MEMBER *th, FILE *fh);
P
Philip Warner 已提交
125

B
Bruce Momjian 已提交
126
static size_t _scriptOut(ArchiveHandle *AH, const void *buf, size_t len);
P
Philip Warner 已提交
127 128

/*
B
Bruce Momjian 已提交
129
 *	Initializer
P
Philip Warner 已提交
130
 */
B
Bruce Momjian 已提交
131 132
void
InitArchiveFmt_Tar(ArchiveHandle *AH)
P
Philip Warner 已提交
133
{
B
Bruce Momjian 已提交
134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158
	lclContext *ctx;

	/* Assuming static functions, this can be copied for each format. */
	AH->ArchiveEntryPtr = _ArchiveEntry;
	AH->StartDataPtr = _StartData;
	AH->WriteDataPtr = _WriteData;
	AH->EndDataPtr = _EndData;
	AH->WriteBytePtr = _WriteByte;
	AH->ReadBytePtr = _ReadByte;
	AH->WriteBufPtr = _WriteBuf;
	AH->ReadBufPtr = _ReadBuf;
	AH->ClosePtr = _CloseArchive;
	AH->PrintTocDataPtr = _PrintTocData;
	AH->ReadExtraTocPtr = _ReadExtraToc;
	AH->WriteExtraTocPtr = _WriteExtraToc;
	AH->PrintExtraTocPtr = _PrintExtraToc;

	AH->StartBlobsPtr = _StartBlobs;
	AH->StartBlobPtr = _StartBlob;
	AH->EndBlobPtr = _EndBlob;
	AH->EndBlobsPtr = _EndBlobs;

	/*
	 * Set up some special context used in compressing data.
	 */
159
	ctx = (lclContext *) calloc(1, sizeof(lclContext));
B
Bruce Momjian 已提交
160 161
	AH->formatData = (void *) ctx;
	ctx->filePos = 0;
162
	ctx->isSpecialScript = 0;
B
Bruce Momjian 已提交
163

164 165
	/* Initialize LO buffering */
	AH->lo_buf_size = LOBBUFSIZE;
B
Bruce Momjian 已提交
166
	AH->lo_buf = (void *) malloc(LOBBUFSIZE);
P
Peter Eisentraut 已提交
167 168
	if (AH->lo_buf == NULL)
		die_horribly(AH, modulename, "out of memory\n");
B
Bruce Momjian 已提交
169 170 171 172 173 174 175 176

	/*
	 * Now open the TOC file
	 */
	if (AH->mode == archModeWrite)
	{

		if (AH->fSpec && strcmp(AH->fSpec, "") != 0)
P
Philip Warner 已提交
177
			ctx->tarFH = fopen(AH->fSpec, PG_BINARY_W);
B
Bruce Momjian 已提交
178
		else
P
Philip Warner 已提交
179
			ctx->tarFH = stdout;
180

B
Bruce Momjian 已提交
181
		if (ctx->tarFH == NULL)
182
			die_horribly(NULL, modulename,
183
			"could not open TOC file for output: %s\n", strerror(errno));
184

P
Philip Warner 已提交
185 186
		ctx->tarFHpos = 0;

B
Bruce Momjian 已提交
187 188 189 190
		/*
		 * Make unbuffered since we will dup() it, and the buffers screw
		 * each other
		 */
191
		/* setvbuf(ctx->tarFH, NULL, _IONBF, 0); */
P
Philip Warner 已提交
192

193
		ctx->hasSeek = checkSeek(ctx->tarFH);
P
Philip Warner 已提交
194

B
Bruce Momjian 已提交
195
		if (AH->compression < 0 || AH->compression > 9)
P
Philip Warner 已提交
196 197 198 199 200 201
			AH->compression = Z_DEFAULT_COMPRESSION;

		/* Don't compress into tar files unless asked to do so */
		if (AH->compression == Z_DEFAULT_COMPRESSION)
			AH->compression = 0;

B
Bruce Momjian 已提交
202 203 204 205
		/*
		 * We don't support compression because reading the files back is
		 * not possible since gzdopen uses buffered IO which totally
		 * screws file positioning.
P
Philip Warner 已提交
206 207
		 */
		if (AH->compression != 0)
208
			die_horribly(NULL, modulename, "compression not supported by tar output format\n");
P
Philip Warner 已提交
209

B
Bruce Momjian 已提交
210 211 212
	}
	else
	{							/* Read Mode */
P
Philip Warner 已提交
213

B
Bruce Momjian 已提交
214
		if (AH->fSpec && strcmp(AH->fSpec, "") != 0)
P
Philip Warner 已提交
215
			ctx->tarFH = fopen(AH->fSpec, PG_BINARY_R);
B
Bruce Momjian 已提交
216
		else
P
Philip Warner 已提交
217 218
			ctx->tarFH = stdin;

219
		if (ctx->tarFH == NULL)
220
			die_horribly(NULL, modulename, "could not open TOC file for input: %s\n", strerror(errno));
221

B
Bruce Momjian 已提交
222 223 224 225
		/*
		 * Make unbuffered since we will dup() it, and the buffers screw
		 * each other
		 */
226
		/* setvbuf(ctx->tarFH, NULL, _IONBF, 0); */
P
Philip Warner 已提交
227 228 229

		ctx->tarFHpos = 0;

230
		ctx->hasSeek = checkSeek(ctx->tarFH);
P
Philip Warner 已提交
231

B
Bruce Momjian 已提交
232 233 234 235
		/*
		 * Forcibly unmark the header as read since we use the lookahead
		 * buffer
		 */
P
Philip Warner 已提交
236 237
		AH->readHeader = 0;

B
Bruce Momjian 已提交
238
		ctx->FH = (void *) tarOpen(AH, "toc.dat", 'r');
P
Philip Warner 已提交
239 240
		ReadHead(AH);
		ReadToc(AH);
B
Bruce Momjian 已提交
241 242
		tarClose(AH, ctx->FH);	/* Nothing else in the file... */
	}
P
Philip Warner 已提交
243 244 245 246
}

/*
 * - Start a new TOC entry
B
Bruce Momjian 已提交
247
 *	 Setup the output file name.
P
Philip Warner 已提交
248
 */
B
Bruce Momjian 已提交
249 250
static void
_ArchiveEntry(ArchiveHandle *AH, TocEntry *te)
P
Philip Warner 已提交
251
{
B
Bruce Momjian 已提交
252 253
	lclTocEntry *ctx;
	char		fn[K_STD_BUF_SIZE];
P
Philip Warner 已提交
254

255
	ctx = (lclTocEntry *) calloc(1, sizeof(lclTocEntry));
256
	if (te->dataDumper != NULL)
B
Bruce Momjian 已提交
257
	{
P
Philip Warner 已提交
258
#ifdef HAVE_LIBZ
B
Bruce Momjian 已提交
259
		if (AH->compression == 0)
260
			sprintf(fn, "%d.dat", te->dumpId);
B
Bruce Momjian 已提交
261
		else
262
			sprintf(fn, "%d.dat.gz", te->dumpId);
P
Philip Warner 已提交
263
#else
264
		sprintf(fn, "%d.dat", te->dumpId);
P
Philip Warner 已提交
265 266
#endif
		ctx->filename = strdup(fn);
B
Bruce Momjian 已提交
267 268 269
	}
	else
	{
P
Philip Warner 已提交
270 271
		ctx->filename = NULL;
		ctx->TH = NULL;
B
Bruce Momjian 已提交
272 273
	}
	te->formatData = (void *) ctx;
P
Philip Warner 已提交
274 275
}

B
Bruce Momjian 已提交
276 277
static void
_WriteExtraToc(ArchiveHandle *AH, TocEntry *te)
P
Philip Warner 已提交
278
{
B
Bruce Momjian 已提交
279
	lclTocEntry *ctx = (lclTocEntry *) te->formatData;
P
Philip Warner 已提交
280

B
Bruce Momjian 已提交
281
	if (ctx->filename)
P
Philip Warner 已提交
282
		WriteStr(AH, ctx->filename);
B
Bruce Momjian 已提交
283
	else
P
Philip Warner 已提交
284 285 286
		WriteStr(AH, "");
}

B
Bruce Momjian 已提交
287 288
static void
_ReadExtraToc(ArchiveHandle *AH, TocEntry *te)
P
Philip Warner 已提交
289
{
B
Bruce Momjian 已提交
290
	lclTocEntry *ctx = (lclTocEntry *) te->formatData;
P
Philip Warner 已提交
291

B
Bruce Momjian 已提交
292 293
	if (ctx == NULL)
	{
294
		ctx = (lclTocEntry *) calloc(1, sizeof(lclTocEntry));
B
Bruce Momjian 已提交
295 296
		te->formatData = (void *) ctx;
	}
P
Philip Warner 已提交
297

B
Bruce Momjian 已提交
298 299 300
	ctx->filename = ReadStr(AH);
	if (strlen(ctx->filename) == 0)
	{
P
Philip Warner 已提交
301 302
		free(ctx->filename);
		ctx->filename = NULL;
B
Bruce Momjian 已提交
303 304
	}
	ctx->TH = NULL;
P
Philip Warner 已提交
305 306
}

B
Bruce Momjian 已提交
307 308
static void
_PrintExtraToc(ArchiveHandle *AH, TocEntry *te)
P
Philip Warner 已提交
309
{
B
Bruce Momjian 已提交
310
	lclTocEntry *ctx = (lclTocEntry *) te->formatData;
P
Philip Warner 已提交
311

312
	if (AH->public.verbose && ctx->filename != NULL)
313
		ahprintf(AH, "-- File: %s\n", ctx->filename);
P
Philip Warner 已提交
314 315
}

B
Bruce Momjian 已提交
316 317
static void
_StartData(ArchiveHandle *AH, TocEntry *te)
P
Philip Warner 已提交
318
{
B
Bruce Momjian 已提交
319
	lclTocEntry *tctx = (lclTocEntry *) te->formatData;
P
Philip Warner 已提交
320 321 322 323

	tctx->TH = tarOpen(AH, tctx->filename, 'w');
}

B
Bruce Momjian 已提交
324 325
static TAR_MEMBER *
tarOpen(ArchiveHandle *AH, const char *filename, char mode)
P
Philip Warner 已提交
326
{
B
Bruce Momjian 已提交
327 328 329
	lclContext *ctx = (lclContext *) AH->formatData;
	TAR_MEMBER *tm;

P
Philip Warner 已提交
330
#ifdef HAVE_LIBZ
B
Bruce Momjian 已提交
331
	char		fmode[10];
P
Philip Warner 已提交
332 333 334 335 336
#endif

	if (mode == 'r')
	{
		tm = _tarPositionTo(AH, filename);
B
Bruce Momjian 已提交
337
		if (!tm)				/* Not found */
P
Philip Warner 已提交
338
		{
B
Bruce Momjian 已提交
339 340
			if (filename)		/* Couldn't find the requested file.
								 * Future: DO SEEK(0) and retry. */
341
				die_horribly(AH, modulename, "could not find file %s in archive\n", filename);
B
Bruce Momjian 已提交
342
			else
343
				/* Any file OK, non left, so return NULL */
P
Philip Warner 已提交
344 345 346 347 348 349 350 351
				return NULL;
		}

#ifdef HAVE_LIBZ

		if (AH->compression == 0)
			tm->nFH = ctx->tarFH;
		else
352
			die_horribly(AH, modulename, "compression support is disabled in this format\n");
B
Bruce Momjian 已提交
353
		/* tm->zFH = gzdopen(dup(fileno(ctx->tarFH)), "rb"); */
P
Philip Warner 已提交
354 355 356 357 358

#else
		tm->nFH = ctx->tarFH;
#endif

B
Bruce Momjian 已提交
359 360 361
	}
	else
	{
P
Philip Warner 已提交
362 363 364 365
		tm = calloc(1, sizeof(TAR_MEMBER));

		tm->tmpFH = tmpfile();

B
Bruce Momjian 已提交
366
		if (tm->tmpFH == NULL)
367
			die_horribly(AH, modulename, "could not generate temporary file name: %s\n", strerror(errno));
368

P
Philip Warner 已提交
369 370 371 372 373 374
#ifdef HAVE_LIBZ

		if (AH->compression != 0)
		{
			sprintf(fmode, "wb%d", AH->compression);
			tm->zFH = gzdopen(dup(fileno(tm->tmpFH)), fmode);
375
			if (tm->zFH == NULL)
376
				die_horribly(AH, modulename, "could not open temporary file\n");
377

B
Bruce Momjian 已提交
378 379
		}
		else
P
Philip Warner 已提交
380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397
			tm->nFH = tm->tmpFH;

#else

		tm->nFH = tm->tmpFH;
#endif

		tm->AH = AH;
		tm->targetFile = strdup(filename);
	}

	tm->mode = mode;
	tm->tarFH = ctx->tarFH;

	return tm;

}

B
Bruce Momjian 已提交
398 399
static void
tarClose(ArchiveHandle *AH, TAR_MEMBER *th)
P
Philip Warner 已提交
400 401 402 403 404
{
	/*
	 * Close the GZ file since we dup'd. This will flush the buffers.
	 */
	if (AH->compression != 0)
405
		if (GZCLOSE(th->zFH) != 0)
406
			die_horribly(AH, modulename, "could not close tar member\n");
P
Philip Warner 已提交
407 408

	if (th->mode == 'w')
B
Bruce Momjian 已提交
409 410 411 412 413
		_tarAddFile(AH, th);	/* This will close the temp file */

	/*
	 * else Nothing to do for normal read since we don't dup() normal file
	 * handle, and we don't use temp files.
P
Philip Warner 已提交
414 415
	 */

B
Bruce Momjian 已提交
416
	if (th->targetFile)
P
Philip Warner 已提交
417 418 419 420 421 422 423
		free(th->targetFile);

	th->nFH = NULL;
	th->zFH = NULL;
}

#ifdef __NOT_USED__
B
Bruce Momjian 已提交
424
static char *
P
Peter Eisentraut 已提交
425
tarGets(char *buf, size_t len, TAR_MEMBER *th)
P
Philip Warner 已提交
426
{
B
Bruce Momjian 已提交
427
	char	   *s;
P
Peter Eisentraut 已提交
428
	size_t		cnt = 0;
B
Bruce Momjian 已提交
429 430
	char		c = ' ';
	int			eof = 0;
P
Philip Warner 已提交
431 432 433 434 435 436 437

	/* Can't read past logical EOF */
	if (len > (th->fileLen - th->pos))
		len = th->fileLen - th->pos;

	while (cnt < len && c != '\n')
	{
B
Bruce Momjian 已提交
438 439
		if (_tarReadRaw(th->AH, &c, 1, th, NULL) <= 0)
		{
P
Philip Warner 已提交
440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455
			eof = 1;
			break;
		}
		buf[cnt++] = c;
	}

	if (eof && cnt == 0)
		s = NULL;
	else
	{
		buf[cnt++] = '\0';
		s = buf;
	}

	if (s)
	{
B
Bruce Momjian 已提交
456
		len = strlen(s);
P
Philip Warner 已提交
457 458 459 460 461 462 463
		th->pos += len;
	}

	return s;
}
#endif

B
Bruce Momjian 已提交
464
/*
P
Philip Warner 已提交
465 466 467
 * Just read bytes from the archive. This is the low level read routine
 * that is used for ALL reads on a tar file.
 */
P
Peter Eisentraut 已提交
468 469
static size_t
_tarReadRaw(ArchiveHandle *AH, void *buf, size_t len, TAR_MEMBER *th, FILE *fh)
P
Philip Warner 已提交
470
{
B
Bruce Momjian 已提交
471
	lclContext *ctx = (lclContext *) AH->formatData;
P
Peter Eisentraut 已提交
472 473 474
	size_t		avail;
	size_t		used = 0;
	size_t		res = 0;
P
Philip Warner 已提交
475 476 477 478 479

	avail = AH->lookaheadLen - AH->lookaheadPos;
	if (avail > 0)
	{
		/* We have some lookahead bytes to use */
B
Bruce Momjian 已提交
480
		if (avail >= len)		/* Just use the lookahead buffer */
P
Philip Warner 已提交
481 482 483 484 485 486 487 488 489 490 491 492 493 494 495 496
			used = len;
		else
			used = avail;

		/* Copy, and adjust buffer pos */
		memcpy(buf, AH->lookahead, used);
		AH->lookaheadPos += used;

		/* Adjust required length */
		len -= used;
	}

	/* Read the file if len > 0 */
	if (len > 0)
	{
		if (fh)
B
Bruce Momjian 已提交
497
			res = fread(&((char *) buf)[used], 1, len, fh);
P
Philip Warner 已提交
498 499 500
		else if (th)
		{
			if (th->zFH)
B
Bruce Momjian 已提交
501
				res = GZREAD(&((char *) buf)[used], 1, len, th->zFH);
P
Philip Warner 已提交
502
			else
B
Bruce Momjian 已提交
503 504
				res = fread(&((char *) buf)[used], 1, len, th->nFH);
		}
P
Philip Warner 已提交
505
		else
506
			die_horribly(AH, modulename, "internal error -- neither th nor fh specified in tarReadRaw()\n");
P
Philip Warner 已提交
507 508
	}

509 510 511 512
#if 0
	write_msg(modulename, "requested %d bytes, got %d from lookahead and %d from file\n",
			  reqLen, used, res);
#endif
P
Philip Warner 已提交
513 514 515 516 517

	ctx->tarFHpos += res + used;

	return (res + used);
}
B
Bruce Momjian 已提交
518

P
Peter Eisentraut 已提交
519 520
static size_t
tarRead(void *buf, size_t len, TAR_MEMBER *th)
P
Philip Warner 已提交
521
{
P
Peter Eisentraut 已提交
522
	size_t		res;
P
Philip Warner 已提交
523 524 525 526 527 528 529 530 531 532 533 534 535 536

	if (th->pos + len > th->fileLen)
		len = th->fileLen - th->pos;

	if (len <= 0)
		return 0;

	res = _tarReadRaw(th->AH, buf, len, th, NULL);

	th->pos += res;

	return res;
}

P
Peter Eisentraut 已提交
537 538
static size_t
tarWrite(const void *buf, size_t len, TAR_MEMBER *th)
P
Philip Warner 已提交
539
{
P
Peter Eisentraut 已提交
540
	size_t		res;
P
Philip Warner 已提交
541 542

	if (th->zFH != 0)
B
Bruce Momjian 已提交
543
		res = GZWRITE((void *) buf, 1, len, th->zFH);
P
Philip Warner 已提交
544 545 546
	else
		res = fwrite(buf, 1, len, th->nFH);

547
	if (res != len)
548
		die_horribly(th->AH, modulename,
B
Bruce Momjian 已提交
549
			"could not write to tar member (wrote %lu, attempted %lu)\n",
P
Peter Eisentraut 已提交
550
					 (unsigned long) res, (unsigned long) len);
551

P
Philip Warner 已提交
552 553 554 555
	th->pos += res;
	return res;
}

P
Peter Eisentraut 已提交
556 557
static size_t
_WriteData(ArchiveHandle *AH, const void *data, size_t dLen)
P
Philip Warner 已提交
558
{
B
Bruce Momjian 已提交
559
	lclTocEntry *tctx = (lclTocEntry *) AH->currToc->formatData;
P
Philip Warner 已提交
560

B
Bruce Momjian 已提交
561
	dLen = tarWrite((void *) data, dLen, tctx->TH);
P
Philip Warner 已提交
562

B
Bruce Momjian 已提交
563
	return dLen;
P
Philip Warner 已提交
564 565
}

B
Bruce Momjian 已提交
566 567
static void
_EndData(ArchiveHandle *AH, TocEntry *te)
P
Philip Warner 已提交
568
{
B
Bruce Momjian 已提交
569
	lclTocEntry *tctx = (lclTocEntry *) te->formatData;
P
Philip Warner 已提交
570

B
Bruce Momjian 已提交
571 572 573
	/* Close the file */
	tarClose(AH, tctx->TH);
	tctx->TH = NULL;
P
Philip Warner 已提交
574 575
}

B
Bruce Momjian 已提交
576 577
/*
 * Print data for a given file
P
Philip Warner 已提交
578
 */
B
Bruce Momjian 已提交
579 580
static void
_PrintFileData(ArchiveHandle *AH, char *filename, RestoreOptions *ropt)
P
Philip Warner 已提交
581
{
B
Bruce Momjian 已提交
582 583
	lclContext *ctx = (lclContext *) AH->formatData;
	char		buf[4096];
P
Peter Eisentraut 已提交
584
	size_t		cnt;
B
Bruce Momjian 已提交
585
	TAR_MEMBER *th;
P
Philip Warner 已提交
586

B
Bruce Momjian 已提交
587
	if (!filename)
P
Philip Warner 已提交
588 589 590 591 592
		return;

	th = tarOpen(AH, filename, 'r');
	ctx->FH = th;

B
Bruce Momjian 已提交
593 594
	while ((cnt = tarRead(buf, 4095, th)) > 0)
	{
P
Philip Warner 已提交
595 596
		buf[cnt] = '\0';
		ahwrite(buf, 1, cnt, AH);
B
Bruce Momjian 已提交
597
	}
P
Philip Warner 已提交
598

B
Bruce Momjian 已提交
599
	tarClose(AH, th);
P
Philip Warner 已提交
600 601 602 603 604 605
}


/*
 * Print data for a given TOC entry
*/
B
Bruce Momjian 已提交
606 607
static void
_PrintTocData(ArchiveHandle *AH, TocEntry *te, RestoreOptions *ropt)
P
Philip Warner 已提交
608
{
B
Bruce Momjian 已提交
609 610 611
	lclContext *ctx = (lclContext *) AH->formatData;
	lclTocEntry *tctx = (lclTocEntry *) te->formatData;
	char	   *tmpCopy;
P
Peter Eisentraut 已提交
612
	size_t		i,
B
Bruce Momjian 已提交
613 614 615 616
				pos1,
				pos2;

	if (!tctx->filename)
P
Philip Warner 已提交
617 618 619 620 621 622 623 624 625 626 627 628
		return;

	if (ctx->isSpecialScript)
	{
		if (!te->copyStmt)
			return;

		/* Abort the default COPY */
		ahprintf(AH, "\\.\n");

		/* Get a copy of the COPY statement and clean it up */
		tmpCopy = strdup(te->copyStmt);
B
Bruce Momjian 已提交
629
		for (i = 0; i < strlen(tmpCopy); i++)
630
			tmpCopy[i] = pg_tolower((unsigned char) tmpCopy[i]);
P
Philip Warner 已提交
631 632

		/*
B
Bruce Momjian 已提交
633 634
		 * This is very nasty; we don't know if the archive used WITH
		 * OIDS, so we search the string for it in a paranoid sort of way.
P
Philip Warner 已提交
635 636
		 */
		if (strncmp(tmpCopy, "copy ", 5) != 0)
637
			die_horribly(AH, modulename,
638
						 "invalid COPY statement -- could not find \"copy\" in string \"%s\"\n", tmpCopy);
P
Philip Warner 已提交
639 640 641 642

		pos1 = 5;
		for (pos1 = 5; pos1 < strlen(tmpCopy); pos1++)
			if (tmpCopy[pos1] != ' ')
B
Bruce Momjian 已提交
643
				break;
P
Philip Warner 已提交
644 645 646

		if (tmpCopy[pos1] == '"')
			pos1 += 2;
B
Bruce Momjian 已提交
647

648
		pos1 += strlen(te->tag);
P
Philip Warner 已提交
649

B
Bruce Momjian 已提交
650
		for (pos2 = pos1; pos2 < strlen(tmpCopy); pos2++)
P
Philip Warner 已提交
651 652 653 654
			if (strncmp(&tmpCopy[pos2], "from stdin", 10) == 0)
				break;

		if (pos2 >= strlen(tmpCopy))
655
			die_horribly(AH, modulename,
656
						 "invalid COPY statement -- could not find \"from stdin\" in string \"%s\" starting at position %lu\n",
P
Peter Eisentraut 已提交
657
						 tmpCopy, (unsigned long) pos1);
P
Philip Warner 已提交
658

B
Bruce Momjian 已提交
659 660
		ahwrite(tmpCopy, 1, pos2, AH);	/* 'copy "table" [with oids]' */
		ahprintf(AH, " from '$$PATH$$/%s' %s", tctx->filename, &tmpCopy[pos2 + 10]);
P
Philip Warner 已提交
661 662 663 664 665 666 667 668 669 670

		return;
	}

	if (strcmp(te->desc, "BLOBS") == 0)
		_LoadBlobs(AH, ropt);
	else
		_PrintFileData(AH, tctx->filename, ropt);
}

B
Bruce Momjian 已提交
671 672
static void
_LoadBlobs(ArchiveHandle *AH, RestoreOptions *ropt)
P
Philip Warner 已提交
673
{
674
	Oid			oid;
B
Bruce Momjian 已提交
675 676
	lclContext *ctx = (lclContext *) AH->formatData;
	TAR_MEMBER *th;
P
Peter Eisentraut 已提交
677
	size_t		cnt;
B
Bruce Momjian 已提交
678
	char		buf[4096];
P
Philip Warner 已提交
679

680 681
	StartRestoreBlobs(AH);

682
	th = tarOpen(AH, NULL, 'r');	/* Open next file */
P
Philip Warner 已提交
683 684 685 686
	while (th != NULL)
	{
		ctx->FH = th;

687
		if (strncmp(th->targetFile, "blob_", 5) == 0)
P
Philip Warner 已提交
688
		{
689 690 691 692
			oid = atooid(&th->targetFile[5]);
			if (oid != 0)
			{
				ahlog(AH, 1, "restoring large object OID %u\n", oid);
P
Philip Warner 已提交
693

694
				StartRestoreBlob(AH, oid);
P
Philip Warner 已提交
695

696 697 698 699 700 701
				while ((cnt = tarRead(buf, 4095, th)) > 0)
				{
					buf[cnt] = '\0';
					ahwrite(buf, 1, cnt, AH);
				}
				EndRestoreBlob(AH, oid);
P
Philip Warner 已提交
702 703 704 705 706 707 708
			}
		}

		tarClose(AH, th);

		th = tarOpen(AH, NULL, 'r');
	}
709
	EndRestoreBlobs(AH);
P
Philip Warner 已提交
710 711 712
}


B
Bruce Momjian 已提交
713 714
static int
_WriteByte(ArchiveHandle *AH, const int i)
P
Philip Warner 已提交
715
{
B
Bruce Momjian 已提交
716 717 718
	lclContext *ctx = (lclContext *) AH->formatData;
	int			res;
	char		b = i;			/* Avoid endian problems */
P
Philip Warner 已提交
719

B
Bruce Momjian 已提交
720 721
	res = tarWrite(&b, 1, ctx->FH);
	if (res != EOF)
P
Philip Warner 已提交
722
		ctx->filePos += res;
B
Bruce Momjian 已提交
723
	return res;
P
Philip Warner 已提交
724 725
}

B
Bruce Momjian 已提交
726 727
static int
_ReadByte(ArchiveHandle *AH)
P
Philip Warner 已提交
728
{
B
Bruce Momjian 已提交
729 730 731
	lclContext *ctx = (lclContext *) AH->formatData;
	int			res;
	char		c = '\0';
P
Philip Warner 已提交
732

B
Bruce Momjian 已提交
733 734
	res = tarRead(&c, 1, ctx->FH);
	if (res != EOF)
P
Philip Warner 已提交
735
		ctx->filePos += res;
B
Bruce Momjian 已提交
736
	return c;
P
Philip Warner 已提交
737 738
}

P
Peter Eisentraut 已提交
739 740
static size_t
_WriteBuf(ArchiveHandle *AH, const void *buf, size_t len)
P
Philip Warner 已提交
741
{
B
Bruce Momjian 已提交
742
	lclContext *ctx = (lclContext *) AH->formatData;
P
Peter Eisentraut 已提交
743
	size_t		res;
P
Philip Warner 已提交
744

B
Bruce Momjian 已提交
745 746 747
	res = tarWrite((void *) buf, len, ctx->FH);
	ctx->filePos += res;
	return res;
P
Philip Warner 已提交
748 749
}

P
Peter Eisentraut 已提交
750 751
static size_t
_ReadBuf(ArchiveHandle *AH, void *buf, size_t len)
P
Philip Warner 已提交
752
{
B
Bruce Momjian 已提交
753
	lclContext *ctx = (lclContext *) AH->formatData;
P
Peter Eisentraut 已提交
754
	size_t		res;
P
Philip Warner 已提交
755

B
Bruce Momjian 已提交
756 757 758
	res = tarRead(buf, len, ctx->FH);
	ctx->filePos += res;
	return res;
P
Philip Warner 已提交
759 760
}

B
Bruce Momjian 已提交
761 762
static void
_CloseArchive(ArchiveHandle *AH)
P
Philip Warner 已提交
763
{
B
Bruce Momjian 已提交
764 765 766 767 768
	lclContext *ctx = (lclContext *) AH->formatData;
	TAR_MEMBER *th;
	RestoreOptions *ropt;
	int			savVerbose,
				i;
P
Philip Warner 已提交
769

B
Bruce Momjian 已提交
770 771
	if (AH->mode == archModeWrite)
	{
P
Philip Warner 已提交
772 773 774 775 776 777 778
		/*
		 * Write the Header & TOC to the archive FIRST
		 */
		th = tarOpen(AH, "toc.dat", 'w');
		ctx->FH = th;
		WriteHead(AH);
		WriteToc(AH);
B
Bruce Momjian 已提交
779
		tarClose(AH, th);		/* Not needed any more */
P
Philip Warner 已提交
780 781 782 783 784 785

		/*
		 * Now send the data (tables & blobs)
		 */
		WriteDataChunks(AH);

B
Bruce Momjian 已提交
786 787 788
		/*
		 * Now this format wants to append a script which does a full
		 * restore if the files have been extracted.
P
Philip Warner 已提交
789 790 791
		 */
		th = tarOpen(AH, "restore.sql", 'w');
		tarPrintf(AH, th, "create temporary table pgdump_restore_path(p text);\n");
B
Bruce Momjian 已提交
792 793 794 795 796 797 798 799 800 801
		tarPrintf(AH, th, "--\n"
				  "-- NOTE:\n"
				  "--\n"
			 "-- File paths need to be edited. Search for $$PATH$$ and\n"
			  "-- replace it with the path to the directory containing\n"
				  "-- the extracted data files.\n"
				  "--\n"
				  "-- Edit the following to match the path where the\n"
				  "-- tar archive has been extracted.\n"
				  "--\n");
P
Philip Warner 已提交
802 803 804
		tarPrintf(AH, th, "insert into pgdump_restore_path values('/tmp');\n\n");

		AH->CustomOutPtr = _scriptOut;
B
Bruce Momjian 已提交
805

P
Philip Warner 已提交
806 807 808 809 810 811
		ctx->isSpecialScript = 1;
		ctx->scriptTH = th;

		ropt = NewRestoreOptions();
		ropt->dropSchema = 1;
		ropt->compression = 0;
812
		ropt->superuser = NULL;
813
		ropt->suppressDumpWarnings = true;
P
Philip Warner 已提交
814 815 816 817

		savVerbose = AH->public.verbose;
		AH->public.verbose = 0;

B
Bruce Momjian 已提交
818
		RestoreArchive((Archive *) AH, ropt);
P
Philip Warner 已提交
819 820 821 822

		AH->public.verbose = savVerbose;

		tarClose(AH, th);
823 824

		/* Add a block of NULLs since it's de-rigeur. */
B
Bruce Momjian 已提交
825
		for (i = 0; i < 512; i++)
826
		{
827
			if (fputc(0, ctx->tarFH) == EOF)
828
				die_horribly(AH, modulename,
829
				   "could not write null block at end of tar archive\n");
830
		}
B
Bruce Momjian 已提交
831
	}
P
Philip Warner 已提交
832

B
Bruce Momjian 已提交
833
	AH->FH = NULL;
P
Philip Warner 已提交
834 835
}

P
Peter Eisentraut 已提交
836 837
static size_t
_scriptOut(ArchiveHandle *AH, const void *buf, size_t len)
P
Philip Warner 已提交
838
{
B
Bruce Momjian 已提交
839 840
	lclContext *ctx = (lclContext *) AH->formatData;

P
Philip Warner 已提交
841 842 843 844 845 846 847 848
	return tarWrite(buf, len, ctx->scriptTH);
}

/*
 * BLOB support
 */

/*
B
Bruce Momjian 已提交
849
 * Called by the archiver when starting to save all BLOB DATA (not schema).
P
Philip Warner 已提交
850
 * This routine should save whatever format-specific information is needed
B
Bruce Momjian 已提交
851
 * to read the BLOBs back into memory.
P
Philip Warner 已提交
852 853 854 855 856 857
 *
 * It is called just prior to the dumper's DataDumper routine.
 *
 * Optional, but strongly recommended.
 *
 */
B
Bruce Momjian 已提交
858 859
static void
_StartBlobs(ArchiveHandle *AH, TocEntry *te)
P
Philip Warner 已提交
860
{
B
Bruce Momjian 已提交
861 862
	lclContext *ctx = (lclContext *) AH->formatData;
	char		fname[K_STD_BUF_SIZE];
P
Philip Warner 已提交
863 864 865 866 867 868 869 870 871 872 873 874

	sprintf(fname, "blobs.toc");
	ctx->blobToc = tarOpen(AH, fname, 'w');
}

/*
 * Called by the archiver when the dumper calls StartBlob.
 *
 * Mandatory.
 *
 * Must save the passed OID for retrieval at restore-time.
 */
B
Bruce Momjian 已提交
875
static void
876
_StartBlob(ArchiveHandle *AH, TocEntry *te, Oid oid)
P
Philip Warner 已提交
877
{
B
Bruce Momjian 已提交
878 879 880 881
	lclContext *ctx = (lclContext *) AH->formatData;
	lclTocEntry *tctx = (lclTocEntry *) te->formatData;
	char		fname[255];
	char	   *sfx;
P
Philip Warner 已提交
882

B
Bruce Momjian 已提交
883
	if (oid == 0)
884
		die_horribly(AH, modulename, "invalid OID for large object (%u)\n", oid);
P
Philip Warner 已提交
885 886 887 888 889 890

	if (AH->compression != 0)
		sfx = ".gz";
	else
		sfx = "";

891
	sprintf(fname, "blob_%u.dat%s", oid, sfx);
P
Philip Warner 已提交
892

893
	tarPrintf(AH, ctx->blobToc, "%u %s\n", oid, fname);
P
Philip Warner 已提交
894 895 896 897 898 899 900 901 902 903

	tctx->TH = tarOpen(AH, fname, 'w');
}

/*
 * Called by the archiver when the dumper calls EndBlob.
 *
 * Optional.
 *
 */
B
Bruce Momjian 已提交
904
static void
905
_EndBlob(ArchiveHandle *AH, TocEntry *te, Oid oid)
P
Philip Warner 已提交
906
{
B
Bruce Momjian 已提交
907
	lclTocEntry *tctx = (lclTocEntry *) te->formatData;
P
Philip Warner 已提交
908 909 910 911 912

	tarClose(AH, tctx->TH);
}

/*
B
Bruce Momjian 已提交
913
 * Called by the archiver when finishing saving all BLOB DATA.
P
Philip Warner 已提交
914 915 916 917
 *
 * Optional.
 *
 */
B
Bruce Momjian 已提交
918 919
static void
_EndBlobs(ArchiveHandle *AH, TocEntry *te)
P
Philip Warner 已提交
920
{
B
Bruce Momjian 已提交
921 922
	lclContext *ctx = (lclContext *) AH->formatData;

P
Philip Warner 已提交
923
	/* Write out a fake zero OID to mark end-of-blobs. */
B
Bruce Momjian 已提交
924
	/* WriteInt(AH, 0); */
P
Philip Warner 已提交
925 926 927 928 929 930 931 932 933 934 935

	tarClose(AH, ctx->blobToc);
}



/*------------
 * TAR Support
 *------------
 */

B
Bruce Momjian 已提交
936 937
static int
tarPrintf(ArchiveHandle *AH, TAR_MEMBER *th, const char *fmt,...)
P
Philip Warner 已提交
938
{
B
Bruce Momjian 已提交
939
	char	   *p = NULL;
P
Philip Warner 已提交
940
	va_list		ap;
P
Peter Eisentraut 已提交
941
	size_t		bSize = strlen(fmt) + 256;		/* Should be enough */
P
Philip Warner 已提交
942 943
	int			cnt = -1;

B
Bruce Momjian 已提交
944 945 946 947 948 949 950 951 952 953
	/*
	 * This is paranoid: deal with the possibility that vsnprintf is
	 * willing to ignore trailing null
	 */

	/*
	 * or returns > 0 even if string does not fit. It may be the case that
	 * it returns cnt = bufsize
	 */
	while (cnt < 0 || cnt >= (bSize - 1))
954
	{
B
Bruce Momjian 已提交
955 956
		if (p != NULL)
			free(p);
P
Philip Warner 已提交
957
		bSize *= 2;
B
Bruce Momjian 已提交
958
		p = (char *) malloc(bSize);
P
Philip Warner 已提交
959
		if (p == NULL)
960
			die_horribly(AH, modulename, "out of memory\n");
961
		va_start(ap, fmt);
P
Philip Warner 已提交
962
		cnt = vsnprintf(p, bSize, fmt, ap);
963
		va_end(ap);
P
Philip Warner 已提交
964 965 966 967 968 969
	}
	cnt = tarWrite(p, cnt, th);
	free(p);
	return cnt;
}

B
Bruce Momjian 已提交
970 971
static int
_tarChecksum(char *header)
P
Philip Warner 已提交
972
{
B
Bruce Momjian 已提交
973 974 975
	int			i,
				sum;

P
Philip Warner 已提交
976
	sum = 0;
B
Bruce Momjian 已提交
977
	for (i = 0; i < 512; i++)
P
Philip Warner 已提交
978 979
		if (i < 148 || i >= 156)
			sum += 0xFF & header[i];
B
Bruce Momjian 已提交
980
	return sum + 256;			/* Assume 8 blanks in checksum field */
P
Philip Warner 已提交
981 982
}

983
bool
B
Bruce Momjian 已提交
984
isValidTarHeader(char *header)
P
Philip Warner 已提交
985
{
B
Bruce Momjian 已提交
986 987
	int			sum;
	int			chk = _tarChecksum(header);
P
Philip Warner 已提交
988 989 990

	sscanf(&header[148], "%8o", &sum);

991 992 993 994 995 996 997 998 999 1000 1001
	if (sum != chk)
		return false;

	/* POSIX format */
	if (strncmp(&header[257], "ustar00", 7) == 0)
		return true;
	/* older format */
	if (strncmp(&header[257], "ustar  ", 7) == 0)
		return true;

	return false;
P
Philip Warner 已提交
1002 1003 1004
}

/* Given the member, write the TAR header & copy the file */
B
Bruce Momjian 已提交
1005 1006
static void
_tarAddFile(ArchiveHandle *AH, TAR_MEMBER *th)
P
Philip Warner 已提交
1007
{
B
Bruce Momjian 已提交
1008
	lclContext *ctx = (lclContext *) AH->formatData;
1009
	FILE	   *tmp = th->tmpFH;	/* Grab it for convenience */
P
Philip Warner 已提交
1010
	char		buf[32768];
P
Peter Eisentraut 已提交
1011 1012 1013 1014
	size_t		cnt;
	off_t		len = 0;
	size_t		res;
	size_t		i,
B
Bruce Momjian 已提交
1015
				pad;
P
Philip Warner 已提交
1016 1017 1018 1019

	/*
	 * Find file len & go back to start.
	 */
P
Peter Eisentraut 已提交
1020 1021
	fseeko(tmp, 0, SEEK_END);
	th->fileLen = ftello(tmp);
1022 1023 1024 1025
	/*
	 *	Some compilers with throw a warning knowing this test can never be
	 *	true because off_t can't exceed the compared maximum.
	 */
1026 1027
	if (th->fileLen > MAX_TAR_MEMBER_FILELEN)
		die_horribly(AH, modulename, "archive member too large for tar format\n");
P
Peter Eisentraut 已提交
1028
	fseeko(tmp, 0, SEEK_SET);
P
Philip Warner 已提交
1029 1030 1031

	_tarWriteHeader(th);

B
Bruce Momjian 已提交
1032
	while ((cnt = fread(&buf[0], 1, 32767, tmp)) > 0)
P
Philip Warner 已提交
1033
	{
1034
		res = fwrite(&buf[0], 1, cnt, th->tarFH);
B
Bruce Momjian 已提交
1035
		if (res != cnt)
P
Peter Eisentraut 已提交
1036 1037 1038
			die_horribly(AH, modulename,
						 "write error appending to tar archive (wrote %lu, attempted %lu)\n",
						 (unsigned long) res, (unsigned long) cnt);
1039
		len += res;
P
Philip Warner 已提交
1040 1041
	}

B
Bruce Momjian 已提交
1042
	if (fclose(tmp) != 0)		/* This *should* delete it... */
1043
		die_horribly(AH, modulename, "could not close tar member: %s\n", strerror(errno));
P
Philip Warner 已提交
1044 1045

	if (len != th->fileLen)
1046
	{
B
Bruce Momjian 已提交
1047 1048 1049
		char		buf1[100],
					buf2[100];

1050 1051
		snprintf(buf1, sizeof(buf1), INT64_FORMAT, (int64) len);
		snprintf(buf2, sizeof(buf2), INT64_FORMAT, (int64) th->pos);
1052 1053 1054
		die_horribly(AH, modulename, "actual file length (%s) does not match expected (%s)\n",
					 buf1, buf2);
	}
P
Philip Warner 已提交
1055 1056

	pad = ((len + 511) & ~511) - len;
B
Bruce Momjian 已提交
1057
	for (i = 0; i < pad; i++)
1058
	{
B
Bruce Momjian 已提交
1059
		if (fputc('\0', th->tarFH) == EOF)
1060
			die_horribly(AH, modulename, "could not output padding at end of tar member\n");
B
Bruce Momjian 已提交
1061
	}
P
Philip Warner 已提交
1062 1063 1064 1065 1066

	ctx->tarFHpos += len + pad;
}

/* Locate the file in the archive, read header and position to data */
B
Bruce Momjian 已提交
1067 1068
static TAR_MEMBER *
_tarPositionTo(ArchiveHandle *AH, const char *filename)
P
Philip Warner 已提交
1069
{
B
Bruce Momjian 已提交
1070 1071 1072 1073
	lclContext *ctx = (lclContext *) AH->formatData;
	TAR_MEMBER *th = calloc(1, sizeof(TAR_MEMBER));
	char		c;
	char		header[512];
P
Peter Eisentraut 已提交
1074
	size_t		i,
B
Bruce Momjian 已提交
1075
				len,
P
Peter Eisentraut 已提交
1076 1077
				blks;
	int			id;
P
Philip Warner 已提交
1078 1079 1080 1081 1082 1083

	th->AH = AH;

	/* Go to end of current file, if any */
	if (ctx->tarFHpos != 0)
	{
B
Bruce Momjian 已提交
1084 1085 1086
		char		buf1[100],
					buf2[100];

1087 1088
		snprintf(buf1, sizeof(buf1), INT64_FORMAT, (int64) ctx->tarFHpos);
		snprintf(buf2, sizeof(buf2), INT64_FORMAT, (int64) ctx->tarNextMember);
1089 1090
		ahlog(AH, 4, "moving from position %s to next member at file position %s\n",
			  buf1, buf2);
P
Philip Warner 已提交
1091 1092 1093 1094 1095

		while (ctx->tarFHpos < ctx->tarNextMember)
			_tarReadRaw(AH, &c, 1, NULL, ctx->tarFH);
	}

1096
	{
B
Bruce Momjian 已提交
1097 1098
		char		buf[100];

1099
		snprintf(buf, sizeof(buf), INT64_FORMAT, (int64) ctx->tarFHpos);
1100 1101
		ahlog(AH, 4, "now at file position %s\n", buf);
	}
P
Philip Warner 已提交
1102 1103 1104 1105 1106 1107 1108

	/* We are at the start of the file. or at the next member */

	/* Get the header */
	if (!_tarGetHeader(AH, th))
	{
		if (filename)
1109
			die_horribly(AH, modulename, "could not find header for file %s in tar archive\n", filename);
B
Bruce Momjian 已提交
1110
		else
1111
		/* We're just scanning the archibe for the next file, so return null */
P
Philip Warner 已提交
1112 1113 1114 1115 1116 1117
		{
			free(th);
			return NULL;
		}
	}

B
Bruce Momjian 已提交
1118
	while (filename != NULL && strcmp(th->targetFile, filename) != 0)
P
Philip Warner 已提交
1119
	{
1120
		ahlog(AH, 4, "skipping tar member %s\n", th->targetFile);
P
Philip Warner 已提交
1121 1122

		id = atoi(th->targetFile);
1123
		if ((TocIDRequired(AH, id, AH->ropt) & REQ_DATA) != 0)
1124
			die_horribly(AH, modulename, "dumping data out of order is not supported in this archive format: "
1125
			"%s is required, but comes before %s in the archive file.\n",
1126
						 th->targetFile, filename);
P
Philip Warner 已提交
1127 1128

		/* Header doesn't match, so read to next header */
B
Bruce Momjian 已提交
1129 1130
		len = ((th->fileLen + 511) & ~511);		/* Padded length */
		blks = len >> 9;		/* # of 512 byte blocks */
P
Philip Warner 已提交
1131

B
Bruce Momjian 已提交
1132
		for (i = 0; i < blks; i++)
P
Philip Warner 已提交
1133 1134 1135
			_tarReadRaw(AH, &header[0], 512, NULL, ctx->tarFH);

		if (!_tarGetHeader(AH, th))
1136
			die_horribly(AH, modulename, "could not find header for file %s in tar archive\n", filename);
P
Philip Warner 已提交
1137 1138 1139 1140 1141 1142 1143 1144 1145 1146

	}

	ctx->tarNextMember = ctx->tarFHpos + ((th->fileLen + 511) & ~511);
	th->pos = 0;

	return th;
}

/* Read & verify a header */
B
Bruce Momjian 已提交
1147 1148
static int
_tarGetHeader(ArchiveHandle *AH, TAR_MEMBER *th)
P
Philip Warner 已提交
1149
{
B
Bruce Momjian 已提交
1150 1151
	lclContext *ctx = (lclContext *) AH->formatData;
	char		h[512];
1152
	char		tag[100];
B
Bruce Momjian 已提交
1153 1154
	int			sum,
				chk;
P
Peter Eisentraut 已提交
1155
	size_t		len;
B
Bruce Momjian 已提交
1156
	unsigned long ullen;
P
Peter Eisentraut 已提交
1157
	off_t		hPos;
B
Bruce Momjian 已提交
1158
	bool		gotBlock = false;
P
Philip Warner 已提交
1159

1160 1161
	while (!gotBlock)
	{
1162
#if 0
P
Peter Eisentraut 已提交
1163
		if (ftello(ctx->tarFH) != ctx->tarFHpos)
1164
		{
B
Bruce Momjian 已提交
1165 1166 1167
			char		buf1[100],
						buf2[100];

1168 1169
			snprintf(buf1, sizeof(buf1), INT64_FORMAT, (int64) ftello(ctx->tarFH));
			snprintf(buf2, sizeof(buf2), INT64_FORMAT, (int64) ftello(ctx->tarFHpos));
1170
			die_horribly(AH, modulename,
1171 1172 1173
						 "mismatch in actual vs. predicted file position (%s vs. %s)\n",
						 buf1, buf2);
		}
1174
#endif
P
Philip Warner 已提交
1175

1176 1177
		/* Save the pos for reporting purposes */
		hPos = ctx->tarFHpos;
P
Philip Warner 已提交
1178

1179
		/* Read a 512 byte block, return EOF, exit if short */
1180
		len = _tarReadRaw(AH, h, 512, NULL, ctx->tarFH);
B
Bruce Momjian 已提交
1181
		if (len == 0)			/* EOF */
1182 1183 1184
			return 0;

		if (len != 512)
P
Peter Eisentraut 已提交
1185 1186 1187
			die_horribly(AH, modulename,
						 "incomplete tar header found (%lu bytes)\n",
						 (unsigned long) len);
1188 1189

		/* Calc checksum */
1190 1191
		chk = _tarChecksum(h);
		sscanf(&h[148], "%8o", &sum);
P
Philip Warner 已提交
1192

1193
		/*
1194 1195
		 * If the checksum failed, see if it is a null block. If so,
		 * silently continue to the next block.
1196
		 */
B
Bruce Momjian 已提交
1197
		if (chk == sum)
1198
			gotBlock = true;
B
Bruce Momjian 已提交
1199 1200
		else
		{
1201 1202
			int			i;

B
Bruce Momjian 已提交
1203
			for (i = 0; i < 512; i++)
1204
			{
1205
				if (h[i] != 0)
1206
				{
B
Bruce Momjian 已提交
1207
					gotBlock = true;
1208 1209 1210 1211 1212
					break;
				}
			}
		}
	}
P
Philip Warner 已提交
1213

1214 1215 1216
	sscanf(&h[0], "%99s", tag);
	sscanf(&h[124], "%12lo", &ullen);
	len = (size_t) ullen;
P
Philip Warner 已提交
1217

1218
	{
B
Bruce Momjian 已提交
1219 1220
		char		buf[100];

1221
		snprintf(buf, sizeof(buf), INT64_FORMAT, (int64) hPos);
1222
		ahlog(AH, 3, "TOC Entry %s at %s (length %lu, checksum %d)\n",
1223
			  tag, buf, (unsigned long) len, sum);
1224
	}
P
Philip Warner 已提交
1225 1226

	if (chk != sum)
1227
	{
B
Bruce Momjian 已提交
1228 1229
		char		buf[100];

1230
		snprintf(buf, sizeof(buf), INT64_FORMAT, (int64) ftello(ctx->tarFH));
1231 1232
		die_horribly(AH, modulename,
					 "corrupt tar header found in %s "
1233
					 "(expected %d, computed %d) file position %s\n",
1234
					 tag, sum, chk, buf);
1235
	}
P
Philip Warner 已提交
1236

1237
	th->targetFile = strdup(tag);
P
Philip Warner 已提交
1238 1239 1240 1241 1242
	th->fileLen = len;

	return 1;
}

1243 1244 1245 1246 1247

/*
 * Utility routine to print possibly larger than 32 bit integers in a
 * portable fashion.  Filled with zeros.
 */
B
Bruce Momjian 已提交
1248 1249
static void
print_val(char *s, uint64 val, unsigned int base, size_t len)
1250
{
B
Bruce Momjian 已提交
1251 1252 1253 1254 1255 1256 1257 1258 1259
	int			i;

	for (i = len; i > 0; i--)
	{
		int			digit = val % base;

		s[i - 1] = '0' + digit;
		val = val / base;
	}
1260 1261 1262
}


B
Bruce Momjian 已提交
1263 1264
static void
_tarWriteHeader(TAR_MEMBER *th)
P
Philip Warner 已提交
1265 1266 1267 1268 1269
{
	char		h[512];
	int			lastSum = 0;
	int			sum;

1270
	memset(h, 0, sizeof(h));
P
Philip Warner 已提交
1271 1272 1273 1274 1275 1276 1277 1278

	/* Name 100 */
	sprintf(&h[0], "%.99s", th->targetFile);

	/* Mode 8 */
	sprintf(&h[100], "100600 ");

	/* User ID 8 */
1279
	sprintf(&h[108], "004000 ");
P
Philip Warner 已提交
1280 1281

	/* Group 8 */
1282
	sprintf(&h[116], "002000 ");
P
Philip Warner 已提交
1283

1284 1285 1286
	/* File size 12 - 11 digits, 1 space, no NUL */
	print_val(&h[124], th->fileLen, 8, 11);
	sprintf(&h[135], " ");
P
Philip Warner 已提交
1287 1288

	/* Mod Time 12 */
1289
	sprintf(&h[136], "%011o ", (int) time(NULL));
P
Philip Warner 已提交
1290 1291

	/* Checksum 8 */
1292
	sprintf(&h[148], "%06o ", lastSum);
P
Philip Warner 已提交
1293

1294
	/* Type - regular file */
P
Philip Warner 已提交
1295
	sprintf(&h[156], "0");
P
Philip Warner 已提交
1296

1297
	/* Link tag 100 (NULL) */
P
Philip Warner 已提交
1298

1299 1300
	/* Magic 6 + Version 2 */
	sprintf(&h[257], "ustar00");
P
Philip Warner 已提交
1301

1302
#if 0
P
Philip Warner 已提交
1303
	/* User 32 */
B
Bruce Momjian 已提交
1304 1305
	sprintf(&h[265], "%.31s", "");		/* How do I get username reliably?
										 * Do I need to? */
P
Philip Warner 已提交
1306 1307

	/* Group 32 */
B
Bruce Momjian 已提交
1308 1309
	sprintf(&h[297], "%.31s", "");		/* How do I get group reliably? Do
										 * I need to? */
P
Philip Warner 已提交
1310 1311

	/* Maj Dev 8 */
1312
	sprintf(&h[329], "%6o ", 0);
P
Philip Warner 已提交
1313

1314 1315 1316
	/* Min Dev 8 */
	sprintf(&h[337], "%6o ", 0);
#endif
P
Philip Warner 已提交
1317

B
Bruce Momjian 已提交
1318
	while ((sum = _tarChecksum(h)) != lastSum)
P
Philip Warner 已提交
1319
	{
1320
		sprintf(&h[148], "%06o ", sum);
P
Philip Warner 已提交
1321 1322 1323
		lastSum = sum;
	}

B
Bruce Momjian 已提交
1324
	if (fwrite(h, 1, 512, th->tarFH) != 512)
1325
		die_horribly(th->AH, modulename, "could not write tar header\n");
1326

P
Philip Warner 已提交
1327
}