pg_backup_tar.c 30.1 KB
Newer Older
P
Philip Warner 已提交
1 2 3 4 5 6
/*-------------------------------------------------------------------------
 *
 * pg_backup_tar.c
 *
 *	This file is copied from the 'files' format file, but dumps data into
 *	one temp file then sends it to the output TAR archive.
7
 *
8 9 10
 *	NOTE: If you untar the created 'tar' file, the resulting files are
 *	compatible with the 'directory' format. Please keep the two formats in
 *	sync.
P
Philip Warner 已提交
11 12 13 14
 *
 *	See the headers to pg_backup_files & pg_restore for more details.
 *
 * Copyright (c) 2000, Philip Warner
B
Bruce Momjian 已提交
15 16
 *		Rights are granted to use this software in any way so long
 *		as this notice is not removed.
P
Philip Warner 已提交
17 18 19 20 21 22
 *
 *	The author is not responsible for loss or damages that may
 *	result from it's use.
 *
 *
 * IDENTIFICATION
23
 *		src/bin/pg_dump/pg_backup_tar.c
24
 *
P
Philip Warner 已提交
25 26 27
 *-------------------------------------------------------------------------
 */

28 29 30
#include "pg_backup.h"
#include "pg_backup_archiver.h"
#include "pg_backup_tar.h"
31
#include "dumpmem.h"
R
Robert Haas 已提交
32
#include "dumputils.h"
33

34
#include <sys/stat.h>
P
Philip Warner 已提交
35
#include <ctype.h>
36
#include <limits.h>
P
Philip Warner 已提交
37 38
#include <unistd.h>

B
Bruce Momjian 已提交
39 40
static void _ArchiveEntry(ArchiveHandle *AH, TocEntry *te);
static void _StartData(ArchiveHandle *AH, TocEntry *te);
B
Bruce Momjian 已提交
41
static size_t _WriteData(ArchiveHandle *AH, const void *data, size_t dLen);
B
Bruce Momjian 已提交
42 43 44
static void _EndData(ArchiveHandle *AH, TocEntry *te);
static int	_WriteByte(ArchiveHandle *AH, const int i);
static int	_ReadByte(ArchiveHandle *);
B
Bruce Momjian 已提交
45 46
static size_t _WriteBuf(ArchiveHandle *AH, const void *buf, size_t len);
static size_t _ReadBuf(ArchiveHandle *AH, void *buf, size_t len);
B
Bruce Momjian 已提交
47 48 49 50 51 52 53
static void _CloseArchive(ArchiveHandle *AH);
static void _PrintTocData(ArchiveHandle *AH, TocEntry *te, RestoreOptions *ropt);
static void _WriteExtraToc(ArchiveHandle *AH, TocEntry *te);
static void _ReadExtraToc(ArchiveHandle *AH, TocEntry *te);
static void _PrintExtraToc(ArchiveHandle *AH, TocEntry *te);

static void _StartBlobs(ArchiveHandle *AH, TocEntry *te);
54 55
static void _StartBlob(ArchiveHandle *AH, TocEntry *te, Oid oid);
static void _EndBlob(ArchiveHandle *AH, TocEntry *te, Oid oid);
B
Bruce Momjian 已提交
56
static void _EndBlobs(ArchiveHandle *AH, TocEntry *te);
P
Philip Warner 已提交
57 58 59 60 61

#define K_STD_BUF_SIZE 1024


#ifdef HAVE_LIBZ
B
Bruce Momjian 已提交
62 63
 /* typedef gzFile	 ThingFile; */
typedef FILE ThingFile;
P
Philip Warner 已提交
64
#else
B
Bruce Momjian 已提交
65
typedef FILE ThingFile;
P
Philip Warner 已提交
66 67
#endif

B
Bruce Momjian 已提交
68 69 70 71 72 73 74 75
typedef struct
{
	ThingFile  *zFH;
	FILE	   *nFH;
	FILE	   *tarFH;
	FILE	   *tmpFH;
	char	   *targetFile;
	char		mode;
76 77
	pgoff_t		pos;
	pgoff_t		fileLen;
B
Bruce Momjian 已提交
78
	ArchiveHandle *AH;
P
Philip Warner 已提交
79 80
} TAR_MEMBER;

81 82 83
/*
 * Maximum file size for a tar member: The limit inherent in the
 * format is 2^33-1 bytes (nearly 8 GB).  But we don't want to exceed
84
 * what we can represent in pgoff_t.
85
 */
86
#define MAX_TAR_MEMBER_FILELEN (((int64) 1 << Min(33, sizeof(pgoff_t)*8 - 1)) - 1)
87

B
Bruce Momjian 已提交
88 89
typedef struct
{
P
Philip Warner 已提交
90
	int			hasSeek;
91
	pgoff_t		filePos;
B
Bruce Momjian 已提交
92 93
	TAR_MEMBER *blobToc;
	FILE	   *tarFH;
94 95
	pgoff_t		tarFHpos;
	pgoff_t		tarNextMember;
B
Bruce Momjian 已提交
96
	TAR_MEMBER *FH;
P
Philip Warner 已提交
97
	int			isSpecialScript;
B
Bruce Momjian 已提交
98
	TAR_MEMBER *scriptTH;
P
Philip Warner 已提交
99 100
} lclContext;

B
Bruce Momjian 已提交
101 102 103 104
typedef struct
{
	TAR_MEMBER *TH;
	char	   *filename;
P
Philip Warner 已提交
105 106
} lclTocEntry;

107
static const char *modulename = gettext_noop("tar archiver");
B
Bruce Momjian 已提交
108 109

static void _LoadBlobs(ArchiveHandle *AH, RestoreOptions *ropt);
P
Philip Warner 已提交
110

B
Bruce Momjian 已提交
111 112
static TAR_MEMBER *tarOpen(ArchiveHandle *AH, const char *filename, char mode);
static void tarClose(ArchiveHandle *AH, TAR_MEMBER *TH);
P
Philip Warner 已提交
113 114

#ifdef __NOT_USED__
P
Peter Eisentraut 已提交
115
static char *tarGets(char *buf, size_t len, TAR_MEMBER *th);
P
Philip Warner 已提交
116
#endif
P
Peter Eisentraut 已提交
117
static int	tarPrintf(ArchiveHandle *AH, TAR_MEMBER *th, const char *fmt, ...) __attribute__((format(PG_PRINTF_ATTRIBUTE, 3, 4)));
P
Philip Warner 已提交
118

B
Bruce Momjian 已提交
119 120 121
static void _tarAddFile(ArchiveHandle *AH, TAR_MEMBER *th);
static int	_tarChecksum(char *th);
static TAR_MEMBER *_tarPositionTo(ArchiveHandle *AH, const char *filename);
B
Bruce Momjian 已提交
122 123
static size_t tarRead(void *buf, size_t len, TAR_MEMBER *th);
static size_t tarWrite(const void *buf, size_t len, TAR_MEMBER *th);
B
Bruce Momjian 已提交
124 125
static void _tarWriteHeader(TAR_MEMBER *th);
static int	_tarGetHeader(ArchiveHandle *AH, TAR_MEMBER *th);
B
Bruce Momjian 已提交
126
static size_t _tarReadRaw(ArchiveHandle *AH, void *buf, size_t len, TAR_MEMBER *th, FILE *fh);
P
Philip Warner 已提交
127

B
Bruce Momjian 已提交
128
static size_t _scriptOut(ArchiveHandle *AH, const void *buf, size_t len);
P
Philip Warner 已提交
129 130

/*
B
Bruce Momjian 已提交
131
 *	Initializer
P
Philip Warner 已提交
132
 */
B
Bruce Momjian 已提交
133 134
void
InitArchiveFmt_Tar(ArchiveHandle *AH)
P
Philip Warner 已提交
135
{
B
Bruce Momjian 已提交
136 137 138 139 140 141 142 143 144 145 146 147
	lclContext *ctx;

	/* Assuming static functions, this can be copied for each format. */
	AH->ArchiveEntryPtr = _ArchiveEntry;
	AH->StartDataPtr = _StartData;
	AH->WriteDataPtr = _WriteData;
	AH->EndDataPtr = _EndData;
	AH->WriteBytePtr = _WriteByte;
	AH->ReadBytePtr = _ReadByte;
	AH->WriteBufPtr = _WriteBuf;
	AH->ReadBufPtr = _ReadBuf;
	AH->ClosePtr = _CloseArchive;
148
	AH->ReopenPtr = NULL;
B
Bruce Momjian 已提交
149 150 151 152 153 154 155 156 157
	AH->PrintTocDataPtr = _PrintTocData;
	AH->ReadExtraTocPtr = _ReadExtraToc;
	AH->WriteExtraTocPtr = _WriteExtraToc;
	AH->PrintExtraTocPtr = _PrintExtraToc;

	AH->StartBlobsPtr = _StartBlobs;
	AH->StartBlobPtr = _StartBlob;
	AH->EndBlobPtr = _EndBlob;
	AH->EndBlobsPtr = _EndBlobs;
158 159
	AH->ClonePtr = NULL;
	AH->DeClonePtr = NULL;
B
Bruce Momjian 已提交
160 161 162 163

	/*
	 * Set up some special context used in compressing data.
	 */
164
	ctx = (lclContext *) pg_calloc(1, sizeof(lclContext));
B
Bruce Momjian 已提交
165 166
	AH->formatData = (void *) ctx;
	ctx->filePos = 0;
167
	ctx->isSpecialScript = 0;
B
Bruce Momjian 已提交
168

169 170
	/* Initialize LO buffering */
	AH->lo_buf_size = LOBBUFSIZE;
171
	AH->lo_buf = (void *) pg_malloc(LOBBUFSIZE);
B
Bruce Momjian 已提交
172 173

	/*
174
	 * Now open the tar file, and load the TOC if we're in read mode.
B
Bruce Momjian 已提交
175 176 177 178
	 */
	if (AH->mode == archModeWrite)
	{
		if (AH->fSpec && strcmp(AH->fSpec, "") != 0)
179
		{
P
Philip Warner 已提交
180
			ctx->tarFH = fopen(AH->fSpec, PG_BINARY_W);
181
			if (ctx->tarFH == NULL)
R
Robert Haas 已提交
182 183 184
				exit_horribly(modulename,
							  "could not open TOC file \"%s\" for output: %s\n",
							  AH->fSpec, strerror(errno));
185
		}
B
Bruce Momjian 已提交
186
		else
187
		{
P
Philip Warner 已提交
188
			ctx->tarFH = stdout;
189
			if (ctx->tarFH == NULL)
R
Robert Haas 已提交
190 191 192
				exit_horribly(modulename,
							  "could not open TOC file for output: %s\n",
							  strerror(errno));
193
		}
194

P
Philip Warner 已提交
195 196
		ctx->tarFHpos = 0;

B
Bruce Momjian 已提交
197
		/*
B
Bruce Momjian 已提交
198 199
		 * Make unbuffered since we will dup() it, and the buffers screw each
		 * other
B
Bruce Momjian 已提交
200
		 */
201
		/* setvbuf(ctx->tarFH, NULL, _IONBF, 0); */
P
Philip Warner 已提交
202

203
		ctx->hasSeek = checkSeek(ctx->tarFH);
P
Philip Warner 已提交
204

B
Bruce Momjian 已提交
205
		if (AH->compression < 0 || AH->compression > 9)
P
Philip Warner 已提交
206 207 208 209 210 211
			AH->compression = Z_DEFAULT_COMPRESSION;

		/* Don't compress into tar files unless asked to do so */
		if (AH->compression == Z_DEFAULT_COMPRESSION)
			AH->compression = 0;

B
Bruce Momjian 已提交
212
		/*
B
Bruce Momjian 已提交
213 214 215
		 * We don't support compression because reading the files back is not
		 * possible since gzdopen uses buffered IO which totally screws file
		 * positioning.
P
Philip Warner 已提交
216 217
		 */
		if (AH->compression != 0)
R
Robert Haas 已提交
218 219
			exit_horribly(modulename,
						  "compression is not supported by tar archive format\n");
B
Bruce Momjian 已提交
220 221 222 223
	}
	else
	{							/* Read Mode */
		if (AH->fSpec && strcmp(AH->fSpec, "") != 0)
224
		{
P
Philip Warner 已提交
225
			ctx->tarFH = fopen(AH->fSpec, PG_BINARY_R);
226
			if (ctx->tarFH == NULL)
R
Robert Haas 已提交
227 228
				exit_horribly(modulename, "could not open TOC file \"%s\" for input: %s\n",
							  AH->fSpec, strerror(errno));
229
		}
B
Bruce Momjian 已提交
230
		else
231
		{
P
Philip Warner 已提交
232
			ctx->tarFH = stdin;
233
			if (ctx->tarFH == NULL)
R
Robert Haas 已提交
234 235
				exit_horribly(modulename, "could not open TOC file for input: %s\n",
							  strerror(errno));
236
		}
237

B
Bruce Momjian 已提交
238
		/*
B
Bruce Momjian 已提交
239 240
		 * Make unbuffered since we will dup() it, and the buffers screw each
		 * other
B
Bruce Momjian 已提交
241
		 */
242
		/* setvbuf(ctx->tarFH, NULL, _IONBF, 0); */
P
Philip Warner 已提交
243 244 245

		ctx->tarFHpos = 0;

246
		ctx->hasSeek = checkSeek(ctx->tarFH);
P
Philip Warner 已提交
247

B
Bruce Momjian 已提交
248 249 250 251
		/*
		 * Forcibly unmark the header as read since we use the lookahead
		 * buffer
		 */
P
Philip Warner 已提交
252 253
		AH->readHeader = 0;

B
Bruce Momjian 已提交
254
		ctx->FH = (void *) tarOpen(AH, "toc.dat", 'r');
P
Philip Warner 已提交
255 256
		ReadHead(AH);
		ReadToc(AH);
B
Bruce Momjian 已提交
257 258
		tarClose(AH, ctx->FH);	/* Nothing else in the file... */
	}
P
Philip Warner 已提交
259 260 261 262
}

/*
 * - Start a new TOC entry
B
Bruce Momjian 已提交
263
 *	 Setup the output file name.
P
Philip Warner 已提交
264
 */
B
Bruce Momjian 已提交
265 266
static void
_ArchiveEntry(ArchiveHandle *AH, TocEntry *te)
P
Philip Warner 已提交
267
{
B
Bruce Momjian 已提交
268 269
	lclTocEntry *ctx;
	char		fn[K_STD_BUF_SIZE];
P
Philip Warner 已提交
270

271
	ctx = (lclTocEntry *) pg_calloc(1, sizeof(lclTocEntry));
272
	if (te->dataDumper != NULL)
B
Bruce Momjian 已提交
273
	{
P
Philip Warner 已提交
274
#ifdef HAVE_LIBZ
B
Bruce Momjian 已提交
275
		if (AH->compression == 0)
276
			sprintf(fn, "%d.dat", te->dumpId);
B
Bruce Momjian 已提交
277
		else
278
			sprintf(fn, "%d.dat.gz", te->dumpId);
P
Philip Warner 已提交
279
#else
280
		sprintf(fn, "%d.dat", te->dumpId);
P
Philip Warner 已提交
281
#endif
282
		ctx->filename = pg_strdup(fn);
B
Bruce Momjian 已提交
283 284 285
	}
	else
	{
P
Philip Warner 已提交
286 287
		ctx->filename = NULL;
		ctx->TH = NULL;
B
Bruce Momjian 已提交
288 289
	}
	te->formatData = (void *) ctx;
P
Philip Warner 已提交
290 291
}

B
Bruce Momjian 已提交
292 293
static void
_WriteExtraToc(ArchiveHandle *AH, TocEntry *te)
P
Philip Warner 已提交
294
{
B
Bruce Momjian 已提交
295
	lclTocEntry *ctx = (lclTocEntry *) te->formatData;
P
Philip Warner 已提交
296

B
Bruce Momjian 已提交
297
	if (ctx->filename)
P
Philip Warner 已提交
298
		WriteStr(AH, ctx->filename);
B
Bruce Momjian 已提交
299
	else
P
Philip Warner 已提交
300 301 302
		WriteStr(AH, "");
}

B
Bruce Momjian 已提交
303 304
static void
_ReadExtraToc(ArchiveHandle *AH, TocEntry *te)
P
Philip Warner 已提交
305
{
B
Bruce Momjian 已提交
306
	lclTocEntry *ctx = (lclTocEntry *) te->formatData;
P
Philip Warner 已提交
307

B
Bruce Momjian 已提交
308 309
	if (ctx == NULL)
	{
310
		ctx = (lclTocEntry *) pg_calloc(1, sizeof(lclTocEntry));
B
Bruce Momjian 已提交
311 312
		te->formatData = (void *) ctx;
	}
P
Philip Warner 已提交
313

B
Bruce Momjian 已提交
314 315 316
	ctx->filename = ReadStr(AH);
	if (strlen(ctx->filename) == 0)
	{
P
Philip Warner 已提交
317 318
		free(ctx->filename);
		ctx->filename = NULL;
B
Bruce Momjian 已提交
319 320
	}
	ctx->TH = NULL;
P
Philip Warner 已提交
321 322
}

B
Bruce Momjian 已提交
323 324
static void
_PrintExtraToc(ArchiveHandle *AH, TocEntry *te)
P
Philip Warner 已提交
325
{
B
Bruce Momjian 已提交
326
	lclTocEntry *ctx = (lclTocEntry *) te->formatData;
P
Philip Warner 已提交
327

328
	if (AH->public.verbose && ctx->filename != NULL)
329
		ahprintf(AH, "-- File: %s\n", ctx->filename);
P
Philip Warner 已提交
330 331
}

B
Bruce Momjian 已提交
332 333
static void
_StartData(ArchiveHandle *AH, TocEntry *te)
P
Philip Warner 已提交
334
{
B
Bruce Momjian 已提交
335
	lclTocEntry *tctx = (lclTocEntry *) te->formatData;
P
Philip Warner 已提交
336 337 338 339

	tctx->TH = tarOpen(AH, tctx->filename, 'w');
}

B
Bruce Momjian 已提交
340 341
static TAR_MEMBER *
tarOpen(ArchiveHandle *AH, const char *filename, char mode)
P
Philip Warner 已提交
342
{
B
Bruce Momjian 已提交
343 344 345
	lclContext *ctx = (lclContext *) AH->formatData;
	TAR_MEMBER *tm;

P
Philip Warner 已提交
346
#ifdef HAVE_LIBZ
B
Bruce Momjian 已提交
347
	char		fmode[10];
P
Philip Warner 已提交
348 349 350 351 352
#endif

	if (mode == 'r')
	{
		tm = _tarPositionTo(AH, filename);
B
Bruce Momjian 已提交
353
		if (!tm)				/* Not found */
P
Philip Warner 已提交
354
		{
355 356 357
			if (filename)
			{
				/*
B
Bruce Momjian 已提交
358 359
				 * Couldn't find the requested file. Future: do SEEK(0) and
				 * retry.
360 361 362
				 */
				die_horribly(AH, modulename, "could not find file \"%s\" in archive\n", filename);
			}
B
Bruce Momjian 已提交
363
			else
364 365
			{
				/* Any file OK, none left, so return NULL */
P
Philip Warner 已提交
366
				return NULL;
367
			}
P
Philip Warner 已提交
368 369 370 371 372 373 374
		}

#ifdef HAVE_LIBZ

		if (AH->compression == 0)
			tm->nFH = ctx->tarFH;
		else
375
			die_horribly(AH, modulename, "compression is not supported by tar archive format\n");
B
Bruce Momjian 已提交
376
		/* tm->zFH = gzdopen(dup(fileno(ctx->tarFH)), "rb"); */
P
Philip Warner 已提交
377 378 379
#else
		tm->nFH = ctx->tarFH;
#endif
B
Bruce Momjian 已提交
380 381 382
	}
	else
	{
383
		tm = pg_calloc(1, sizeof(TAR_MEMBER));
P
Philip Warner 已提交
384

385
#ifndef WIN32
P
Philip Warner 已提交
386
		tm->tmpFH = tmpfile();
387
#else
B
Bruce Momjian 已提交
388

389
		/*
B
Bruce Momjian 已提交
390 391 392
		 * On WIN32, tmpfile() generates a filename in the root directory,
		 * which requires administrative permissions on certain systems. Loop
		 * until we find a unique file name we can create.
393 394 395
		 */
		while (1)
		{
B
Bruce Momjian 已提交
396 397 398
			char	   *name;
			int			fd;

399 400 401 402
			name = _tempnam(NULL, "pg_temp_");
			if (name == NULL)
				break;
			fd = open(name, O_RDWR | O_CREAT | O_EXCL | O_BINARY |
403
					  O_TEMPORARY, S_IRUSR | S_IWUSR);
404 405
			free(name);

B
Bruce Momjian 已提交
406
			if (fd != -1)		/* created a file */
407 408 409 410 411 412 413 414
			{
				tm->tmpFH = fdopen(fd, "w+b");
				break;
			}
			else if (errno != EEXIST)	/* failure other than file exists */
				break;
		}
#endif
P
Philip Warner 已提交
415

B
Bruce Momjian 已提交
416
		if (tm->tmpFH == NULL)
417
			die_horribly(AH, modulename, "could not generate temporary file name: %s\n", strerror(errno));
418

P
Philip Warner 已提交
419 420 421 422 423 424
#ifdef HAVE_LIBZ

		if (AH->compression != 0)
		{
			sprintf(fmode, "wb%d", AH->compression);
			tm->zFH = gzdopen(dup(fileno(tm->tmpFH)), fmode);
425
			if (tm->zFH == NULL)
426
				die_horribly(AH, modulename, "could not open temporary file\n");
B
Bruce Momjian 已提交
427 428
		}
		else
P
Philip Warner 已提交
429 430 431 432 433 434 435
			tm->nFH = tm->tmpFH;
#else

		tm->nFH = tm->tmpFH;
#endif

		tm->AH = AH;
436
		tm->targetFile = pg_strdup(filename);
P
Philip Warner 已提交
437 438 439 440 441 442 443 444
	}

	tm->mode = mode;
	tm->tarFH = ctx->tarFH;

	return tm;
}

B
Bruce Momjian 已提交
445 446
static void
tarClose(ArchiveHandle *AH, TAR_MEMBER *th)
P
Philip Warner 已提交
447 448 449 450 451
{
	/*
	 * Close the GZ file since we dup'd. This will flush the buffers.
	 */
	if (AH->compression != 0)
452
		if (GZCLOSE(th->zFH) != 0)
453
			die_horribly(AH, modulename, "could not close tar member\n");
P
Philip Warner 已提交
454 455

	if (th->mode == 'w')
B
Bruce Momjian 已提交
456 457 458 459 460
		_tarAddFile(AH, th);	/* This will close the temp file */

	/*
	 * else Nothing to do for normal read since we don't dup() normal file
	 * handle, and we don't use temp files.
P
Philip Warner 已提交
461 462
	 */

B
Bruce Momjian 已提交
463
	if (th->targetFile)
P
Philip Warner 已提交
464 465 466 467 468 469 470
		free(th->targetFile);

	th->nFH = NULL;
	th->zFH = NULL;
}

#ifdef __NOT_USED__
B
Bruce Momjian 已提交
471
static char *
P
Peter Eisentraut 已提交
472
tarGets(char *buf, size_t len, TAR_MEMBER *th)
P
Philip Warner 已提交
473
{
B
Bruce Momjian 已提交
474
	char	   *s;
P
Peter Eisentraut 已提交
475
	size_t		cnt = 0;
B
Bruce Momjian 已提交
476 477
	char		c = ' ';
	int			eof = 0;
P
Philip Warner 已提交
478 479 480 481 482 483 484

	/* Can't read past logical EOF */
	if (len > (th->fileLen - th->pos))
		len = th->fileLen - th->pos;

	while (cnt < len && c != '\n')
	{
B
Bruce Momjian 已提交
485 486
		if (_tarReadRaw(th->AH, &c, 1, th, NULL) <= 0)
		{
P
Philip Warner 已提交
487 488 489 490 491 492 493 494 495 496 497 498 499 500 501 502
			eof = 1;
			break;
		}
		buf[cnt++] = c;
	}

	if (eof && cnt == 0)
		s = NULL;
	else
	{
		buf[cnt++] = '\0';
		s = buf;
	}

	if (s)
	{
B
Bruce Momjian 已提交
503
		len = strlen(s);
P
Philip Warner 已提交
504 505 506 507 508 509 510
		th->pos += len;
	}

	return s;
}
#endif

B
Bruce Momjian 已提交
511
/*
P
Philip Warner 已提交
512 513 514
 * Just read bytes from the archive. This is the low level read routine
 * that is used for ALL reads on a tar file.
 */
P
Peter Eisentraut 已提交
515 516
static size_t
_tarReadRaw(ArchiveHandle *AH, void *buf, size_t len, TAR_MEMBER *th, FILE *fh)
P
Philip Warner 已提交
517
{
B
Bruce Momjian 已提交
518
	lclContext *ctx = (lclContext *) AH->formatData;
P
Peter Eisentraut 已提交
519 520 521
	size_t		avail;
	size_t		used = 0;
	size_t		res = 0;
P
Philip Warner 已提交
522 523 524 525 526

	avail = AH->lookaheadLen - AH->lookaheadPos;
	if (avail > 0)
	{
		/* We have some lookahead bytes to use */
B
Bruce Momjian 已提交
527
		if (avail >= len)		/* Just use the lookahead buffer */
P
Philip Warner 已提交
528 529 530 531 532
			used = len;
		else
			used = avail;

		/* Copy, and adjust buffer pos */
533
		memcpy(buf, AH->lookahead + AH->lookaheadPos, used);
P
Philip Warner 已提交
534 535 536 537 538 539 540 541 542 543
		AH->lookaheadPos += used;

		/* Adjust required length */
		len -= used;
	}

	/* Read the file if len > 0 */
	if (len > 0)
	{
		if (fh)
B
Bruce Momjian 已提交
544
			res = fread(&((char *) buf)[used], 1, len, fh);
P
Philip Warner 已提交
545 546 547
		else if (th)
		{
			if (th->zFH)
B
Bruce Momjian 已提交
548
				res = GZREAD(&((char *) buf)[used], 1, len, th->zFH);
P
Philip Warner 已提交
549
			else
B
Bruce Momjian 已提交
550 551
				res = fread(&((char *) buf)[used], 1, len, th->nFH);
		}
P
Philip Warner 已提交
552
		else
553
			die_horribly(AH, modulename, "internal error -- neither th nor fh specified in tarReadRaw()\n");
P
Philip Warner 已提交
554 555 556 557 558 559
	}

	ctx->tarFHpos += res + used;

	return (res + used);
}
B
Bruce Momjian 已提交
560

P
Peter Eisentraut 已提交
561 562
static size_t
tarRead(void *buf, size_t len, TAR_MEMBER *th)
P
Philip Warner 已提交
563
{
P
Peter Eisentraut 已提交
564
	size_t		res;
P
Philip Warner 已提交
565 566 567 568 569 570 571 572 573 574 575 576 577 578

	if (th->pos + len > th->fileLen)
		len = th->fileLen - th->pos;

	if (len <= 0)
		return 0;

	res = _tarReadRaw(th->AH, buf, len, th, NULL);

	th->pos += res;

	return res;
}

P
Peter Eisentraut 已提交
579 580
static size_t
tarWrite(const void *buf, size_t len, TAR_MEMBER *th)
P
Philip Warner 已提交
581
{
P
Peter Eisentraut 已提交
582
	size_t		res;
P
Philip Warner 已提交
583

584
	if (th->zFH != NULL)
585
		res = GZWRITE(buf, 1, len, th->zFH);
P
Philip Warner 已提交
586 587 588
	else
		res = fwrite(buf, 1, len, th->nFH);

589
	if (res != len)
590
		die_horribly(th->AH, modulename,
591
					 "could not write to output file: %s\n", strerror(errno));
592

P
Philip Warner 已提交
593 594 595 596
	th->pos += res;
	return res;
}

P
Peter Eisentraut 已提交
597 598
static size_t
_WriteData(ArchiveHandle *AH, const void *data, size_t dLen)
P
Philip Warner 已提交
599
{
B
Bruce Momjian 已提交
600
	lclTocEntry *tctx = (lclTocEntry *) AH->currToc->formatData;
P
Philip Warner 已提交
601

602
	dLen = tarWrite(data, dLen, tctx->TH);
P
Philip Warner 已提交
603

B
Bruce Momjian 已提交
604
	return dLen;
P
Philip Warner 已提交
605 606
}

B
Bruce Momjian 已提交
607 608
static void
_EndData(ArchiveHandle *AH, TocEntry *te)
P
Philip Warner 已提交
609
{
B
Bruce Momjian 已提交
610
	lclTocEntry *tctx = (lclTocEntry *) te->formatData;
P
Philip Warner 已提交
611

B
Bruce Momjian 已提交
612 613 614
	/* Close the file */
	tarClose(AH, tctx->TH);
	tctx->TH = NULL;
P
Philip Warner 已提交
615 616
}

B
Bruce Momjian 已提交
617 618
/*
 * Print data for a given file
P
Philip Warner 已提交
619
 */
B
Bruce Momjian 已提交
620 621
static void
_PrintFileData(ArchiveHandle *AH, char *filename, RestoreOptions *ropt)
P
Philip Warner 已提交
622
{
B
Bruce Momjian 已提交
623 624
	lclContext *ctx = (lclContext *) AH->formatData;
	char		buf[4096];
P
Peter Eisentraut 已提交
625
	size_t		cnt;
B
Bruce Momjian 已提交
626
	TAR_MEMBER *th;
P
Philip Warner 已提交
627

B
Bruce Momjian 已提交
628
	if (!filename)
P
Philip Warner 已提交
629 630 631 632 633
		return;

	th = tarOpen(AH, filename, 'r');
	ctx->FH = th;

B
Bruce Momjian 已提交
634 635
	while ((cnt = tarRead(buf, 4095, th)) > 0)
	{
P
Philip Warner 已提交
636 637
		buf[cnt] = '\0';
		ahwrite(buf, 1, cnt, AH);
B
Bruce Momjian 已提交
638
	}
P
Philip Warner 已提交
639

B
Bruce Momjian 已提交
640
	tarClose(AH, th);
P
Philip Warner 已提交
641 642 643 644 645 646
}


/*
 * Print data for a given TOC entry
*/
B
Bruce Momjian 已提交
647 648
static void
_PrintTocData(ArchiveHandle *AH, TocEntry *te, RestoreOptions *ropt)
P
Philip Warner 已提交
649
{
B
Bruce Momjian 已提交
650 651 652
	lclContext *ctx = (lclContext *) AH->formatData;
	lclTocEntry *tctx = (lclTocEntry *) te->formatData;
	char	   *tmpCopy;
P
Peter Eisentraut 已提交
653
	size_t		i,
B
Bruce Momjian 已提交
654 655 656 657
				pos1,
				pos2;

	if (!tctx->filename)
P
Philip Warner 已提交
658 659 660 661 662 663 664 665 666 667 668
		return;

	if (ctx->isSpecialScript)
	{
		if (!te->copyStmt)
			return;

		/* Abort the default COPY */
		ahprintf(AH, "\\.\n");

		/* Get a copy of the COPY statement and clean it up */
669
		tmpCopy = pg_strdup(te->copyStmt);
B
Bruce Momjian 已提交
670
		for (i = 0; i < strlen(tmpCopy); i++)
671
			tmpCopy[i] = pg_tolower((unsigned char) tmpCopy[i]);
P
Philip Warner 已提交
672 673

		/*
B
Bruce Momjian 已提交
674 675
		 * This is very nasty; we don't know if the archive used WITH OIDS, so
		 * we search the string for it in a paranoid sort of way.
P
Philip Warner 已提交
676 677
		 */
		if (strncmp(tmpCopy, "copy ", 5) != 0)
678
			die_horribly(AH, modulename,
679
						 "invalid COPY statement -- could not find \"copy\" in string \"%s\"\n", tmpCopy);
P
Philip Warner 已提交
680 681 682 683

		pos1 = 5;
		for (pos1 = 5; pos1 < strlen(tmpCopy); pos1++)
			if (tmpCopy[pos1] != ' ')
B
Bruce Momjian 已提交
684
				break;
P
Philip Warner 已提交
685 686 687

		if (tmpCopy[pos1] == '"')
			pos1 += 2;
B
Bruce Momjian 已提交
688

689
		pos1 += strlen(te->tag);
P
Philip Warner 已提交
690

B
Bruce Momjian 已提交
691
		for (pos2 = pos1; pos2 < strlen(tmpCopy); pos2++)
P
Philip Warner 已提交
692 693 694 695
			if (strncmp(&tmpCopy[pos2], "from stdin", 10) == 0)
				break;

		if (pos2 >= strlen(tmpCopy))
696
			die_horribly(AH, modulename,
697
						 "invalid COPY statement -- could not find \"from stdin\" in string \"%s\" starting at position %lu\n",
P
Peter Eisentraut 已提交
698
						 tmpCopy, (unsigned long) pos1);
P
Philip Warner 已提交
699

B
Bruce Momjian 已提交
700 701
		ahwrite(tmpCopy, 1, pos2, AH);	/* 'copy "table" [with oids]' */
		ahprintf(AH, " from '$$PATH$$/%s' %s", tctx->filename, &tmpCopy[pos2 + 10]);
P
Philip Warner 已提交
702 703 704 705 706 707 708 709 710 711

		return;
	}

	if (strcmp(te->desc, "BLOBS") == 0)
		_LoadBlobs(AH, ropt);
	else
		_PrintFileData(AH, tctx->filename, ropt);
}

B
Bruce Momjian 已提交
712 713
static void
_LoadBlobs(ArchiveHandle *AH, RestoreOptions *ropt)
P
Philip Warner 已提交
714
{
715
	Oid			oid;
B
Bruce Momjian 已提交
716 717
	lclContext *ctx = (lclContext *) AH->formatData;
	TAR_MEMBER *th;
P
Peter Eisentraut 已提交
718
	size_t		cnt;
719
	bool		foundBlob = false;
B
Bruce Momjian 已提交
720
	char		buf[4096];
P
Philip Warner 已提交
721

722 723
	StartRestoreBlobs(AH);

724
	th = tarOpen(AH, NULL, 'r');	/* Open next file */
P
Philip Warner 已提交
725 726 727 728
	while (th != NULL)
	{
		ctx->FH = th;

729
		if (strncmp(th->targetFile, "blob_", 5) == 0)
P
Philip Warner 已提交
730
		{
731 732 733 734
			oid = atooid(&th->targetFile[5]);
			if (oid != 0)
			{
				ahlog(AH, 1, "restoring large object OID %u\n", oid);
P
Philip Warner 已提交
735

736
				StartRestoreBlob(AH, oid, ropt->dropSchema);
P
Philip Warner 已提交
737

738 739 740 741 742 743
				while ((cnt = tarRead(buf, 4095, th)) > 0)
				{
					buf[cnt] = '\0';
					ahwrite(buf, 1, cnt, AH);
				}
				EndRestoreBlob(AH, oid);
744
				foundBlob = true;
P
Philip Warner 已提交
745
			}
746 747 748 749 750
			tarClose(AH, th);
		}
		else
		{
			tarClose(AH, th);
B
Bruce Momjian 已提交
751

752
			/*
B
Bruce Momjian 已提交
753 754 755 756
			 * Once we have found the first blob, stop at the first non-blob
			 * entry (which will be 'blobs.toc').  This coding would eat all
			 * the rest of the archive if there are no blobs ... but this
			 * function shouldn't be called at all in that case.
757 758 759
			 */
			if (foundBlob)
				break;
P
Philip Warner 已提交
760 761 762 763
		}

		th = tarOpen(AH, NULL, 'r');
	}
764
	EndRestoreBlobs(AH);
P
Philip Warner 已提交
765 766 767
}


B
Bruce Momjian 已提交
768 769
static int
_WriteByte(ArchiveHandle *AH, const int i)
P
Philip Warner 已提交
770
{
B
Bruce Momjian 已提交
771 772 773
	lclContext *ctx = (lclContext *) AH->formatData;
	int			res;
	char		b = i;			/* Avoid endian problems */
P
Philip Warner 已提交
774

B
Bruce Momjian 已提交
775 776
	res = tarWrite(&b, 1, ctx->FH);
	if (res != EOF)
P
Philip Warner 已提交
777
		ctx->filePos += res;
B
Bruce Momjian 已提交
778
	return res;
P
Philip Warner 已提交
779 780
}

B
Bruce Momjian 已提交
781 782
static int
_ReadByte(ArchiveHandle *AH)
P
Philip Warner 已提交
783
{
B
Bruce Momjian 已提交
784
	lclContext *ctx = (lclContext *) AH->formatData;
785 786
	size_t		res;
	unsigned char c;
P
Philip Warner 已提交
787

B
Bruce Momjian 已提交
788
	res = tarRead(&c, 1, ctx->FH);
789 790 791
	if (res != 1)
		die_horribly(AH, modulename, "unexpected end of file\n");
	ctx->filePos += 1;
B
Bruce Momjian 已提交
792
	return c;
P
Philip Warner 已提交
793 794
}

P
Peter Eisentraut 已提交
795 796
static size_t
_WriteBuf(ArchiveHandle *AH, const void *buf, size_t len)
P
Philip Warner 已提交
797
{
B
Bruce Momjian 已提交
798
	lclContext *ctx = (lclContext *) AH->formatData;
P
Peter Eisentraut 已提交
799
	size_t		res;
P
Philip Warner 已提交
800

801
	res = tarWrite(buf, len, ctx->FH);
B
Bruce Momjian 已提交
802 803
	ctx->filePos += res;
	return res;
P
Philip Warner 已提交
804 805
}

P
Peter Eisentraut 已提交
806 807
static size_t
_ReadBuf(ArchiveHandle *AH, void *buf, size_t len)
P
Philip Warner 已提交
808
{
B
Bruce Momjian 已提交
809
	lclContext *ctx = (lclContext *) AH->formatData;
P
Peter Eisentraut 已提交
810
	size_t		res;
P
Philip Warner 已提交
811

B
Bruce Momjian 已提交
812 813 814
	res = tarRead(buf, len, ctx->FH);
	ctx->filePos += res;
	return res;
P
Philip Warner 已提交
815 816
}

B
Bruce Momjian 已提交
817 818
static void
_CloseArchive(ArchiveHandle *AH)
P
Philip Warner 已提交
819
{
B
Bruce Momjian 已提交
820 821 822 823 824
	lclContext *ctx = (lclContext *) AH->formatData;
	TAR_MEMBER *th;
	RestoreOptions *ropt;
	int			savVerbose,
				i;
P
Philip Warner 已提交
825

B
Bruce Momjian 已提交
826 827
	if (AH->mode == archModeWrite)
	{
P
Philip Warner 已提交
828 829 830 831 832 833 834
		/*
		 * Write the Header & TOC to the archive FIRST
		 */
		th = tarOpen(AH, "toc.dat", 'w');
		ctx->FH = th;
		WriteHead(AH);
		WriteToc(AH);
B
Bruce Momjian 已提交
835
		tarClose(AH, th);		/* Not needed any more */
P
Philip Warner 已提交
836 837 838 839 840 841

		/*
		 * Now send the data (tables & blobs)
		 */
		WriteDataChunks(AH);

B
Bruce Momjian 已提交
842
		/*
B
Bruce Momjian 已提交
843 844
		 * Now this format wants to append a script which does a full restore
		 * if the files have been extracted.
P
Philip Warner 已提交
845 846 847
		 */
		th = tarOpen(AH, "restore.sql", 'w');
		tarPrintf(AH, th, "create temporary table pgdump_restore_path(p text);\n");
B
Bruce Momjian 已提交
848 849 850
		tarPrintf(AH, th, "--\n"
				  "-- NOTE:\n"
				  "--\n"
B
Bruce Momjian 已提交
851 852
				  "-- File paths need to be edited. Search for $$PATH$$ and\n"
				  "-- replace it with the path to the directory containing\n"
B
Bruce Momjian 已提交
853 854 855 856 857
				  "-- the extracted data files.\n"
				  "--\n"
				  "-- Edit the following to match the path where the\n"
				  "-- tar archive has been extracted.\n"
				  "--\n");
P
Philip Warner 已提交
858 859 860
		tarPrintf(AH, th, "insert into pgdump_restore_path values('/tmp');\n\n");

		AH->CustomOutPtr = _scriptOut;
B
Bruce Momjian 已提交
861

P
Philip Warner 已提交
862 863 864 865 866 867
		ctx->isSpecialScript = 1;
		ctx->scriptTH = th;

		ropt = NewRestoreOptions();
		ropt->dropSchema = 1;
		ropt->compression = 0;
868
		ropt->superuser = NULL;
869
		ropt->suppressDumpWarnings = true;
P
Philip Warner 已提交
870 871 872 873

		savVerbose = AH->public.verbose;
		AH->public.verbose = 0;

B
Bruce Momjian 已提交
874
		RestoreArchive((Archive *) AH, ropt);
P
Philip Warner 已提交
875 876 877 878

		AH->public.verbose = savVerbose;

		tarClose(AH, th);
879 880

		/* Add a block of NULLs since it's de-rigeur. */
B
Bruce Momjian 已提交
881
		for (i = 0; i < 512; i++)
882
		{
883
			if (fputc(0, ctx->tarFH) == EOF)
884
				die_horribly(AH, modulename,
B
Bruce Momjian 已提交
885
					   "could not write null block at end of tar archive\n");
886
		}
B
Bruce Momjian 已提交
887
	}
P
Philip Warner 已提交
888

B
Bruce Momjian 已提交
889
	AH->FH = NULL;
P
Philip Warner 已提交
890 891
}

P
Peter Eisentraut 已提交
892 893
static size_t
_scriptOut(ArchiveHandle *AH, const void *buf, size_t len)
P
Philip Warner 已提交
894
{
B
Bruce Momjian 已提交
895 896
	lclContext *ctx = (lclContext *) AH->formatData;

P
Philip Warner 已提交
897 898 899 900 901 902 903 904
	return tarWrite(buf, len, ctx->scriptTH);
}

/*
 * BLOB support
 */

/*
B
Bruce Momjian 已提交
905
 * Called by the archiver when starting to save all BLOB DATA (not schema).
P
Philip Warner 已提交
906
 * This routine should save whatever format-specific information is needed
B
Bruce Momjian 已提交
907
 * to read the BLOBs back into memory.
P
Philip Warner 已提交
908 909 910 911 912 913
 *
 * It is called just prior to the dumper's DataDumper routine.
 *
 * Optional, but strongly recommended.
 *
 */
B
Bruce Momjian 已提交
914 915
static void
_StartBlobs(ArchiveHandle *AH, TocEntry *te)
P
Philip Warner 已提交
916
{
B
Bruce Momjian 已提交
917 918
	lclContext *ctx = (lclContext *) AH->formatData;
	char		fname[K_STD_BUF_SIZE];
P
Philip Warner 已提交
919 920 921 922 923 924 925 926 927 928 929 930

	sprintf(fname, "blobs.toc");
	ctx->blobToc = tarOpen(AH, fname, 'w');
}

/*
 * Called by the archiver when the dumper calls StartBlob.
 *
 * Mandatory.
 *
 * Must save the passed OID for retrieval at restore-time.
 */
B
Bruce Momjian 已提交
931
static void
932
_StartBlob(ArchiveHandle *AH, TocEntry *te, Oid oid)
P
Philip Warner 已提交
933
{
B
Bruce Momjian 已提交
934 935 936 937
	lclContext *ctx = (lclContext *) AH->formatData;
	lclTocEntry *tctx = (lclTocEntry *) te->formatData;
	char		fname[255];
	char	   *sfx;
P
Philip Warner 已提交
938

B
Bruce Momjian 已提交
939
	if (oid == 0)
940
		die_horribly(AH, modulename, "invalid OID for large object (%u)\n", oid);
P
Philip Warner 已提交
941 942 943 944 945 946

	if (AH->compression != 0)
		sfx = ".gz";
	else
		sfx = "";

947
	sprintf(fname, "blob_%u.dat%s", oid, sfx);
P
Philip Warner 已提交
948

949
	tarPrintf(AH, ctx->blobToc, "%u %s\n", oid, fname);
P
Philip Warner 已提交
950 951 952 953 954 955 956 957 958 959

	tctx->TH = tarOpen(AH, fname, 'w');
}

/*
 * Called by the archiver when the dumper calls EndBlob.
 *
 * Optional.
 *
 */
B
Bruce Momjian 已提交
960
static void
961
_EndBlob(ArchiveHandle *AH, TocEntry *te, Oid oid)
P
Philip Warner 已提交
962
{
B
Bruce Momjian 已提交
963
	lclTocEntry *tctx = (lclTocEntry *) te->formatData;
P
Philip Warner 已提交
964 965 966 967 968

	tarClose(AH, tctx->TH);
}

/*
B
Bruce Momjian 已提交
969
 * Called by the archiver when finishing saving all BLOB DATA.
P
Philip Warner 已提交
970 971 972 973
 *
 * Optional.
 *
 */
B
Bruce Momjian 已提交
974 975
static void
_EndBlobs(ArchiveHandle *AH, TocEntry *te)
P
Philip Warner 已提交
976
{
B
Bruce Momjian 已提交
977 978
	lclContext *ctx = (lclContext *) AH->formatData;

P
Philip Warner 已提交
979
	/* Write out a fake zero OID to mark end-of-blobs. */
B
Bruce Momjian 已提交
980
	/* WriteInt(AH, 0); */
P
Philip Warner 已提交
981 982 983 984 985 986 987 988 989 990 991

	tarClose(AH, ctx->blobToc);
}



/*------------
 * TAR Support
 *------------
 */

B
Bruce Momjian 已提交
992 993
static int
tarPrintf(ArchiveHandle *AH, TAR_MEMBER *th, const char *fmt,...)
P
Philip Warner 已提交
994
{
B
Bruce Momjian 已提交
995
	char	   *p = NULL;
P
Philip Warner 已提交
996
	va_list		ap;
P
Peter Eisentraut 已提交
997
	size_t		bSize = strlen(fmt) + 256;		/* Should be enough */
P
Philip Warner 已提交
998 999
	int			cnt = -1;

B
Bruce Momjian 已提交
1000
	/*
B
Bruce Momjian 已提交
1001 1002
	 * This is paranoid: deal with the possibility that vsnprintf is willing
	 * to ignore trailing null
B
Bruce Momjian 已提交
1003 1004 1005
	 */

	/*
B
Bruce Momjian 已提交
1006 1007
	 * or returns > 0 even if string does not fit. It may be the case that it
	 * returns cnt = bufsize
B
Bruce Momjian 已提交
1008 1009
	 */
	while (cnt < 0 || cnt >= (bSize - 1))
1010
	{
B
Bruce Momjian 已提交
1011 1012
		if (p != NULL)
			free(p);
P
Philip Warner 已提交
1013
		bSize *= 2;
1014
		p = (char *) pg_malloc(bSize);
1015
		va_start(ap, fmt);
P
Philip Warner 已提交
1016
		cnt = vsnprintf(p, bSize, fmt, ap);
1017
		va_end(ap);
P
Philip Warner 已提交
1018 1019 1020 1021 1022 1023
	}
	cnt = tarWrite(p, cnt, th);
	free(p);
	return cnt;
}

B
Bruce Momjian 已提交
1024 1025
static int
_tarChecksum(char *header)
P
Philip Warner 已提交
1026
{
B
Bruce Momjian 已提交
1027 1028 1029
	int			i,
				sum;

P
Philip Warner 已提交
1030
	sum = 0;
B
Bruce Momjian 已提交
1031
	for (i = 0; i < 512; i++)
P
Philip Warner 已提交
1032 1033
		if (i < 148 || i >= 156)
			sum += 0xFF & header[i];
B
Bruce Momjian 已提交
1034
	return sum + 256;			/* Assume 8 blanks in checksum field */
P
Philip Warner 已提交
1035 1036
}

1037
bool
B
Bruce Momjian 已提交
1038
isValidTarHeader(char *header)
P
Philip Warner 已提交
1039
{
B
Bruce Momjian 已提交
1040 1041
	int			sum;
	int			chk = _tarChecksum(header);
P
Philip Warner 已提交
1042 1043 1044

	sscanf(&header[148], "%8o", &sum);

1045 1046 1047 1048 1049 1050 1051 1052 1053 1054 1055
	if (sum != chk)
		return false;

	/* POSIX format */
	if (strncmp(&header[257], "ustar00", 7) == 0)
		return true;
	/* older format */
	if (strncmp(&header[257], "ustar  ", 7) == 0)
		return true;

	return false;
P
Philip Warner 已提交
1056 1057 1058
}

/* Given the member, write the TAR header & copy the file */
B
Bruce Momjian 已提交
1059 1060
static void
_tarAddFile(ArchiveHandle *AH, TAR_MEMBER *th)
P
Philip Warner 已提交
1061
{
B
Bruce Momjian 已提交
1062
	lclContext *ctx = (lclContext *) AH->formatData;
1063
	FILE	   *tmp = th->tmpFH;	/* Grab it for convenience */
P
Philip Warner 已提交
1064
	char		buf[32768];
P
Peter Eisentraut 已提交
1065
	size_t		cnt;
1066
	pgoff_t		len = 0;
P
Peter Eisentraut 已提交
1067 1068
	size_t		res;
	size_t		i,
B
Bruce Momjian 已提交
1069
				pad;
P
Philip Warner 已提交
1070 1071 1072 1073

	/*
	 * Find file len & go back to start.
	 */
P
Peter Eisentraut 已提交
1074 1075
	fseeko(tmp, 0, SEEK_END);
	th->fileLen = ftello(tmp);
1076
	fseeko(tmp, 0, SEEK_SET);
B
Bruce Momjian 已提交
1077

1078
	/*
1079 1080
	 * Some compilers will throw a warning knowing this test can never be true
	 * because pgoff_t can't exceed the compared maximum on their platform.
1081
	 */
1082 1083
	if (th->fileLen > MAX_TAR_MEMBER_FILELEN)
		die_horribly(AH, modulename, "archive member too large for tar format\n");
P
Philip Warner 已提交
1084 1085 1086

	_tarWriteHeader(th);

1087
	while ((cnt = fread(buf, 1, sizeof(buf), tmp)) > 0)
P
Philip Warner 已提交
1088
	{
1089
		res = fwrite(buf, 1, cnt, th->tarFH);
B
Bruce Momjian 已提交
1090
		if (res != cnt)
P
Peter Eisentraut 已提交
1091
			die_horribly(AH, modulename,
1092 1093
						 "could not write to output file: %s\n",
						 strerror(errno));
1094
		len += res;
P
Philip Warner 已提交
1095 1096
	}

B
Bruce Momjian 已提交
1097
	if (fclose(tmp) != 0)		/* This *should* delete it... */
1098 1099
		die_horribly(AH, modulename, "could not close temporary file: %s\n",
					 strerror(errno));
P
Philip Warner 已提交
1100 1101

	if (len != th->fileLen)
1102
	{
1103 1104
		char		buf1[32],
					buf2[32];
B
Bruce Momjian 已提交
1105

1106
		snprintf(buf1, sizeof(buf1), INT64_FORMAT, (int64) len);
1107
		snprintf(buf2, sizeof(buf2), INT64_FORMAT, (int64) th->fileLen);
1108 1109 1110
		die_horribly(AH, modulename, "actual file length (%s) does not match expected (%s)\n",
					 buf1, buf2);
	}
P
Philip Warner 已提交
1111 1112

	pad = ((len + 511) & ~511) - len;
B
Bruce Momjian 已提交
1113
	for (i = 0; i < pad; i++)
1114
	{
B
Bruce Momjian 已提交
1115
		if (fputc('\0', th->tarFH) == EOF)
1116
			die_horribly(AH, modulename, "could not output padding at end of tar member\n");
B
Bruce Momjian 已提交
1117
	}
P
Philip Warner 已提交
1118 1119 1120 1121 1122

	ctx->tarFHpos += len + pad;
}

/* Locate the file in the archive, read header and position to data */
B
Bruce Momjian 已提交
1123 1124
static TAR_MEMBER *
_tarPositionTo(ArchiveHandle *AH, const char *filename)
P
Philip Warner 已提交
1125
{
B
Bruce Momjian 已提交
1126
	lclContext *ctx = (lclContext *) AH->formatData;
1127
	TAR_MEMBER *th = pg_calloc(1, sizeof(TAR_MEMBER));
B
Bruce Momjian 已提交
1128 1129
	char		c;
	char		header[512];
P
Peter Eisentraut 已提交
1130
	size_t		i,
B
Bruce Momjian 已提交
1131
				len,
P
Peter Eisentraut 已提交
1132 1133
				blks;
	int			id;
P
Philip Warner 已提交
1134 1135 1136 1137 1138 1139

	th->AH = AH;

	/* Go to end of current file, if any */
	if (ctx->tarFHpos != 0)
	{
B
Bruce Momjian 已提交
1140 1141 1142
		char		buf1[100],
					buf2[100];

1143 1144
		snprintf(buf1, sizeof(buf1), INT64_FORMAT, (int64) ctx->tarFHpos);
		snprintf(buf2, sizeof(buf2), INT64_FORMAT, (int64) ctx->tarNextMember);
1145 1146
		ahlog(AH, 4, "moving from position %s to next member at file position %s\n",
			  buf1, buf2);
P
Philip Warner 已提交
1147 1148 1149 1150 1151

		while (ctx->tarFHpos < ctx->tarNextMember)
			_tarReadRaw(AH, &c, 1, NULL, ctx->tarFH);
	}

1152
	{
B
Bruce Momjian 已提交
1153 1154
		char		buf[100];

1155
		snprintf(buf, sizeof(buf), INT64_FORMAT, (int64) ctx->tarFHpos);
1156 1157
		ahlog(AH, 4, "now at file position %s\n", buf);
	}
P
Philip Warner 已提交
1158

1159
	/* We are at the start of the file, or at the next member */
P
Philip Warner 已提交
1160 1161 1162 1163 1164

	/* Get the header */
	if (!_tarGetHeader(AH, th))
	{
		if (filename)
1165
			die_horribly(AH, modulename, "could not find header for file \"%s\" in tar archive\n", filename);
B
Bruce Momjian 已提交
1166
		else
1167
		{
B
Bruce Momjian 已提交
1168
			/*
1169
			 * We're just scanning the archive for the next file, so return
B
Bruce Momjian 已提交
1170 1171
			 * null
			 */
P
Philip Warner 已提交
1172 1173 1174 1175 1176
			free(th);
			return NULL;
		}
	}

B
Bruce Momjian 已提交
1177
	while (filename != NULL && strcmp(th->targetFile, filename) != 0)
P
Philip Warner 已提交
1178
	{
1179
		ahlog(AH, 4, "skipping tar member %s\n", th->targetFile);
P
Philip Warner 已提交
1180 1181

		id = atoi(th->targetFile);
1182
		if ((TocIDRequired(AH, id, AH->ropt) & REQ_DATA) != 0)
1183
			die_horribly(AH, modulename, "restoring data out of order is not supported in this archive format: "
B
Bruce Momjian 已提交
1184
						 "\"%s\" is required, but comes before \"%s\" in the archive file.\n",
1185
						 th->targetFile, filename);
P
Philip Warner 已提交
1186 1187

		/* Header doesn't match, so read to next header */
B
Bruce Momjian 已提交
1188 1189
		len = ((th->fileLen + 511) & ~511);		/* Padded length */
		blks = len >> 9;		/* # of 512 byte blocks */
P
Philip Warner 已提交
1190

B
Bruce Momjian 已提交
1191
		for (i = 0; i < blks; i++)
P
Philip Warner 已提交
1192 1193 1194
			_tarReadRaw(AH, &header[0], 512, NULL, ctx->tarFH);

		if (!_tarGetHeader(AH, th))
1195
			die_horribly(AH, modulename, "could not find header for file \"%s\" in tar archive\n", filename);
P
Philip Warner 已提交
1196 1197 1198 1199 1200 1201 1202 1203 1204
	}

	ctx->tarNextMember = ctx->tarFHpos + ((th->fileLen + 511) & ~511);
	th->pos = 0;

	return th;
}

/* Read & verify a header */
B
Bruce Momjian 已提交
1205 1206
static int
_tarGetHeader(ArchiveHandle *AH, TAR_MEMBER *th)
P
Philip Warner 已提交
1207
{
B
Bruce Momjian 已提交
1208 1209
	lclContext *ctx = (lclContext *) AH->formatData;
	char		h[512];
1210
	char		tag[100];
B
Bruce Momjian 已提交
1211 1212
	int			sum,
				chk;
P
Peter Eisentraut 已提交
1213
	size_t		len;
B
Bruce Momjian 已提交
1214
	unsigned long ullen;
1215
	pgoff_t		hPos;
B
Bruce Momjian 已提交
1216
	bool		gotBlock = false;
P
Philip Warner 已提交
1217

1218 1219
	while (!gotBlock)
	{
1220
#if 0
P
Peter Eisentraut 已提交
1221
		if (ftello(ctx->tarFH) != ctx->tarFHpos)
1222
		{
B
Bruce Momjian 已提交
1223 1224 1225
			char		buf1[100],
						buf2[100];

1226 1227
			snprintf(buf1, sizeof(buf1), INT64_FORMAT, (int64) ftello(ctx->tarFH));
			snprintf(buf2, sizeof(buf2), INT64_FORMAT, (int64) ftello(ctx->tarFHpos));
1228
			die_horribly(AH, modulename,
B
Bruce Momjian 已提交
1229
			  "mismatch in actual vs. predicted file position (%s vs. %s)\n",
1230 1231
						 buf1, buf2);
		}
1232
#endif
P
Philip Warner 已提交
1233

1234 1235
		/* Save the pos for reporting purposes */
		hPos = ctx->tarFHpos;
P
Philip Warner 已提交
1236

1237
		/* Read a 512 byte block, return EOF, exit if short */
1238
		len = _tarReadRaw(AH, h, 512, NULL, ctx->tarFH);
B
Bruce Momjian 已提交
1239
		if (len == 0)			/* EOF */
1240 1241 1242
			return 0;

		if (len != 512)
P
Peter Eisentraut 已提交
1243
			die_horribly(AH, modulename,
P
Peter Eisentraut 已提交
1244 1245 1246
						 ngettext("incomplete tar header found (%lu byte)\n",
								  "incomplete tar header found (%lu bytes)\n",
								  len),
P
Peter Eisentraut 已提交
1247
						 (unsigned long) len);
1248 1249

		/* Calc checksum */
1250 1251
		chk = _tarChecksum(h);
		sscanf(&h[148], "%8o", &sum);
P
Philip Warner 已提交
1252

1253
		/*
B
Bruce Momjian 已提交
1254 1255
		 * If the checksum failed, see if it is a null block. If so, silently
		 * continue to the next block.
1256
		 */
B
Bruce Momjian 已提交
1257
		if (chk == sum)
1258
			gotBlock = true;
B
Bruce Momjian 已提交
1259 1260
		else
		{
1261 1262
			int			i;

B
Bruce Momjian 已提交
1263
			for (i = 0; i < 512; i++)
1264
			{
1265
				if (h[i] != 0)
1266
				{
B
Bruce Momjian 已提交
1267
					gotBlock = true;
1268 1269 1270 1271 1272
					break;
				}
			}
		}
	}
P
Philip Warner 已提交
1273

1274 1275 1276
	sscanf(&h[0], "%99s", tag);
	sscanf(&h[124], "%12lo", &ullen);
	len = (size_t) ullen;
P
Philip Warner 已提交
1277

1278
	{
B
Bruce Momjian 已提交
1279 1280
		char		buf[100];

1281
		snprintf(buf, sizeof(buf), INT64_FORMAT, (int64) hPos);
1282
		ahlog(AH, 3, "TOC Entry %s at %s (length %lu, checksum %d)\n",
1283
			  tag, buf, (unsigned long) len, sum);
1284
	}
P
Philip Warner 已提交
1285 1286

	if (chk != sum)
1287
	{
B
Bruce Momjian 已提交
1288 1289
		char		buf[100];

1290
		snprintf(buf, sizeof(buf), INT64_FORMAT, (int64) ftello(ctx->tarFH));
1291 1292
		die_horribly(AH, modulename,
					 "corrupt tar header found in %s "
1293
					 "(expected %d, computed %d) file position %s\n",
1294
					 tag, sum, chk, buf);
1295
	}
P
Philip Warner 已提交
1296

1297
	th->targetFile = pg_strdup(tag);
P
Philip Warner 已提交
1298 1299 1300 1301 1302
	th->fileLen = len;

	return 1;
}

1303 1304 1305 1306 1307

/*
 * Utility routine to print possibly larger than 32 bit integers in a
 * portable fashion.  Filled with zeros.
 */
B
Bruce Momjian 已提交
1308 1309
static void
print_val(char *s, uint64 val, unsigned int base, size_t len)
1310
{
B
Bruce Momjian 已提交
1311 1312 1313 1314 1315 1316 1317 1318 1319
	int			i;

	for (i = len; i > 0; i--)
	{
		int			digit = val % base;

		s[i - 1] = '0' + digit;
		val = val / base;
	}
1320 1321 1322
}


B
Bruce Momjian 已提交
1323 1324
static void
_tarWriteHeader(TAR_MEMBER *th)
P
Philip Warner 已提交
1325 1326 1327 1328 1329
{
	char		h[512];
	int			lastSum = 0;
	int			sum;

1330
	memset(h, 0, sizeof(h));
P
Philip Warner 已提交
1331 1332 1333 1334 1335 1336 1337 1338

	/* Name 100 */
	sprintf(&h[0], "%.99s", th->targetFile);

	/* Mode 8 */
	sprintf(&h[100], "100600 ");

	/* User ID 8 */
1339
	sprintf(&h[108], "004000 ");
P
Philip Warner 已提交
1340 1341

	/* Group 8 */
1342
	sprintf(&h[116], "002000 ");
P
Philip Warner 已提交
1343

1344 1345 1346
	/* File size 12 - 11 digits, 1 space, no NUL */
	print_val(&h[124], th->fileLen, 8, 11);
	sprintf(&h[135], " ");
P
Philip Warner 已提交
1347 1348

	/* Mod Time 12 */
1349
	sprintf(&h[136], "%011o ", (int) time(NULL));
P
Philip Warner 已提交
1350 1351

	/* Checksum 8 */
1352
	sprintf(&h[148], "%06o ", lastSum);
P
Philip Warner 已提交
1353

1354
	/* Type - regular file */
P
Philip Warner 已提交
1355
	sprintf(&h[156], "0");
P
Philip Warner 已提交
1356

1357
	/* Link tag 100 (NULL) */
P
Philip Warner 已提交
1358

1359 1360
	/* Magic 6 + Version 2 */
	sprintf(&h[257], "ustar00");
P
Philip Warner 已提交
1361

1362
#if 0
P
Philip Warner 已提交
1363
	/* User 32 */
B
Bruce Momjian 已提交
1364 1365
	sprintf(&h[265], "%.31s", "");		/* How do I get username reliably? Do
										 * I need to? */
P
Philip Warner 已提交
1366 1367

	/* Group 32 */
B
Bruce Momjian 已提交
1368 1369
	sprintf(&h[297], "%.31s", "");		/* How do I get group reliably? Do I
										 * need to? */
P
Philip Warner 已提交
1370 1371

	/* Maj Dev 8 */
1372
	sprintf(&h[329], "%6o ", 0);
P
Philip Warner 已提交
1373

1374 1375 1376
	/* Min Dev 8 */
	sprintf(&h[337], "%6o ", 0);
#endif
P
Philip Warner 已提交
1377

B
Bruce Momjian 已提交
1378
	while ((sum = _tarChecksum(h)) != lastSum)
P
Philip Warner 已提交
1379
	{
1380
		sprintf(&h[148], "%06o ", sum);
P
Philip Warner 已提交
1381 1382 1383
		lastSum = sum;
	}

B
Bruce Momjian 已提交
1384
	if (fwrite(h, 1, 512, th->tarFH) != 512)
1385
		die_horribly(th->AH, modulename, "could not write to output file: %s\n", strerror(errno));
P
Philip Warner 已提交
1386
}