/*-------------------------------------------------------------------------
 *
 * pg_backup_archiver.c
 *
 *	Private implementation of the archiver routines.
 *
 *	See the headers to pg_restore for more details.
 *
 * Copyright (c) 2000, Philip Warner
 *	Rights are granted to use this software in any way so long
 *	as this notice is not removed.
 *
 *	The author is not responsible for loss or damages that may
 *	result from its use.
 *
 *
 * IDENTIFICATION
 *		src/bin/pg_dump/pg_backup_archiver.c
 *
 *-------------------------------------------------------------------------
 */

23
#include "pg_backup_db.h"
24
#include "pg_backup_utils.h"
A
Andrew Dunstan 已提交
25
#include "parallel.h"
26

27
#include <ctype.h>
A
Andrew Dunstan 已提交
28
#include <fcntl.h>
29
#include <unistd.h>
30
#include <sys/stat.h>
31 32
#include <sys/types.h>
#include <sys/wait.h>
B
Bruce Momjian 已提交
33

34 35 36 37
#ifdef WIN32
#include <io.h>
#endif

38
#include "libpq/libpq-fs.h"
39

40 41 42
#define TEXT_DUMP_HEADER "--\n-- PostgreSQL database dump\n--\n\n"
#define TEXT_DUMPALL_HEADER "--\n-- PostgreSQL database cluster dump\n--\n\n"

43 44 45 46 47 48 49
/* state needed to save/restore an archive's output target */
typedef struct _outputContext
{
	void	   *OF;
	int			gzOut;
} OutputContext;

50
/* translator: this is a module name */
51
static const char *modulename = gettext_noop("archiver");
52 53


B
Bruce Momjian 已提交
54
static ArchiveHandle *_allocAH(const char *FileSpec, const ArchiveFormat fmt,
A
Andrew Dunstan 已提交
55
	 const int compression, ArchiveMode mode, SetupWorkerPtr setupWorkerPtr);
56
static void _getObjectDescription(PQExpBuffer buf, TocEntry *te,
B
Bruce Momjian 已提交
57
					  ArchiveHandle *AH);
58
static void _printTocEntry(ArchiveHandle *AH, TocEntry *te, RestoreOptions *ropt, bool isData, bool acl_pass);
59
static char *replace_line_endings(const char *str);
60
static void _doSetFixedOutputState(ArchiveHandle *AH);
61
static void _doSetSessionAuth(ArchiveHandle *AH, const char *user);
62
static void _doSetWithOids(ArchiveHandle *AH, const bool withOids);
63
static void _reconnectToDB(ArchiveHandle *AH, const char *dbname);
64 65
static void _becomeUser(ArchiveHandle *AH, const char *user);
static void _becomeOwner(ArchiveHandle *AH, TocEntry *te);
66
static void _selectOutputSchema(ArchiveHandle *AH, const char *schemaName);
67
static void _selectTablespace(ArchiveHandle *AH, const char *tablespace);
68 69
static void processEncodingEntry(ArchiveHandle *AH, TocEntry *te);
static void processStdStringsEntry(ArchiveHandle *AH, TocEntry *te);
70
static teReqs _tocEntryRequired(TocEntry *te, teSection curSection, RestoreOptions *ropt);
71
static bool _tocEntryIsACL(TocEntry *te);
B
Bruce Momjian 已提交
72 73
static void _disableTriggersIfNecessary(ArchiveHandle *AH, TocEntry *te, RestoreOptions *ropt);
static void _enableTriggersIfNecessary(ArchiveHandle *AH, TocEntry *te, RestoreOptions *ropt);
74
static void buildTocEntryArrays(ArchiveHandle *AH);
75
static void _moveBefore(ArchiveHandle *AH, TocEntry *pos, TocEntry *te);
B
Bruce Momjian 已提交
76
static int	_discoverArchiveFormat(ArchiveHandle *AH);
B
Bruce Momjian 已提交
77

78
static int	RestoringToDB(ArchiveHandle *AH);
79
static void dump_lo_buf(ArchiveHandle *AH);
80
static void dumpTimestamp(ArchiveHandle *AH, const char *msg, time_t tim);
81
static void SetOutput(ArchiveHandle *AH, const char *filename, int compression);
82 83
static OutputContext SaveOutput(ArchiveHandle *AH);
static void RestoreOutput(ArchiveHandle *AH, OutputContext savedContext);
84

85
static int restore_toc_entry(ArchiveHandle *AH, TocEntry *te,
86
				  RestoreOptions *ropt, bool is_parallel);
A
Andrew Dunstan 已提交
87 88 89 90
static void restore_toc_entries_prefork(ArchiveHandle *AH);
static void restore_toc_entries_parallel(ArchiveHandle *AH, ParallelState *pstate,
							 TocEntry *pending_list);
static void restore_toc_entries_postfork(ArchiveHandle *AH, TocEntry *pending_list);
91 92 93
static void par_list_header_init(TocEntry *l);
static void par_list_append(TocEntry *l, TocEntry *te);
static void par_list_remove(TocEntry *te);
94
static TocEntry *get_next_work_item(ArchiveHandle *AH,
95
				   TocEntry *ready_list,
A
Andrew Dunstan 已提交
96
				   ParallelState *pstate);
97
static void mark_work_done(ArchiveHandle *AH, TocEntry *ready_list,
A
Andrew Dunstan 已提交
98 99
			   int worker, int status,
			   ParallelState *pstate);
100
static void fix_dependencies(ArchiveHandle *AH);
101
static bool has_lock_conflicts(TocEntry *te1, TocEntry *te2);
102 103
static void repoint_table_dependencies(ArchiveHandle *AH);
static void identify_locking_dependencies(ArchiveHandle *AH, TocEntry *te);
104
static void reduce_dependencies(ArchiveHandle *AH, TocEntry *te,
B
Bruce Momjian 已提交
105
					TocEntry *ready_list);
106 107
static void mark_create_done(ArchiveHandle *AH, TocEntry *te);
static void inhibit_data_for_failed_table(ArchiveHandle *AH, TocEntry *te);
108

B
Bruce Momjian 已提交
109
/*
 *	Wrapper functions.
 *
 *	The objective is to make writing new formats and dumpers as simple
 *	as possible, if necessary at the expense of extra function calls etc.
 *
 */

A
Andrew Dunstan 已提交
117 118 119 120 121 122 123 124 125 126 127 128 129
/*
 * Worker setup callback used for restore.
 *
 * The dump-side worker setup needs a lot of knowledge about pg_dump
 * internals, so it is defined in pg_dump.c and passed in by the caller.
 * The restore-side setup needs almost nothing, so it lives here: it simply
 * invokes the archive handle's ReopenPtr callback.  The ropt argument is
 * not used.
 */
static void
setupRestoreWorker(Archive *AHX, RestoreOptions *ropt)
{
	ArchiveHandle *handle = (ArchiveHandle *) AHX;

	handle->ReopenPtr(handle);
}

B
Bruce Momjian 已提交
130 131 132

/* Create a new archive */
/* Public */
133
Archive *
B
Bruce Momjian 已提交
134
CreateArchive(const char *FileSpec, const ArchiveFormat fmt,
A
Andrew Dunstan 已提交
135
	 const int compression, ArchiveMode mode, SetupWorkerPtr setupDumpWorker)
136

B
Bruce Momjian 已提交
137
{
A
Andrew Dunstan 已提交
138
	ArchiveHandle *AH = _allocAH(FileSpec, fmt, compression, mode, setupDumpWorker);
B
Bruce Momjian 已提交
139 140

	return (Archive *) AH;
B
Bruce Momjian 已提交
141 142 143 144
}

/* Open an existing archive */
/* Public */
145
Archive *
B
Bruce Momjian 已提交
146
OpenArchive(const char *FileSpec, const ArchiveFormat fmt)
B
Bruce Momjian 已提交
147
{
A
Andrew Dunstan 已提交
148
	ArchiveHandle *AH = _allocAH(FileSpec, fmt, 0, archModeRead, setupRestoreWorker);
B
Bruce Momjian 已提交
149 150

	return (Archive *) AH;
B
Bruce Momjian 已提交
151 152 153
}

/* Public */
B
Bruce Momjian 已提交
154 155
void
CloseArchive(Archive *AHX)
B
Bruce Momjian 已提交
156
{
B
Bruce Momjian 已提交
157 158 159 160
	int			res = 0;
	ArchiveHandle *AH = (ArchiveHandle *) AHX;

	(*AH->ClosePtr) (AH);
B
Bruce Momjian 已提交
161

B
Bruce Momjian 已提交
162 163
	/* Close the output */
	if (AH->gzOut)
164
		res = GZCLOSE(AH->OF);
B
Bruce Momjian 已提交
165
	else if (AH->OF != stdout)
166 167 168
		res = fclose(AH->OF);

	if (res != 0)
169 170
		exit_horribly(modulename, "could not close output file: %s\n",
					  strerror(errno));
B
Bruce Momjian 已提交
171 172 173
}

/* Public */
B
Bruce Momjian 已提交
174
void
175
SetArchiveRestoreOptions(Archive *AHX, RestoreOptions *ropt)
B
Bruce Momjian 已提交
176
{
B
Bruce Momjian 已提交
177
	ArchiveHandle *AH = (ArchiveHandle *) AHX;
178 179 180 181 182 183 184 185 186 187
	TocEntry   *te;
	teSection	curSection;

	/* Save options for later access */
	AH->ropt = ropt;

	/* Decide which TOC entries will be dumped/restored, and mark them */
	curSection = SECTION_PRE_DATA;
	for (te = AH->toc->next; te != AH->toc; te = te->next)
	{
188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220
		/*
		 * When writing an archive, we also take this opportunity to check
		 * that we have generated the entries in a sane order that respects
		 * the section divisions.  When reading, don't complain, since buggy
		 * old versions of pg_dump might generate out-of-order archives.
		 */
		if (AH->mode != archModeRead)
		{
			switch (te->section)
			{
				case SECTION_NONE:
					/* ok to be anywhere */
					break;
				case SECTION_PRE_DATA:
					if (curSection != SECTION_PRE_DATA)
						write_msg(modulename,
								  "WARNING: archive items not in correct section order\n");
					break;
				case SECTION_DATA:
					if (curSection == SECTION_POST_DATA)
						write_msg(modulename,
								  "WARNING: archive items not in correct section order\n");
					break;
				case SECTION_POST_DATA:
					/* ok no matter which section we were in */
					break;
				default:
					exit_horribly(modulename, "unexpected section code %d\n",
								  (int) te->section);
					break;
			}
		}

221 222
		if (te->section != SECTION_NONE)
			curSection = te->section;
223

224 225 226 227 228 229 230 231 232 233
		te->reqs = _tocEntryRequired(te, curSection, ropt);
	}
}

/*
 * Restore an archive, using the options previously stored in the handle
 * (AH->ropt, see SetArchiveRestoreOptions).
 *
 * Public.  In order, this routine:
 *	- rejects incompatible options and unsupported parallel/compression
 *	  situations;
 *	- connects to the target database when ropt->useDB is set;
 *	- detects an implied data-only restore;
 *	- redirects output if a filename or compression level was requested;
 *	- emits the dump header, optional BEGIN, and fixed session settings;
 *	- emits DROP statements (in reverse TOC order) when requested;
 *	- restores all TOC entries, serially or via the parallel machinery;
 *	- makes a second pass over the TOC for ownership and ACLs;
 *	- emits optional COMMIT and the trailer, then restores the previous
 *	  output target and disconnects.
 *
 * Fatal conditions are reported through exit_horribly().
 */
void
RestoreArchive(Archive *AHX)
{
	ArchiveHandle *AH = (ArchiveHandle *) AHX;
	RestoreOptions *ropt = AH->ropt;
	bool		parallel_mode;
	TocEntry   *te;
	OutputContext sav;

	AH->stage = STAGE_INITIALIZING;

	/*
	 * Check for nonsensical option combinations.
	 *
	 * -C is not compatible with -1, because we can't create a database inside
	 * a transaction block.
	 */
	if (ropt->createDB && ropt->single_txn)
		exit_horribly(modulename, "-C and -1 are incompatible options\n");

	/*
	 * If we're going to do parallel restore, there are some restrictions.
	 */
	parallel_mode = (AH->public.numWorkers > 1 && ropt->useDB);
	if (parallel_mode)
	{
		/* We haven't got round to making this work for all archive formats */
		if (AH->ClonePtr == NULL || AH->ReopenPtr == NULL)
			exit_horribly(modulename, "parallel restore is not supported with this archive file format\n");

		/* Doesn't work if the archive represents dependencies as OIDs */
		if (AH->version < K_VERS_1_8)
			exit_horribly(modulename, "parallel restore is not supported with archives made by pre-8.0 pg_dump\n");

		/*
		 * It's also not gonna work if we can't reopen the input file, so
		 * let's try that immediately.
		 */
		(AH->ReopenPtr) (AH);
	}

	/*
	 * Make sure we won't need (de)compression we haven't got
	 */
#ifndef HAVE_LIBZ
	if (AH->compression != 0 && AH->PrintTocDataPtr != NULL)
	{
		for (te = AH->toc->next; te != AH->toc; te = te->next)
		{
			if (te->hadDumper && (te->reqs & REQ_DATA) != 0)
				exit_horribly(modulename, "cannot restore from compressed archive (compression not supported in this installation)\n");
		}
	}
#endif

	/*
	 * Prepare index arrays, so we can assume we have them throughout restore.
	 * It's possible we already did this, though.
	 */
	if (AH->tocsByDumpId == NULL)
		buildTocEntryArrays(AH);

	/*
	 * If we're using a DB connection, then connect it.
	 */
	if (ropt->useDB)
	{
		ahlog(AH, 1, "connecting to database for restore\n");
		if (AH->version < K_VERS_1_3)
			exit_horribly(modulename, "direct database connections are not supported in pre-1.3 archives\n");

		/*
		 * XXX Should get this from the archive.
		 *
		 * The lower bound is written in decimal on purpose: a leading zero
		 * (070100) would make it an octal constant with value 28736 rather
		 * than the intended 70100 (server version 7.1.0).
		 */
		AHX->minRemoteVersion = 70100;
		AHX->maxRemoteVersion = 999999;

		ConnectDatabase(AHX, ropt->dbname,
						ropt->pghost, ropt->pgport, ropt->username,
						ropt->promptPassword);

		/*
		 * If we're talking to the DB directly, don't send comments since they
		 * obscure SQL when displaying errors
		 */
		AH->noTocComments = 1;
	}

	/*
	 * Work out if we have an implied data-only restore. This can happen if
	 * the dump was data only or if the user has used a toc list to exclude
	 * all of the schema data. All we do is look for schema entries - if none
	 * are found then we set the dataOnly flag.
	 *
	 * We could scan for wanted TABLE entries, but that is not the same as
	 * dataOnly. At this stage, it seems unnecessary (6-Mar-2001).
	 */
	if (!ropt->dataOnly)
	{
		int			impliedDataOnly = 1;

		for (te = AH->toc->next; te != AH->toc; te = te->next)
		{
			if ((te->reqs & REQ_SCHEMA) != 0)
			{
				/* It's schema, and it's wanted */
				impliedDataOnly = 0;
				break;
			}
		}
		if (impliedDataOnly)
		{
			ropt->dataOnly = impliedDataOnly;
			ahlog(AH, 1, "implied data-only restore\n");
		}
	}

	/*
	 * Setup the output file if necessary.  The previous target is always
	 * saved so that it can be put back at the end.
	 */
	sav = SaveOutput(AH);
	if (ropt->filename || ropt->compression)
		SetOutput(AH, ropt->filename, ropt->compression);

	ahprintf(AH, "--\n-- PostgreSQL database dump\n--\n\n");

	if (AH->public.verbose)
	{
		if (AH->archiveRemoteVersion)
			ahprintf(AH, "-- Dumped from database version %s\n",
					 AH->archiveRemoteVersion);
		if (AH->archiveDumpVersion)
			ahprintf(AH, "-- Dumped by pg_dump version %s\n",
					 AH->archiveDumpVersion);
		dumpTimestamp(AH, "Started on", AH->createDate);
	}

	/* Open the single transaction, on the connection or as script text */
	if (ropt->single_txn)
	{
		if (AH->connection)
			StartTransaction(AH);
		else
			ahprintf(AH, "BEGIN;\n\n");
	}

	/*
	 * Establish important parameter values right away.
	 */
	_doSetFixedOutputState(AH);

	AH->stage = STAGE_PROCESSING;

	/*
	 * Drop the items at the start, in reverse order
	 */
	if (ropt->dropSchema)
	{
		for (te = AH->toc->prev; te != AH->toc; te = te->prev)
		{
			AH->currentTE = te;

			/*
			 * In createDB mode, issue a DROP *only* for the database as a
			 * whole.  Issuing drops against anything else would be wrong,
			 * because at this point we're connected to the wrong database.
			 * Conversely, if we're not in createDB mode, we'd better not
			 * issue a DROP against the database at all.
			 */
			if (ropt->createDB)
			{
				if (strcmp(te->desc, "DATABASE") != 0)
					continue;
			}
			else
			{
				if (strcmp(te->desc, "DATABASE") == 0)
					continue;
			}

			/* Otherwise, drop anything that's selected and has a dropStmt */
			if (((te->reqs & (REQ_SCHEMA | REQ_DATA)) != 0) && te->dropStmt)
			{
				ahlog(AH, 1, "dropping %s %s\n", te->desc, te->tag);
				/* Select owner and schema as necessary */
				_becomeOwner(AH, te);
				_selectOutputSchema(AH, te->namespace);
				/* Drop it */
				ahprintf(AH, "%s", te->dropStmt);
			}
		}

		/*
		 * _selectOutputSchema may have set currSchema to reflect the effect
		 * of a "SET search_path" command it emitted.  However, by now we may
		 * have dropped that schema; or it might not have existed in the first
		 * place.  In either case the effective value of search_path will not
		 * be what we think.  Forcibly reset currSchema so that we will
		 * re-establish the search_path setting when needed (after creating
		 * the schema).
		 *
		 * If we treated users as pg_dump'able objects then we'd need to reset
		 * currUser here too.
		 */
		if (AH->currSchema)
			free(AH->currSchema);
		AH->currSchema = NULL;
	}

	/*
	 * In serial mode, we now process each non-ACL TOC entry.
	 *
	 * In parallel mode, turn control over to the parallel-restore logic.
	 */
	if (parallel_mode)
	{
		ParallelState *pstate;
		TocEntry	pending_list;

		par_list_header_init(&pending_list);

		/* This runs PRE_DATA items and then disconnects from the database */
		restore_toc_entries_prefork(AH);
		Assert(AH->connection == NULL);

		/* ParallelBackupStart() will actually fork the processes */
		pstate = ParallelBackupStart(AH, ropt);
		restore_toc_entries_parallel(AH, pstate, &pending_list);
		ParallelBackupEnd(AH, pstate);

		/* reconnect the master and see if we missed something */
		restore_toc_entries_postfork(AH, &pending_list);
		Assert(AH->connection != NULL);
	}
	else
	{
		for (te = AH->toc->next; te != AH->toc; te = te->next)
			(void) restore_toc_entry(AH, te, ropt, false);
	}

	/*
	 * Scan TOC again to output ownership commands and ACLs
	 */
	for (te = AH->toc->next; te != AH->toc; te = te->next)
	{
		AH->currentTE = te;

		/* Both schema and data objects might now have ownership/ACLs */
		if ((te->reqs & (REQ_SCHEMA | REQ_DATA)) != 0)
		{
			ahlog(AH, 1, "setting owner and privileges for %s %s\n",
				  te->desc, te->tag);
			_printTocEntry(AH, te, ropt, false, true);
		}
	}

	/* Close the single transaction opened above, if any */
	if (ropt->single_txn)
	{
		if (AH->connection)
			CommitTransaction(AH);
		else
			ahprintf(AH, "COMMIT;\n\n");
	}

	if (AH->public.verbose)
		dumpTimestamp(AH, "Completed on", time(NULL));

	ahprintf(AH, "--\n-- PostgreSQL database dump complete\n--\n\n");

	/*
	 * Clean up & we're done.
	 */
	AH->stage = STAGE_FINALIZING;

	if (ropt->filename || ropt->compression)
		RestoreOutput(AH, sav);

	if (ropt->useDB)
		DisconnectDatabase(&AH->public);
}

506 507 508 509 510 511 512 513 514 515 516
/*
 * Restore one TOC entry.
 *
 * Shared by the serial and the parallel restore paths; is_parallel is true
 * when running in a worker child process.
 *
 * The result is WORKER_OK normally.  WORKER_CREATE_DONE or
 * WORKER_INHIBIT_DATA is returned instead when the parallel parent must
 * perform the corresponding status update itself, and
 * WORKER_IGNORED_ERRORS when the status would otherwise be WORKER_OK but
 * the archive's error counter is nonzero.
 */
static int
restore_toc_entry(ArchiveHandle *AH, TocEntry *te,
				  RestoreOptions *ropt, bool is_parallel)
{
	int			result = WORKER_OK;
	bool		schemaEmitted = false;
	teReqs		wanted;

	AH->currentTE = te;

	/*
	 * Work out what, if anything, we want from this entry.  ACLs are never
	 * restored here.
	 */
	wanted = _tocEntryIsACL(te) ? 0 : te->reqs;

	/*
	 * A DATABASE entry is ignored unless we are asked to create the
	 * database.  This has to be decided here rather than in
	 * _tocEntryRequired, because the createDB option must not affect
	 * emitting a DATABASE entry to an archive file.
	 */
	if (strcmp(te->desc, "DATABASE") == 0 && !ropt->createDB)
		wanted = 0;

	/* Relay any warning recorded in the original dump to stderr */
	if (strcmp(te->desc, "WARNING") == 0 && !ropt->suppressDumpWarnings)
	{
		if (!ropt->dataOnly && te->defn != NULL && te->defn[0] != '\0')
			write_msg(modulename, "warning from original dump file: %s\n", te->defn);
		else if (te->copyStmt != NULL && te->copyStmt[0] != '\0')
			write_msg(modulename, "warning from original dump file: %s\n", te->copyStmt);
	}

	/* Schema part */
	if ((wanted & REQ_SCHEMA) != 0)
	{
		ahlog(AH, 1, "creating %s %s\n", te->desc, te->tag);

		_printTocEntry(AH, te, ropt, false, false);
		schemaEmitted = true;

		if (strcmp(te->desc, "TABLE") == 0)
		{
			if (AH->lastErrorTE != te)
			{
				/*
				 * Table creation succeeded: flag the matching TABLE DATA
				 * for possible truncation.  A parallel worker cannot do
				 * that itself, so it only reports it via the return value.
				 */
				if (is_parallel)
					result = WORKER_CREATE_DONE;
				else
					mark_create_done(AH, te);
			}
			else if (ropt->noDataForFailedTables)
			{
				/*
				 * Table creation failed and --no-data-for-failed-tables
				 * was given: the matching TABLE DATA must be skipped.
				 * Again, a parallel worker leaves that to the parent.
				 */
				if (is_parallel)
					result = WORKER_INHIBIT_DATA;
				else
					inhibit_data_for_failed_table(AH, te);
			}
		}

		/* After creating a database, switch our connection over to it */
		if (strcmp(te->desc, "DATABASE") == 0)
		{
			ahlog(AH, 1, "connecting to new database \"%s\"\n", te->tag);
			_reconnectToDB(AH, te->tag);
			ropt->dbname = pg_strdup(te->tag);
		}
	}

	/* Data part */
	if ((wanted & REQ_DATA) != 0)
	{
		/*
		 * hadDumper is set when the entry has a genuine data component.
		 * Without it, the defn field may still hold statements that have to
		 * be executed in a data-only restore.
		 */
		if (!te->hadDumper)
		{
			if (!schemaEmitted)
			{
				/* The defn part has not been emitted yet, so do it now */
				ahlog(AH, 1, "executing %s %s\n", te->desc, te->tag);
				_printTocEntry(AH, te, ropt, false, false);
			}
		}
		else if (AH->PrintTocDataPtr != NULL)
		{
			/* The format is able to output the data, so restore it */
			_printTocEntry(AH, te, ropt, true, false);

			if (strcmp(te->desc, "BLOBS") == 0 ||
				strcmp(te->desc, "BLOB COMMENTS") == 0)
			{
				ahlog(AH, 1, "processing %s\n", te->desc);

				_selectOutputSchema(AH, "pg_catalog");

				(*AH->PrintTocDataPtr) (AH, te, ropt);
			}
			else
			{
				_disableTriggersIfNecessary(AH, te, ropt);

				/* Select owner and schema as necessary */
				_becomeOwner(AH, te);
				_selectOutputSchema(AH, te->namespace);

				ahlog(AH, 1, "processing data for table \"%s\"\n",
					  te->tag);

				/*
				 * In parallel restore, a table created earlier in this run
				 * gets its COPY wrapped in a transaction and preceded by a
				 * TRUNCATE.  If archiving is not on this prevents
				 * WAL-logging the COPY, giving a speedup similar to
				 * single_txn mode in non-parallel restores.
				 */
				if (is_parallel && te->created)
				{
					const char *onlyKeyword;

					/*
					 * Parallel restore always talks directly to a server,
					 * so there is no need to consider emitting BEGIN as
					 * text.
					 */
					StartTransaction(AH);

					/*
					 * On servers >= 8.4, TRUNCATE must say ONLY so that
					 * child tables are not wiped.
					 */
					if (PQserverVersion(AH->connection) >= 80400)
						onlyKeyword = "ONLY ";
					else
						onlyKeyword = "";

					ahprintf(AH, "TRUNCATE TABLE %s%s;\n\n",
							 onlyKeyword,
							 fmtId(te->tag));
				}

				/* Use the stored COPY statement when there is one */
				if (te->copyStmt && strlen(te->copyStmt) > 0)
				{
					ahprintf(AH, "%s", te->copyStmt);
					AH->outputKind = OUTPUT_COPYDATA;
				}
				else
					AH->outputKind = OUTPUT_OTHERDATA;

				(*AH->PrintTocDataPtr) (AH, te, ropt);

				/* Terminate COPY if needed */
				if (AH->outputKind == OUTPUT_COPYDATA &&
					RestoringToDB(AH))
					EndDBCopyMode(AH, te);
				AH->outputKind = OUTPUT_SQLCMDS;

				/* Close out the transaction started above */
				if (is_parallel && te->created)
					CommitTransaction(AH);

				_enableTriggersIfNecessary(AH, te, ropt);
			}
		}
	}

	/* Report ignored errors unless a more specific status is already set */
	if (result == WORKER_OK && AH->public.n_errors > 0)
		result = WORKER_IGNORED_ERRORS;

	return result;
}

709 710 711 712
/*
 * Allocate a new RestoreOptions block.
 * This is mainly so we can initialize it, but also for future expansion,
 */
B
Bruce Momjian 已提交
713 714
RestoreOptions *
NewRestoreOptions(void)
B
Bruce Momjian 已提交
715
{
B
Bruce Momjian 已提交
716
	RestoreOptions *opts;
B
Bruce Momjian 已提交
717

718
	opts = (RestoreOptions *) pg_malloc0(sizeof(RestoreOptions));
B
Bruce Momjian 已提交
719

720
	/* set any fields that shouldn't default to zeroes */
B
Bruce Momjian 已提交
721
	opts->format = archUnknown;
722
	opts->promptPassword = TRI_DEFAULT;
723
	opts->dumpSections = DUMP_UNSECTIONED;
B
Bruce Momjian 已提交
724 725 726 727

	return opts;
}

B
Bruce Momjian 已提交
728 729
/*
 * Emit "ALTER TABLE ... DISABLE TRIGGER ALL" for the entry's table.
 *
 * Does nothing unless this is a data-only restore with disable_triggers
 * requested.
 */
static void
_disableTriggersIfNecessary(ArchiveHandle *AH, TocEntry *te, RestoreOptions *ropt)
{
	/* This hack is only needed in a data-only restore */
	if (!(ropt->dataOnly && ropt->disable_triggers))
		return;

	ahlog(AH, 1, "disabling triggers for %s\n", te->tag);

	/*
	 * Become superuser if possible, since superusers are the only ones who
	 * can disable constraint triggers.  If -S was not given, assume the
	 * initial user identity is a superuser.  (XXX would it be better to
	 * become the table owner?)
	 */
	_becomeUser(AH, ropt->superuser);

	/* Now disable them, after selecting the table's schema */
	_selectOutputSchema(AH, te->namespace);
	ahprintf(AH, "ALTER TABLE %s DISABLE TRIGGER ALL;\n\n",
			 fmtId(te->tag));
}

B
Bruce Momjian 已提交
754 755
/*
 * Emit "ALTER TABLE ... ENABLE TRIGGER ALL" for the table named by te->tag.
 *
 * Nothing is emitted unless both ropt->dataOnly and ropt->disable_triggers
 * are set.
 */
static void
_enableTriggersIfNecessary(ArchiveHandle *AH, TocEntry *te, RestoreOptions *ropt)
{
	/* This hack is only needed in a data-only restore */
	if (ropt->dataOnly && ropt->disable_triggers)
	{
		ahlog(AH, 1, "enabling triggers for %s\n", te->tag);

		/*
		 * Become superuser if possible, since they are the only ones who can
		 * change the state of constraint triggers.  If -S was not given,
		 * assume the initial user identity is a superuser.  (XXX would it be
		 * better to become the table owner?)
		 */
		_becomeUser(AH, ropt->superuser);

		/* Select the table's schema, then re-enable the triggers */
		_selectOutputSchema(AH, te->namespace);
		ahprintf(AH, "ALTER TABLE %s ENABLE TRIGGER ALL;\n\n",
				 fmtId(te->tag));
	}
}
B
Bruce Momjian 已提交
779 780

/*
781
 * This is a routine that is part of the dumper interface, hence the 'Archive*' parameter.
B
Bruce Momjian 已提交
782 783 784
 */

/* Public */
P
Peter Eisentraut 已提交
785 786
size_t
WriteData(Archive *AHX, const void *data, size_t dLen)
B
Bruce Momjian 已提交
787
{
B
Bruce Momjian 已提交
788
	ArchiveHandle *AH = (ArchiveHandle *) AHX;
B
Bruce Momjian 已提交
789

790
	if (!AH->currToc)
791
		exit_horribly(modulename, "internal error -- WriteData cannot be called outside the context of a DataDumper routine\n");
792

B
Bruce Momjian 已提交
793
	return (*AH->WriteDataPtr) (AH, data, dLen);
B
Bruce Momjian 已提交
794 795 796
}

/*
B
Bruce Momjian 已提交
797
 * Create a new TOC entry. The TOC was designed as a TOC, but is now the
B
Bruce Momjian 已提交
798 799 800 801
 * repository for all metadata. But the name has stuck.
 */

/* Public */
B
Bruce Momjian 已提交
802
void
803 804 805
ArchiveEntry(Archive *AHX,
			 CatalogId catalogId, DumpId dumpId,
			 const char *tag,
806
			 const char *namespace,
B
Bruce Momjian 已提交
807
			 const char *tablespace,
808
			 const char *owner, bool withOids,
809 810
			 const char *desc, teSection section,
			 const char *defn,
811 812
			 const char *dropStmt, const char *copyStmt,
			 const DumpId *deps, int nDeps,
B
Bruce Momjian 已提交
813
			 DataDumperPtr dumpFn, void *dumpArg)
B
Bruce Momjian 已提交
814
{
B
Bruce Momjian 已提交
815 816 817
	ArchiveHandle *AH = (ArchiveHandle *) AHX;
	TocEntry   *newToc;

818
	newToc = (TocEntry *) pg_malloc0(sizeof(TocEntry));
B
Bruce Momjian 已提交
819

820 821 822 823
	AH->tocCount++;
	if (dumpId > AH->maxDumpId)
		AH->maxDumpId = dumpId;

B
Bruce Momjian 已提交
824 825 826 827 828
	newToc->prev = AH->toc->prev;
	newToc->next = AH->toc;
	AH->toc->prev->next = newToc;
	AH->toc->prev = newToc;

829 830
	newToc->catalogId = catalogId;
	newToc->dumpId = dumpId;
831
	newToc->section = section;
832

833 834 835 836
	newToc->tag = pg_strdup(tag);
	newToc->namespace = namespace ? pg_strdup(namespace) : NULL;
	newToc->tablespace = tablespace ? pg_strdup(tablespace) : NULL;
	newToc->owner = pg_strdup(owner);
837
	newToc->withOids = withOids;
838 839 840 841
	newToc->desc = pg_strdup(desc);
	newToc->defn = pg_strdup(defn);
	newToc->dropStmt = pg_strdup(dropStmt);
	newToc->copyStmt = copyStmt ? pg_strdup(copyStmt) : NULL;
842

843 844
	if (nDeps > 0)
	{
845
		newToc->dependencies = (DumpId *) pg_malloc(nDeps * sizeof(DumpId));
846 847 848 849 850 851 852 853
		memcpy(newToc->dependencies, deps, nDeps * sizeof(DumpId));
		newToc->nDeps = nDeps;
	}
	else
	{
		newToc->dependencies = NULL;
		newToc->nDeps = 0;
	}
854

855 856
	newToc->dataDumper = dumpFn;
	newToc->dataDumperArg = dumpArg;
857
	newToc->hadDumper = dumpFn ? true : false;
B
Bruce Momjian 已提交
858

859
	newToc->formatData = NULL;
B
Bruce Momjian 已提交
860

B
Bruce Momjian 已提交
861
	if (AH->ArchiveEntryPtr !=NULL)
B
Bruce Momjian 已提交
862
		(*AH->ArchiveEntryPtr) (AH, newToc);
B
Bruce Momjian 已提交
863 864 865
}

/* Public */
B
Bruce Momjian 已提交
866 867
void
PrintTOCSummary(Archive *AHX, RestoreOptions *ropt)
B
Bruce Momjian 已提交
868
{
B
Bruce Momjian 已提交
869
	ArchiveHandle *AH = (ArchiveHandle *) AHX;
870
	TocEntry   *te;
871
	teSection	curSection;
B
Bruce Momjian 已提交
872
	OutputContext sav;
873
	const char *fmtName;
B
Bruce Momjian 已提交
874

875
	sav = SaveOutput(AH);
B
Bruce Momjian 已提交
876
	if (ropt->filename)
877
		SetOutput(AH, ropt->filename, 0 /* no compression */ );
B
Bruce Momjian 已提交
878

879 880
	ahprintf(AH, ";\n; Archive created at %s", ctime(&AH->createDate));
	ahprintf(AH, ";     dbname: %s\n;     TOC Entries: %d\n;     Compression: %d\n",
B
Bruce Momjian 已提交
881
			 AH->archdbname, AH->tocCount, AH->compression);
882

B
Bruce Momjian 已提交
883 884
	switch (AH->format)
	{
885 886 887 888 889 890 891 892 893
		case archCustom:
			fmtName = "CUSTOM";
			break;
		case archTar:
			fmtName = "TAR";
			break;
		default:
			fmtName = "UNKNOWN";
	}
894 895

	ahprintf(AH, ";     Dump Version: %d.%d-%d\n", AH->vmaj, AH->vmin, AH->vrev);
896
	ahprintf(AH, ";     Format: %s\n", fmtName);
T
Tom Lane 已提交
897 898
	ahprintf(AH, ";     Integer: %d bytes\n", (int) AH->intSize);
	ahprintf(AH, ";     Offset: %d bytes\n", (int) AH->offSize);
899 900 901 902 903 904
	if (AH->archiveRemoteVersion)
		ahprintf(AH, ";     Dumped from database version: %s\n",
				 AH->archiveRemoteVersion);
	if (AH->archiveDumpVersion)
		ahprintf(AH, ";     Dumped by pg_dump version: %s\n",
				 AH->archiveDumpVersion);
905

906
	ahprintf(AH, ";\n;\n; Selected TOC Entries:\n;\n");
B
Bruce Momjian 已提交
907

908
	curSection = SECTION_PRE_DATA;
909
	for (te = AH->toc->next; te != AH->toc; te = te->next)
B
Bruce Momjian 已提交
910
	{
911 912 913 914
		if (te->section != SECTION_NONE)
			curSection = te->section;
		if (ropt->verbose ||
			(_tocEntryRequired(te, curSection, ropt) & (REQ_SCHEMA | REQ_DATA)) != 0)
915
			ahprintf(AH, "%d; %u %u %s %s %s %s\n", te->dumpId,
916
					 te->catalogId.tableoid, te->catalogId.oid,
917 918
					 te->desc, te->namespace ? te->namespace : "-",
					 te->tag, te->owner);
919 920
		if (ropt->verbose && te->nDeps > 0)
		{
921
			int			i;
922 923 924 925 926 927

			ahprintf(AH, ";\tdepends on:");
			for (i = 0; i < te->nDeps; i++)
				ahprintf(AH, " %d", te->dependencies[i]);
			ahprintf(AH, "\n");
		}
B
Bruce Momjian 已提交
928
	}
B
Bruce Momjian 已提交
929

B
Bruce Momjian 已提交
930
	if (ropt->filename)
931
		RestoreOutput(AH, sav);
B
Bruce Momjian 已提交
932 933
}

934 935 936 937 938
/***********
 * BLOB Archival
 ***********/

/* Called by a dumper to signal start of a BLOB */
B
Bruce Momjian 已提交
939
int
940
StartBlob(Archive *AHX, Oid oid)
941
{
B
Bruce Momjian 已提交
942
	ArchiveHandle *AH = (ArchiveHandle *) AHX;
943

B
Bruce Momjian 已提交
944
	if (!AH->StartBlobPtr)
945
		exit_horribly(modulename, "large-object output not supported in chosen format\n");
946

B
Bruce Momjian 已提交
947
	(*AH->StartBlobPtr) (AH, AH->currToc, oid);
948

B
Bruce Momjian 已提交
949
	return 1;
950 951 952
}

/* Called by a dumper to signal end of a BLOB */
B
Bruce Momjian 已提交
953
int
954
EndBlob(Archive *AHX, Oid oid)
955
{
B
Bruce Momjian 已提交
956
	ArchiveHandle *AH = (ArchiveHandle *) AHX;
957

B
Bruce Momjian 已提交
958 959
	if (AH->EndBlobPtr)
		(*AH->EndBlobPtr) (AH, AH->currToc, oid);
960

B
Bruce Momjian 已提交
961
	return 1;
962 963 964 965 966 967
}

/**********
 * BLOB Restoration
 **********/

968
/*
B
Bruce Momjian 已提交
969
 * Called by a format handler before any blobs are restored
970
 */
B
Bruce Momjian 已提交
971 972
void
StartRestoreBlobs(ArchiveHandle *AH)
973
{
974 975 976 977 978 979 980
	if (!AH->ropt->single_txn)
	{
		if (AH->connection)
			StartTransaction(AH);
		else
			ahprintf(AH, "BEGIN;\n\n");
	}
981

982 983 984 985
	AH->blobCount = 0;
}

/*
B
Bruce Momjian 已提交
986
 * Called by a format handler after all blobs are restored
987
 */
B
Bruce Momjian 已提交
988 989
void
EndRestoreBlobs(ArchiveHandle *AH)
990
{
991 992 993 994 995 996 997
	if (!AH->ropt->single_txn)
	{
		if (AH->connection)
			CommitTransaction(AH);
		else
			ahprintf(AH, "COMMIT;\n\n");
	}
998

P
Peter Eisentraut 已提交
999 1000 1001 1002
	ahlog(AH, 1, ngettext("restored %d large object\n",
						  "restored %d large objects\n",
						  AH->blobCount),
		  AH->blobCount);
1003 1004 1005
}


1006 1007 1008
/*
 * Called by a format handler to initiate restoration of a blob
 */
B
Bruce Momjian 已提交
1009
void
1010
StartRestoreBlob(ArchiveHandle *AH, Oid oid, bool drop)
1011
{
1012
	bool		old_blob_style = (AH->version < K_VERS_1_12);
1013
	Oid			loOid;
1014

1015 1016
	AH->blobCount++;

1017 1018 1019
	/* Initialize the LO Buffer */
	AH->lo_buf_used = 0;

1020
	ahlog(AH, 1, "restoring large object with OID %u\n", oid);
1021

1022 1023
	/* With an old archive we must do drop and create logic here */
	if (old_blob_style && drop)
1024
		DropBlobIfExists(AH, oid);
1025

1026
	if (AH->connection)
1027
	{
1028 1029 1030 1031
		if (old_blob_style)
		{
			loOid = lo_create(AH->connection, oid);
			if (loOid == 0 || loOid != oid)
1032 1033
				exit_horribly(modulename, "could not create large object %u: %s",
							  oid, PQerrorMessage(AH->connection));
1034
		}
1035 1036
		AH->loFd = lo_open(AH->connection, oid, INV_WRITE);
		if (AH->loFd == -1)
1037 1038
			exit_horribly(modulename, "could not open large object %u: %s",
						  oid, PQerrorMessage(AH->connection));
1039 1040 1041
	}
	else
	{
1042 1043 1044 1045 1046 1047
		if (old_blob_style)
			ahprintf(AH, "SELECT pg_catalog.lo_open(pg_catalog.lo_create('%u'), %d);\n",
					 oid, INV_WRITE);
		else
			ahprintf(AH, "SELECT pg_catalog.lo_open('%u', %d);\n",
					 oid, INV_WRITE);
1048
	}
1049

B
Bruce Momjian 已提交
1050
	AH->writingBlob = 1;
1051 1052
}

B
Bruce Momjian 已提交
1053
void
1054
EndRestoreBlob(ArchiveHandle *AH, Oid oid)
1055
{
1056 1057 1058
	if (AH->lo_buf_used > 0)
	{
		/* Write remaining bytes from the LO buffer */
1059
		dump_lo_buf(AH);
1060
	}
1061

B
Bruce Momjian 已提交
1062
	AH->writingBlob = 0;
1063

1064
	if (AH->connection)
1065
	{
1066 1067 1068 1069 1070
		lo_close(AH->connection, AH->loFd);
		AH->loFd = -1;
	}
	else
	{
1071
		ahprintf(AH, "SELECT pg_catalog.lo_close(0);\n\n");
1072
	}
1073 1074
}

B
Bruce Momjian 已提交
1075 1076 1077 1078
/***********
 * Sorting and Reordering
 ***********/

B
Bruce Momjian 已提交
1079 1080
/*
 * Reorder the TOC according to the list file named by ropt->tocFile.
 *
 * Each non-blank, non-comment line of the file must start with a dump ID.
 * Every ID found is marked in ropt->idWanted[] (indexed by ID - 1) and its
 * TOC entry is moved to the end of the list, so that the wanted entries end
 * up in file order.  Invalid or duplicate lines are reported and skipped.
 */
void
SortTocFromFile(Archive *AHX, RestoreOptions *ropt)
{
	ArchiveHandle *AH = (ArchiveHandle *) AHX;
	FILE	   *tocfp;
	char		line[100];
	bool		partial = false;

	/* Allocate space for the 'wanted' array, all entries initially false */
	ropt->idWanted = (bool *) pg_malloc0(sizeof(bool) * AH->maxDumpId);

	/* Setup the file */
	tocfp = fopen(ropt->tocFile, PG_BINARY_R);
	if (tocfp == NULL)
		exit_horribly(modulename, "could not open TOC file \"%s\": %s\n",
					  ropt->tocFile, strerror(errno));

	while (fgets(line, sizeof(line), tocfp) != NULL)
	{
		bool		is_continuation = partial;
		int			len;
		char	   *semi;
		char	   *numend;
		DumpId		id;
		TocEntry   *te;

		/*
		 * Some lines in the file might be longer than sizeof(line).  This is
		 * no problem, since we only care about the leading numeric ID which
		 * can be at most a few characters; but we have to skip continuation
		 * bufferloads when processing a long line.
		 */
		len = strlen(line);
		partial = !(len > 0 && line[len - 1] == '\n');
		if (is_continuation)
			continue;

		/* Truncate line at comment, if any */
		semi = strchr(line, ';');
		if (semi != NULL)
			*semi = '\0';

		/* Ignore if all blank */
		if (strspn(line, " \t\r\n") == strlen(line))
			continue;

		/* Get an ID, check it's valid and not already seen */
		id = strtol(line, &numend, 10);
		if (numend == line || id <= 0 || id > AH->maxDumpId ||
			ropt->idWanted[id - 1])
		{
			write_msg(modulename, "WARNING: line ignored: %s\n", line);
			continue;
		}

		/* Find TOC entry */
		te = getTocEntryByDumpId(AH, id);
		if (te == NULL)
			exit_horribly(modulename, "could not find entry for ID %d\n",
						  id);

		/* Mark it wanted */
		ropt->idWanted[id - 1] = true;

		/*
		 * Move each item to the end of the list as it is selected, so that
		 * they are placed in the desired order.  Any unwanted items will end
		 * up at the front of the list, which may seem unintuitive but it's
		 * what we need.  In an ordinary serial restore that makes no
		 * difference, but in a parallel restore we need to mark unrestored
		 * items' dependencies as satisfied before we start examining
		 * restorable items.  Otherwise they could have surprising
		 * side-effects on the order in which restorable items actually get
		 * restored.
		 */
		_moveBefore(AH, AH->toc, te);
	}

	if (fclose(tocfp) != 0)
		exit_horribly(modulename, "could not close TOC file: %s\n",
					  strerror(errno));
}

/**********************
 * Convenience functions that look like standard IO functions
 * for writing data when in dump mode.
 **********************/

/* Public */
B
Bruce Momjian 已提交
1173 1174 1175 1176
int
archputs(const char *s, Archive *AH)
{
	return WriteData(AH, s, strlen(s));
B
Bruce Momjian 已提交
1177 1178 1179
}

/* Public */
B
Bruce Momjian 已提交
1180 1181
int
archprintf(Archive *AH, const char *fmt,...)
B
Bruce Momjian 已提交
1182
{
B
Bruce Momjian 已提交
1183 1184 1185 1186 1187 1188
	char	   *p = NULL;
	va_list		ap;
	int			bSize = strlen(fmt) + 256;
	int			cnt = -1;

	/*
B
Bruce Momjian 已提交
1189 1190 1191
	 * This is paranoid: deal with the possibility that vsnprintf is willing
	 * to ignore trailing null or returns > 0 even if string does not fit. It
	 * may be the case that it returns cnt = bufsize
B
Bruce Momjian 已提交
1192 1193
	 */
	while (cnt < 0 || cnt >= (bSize - 1))
B
Bruce Momjian 已提交
1194
	{
B
Bruce Momjian 已提交
1195 1196
		if (p != NULL)
			free(p);
1197
		bSize *= 2;
1198
		p = (char *) pg_malloc(bSize);
1199 1200 1201
		va_start(ap, fmt);
		cnt = vsnprintf(p, bSize, fmt, ap);
		va_end(ap);
B
Bruce Momjian 已提交
1202 1203 1204 1205
	}
	WriteData(AH, p, cnt);
	free(p);
	return cnt;
B
Bruce Momjian 已提交
1206 1207 1208 1209 1210 1211 1212
}


/*******************************
 * Stuff below here should be 'private' to the archiver routines
 *******************************/

1213
static void
1214
SetOutput(ArchiveHandle *AH, const char *filename, int compression)
B
Bruce Momjian 已提交
1215
{
1216
	int			fn;
B
Bruce Momjian 已提交
1217 1218

	if (filename)
1219
		fn = -1;
B
Bruce Momjian 已提交
1220 1221 1222 1223
	else if (AH->FH)
		fn = fileno(AH->FH);
	else if (AH->fSpec)
	{
1224
		fn = -1;
B
Bruce Momjian 已提交
1225 1226 1227 1228 1229 1230
		filename = AH->fSpec;
	}
	else
		fn = fileno(stdout);

	/* If compression explicitly requested, use gzopen */
1231
#ifdef HAVE_LIBZ
B
Bruce Momjian 已提交
1232 1233
	if (compression != 0)
	{
1234 1235 1236
		char		fmode[10];

		/* Don't use PG_BINARY_x since this is zlib */
1237
		sprintf(fmode, "wb%d", compression);
1238 1239
		if (fn >= 0)
			AH->OF = gzdopen(dup(fn), fmode);
B
Bruce Momjian 已提交
1240 1241
		else
			AH->OF = gzopen(filename, fmode);
1242
		AH->gzOut = 1;
B
Bruce Momjian 已提交
1243 1244
	}
	else
B
Bruce Momjian 已提交
1245
#endif
1246
	{							/* Use fopen */
1247 1248 1249 1250 1251 1252 1253
		if (AH->mode == archModeAppend)
		{
			if (fn >= 0)
				AH->OF = fdopen(dup(fn), PG_BINARY_A);
			else
				AH->OF = fopen(filename, PG_BINARY_A);
		}
B
Bruce Momjian 已提交
1254
		else
1255 1256 1257 1258 1259 1260
		{
			if (fn >= 0)
				AH->OF = fdopen(dup(fn), PG_BINARY_W);
			else
				AH->OF = fopen(filename, PG_BINARY_W);
		}
1261
		AH->gzOut = 0;
B
Bruce Momjian 已提交
1262
	}
B
Bruce Momjian 已提交
1263

1264
	if (!AH->OF)
1265 1266
	{
		if (filename)
1267 1268
			exit_horribly(modulename, "could not open output file \"%s\": %s\n",
						  filename, strerror(errno));
1269
		else
1270 1271
			exit_horribly(modulename, "could not open output file: %s\n",
						  strerror(errno));
1272
	}
1273 1274 1275 1276 1277 1278 1279 1280 1281
}

/*
 * Capture the archive's current output target (file handle and gz flag) so
 * that it can later be handed to RestoreOutput().
 */
static OutputContext
SaveOutput(ArchiveHandle *AH)
{
	OutputContext saved;

	saved.gzOut = AH->gzOut;
	saved.OF = AH->OF;

	return saved;
}

1286
static void
1287
RestoreOutput(ArchiveHandle *AH, OutputContext savedContext)
B
Bruce Momjian 已提交
1288
{
B
Bruce Momjian 已提交
1289
	int			res;
1290

B
Bruce Momjian 已提交
1291
	if (AH->gzOut)
1292
		res = GZCLOSE(AH->OF);
B
Bruce Momjian 已提交
1293
	else
1294 1295 1296
		res = fclose(AH->OF);

	if (res != 0)
1297
		exit_horribly(modulename, "could not close output file: %s\n",
1298
					  strerror(errno));
B
Bruce Momjian 已提交
1299

1300 1301
	AH->gzOut = savedContext.gzOut;
	AH->OF = savedContext.OF;
B
Bruce Momjian 已提交
1302 1303 1304 1305 1306
}



/*
B
Bruce Momjian 已提交
1307
 *	Print formatted text to the output file (usually stdout).
B
Bruce Momjian 已提交
1308
 */
B
Bruce Momjian 已提交
1309 1310
int
ahprintf(ArchiveHandle *AH, const char *fmt,...)
B
Bruce Momjian 已提交
1311
{
B
Bruce Momjian 已提交
1312 1313
	char	   *p = NULL;
	va_list		ap;
1314
	int			bSize = strlen(fmt) + 256;		/* Usually enough */
B
Bruce Momjian 已提交
1315 1316 1317
	int			cnt = -1;

	/*
B
Bruce Momjian 已提交
1318
	 * This is paranoid: deal with the possibility that vsnprintf is willing
1319 1320
	 * to ignore trailing null or returns > 0 even if string does not fit. It
	 * may be the case that it returns cnt = bufsize.
B
Bruce Momjian 已提交
1321 1322
	 */
	while (cnt < 0 || cnt >= (bSize - 1))
1323
	{
B
Bruce Momjian 已提交
1324 1325
		if (p != NULL)
			free(p);
1326
		bSize *= 2;
1327
		p = (char *) pg_malloc(bSize);
1328
		va_start(ap, fmt);
1329
		cnt = vsnprintf(p, bSize, fmt, ap);
1330
		va_end(ap);
B
Bruce Momjian 已提交
1331 1332 1333 1334
	}
	ahwrite(p, 1, cnt, AH);
	free(p);
	return cnt;
B
Bruce Momjian 已提交
1335 1336
}

B
Bruce Momjian 已提交
1337 1338
/*
 * Emit a log message through vwrite_msg().
 *
 * The message is printed when the archive's debugLevel is at least "level",
 * or when verbose mode is on and "level" is at most 1; otherwise it is
 * dropped.
 */
void
ahlog(ArchiveHandle *AH, int level, const char *fmt,...)
{
	va_list		args;

	if (AH->debugLevel >= level || (AH->public.verbose && level <= 1))
	{
		va_start(args, fmt);
		vwrite_msg(NULL, fmt, args);
		va_end(args);
	}
}

1350 1351 1352
/*
 * Single place for logic which says 'We are restoring to a direct DB connection'.
 */
1353
static int
B
Bruce Momjian 已提交
1354
RestoringToDB(ArchiveHandle *AH)
1355 1356 1357 1358
{
	return (AH->ropt && AH->ropt->useDB && AH->connection);
}

1359 1360 1361 1362 1363 1364 1365 1366 1367 1368 1369
/*
 * Dump the current contents of the LO data buffer while writing a BLOB.
 *
 * With a connection the buffer is written with lo_write(); otherwise it is
 * emitted as a lowrite() SQL call with the data as a bytea literal.  In
 * both cases the buffer is marked empty afterwards.
 */
static void
dump_lo_buf(ArchiveHandle *AH)
{
	if (!AH->connection)
	{
		PQExpBuffer literal = createPQExpBuffer();

		appendByteaLiteralAHX(literal,
							  (const unsigned char *) AH->lo_buf,
							  AH->lo_buf_used,
							  AH);

		/* Hack: turn off writingBlob so ahwrite doesn't recurse to here */
		AH->writingBlob = 0;
		ahprintf(AH, "SELECT pg_catalog.lowrite(0, %s);\n", literal->data);
		AH->writingBlob = 1;

		destroyPQExpBuffer(literal);
	}
	else
	{
		size_t		written;

		written = lo_write(AH->connection, AH->loFd, AH->lo_buf, AH->lo_buf_used);
		ahlog(AH, 5, ngettext("wrote %lu byte of large object data (result = %lu)\n",
					 "wrote %lu bytes of large object data (result = %lu)\n",
							  AH->lo_buf_used),
			  (unsigned long) AH->lo_buf_used, (unsigned long) written);

		/* anything other than a complete write is fatal */
		if (written != AH->lo_buf_used)
			exit_horribly(modulename,
			"could not write to large object (result: %lu, expected: %lu)\n",
					   (unsigned long) written, (unsigned long) AH->lo_buf_used);
	}

	AH->lo_buf_used = 0;
}


B
Bruce Momjian 已提交
1399
/*
1400
 *	Write buffer to the output file (usually stdout). This is used for
B
Bruce Momjian 已提交
1401 1402
 *	outputting 'restore' scripts etc. It is even possible for an archive
 *	format to create a custom output routine to 'fake' a restore if it
1403
 *	wants to generate a script (see TAR output).
B
Bruce Momjian 已提交
1404
 */
B
Bruce Momjian 已提交
1405 1406
int
ahwrite(const void *ptr, size_t size, size_t nmemb, ArchiveHandle *AH)
B
Bruce Momjian 已提交
1407
{
P
Peter Eisentraut 已提交
1408
	size_t		res;
1409

B
Bruce Momjian 已提交
1410
	if (AH->writingBlob)
1411
	{
B
Bruce Momjian 已提交
1412
		size_t		remaining = size * nmemb;
1413 1414

		while (AH->lo_buf_used + remaining > AH->lo_buf_size)
P
Peter Eisentraut 已提交
1415
		{
1416 1417 1418 1419 1420 1421 1422
			size_t		avail = AH->lo_buf_size - AH->lo_buf_used;

			memcpy((char *) AH->lo_buf + AH->lo_buf_used, ptr, avail);
			ptr = (const void *) ((const char *) ptr + avail);
			remaining -= avail;
			AH->lo_buf_used += avail;
			dump_lo_buf(AH);
P
Peter Eisentraut 已提交
1423 1424
		}

1425 1426 1427
		memcpy((char *) AH->lo_buf + AH->lo_buf_used, ptr, remaining);
		AH->lo_buf_used += remaining;

P
Peter Eisentraut 已提交
1428
		return size * nmemb;
1429
	}
B
Bruce Momjian 已提交
1430
	else if (AH->gzOut)
1431
	{
1432
		res = GZWRITE(ptr, size, nmemb, AH->OF);
1433
		if (res != (nmemb * size))
1434
			exit_horribly(modulename, "could not write to output file: %s\n", strerror(errno));
1435 1436
		return res;
	}
B
Bruce Momjian 已提交
1437
	else if (AH->CustomOutPtr)
1438
	{
B
Bruce Momjian 已提交
1439 1440
		res = AH->CustomOutPtr (AH, ptr, size * nmemb);

1441
		if (res != (nmemb * size))
1442
			exit_horribly(modulename, "could not write to custom output routine\n");
1443 1444
		return res;
	}
1445 1446 1447
	else
	{
		/*
B
Bruce Momjian 已提交
1448 1449 1450
		 * If we're doing a restore, and it's direct to DB, and we're
		 * connected then send it to the DB.
		 */
1451
		if (RestoringToDB(AH))
1452
			return ExecuteSqlCommandBuf(AH, (const char *) ptr, size * nmemb);
1453
		else
1454
		{
1455
			res = fwrite(ptr, size, nmemb, AH->OF);
1456
			if (res != nmemb)
1457
				exit_horribly(modulename, "could not write to output file: %s\n",
1458
							  strerror(errno));
1459 1460
			return res;
		}
1461
	}
B
Bruce Momjian 已提交
1462
}
1463

1464 1465
/* on some error, we may decide to go on... */
void
1466
warn_or_exit_horribly(ArchiveHandle *AH,
1467
					  const char *modulename, const char *fmt,...)
1468
{
B
Bruce Momjian 已提交
1469
	va_list		ap;
1470

B
Bruce Momjian 已提交
1471 1472
	switch (AH->stage)
	{
1473 1474 1475 1476 1477 1478

		case STAGE_NONE:
			/* Do nothing special */
			break;

		case STAGE_INITIALIZING:
B
Bruce Momjian 已提交
1479
			if (AH->stage != AH->lastErrorStage)
1480 1481 1482 1483
				write_msg(modulename, "Error while INITIALIZING:\n");
			break;

		case STAGE_PROCESSING:
B
Bruce Momjian 已提交
1484
			if (AH->stage != AH->lastErrorStage)
1485 1486 1487 1488
				write_msg(modulename, "Error while PROCESSING TOC:\n");
			break;

		case STAGE_FINALIZING:
B
Bruce Momjian 已提交
1489
			if (AH->stage != AH->lastErrorStage)
1490 1491 1492
				write_msg(modulename, "Error while FINALIZING:\n");
			break;
	}
B
Bruce Momjian 已提交
1493 1494
	if (AH->currentTE != NULL && AH->currentTE != AH->lastErrorTE)
	{
1495 1496
		write_msg(modulename, "Error from TOC entry %d; %u %u %s %s %s\n",
				  AH->currentTE->dumpId,
B
Bruce Momjian 已提交
1497 1498
			 AH->currentTE->catalogId.tableoid, AH->currentTE->catalogId.oid,
			  AH->currentTE->desc, AH->currentTE->tag, AH->currentTE->owner);
1499 1500 1501 1502
	}
	AH->lastErrorStage = AH->stage;
	AH->lastErrorTE = AH->currentTE;

1503
	va_start(ap, fmt);
1504 1505 1506
	vwrite_msg(modulename, fmt, ap);
	va_end(ap);

1507
	if (AH->public.exit_on_error)
1508
		exit_nicely(1);
1509 1510 1511
	else
		AH->public.n_errors++;
}
1512

1513 1514
#ifdef NOT_USED

/*
 * Move "te" so that it immediately follows "pos" in the TOC list.
 */
static void
_moveAfter(ArchiveHandle *AH, TocEntry *pos, TocEntry *te)
{
	TocEntry   *oldPrev = te->prev;
	TocEntry   *oldNext = te->next;
	TocEntry   *after;

	/* Unlink te from list */
	oldPrev->next = oldNext;
	oldNext->prev = oldPrev;

	/* and insert it after "pos"; read pos->next only after the unlink */
	after = pos->next;
	te->prev = pos;
	te->next = after;
	after->prev = te;
	pos->next = te;
}
#endif
1529

B
Bruce Momjian 已提交
1530 1531
/*
 * Move "te" so that it immediately precedes "pos" in the TOC list.
 */
static void
_moveBefore(ArchiveHandle *AH, TocEntry *pos, TocEntry *te)
{
	TocEntry   *oldPrev = te->prev;
	TocEntry   *oldNext = te->next;
	TocEntry   *before;

	/* Unlink te from list */
	oldPrev->next = oldNext;
	oldNext->prev = oldPrev;

	/* and insert it before "pos"; read pos->prev only after the unlink */
	before = pos->prev;
	te->prev = before;
	te->next = pos;
	before->next = te;
	pos->prev = te;
}
1543

1544 1545 1546 1547 1548 1549 1550
/*
 * Build index arrays for the TOC list
 *
 * This should be invoked only after we have created or read in all the TOC
 * items.
 *
 * The arrays are indexed by dump ID (so entry zero is unused).  Note that the
 * array entries run only up to maxDumpId.  We might see dependency dump IDs
 * beyond that (if the dump was partial); so always check the array bound
 * before trying to touch an array entry.
 */
static void
buildTocEntryArrays(ArchiveHandle *AH)
{
	DumpId		lastId = AH->maxDumpId;
	TocEntry   *te;

	AH->tocsByDumpId = (TocEntry **) pg_malloc0((lastId + 1) * sizeof(TocEntry *));
	AH->tableDataId = (DumpId *) pg_malloc0((lastId + 1) * sizeof(DumpId));

	for (te = AH->toc->next; te != AH->toc; te = te->next)
	{
		DumpId		tableId;

		/* this check is purely paranoia, maxDumpId should be correct */
		if (te->dumpId <= 0 || te->dumpId > lastId)
			exit_horribly(modulename, "bad dumpId\n");

		/* tocsByDumpId indexes all TOCs by their dump ID */
		AH->tocsByDumpId[te->dumpId] = te;

		/*
		 * tableDataId provides the TABLE DATA item's dump ID for each TABLE
		 * TOC entry that has a DATA item.  We compute this by reversing the
		 * TABLE DATA item's dependency, knowing that a TABLE DATA item has
		 * just one dependency and it is the TABLE item.
		 */
		if (strcmp(te->desc, "TABLE DATA") != 0 || te->nDeps <= 0)
			continue;

		tableId = te->dependencies[0];

		/*
		 * The TABLE item might not have been in the archive, if this was a
		 * data-only dump; but its dump ID should be less than its data
		 * item's dump ID, so there should be a place for it in the array.
		 */
		if (tableId <= 0 || tableId > lastId)
			exit_horribly(modulename, "bad table dumpId for TABLE DATA item\n");

		AH->tableDataId[tableId] = te->dumpId;
	}
}

A
Andrew Dunstan 已提交
1596
TocEntry *
1597 1598 1599 1600 1601 1602 1603 1604 1605
getTocEntryByDumpId(ArchiveHandle *AH, DumpId id)
{
	/* build index arrays if we didn't already */
	if (AH->tocsByDumpId == NULL)
		buildTocEntryArrays(AH);

	if (id > 0 && id <= AH->maxDumpId)
		return AH->tocsByDumpId[id];

B
Bruce Momjian 已提交
1606
	return NULL;
B
Bruce Momjian 已提交
1607 1608
}

1609
teReqs
1610
TocIDRequired(ArchiveHandle *AH, DumpId id)
B
Bruce Momjian 已提交
1611
{
1612
	TocEntry   *te = getTocEntryByDumpId(AH, id);
B
Bruce Momjian 已提交
1613

B
Bruce Momjian 已提交
1614 1615
	if (!te)
		return 0;
B
Bruce Momjian 已提交
1616

1617
	return te->reqs;
B
Bruce Momjian 已提交
1618 1619
}

1620
size_t
1621
WriteOffset(ArchiveHandle *AH, pgoff_t o, int wasSet)
1622
{
B
Bruce Momjian 已提交
1623
	int			off;
1624 1625 1626 1627

	/* Save the flag */
	(*AH->WriteBytePtr) (AH, wasSet);

1628 1629
	/* Write out pgoff_t smallest byte first, prevents endian mismatch */
	for (off = 0; off < sizeof(pgoff_t); off++)
1630
	{
B
Bruce Momjian 已提交
1631
		(*AH->WriteBytePtr) (AH, o & 0xFF);
1632 1633
		o >>= 8;
	}
1634
	return sizeof(pgoff_t) + 1;
1635 1636 1637
}

int
B
Bruce Momjian 已提交
1638
ReadOffset(ArchiveHandle *AH, pgoff_t * o)
1639
{
B
Bruce Momjian 已提交
1640 1641 1642
	int			i;
	int			off;
	int			offsetFlg;
1643 1644 1645 1646 1647 1648 1649 1650 1651 1652 1653

	/* Initialize to zero */
	*o = 0;

	/* Check for old version */
	if (AH->version < K_VERS_1_7)
	{
		/* Prior versions wrote offsets using WriteInt */
		i = ReadInt(AH);
		/* -1 means not set */
		if (i < 0)
B
Bruce Momjian 已提交
1654
			return K_OFFSET_POS_NOT_SET;
1655
		else if (i == 0)
B
Bruce Momjian 已提交
1656
			return K_OFFSET_NO_DATA;
1657

1658 1659
		/* Cast to pgoff_t because it was written as an int. */
		*o = (pgoff_t) i;
1660 1661 1662 1663
		return K_OFFSET_POS_SET;
	}

	/*
B
Bruce Momjian 已提交
1664 1665
	 * Read the flag indicating the state of the data pointer. Check if valid
	 * and die if not.
1666
	 *
1667 1668
	 * This used to be handled by a negative or zero pointer, now we use an
	 * extra byte specifically for the state.
1669 1670 1671 1672 1673 1674 1675 1676 1677
	 */
	offsetFlg = (*AH->ReadBytePtr) (AH) & 0xFF;

	switch (offsetFlg)
	{
		case K_OFFSET_POS_NOT_SET:
		case K_OFFSET_NO_DATA:
		case K_OFFSET_POS_SET:

B
Bruce Momjian 已提交
1678
			break;
1679 1680

		default:
1681
			exit_horribly(modulename, "unexpected data offset flag %d\n", offsetFlg);
1682 1683 1684 1685 1686 1687 1688
	}

	/*
	 * Read the bytes
	 */
	for (off = 0; off < AH->offSize; off++)
	{
1689 1690
		if (off < sizeof(pgoff_t))
			*o |= ((pgoff_t) ((*AH->ReadBytePtr) (AH))) << (off * 8);
1691 1692 1693
		else
		{
			if ((*AH->ReadBytePtr) (AH) != 0)
1694
				exit_horribly(modulename, "file offset in dump file is too large\n");
1695 1696 1697 1698 1699 1700
		}
	}

	return offsetFlg;
}

P
Peter Eisentraut 已提交
1701
size_t
B
Bruce Momjian 已提交
1702
WriteInt(ArchiveHandle *AH, int i)
B
Bruce Momjian 已提交
1703
{
B
Bruce Momjian 已提交
1704 1705 1706
	int			b;

	/*
B
Bruce Momjian 已提交
1707 1708 1709 1710 1711
	 * This is a bit yucky, but I don't want to make the binary format very
	 * dependent on representation, and not knowing much about it, I write out
	 * a sign byte. If you change this, don't forget to change the file
	 * version #, and modify readInt to read the new format AS WELL AS the old
	 * formats.
B
Bruce Momjian 已提交
1712 1713 1714 1715 1716 1717
	 */

	/* SIGN byte */
	if (i < 0)
	{
		(*AH->WriteBytePtr) (AH, 1);
1718
		i = -i;
B
Bruce Momjian 已提交
1719 1720 1721 1722 1723 1724 1725
	}
	else
		(*AH->WriteBytePtr) (AH, 0);

	for (b = 0; b < AH->intSize; b++)
	{
		(*AH->WriteBytePtr) (AH, i & 0xFF);
1726
		i >>= 8;
B
Bruce Momjian 已提交
1727 1728 1729
	}

	return AH->intSize + 1;
B
Bruce Momjian 已提交
1730 1731
}

B
Bruce Momjian 已提交
1732 1733
/*
 * Read an integer written by WriteInt: an optional sign byte (present in
 * archive versions after K_VERS_1_0) followed by AH->intSize magnitude
 * bytes, smallest byte first.
 *
 * The magnitude is assembled in an unsigned variable so that no signed
 * shift can overflow.  If the archive's integers are wider than ours, the
 * extra bytes must be zero; a non-zero one cannot be represented and is
 * reported as an error rather than shifted by more than the width of int
 * (which would be undefined behavior).
 */
int
ReadInt(ArchiveHandle *AH)
{
	unsigned int magnitude = 0;
	int			sign = 0;		/* Default positive */
	int			b;

	if (AH->version > K_VERS_1_0)
		/* Read a sign byte */
		sign = (*AH->ReadBytePtr) (AH);

	for (b = 0; b < AH->intSize; b++)
	{
		unsigned int bv = (unsigned int) ((*AH->ReadBytePtr) (AH) & 0xFF);

		if (bv == 0)
			continue;

		/* non-zero byte beyond the range of a local int */
		if ((size_t) b >= sizeof(int))
			exit_horribly(modulename, "integer in dump file is too large\n");

		magnitude |= bv << (b * 8);
	}

	/* negate in unsigned arithmetic to stay clear of signed overflow */
	if (sign)
		magnitude = 0U - magnitude;

	return (int) magnitude;
}

P
Peter Eisentraut 已提交
1759
size_t
1760
WriteStr(ArchiveHandle *AH, const char *c)
B
Bruce Momjian 已提交
1761
{
P
Peter Eisentraut 已提交
1762
	size_t		res;
1763 1764 1765 1766

	if (c)
	{
		res = WriteInt(AH, strlen(c));
B
Bruce Momjian 已提交
1767
		res += (*AH->WriteBufPtr) (AH, c, strlen(c));
1768 1769 1770 1771
	}
	else
		res = WriteInt(AH, -1);

B
Bruce Momjian 已提交
1772
	return res;
B
Bruce Momjian 已提交
1773 1774
}

B
Bruce Momjian 已提交
1775 1776
/*
 * Read a string written in the length-prefixed form: an integer length
 * followed by that many bytes.
 *
 * Returns NULL when the stored length is negative; otherwise returns a
 * NUL-terminated buffer obtained from pg_malloc.  Exits if fewer bytes
 * than announced can be read.
 */
char *
ReadStr(ArchiveHandle *AH)
{
	char	   *str;
	int			len = ReadInt(AH);

	/* a negative length marks a NULL string */
	if (len < 0)
		return NULL;

	str = (char *) pg_malloc(len + 1);
	if ((*AH->ReadBufPtr) (AH, (void *) str, len) != len)
		exit_horribly(modulename, "unexpected end of file\n");
	str[len] = '\0';

	return str;
}

T
Tom Lane 已提交
1796
static int
B
Bruce Momjian 已提交
1797
_discoverArchiveFormat(ArchiveHandle *AH)
B
Bruce Momjian 已提交
1798
{
B
Bruce Momjian 已提交
1799 1800
	FILE	   *fh;
	char		sig[6];			/* More than enough */
P
Peter Eisentraut 已提交
1801
	size_t		cnt;
B
Bruce Momjian 已提交
1802
	int			wantClose = 0;
B
Bruce Momjian 已提交
1803

1804
#if 0
1805
	write_msg(modulename, "attempting to ascertain archive format\n");
1806
#endif
1807 1808 1809 1810 1811

	if (AH->lookahead)
		free(AH->lookahead);

	AH->lookaheadSize = 512;
1812
	AH->lookahead = pg_malloc0(512);
1813 1814
	AH->lookaheadLen = 0;
	AH->lookaheadPos = 0;
1815

B
Bruce Momjian 已提交
1816 1817
	if (AH->fSpec)
	{
1818
		struct stat st;
1819

1820
		wantClose = 1;
1821 1822 1823 1824 1825 1826 1827 1828

		/*
		 * Check if the specified archive is a directory. If so, check if
		 * there's a "toc.dat" (or "toc.dat.gz") file in it.
		 */
		if (stat(AH->fSpec, &st) == 0 && S_ISDIR(st.st_mode))
		{
			char		buf[MAXPGPATH];
1829

1830
			if (snprintf(buf, MAXPGPATH, "%s/toc.dat", AH->fSpec) >= MAXPGPATH)
1831 1832
				exit_horribly(modulename, "directory name too long: \"%s\"\n",
							  AH->fSpec);
1833 1834 1835 1836 1837 1838 1839 1840
			if (stat(buf, &st) == 0 && S_ISREG(st.st_mode))
			{
				AH->format = archDirectory;
				return AH->format;
			}

#ifdef HAVE_LIBZ
			if (snprintf(buf, MAXPGPATH, "%s/toc.dat.gz", AH->fSpec) >= MAXPGPATH)
1841 1842
				exit_horribly(modulename, "directory name too long: \"%s\"\n",
							  AH->fSpec);
1843 1844 1845 1846 1847 1848
			if (stat(buf, &st) == 0 && S_ISREG(st.st_mode))
			{
				AH->format = archDirectory;
				return AH->format;
			}
#endif
1849 1850
			exit_horribly(modulename, "directory \"%s\" does not appear to be a valid archive (\"toc.dat\" does not exist)\n",
						  AH->fSpec);
1851
			fh = NULL;			/* keep compiler quiet */
1852 1853 1854 1855 1856
		}
		else
		{
			fh = fopen(AH->fSpec, PG_BINARY_R);
			if (!fh)
1857 1858
				exit_horribly(modulename, "could not open input file \"%s\": %s\n",
							  AH->fSpec, strerror(errno));
1859
		}
B
Bruce Momjian 已提交
1860 1861
	}
	else
1862
	{
1863
		fh = stdin;
1864
		if (!fh)
1865 1866
			exit_horribly(modulename, "could not open input file: %s\n",
						  strerror(errno));
1867
	}
B
Bruce Momjian 已提交
1868

B
Bruce Momjian 已提交
1869
	cnt = fread(sig, 1, 5, fh);
B
Bruce Momjian 已提交
1870

B
Bruce Momjian 已提交
1871
	if (cnt != 5)
1872 1873
	{
		if (ferror(fh))
1874
			exit_horribly(modulename, "could not read input file: %s\n", strerror(errno));
1875
		else
1876 1877
			exit_horribly(modulename, "input file is too short (read %lu, expected 5)\n",
						  (unsigned long) cnt);
1878
	}
B
Bruce Momjian 已提交
1879

B
Bruce Momjian 已提交
1880
	/* Save it, just in case we need it later */
1881 1882
	strncpy(&AH->lookahead[0], sig, 5);
	AH->lookaheadLen = 5;
B
Bruce Momjian 已提交
1883

B
Bruce Momjian 已提交
1884
	if (strncmp(sig, "PGDMP", 5) == 0)
1885
	{
1886 1887 1888 1889 1890
		/*
		 * Finish reading (most of) a custom-format header.
		 *
		 * NB: this code must agree with ReadHead().
		 */
1891 1892 1893 1894 1895 1896 1897 1898
		AH->vmaj = fgetc(fh);
		AH->vmin = fgetc(fh);

		/* Save these too... */
		AH->lookahead[AH->lookaheadLen++] = AH->vmaj;
		AH->lookahead[AH->lookaheadLen++] = AH->vmin;

		/* Check header version; varies from V1.0 */
B
Bruce Momjian 已提交
1899 1900
		if (AH->vmaj > 1 || ((AH->vmaj == 1) && (AH->vmin > 0)))		/* Version > 1.0 */
		{
1901 1902 1903 1904 1905 1906
			AH->vrev = fgetc(fh);
			AH->lookahead[AH->lookaheadLen++] = AH->vrev;
		}
		else
			AH->vrev = 0;

1907 1908 1909
		/* Make a convenient integer <maj><min><rev>00 */
		AH->version = ((AH->vmaj * 256 + AH->vmin) * 256 + AH->vrev) * 256 + 0;

1910 1911 1912
		AH->intSize = fgetc(fh);
		AH->lookahead[AH->lookaheadLen++] = AH->intSize;

1913 1914 1915 1916 1917 1918 1919 1920
		if (AH->version >= K_VERS_1_7)
		{
			AH->offSize = fgetc(fh);
			AH->lookahead[AH->lookaheadLen++] = AH->offSize;
		}
		else
			AH->offSize = AH->intSize;

1921 1922
		AH->format = fgetc(fh);
		AH->lookahead[AH->lookaheadLen++] = AH->format;
B
Bruce Momjian 已提交
1923 1924 1925
	}
	else
	{
1926
		/*
1927 1928
		 * *Maybe* we have a tar archive format file or a text dump ... So,
		 * read first 512 byte header...
1929 1930 1931
		 */
		cnt = fread(&AH->lookahead[AH->lookaheadLen], 1, 512 - AH->lookaheadLen, fh);
		AH->lookaheadLen += cnt;
B
Bruce Momjian 已提交
1932

1933 1934 1935 1936
		if (AH->lookaheadLen >= strlen(TEXT_DUMPALL_HEADER) &&
			(strncmp(AH->lookahead, TEXT_DUMP_HEADER, strlen(TEXT_DUMP_HEADER)) == 0 ||
			 strncmp(AH->lookahead, TEXT_DUMPALL_HEADER, strlen(TEXT_DUMPALL_HEADER)) == 0))
		{
1937 1938 1939 1940
			/*
			 * looks like it's probably a text format dump. so suggest they
			 * try psql
			 */
1941
			exit_horribly(modulename, "input file appears to be a text format dump. Please use psql.\n");
1942 1943
		}

1944
		if (AH->lookaheadLen != 512)
1945
			exit_horribly(modulename, "input file does not appear to be a valid archive (too short?)\n");
B
Bruce Momjian 已提交
1946

1947
		if (!isValidTarHeader(AH->lookahead))
1948
			exit_horribly(modulename, "input file does not appear to be a valid archive\n");
B
Bruce Momjian 已提交
1949

1950 1951
		AH->format = archTar;
	}
B
Bruce Momjian 已提交
1952

B
Bruce Momjian 已提交
1953
	/* If we can't seek, then mark the header as read */
P
Peter Eisentraut 已提交
1954
	if (fseeko(fh, 0, SEEK_SET) != 0)
1955 1956
	{
		/*
B
Bruce Momjian 已提交
1957 1958
		 * NOTE: Formats that use the lookahead buffer can unset this in their
		 * Init routine.
1959 1960 1961 1962
		 */
		AH->readHeader = 1;
	}
	else
B
Bruce Momjian 已提交
1963
		AH->lookaheadLen = 0;	/* Don't bother since we've reset the file */
1964

B
Bruce Momjian 已提交
1965 1966
	/* Close the file */
	if (wantClose)
1967
		if (fclose(fh) != 0)
1968 1969
			exit_horribly(modulename, "could not close input file: %s\n",
						  strerror(errno));
B
Bruce Momjian 已提交
1970

B
Bruce Momjian 已提交
1971
	return AH->format;
B
Bruce Momjian 已提交
1972 1973 1974 1975 1976 1977
}


/*
 * Allocate an archive handle
 */
B
Bruce Momjian 已提交
1978 1979
static ArchiveHandle *
_allocAH(const char *FileSpec, const ArchiveFormat fmt,
A
Andrew Dunstan 已提交
1980
	  const int compression, ArchiveMode mode, SetupWorkerPtr setupWorkerPtr)
1981
{
B
Bruce Momjian 已提交
1982
	ArchiveHandle *AH;
B
Bruce Momjian 已提交
1983

1984
#if 0
1985
	write_msg(modulename, "allocating AH for %s, format %d\n", FileSpec, fmt);
1986
#endif
1987

1988
	AH = (ArchiveHandle *) pg_malloc0(sizeof(ArchiveHandle));
B
Bruce Momjian 已提交
1989

1990 1991
	/* AH->debugLevel = 100; */

B
Bruce Momjian 已提交
1992 1993
	AH->vmaj = K_VERS_MAJOR;
	AH->vmin = K_VERS_MINOR;
1994
	AH->vrev = K_VERS_REV;
B
Bruce Momjian 已提交
1995

1996 1997 1998
	/* Make a convenient integer <maj><min><rev>00 */
	AH->version = ((AH->vmaj * 256 + AH->vmin) * 256 + AH->vrev) * 256 + 0;

1999
	/* initialize for backwards compatible string processing */
2000
	AH->public.encoding = 0;	/* PG_SQL_ASCII */
2001 2002 2003 2004 2005 2006
	AH->public.std_strings = false;

	/* sql error handling */
	AH->public.exit_on_error = true;
	AH->public.n_errors = 0;

2007 2008
	AH->archiveDumpVersion = PG_VERSION;

2009 2010
	AH->createDate = time(NULL);

B
Bruce Momjian 已提交
2011
	AH->intSize = sizeof(int);
2012
	AH->offSize = sizeof(pgoff_t);
B
Bruce Momjian 已提交
2013 2014
	if (FileSpec)
	{
2015
		AH->fSpec = pg_strdup(FileSpec);
B
Bruce Momjian 已提交
2016

2017 2018 2019
		/*
		 * Not used; maybe later....
		 *
2020
		 * AH->workDir = pg_strdup(FileSpec); for(i=strlen(FileSpec) ; i > 0 ;
2021
		 * i--) if (AH->workDir[i-1] == '/')
2022
		 */
B
Bruce Momjian 已提交
2023 2024
	}
	else
2025
		AH->fSpec = NULL;
B
Bruce Momjian 已提交
2026

2027 2028 2029
	AH->currUser = NULL;		/* unknown */
	AH->currSchema = NULL;		/* ditto */
	AH->currTablespace = NULL;	/* ditto */
2030
	AH->currWithOids = -1;		/* force SET */
B
Bruce Momjian 已提交
2031

2032
	AH->toc = (TocEntry *) pg_malloc0(sizeof(TocEntry));
B
Bruce Momjian 已提交
2033

B
Bruce Momjian 已提交
2034 2035 2036 2037 2038
	AH->toc->next = AH->toc;
	AH->toc->prev = AH->toc;

	AH->mode = mode;
	AH->compression = compression;
B
Bruce Momjian 已提交
2039

2040 2041
	memset(&(AH->sqlparse), 0, sizeof(AH->sqlparse));

B
Bruce Momjian 已提交
2042 2043 2044
	/* Open stdout with no compression for AH output handle */
	AH->gzOut = 0;
	AH->OF = stdout;
B
Bruce Momjian 已提交
2045

2046 2047
	/*
	 * On Windows, we need to use binary mode to read/write non-text archive
B
Bruce Momjian 已提交
2048 2049
	 * formats.  Force stdin/stdout into binary mode if that is what we are
	 * using.
2050 2051
	 */
#ifdef WIN32
2052 2053
	if (fmt != archNull &&
		(AH->fSpec == NULL || strcmp(AH->fSpec, "") == 0))
2054 2055 2056 2057 2058 2059 2060 2061
	{
		if (mode == archModeWrite)
			setmode(fileno(stdout), O_BINARY);
		else
			setmode(fileno(stdin), O_BINARY);
	}
#endif

A
Andrew Dunstan 已提交
2062 2063
	AH->SetupWorkerPtr = setupWorkerPtr;

B
Bruce Momjian 已提交
2064
	if (fmt == archUnknown)
2065 2066 2067
		AH->format = _discoverArchiveFormat(AH);
	else
		AH->format = fmt;
B
Bruce Momjian 已提交
2068

2069 2070
	AH->promptPassword = TRI_DEFAULT;

B
Bruce Momjian 已提交
2071 2072
	switch (AH->format)
	{
2073 2074 2075
		case archCustom:
			InitArchiveFmt_Custom(AH);
			break;
B
Bruce Momjian 已提交
2076

2077 2078 2079
		case archNull:
			InitArchiveFmt_Null(AH);
			break;
B
Bruce Momjian 已提交
2080

2081 2082 2083 2084
		case archDirectory:
			InitArchiveFmt_Directory(AH);
			break;

2085 2086 2087 2088 2089
		case archTar:
			InitArchiveFmt_Tar(AH);
			break;

		default:
2090
			exit_horribly(modulename, "unrecognized file format \"%d\"\n", fmt);
B
Bruce Momjian 已提交
2091
	}
B
Bruce Momjian 已提交
2092

B
Bruce Momjian 已提交
2093
	return AH;
B
Bruce Momjian 已提交
2094 2095
}

B
Bruce Momjian 已提交
2096
void
A
Andrew Dunstan 已提交
2097
WriteDataChunks(ArchiveHandle *AH, ParallelState *pstate)
B
Bruce Momjian 已提交
2098
{
2099
	TocEntry   *te;
B
Bruce Momjian 已提交
2100

2101
	for (te = AH->toc->next; te != AH->toc; te = te->next)
B
Bruce Momjian 已提交
2102
	{
A
Andrew Dunstan 已提交
2103 2104
		if (!te->dataDumper)
			continue;
B
Bruce Momjian 已提交
2105

A
Andrew Dunstan 已提交
2106 2107
		if ((te->reqs & REQ_DATA) == 0)
			continue;
B
Bruce Momjian 已提交
2108

A
Andrew Dunstan 已提交
2109 2110
		if (pstate && pstate->numWorkers > 1)
		{
B
Bruce Momjian 已提交
2111
			/*
A
Andrew Dunstan 已提交
2112 2113
			 * If we are in a parallel backup, then we are always the master
			 * process.
B
Bruce Momjian 已提交
2114
			 */
A
Andrew Dunstan 已提交
2115 2116 2117 2118 2119 2120 2121 2122 2123
			EnsureIdleWorker(AH, pstate);
			Assert(GetIdleWorker(pstate) != NO_SLOT);
			DispatchJobForTocEntry(AH, pstate, te, ACT_DUMP);
		}
		else
			WriteDataChunksForTocEntry(AH, te);
	}
	EnsureWorkersFinished(AH, pstate);
}
B
Bruce Momjian 已提交
2124

A
Andrew Dunstan 已提交
2125 2126 2127 2128 2129
/*
 * Write the data for a single TOC entry: call the format's start routine
 * (if any), run the entry's data dumper, then call the end routine (if
 * any).  Entries described as "BLOBS" use the blob start/end routines.
 * AH->currToc points at the entry for the duration of the call.
 */
void
WriteDataChunksForTocEntry(ArchiveHandle *AH, TocEntry *te)
{
	StartDataPtr beginFn;
	EndDataPtr	finishFn;
	int			isBlobs = (strcmp(te->desc, "BLOBS") == 0);

	AH->currToc = te;

	beginFn = isBlobs ? AH->StartBlobsPtr : AH->StartDataPtr;
	finishFn = isBlobs ? AH->EndBlobsPtr : AH->EndDataPtr;

	if (beginFn != NULL)
		(*beginFn) (AH, te);

	/*
	 * The user-provided DataDumper routine needs to call AH->WriteData
	 */
	(*te->dataDumper) ((Archive *) AH, te->dataDumperArg);

	if (finishFn != NULL)
		(*finishFn) (AH, te);

	AH->currToc = NULL;
}

B
Bruce Momjian 已提交
2158 2159
/*
 * Write the table of contents to the archive.
 *
 * Writes the number of entries whose reqs include REQ_SCHEMA, REQ_DATA or
 * REQ_SPECIAL, then each such entry's fields in a fixed order, its
 * dependency list (terminated by a NULL string) and any format-specific
 * extra data.
 */
void
WriteToc(ArchiveHandle *AH)
{
	const int	dumpMask = REQ_SCHEMA | REQ_DATA | REQ_SPECIAL;
	TocEntry   *entry;
	char		numbuf[32];
	int			nEntries = 0;
	int			dep;

	/* first pass: count the entries that will really be written */
	for (entry = AH->toc->next; entry != AH->toc; entry = entry->next)
	{
		if ((entry->reqs & dumpMask) != 0)
			nEntries++;
	}

	/* printf("%d TOC Entries to save\n", tocCount); */

	WriteInt(AH, nEntries);

	/* second pass: emit each selected entry */
	entry = AH->toc->next;
	while (entry != AH->toc)
	{
		if ((entry->reqs & dumpMask) != 0)
		{
			WriteInt(AH, entry->dumpId);
			WriteInt(AH, entry->dataDumper ? 1 : 0);

			/* OID is recorded as a string for historical reasons */
			sprintf(numbuf, "%u", entry->catalogId.tableoid);
			WriteStr(AH, numbuf);
			sprintf(numbuf, "%u", entry->catalogId.oid);
			WriteStr(AH, numbuf);

			WriteStr(AH, entry->tag);
			WriteStr(AH, entry->desc);
			WriteInt(AH, entry->section);
			WriteStr(AH, entry->defn);
			WriteStr(AH, entry->dropStmt);
			WriteStr(AH, entry->copyStmt);
			WriteStr(AH, entry->namespace);
			WriteStr(AH, entry->tablespace);
			WriteStr(AH, entry->owner);
			WriteStr(AH, entry->withOids ? "true" : "false");

			/* dependencies go out as decimal strings, NULL marks the end */
			for (dep = 0; dep < entry->nDeps; dep++)
			{
				sprintf(numbuf, "%d", entry->dependencies[dep]);
				WriteStr(AH, numbuf);
			}
			WriteStr(AH, NULL);

			if (AH->WriteExtraTocPtr)
				(*AH->WriteExtraTocPtr) (AH, entry);
		}

		entry = entry->next;
	}
}

B
Bruce Momjian 已提交
2216 2217
/*
 * Read the table of contents from the archive.
 *
 * Reads the entry count into AH->tocCount, then reads each entry, honoring
 * the fields that exist in the archive's version, and appends it to the
 * circular TOC list.  AH->maxDumpId ends up as the largest dump ID seen.
 * ENCODING and STDSTRINGS entries are processed as soon as they are read.
 * Exits if an entry has a non-positive dump ID.
 */
void
ReadToc(ArchiveHandle *AH)
{
	int			i;
	char	   *tmp;
	DumpId	   *deps;
	int			depIdx;
	int			depSize;
	TocEntry   *te;

	AH->tocCount = ReadInt(AH);
	AH->maxDumpId = 0;

	for (i = 0; i < AH->tocCount; i++)
	{
		te = (TocEntry *) pg_malloc0(sizeof(TocEntry));
		te->dumpId = ReadInt(AH);

		if (te->dumpId > AH->maxDumpId)
			AH->maxDumpId = te->dumpId;

		/* Sanity check */
		if (te->dumpId <= 0)
			exit_horribly(modulename,
					   "entry ID %d out of range -- perhaps a corrupt TOC\n",
						  te->dumpId);

		te->hadDumper = ReadInt(AH);

		/* The table OID is stored only from version 1.8 on */
		if (AH->version >= K_VERS_1_8)
		{
			tmp = ReadStr(AH);
			sscanf(tmp, "%u", &te->catalogId.tableoid);
			free(tmp);
		}
		else
			te->catalogId.tableoid = InvalidOid;
		tmp = ReadStr(AH);
		sscanf(tmp, "%u", &te->catalogId.oid);
		free(tmp);

		te->tag = ReadStr(AH);
		te->desc = ReadStr(AH);

		if (AH->version >= K_VERS_1_11)
		{
			te->section = ReadInt(AH);
		}
		else
		{
			/*
			 * Rules for pre-8.4 archives wherein pg_dump hasn't classified
			 * the entries into sections.  This list need not cover entry
			 * types added later than 8.4.
			 */
			if (strcmp(te->desc, "COMMENT") == 0 ||
				strcmp(te->desc, "ACL") == 0 ||
				strcmp(te->desc, "ACL LANGUAGE") == 0)
				te->section = SECTION_NONE;
			else if (strcmp(te->desc, "TABLE DATA") == 0 ||
					 strcmp(te->desc, "BLOBS") == 0 ||
					 strcmp(te->desc, "BLOB COMMENTS") == 0)
				te->section = SECTION_DATA;
			else if (strcmp(te->desc, "CONSTRAINT") == 0 ||
					 strcmp(te->desc, "CHECK CONSTRAINT") == 0 ||
					 strcmp(te->desc, "FK CONSTRAINT") == 0 ||
					 strcmp(te->desc, "INDEX") == 0 ||
					 strcmp(te->desc, "RULE") == 0 ||
					 strcmp(te->desc, "TRIGGER") == 0)
				te->section = SECTION_POST_DATA;
			else
				te->section = SECTION_PRE_DATA;
		}

		te->defn = ReadStr(AH);
		te->dropStmt = ReadStr(AH);

		if (AH->version >= K_VERS_1_3)
			te->copyStmt = ReadStr(AH);

		if (AH->version >= K_VERS_1_6)
			te->namespace = ReadStr(AH);

		if (AH->version >= K_VERS_1_10)
			te->tablespace = ReadStr(AH);

		te->owner = ReadStr(AH);
		if (AH->version >= K_VERS_1_9)
		{
			/*
			 * The flag is stored as the string "true" or "false".  Keep the
			 * returned string in tmp so it can be freed, and treat a NULL
			 * string as "not true" rather than passing it to strcmp.
			 */
			tmp = ReadStr(AH);
			if (tmp != NULL && strcmp(tmp, "true") == 0)
				te->withOids = true;
			else
				te->withOids = false;
			free(tmp);
		}
		else
			te->withOids = true;

		/* Read TOC entry dependencies */
		if (AH->version >= K_VERS_1_5)
		{
			depSize = 100;
			deps = (DumpId *) pg_malloc(sizeof(DumpId) * depSize);
			depIdx = 0;
			for (;;)
			{
				tmp = ReadStr(AH);
				if (!tmp)
					break;		/* end of list */
				/* double the array whenever it fills up */
				if (depIdx >= depSize)
				{
					depSize *= 2;
					deps = (DumpId *) pg_realloc(deps, sizeof(DumpId) * depSize);
				}
				sscanf(tmp, "%d", &deps[depIdx]);
				free(tmp);
				depIdx++;
			}

			if (depIdx > 0)		/* We have a non-null entry */
			{
				/* shrink the array to the number of entries actually read */
				deps = (DumpId *) pg_realloc(deps, sizeof(DumpId) * depIdx);
				te->dependencies = deps;
				te->nDeps = depIdx;
			}
			else
			{
				free(deps);
				te->dependencies = NULL;
				te->nDeps = 0;
			}
		}
		else
		{
			te->dependencies = NULL;
			te->nDeps = 0;
		}

		if (AH->ReadExtraTocPtr)
			(*AH->ReadExtraTocPtr) (AH, te);

		ahlog(AH, 3, "read TOC entry %d (ID %d) for %s %s\n",
			  i, te->dumpId, te->desc, te->tag);

		/* link completed entry into TOC circular list */
		te->prev = AH->toc->prev;
		AH->toc->prev->next = te;
		AH->toc->prev = te;
		te->next = AH->toc;

		/* special processing immediately upon read for some items */
		if (strcmp(te->desc, "ENCODING") == 0)
			processEncodingEntry(AH, te);
		else if (strcmp(te->desc, "STDSTRINGS") == 0)
			processStdStringsEntry(AH, te);
	}
}

2373 2374 2375 2376
/*
 * Extract the encoding name from an ENCODING TOC entry and store the
 * corresponding encoding ID in AH->public.encoding.
 *
 * te->defn should have the form SET client_encoding = 'foo';
 * Exits if no quoted name is found or the name is not a known encoding.
 */
static void
processEncodingEntry(ArchiveHandle *AH, TocEntry *te)
{
	/* work on a private copy, since the closing quote gets overwritten */
	char	   *copy = pg_strdup(te->defn);
	char	   *name = NULL;
	char	   *quoteEnd = NULL;
	char	   *quoteStart = strchr(copy, '\'');

	if (quoteStart)
	{
		name = quoteStart + 1;
		quoteEnd = strchr(name, '\'');
	}

	if (quoteEnd == NULL)
		exit_horribly(modulename, "invalid ENCODING item: %s\n",
					  te->defn);
	else
	{
		int			enc;

		*quoteEnd = '\0';
		enc = pg_char_to_encoding(name);
		if (enc < 0)
			exit_horribly(modulename, "unrecognized encoding \"%s\"\n",
						  name);
		AH->public.encoding = enc;
	}

	free(copy);
}

/*
 * Set AH->public.std_strings from a STDSTRINGS TOC entry.
 *
 * te->defn should have the form SET standard_conforming_strings = 'x';
 * where the text starting at the first quote is 'on' or 'off'.  Exits on
 * anything else.
 */
static void
processStdStringsEntry(ArchiveHandle *AH, TocEntry *te)
{
	char	   *quote = strchr(te->defn, '\'');
	int			isOn = (quote && strncmp(quote, "'on'", 4) == 0);
	int			isOff = (!isOn && quote && strncmp(quote, "'off'", 5) == 0);

	if (isOn || isOff)
		AH->public.std_strings = isOn ? true : false;
	else
		exit_horribly(modulename, "invalid STDSTRINGS item: %s\n",
					  te->defn);
}

2417
static teReqs
2418
_tocEntryRequired(TocEntry *te, teSection curSection, RestoreOptions *ropt)
B
Bruce Momjian 已提交
2419
{
2420
	teReqs		res = REQ_SCHEMA | REQ_DATA;
B
Bruce Momjian 已提交
2421

2422
	/* ENCODING and STDSTRINGS items are treated specially */
2423 2424
	if (strcmp(te->desc, "ENCODING") == 0 ||
		strcmp(te->desc, "STDSTRINGS") == 0)
2425
		return REQ_SPECIAL;
2426

B
Bruce Momjian 已提交
2427
	/* If it's an ACL, maybe ignore it */
2428
	if (ropt->aclsSkip && _tocEntryIsACL(te))
2429
		return 0;
B
Bruce Momjian 已提交
2430

R
Robert Haas 已提交
2431
	/* If it's security labels, maybe ignore it */
2432
	if (ropt->no_security_labels && strcmp(te->desc, "SECURITY LABEL") == 0)
R
Robert Haas 已提交
2433 2434
		return 0;

2435 2436
	/* Ignore it if section is not to be dumped/restored */
	switch (curSection)
2437
	{
2438 2439 2440 2441 2442 2443 2444 2445 2446 2447 2448 2449 2450 2451
		case SECTION_PRE_DATA:
			if (!(ropt->dumpSections & DUMP_PRE_DATA))
				return 0;
			break;
		case SECTION_DATA:
			if (!(ropt->dumpSections & DUMP_DATA))
				return 0;
			break;
		case SECTION_POST_DATA:
			if (!(ropt->dumpSections & DUMP_POST_DATA))
				return 0;
			break;
		default:
			/* shouldn't get here, really, but ignore it */
2452 2453 2454
			return 0;
	}

2455 2456 2457 2458 2459 2460 2461 2462 2463 2464
	/* Check options for selective dump/restore */
	if (ropt->schemaNames)
	{
		/* If no namespace is specified, it means all. */
		if (!te->namespace)
			return 0;
		if (strcmp(ropt->schemaNames, te->namespace) != 0)
			return 0;
	}

B
Bruce Momjian 已提交
2465 2466
	if (ropt->selTypes)
	{
2467 2468
		if (strcmp(te->desc, "TABLE") == 0 ||
			strcmp(te->desc, "TABLE DATA") == 0)
2469 2470 2471
		{
			if (!ropt->selTable)
				return 0;
2472
			if (ropt->tableNames.head != NULL && (!(simple_string_list_member(&ropt->tableNames, te->tag))))
2473
				return 0;
B
Bruce Momjian 已提交
2474 2475 2476
		}
		else if (strcmp(te->desc, "INDEX") == 0)
		{
2477 2478
			if (!ropt->selIndex)
				return 0;
2479
			if (ropt->indexNames && strcmp(ropt->indexNames, te->tag) != 0)
2480
				return 0;
B
Bruce Momjian 已提交
2481 2482 2483
		}
		else if (strcmp(te->desc, "FUNCTION") == 0)
		{
2484 2485
			if (!ropt->selFunction)
				return 0;
2486
			if (ropt->functionNames && strcmp(ropt->functionNames, te->tag) != 0)
2487
				return 0;
B
Bruce Momjian 已提交
2488 2489 2490
		}
		else if (strcmp(te->desc, "TRIGGER") == 0)
		{
2491 2492
			if (!ropt->selTrigger)
				return 0;
2493
			if (ropt->triggerNames && strcmp(ropt->triggerNames, te->tag) != 0)
2494 2495
				return 0;
		}
B
Bruce Momjian 已提交
2496 2497
		else
			return 0;
B
Bruce Momjian 已提交
2498 2499
	}

2500
	/*
B
Bruce Momjian 已提交
2501
	 * Check if we had a dataDumper. Indicates if the entry is schema or data
2502 2503 2504 2505
	 */
	if (!te->hadDumper)
	{
		/*
B
Bruce Momjian 已提交
2506 2507 2508 2509 2510
		 * Special Case: If 'SEQUENCE SET' or anything to do with BLOBs, then
		 * it is considered a data entry.  We don't need to check for the
		 * BLOBS entry or old-style BLOB COMMENTS, because they will have
		 * hadDumper = true ... but we do need to check new-style BLOB
		 * comments.
2511
		 */
2512 2513 2514 2515 2516
		if (strcmp(te->desc, "SEQUENCE SET") == 0 ||
			strcmp(te->desc, "BLOB") == 0 ||
			(strcmp(te->desc, "ACL") == 0 &&
			 strncmp(te->tag, "LARGE OBJECT ", 13) == 0) ||
			(strcmp(te->desc, "COMMENT") == 0 &&
R
Robert Haas 已提交
2517 2518
			 strncmp(te->tag, "LARGE OBJECT ", 13) == 0) ||
			(strcmp(te->desc, "SECURITY LABEL") == 0 &&
2519
			 strncmp(te->tag, "LARGE OBJECT ", 13) == 0))
2520 2521
			res = res & REQ_DATA;
		else
2522 2523
			res = res & ~REQ_DATA;
	}
2524

2525
	/*
B
Bruce Momjian 已提交
2526 2527
	 * Special case: <Init> type with <Max OID> tag; this is obsolete and we
	 * always ignore it.
2528
	 */
2529
	if ((strcmp(te->desc, "<Init>") == 0) && (strcmp(te->tag, "Max OID") == 0))
2530
		return 0;
2531

B
Bruce Momjian 已提交
2532 2533
	/* Mask it if we only want schema */
	if (ropt->schemaOnly)
2534
		res = res & REQ_SCHEMA;
B
Bruce Momjian 已提交
2535

2536
	/* Mask it if we only want data */
2537
	if (ropt->dataOnly)
2538
		res = res & REQ_DATA;
B
Bruce Momjian 已提交
2539

2540
	/* Mask it if we don't have a schema contribution */
B
Bruce Momjian 已提交
2541
	if (!te->defn || strlen(te->defn) == 0)
2542
		res = res & ~REQ_SCHEMA;
B
Bruce Momjian 已提交
2543

2544 2545
	/* Finally, if there's a per-ID filter, limit based on that as well */
	if (ropt->idWanted && !ropt->idWanted[te->dumpId - 1])
2546
		return 0;
B
Bruce Momjian 已提交
2547

B
Bruce Momjian 已提交
2548
	return res;
B
Bruce Momjian 已提交
2549 2550
}

2551 2552 2553 2554 2555 2556 2557 2558 2559 2560 2561 2562 2563 2564
/*
 * Report whether a TOC entry is an ACL, judging by its description.
 *
 * "ACL LANGUAGE" was a crock emitted only in PG 7.4.
 */
static bool
_tocEntryIsACL(TocEntry *te)
{
	return (strcmp(te->desc, "ACL") == 0 ||
			strcmp(te->desc, "ACL LANGUAGE") == 0 ||
			strcmp(te->desc, "DEFAULT ACL") == 0);
}

2565 2566 2567 2568 2569 2570 2571
/*
 * Emit the SET commands whose values must stay the same for the whole
 * duration of a restore script.
 */
static void
_doSetFixedOutputState(ArchiveHandle *AH)
{
	const char *encodingName;
	const char *stdStrings;

	/* Restores tend to be slow, so switch off both timeouts */
	ahprintf(AH, "SET statement_timeout = 0;\n");
	ahprintf(AH, "SET lock_timeout = 0;\n");

	/* Character set encoding recorded for the archive */
	encodingName = pg_encoding_to_char(AH->public.encoding);
	ahprintf(AH, "SET client_encoding = '%s';\n", encodingName);

	/* String literal syntax recorded for the archive */
	stdStrings = AH->public.std_strings ? "on" : "off";
	ahprintf(AH, "SET standard_conforming_strings = %s;\n", stdStrings);

	/* Role to use during restore, when one was requested */
	if (AH->ropt && AH->ropt->use_role)
		ahprintf(AH, "SET ROLE %s;\n", fmtId(AH->ropt->use_role));

	/* Function bodies must not be checked */
	ahprintf(AH, "SET check_function_bodies = false;\n");

	/* Keep the noise down */
	ahprintf(AH, "SET client_min_messages = warning;\n");
	if (!AH->public.std_strings)
		ahprintf(AH, "SET escape_string_warning = off;\n");

	ahprintf(AH, "\n");
}

2601 2602
/*
 * Issue a SET SESSION AUTHORIZATION command.  Caller is responsible
2603 2604
 * for updating state if appropriate.  If user is NULL or an empty string,
 * the specification DEFAULT will be used.
2605 2606
 */
static void
2607
_doSetSessionAuth(ArchiveHandle *AH, const char *user)
2608
{
2609
	PQExpBuffer cmd = createPQExpBuffer();
B
Bruce Momjian 已提交
2610

2611
	appendPQExpBuffer(cmd, "SET SESSION AUTHORIZATION ");
B
Bruce Momjian 已提交
2612

2613 2614 2615 2616
	/*
	 * SQL requires a string literal here.	Might as well be correct.
	 */
	if (user && *user)
2617
		appendStringLiteralAHX(cmd, user, AH);
2618 2619 2620 2621
	else
		appendPQExpBuffer(cmd, "DEFAULT");
	appendPQExpBuffer(cmd, ";");

2622 2623 2624 2625
	if (RestoringToDB(AH))
	{
		PGresult   *res;

2626
		res = PQexec(AH->connection, cmd->data);
2627 2628

		if (!res || PQresultStatus(res) != PGRES_COMMAND_OK)
2629 2630 2631
			/* NOT warn_or_exit_horribly... use -O instead to skip this. */
			exit_horribly(modulename, "could not set session user to \"%s\": %s",
						  user, PQerrorMessage(AH->connection));
2632 2633 2634 2635

		PQclear(res);
	}
	else
2636 2637 2638
		ahprintf(AH, "%s\n\n", cmd->data);

	destroyPQExpBuffer(cmd);
2639 2640
}

2641

2642 2643 2644 2645 2646 2647 2648 2649 2650 2651
/*
 * Issue a SET default_with_oids command, either by executing it on the
 * live connection or by writing it to the output.  The caller is
 * responsible for updating any tracked state.
 */
static void
_doSetWithOids(ArchiveHandle *AH, const bool withOids)
{
	PQExpBuffer stmt = createPQExpBuffer();
	const char *setting = withOids ? "true" : "false";

	appendPQExpBuffer(stmt, "SET default_with_oids = %s;", setting);

	if (!RestoringToDB(AH))
		ahprintf(AH, "%s\n\n", stmt->data);
	else
	{
		PGresult   *result = PQexec(AH->connection, stmt->data);

		if (!result || PQresultStatus(result) != PGRES_COMMAND_OK)
			warn_or_exit_horribly(AH, modulename,
								  "could not set default_with_oids: %s",
								  PQerrorMessage(AH->connection));

		PQclear(result);
	}

	destroyPQExpBuffer(stmt);
}


2674
/*
2675
 * Issue the commands to connect to the specified database.
2676 2677
 *
 * If we're currently restoring right into a database, this will
B
Bruce Momjian 已提交
2678
 * actually establish a connection. Otherwise it puts a \connect into
2679
 * the script output.
2680 2681
 *
 * NULL dbname implies reconnecting to the current DB (pretty useless).
2682
 */
B
Bruce Momjian 已提交
2683
static void
2684
_reconnectToDB(ArchiveHandle *AH, const char *dbname)
2685
{
2686
	if (RestoringToDB(AH))
2687
		ReconnectToServer(AH, dbname, NULL);
2688
	else
2689 2690 2691
	{
		PQExpBuffer qry = createPQExpBuffer();

2692
		appendPQExpBuffer(qry, "\\connect %s\n\n",
2693
						  dbname ? fmtId(dbname) : "-");
2694
		ahprintf(AH, "%s", qry->data);
2695 2696
		destroyPQExpBuffer(qry);
	}
2697

2698
	/*
B
Bruce Momjian 已提交
2699 2700
	 * NOTE: currUser keeps track of what the imaginary session user in our
	 * script is.  It's now effectively reset to the original userID.
2701
	 */
2702 2703
	if (AH->currUser)
		free(AH->currUser);
2704
	AH->currUser = NULL;
2705

2706
	/* don't assume we still know the output schema, tablespace, etc either */
2707 2708
	if (AH->currSchema)
		free(AH->currSchema);
2709 2710 2711 2712
	AH->currSchema = NULL;
	if (AH->currTablespace)
		free(AH->currTablespace);
	AH->currTablespace = NULL;
2713
	AH->currWithOids = -1;
B
Bruce Momjian 已提交
2714

2715 2716
	/* re-establish fixed state */
	_doSetFixedOutputState(AH);
2717 2718
}

2719 2720 2721 2722 2723 2724 2725 2726 2727 2728 2729 2730 2731 2732 2733 2734 2735
/*
 * Switch the session to the given user unless that user is already the
 * tracked current one, and remember the new user in AH->currUser.
 *
 * A NULL or empty argument means restoring the session default.
 */
static void
_becomeUser(ArchiveHandle *AH, const char *user)
{
	/* normalize NULL to "" so the comparisons below are safe */
	const char *target = user ? user : "";

	/* already that user: nothing to issue */
	if (AH->currUser != NULL && strcmp(AH->currUser, target) == 0)
		return;

	_doSetSessionAuth(AH, target);

	/*
	 * NOTE: currUser keeps track of what the imaginary session user in our
	 * script is.  (free() accepts NULL, so no guard is needed.)
	 */
	free(AH->currUser);
	AH->currUser = pg_strdup(target);
}
2743 2744

/*
2745
 * Become the owner of the given TOC entry object.	If
2746 2747
 * changes in ownership are not allowed, this doesn't do anything.
 */
B
Bruce Momjian 已提交
2748
static void
2749
_becomeOwner(ArchiveHandle *AH, TocEntry *te)
2750
{
2751
	if (AH->ropt && (AH->ropt->noOwner || !AH->ropt->use_setsessauth))
2752 2753
		return;

2754
	_becomeUser(AH, te->owner);
2755 2756
}

2757

2758 2759 2760 2761 2762 2763 2764 2765 2766 2767 2768 2769 2770 2771
/*
 * Make default_with_oids match the given table entry, issuing a SET only
 * when the tracked value differs.
 */
static void
_setWithOids(ArchiveHandle *AH, TocEntry *te)
{
	if (AH->currWithOids == te->withOids)
		return;					/* already in the right state */

	_doSetWithOids(AH, te->withOids);
	AH->currWithOids = te->withOids;
}


2772 2773 2774 2775 2776 2777 2778
/*
 * Make the specified schema the current one in the target database by
 * setting search_path (with pg_catalog appended unless it is the schema
 * itself), and remember it in AH->currSchema.  Does nothing for a NULL or
 * empty name, or when the schema is already the tracked current one.
 */
static void
_selectOutputSchema(ArchiveHandle *AH, const char *schemaName)
{
	PQExpBuffer pathCmd;

	/* no schema given: nothing to select */
	if (schemaName == NULL || *schemaName == '\0')
		return;

	/* already selected: nothing to issue */
	if (AH->currSchema != NULL && strcmp(AH->currSchema, schemaName) == 0)
		return;

	pathCmd = createPQExpBuffer();

	appendPQExpBuffer(pathCmd, "SET search_path = %s",
					  fmtId(schemaName));
	if (strcmp(schemaName, "pg_catalog") != 0)
		appendPQExpBuffer(pathCmd, ", pg_catalog");

	if (!RestoringToDB(AH))
		ahprintf(AH, "%s;\n\n", pathCmd->data);
	else
	{
		PGresult   *result = PQexec(AH->connection, pathCmd->data);

		if (!result || PQresultStatus(result) != PGRES_COMMAND_OK)
			warn_or_exit_horribly(AH, modulename,
								  "could not set search_path to \"%s\": %s",
								  schemaName, PQerrorMessage(AH->connection));

		PQclear(result);
	}

	/* free() accepts NULL, so no guard is needed */
	free(AH->currSchema);
	AH->currSchema = pg_strdup(schemaName);

	destroyPQExpBuffer(pathCmd);
}

2815 2816 2817 2818 2819 2820 2821 2822
/*
 * Make the given tablespace the default_tablespace of the target.
 *
 * A NULL tablespace (an object that has no tablespace) and the
 * --no-tablespaces mode both result in no action.  An empty string selects
 * the database's default tablespace.  AH->currTablespace remembers the
 * selection so that repeated requests emit nothing.
 */
static void
_selectTablespace(ArchiveHandle *AH, const char *tablespace)
{
	PQExpBuffer cmd;

	/* --no-tablespaces mode: never touch the setting */
	if (AH->ropt->noTablespace)
		return;

	/* objects without a tablespace need nothing */
	if (tablespace == NULL)
		return;

	/* already selected? */
	if (AH->currTablespace != NULL &&
		strcmp(tablespace, AH->currTablespace) == 0)
		return;

	cmd = createPQExpBuffer();

	if (tablespace[0] != '\0')
	{
		/* an explicitly named tablespace */
		appendPQExpBuffer(cmd, "SET default_tablespace = %s",
						  fmtId(tablespace));
	}
	else
	{
		/* fall back to the database's default tablespace */
		appendPQExpBuffer(cmd, "SET default_tablespace = ''");
	}

	if (!RestoringToDB(AH))
	{
		ahprintf(AH, "%s;\n\n", cmd->data);
	}
	else
	{
		PGresult   *res = PQexec(AH->connection, cmd->data);

		if (res == NULL || PQresultStatus(res) != PGRES_COMMAND_OK)
			warn_or_exit_horribly(AH, modulename,
								"could not set default_tablespace to %s: %s",
								fmtId(tablespace),
								PQerrorMessage(AH->connection));

		PQclear(res);
	}

	/* Remember what we selected */
	free(AH->currTablespace);
	AH->currTablespace = pg_strdup(tablespace);

	destroyPQExpBuffer(cmd);
}
2875

2876 2877 2878 2879 2880 2881 2882 2883
/*
 * Extract an object description for a TOC entry, and append it to buf.
 *
 * This is not quite as general as it may seem, since it really only
 * handles constructing the right thing to put into ALTER ... OWNER TO.
 *
 * The whole thing is pretty grotty, but we are kind of stuck since the
 * information used is all that's available in older dump files.
2884
 */
2885
static void
2886
_getObjectDescription(PQExpBuffer buf, TocEntry *te, ArchiveHandle *AH)
2887
{
2888 2889 2890
	const char *type = te->desc;

	/* Use ALTER TABLE for views and sequences */
A
Andrew Dunstan 已提交
2891
	if (strcmp(type, "VIEW") == 0 || strcmp(type, "SEQUENCE") == 0 ||
2892
		strcmp(type, "MATERIALIZED VIEW") == 0)
2893 2894 2895
		type = "TABLE";

	/* objects named by a schema and name */
P
Peter Eisentraut 已提交
2896 2897
	if (strcmp(type, "COLLATION") == 0 ||
		strcmp(type, "CONVERSION") == 0 ||
2898 2899
		strcmp(type, "DOMAIN") == 0 ||
		strcmp(type, "TABLE") == 0 ||
2900
		strcmp(type, "TYPE") == 0 ||
R
Robert Haas 已提交
2901
		strcmp(type, "FOREIGN TABLE") == 0 ||
2902 2903
		strcmp(type, "TEXT SEARCH DICTIONARY") == 0 ||
		strcmp(type, "TEXT SEARCH CONFIGURATION") == 0)
2904
	{
2905
		appendPQExpBuffer(buf, "%s ", type);
B
Bruce Momjian 已提交
2906
		if (te->namespace && te->namespace[0])	/* is null pre-7.3 */
2907
			appendPQExpBuffer(buf, "%s.", fmtId(te->namespace));
B
Bruce Momjian 已提交
2908

2909
		/*
B
Bruce Momjian 已提交
2910 2911 2912
		 * Pre-7.3 pg_dump would sometimes (not always) put a fmtId'd name
		 * into te->tag for an index. This check is heuristic, so make its
		 * scope as narrow as possible.
2913 2914 2915
		 */
		if (AH->version < K_VERS_1_7 &&
			te->tag[0] == '"' &&
B
Bruce Momjian 已提交
2916
			te->tag[strlen(te->tag) - 1] == '"' &&
2917 2918 2919 2920
			strcmp(type, "INDEX") == 0)
			appendPQExpBuffer(buf, "%s", te->tag);
		else
			appendPQExpBuffer(buf, "%s", fmtId(te->tag));
2921 2922
		return;
	}
2923

2924 2925
	/* objects named by just a name */
	if (strcmp(type, "DATABASE") == 0 ||
2926
		strcmp(type, "PROCEDURAL LANGUAGE") == 0 ||
2927 2928 2929 2930
		strcmp(type, "SCHEMA") == 0 ||
		strcmp(type, "FOREIGN DATA WRAPPER") == 0 ||
		strcmp(type, "SERVER") == 0 ||
		strcmp(type, "USER MAPPING") == 0)
2931 2932 2933 2934
	{
		appendPQExpBuffer(buf, "%s %s", type, fmtId(te->tag));
		return;
	}
2935

2936 2937 2938 2939 2940 2941 2942
	/* BLOBs just have a name, but it's numeric so must not use fmtId */
	if (strcmp(type, "BLOB") == 0)
	{
		appendPQExpBuffer(buf, "LARGE OBJECT %s", te->tag);
		return;
	}

B
Bruce Momjian 已提交
2943
	/*
B
Bruce Momjian 已提交
2944 2945
	 * These object types require additional decoration.  Fortunately, the
	 * information needed is exactly what's in the DROP command.
B
Bruce Momjian 已提交
2946
	 */
2947 2948 2949
	if (strcmp(type, "AGGREGATE") == 0 ||
		strcmp(type, "FUNCTION") == 0 ||
		strcmp(type, "OPERATOR") == 0 ||
2950 2951
		strcmp(type, "OPERATOR CLASS") == 0 ||
		strcmp(type, "OPERATOR FAMILY") == 0)
B
Bruce Momjian 已提交
2952
	{
2953
		/* Chop "DROP " off the front and make a modifiable copy */
2954
		char	   *first = pg_strdup(te->dropStmt + 5);
2955
		char	   *last;
2956

2957 2958
		/* point to last character in string */
		last = first + strlen(first) - 1;
2959

2960 2961 2962 2963
		/* Strip off any ';' or '\n' at the end */
		while (last >= first && (*last == '\n' || *last == ';'))
			last--;
		*(last + 1) = '\0';
B
Bruce Momjian 已提交
2964

2965
		appendPQExpBufferStr(buf, first);
B
Bruce Momjian 已提交
2966 2967

		free(first);
2968
		return;
2969 2970
	}

2971 2972
	write_msg(modulename, "WARNING: don't know how to set owner for object type %s\n",
			  type);
2973 2974 2975
}

static void
2976
_printTocEntry(ArchiveHandle *AH, TocEntry *te, RestoreOptions *ropt, bool isData, bool acl_pass)
B
Bruce Momjian 已提交
2977
{
2978 2979 2980
	/* ACLs are dumped only during acl pass */
	if (acl_pass)
	{
2981
		if (!_tocEntryIsACL(te))
2982 2983 2984 2985
			return;
	}
	else
	{
2986
		if (_tocEntryIsACL(te))
2987 2988 2989 2990 2991
			return;
	}

	/*
	 * Avoid dumping the public schema, as it will already be created ...
B
Bruce Momjian 已提交
2992
	 * unless we are using --clean mode, in which case it's been deleted and
2993
	 * we'd better recreate it.  Likewise for its comment, if any.
2994
	 */
2995 2996 2997 2998 2999
	if (!ropt->dropSchema)
	{
		if (strcmp(te->desc, "SCHEMA") == 0 &&
			strcmp(te->tag, "public") == 0)
			return;
3000
		/* The comment restore would require super-user privs, so avoid it. */
3001 3002 3003 3004
		if (strcmp(te->desc, "COMMENT") == 0 &&
			strcmp(te->tag, "SCHEMA public") == 0)
			return;
	}
3005

3006
	/* Select owner, schema, and tablespace as necessary */
3007 3008
	_becomeOwner(AH, te);
	_selectOutputSchema(AH, te->namespace);
3009
	_selectTablespace(AH, te->tablespace);
3010 3011 3012 3013 3014 3015

	/* Set up OID mode too */
	if (strcmp(te->desc, "TABLE") == 0)
		_setWithOids(AH, te);

	/* Emit header comment for item */
3016
	if (!AH->noTocComments)
3017
	{
3018
		const char *pfx;
3019 3020 3021
		char	   *sanitized_name;
		char	   *sanitized_schema;
		char	   *sanitized_owner;
3022 3023 3024 3025 3026 3027 3028 3029

		if (isData)
			pfx = "Data for ";
		else
			pfx = "";

		ahprintf(AH, "--\n");
		if (AH->public.verbose)
3030
		{
3031 3032 3033 3034 3035
			ahprintf(AH, "-- TOC entry %d (class %u OID %u)\n",
					 te->dumpId, te->catalogId.tableoid, te->catalogId.oid);
			if (te->nDeps > 0)
			{
				int			i;
3036

3037 3038 3039 3040 3041
				ahprintf(AH, "-- Dependencies:");
				for (i = 0; i < te->nDeps; i++)
					ahprintf(AH, " %d", te->dependencies[i]);
				ahprintf(AH, "\n");
			}
3042
		}
3043 3044 3045 3046 3047 3048 3049 3050 3051 3052 3053 3054 3055 3056 3057 3058 3059

		/*
		 * Zap any line endings embedded in user-supplied fields, to prevent
		 * corruption of the dump (which could, in the worst case, present an
		 * SQL injection vulnerability if someone were to incautiously load a
		 * dump containing objects with maliciously crafted names).
		 */
		sanitized_name = replace_line_endings(te->tag);
		if (te->namespace)
			sanitized_schema = replace_line_endings(te->namespace);
		else
			sanitized_schema = pg_strdup("-");
		if (!ropt->noOwner)
			sanitized_owner = replace_line_endings(te->owner);
		else
			sanitized_owner = pg_strdup("-");

3060
		ahprintf(AH, "-- %sName: %s; Type: %s; Schema: %s; Owner: %s",
3061 3062 3063 3064 3065 3066 3067
				 pfx, sanitized_name, te->desc, sanitized_schema,
				 sanitized_owner);

		free(sanitized_name);
		free(sanitized_schema);
		free(sanitized_owner);

3068
		if (te->tablespace && !ropt->noTablespace)
3069
		{
3070
			char	   *sanitized_tablespace;
3071 3072 3073 3074 3075

			sanitized_tablespace = replace_line_endings(te->tablespace);
			ahprintf(AH, "; Tablespace: %s", sanitized_tablespace);
			free(sanitized_tablespace);
		}
3076 3077
		ahprintf(AH, "\n");

B
Bruce Momjian 已提交
3078
		if (AH->PrintExtraTocPtr !=NULL)
3079 3080
			(*AH->PrintExtraTocPtr) (AH, te);
		ahprintf(AH, "--\n\n");
3081
	}
B
Bruce Momjian 已提交
3082

3083 3084 3085
	/*
	 * Actually print the definition.
	 *
B
Bruce Momjian 已提交
3086 3087 3088
	 * Really crude hack for suppressing AUTHORIZATION clause that old pg_dump
	 * versions put into CREATE SCHEMA.  We have to do this when --no-owner
	 * mode is selected.  This is ugly, but I see no other good way ...
3089
	 */
3090
	if (ropt->noOwner && strcmp(te->desc, "SCHEMA") == 0)
3091
	{
3092
		ahprintf(AH, "CREATE SCHEMA %s;\n\n\n", fmtId(te->tag));
3093
	}
3094
	else
3095
	{
3096 3097
		if (strlen(te->defn) > 0)
			ahprintf(AH, "%s\n\n", te->defn);
3098
	}
3099 3100 3101

	/*
	 * If we aren't using SET SESSION AUTH to determine ownership, we must
3102 3103 3104
	 * instead issue an ALTER OWNER command.  We assume that anything without
	 * a DROP command is not a separately ownable object.  All the categories
	 * with DROP commands must appear in one list or the other.
3105 3106
	 */
	if (!ropt->noOwner && !ropt->use_setsessauth &&
3107 3108 3109
		strlen(te->owner) > 0 && strlen(te->dropStmt) > 0)
	{
		if (strcmp(te->desc, "AGGREGATE") == 0 ||
3110
			strcmp(te->desc, "BLOB") == 0 ||
P
Peter Eisentraut 已提交
3111
			strcmp(te->desc, "COLLATION") == 0 ||
3112 3113 3114 3115 3116 3117
			strcmp(te->desc, "CONVERSION") == 0 ||
			strcmp(te->desc, "DATABASE") == 0 ||
			strcmp(te->desc, "DOMAIN") == 0 ||
			strcmp(te->desc, "FUNCTION") == 0 ||
			strcmp(te->desc, "OPERATOR") == 0 ||
			strcmp(te->desc, "OPERATOR CLASS") == 0 ||
3118
			strcmp(te->desc, "OPERATOR FAMILY") == 0 ||
3119
			strcmp(te->desc, "PROCEDURAL LANGUAGE") == 0 ||
3120 3121 3122 3123
			strcmp(te->desc, "SCHEMA") == 0 ||
			strcmp(te->desc, "TABLE") == 0 ||
			strcmp(te->desc, "TYPE") == 0 ||
			strcmp(te->desc, "VIEW") == 0 ||
3124
			strcmp(te->desc, "MATERIALIZED VIEW") == 0 ||
3125
			strcmp(te->desc, "SEQUENCE") == 0 ||
R
Robert Haas 已提交
3126
			strcmp(te->desc, "FOREIGN TABLE") == 0 ||
3127
			strcmp(te->desc, "TEXT SEARCH DICTIONARY") == 0 ||
3128 3129 3130
			strcmp(te->desc, "TEXT SEARCH CONFIGURATION") == 0 ||
			strcmp(te->desc, "FOREIGN DATA WRAPPER") == 0 ||
			strcmp(te->desc, "SERVER") == 0)
3131 3132 3133 3134
		{
			PQExpBuffer temp = createPQExpBuffer();

			appendPQExpBuffer(temp, "ALTER ");
3135
			_getObjectDescription(temp, te, AH);
3136 3137 3138 3139 3140 3141
			appendPQExpBuffer(temp, " OWNER TO %s;", fmtId(te->owner));
			ahprintf(AH, "%s\n\n", temp->data);
			destroyPQExpBuffer(temp);
		}
		else if (strcmp(te->desc, "CAST") == 0 ||
				 strcmp(te->desc, "CHECK CONSTRAINT") == 0 ||
3142
				 strcmp(te->desc, "CONSTRAINT") == 0 ||
3143 3144
				 strcmp(te->desc, "DEFAULT") == 0 ||
				 strcmp(te->desc, "FK CONSTRAINT") == 0 ||
3145
				 strcmp(te->desc, "INDEX") == 0 ||
3146
				 strcmp(te->desc, "RULE") == 0 ||
3147 3148
				 strcmp(te->desc, "TRIGGER") == 0 ||
				 strcmp(te->desc, "USER MAPPING") == 0)
3149 3150 3151 3152 3153 3154 3155 3156
		{
			/* these object types don't have separate owners */
		}
		else
		{
			write_msg(modulename, "WARNING: don't know how to set owner for object type %s\n",
					  te->desc);
		}
3157
	}
B
Bruce Momjian 已提交
3158

3159 3160
	/*
	 * If it's an ACL entry, it might contain SET SESSION AUTHORIZATION
B
Bruce Momjian 已提交
3161
	 * commands, so we can no longer assume we know the current auth setting.
3162
	 */
3163
	if (acl_pass)
3164 3165 3166 3167 3168
	{
		if (AH->currUser)
			free(AH->currUser);
		AH->currUser = NULL;
	}
B
Bruce Momjian 已提交
3169 3170
}

3171 3172 3173 3174 3175 3176 3177
/*
 * Return a newly allocated copy of str in which every newline and carriage
 * return has been turned into a space, making the text safe to place in a
 * single-line SQL comment.  The caller is responsible for freeing it.
 */
static char *
replace_line_endings(const char *str)
{
	char	   *copy = pg_strdup(str);
	size_t		i;

	for (i = 0; copy[i] != '\0'; i++)
	{
		switch (copy[i])
		{
			case '\n':
			case '\r':
				copy[i] = ' ';
				break;
			default:
				break;
		}
	}

	return copy;
}

B
Bruce Momjian 已提交
3192 3193
/*
 * Write the archive header: magic string, archive version, integer and
 * offset sizes, format code, compression setting, creation time broken
 * into its struct tm fields, and finally the database name plus the
 * remote and local version strings.
 */
void
WriteHead(ArchiveHandle *AH)
{
	struct tm	created;

	/* Magic code */
	AH->WriteBufPtr(AH, "PGDMP", 5);

	/* Archive version */
	AH->WriteBytePtr(AH, AH->vmaj);
	AH->WriteBytePtr(AH, AH->vmin);
	AH->WriteBytePtr(AH, AH->vrev);

	/* Type sizes and archive format */
	AH->WriteBytePtr(AH, AH->intSize);
	AH->WriteBytePtr(AH, AH->offSize);
	AH->WriteBytePtr(AH, AH->format);

#ifndef HAVE_LIBZ
	/* Built without zlib: compression cannot be honored, so turn it off */
	if (AH->compression != 0)
		write_msg(modulename, "WARNING: requested compression not available in this "
				  "installation -- archive will be uncompressed\n");

	AH->compression = 0;
#endif

	WriteInt(AH, AH->compression);

	/* Creation time, one struct tm field at a time */
	created = *localtime(&AH->createDate);
	WriteInt(AH, created.tm_sec);
	WriteInt(AH, created.tm_min);
	WriteInt(AH, created.tm_hour);
	WriteInt(AH, created.tm_mday);
	WriteInt(AH, created.tm_mon);
	WriteInt(AH, created.tm_year);
	WriteInt(AH, created.tm_isdst);

	/* Identification strings */
	WriteStr(AH, PQdb(AH->connection));
	WriteStr(AH, AH->public.remoteVersionStr);
	WriteStr(AH, PG_VERSION);
}

B
Bruce Momjian 已提交
3228 3229
/*
 * Read the fixed leading part of an archive header: the magic string, the
 * version bytes, the integer and offset sizes, and the format code.
 *
 * Any inconsistency (short read, wrong magic, unsupported version, absurd
 * integer size, unexpected format) is reported through exit_horribly.
 *
 * NB: this code must agree with _discoverArchiveFormat().  Maybe find a
 * way to unify the cases?
 */
static void
_readHeadPreamble(ArchiveHandle *AH)
{
	char		magic[7];
	int			fileFormat;

	if (AH->ReadBufPtr(AH, magic, 5) != 5)
		exit_horribly(modulename, "unexpected end of file\n");

	if (strncmp(magic, "PGDMP", 5) != 0)
		exit_horribly(modulename, "did not find magic string in file header\n");

	AH->vmaj = AH->ReadBytePtr(AH);
	AH->vmin = AH->ReadBytePtr(AH);

	/* A revision byte is present only for versions after 1.0 */
	if (AH->vmaj > 1 || (AH->vmaj == 1 && AH->vmin > 0))
		AH->vrev = AH->ReadBytePtr(AH);
	else
		AH->vrev = 0;

	AH->version = ((AH->vmaj * 256 + AH->vmin) * 256 + AH->vrev) * 256 + 0;

	if (AH->version < K_VERS_1_0 || AH->version > K_VERS_MAX)
		exit_horribly(modulename, "unsupported version (%d.%d) in file header\n",
					  AH->vmaj, AH->vmin);

	AH->intSize = AH->ReadBytePtr(AH);
	if (AH->intSize > 32)
		exit_horribly(modulename, "sanity check on integer size (%lu) failed\n",
					  (unsigned long) AH->intSize);

	if (AH->intSize > sizeof(int))
		write_msg(modulename, "WARNING: archive was made on a machine with larger integers, some operations might fail\n");

	/* Before 1.7 there was no separate offset size; use the integer size */
	if (AH->version >= K_VERS_1_7)
		AH->offSize = AH->ReadBytePtr(AH);
	else
		AH->offSize = AH->intSize;

	fileFormat = AH->ReadBytePtr(AH);

	if (AH->format != fileFormat)
		exit_horribly(modulename, "expected format (%d) differs from format found in file (%d)\n",
					  AH->format, fileFormat);
}

/*
 * Read the archive header.
 *
 * The fixed preamble is read here unless AH->readHeader says that has
 * already happened.  The version-dependent remainder is then read:
 * compression setting, creation date and database name (1.4 and later),
 * and the remote/dump version strings (1.10 and later).
 */
void
ReadHead(ArchiveHandle *AH)
{
	struct tm	created;

	if (!AH->readHeader)
		_readHeadPreamble(AH);

	/* Compression: absent before 1.2, a single byte before 1.4 */
	if (AH->version < K_VERS_1_2)
		AH->compression = Z_DEFAULT_COMPRESSION;
	else if (AH->version < K_VERS_1_4)
		AH->compression = AH->ReadBytePtr(AH);
	else
		AH->compression = ReadInt(AH);

#ifndef HAVE_LIBZ
	if (AH->compression != 0)
		write_msg(modulename, "WARNING: archive is compressed, but this installation does not support compression -- no data will be available\n");
#endif

	if (AH->version >= K_VERS_1_4)
	{
		/* Creation time is stored as individual struct tm fields */
		created.tm_sec = ReadInt(AH);
		created.tm_min = ReadInt(AH);
		created.tm_hour = ReadInt(AH);
		created.tm_mday = ReadInt(AH);
		created.tm_mon = ReadInt(AH);
		created.tm_year = ReadInt(AH);
		created.tm_isdst = ReadInt(AH);

		AH->archdbname = ReadStr(AH);

		AH->createDate = mktime(&created);

		if (AH->createDate == (time_t) -1)
			write_msg(modulename, "WARNING: invalid creation date in header\n");
	}

	if (AH->version >= K_VERS_1_10)
	{
		AH->archiveRemoteVersion = ReadStr(AH);
		AH->archiveDumpVersion = ReadStr(AH);
	}
}


3324 3325
/*
 * checkSeek
3326
 *	  check to see if ftell/fseek can be performed.
3327 3328 3329 3330
 */
bool
checkSeek(FILE *fp)
{
3331 3332 3333
	pgoff_t		tpos;

	/*
B
Bruce Momjian 已提交
3334 3335
	 * If pgoff_t is wider than long, we must have "real" fseeko and not an
	 * emulation using fseek.  Otherwise report no seek capability.
3336 3337 3338
	 */
#ifndef HAVE_FSEEKO
	if (sizeof(pgoff_t) > sizeof(long))
3339 3340
		return false;
#endif
3341 3342 3343 3344 3345 3346 3347 3348

	/* Check that ftello works on this file */
	errno = 0;
	tpos = ftello(fp);
	if (errno)
		return false;

	/*
B
Bruce Momjian 已提交
3349
	 * Check that fseeko(SEEK_SET) works, too.	NB: we used to try to test
3350 3351 3352 3353 3354 3355 3356
	 * this with fseeko(fp, 0, SEEK_CUR).  But some platforms treat that as a
	 * successful no-op even on files that are otherwise unseekable.
	 */
	if (fseeko(fp, tpos, SEEK_SET) != 0)
		return false;

	return true;
3357
}
3358 3359 3360 3361 3362 3363 3364 3365 3366 3367


/*
 * dumpTimestamp
 */
static void
dumpTimestamp(ArchiveHandle *AH, const char *msg, time_t tim)
{
	char		buf[256];

3368 3369 3370
	/*
	 * We don't print the timezone on Win32, because the names are long and
	 * localized, which means they may contain characters in various random
B
Bruce Momjian 已提交
3371 3372
	 * encodings; this has been seen to cause encoding errors when reading the
	 * dump script.
3373 3374 3375 3376 3377 3378 3379 3380
	 */
	if (strftime(buf, sizeof(buf),
#ifndef WIN32
				 "%Y-%m-%d %H:%M:%S %Z",
#else
				 "%Y-%m-%d %H:%M:%S",
#endif
				 localtime(&tim)) != 0)
3381 3382
		ahprintf(AH, "-- %s %s\n\n", msg, buf);
}
3383 3384 3385 3386 3387

/*
 * Main engine for parallel restore.
 *
 * Work is done in three phases.
3388
 * First we process all SECTION_PRE_DATA tocEntries, in a single connection,
3389
 * just as for a standard restore.	Second we process the remaining non-ACL
3390 3391 3392 3393
 * steps in parallel worker children (threads on Windows, processes on Unix),
 * each of which connects separately to the database.  Finally we process all
 * the ACL entries in a single connection (that happens back in
 * RestoreArchive).
3394 3395
 */
static void
A
Andrew Dunstan 已提交
3396
restore_toc_entries_prefork(ArchiveHandle *AH)
3397 3398
{
	RestoreOptions *ropt = AH->ropt;
3399
	bool		skipped_some;
3400 3401
	TocEntry   *next_work_item;

A
Andrew Dunstan 已提交
3402
	ahlog(AH, 2, "entering restore_toc_entries_prefork\n");
3403 3404 3405 3406 3407

	/* Adjust dependency information */
	fix_dependencies(AH);

	/*
3408 3409 3410
	 * Do all the early stuff in a single connection in the parent. There's no
	 * great point in running it in parallel, in fact it will actually run
	 * faster in a single connection because we avoid all the connection and
A
Andrew Dunstan 已提交
3411
	 * setup overhead.	Also, pre-9.2 pg_dump versions were not very good
3412 3413 3414 3415 3416 3417 3418
	 * about showing all the dependencies of SECTION_PRE_DATA items, so we do
	 * not risk trying to process them out-of-order.
	 *
	 * Note: as of 9.2, it should be guaranteed that all PRE_DATA items appear
	 * before DATA items, and all DATA items before POST_DATA items.  That is
	 * not certain to be true in older archives, though, so this loop is coded
	 * to not assume it.
3419
	 */
3420
	skipped_some = false;
3421
	for (next_work_item = AH->toc->next; next_work_item != AH->toc; next_work_item = next_work_item->next)
3422
	{
3423 3424 3425 3426 3427 3428 3429 3430 3431 3432 3433 3434 3435 3436 3437 3438 3439 3440 3441 3442 3443 3444
		/* NB: process-or-continue logic must be the inverse of loop below */
		if (next_work_item->section != SECTION_PRE_DATA)
		{
			/* DATA and POST_DATA items are just ignored for now */
			if (next_work_item->section == SECTION_DATA ||
				next_work_item->section == SECTION_POST_DATA)
			{
				skipped_some = true;
				continue;
			}
			else
			{
				/*
				 * SECTION_NONE items, such as comments, can be processed now
				 * if we are still in the PRE_DATA part of the archive.  Once
				 * we've skipped any items, we have to consider whether the
				 * comment's dependencies are satisfied, so skip it for now.
				 */
				if (skipped_some)
					continue;
			}
		}
3445 3446 3447 3448 3449 3450 3451

		ahlog(AH, 1, "processing item %d %s %s\n",
			  next_work_item->dumpId,
			  next_work_item->desc, next_work_item->tag);

		(void) restore_toc_entry(AH, next_work_item, ropt, false);

3452 3453
		/* there should be no touch of ready_list here, so pass NULL */
		reduce_dependencies(AH, next_work_item, NULL);
3454 3455 3456
	}

	/*
3457
	 * Now close parent connection in prep for parallel steps.	We do this
3458 3459 3460
	 * mainly to ensure that we don't exceed the specified number of parallel
	 * connections.
	 */
R
Robert Haas 已提交
3461
	DisconnectDatabase(&AH->public);
3462 3463 3464 3465 3466 3467 3468 3469 3470 3471 3472 3473

	/* blow away any transient state from the old connection */
	if (AH->currUser)
		free(AH->currUser);
	AH->currUser = NULL;
	if (AH->currSchema)
		free(AH->currSchema);
	AH->currSchema = NULL;
	if (AH->currTablespace)
		free(AH->currTablespace);
	AH->currTablespace = NULL;
	AH->currWithOids = -1;
A
Andrew Dunstan 已提交
3474 3475 3476 3477 3478 3479 3480 3481 3482 3483 3484 3485 3486 3487 3488 3489 3490 3491 3492 3493 3494 3495 3496 3497 3498
}

/*
 * Main engine for parallel restore.
 *
 * The restore is done in three phases.  All SECTION_PRE_DATA entries are
 * first processed in a single connection, as in a standard restore; that
 * is the job of restore_toc_entries_prefork().  The remaining non-ACL
 * steps are then run in parallel worker children (threads on Windows,
 * processes on Unix), which fork off and set up their connections before
 * this function is called.  The ACL entries come last, again in a single
 * connection, back in RestoreArchive.
 *
 * This function is the second phase: it hands ready entries to workers
 * until no entry is ready and every worker is idle.  Entries still blocked
 * at that point remain on pending_list.
 */
static void
restore_toc_entries_parallel(ArchiveHandle *AH, ParallelState *pstate,
							 TocEntry *pending_list)
{
	TocEntry	ready_list;
	TocEntry   *item;
	bool		seen_later_section = false;
	int			status;
	int			slot;

	ahlog(AH, 2, "entering restore_toc_entries_parallel\n");

	/*
	 * Set up the ready list; the caller has already initialized the pending
	 * list.  Afterwards the pending list holds everything still blocked by
	 * at least one dependency, and the ready list holds the entries with no
	 * remaining dependencies.  Entries that will not be restored are not
	 * filtered out yet: they may sit in dependency chains between entries
	 * that will be, so they count as live until they are actually processed.
	 */
	par_list_header_init(&ready_list);

	for (item = AH->toc->next; item != AH->toc; item = item->next)
	{
		/* NB: process-or-continue logic must be the inverse of loop above */
		if (item->section == SECTION_PRE_DATA)
			continue;			/* all PRE_DATA items were dealt with above */

		if (item->section == SECTION_DATA ||
			item->section == SECTION_POST_DATA)
		{
			/* set this flag at same point that previous loop did */
			seen_later_section = true;
		}
		else if (!seen_later_section)
		{
			/* a SECTION_NONE item that the previous loop already handled */
			continue;
		}

		if (item->depCount > 0)
			par_list_append(pending_list, item);
		else
			par_list_append(&ready_list, item);
	}

	/*
	 * main parent loop
	 *
	 * Keep going until there is no worker still running AND there is no work
	 * left to be done.
	 */
	ahlog(AH, 1, "entering main parallel loop\n");

	for (;;)
	{
		item = get_next_work_item(AH, &ready_list, pstate);
		if (item == NULL && IsEveryWorkerIdle(pstate))
			break;

		if (item == NULL)
		{
			/* at least one child is working and we have nothing ready. */
			Assert(!IsEveryWorkerIdle(pstate));
		}
		else
		{
			/* If not to be restored, don't waste time launching a worker */
			if ((item->reqs & (REQ_SCHEMA | REQ_DATA)) == 0 ||
				_tocEntryIsACL(item))
			{
				ahlog(AH, 1, "skipping item %d %s %s\n",
					  item->dumpId,
					  item->desc, item->tag);

				par_list_remove(item);
				reduce_dependencies(AH, item, &ready_list);

				continue;
			}

			ahlog(AH, 1, "launching item %d %s %s\n",
				  item->dumpId,
				  item->desc, item->tag);

			par_list_remove(item);

			Assert(GetIdleWorker(pstate) != NO_SLOT);
			DispatchJobForTocEntry(AH, pstate, item, ACT_RESTORE);
		}

		for (;;)
		{
			int			finished = 0;

			/*
			 * Start with a non-blocking check for ended workers, so that
			 * dependencies are reduced as early as possible -- in particular
			 * for workers whose items are blocking pending ones.
			 *
			 * If, however, there is nothing else workers could be given
			 * right now, don't busy-loop: really wait for at least one
			 * worker to terminate by passing do_wait = true.
			 */
			ListenToWorkers(AH, pstate, item == NULL);

			while ((slot = ReapWorkerStatus(pstate, &status)) != NO_SLOT)
			{
				finished++;
				mark_work_done(AH, &ready_list, slot, status, pstate);
			}

			/*
			 * An idle worker is needed before going around the outer loop
			 * again.  If any worker just finished we certainly have one;
			 * otherwise check for one explicitly.
			 */
			if (finished > 0 || GetIdleWorker(pstate) != NO_SLOT)
				break;

			/*
			 * No idle worker: read the result of one or more workers, then
			 * loop to call ReapWorkerStatus() on them.
			 */
			ListenToWorkers(AH, pstate, true);
		}
	}

	ahlog(AH, 1, "finished main parallel loop\n");
}
3627

A
Andrew Dunstan 已提交
3628 3629 3630 3631 3632 3633 3634
/*
 * Final clean-up phase of a parallel restore, run in the parent.
 *
 * Re-opens the single parent connection, re-establishes its fixed output
 * state, and then restores whatever entries are still on pending_list.
 */
static void
restore_toc_entries_postfork(ArchiveHandle *AH, TocEntry *pending_list)
{
	RestoreOptions *ropt = AH->ropt;
	TocEntry   *missed;

	ahlog(AH, 2, "entering restore_toc_entries_postfork\n");

	/* Bring the single parent connection back */
	ConnectDatabase((Archive *) AH, ropt->dbname,
					ropt->pghost, ropt->pgport, ropt->username,
					ropt->promptPassword);

	_doSetFixedOutputState(AH);

	/*
	 * Non-ACL work may have been left over because of, say, circular
	 * dependencies or some other pathological condition.  Whatever remains
	 * is done here in the single parent connection.
	 */
	missed = pending_list->par_next;
	while (missed != pending_list)
	{
		ahlog(AH, 1, "processing missed item %d %s %s\n",
			  missed->dumpId, missed->desc, missed->tag);
		(void) restore_toc_entry(AH, missed, ropt, false);
		missed = missed->par_next;
	}

	/* The ACLs will be handled back in RestoreArchive. */
}

3660 3661 3662 3663 3664 3665 3666
/*
 * Report whether any item that te1 needs an exclusive lock on (its
 * lockDeps) also appears among te2's dependencies, regardless of whether
 * te2 itself needs an exclusive lock on it.
 */
static bool
has_lock_conflicts(TocEntry *te1, TocEntry *te2)
{
	int			lockIdx = 0;

	while (lockIdx < te1->nLockDeps)
	{
		int			depIdx = 0;

		while (depIdx < te2->nDeps)
		{
			if (te1->lockDeps[lockIdx] == te2->dependencies[depIdx])
				return true;
			depIdx++;
		}
		lockIdx++;
	}

	return false;
}


3682 3683 3684 3685 3686 3687 3688 3689 3690 3691 3692 3693 3694 3695 3696 3697 3698 3699 3700 3701 3702 3703 3704 3705 3706 3707 3708 3709 3710 3711 3712 3713 3714
/*
 * Set up l as the header of an empty parallel-processing list.
 *
 * Such a list is circular and uses a dummy TocEntry as its header, like
 * the main TOC list.  It is linked through the separate par_prev/par_next
 * fields, so an entry can be a member of the main TOC list and of a
 * parallel-processing list at the same time.
 */
static void
par_list_header_init(TocEntry *l)
{
	/* an empty list is a header that points at itself in both directions */
	l->par_next = l;
	l->par_prev = l;
}

/* Link te in as the last element of the parallel-processing list headed by l */
static void
par_list_append(TocEntry *l, TocEntry *te)
{
	TocEntry   *tail = l->par_prev;

	te->par_prev = tail;
	te->par_next = l;
	tail->par_next = te;
	l->par_prev = te;
}

/*
 * Unlink te from the parallel-processing list it currently belongs to.
 *
 * The neighbours are joined to each other and both of te's links are reset
 * to NULL, leaving te marked as not being a member of any such list.
 */
static void
par_list_remove(TocEntry *te)
{
	TocEntry   *before = te->par_prev;
	TocEntry   *after = te->par_next;

	before->par_next = after;
	after->par_prev = before;

	te->par_next = NULL;
	te->par_prev = NULL;
}

3715

3716 3717 3718 3719
/*
 * Find the next work item (if any) that is capable of being run now.
 *
 * To qualify, the item must have no remaining dependencies
3720 3721 3722
 * and no requirements for locks that are incompatible with
 * items currently running.  Items in the ready_list are known to have
 * no remaining dependencies, but we have to check for lock conflicts.
3723
 *
3724 3725
 * Note that the returned item has *not* been removed from ready_list.
 * The caller must do that after successfully dispatching the item.
3726 3727 3728 3729 3730 3731
 *
 * pref_non_data is for an alternative selection algorithm that gives
 * preference to non-data items if there is already a data load running.
 * It is currently disabled.
 */
static TocEntry *
3732
get_next_work_item(ArchiveHandle *AH, TocEntry *ready_list,
A
Andrew Dunstan 已提交
3733
				   ParallelState *pstate)
3734
{
3735 3736 3737 3738 3739
	bool		pref_non_data = false;	/* or get from AH->ropt */
	TocEntry   *data_te = NULL;
	TocEntry   *te;
	int			i,
				k;
3740 3741 3742 3743 3744 3745

	/*
	 * Bogus heuristics for pref_non_data
	 */
	if (pref_non_data)
	{
3746
		int			count = 0;
3747

A
Andrew Dunstan 已提交
3748 3749 3750
		for (k = 0; k < pstate->numWorkers; k++)
			if (pstate->parallelSlot[k].args->te != NULL &&
				pstate->parallelSlot[k].args->te->section == SECTION_DATA)
3751
				count++;
A
Andrew Dunstan 已提交
3752
		if (pstate->numWorkers == 0 || count * 4 < pstate->numWorkers)
3753 3754 3755 3756
			pref_non_data = false;
	}

	/*
3757
	 * Search the ready_list until we find a suitable item.
3758
	 */
3759
	for (te = ready_list->par_next; te != ready_list; te = te->par_next)
3760
	{
3761
		bool		conflicts = false;
3762 3763 3764

		/*
		 * Check to see if the item would need exclusive lock on something
3765 3766
		 * that a currently running item also needs lock on, or vice versa. If
		 * so, we don't want to schedule them together.
3767
		 */
A
Andrew Dunstan 已提交
3768
		for (i = 0; i < pstate->numWorkers && !conflicts; i++)
3769
		{
3770
			TocEntry   *running_te;
3771

A
Andrew Dunstan 已提交
3772
			if (pstate->parallelSlot[i].workerStatus != WRKR_WORKING)
3773
				continue;
A
Andrew Dunstan 已提交
3774
			running_te = pstate->parallelSlot[i].args->te;
3775 3776 3777

			if (has_lock_conflicts(te, running_te) ||
				has_lock_conflicts(running_te, te))
3778
			{
3779 3780
				conflicts = true;
				break;
3781 3782 3783 3784 3785 3786 3787 3788 3789 3790 3791 3792 3793 3794 3795 3796 3797 3798 3799 3800
			}
		}

		if (conflicts)
			continue;

		if (pref_non_data && te->section == SECTION_DATA)
		{
			if (data_te == NULL)
				data_te = te;
			continue;
		}

		/* passed all tests, so this item can run */
		return te;
	}

	if (data_te != NULL)
		return data_te;

3801
	ahlog(AH, 2, "no item ready\n");
3802 3803 3804 3805 3806 3807 3808
	return NULL;
}


/*
 * Restore a single TOC item in parallel with others
 *
A
Andrew Dunstan 已提交
3809 3810 3811 3812
 * this is run in the worker, i.e. in a thread (Windows) or a separate process
 * (everything else). A worker process executes several such work items during
 * a parallel backup or restore. Once we terminate here and report back that
 * our work is finished, the master process will assign us a new work item.
3813
 */
A
Andrew Dunstan 已提交
3814 3815
int
parallel_restore(ParallelArgs * args)
3816 3817
{
	ArchiveHandle *AH = args->AH;
3818
	TocEntry   *te = args->te;
3819
	RestoreOptions *ropt = AH->ropt;
A
Andrew Dunstan 已提交
3820
	int			status;
3821 3822 3823

	_doSetFixedOutputState(AH);

A
Andrew Dunstan 已提交
3824
	Assert(AH->connection != NULL);
3825

A
Andrew Dunstan 已提交
3826
	AH->public.n_errors = 0;
3827

A
Andrew Dunstan 已提交
3828 3829
	/* Restore the TOC item */
	status = restore_toc_entry(AH, te, ropt, true);
3830

A
Andrew Dunstan 已提交
3831
	return status;
3832 3833 3834 3835 3836 3837 3838 3839 3840 3841
}


/*
 * Housekeeping to be done after a step has been parallel restored.
 *
 * Clear the appropriate slot, free all the extra memory we allocated,
 * update status, and reduce the dependency count of any dependent items.
 */
static void
3842
mark_work_done(ArchiveHandle *AH, TocEntry *ready_list,
A
Andrew Dunstan 已提交
3843 3844
			   int worker, int status,
			   ParallelState *pstate)
3845
{
3846
	TocEntry   *te = NULL;
3847

A
Andrew Dunstan 已提交
3848
	te = pstate->parallelSlot[worker].args->te;
3849 3850

	if (te == NULL)
3851
		exit_horribly(modulename, "could not find slot of finished worker\n");
3852 3853 3854 3855 3856 3857 3858 3859 3860 3861 3862 3863 3864 3865

	ahlog(AH, 1, "finished item %d %s %s\n",
		  te->dumpId, te->desc, te->tag);

	if (status == WORKER_CREATE_DONE)
		mark_create_done(AH, te);
	else if (status == WORKER_INHIBIT_DATA)
	{
		inhibit_data_for_failed_table(AH, te);
		AH->public.n_errors++;
	}
	else if (status == WORKER_IGNORED_ERRORS)
		AH->public.n_errors++;
	else if (status != 0)
3866 3867
		exit_horribly(modulename, "worker process failed: exit code %d\n",
					  status);
3868

3869
	reduce_dependencies(AH, te, ready_list);
3870 3871 3872 3873 3874 3875
}


/*
 * Process the dependency information into a form useful for parallel restore.
 *
 * This function takes care of fixing up some missing or badly designed
 * dependencies, and then prepares subsidiary data structures that will be
 * used in the main parallel-restore logic, including:
 * 1. We build the revDeps[] arrays of incoming dependency dumpIds.
 * 2. We set up depCount fields that are the number of as-yet-unprocessed
 * dependencies for each TOC entry.
 *
 * We also identify locking dependencies so that we can avoid trying to
 * schedule conflicting items at the same time.
 *
 * The revDeps[] arrays are built in three passes over the TOC (count,
 * allocate, fill); the count and fill passes must apply the same test for
 * "dependency exists in this archive" or the arrays will be mis-sized.
 */
static void
fix_dependencies(ArchiveHandle *AH)
{
	TocEntry   *te;
	int			i;

	/*
	 * Initialize the depCount/revDeps/nRevDeps fields, and make sure the TOC
	 * items are marked as not being in any parallel-processing list.
	 */
	for (te = AH->toc->next; te != AH->toc; te = te->next)
	{
		te->depCount = te->nDeps;
		te->revDeps = NULL;
		te->nRevDeps = 0;
		te->par_prev = NULL;
		te->par_next = NULL;
	}

	/*
	 * POST_DATA items that are shown as depending on a table need to be
	 * re-pointed to depend on that table's data, instead.  This ensures they
	 * won't get scheduled until the data has been loaded.
	 */
	repoint_table_dependencies(AH);

	/*
	 * Pre-8.4 versions of pg_dump neglected to set up a dependency from BLOB
	 * COMMENTS to BLOBS.  Cope.  (We assume there's only one BLOBS and only
	 * one BLOB COMMENTS in such files.)
	 */
	if (AH->version < K_VERS_1_11)
	{
		for (te = AH->toc->next; te != AH->toc; te = te->next)
		{
			if (strcmp(te->desc, "BLOB COMMENTS") == 0 && te->nDeps == 0)
			{
				TocEntry   *te2;

				for (te2 = AH->toc->next; te2 != AH->toc; te2 = te2->next)
				{
					if (strcmp(te2->desc, "BLOBS") == 0)
					{
						/* Give the entry a one-element dependency array */
						te->dependencies = (DumpId *) pg_malloc(sizeof(DumpId));
						te->dependencies[0] = te2->dumpId;
						te->nDeps++;
						te->depCount++;
						break;
					}
				}
				break;
			}
		}
	}

	/*
	 * At this point we start to build the revDeps reverse-dependency arrays,
	 * so all changes of dependencies must be complete.
	 */

	/*
	 * Count the incoming dependencies for each item.  Also, it is possible
	 * that the dependencies list items that are not in the archive at all
	 * (that should not happen in 9.2 and later, but is highly likely in older
	 * archives).  Subtract such items from the depCounts.
	 */
	for (te = AH->toc->next; te != AH->toc; te = te->next)
	{
		for (i = 0; i < te->nDeps; i++)
		{
			DumpId		depid = te->dependencies[i];

			if (depid <= AH->maxDumpId && AH->tocsByDumpId[depid] != NULL)
				AH->tocsByDumpId[depid]->nRevDeps++;
			else
				te->depCount--;
		}
	}

	/*
	 * Allocate space for revDeps[] arrays, and reset nRevDeps so we can use
	 * it as a counter below.
	 */
	for (te = AH->toc->next; te != AH->toc; te = te->next)
	{
		if (te->nRevDeps > 0)
			te->revDeps = (DumpId *) pg_malloc(te->nRevDeps * sizeof(DumpId));
		te->nRevDeps = 0;
	}

	/*
	 * Build the revDeps[] arrays of incoming-dependency dumpIds.  This had
	 * better agree with the loops above.
	 */
	for (te = AH->toc->next; te != AH->toc; te = te->next)
	{
		for (i = 0; i < te->nDeps; i++)
		{
			DumpId		depid = te->dependencies[i];

			if (depid <= AH->maxDumpId && AH->tocsByDumpId[depid] != NULL)
			{
				TocEntry   *otherte = AH->tocsByDumpId[depid];

				otherte->revDeps[otherte->nRevDeps++] = te->dumpId;
			}
		}
	}

	/*
	 * Lastly, work out the locking dependencies.
	 */
	for (te = AH->toc->next; te != AH->toc; te = te->next)
	{
		te->lockDeps = NULL;
		te->nLockDeps = 0;
		identify_locking_dependencies(AH, te);
	}
}

/*
4007
 * Change dependencies on table items to depend on table data items instead,
4008 4009 4010
 * but only in POST_DATA items.
 */
static void
4011
repoint_table_dependencies(ArchiveHandle *AH)
4012 4013
{
	TocEntry   *te;
4014
	int			i;
4015
	DumpId		olddep;
4016 4017 4018 4019 4020 4021 4022

	for (te = AH->toc->next; te != AH->toc; te = te->next)
	{
		if (te->section != SECTION_POST_DATA)
			continue;
		for (i = 0; i < te->nDeps; i++)
		{
4023 4024 4025
			olddep = te->dependencies[i];
			if (olddep <= AH->maxDumpId &&
				AH->tableDataId[olddep] != 0)
4026
			{
4027
				te->dependencies[i] = AH->tableDataId[olddep];
4028
				ahlog(AH, 2, "transferring dependency %d -> %d to %d\n",
4029
					  te->dumpId, olddep, AH->tableDataId[olddep]);
4030 4031 4032 4033 4034 4035 4036 4037 4038 4039 4040
			}
		}
	}
}

/*
 * Identify which objects we'll need exclusive lock on in order to restore
 * the given TOC entry (*other* than the one identified by the TOC entry
 * itself).  Record their dump IDs in the entry's lockDeps[] array.
 */
static void
4041
identify_locking_dependencies(ArchiveHandle *AH, TocEntry *te)
4042 4043 4044 4045 4046 4047 4048 4049 4050 4051 4052 4053 4054 4055 4056 4057 4058 4059
{
	DumpId	   *lockids;
	int			nlockids;
	int			i;

	/* Quick exit if no dependencies at all */
	if (te->nDeps == 0)
		return;

	/* Exit if this entry doesn't need exclusive lock on other objects */
	if (!(strcmp(te->desc, "CONSTRAINT") == 0 ||
		  strcmp(te->desc, "CHECK CONSTRAINT") == 0 ||
		  strcmp(te->desc, "FK CONSTRAINT") == 0 ||
		  strcmp(te->desc, "RULE") == 0 ||
		  strcmp(te->desc, "TRIGGER") == 0))
		return;

	/*
4060
	 * We assume the item requires exclusive lock on each TABLE DATA item
4061 4062 4063 4064
	 * listed among its dependencies.  (This was originally a dependency on
	 * the TABLE, but fix_dependencies repointed it to the data item. Note
	 * that all the entry types we are interested in here are POST_DATA, so
	 * they will all have been changed this way.)
4065
	 */
4066
	lockids = (DumpId *) pg_malloc(te->nDeps * sizeof(DumpId));
4067 4068 4069
	nlockids = 0;
	for (i = 0; i < te->nDeps; i++)
	{
4070
		DumpId		depid = te->dependencies[i];
4071

4072 4073
		if (depid <= AH->maxDumpId && AH->tocsByDumpId[depid] != NULL &&
			strcmp(AH->tocsByDumpId[depid]->desc, "TABLE DATA") == 0)
4074 4075 4076 4077 4078 4079 4080 4081 4082
			lockids[nlockids++] = depid;
	}

	if (nlockids == 0)
	{
		free(lockids);
		return;
	}

T
Tom Lane 已提交
4083
	te->lockDeps = pg_realloc(lockids, nlockids * sizeof(DumpId));
4084 4085 4086 4087 4088
	te->nLockDeps = nlockids;
}

/*
 * Remove the specified TOC entry from the depCounts of items that depend on
4089 4090
 * it, thereby possibly making them ready-to-run.  Any pending item that
 * becomes ready should be moved to the ready list.
4091 4092
 */
static void
4093
reduce_dependencies(ArchiveHandle *AH, TocEntry *te, TocEntry *ready_list)
4094
{
4095
	int			i;
4096

4097
	ahlog(AH, 2, "reducing dependencies for %d\n", te->dumpId);
4098

4099
	for (i = 0; i < te->nRevDeps; i++)
4100
	{
4101
		TocEntry   *otherte = AH->tocsByDumpId[te->revDeps[i]];
4102 4103 4104

		otherte->depCount--;
		if (otherte->depCount == 0 && otherte->par_prev != NULL)
4105
		{
4106 4107 4108 4109
			/* It must be in the pending list, so remove it ... */
			par_list_remove(otherte);
			/* ... and add to ready_list */
			par_list_append(ready_list, otherte);
4110 4111 4112 4113 4114 4115 4116 4117 4118 4119 4120
		}
	}
}

/*
 * Set the created flag on the DATA member corresponding to the given
 * TABLE member
 *
 * The data entry is located through AH->tableDataId[te->dumpId]; if that
 * slot is zero there is no associated data entry and nothing is done.
 */
static void
mark_create_done(ArchiveHandle *AH, TocEntry *te)
{
	if (AH->tableDataId[te->dumpId] != 0)
	{
		TocEntry   *ted = AH->tocsByDumpId[AH->tableDataId[te->dumpId]];

		ted->created = true;
	}
}

/*
 * Mark the DATA member corresponding to the given TABLE member
 * as not wanted
 *
 * A message naming the table is always logged.  The data entry is located
 * through AH->tableDataId[te->dumpId]; if one exists, its reqs field is
 * cleared to zero.
 */
static void
inhibit_data_for_failed_table(ArchiveHandle *AH, TocEntry *te)
{
	ahlog(AH, 1, "table \"%s\" could not be created, will not restore its data\n",
		  te->tag);

	if (AH->tableDataId[te->dumpId] != 0)
	{
		TocEntry   *ted = AH->tocsByDumpId[AH->tableDataId[te->dumpId]];

		ted->reqs = 0;
	}
}

/*
 * Clone and de-clone routines used in parallel restoration.
 *
 * Enough of the structure is cloned to ensure that there is no
 * conflict between different threads each with their own clone.
 */
A
Andrew Dunstan 已提交
4153
ArchiveHandle *
4154 4155 4156 4157 4158
CloneArchive(ArchiveHandle *AH)
{
	ArchiveHandle *clone;

	/* Make a "flat" copy */
4159
	clone = (ArchiveHandle *) pg_malloc(sizeof(ArchiveHandle));
4160 4161
	memcpy(clone, AH, sizeof(ArchiveHandle));

4162 4163
	/* Handle format-independent fields */
	memset(&(clone->sqlparse), 0, sizeof(clone->sqlparse));
4164 4165 4166 4167 4168 4169 4170 4171 4172 4173

	/* The clone will have its own connection, so disregard connection state */
	clone->connection = NULL;
	clone->currUser = NULL;
	clone->currSchema = NULL;
	clone->currTablespace = NULL;
	clone->currWithOids = -1;

	/* savedPassword must be local in case we change it while connecting */
	if (clone->savedPassword)
4174
		clone->savedPassword = pg_strdup(clone->savedPassword);
4175 4176 4177 4178

	/* clone has its own error count, too */
	clone->public.n_errors = 0;

A
Andrew Dunstan 已提交
4179 4180 4181 4182 4183 4184 4185 4186 4187 4188 4189 4190 4191 4192 4193 4194 4195 4196 4197 4198 4199 4200 4201 4202 4203 4204 4205 4206 4207 4208 4209 4210 4211 4212 4213 4214 4215 4216 4217 4218 4219 4220 4221 4222 4223 4224 4225 4226 4227 4228
	/*
	 * Connect our new clone object to the database: In parallel restore the
	 * parent is already disconnected, because we can connect the worker
	 * processes independently to the database (no snapshot sync required). In
	 * parallel backup we clone the parent's existing connection.
	 */
	if (AH->mode == archModeRead)
	{
		RestoreOptions *ropt = AH->ropt;

		Assert(AH->connection == NULL);
		/* this also sets clone->connection */
		ConnectDatabase((Archive *) clone, ropt->dbname,
						ropt->pghost, ropt->pgport, ropt->username,
						ropt->promptPassword);
	}
	else
	{
		char	   *dbname;
		char	   *pghost;
		char	   *pgport;
		char	   *username;
		const char *encname;

		Assert(AH->connection != NULL);

		/*
		 * Even though we are technically accessing the parent's database
		 * object here, these functions are fine to be called like that
		 * because all just return a pointer and do not actually send/receive
		 * any data to/from the database.
		 */
		dbname = PQdb(AH->connection);
		pghost = PQhost(AH->connection);
		pgport = PQport(AH->connection);
		username = PQuser(AH->connection);
		encname = pg_encoding_to_char(AH->public.encoding);

		/* this also sets clone->connection */
		ConnectDatabase((Archive *) clone, dbname, pghost, pgport, username, TRI_NO);

		/*
		 * Set the same encoding, whatever we set here is what we got from
		 * pg_encoding_to_char(), so we really shouldn't run into an error
		 * setting that very same value. Also see the comment in
		 * SetupConnection().
		 */
		PQsetClientEncoding(clone->connection, encname);
	}

4229 4230 4231
	/* Let the format-specific code have a chance too */
	(clone->ClonePtr) (clone);

A
Andrew Dunstan 已提交
4232
	Assert(clone->connection != NULL);
4233 4234 4235 4236 4237 4238 4239 4240
	return clone;
}

/*
 * Release clone-local storage.
 *
 * Note: we assume any clone-local connection was already closed.
 */
A
Andrew Dunstan 已提交
4241
void
4242 4243 4244 4245 4246
DeCloneArchive(ArchiveHandle *AH)
{
	/* Clear format-specific state */
	(AH->DeClonePtr) (AH);

4247 4248 4249
	/* Clear state allocated by CloneArchive */
	if (AH->sqlparse.curCmd)
		destroyPQExpBuffer(AH->sqlparse.curCmd);
4250 4251 4252 4253 4254 4255 4256 4257 4258 4259 4260 4261 4262

	/* Clear any connection-local state */
	if (AH->currUser)
		free(AH->currUser);
	if (AH->currSchema)
		free(AH->currSchema);
	if (AH->currTablespace)
		free(AH->currTablespace);
	if (AH->savedPassword)
		free(AH->savedPassword);

	free(AH);
}