/*-------------------------------------------------------------------------
 *
 * postgres.c
 *	  POSTGRES C Backend Interface
 *
 * Portions Copyright (c) 1996-2011, PostgreSQL Global Development Group
 * Portions Copyright (c) 1994, Regents of the University of California
 *
 *
 * IDENTIFICATION
 *	  src/backend/tcop/postgres.c
 *
 * NOTES
 *	  this is the "main" module of the postgres backend and
 *	  hence the main module of the "traffic cop".
 *
 *-------------------------------------------------------------------------
 */

20 21
#include "postgres.h"

22 23 24
#include <fcntl.h>
#include <limits.h>
#include <signal.h>
25
#include <time.h>
B
Bruce Momjian 已提交
26
#include <unistd.h>
27
#include <sys/socket.h>
28
#ifdef HAVE_SYS_SELECT_H
29
#include <sys/select.h>
30
#endif
31
#ifdef HAVE_SYS_RESOURCE_H
32
#include <sys/time.h>
33 34
#include <sys/resource.h>
#endif
35
#ifdef HAVE_GETOPT_H
B
Bruce Momjian 已提交
36
#include <getopt.h>
37
#endif
38

39 40 41 42
#ifndef HAVE_GETRUSAGE
#include "rusagestub.h"
#endif

43
#include "access/printtup.h"
44
#include "access/xact.h"
45
#include "catalog/pg_type.h"
46
#include "commands/async.h"
47
#include "commands/prepare.h"
48
#include "libpq/libpq.h"
49
#include "libpq/pqformat.h"
50
#include "libpq/pqsignal.h"
B
Bruce Momjian 已提交
51
#include "miscadmin.h"
52
#include "nodes/print.h"
53
#include "optimizer/planner.h"
54 55
#include "pgstat.h"
#include "pg_trace.h"
56
#include "parser/analyze.h"
57
#include "parser/parser.h"
58
#include "postmaster/autovacuum.h"
59
#include "postmaster/postmaster.h"
60
#include "replication/walsender.h"
B
Bruce Momjian 已提交
61
#include "rewrite/rewriteHandler.h"
62
#include "storage/bufmgr.h"
63 64
#include "storage/ipc.h"
#include "storage/proc.h"
65
#include "storage/procsignal.h"
66
#include "storage/sinval.h"
67 68
#include "tcop/fastpath.h"
#include "tcop/pquery.h"
B
Bruce Momjian 已提交
69
#include "tcop/tcopprot.h"
70
#include "tcop/utility.h"
71
#include "utils/lsyscache.h"
72
#include "utils/memutils.h"
M
 
Marc G. Fournier 已提交
73
#include "utils/ps_status.h"
74
#include "utils/snapmgr.h"
B
Bruce Momjian 已提交
75
#include "mb/pg_wchar.h"
76

M
 
Marc G. Fournier 已提交
77

78
extern char *optarg;
79 80
extern int	optind;

81
#ifdef HAVE_INT_OPTRESET
82 83 84
extern int	optreset;			/* might not be declared by system headers */
#endif

85

86
/* ----------------
87
 *		global variables
88 89
 * ----------------
 */
90
const char *debug_query_string; /* client-supplied query string */
91

92
/* Note: whereToSendOutput is initialized for the bootstrap/standalone case */
93
CommandDest whereToSendOutput = DestDebug;
94

95
/* flag for logging end of session */
B
Bruce Momjian 已提交
96
bool		Log_disconnections = false;
97

98
int			log_statement = LOGSTMT_NONE;
99

100
/* GUC variable for maximum stack depth (measured in kilobytes) */
101
int			max_stack_depth = 100;
102

103 104 105 106
/* wait N seconds to allow attach from a debugger */
int			PostAuthDelay = 0;


107

108 109 110 111
/* ----------------
 *		private variables
 * ----------------
 */
112

113
/* max_stack_depth converted to bytes for speed of checking */
114
static long max_stack_depth_bytes = 100 * 1024L;
115

N
Neil Conway 已提交
116 117 118 119
/*
 * Stack base pointer -- initialized by PostgresMain. This is not static
 * so that PL/Java can modify it.
 */
B
Bruce Momjian 已提交
120
char	   *stack_base_ptr = NULL;
121

122 123 124 125 126 127
/*
 * On IA64 we also have to remember the register stack base.
 */
#if defined(__ia64__) || defined(__ia64)
char	   *register_stack_base_ptr = NULL;
#endif
128

129 130 131 132 133
/*
 * Flag to mark SIGHUP. Whenever the main loop comes around it
 * will reread the configuration file. (Better than doing the
 * reading in the signal handler, ey?)
 */
134
static volatile sig_atomic_t got_SIGHUP = false;
135

136 137 138 139 140 141
/*
 * Flag to keep track of whether we have started a transaction.
 * For extended query protocol this has to be remembered across messages.
 */
static bool xact_started = false;

142 143 144 145 146 147 148
/*
 * Flag to indicate that we are doing the outer loop's read-from-client,
 * as opposed to any random read from client that might happen within
 * commands like COPY FROM STDIN.
 */
static bool DoingCommandRead = false;

149 150 151 152 153 154 155 156 157 158 159 160
/*
 * Flags to implement skip-till-Sync-after-error behavior for messages of
 * the extended query protocol.
 */
static bool doing_extended_query_message = false;
static bool ignore_till_sync = false;

/*
 * If an unnamed prepared statement exists, it's stored here.
 * We keep it separate from the hashtable kept by commands/prepare.c
 * in order to reduce overhead for short-lived queries.
 */
161
static CachedPlanSource *unnamed_stmt_psrc = NULL;
B
Bruce Momjian 已提交
162

163
/* workspace for building a new unnamed statement in */
164 165 166
static MemoryContext unnamed_stmt_context = NULL;


167
/* assorted command-line switches */
B
Bruce Momjian 已提交
168
static const char *userDoption = NULL;	/* -D switch */
169

B
Bruce Momjian 已提交
170
static bool EchoQuery = false;	/* -E switch */
171 172 173 174

/*
 * people who want to use EOF should #define DONTUSENEWLINE in
 * tcop/tcopdebug.h
175 176
 */
#ifndef TCOP_DONTUSENEWLINE
B
Bruce Momjian 已提交
177
static int	UseNewLine = 1;		/* Use newlines query delimiters (the default) */
178
#else
179
static int	UseNewLine = 0;		/* Use EOF as query delimiters */
180
#endif   /* TCOP_DONTUSENEWLINE */
181

182
/* whether or not, and why, we were cancelled by conflict with recovery */
183
static bool RecoveryConflictPending = false;
184
static bool RecoveryConflictRetryable = true;
B
Bruce Momjian 已提交
185
static ProcSignalReason RecoveryConflictReason;
186 187

/* ----------------------------------------------------------------
188
 *		decls for routines only used in this file
189 190
 * ----------------------------------------------------------------
 */
191
static int	InteractiveBackend(StringInfo inBuf);
192
static int	interactive_getc(void);
193 194
static int	SocketBackend(StringInfo inBuf);
static int	ReadCommand(StringInfo inBuf);
195
static List *pg_rewrite_query(Query *query);
196
static bool check_log_statement(List *stmt_list);
197 198
static int	errdetail_execute(List *raw_parsetree_list);
static int	errdetail_params(ParamListInfo params);
B
Bruce Momjian 已提交
199 200
static int	errdetail_abort(void);
static int	errdetail_recovery_conflict(void);
201
static void start_xact_command(void);
202
static void finish_xact_command(void);
203 204 205
static bool IsTransactionExitStmt(Node *parsetree);
static bool IsTransactionExitStmtList(List *parseTrees);
static bool IsTransactionStmtList(List *parseTrees);
206
static void drop_unnamed_stmt(void);
207
static void SigHupHandler(SIGNAL_ARGS);
208
static void log_disconnections(int code, Datum arg);
209 210 211


/* ----------------------------------------------------------------
 *		routines to obtain user input
 * ----------------------------------------------------------------
 */

/* ----------------
217
 *	InteractiveBackend() is called for user interactive connections
218 219 220
 *
 *	the string entered by the user is placed in its parameter inBuf,
 *	and we act like a Q message was received.
221
 *
222
 *	EOF is returned if end-of-file input is seen; time to shut down.
223 224 225
 * ----------------
 */

226
static int
227
InteractiveBackend(StringInfo inBuf)
228
{
229 230 231
	int			c;				/* character read from getc() */
	bool		end = false;	/* end-of-input flag */
	bool		backslashSeen = false;	/* have we seen a \ ? */
232

233 234
	/*
	 * display a prompt and obtain input from the user
235
	 */
236
	printf("backend> ");
237
	fflush(stdout);
238

239
	resetStringInfo(inBuf);
240

241
	if (UseNewLine)
242
	{
243
		/*
B
Bruce Momjian 已提交
244 245
		 * if we are using \n as a delimiter, then read characters until the
		 * \n.
246 247
		 */
		while ((c = interactive_getc()) != EOF)
248
		{
249
			if (c == '\n')
250
			{
251
				if (backslashSeen)
252
				{
253 254 255 256
					/* discard backslash from inBuf */
					inBuf->data[--inBuf->len] = '\0';
					backslashSeen = false;
					continue;
257 258
				}
				else
259 260 261 262 263
				{
					/* keep the newline character */
					appendStringInfoChar(inBuf, '\n');
					break;
				}
264
			}
265 266 267 268
			else if (c == '\\')
				backslashSeen = true;
			else
				backslashSeen = false;
269

270
			appendStringInfoChar(inBuf, (char) c);
271 272
		}

273 274 275 276 277
		if (c == EOF)
			end = true;
	}
	else
	{
278
		/*
279
		 * otherwise read characters until EOF.
280
		 */
281 282 283 284 285 286
		while ((c = interactive_getc()) != EOF)
			appendStringInfoChar(inBuf, (char) c);

		/* No input before EOF signal means time to quit. */
		if (inBuf->len == 0)
			end = true;
287 288
	}

289 290 291 292 293 294 295
	if (end)
		return EOF;

	/*
	 * otherwise we have a user query so process it.
	 */

296 297 298
	/* Add '\0' to make it look the same as message case. */
	appendStringInfoChar(inBuf, (char) '\0');

299 300
	/*
	 * if the query echo flag was given, print the query..
301 302
	 */
	if (EchoQuery)
303
		printf("statement: %s\n", inBuf->data);
304
	fflush(stdout);
305

306
	return 'Q';
307 308
}

309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326
/*
 * interactive_getc -- fetch a single character from stdin
 *
 * Although no "client" process is on the other end here, we still want
 * signals (particularly SIGTERM/SIGQUIT) to be serviced while waiting
 * for input, so the read is bracketed with prepare_for_client_read()
 * and client_read_ended().
 *
 * Returns whatever getc() returned: the character read, or EOF.
 */
static int
interactive_getc(void)
{
	int			ch;

	prepare_for_client_read();

	ch = getc(stdin);

	client_read_ended();

	return ch;
}

327
/* ----------------
328
 *	SocketBackend()		Is called for frontend-backend connections
329
 *
330
 *	Returns the message type code, and loads message body data into inBuf.
331
 *
332
 *	EOF is returned if the connection is lost.
333 334
 * ----------------
 */
335
static int
336
SocketBackend(StringInfo inBuf)
337
{
338
	int			qtype;
339

340
	/*
341
	 * Get message type code from the frontend.
342
	 */
343
	qtype = pq_getbyte();
344

345 346
	if (qtype == EOF)			/* frontend disconnected */
	{
347 348 349
		ereport(COMMERROR,
				(errcode(ERRCODE_PROTOCOL_VIOLATION),
				 errmsg("unexpected EOF on client connection")));
350 351 352 353
		return qtype;
	}

	/*
B
Bruce Momjian 已提交
354 355 356
	 * Validate message type code before trying to read body; if we have lost
	 * sync, better to say "command unknown" than to run out of memory because
	 * we used garbage as a length word.
357
	 *
358 359
	 * This also gives us a place to set the doing_extended_query_message flag
	 * as soon as possible.
360
	 */
361
	switch (qtype)
362
	{
363
		case 'Q':				/* simple query */
364
			doing_extended_query_message = false;
365 366 367 368 369
			if (PG_PROTOCOL_MAJOR(FrontendProtocol) < 3)
			{
				/* old style without length word; convert */
				if (pq_getstring(inBuf))
				{
370 371
					ereport(COMMERROR,
							(errcode(ERRCODE_PROTOCOL_VIOLATION),
B
Bruce Momjian 已提交
372
							 errmsg("unexpected EOF on client connection")));
373 374 375
					return EOF;
				}
			}
376 377
			break;

378
		case 'F':				/* fastpath function call */
379 380
			/* we let fastpath.c cope with old-style input of this */
			doing_extended_query_message = false;
381
			break;
382

383
		case 'X':				/* terminate */
384
			doing_extended_query_message = false;
385
			ignore_till_sync = false;
386 387 388 389 390 391 392 393 394 395 396
			break;

		case 'B':				/* bind */
		case 'C':				/* close */
		case 'D':				/* describe */
		case 'E':				/* execute */
		case 'H':				/* flush */
		case 'P':				/* parse */
			doing_extended_query_message = true;
			/* these are only legal in protocol 3 */
			if (PG_PROTOCOL_MAJOR(FrontendProtocol) < 3)
397 398
				ereport(FATAL,
						(errcode(ERRCODE_PROTOCOL_VIOLATION),
B
Bruce Momjian 已提交
399
						 errmsg("invalid frontend message type %d", qtype)));
400 401 402 403 404 405 406 407 408
			break;

		case 'S':				/* sync */
			/* stop any active skip-till-Sync */
			ignore_till_sync = false;
			/* mark not-extended, so that a new error doesn't begin skip */
			doing_extended_query_message = false;
			/* only legal in protocol 3 */
			if (PG_PROTOCOL_MAJOR(FrontendProtocol) < 3)
409 410
				ereport(FATAL,
						(errcode(ERRCODE_PROTOCOL_VIOLATION),
B
Bruce Momjian 已提交
411
						 errmsg("invalid frontend message type %d", qtype)));
412
			break;
413

414 415 416
		case 'd':				/* copy data */
		case 'c':				/* copy done */
		case 'f':				/* copy fail */
417 418 419
			doing_extended_query_message = false;
			/* these are only legal in protocol 3 */
			if (PG_PROTOCOL_MAJOR(FrontendProtocol) < 3)
420 421
				ereport(FATAL,
						(errcode(ERRCODE_PROTOCOL_VIOLATION),
B
Bruce Momjian 已提交
422
						 errmsg("invalid frontend message type %d", qtype)));
423
			break;
424

425
		default:
B
Bruce Momjian 已提交
426

427
			/*
B
Bruce Momjian 已提交
428 429 430
			 * Otherwise we got garbage from the frontend.	We treat this as
			 * fatal because we have probably lost message boundary sync, and
			 * there's no good way to recover.
431
			 */
432 433 434
			ereport(FATAL,
					(errcode(ERRCODE_PROTOCOL_VIOLATION),
					 errmsg("invalid frontend message type %d", qtype)));
435
			break;
436
	}
437

438
	/*
B
Bruce Momjian 已提交
439 440 441
	 * In protocol version 3, all frontend messages have a length word next
	 * after the type code; we can read the message contents independently of
	 * the type.
442 443 444 445 446 447 448
	 */
	if (PG_PROTOCOL_MAJOR(FrontendProtocol) >= 3)
	{
		if (pq_getmessage(inBuf, 0))
			return EOF;			/* suitable message already logged */
	}

449
	return qtype;
450 451 452
}

/* ----------------
453
 *		ReadCommand reads a command from either the frontend or
454 455 456
 *		standard input, places it in inBuf, and returns the
 *		message type code (first byte of the message).
 *		EOF is returned if end of file.
457 458
 * ----------------
 */
459
static int
460
ReadCommand(StringInfo inBuf)
461
{
462
	int			result;
463

464
	if (whereToSendOutput == DestRemote)
465
		result = SocketBackend(inBuf);
466
	else
467 468
		result = InteractiveBackend(inBuf);
	return result;
469 470
}

471 472 473 474 475 476 477 478 479 480 481 482 483 484 485 486 487 488 489 490 491
/*
 * prepare_for_client_read -- set up to possibly block on client input
 *
 * This must be called immediately before any low-level read from the
 * client connection.  It is necessary to do it at a sufficiently low level
 * that there won't be any other operations except the read kernel call
 * itself between this call and the subsequent client_read_ended() call.
 * In particular there mustn't be use of malloc() or other potentially
 * non-reentrant libc functions.  This restriction makes it safe for us
 * to allow interrupt service routines to execute nontrivial code while
 * we are waiting for input.
 */
void
prepare_for_client_read(void)
{
	if (DoingCommandRead)
	{
		/* Enable immediate processing of asynchronous signals */
		EnableNotifyInterrupt();
		EnableCatchupInterrupt();

492
		/* Allow cancel/die interrupts to be processed while waiting */
493 494 495 496 497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514
		ImmediateInterruptOK = true;

		/* And don't forget to detect one that already arrived */
		CHECK_FOR_INTERRUPTS();
	}
}

/*
 * client_read_ended -- leave the client-input state
 *
 * Counterpart of prepare_for_client_read(): turns immediate interrupt
 * processing back off and disables the notify and catchup interrupts.
 * Does nothing unless DoingCommandRead is set.
 */
void
client_read_ended(void)
{
	/* Only the outer command-read loop enabled anything to undo. */
	if (!DoingCommandRead)
		return;

	ImmediateInterruptOK = false;

	DisableNotifyInterrupt();
	DisableCatchupInterrupt();
}

515

516 517 518 519 520 521 522 523 524 525 526 527 528
/*
 * Do raw parsing (only).
 *
 * A list of parsetrees is returned, since there might be multiple
 * commands in the given string.
 *
 * NOTE: for interactive queries, it is important to keep this routine
 * separate from the analysis & rewrite stages.  Analysis and rewriting
 * cannot be done in an aborted transaction, since they require access to
 * database tables.  So, we rely on the raw parser to determine whether
 * we've seen a COMMIT or ABORT command; when we are in abort state, other
 * commands are not processed any further than the raw parse stage.
 */
529
List *
530
pg_parse_query(const char *query_string)
531
{
532
	List	   *raw_parsetree_list;
533

534 535
	TRACE_POSTGRESQL_QUERY_PARSE_START(query_string);

B
Rename:  
Bruce Momjian 已提交
536
	if (log_parser_stats)
537 538
		ResetUsage();

539
	raw_parsetree_list = raw_parser(query_string);
540

541 542 543
	if (log_parser_stats)
		ShowUsage("PARSER STATISTICS");

544 545 546 547 548 549 550 551 552 553 554 555 556
#ifdef COPY_PARSE_PLAN_TREES
	/* Optional debugging check: pass raw parsetrees through copyObject() */
	{
		List	   *new_list = (List *) copyObject(raw_parsetree_list);

		/* This checks both copyObject() and the equal() routines... */
		if (!equal(new_list, raw_parsetree_list))
			elog(WARNING, "copyObject() failed to produce an equal raw parse tree");
		else
			raw_parsetree_list = new_list;
	}
#endif

557 558
	TRACE_POSTGRESQL_QUERY_PARSE_DONE(query_string);

559 560 561
	return raw_parsetree_list;
}

562
/*
563 564
 * Given a raw parsetree (gram.y output), and optionally information about
 * types of parameter symbols ($n), perform parse analysis and rule rewriting.
565 566 567 568 569 570
 *
 * A list of Query nodes is returned, since either the analyzer or the
 * rewriter might expand one query to several.
 *
 * NOTE: for reasons mentioned above, this must be separate from raw parsing.
 */
571
List *
572 573
pg_analyze_and_rewrite(Node *parsetree, const char *query_string,
					   Oid *paramTypes, int numParams)
574
{
575
	Query	   *query;
576 577
	List	   *querytree_list;

578 579
	TRACE_POSTGRESQL_QUERY_REWRITE_START(query_string);

580 581
	/*
	 * (1) Perform parse analysis.
582
	 */
B
Rename:  
Bruce Momjian 已提交
583
	if (log_parser_stats)
584 585
		ResetUsage();

586
	query = parse_analyze(parsetree, query_string, paramTypes, numParams);
587

B
Rename:  
Bruce Momjian 已提交
588
	if (log_parser_stats)
589
		ShowUsage("PARSE ANALYSIS STATISTICS");
590

591 592
	/*
	 * (2) Rewrite the queries, as necessary
593
	 */
594
	querytree_list = pg_rewrite_query(query);
595

596 597
	TRACE_POSTGRESQL_QUERY_REWRITE_DONE(query_string);

598 599 600
	return querytree_list;
}

601 602 603 604 605 606 607 608 609 610 611 612 613 614 615
/*
 * Do parse analysis and rewriting.  This is the same as pg_analyze_and_rewrite
 * except that external-parameter resolution is determined by parser callback
 * hooks instead of a fixed list of parameter datatypes.
 *
 * parserSetup is invoked with the freshly made ParseState and
 * parserSetupArg before the statement is transformed.
 */
List *
pg_analyze_and_rewrite_params(Node *parsetree,
							  const char *query_string,
							  ParserSetupHook parserSetup,
							  void *parserSetupArg)
{
	ParseState *pstate;
	Query	   *query;
	List	   *querytree_list;

	Assert(query_string != NULL);		/* required as of 8.4 */

	TRACE_POSTGRESQL_QUERY_REWRITE_START(query_string);

	/*
	 * (1) Perform parse analysis.
	 */
	if (log_parser_stats)
		ResetUsage();

	pstate = make_parsestate(NULL);
	pstate->p_sourcetext = query_string;
	(*parserSetup) (pstate, parserSetupArg);

	query = transformStmt(pstate, parsetree);

	free_parsestate(pstate);

	if (log_parser_stats)
		ShowUsage("PARSE ANALYSIS STATISTICS");

	/*
	 * (2) Rewrite the queries, as necessary
	 */
	querytree_list = pg_rewrite_query(query);

	TRACE_POSTGRESQL_QUERY_REWRITE_DONE(query_string);

	return querytree_list;
}

647
/*
648
 * Perform rewriting of a query produced by parse analysis.
649
 *
650 651
 * Note: query must just have come from the parser, because we do not do
 * AcquireRewriteLocks() on it.
652
 */
653
static List *
654
pg_rewrite_query(Query *query)
655
{
656
	List	   *querytree_list;
657

658
	if (Debug_print_parse)
659
		elog_node_display(LOG, "parse tree", query,
660
						  Debug_pretty_print);
661

662 663 664
	if (log_parser_stats)
		ResetUsage();

665 666 667 668 669 670 671 672 673
	if (query->commandType == CMD_UTILITY)
	{
		/* don't rewrite utilities, just dump 'em into result list */
		querytree_list = list_make1(query);
	}
	else
	{
		/* rewrite regular queries */
		querytree_list = QueryRewrite(query);
674 675
	}

B
Rename:  
Bruce Momjian 已提交
676
	if (log_parser_stats)
677
		ShowUsage("REWRITER STATISTICS");
678

679
#ifdef COPY_PARSE_PLAN_TREES
680 681 682
	/* Optional debugging check: pass querytree output through copyObject() */
	{
		List	   *new_list;
B
Bruce Momjian 已提交
683

684 685 686 687 688 689 690
		new_list = (List *) copyObject(querytree_list);
		/* This checks both copyObject() and the equal() routines... */
		if (!equal(new_list, querytree_list))
			elog(WARNING, "copyObject() failed to produce equal parse tree");
		else
			querytree_list = new_list;
	}
691 692
#endif

693
	if (Debug_print_rewritten)
694
		elog_node_display(LOG, "rewritten parse tree", querytree_list,
695
						  Debug_pretty_print);
696

697 698
	return querytree_list;
}
699 700


701 702 703 704
/*
 * Generate a plan for a single already-rewritten query.
 * This is a thin wrapper around planner() and takes the same parameters.
 */
705
PlannedStmt *
706
pg_plan_query(Query *querytree, int cursorOptions, ParamListInfo boundParams)
707
{
708
	PlannedStmt *plan;
709

710 711 712
	/* Utility commands have no plans. */
	if (querytree->commandType == CMD_UTILITY)
		return NULL;
713

714 715 716
	/* Planner must have a snapshot in case it calls user-defined functions. */
	Assert(ActiveSnapshotSet());

717 718
	TRACE_POSTGRESQL_QUERY_PLAN_START();

B
Rename:  
Bruce Momjian 已提交
719
	if (log_planner_stats)
720
		ResetUsage();
721

722
	/* call the optimizer */
723
	plan = planner(querytree, cursorOptions, boundParams);
724

B
Rename:  
Bruce Momjian 已提交
725
	if (log_planner_stats)
726
		ShowUsage("PLANNER STATISTICS");
727

728 729 730
#ifdef COPY_PARSE_PLAN_TREES
	/* Optional debugging check: pass plan output through copyObject() */
	{
731
		PlannedStmt *new_plan = (PlannedStmt *) copyObject(plan);
732

B
Bruce Momjian 已提交
733
		/*
B
Bruce Momjian 已提交
734 735
		 * equal() currently does not have routines to compare Plan nodes, so
		 * don't try to test equality here.  Perhaps fix someday?
736 737 738
		 */
#ifdef NOT_USED
		/* This checks both copyObject() and the equal() routines... */
B
Bruce Momjian 已提交
739
		if (!equal(new_plan, plan))
740
			elog(WARNING, "copyObject() failed to produce an equal plan tree");
741 742 743 744 745 746
		else
#endif
			plan = new_plan;
	}
#endif

747 748
	/*
	 * Print plan if debugging.
749
	 */
750
	if (Debug_print_plan)
751
		elog_node_display(LOG, "plan", plan, Debug_pretty_print);
752

753 754
	TRACE_POSTGRESQL_QUERY_PLAN_DONE();

755
	return plan;
756 757
}

758 759
/*
 * Generate plans for a list of already-rewritten queries.
760
 *
761 762
 * Normal optimizable statements generate PlannedStmt entries in the result
 * list.  Utility statements are simply represented by their statement nodes.
763 764
 */
List *
765
pg_plan_queries(List *querytrees, int cursorOptions, ParamListInfo boundParams)
766
{
767 768
	List	   *stmt_list = NIL;
	ListCell   *query_list;
769

770
	foreach(query_list, querytrees)
771
	{
772 773
		Query	   *query = (Query *) lfirst(query_list);
		Node	   *stmt;
774

775
		if (query->commandType == CMD_UTILITY)
776
		{
777 778 779 780 781
			/* Utility commands have no plans. */
			stmt = query->utilityStmt;
		}
		else
		{
782
			stmt = (Node *) pg_plan_query(query, cursorOptions, boundParams);
783 784
		}

785
		stmt_list = lappend(stmt_list, stmt);
786
	}
787

788
	return stmt_list;
789 790 791 792
}


/*
793
 * exec_simple_query
794
 *
795
 * Execute a "simple Query" protocol message.
796
 */
797
static void
798
exec_simple_query(const char *query_string)
799
{
B
Bruce Momjian 已提交
800
	CommandDest dest = whereToSendOutput;
801
	MemoryContext oldcontext;
802 803
	List	   *parsetree_list;
	ListCell   *parsetree_item;
804
	bool		save_log_statement_stats = log_statement_stats;
805
	bool		was_logged = false;
806
	bool		isTopLevel;
807
	char		msec_str[32];
B
Bruce Momjian 已提交
808

809

810 811 812
	/*
	 * Report query to various monitoring facilities.
	 */
813
	debug_query_string = query_string;
814

815 816
	pgstat_report_activity(query_string);

817 818
	TRACE_POSTGRESQL_QUERY_START(query_string);

819
	/*
820 821
	 * We use save_log_statement_stats so ShowUsage doesn't report incorrect
	 * results because ResetUsage wasn't called.
822
	 */
823 824 825
	if (save_log_statement_stats)
		ResetUsage();

826
	/*
B
Bruce Momjian 已提交
827 828
	 * Start up a transaction command.	All queries generated by the
	 * query_string will be in this same command block, *unless* we find a
B
Bruce Momjian 已提交
829 830 831
	 * BEGIN/COMMIT/ABORT statement; we have to force a new xact command after
	 * one of those, else bad things will happen in xact.c. (Note that this
	 * will normally change current memory context.)
832
	 */
833
	start_xact_command();
834 835

	/*
B
Bruce Momjian 已提交
836 837 838 839
	 * Zap any pre-existing unnamed statement.	(While not strictly necessary,
	 * it seems best to define simple-Query mode as if it used the unnamed
	 * statement and portal; this ensures we recover any storage used by prior
	 * unnamed operations.)
840
	 */
841
	drop_unnamed_stmt();
842

843 844 845
	/*
	 * Switch to appropriate context for constructing parsetrees.
	 */
846
	oldcontext = MemoryContextSwitchTo(MessageContext);
847

B
Bruce Momjian 已提交
848
	/*
B
Bruce Momjian 已提交
849 850
	 * Do basic parsing of the query or queries (this should be safe even if
	 * we are in aborted transaction state!)
851
	 */
852
	parsetree_list = pg_parse_query(query_string);
853

854
	/* Log immediately if dictated by log_statement */
855
	if (check_log_statement(parsetree_list))
856 857 858
	{
		ereport(LOG,
				(errmsg("statement: %s", query_string),
859
				 errhidestmt(true),
860 861 862
				 errdetail_execute(parsetree_list)));
		was_logged = true;
	}
863

864
	/*
865
	 * Switch back to transaction context to enter the loop.
866 867 868
	 */
	MemoryContextSwitchTo(oldcontext);

869
	/*
B
Bruce Momjian 已提交
870 871 872 873
	 * We'll tell PortalRun it's a top-level command iff there's exactly one
	 * raw parsetree.  If more than one, it's effectively a transaction block
	 * and we want PreventTransactionChain to reject unsafe commands. (Note:
	 * we're assuming that query rewrite cannot add commands that are
874 875 876 877
	 * significant to PreventTransactionChain.)
	 */
	isTopLevel = (list_length(parsetree_list) == 1);

878
	/*
879
	 * Run through the raw parsetree(s) and process each one.
880
	 */
881
	foreach(parsetree_item, parsetree_list)
882
	{
B
Bruce Momjian 已提交
883
		Node	   *parsetree = (Node *) lfirst(parsetree_item);
884
		bool		snapshot_set = false;
885 886
		const char *commandTag;
		char		completionTag[COMPLETION_TAG_BUFSIZE];
B
Bruce Momjian 已提交
887
		List	   *querytree_list,
888 889
				   *plantree_list;
		Portal		portal;
890 891
		DestReceiver *receiver;
		int16		format;
892

893
		/*
B
Bruce Momjian 已提交
894 895 896 897
		 * Get the command name for use in status display (it also becomes the
		 * default completion tag, down inside PortalRun).	Set ps_status and
		 * do any special start-of-SQL-command processing needed by the
		 * destination.
898 899 900
		 */
		commandTag = CreateCommandTag(parsetree);

901
		set_ps_display(commandTag, false);
902

903
		BeginCommand(commandTag, dest);
904

905
		/*
906
		 * If we are in an aborted transaction, reject all commands except
B
Bruce Momjian 已提交
907 908 909 910 911
		 * COMMIT/ABORT.  It is important that this test occur before we try
		 * to do parse analysis, rewrite, or planning, since all those phases
		 * try to do database accesses, which may fail in abort state. (It
		 * might be safe to allow some additional utility commands in this
		 * state, but not many...)
912
		 */
913 914 915 916 917
		if (IsAbortedTransactionBlockState() &&
			!IsTransactionExitStmt(parsetree))
			ereport(ERROR,
					(errcode(ERRCODE_IN_FAILED_SQL_TRANSACTION),
					 errmsg("current transaction is aborted, "
B
Bruce Momjian 已提交
918
						  "commands ignored until end of transaction block"),
919
					 errdetail_abort()));
920

921
		/* Make sure we are in a transaction command */
922
		start_xact_command();
923

924
		/* If we got a cancel signal in parsing or prior command, quit */
925
		CHECK_FOR_INTERRUPTS();
926

927 928 929 930 931 932 933 934 935
		/*
		 * Set up a snapshot if parse analysis/planning will need one.
		 */
		if (analyze_requires_snapshot(parsetree))
		{
			PushActiveSnapshot(GetTransactionSnapshot());
			snapshot_set = true;
		}

936
		/*
937
		 * OK to analyze, rewrite, and plan this query.
938
		 *
B
Bruce Momjian 已提交
939 940
		 * Switch to appropriate context for constructing querytrees (again,
		 * these must outlive the execution context).
941
		 */
942
		oldcontext = MemoryContextSwitchTo(MessageContext);
943

944 945
		querytree_list = pg_analyze_and_rewrite(parsetree, query_string,
												NULL, 0);
V
Vadim B. Mikheev 已提交
946

947
		plantree_list = pg_plan_queries(querytree_list, 0, NULL);
948 949 950 951

		/* Done with the snapshot used for parsing/planning */
		if (snapshot_set)
			PopActiveSnapshot();
952 953 954 955

		/* If we got a cancel signal in analysis or planning, quit */
		CHECK_FOR_INTERRUPTS();

956
		/*
B
Bruce Momjian 已提交
957 958
		 * Create unnamed portal to run the query or queries in. If there
		 * already is one, silently drop it.
959
		 */
960
		portal = CreatePortal("", true, true);
961 962
		/* Don't display the portal in pg_cursors */
		portal->visible = false;
963

964 965
		/*
		 * We don't have to copy anything into the portal, because everything
966
		 * we are passing here is in MessageContext, which will outlive the
967 968
		 * portal anyway.
		 */
969
		PortalDefineQuery(portal,
970
						  NULL,
971 972 973
						  query_string,
						  commandTag,
						  plantree_list,
974
						  NULL);
975

976
		/*
977
		 * Start the portal.  No parameters here.
978
		 */
979
		PortalStart(portal, NULL, InvalidSnapshot);
980

981
		/*
B
Bruce Momjian 已提交
982 983 984 985
		 * Select the appropriate output format: text unless we are doing a
		 * FETCH from a binary cursor.	(Pretty grotty to have to do this here
		 * --- but it avoids grottiness in other places.  Ah, the joys of
		 * backward compatibility...)
986 987 988 989 990 991 992 993 994 995 996 997
		 */
		format = 0;				/* TEXT is default */
		if (IsA(parsetree, FetchStmt))
		{
			FetchStmt  *stmt = (FetchStmt *) parsetree;

			if (!stmt->ismove)
			{
				Portal		fportal = GetPortalByName(stmt->portalname);

				if (PortalIsValid(fportal) &&
					(fportal->cursorOptions & CURSOR_OPT_BINARY))
B
Bruce Momjian 已提交
998
					format = 1; /* BINARY */
999 1000 1001 1002 1003 1004 1005
			}
		}
		PortalSetResultFormat(portal, 1, &format);

		/*
		 * Now we can create the destination receiver object.
		 */
1006 1007 1008
		receiver = CreateDestReceiver(dest);
		if (dest == DestRemote)
			SetRemoteDestReceiverParams(receiver, portal);
1009 1010 1011 1012 1013 1014 1015

		/*
		 * Switch back to transaction context for execution.
		 */
		MemoryContextSwitchTo(oldcontext);

		/*
B
Bruce Momjian 已提交
1016
		 * Run the portal to completion, and then drop it (and the receiver).
1017
		 */
1018 1019
		(void) PortalRun(portal,
						 FETCH_ALL,
1020
						 isTopLevel,
1021 1022
						 receiver,
						 receiver,
1023
						 completionTag);
1024

1025
		(*receiver->rDestroy) (receiver);
1026

1027
		PortalDrop(portal, false);
1028

1029
		if (IsA(parsetree, TransactionStmt))
1030
		{
1031
			/*
B
Bruce Momjian 已提交
1032 1033
			 * If this was a transaction control statement, commit it. We will
			 * start a new xact command for the next command (if any).
1034
			 */
1035
			finish_xact_command();
1036
		}
1037
		else if (lnext(parsetree_item) == NULL)
1038
		{
1039
			/*
B
Bruce Momjian 已提交
1040 1041 1042 1043 1044 1045 1046 1047
			 * If this is the last parsetree of the query string, close down
			 * transaction statement before reporting command-complete.  This
			 * is so that any end-of-transaction errors are reported before
			 * the command-complete message is issued, to avoid confusing
			 * clients who will expect either a command-complete message or an
			 * error, not one and then the other.  But for compatibility with
			 * historical Postgres behavior, we do not force a transaction
			 * boundary between queries appearing in a single query string.
1048
			 */
1049
			finish_xact_command();
1050
		}
1051
		else
1052
		{
1053
			/*
B
Bruce Momjian 已提交
1054 1055
			 * We need a CommandCounterIncrement after every query, except
			 * those that start or end a transaction block.
1056 1057
			 */
			CommandCounterIncrement();
1058
		}
1059 1060

		/*
B
Bruce Momjian 已提交
1061 1062 1063 1064
		 * Tell client that we're done with this query.  Note we emit exactly
		 * one EndCommand report for each raw parsetree, thus one for each SQL
		 * command the client sent, regardless of rewriting. (But a command
		 * aborted by error will not send an EndCommand report at all.)
1065
		 */
1066
		EndCommand(completionTag, dest);
B
Bruce Momjian 已提交
1067
	}							/* end loop over parsetrees */
1068

1069 1070 1071
	/*
	 * Close down transaction statement, if one is open.
	 */
1072
	finish_xact_command();
1073

1074 1075 1076
	/*
	 * If there were no parsetrees, return EmptyQueryResponse message.
	 */
1077
	if (!parsetree_list)
1078 1079
		NullCommand(dest);

1080
	/*
1081
	 * Emit duration logging if appropriate.
1082
	 */
1083
	switch (check_log_duration(msec_str, was_logged))
1084
	{
1085
		case 1:
1086
			ereport(LOG,
1087 1088
					(errmsg("duration: %s ms", msec_str),
					 errhidestmt(true)));
1089 1090
			break;
		case 2:
1091 1092 1093
			ereport(LOG,
					(errmsg("duration: %s ms  statement: %s",
							msec_str, query_string),
1094
					 errhidestmt(true),
1095
					 errdetail_execute(parsetree_list)));
1096
			break;
1097
	}
1098

1099 1100 1101
	if (save_log_statement_stats)
		ShowUsage("QUERY STATISTICS");

1102 1103
	TRACE_POSTGRESQL_QUERY_DONE(query_string);

1104
	debug_query_string = NULL;
1105 1106
}

1107 1108 1109 1110 1111 1112 1113 1114
/*
 * exec_parse_message
 *
 * Execute a "Parse" protocol message.
 */
static void
exec_parse_message(const char *query_string,	/* string to execute */
				   const char *stmt_name,		/* name for prepared stmt */
B
Bruce Momjian 已提交
1115 1116
				   Oid *paramTypes,		/* parameter types */
				   int numParams)		/* number of parameters */
1117 1118 1119
{
	MemoryContext oldcontext;
	List	   *parsetree_list;
1120
	Node	   *raw_parse_tree;
1121 1122
	const char *commandTag;
	List	   *querytree_list,
1123
			   *stmt_list;
1124
	bool		is_named;
1125
	bool		fully_planned;
1126
	bool		save_log_statement_stats = log_statement_stats;
1127
	char		msec_str[32];
1128 1129 1130 1131 1132 1133 1134 1135

	/*
	 * Report query to various monitoring facilities.
	 */
	debug_query_string = query_string;

	pgstat_report_activity(query_string);

1136
	set_ps_display("PARSE", false);
1137 1138 1139 1140

	if (save_log_statement_stats)
		ResetUsage();

1141 1142 1143 1144
	ereport(DEBUG2,
			(errmsg("parse %s: %s",
					*stmt_name ? stmt_name : "<unnamed>",
					query_string)));
1145

1146
	/*
B
Bruce Momjian 已提交
1147 1148 1149
	 * Start up a transaction command so we can run parse analysis etc. (Note
	 * that this will normally change current memory context.) Nothing happens
	 * if we are already in one.
1150
	 */
1151
	start_xact_command();
1152 1153 1154 1155

	/*
	 * Switch to appropriate context for constructing parsetrees.
	 *
B
Bruce Momjian 已提交
1156 1157 1158
	 * We have two strategies depending on whether the prepared statement is
	 * named or not.  For a named prepared statement, we do parsing in
	 * MessageContext and copy the finished trees into the prepared
1159
	 * statement's plancache entry; then the reset of MessageContext releases
B
Bruce Momjian 已提交
1160 1161 1162
	 * temporary space used by parsing and planning.  For an unnamed prepared
	 * statement, we assume the statement isn't going to hang around long, so
	 * getting rid of temp space quickly is probably not worth the costs of
1163 1164
	 * copying parse/plan trees.  So in this case, we create the plancache
	 * entry's context here, and do all the parsing work therein.
1165 1166 1167 1168 1169 1170 1171 1172 1173 1174
	 */
	is_named = (stmt_name[0] != '\0');
	if (is_named)
	{
		/* Named prepared statement --- parse in MessageContext */
		oldcontext = MemoryContextSwitchTo(MessageContext);
	}
	else
	{
		/* Unnamed prepared statement --- release any prior unnamed stmt */
1175 1176
		drop_unnamed_stmt();
		/* Create context for parsing/planning */
1177
		unnamed_stmt_context =
1178
			AllocSetContextCreate(CacheMemoryContext,
1179 1180 1181 1182 1183 1184 1185 1186
								  "unnamed prepared statement",
								  ALLOCSET_DEFAULT_MINSIZE,
								  ALLOCSET_DEFAULT_INITSIZE,
								  ALLOCSET_DEFAULT_MAXSIZE);
		oldcontext = MemoryContextSwitchTo(unnamed_stmt_context);
	}

	/*
B
Bruce Momjian 已提交
1187 1188
	 * Do basic parsing of the query or queries (this should be safe even if
	 * we are in aborted transaction state!)
1189 1190 1191 1192
	 */
	parsetree_list = pg_parse_query(query_string);

	/*
B
Bruce Momjian 已提交
1193 1194 1195
	 * We only allow a single user statement in a prepared statement. This is
	 * mainly to keep the protocol simple --- otherwise we'd need to worry
	 * about multiple result tupdescs and things like that.
1196
	 */
1197
	if (list_length(parsetree_list) > 1)
1198 1199
		ereport(ERROR,
				(errcode(ERRCODE_SYNTAX_ERROR),
B
Bruce Momjian 已提交
1200
		errmsg("cannot insert multiple commands into a prepared statement")));
1201 1202 1203

	if (parsetree_list != NIL)
	{
1204
		Query	   *query;
1205
		bool		snapshot_set = false;
B
Bruce Momjian 已提交
1206
		int			i;
1207

1208 1209
		raw_parse_tree = (Node *) linitial(parsetree_list);

1210 1211 1212
		/*
		 * Get the command name for possible use in status display.
		 */
1213
		commandTag = CreateCommandTag(raw_parse_tree);
1214 1215 1216

		/*
		 * If we are in an aborted transaction, reject all commands except
B
Bruce Momjian 已提交
1217 1218 1219 1220 1221
		 * COMMIT/ROLLBACK.  It is important that this test occur before we
		 * try to do parse analysis, rewrite, or planning, since all those
		 * phases try to do database accesses, which may fail in abort state.
		 * (It might be safe to allow some additional utility commands in this
		 * state, but not many...)
1222
		 */
1223
		if (IsAbortedTransactionBlockState() &&
1224
			!IsTransactionExitStmt(raw_parse_tree))
1225 1226 1227
			ereport(ERROR,
					(errcode(ERRCODE_IN_FAILED_SQL_TRANSACTION),
					 errmsg("current transaction is aborted, "
B
Bruce Momjian 已提交
1228
						  "commands ignored until end of transaction block"),
1229
					 errdetail_abort()));
1230

1231 1232 1233 1234 1235 1236 1237 1238 1239
		/*
		 * Set up a snapshot if parse analysis/planning will need one.
		 */
		if (analyze_requires_snapshot(raw_parse_tree))
		{
			PushActiveSnapshot(GetTransactionSnapshot());
			snapshot_set = true;
		}

1240 1241
		/*
		 * OK to analyze, rewrite, and plan this query.  Note that the
B
Bruce Momjian 已提交
1242 1243
		 * originally specified parameter set is not required to be complete,
		 * so we have to use parse_analyze_varparams().
1244
		 *
B
Bruce Momjian 已提交
1245 1246
		 * XXX must use copyObject here since parse analysis scribbles on its
		 * input, and we need the unmodified raw parse tree for possible
1247
		 * replanning later.
1248 1249 1250 1251
		 */
		if (log_parser_stats)
			ResetUsage();

1252 1253 1254 1255
		query = parse_analyze_varparams(copyObject(raw_parse_tree),
										query_string,
										&paramTypes,
										&numParams);
1256 1257

		/*
1258
		 * Check all parameter types got determined.
1259 1260 1261
		 */
		for (i = 0; i < numParams; i++)
		{
B
Bruce Momjian 已提交
1262
			Oid			ptype = paramTypes[i];
1263 1264

			if (ptype == InvalidOid || ptype == UNKNOWNOID)
1265 1266
				ereport(ERROR,
						(errcode(ERRCODE_INDETERMINATE_DATATYPE),
B
Bruce Momjian 已提交
1267 1268
					 errmsg("could not determine data type of parameter $%d",
							i + 1)));
1269 1270 1271 1272 1273
		}

		if (log_parser_stats)
			ShowUsage("PARSE ANALYSIS STATISTICS");

1274
		querytree_list = pg_rewrite_query(query);
1275

1276
		/*
B
Bruce Momjian 已提交
1277 1278
		 * If this is the unnamed statement and it has parameters, defer query
		 * planning until Bind.  Otherwise do it now.
1279 1280
		 */
		if (!is_named && numParams > 0)
1281 1282 1283 1284
		{
			stmt_list = querytree_list;
			fully_planned = false;
		}
1285
		else
1286
		{
1287
			stmt_list = pg_plan_queries(querytree_list, 0, NULL);
1288 1289
			fully_planned = true;
		}
1290 1291 1292 1293

		/* Done with the snapshot used for parsing/planning */
		if (snapshot_set)
			PopActiveSnapshot();
1294 1295 1296
	}
	else
	{
B
Bruce Momjian 已提交
1297
		/* Empty input string.	This is legal. */
1298
		raw_parse_tree = NULL;
1299
		commandTag = NULL;
1300 1301
		stmt_list = NIL;
		fully_planned = true;
1302 1303 1304 1305 1306 1307 1308 1309 1310 1311 1312
	}

	/* If we got a cancel signal in analysis or planning, quit */
	CHECK_FOR_INTERRUPTS();

	/*
	 * Store the query as a prepared statement.  See above comments.
	 */
	if (is_named)
	{
		StorePreparedStatement(stmt_name,
1313
							   raw_parse_tree,
1314 1315
							   query_string,
							   commandTag,
1316 1317
							   paramTypes,
							   numParams,
B
Bruce Momjian 已提交
1318
							   0,		/* default cursor options */
1319
							   stmt_list,
1320
							   false);
1321 1322 1323
	}
	else
	{
1324 1325 1326 1327
		/*
		 * paramTypes and query_string need to be copied into
		 * unnamed_stmt_context.  The rest is there already
		 */
B
Bruce Momjian 已提交
1328
		Oid		   *newParamTypes;
1329 1330 1331 1332 1333 1334 1335 1336 1337

		if (numParams > 0)
		{
			newParamTypes = (Oid *) palloc(numParams * sizeof(Oid));
			memcpy(newParamTypes, paramTypes, numParams * sizeof(Oid));
		}
		else
			newParamTypes = NULL;

1338 1339 1340
		unnamed_stmt_psrc = FastCreateCachedPlan(raw_parse_tree,
												 pstrdup(query_string),
												 commandTag,
1341
												 newParamTypes,
1342
												 numParams,
B
Bruce Momjian 已提交
1343
												 0,		/* cursor options */
1344 1345 1346 1347 1348 1349
												 stmt_list,
												 fully_planned,
												 true,
												 unnamed_stmt_context);
		/* context now belongs to the plancache entry */
		unnamed_stmt_context = NULL;
1350 1351 1352 1353 1354
	}

	MemoryContextSwitchTo(oldcontext);

	/*
B
Bruce Momjian 已提交
1355 1356 1357
	 * We do NOT close the open transaction command here; that only happens
	 * when the client sends Sync.	Instead, do CommandCounterIncrement just
	 * in case something happened during parse/plan.
1358 1359 1360 1361 1362 1363
	 */
	CommandCounterIncrement();

	/*
	 * Send ParseComplete.
	 */
1364
	if (whereToSendOutput == DestRemote)
1365 1366
		pq_putemptymessage('1');

1367 1368 1369
	/*
	 * Emit duration logging if appropriate.
	 */
1370 1371 1372 1373
	switch (check_log_duration(msec_str, false))
	{
		case 1:
			ereport(LOG,
1374 1375
					(errmsg("duration: %s ms", msec_str),
					 errhidestmt(true)));
1376 1377 1378 1379 1380 1381
			break;
		case 2:
			ereport(LOG,
					(errmsg("duration: %s ms  parse %s: %s",
							msec_str,
							*stmt_name ? stmt_name : "<unnamed>",
1382 1383
							query_string),
					 errhidestmt(true)));
1384 1385
			break;
	}
1386

1387 1388 1389 1390 1391 1392 1393 1394 1395 1396 1397 1398 1399 1400 1401 1402
	if (save_log_statement_stats)
		ShowUsage("PARSE MESSAGE STATISTICS");

	debug_query_string = NULL;
}

/*
 * exec_bind_message
 *
 * Process a "Bind" message to create a portal from a prepared statement
 *
 * input_message holds the body of the Bind message, which is consumed in
 * this order: portal name, statement name, parameter format codes, the
 * parameter values themselves, and result format codes.  An empty statement
 * name selects the unnamed prepared statement; an empty portal name selects
 * the unnamed portal, which is the only portal that may be silently
 * replaced.
 *
 * Parameter values are converted with the type's text or binary input
 * function and stored in the portal's memory context.  If the statement was
 * not fully planned at Parse time, it is planned here using the concrete
 * parameter values.  BindComplete is sent only when output is going to a
 * remote client.
 */
static void
exec_bind_message(StringInfo input_message)
{
	const char *portal_name;
	const char *stmt_name;
	int			numPFormats;
	int16	   *pformats = NULL;
	int			numParams;
	int			numRFormats;
	int16	   *rformats = NULL;
	CachedPlanSource *psrc;
	CachedPlan *cplan;
	Portal		portal;
	char	   *query_string;
	char	   *saved_stmt_name;
	ParamListInfo params;
	List	   *plan_list;
	MemoryContext oldContext;
	bool		save_log_statement_stats = log_statement_stats;
	bool		snapshot_set = false;
	char		msec_str[32];

	/* Get the fixed part of the message */
	portal_name = pq_getmsgstring(input_message);
	stmt_name = pq_getmsgstring(input_message);

	ereport(DEBUG2,
			(errmsg("bind %s to %s",
					*portal_name ? portal_name : "<unnamed>",
					*stmt_name ? stmt_name : "<unnamed>")));

	/* Find prepared statement */
	if (stmt_name[0] != '\0')
	{
		PreparedStatement *pstmt;

		pstmt = FetchPreparedStatement(stmt_name, true);
		psrc = pstmt->plansource;
	}
	else
	{
		/* Unnamed statements are re-prepared for every bind */
		psrc = unnamed_stmt_psrc;
		if (!psrc)
			ereport(ERROR,
					(errcode(ERRCODE_UNDEFINED_PSTATEMENT),
					 errmsg("unnamed prepared statement does not exist")));
	}

	/*
	 * Report query to various monitoring facilities.
	 */
	debug_query_string = psrc->query_string;

	pgstat_report_activity(psrc->query_string);

	set_ps_display("BIND", false);

	if (save_log_statement_stats)
		ResetUsage();

	/*
	 * Start up a transaction command so we can call functions etc. (Note that
	 * this will normally change current memory context.) Nothing happens if
	 * we are already in one.
	 */
	start_xact_command();

	/* Switch back to message context */
	MemoryContextSwitchTo(MessageContext);

	/* Get the parameter format codes */
	numPFormats = pq_getmsgint(input_message, 2);
	if (numPFormats > 0)
	{
		int			i;

		pformats = (int16 *) palloc(numPFormats * sizeof(int16));
		for (i = 0; i < numPFormats; i++)
			pformats[i] = pq_getmsgint(input_message, 2);
	}

	/* Get the parameter value count */
	numParams = pq_getmsgint(input_message, 2);

	/*
	 * Zero format codes means "all text" and one means "applies to all
	 * parameters"; only a longer list has to match the parameter count.
	 */
	if (numPFormats > 1 && numPFormats != numParams)
		ereport(ERROR,
				(errcode(ERRCODE_PROTOCOL_VIOLATION),
			errmsg("bind message has %d parameter formats but %d parameters",
				   numPFormats, numParams)));

	if (numParams != psrc->num_params)
		ereport(ERROR,
				(errcode(ERRCODE_PROTOCOL_VIOLATION),
				 errmsg("bind message supplies %d parameters, but prepared statement \"%s\" requires %d",
						numParams, stmt_name, psrc->num_params)));

	/*
	 * If we are in aborted transaction state, the only portals we can
	 * actually run are those containing COMMIT or ROLLBACK commands. We
	 * disallow binding anything else to avoid problems with infrastructure
	 * that expects to run inside a valid transaction.  We also disallow
	 * binding any parameters, since we can't risk calling user-defined I/O
	 * functions.
	 */
	if (IsAbortedTransactionBlockState() &&
		(!IsTransactionExitStmt(psrc->raw_parse_tree) ||
		 numParams != 0))
		ereport(ERROR,
				(errcode(ERRCODE_IN_FAILED_SQL_TRANSACTION),
				 errmsg("current transaction is aborted, "
						"commands ignored until end of transaction block"),
				 errdetail_abort()));

	/*
	 * Create the portal.  Allow silent replacement of an existing portal only
	 * if the unnamed portal is specified.
	 */
	if (portal_name[0] == '\0')
		portal = CreatePortal(portal_name, true, true);
	else
		portal = CreatePortal(portal_name, false, false);

	/*
	 * Prepare to copy stuff into the portal's memory context.  We do all this
	 * copying first, because it could possibly fail (out-of-memory) and we
	 * don't want a failure to occur between RevalidateCachedPlan and
	 * PortalDefineQuery; that would result in leaking our plancache refcount.
	 */
	oldContext = MemoryContextSwitchTo(PortalGetHeapMemory(portal));

	/* Copy the plan's query string into the portal */
	query_string = pstrdup(psrc->query_string);

	/* Likewise make a copy of the statement name, unless it's unnamed */
	if (stmt_name[0])
		saved_stmt_name = pstrdup(stmt_name);
	else
		saved_stmt_name = NULL;

	/*
	 * Set a snapshot if we have parameters to fetch (since the input
	 * functions might need it) or the query isn't a utility command (and
	 * hence could require redoing parse analysis and planning).
	 */
	if (numParams > 0 || analyze_requires_snapshot(psrc->raw_parse_tree))
	{
		PushActiveSnapshot(GetTransactionSnapshot());
		snapshot_set = true;
	}

	/*
	 * Fetch parameters, if any, and store in the portal's memory context.
	 */
	if (numParams > 0)
	{
		int			paramno;

		/* sizeof(ParamListInfoData) includes the first array element */
		params = (ParamListInfo) palloc(sizeof(ParamListInfoData) +
								  (numParams - 1) * sizeof(ParamExternData));
		/* we have static list of params, so no hooks needed */
		params->paramFetch = NULL;
		params->paramFetchArg = NULL;
		params->parserSetup = NULL;
		params->parserSetupArg = NULL;
		params->numParams = numParams;

		for (paramno = 0; paramno < numParams; paramno++)
		{
			Oid			ptype = psrc->param_types[paramno];
			int32		plength;
			Datum		pval;
			bool		isNull;
			StringInfoData pbuf;
			char		csave;
			int16		pformat;

			/* A length of -1 denotes a NULL parameter value */
			plength = pq_getmsgint(input_message, 4);
			isNull = (plength == -1);

			if (!isNull)
			{
				const char *pvalue = pq_getmsgbytes(input_message, plength);

				/*
				 * Rather than copying data around, we just set up a phony
				 * StringInfo pointing to the correct portion of the message
				 * buffer.  We assume we can scribble on the message buffer so
				 * as to maintain the convention that StringInfos have a
				 * trailing null.  This is grotty but is a big win when
				 * dealing with very large parameter strings.
				 */
				pbuf.data = (char *) pvalue;
				pbuf.maxlen = plength + 1;
				pbuf.len = plength;
				pbuf.cursor = 0;

				/* Remember the overwritten byte so it can be restored below */
				csave = pbuf.data[plength];
				pbuf.data[plength] = '\0';
			}
			else
			{
				pbuf.data = NULL;		/* keep compiler quiet */
				csave = 0;
			}

			if (numPFormats > 1)
				pformat = pformats[paramno];
			else if (numPFormats > 0)
				pformat = pformats[0];
			else
				pformat = 0;	/* default = text */

			if (pformat == 0)	/* text mode */
			{
				Oid			typinput;
				Oid			typioparam;
				char	   *pstring;

				getTypeInputInfo(ptype, &typinput, &typioparam);

				/*
				 * We have to do encoding conversion before calling the
				 * typinput routine.
				 */
				if (isNull)
					pstring = NULL;
				else
					pstring = pg_client_to_server(pbuf.data, plength);

				pval = OidInputFunctionCall(typinput, pstring, typioparam, -1);

				/* Free result of encoding conversion, if any */
				if (pstring && pstring != pbuf.data)
					pfree(pstring);
			}
			else if (pformat == 1)		/* binary mode */
			{
				Oid			typreceive;
				Oid			typioparam;
				StringInfo	bufptr;

				/*
				 * Call the parameter type's binary input converter
				 */
				getTypeBinaryInputInfo(ptype, &typreceive, &typioparam);

				if (isNull)
					bufptr = NULL;
				else
					bufptr = &pbuf;

				pval = OidReceiveFunctionCall(typreceive, bufptr, typioparam, -1);

				/* Trouble if it didn't eat the whole buffer */
				if (!isNull && pbuf.cursor != pbuf.len)
					ereport(ERROR,
							(errcode(ERRCODE_INVALID_BINARY_REPRESENTATION),
							 errmsg("incorrect binary data format in bind parameter %d",
									paramno + 1)));
			}
			else
			{
				ereport(ERROR,
						(errcode(ERRCODE_INVALID_PARAMETER_VALUE),
						 errmsg("unsupported format code: %d",
								pformat)));
				pval = 0;		/* keep compiler quiet */
			}

			/* Restore message buffer contents */
			if (!isNull)
				pbuf.data[plength] = csave;

			params->params[paramno].value = pval;
			params->params[paramno].isnull = isNull;

			/*
			 * We mark the params as CONST.  This has no effect if we already
			 * did planning, but if we didn't, it licenses the planner to
			 * substitute the parameters directly into the one-shot plan we
			 * will generate below.
			 */
			params->params[paramno].pflags = PARAM_FLAG_CONST;
			params->params[paramno].ptype = ptype;
		}
	}
	else
		params = NULL;

	/* Done storing stuff in portal's context */
	MemoryContextSwitchTo(oldContext);

	/* Get the result format codes */
	numRFormats = pq_getmsgint(input_message, 2);
	if (numRFormats > 0)
	{
		int			i;

		rformats = (int16 *) palloc(numRFormats * sizeof(int16));
		for (i = 0; i < numRFormats; i++)
			rformats[i] = pq_getmsgint(input_message, 2);
	}

	pq_getmsgend(input_message);

	if (psrc->fully_planned)
	{
		/*
		 * Revalidate the cached plan; this may result in replanning.  Any
		 * cruft will be generated in MessageContext.  The plan refcount will
		 * be assigned to the Portal, so it will be released at portal
		 * destruction.
		 */
		cplan = RevalidateCachedPlan(psrc, false);
		plan_list = cplan->stmt_list;
	}
	else
	{
		List	   *query_list;

		/*
		 * Revalidate the cached plan; this may result in redoing parse
		 * analysis and rewriting (but not planning).  Any cruft will be
		 * generated in MessageContext.  The plan refcount is assigned to
		 * CurrentResourceOwner.
		 */
		cplan = RevalidateCachedPlan(psrc, true);

		/*
		 * We didn't plan the query before, so do it now.  This allows the
		 * planner to make use of the concrete parameter values we now have.
		 * Because we use PARAM_FLAG_CONST, the plan is good only for this set
		 * of param values, and so we generate the plan in the portal's own
		 * memory context where it will be thrown away after use. As in
		 * exec_parse_message, we make no attempt to recover planner temporary
		 * memory until the end of the operation.
		 *
		 * XXX because the planner has a bad habit of scribbling on its input,
		 * we have to make a copy of the parse trees.  FIXME someday.
		 */
		oldContext = MemoryContextSwitchTo(PortalGetHeapMemory(portal));
		query_list = copyObject(cplan->stmt_list);
		plan_list = pg_plan_queries(query_list, 0, params);
		MemoryContextSwitchTo(oldContext);

		/* We no longer need the cached plan refcount ... */
		ReleaseCachedPlan(cplan, true);
		/* ... and we don't want the portal to depend on it, either */
		cplan = NULL;
	}

	/*
	 * Now we can define the portal.
	 *
	 * DO NOT put any code that could possibly throw an error between the
	 * above "RevalidateCachedPlan(psrc, false)" call and here.
	 */
	PortalDefineQuery(portal,
					  saved_stmt_name,
					  query_string,
					  psrc->commandTag,
					  plan_list,
					  cplan);

	/* Done with the snapshot used for parameter I/O and parsing/planning */
	if (snapshot_set)
		PopActiveSnapshot();

	/*
	 * And we're ready to start portal execution.
	 */
	PortalStart(portal, params, InvalidSnapshot);

	/*
	 * Apply the result format requests to the portal.
	 */
	PortalSetResultFormat(portal, numRFormats, rformats);

	/*
	 * Send BindComplete.
	 */
	if (whereToSendOutput == DestRemote)
		pq_putemptymessage('2');

	/*
	 * Emit duration logging if appropriate.
	 */
	switch (check_log_duration(msec_str, false))
	{
		case 1:
			ereport(LOG,
					(errmsg("duration: %s ms", msec_str),
					 errhidestmt(true)));
			break;
		case 2:
			ereport(LOG,
					(errmsg("duration: %s ms  bind %s%s%s: %s",
							msec_str,
							*stmt_name ? stmt_name : "<unnamed>",
							*portal_name ? "/" : "",
							*portal_name ? portal_name : "",
							psrc->query_string),
					 errhidestmt(true),
					 errdetail_params(params)));
			break;
	}

	if (save_log_statement_stats)
		ShowUsage("BIND MESSAGE STATISTICS");

	debug_query_string = NULL;
}

/*
 * exec_execute_message
 *
 * Process an "Execute" message for a portal
 */
static void
1819
exec_execute_message(const char *portal_name, long max_rows)
1820
{
B
Bruce Momjian 已提交
1821
	CommandDest dest;
1822
	DestReceiver *receiver;
1823 1824 1825
	Portal		portal;
	bool		completed;
	char		completionTag[COMPLETION_TAG_BUFSIZE];
1826
	const char *sourceText;
1827
	const char *prepStmtName;
1828
	ParamListInfo portalParams;
1829
	bool		save_log_statement_stats = log_statement_stats;
1830 1831
	bool		is_xact_command;
	bool		execute_is_fetch;
1832 1833
	bool		was_logged = false;
	char		msec_str[32];
1834 1835 1836

	/* Adjust destination to tell printtup.c what to do */
	dest = whereToSendOutput;
1837 1838
	if (dest == DestRemote)
		dest = DestRemoteExecute;
1839 1840 1841

	portal = GetPortalByName(portal_name);
	if (!PortalIsValid(portal))
1842 1843 1844
		ereport(ERROR,
				(errcode(ERRCODE_UNDEFINED_CURSOR),
				 errmsg("portal \"%s\" does not exist", portal_name)));
1845 1846

	/*
B
Bruce Momjian 已提交
1847 1848
	 * If the original query was a null string, just return
	 * EmptyQueryResponse.
1849 1850 1851
	 */
	if (portal->commandTag == NULL)
	{
1852
		Assert(portal->stmts == NIL);
1853 1854 1855 1856
		NullCommand(dest);
		return;
	}

1857
	/* Does the portal contain a transaction command? */
1858
	is_xact_command = IsTransactionStmtList(portal->stmts);
1859

1860
	/*
B
Bruce Momjian 已提交
1861 1862 1863
	 * We must copy the sourceText and prepStmtName into MessageContext in
	 * case the portal is destroyed during finish_xact_command. Can avoid the
	 * copy if it's not an xact command, though.
1864 1865
	 */
	if (is_xact_command)
1866
	{
1867
		sourceText = pstrdup(portal->sourceText);
1868 1869 1870 1871
		if (portal->prepStmtName)
			prepStmtName = pstrdup(portal->prepStmtName);
		else
			prepStmtName = "<unnamed>";
B
Bruce Momjian 已提交
1872

1873 1874 1875 1876 1877 1878
		/*
		 * An xact command shouldn't have any parameters, which is a good
		 * thing because they wouldn't be around after finish_xact_command.
		 */
		portalParams = NULL;
	}
1879 1880
	else
	{
1881 1882 1883
		sourceText = portal->sourceText;
		if (portal->prepStmtName)
			prepStmtName = portal->prepStmtName;
1884
		else
1885 1886
			prepStmtName = "<unnamed>";
		portalParams = portal->portalParams;
1887
	}
1888

1889 1890 1891
	/*
	 * Report query to various monitoring facilities.
	 */
1892
	debug_query_string = sourceText;
1893

1894
	pgstat_report_activity(sourceText);
1895 1896 1897 1898 1899 1900

	set_ps_display(portal->commandTag, false);

	if (save_log_statement_stats)
		ResetUsage();

1901 1902
	BeginCommand(portal->commandTag, dest);

1903
	/*
B
Bruce Momjian 已提交
1904 1905
	 * Create dest receiver in MessageContext (we don't want it in transaction
	 * context, because that may get deleted if portal contains VACUUM).
1906
	 */
1907 1908 1909
	receiver = CreateDestReceiver(dest);
	if (dest == DestRemoteExecute)
		SetRemoteDestReceiverParams(receiver, portal);
1910

1911
	/*
B
Bruce Momjian 已提交
1912 1913
	 * Ensure we are in a transaction command (this should normally be the
	 * case already due to prior BIND).
1914
	 */
1915
	start_xact_command();
1916

1917 1918 1919 1920 1921 1922 1923 1924
	/*
	 * If we re-issue an Execute protocol request against an existing portal,
	 * then we are only fetching more rows rather than completely re-executing
	 * the query from the start. atStart is never reset for a v3 portal, so we
	 * are safe to use this check.
	 */
	execute_is_fetch = !portal->atStart;

1925
	/* Log immediately if dictated by log_statement */
1926
	if (check_log_statement(portal->stmts))
1927 1928
	{
		ereport(LOG,
1929
				(errmsg("%s %s%s%s: %s",
1930
						execute_is_fetch ?
1931 1932
						_("execute fetch from") :
						_("execute"),
1933 1934 1935
						prepStmtName,
						*portal_name ? "/" : "",
						*portal_name ? portal_name : "",
1936
						sourceText),
1937
				 errhidestmt(true),
1938 1939 1940 1941
				 errdetail_params(portalParams)));
		was_logged = true;
	}

1942 1943 1944 1945
	/*
	 * If we are in aborted transaction state, the only portals we can
	 * actually run are those containing COMMIT or ROLLBACK commands.
	 */
1946
	if (IsAbortedTransactionBlockState() &&
1947
		!IsTransactionExitStmtList(portal->stmts))
1948 1949 1950
		ereport(ERROR,
				(errcode(ERRCODE_IN_FAILED_SQL_TRANSACTION),
				 errmsg("current transaction is aborted, "
1951 1952
						"commands ignored until end of transaction block"),
				 errdetail_abort()));
1953 1954 1955 1956 1957 1958 1959 1960 1961 1962 1963 1964

	/* Check for cancel signal before we start execution */
	CHECK_FOR_INTERRUPTS();

	/*
	 * Okay to run the portal.
	 */
	if (max_rows <= 0)
		max_rows = FETCH_ALL;

	completed = PortalRun(portal,
						  max_rows,
B
Bruce Momjian 已提交
1965
						  true, /* always top level */
1966 1967
						  receiver,
						  receiver,
1968 1969
						  completionTag);

1970
	(*receiver->rDestroy) (receiver);
1971

1972 1973
	if (completed)
	{
1974
		if (is_xact_command)
1975 1976
		{
			/*
B
Bruce Momjian 已提交
1977
			 * If this was a transaction control statement, commit it.	We
B
Bruce Momjian 已提交
1978
			 * will start a new xact command for the next command (if any).
1979
			 */
1980
			finish_xact_command();
1981 1982 1983 1984
		}
		else
		{
			/*
B
Bruce Momjian 已提交
1985 1986
			 * We need a CommandCounterIncrement after every query, except
			 * those that start or end a transaction block.
1987 1988 1989 1990 1991 1992 1993 1994 1995 1996
			 */
			CommandCounterIncrement();
		}

		/* Send appropriate CommandComplete to client */
		EndCommand(completionTag, dest);
	}
	else
	{
		/* Portal run not complete, so send PortalSuspended */
1997
		if (whereToSendOutput == DestRemote)
1998 1999 2000
			pq_putemptymessage('s');
	}

2001
	/*
2002
	 * Emit duration logging if appropriate.
2003
	 */
2004
	switch (check_log_duration(msec_str, was_logged))
2005
	{
2006
		case 1:
2007
			ereport(LOG,
2008 2009
					(errmsg("duration: %s ms", msec_str),
					 errhidestmt(true)));
2010 2011
			break;
		case 2:
2012
			ereport(LOG,
2013
					(errmsg("duration: %s ms  %s %s%s%s: %s",
2014 2015 2016 2017 2018 2019 2020
							msec_str,
							execute_is_fetch ?
							_("execute fetch from") :
							_("execute"),
							prepStmtName,
							*portal_name ? "/" : "",
							*portal_name ? portal_name : "",
2021
							sourceText),
2022
					 errhidestmt(true),
2023
					 errdetail_params(portalParams)));
2024
			break;
2025 2026 2027 2028 2029 2030 2031 2032 2033
	}

	if (save_log_statement_stats)
		ShowUsage("EXECUTE MESSAGE STATISTICS");

	debug_query_string = NULL;
}

/*
2034
 * check_log_statement
2035 2036
 *		Determine whether command should be logged because of log_statement
 *
2037 2038
 * parsetree_list can be either raw grammar output or a list of planned
 * statements
2039 2040
 */
static bool
2041
check_log_statement(List *stmt_list)
2042
{
2043
	ListCell   *stmt_item;
2044 2045 2046 2047 2048 2049 2050

	if (log_statement == LOGSTMT_NONE)
		return false;
	if (log_statement == LOGSTMT_ALL)
		return true;

	/* Else we have to inspect the statement(s) to see whether to log */
2051
	foreach(stmt_item, stmt_list)
2052
	{
2053
		Node	   *stmt = (Node *) lfirst(stmt_item);
2054

2055
		if (GetCommandLogLevel(stmt) <= log_statement)
2056 2057 2058 2059 2060 2061 2062 2063 2064 2065
			return true;
	}

	return false;
}

/*
 * check_log_duration
 *		Determine whether current command's duration should be logged
 *
2066 2067 2068 2069 2070
 * Returns:
 *		0 if no logging is needed
 *		1 if just the duration should be logged
 *		2 if duration and query details should be logged
 *
2071 2072
 * If logging is needed, the duration in msec is formatted into msec_str[],
 * which must be a 32-byte buffer.
2073 2074 2075
 *
 * was_logged should be TRUE if caller already logged query details (this
 * essentially prevents 2 from being returned).
2076
 */
2077 2078
int
check_log_duration(char *msec_str, bool was_logged)
2079
{
2080
	if (log_duration || log_min_duration_statement >= 0)
2081
	{
2082 2083 2084
		long		secs;
		int			usecs;
		int			msecs;
2085
		bool		exceeded;
2086

2087 2088 2089 2090
		TimestampDifference(GetCurrentStatementStartTimestamp(),
							GetCurrentTimestamp(),
							&secs, &usecs);
		msecs = usecs / 1000;
2091 2092

		/*
B
Bruce Momjian 已提交
2093 2094 2095
		 * This odd-looking test for log_min_duration_statement being exceeded
		 * is designed to avoid integer overflow with very long durations:
		 * don't compute secs * 1000 until we've verified it will fit in int.
2096
		 */
2097 2098 2099 2100 2101 2102
		exceeded = (log_min_duration_statement == 0 ||
					(log_min_duration_statement > 0 &&
					 (secs > log_min_duration_statement / 1000 ||
					  secs * 1000 + msecs >= log_min_duration_statement)));

		if (exceeded || log_duration)
2103
		{
2104 2105
			snprintf(msec_str, 32, "%ld.%03d",
					 secs * 1000 + msecs, usecs % 1000);
2106 2107 2108 2109
			if (exceeded && !was_logged)
				return 2;
			else
				return 1;
2110
		}
2111 2112
	}

2113
	return 0;
2114
}
2115

2116 2117 2118 2119 2120 2121 2122 2123 2124 2125 2126 2127 2128 2129 2130 2131 2132 2133 2134 2135 2136
/*
 * errdetail_execute
 *
 * Add an errdetail() line showing the query referenced by an EXECUTE, if any.
 * The argument is the raw parsetree list.
 *
 * The list is scanned for ExecuteStmt nodes; the first one whose prepared
 * statement can still be found supplies the detail text, and scanning stops
 * there.  If none is found, no detail is added.
 *
 * The return value is always 0; it exists only so that the call can be
 * written as an argument within an ereport() auxiliary-function list.
 */
static int
errdetail_execute(List *raw_parsetree_list)
{
	ListCell   *parsetree_item;

	foreach(parsetree_item, raw_parsetree_list)
	{
		Node	   *parsetree = (Node *) lfirst(parsetree_item);

		if (IsA(parsetree, ExecuteStmt))
		{
			ExecuteStmt *stmt = (ExecuteStmt *) parsetree;
			PreparedStatement *pstmt;

			/* Lookup with "false": a missing statement yields NULL, no error */
			pstmt = FetchPreparedStatement(stmt->name, false);
			if (pstmt)
			{
				errdetail("prepare: %s", pstmt->plansource->query_string);
				return 0;
			}
		}
	}

	return 0;
}

/*
 * errdetail_params
 *
 * Attach an errdetail() line listing the bind-parameter values, when there
 * are any.  Each parameter is shown as "$n = 'text'" (embedded single quotes
 * doubled) or "$n = NULL".
 *
 * Always returns 0, so it can be used inside an ereport() argument list.
 */
static int
errdetail_params(ParamListInfo params)
{
	StringInfoData text;
	MemoryContext saved_cxt;
	int			idx;

	/*
	 * Nothing to report without parameters.  Also, user-defined I/O functions
	 * must not be called while in an aborted transaction.
	 */
	if (params == NULL || params->numParams <= 0 ||
		IsAbortedTransactionBlockState())
		return 0;

	/* Any garbage produced below should land in MessageContext */
	saved_cxt = MemoryContextSwitchTo(MessageContext);

	initStringInfo(&text);

	for (idx = 0; idx < params->numParams; idx++)
	{
		ParamExternData *param = &params->params[idx];

		appendStringInfo(&text, "%s$%d = ",
						 idx > 0 ? ", " : "",
						 idx + 1);

		if (param->isnull || !OidIsValid(param->ptype))
			appendStringInfoString(&text, "NULL");
		else
		{
			Oid			outfunc;
			bool		is_varlena;
			char	   *rendered;
			char	   *ch;

			getTypeOutputInfo(param->ptype, &outfunc, &is_varlena);
			rendered = OidOutputFunctionCall(outfunc, param->value);

			appendStringInfoCharMacro(&text, '\'');
			for (ch = rendered; *ch != '\0'; ch++)
			{
				/* emit a single quote twice so it reads as an escaped quote */
				if (*ch == '\'')
					appendStringInfoCharMacro(&text, *ch);
				appendStringInfoCharMacro(&text, *ch);
			}
			appendStringInfoCharMacro(&text, '\'');

			pfree(rendered);
		}
	}

	errdetail("parameters: %s", text.data);

	pfree(text.data);

	MemoryContextSwitchTo(saved_cxt);

	return 0;
}

2212 2213 2214 2215 2216 2217 2218 2219 2220 2221 2222 2223 2224 2225
/*
 * errdetail_abort
 *
 * Attach an errdetail() line giving the abort reason when this backend's
 * PGPROC has recoveryConflictPending set; otherwise add nothing.
 *
 * Always returns 0, so it can be used inside an ereport() argument list.
 */
static int
errdetail_abort(void)
{
	if (!MyProc->recoveryConflictPending)
		return 0;

	errdetail("abort reason: recovery conflict");

	return 0;
}

2226 2227 2228 2229 2230 2231 2232 2233 2234 2235 2236
/*
 * errdetail_recovery_conflict
 *
 * Add an errdetail() line showing conflict source.
 */
static int
errdetail_recovery_conflict(void)
{
	switch (RecoveryConflictReason)
	{
		case PROCSIG_RECOVERY_CONFLICT_BUFFERPIN:
B
Bruce Momjian 已提交
2237 2238
			errdetail("User was holding shared buffer pin for too long.");
			break;
2239
		case PROCSIG_RECOVERY_CONFLICT_LOCK:
B
Bruce Momjian 已提交
2240 2241
			errdetail("User was holding a relation lock for too long.");
			break;
2242
		case PROCSIG_RECOVERY_CONFLICT_TABLESPACE:
P
Peter Eisentraut 已提交
2243
			errdetail("User was or might have been using tablespace that must be dropped.");
B
Bruce Momjian 已提交
2244
			break;
2245
		case PROCSIG_RECOVERY_CONFLICT_SNAPSHOT:
B
Bruce Momjian 已提交
2246 2247
			errdetail("User query might have needed to see row versions that must be removed.");
			break;
2248
		case PROCSIG_RECOVERY_CONFLICT_STARTUP_DEADLOCK:
B
Bruce Momjian 已提交
2249 2250
			errdetail("User transaction caused buffer deadlock with recovery.");
			break;
2251
		case PROCSIG_RECOVERY_CONFLICT_DATABASE:
B
Bruce Momjian 已提交
2252 2253
			errdetail("User was connected to a database that must be dropped.");
			break;
2254
		default:
B
Bruce Momjian 已提交
2255 2256
			break;
			/* no errdetail */
2257 2258 2259 2260 2261
	}

	return 0;
}

2262 2263 2264 2265 2266 2267 2268 2269
/*
 * exec_describe_statement_message
 *
 * Process a "Describe" message for a prepared statement
 */
static void
exec_describe_statement_message(const char *stmt_name)
{
2270
	CachedPlanSource *psrc;
2271
	StringInfoData buf;
2272
	int			i;
2273

2274 2275 2276 2277
	/*
	 * Start up a transaction command. (Note that this will normally change
	 * current memory context.) Nothing happens if we are already in one.
	 */
2278
	start_xact_command();
2279 2280 2281 2282

	/* Switch back to message context */
	MemoryContextSwitchTo(MessageContext);

2283 2284
	/* Find prepared statement */
	if (stmt_name[0] != '\0')
2285 2286 2287
	{
		PreparedStatement *pstmt;

2288
		pstmt = FetchPreparedStatement(stmt_name, true);
2289 2290
		psrc = pstmt->plansource;
	}
2291 2292 2293
	else
	{
		/* special-case the unnamed statement */
2294 2295
		psrc = unnamed_stmt_psrc;
		if (!psrc)
2296 2297
			ereport(ERROR,
					(errcode(ERRCODE_UNDEFINED_PSTATEMENT),
B
Bruce Momjian 已提交
2298
					 errmsg("unnamed prepared statement does not exist")));
2299 2300
	}

2301 2302 2303
	/* Prepared statements shouldn't have changeable result descs */
	Assert(psrc->fixed_result);

2304
	/*
2305
	 * If we are in aborted transaction state, we can't run
B
Bruce Momjian 已提交
2306 2307
	 * SendRowDescriptionMessage(), because that needs catalog accesses. (We
	 * can't do RevalidateCachedPlan, either, but that's a lesser problem.)
2308 2309 2310 2311 2312
	 * Hence, refuse to Describe statements that return data.  (We shouldn't
	 * just refuse all Describes, since that might break the ability of some
	 * clients to issue COMMIT or ROLLBACK commands, if they use code that
	 * blindly Describes whatever it does.)  We can Describe parameters
	 * without doing anything dangerous, so we don't restrict that.
2313 2314
	 */
	if (IsAbortedTransactionBlockState() &&
2315
		psrc->resultDesc)
2316 2317 2318
		ereport(ERROR,
				(errcode(ERRCODE_IN_FAILED_SQL_TRANSACTION),
				 errmsg("current transaction is aborted, "
2319 2320
						"commands ignored until end of transaction block"),
				 errdetail_abort()));
2321

2322
	if (whereToSendOutput != DestRemote)
2323 2324
		return;					/* can't actually do anything... */

2325 2326 2327
	/*
	 * First describe the parameters...
	 */
B
Bruce Momjian 已提交
2328
	pq_beginmessage(&buf, 't'); /* parameter description message type */
2329
	pq_sendint(&buf, psrc->num_params, 2);
2330

2331
	for (i = 0; i < psrc->num_params; i++)
2332
	{
2333
		Oid			ptype = psrc->param_types[i];
2334 2335 2336 2337

		pq_sendint(&buf, (int) ptype, 4);
	}
	pq_endmessage(&buf);
2338 2339 2340 2341

	/*
	 * Next send RowDescription or NoData to describe the result...
	 */
2342 2343 2344 2345 2346 2347 2348 2349 2350 2351 2352 2353 2354 2355 2356
	if (psrc->resultDesc)
	{
		CachedPlan *cplan;
		List	   *tlist;

		/* Make sure the plan is up to date */
		cplan = RevalidateCachedPlan(psrc, true);

		/* Get the primary statement and find out what it returns */
		tlist = FetchStatementTargetList(PortalListGetPrimaryStmt(cplan->stmt_list));

		SendRowDescriptionMessage(psrc->resultDesc, tlist, NULL);

		ReleaseCachedPlan(cplan, true);
	}
2357 2358 2359
	else
		pq_putemptymessage('n');	/* NoData */

2360 2361 2362 2363 2364 2365 2366 2367 2368 2369 2370 2371
}

/*
 * exec_describe_portal_message
 *
 * Process a "Describe" message for a portal
 */
static void
exec_describe_portal_message(const char *portal_name)
{
	Portal		portal;

2372 2373 2374 2375
	/*
	 * Start up a transaction command. (Note that this will normally change
	 * current memory context.) Nothing happens if we are already in one.
	 */
2376
	start_xact_command();
2377 2378 2379 2380

	/* Switch back to message context */
	MemoryContextSwitchTo(MessageContext);

2381 2382
	portal = GetPortalByName(portal_name);
	if (!PortalIsValid(portal))
2383 2384 2385
		ereport(ERROR,
				(errcode(ERRCODE_UNDEFINED_CURSOR),
				 errmsg("portal \"%s\" does not exist", portal_name)));
2386

2387 2388 2389
	/*
	 * If we are in aborted transaction state, we can't run
	 * SendRowDescriptionMessage(), because that needs catalog accesses.
B
Bruce Momjian 已提交
2390
	 * Hence, refuse to Describe portals that return data.	(We shouldn't just
2391 2392 2393 2394 2395 2396 2397 2398 2399
	 * refuse all Describes, since that might break the ability of some
	 * clients to issue COMMIT or ROLLBACK commands, if they use code that
	 * blindly Describes whatever it does.)
	 */
	if (IsAbortedTransactionBlockState() &&
		portal->tupDesc)
		ereport(ERROR,
				(errcode(ERRCODE_IN_FAILED_SQL_TRANSACTION),
				 errmsg("current transaction is aborted, "
2400 2401
						"commands ignored until end of transaction block"),
				 errdetail_abort()));
2402

2403
	if (whereToSendOutput != DestRemote)
2404 2405 2406
		return;					/* can't actually do anything... */

	if (portal->tupDesc)
2407 2408
		SendRowDescriptionMessage(portal->tupDesc,
								  FetchPortalTargetList(portal),
2409
								  portal->formats);
2410 2411 2412 2413 2414
	else
		pq_putemptymessage('n');	/* NoData */
}


2415
/*
2416
 * Convenience routines for starting/committing a single command.
2417 2418
 */
static void
2419
start_xact_command(void)
2420
{
2421
	if (!xact_started)
2422
	{
2423 2424 2425
		ereport(DEBUG3,
				(errmsg_internal("StartTransactionCommand")));
		StartTransactionCommand();
2426 2427

		/* Set statement timeout running, if any */
2428
		/* NB: this mustn't be enabled until we are within an xact */
2429 2430
		if (StatementTimeout > 0)
			enable_sig_alarm(StatementTimeout, true);
2431 2432
		else
			cancel_from_timeout = false;
B
Bruce Momjian 已提交
2433

2434 2435 2436 2437 2438 2439 2440 2441 2442
		xact_started = true;
	}
}

static void
finish_xact_command(void)
{
	if (xact_started)
	{
2443 2444 2445 2446
		/* Cancel any active statement timeout before committing */
		disable_sig_alarm(true);

		/* Now commit the command */
2447 2448
		ereport(DEBUG3,
				(errmsg_internal("CommitTransactionCommand")));
2449

2450
		CommitTransactionCommand();
2451

2452 2453 2454 2455 2456 2457
#ifdef MEMORY_CONTEXT_CHECKING
		/* Check all memory contexts that weren't freed during commit */
		/* (those that were, were checked before being deleted) */
		MemoryContextCheck(TopMemoryContext);
#endif

2458
#ifdef SHOW_MEMORY_STATS
2459
		/* Print mem stats after each commit for leak tracking */
2460
		MemoryContextStats(TopMemoryContext);
2461
#endif
2462 2463 2464

		xact_started = false;
	}
2465 2466 2467
}


2468 2469 2470 2471 2472
/*
 * Convenience routines for checking whether a statement is one of the
 * ones that we allow in transaction-aborted state.
 */

2473
/* Test a bare parsetree */
2474 2475 2476 2477 2478 2479 2480 2481 2482 2483 2484 2485 2486 2487 2488 2489
static bool
IsTransactionExitStmt(Node *parsetree)
{
	if (parsetree && IsA(parsetree, TransactionStmt))
	{
		TransactionStmt *stmt = (TransactionStmt *) parsetree;

		if (stmt->kind == TRANS_STMT_COMMIT ||
			stmt->kind == TRANS_STMT_PREPARE ||
			stmt->kind == TRANS_STMT_ROLLBACK ||
			stmt->kind == TRANS_STMT_ROLLBACK_TO)
			return true;
	}
	return false;
}

2490
/* Test a list that might contain Query nodes or bare parsetrees */
2491 2492 2493 2494 2495
static bool
IsTransactionExitStmtList(List *parseTrees)
{
	if (list_length(parseTrees) == 1)
	{
2496 2497 2498 2499 2500
		Node	   *stmt = (Node *) linitial(parseTrees);

		if (IsA(stmt, Query))
		{
			Query	   *query = (Query *) stmt;
2501

2502 2503 2504 2505 2506
			if (query->commandType == CMD_UTILITY &&
				IsTransactionExitStmt(query->utilityStmt))
				return true;
		}
		else if (IsTransactionExitStmt(stmt))
2507 2508 2509 2510 2511
			return true;
	}
	return false;
}

2512
/* Test a list that might contain Query nodes or bare parsetrees */
2513 2514 2515 2516 2517
static bool
IsTransactionStmtList(List *parseTrees)
{
	if (list_length(parseTrees) == 1)
	{
2518
		Node	   *stmt = (Node *) linitial(parseTrees);
2519

2520 2521 2522 2523 2524 2525 2526 2527 2528
		if (IsA(stmt, Query))
		{
			Query	   *query = (Query *) stmt;

			if (query->commandType == CMD_UTILITY &&
				IsA(query->utilityStmt, TransactionStmt))
				return true;
		}
		else if (IsA(stmt, TransactionStmt))
2529 2530 2531 2532 2533
			return true;
	}
	return false;
}

2534 2535 2536 2537 2538 2539 2540 2541
/*
 * Release any existing unnamed prepared statement, along with any memory
 * context left over from a failed attempt to build one.
 */
static void
drop_unnamed_stmt(void)
{
	/* A completed unnamed statement lives in the plan cache */
	if (unnamed_stmt_psrc != NULL)
	{
		DropCachedPlan(unnamed_stmt_psrc);
		unnamed_stmt_psrc = NULL;
	}

	/*
	 * A failure while building an earlier unnamed statement can leave behind
	 * a memory context that never got attached to a completed plancache
	 * entry.  Delete it here, or it would be leaked permanently.
	 */
	if (unnamed_stmt_context != NULL)
	{
		MemoryContextDelete(unnamed_stmt_context);
		unnamed_stmt_context = NULL;
	}
}

2553

2554
/* --------------------------------
2555
 *		signal handler routines used in PostgresMain()
2556 2557 2558
 * --------------------------------
 */

2559
/*
T
Tom Lane 已提交
2560
 * quickdie() occurs when signalled SIGQUIT by the postmaster.
2561 2562 2563 2564
 *
 * Some backend has bought the farm,
 * so we need to stop what we're doing and exit.
 */
T
Tom Lane 已提交
2565
void
2566
quickdie(SIGNAL_ARGS)
2567
{
B
Bruce Momjian 已提交
2568
	sigaddset(&BlockSig, SIGQUIT);		/* prevent nested calls */
2569
	PG_SETMASK(&BlockSig);
B
Bruce Momjian 已提交
2570

2571 2572
	/*
	 * If we're aborting out of client auth, don't risk trying to send
B
Bruce Momjian 已提交
2573 2574 2575
	 * anything to the client; we will likely violate the protocol, not to
	 * mention that we may have interrupted the guts of OpenSSL or some
	 * authentication library.
2576 2577 2578 2579
	 */
	if (ClientAuthInProgress && whereToSendOutput == DestRemote)
		whereToSendOutput = DestNone;

2580
	/*
B
Bruce Momjian 已提交
2581 2582
	 * Ideally this should be ereport(FATAL), but then we'd not get control
	 * back...
2583 2584 2585
	 */
	ereport(WARNING,
			(errcode(ERRCODE_CRASH_SHUTDOWN),
B
Bruce Momjian 已提交
2586
			 errmsg("terminating connection because of crash of another server process"),
B
Bruce Momjian 已提交
2587 2588 2589 2590
	errdetail("The postmaster has commanded this server process to roll back"
			  " the current transaction and exit, because another"
			  " server process exited abnormally and possibly corrupted"
			  " shared memory."),
2591
			 errhint("In a moment you should be able to reconnect to the"
2592
					 " database and repeat your command.")));
B
Bruce Momjian 已提交
2593

2594
	/*
2595 2596 2597 2598 2599 2600 2601 2602 2603 2604
	 * We DO NOT want to run proc_exit() callbacks -- we're here because
	 * shared memory may be corrupted, so we don't want to try to clean up our
	 * transaction.  Just nail the windows shut and get out of town.  Now that
	 * there's an atexit callback to prevent third-party code from breaking
	 * things by calling exit() directly, we have to reset the callbacks
	 * explicitly to make this work as intended.
	 */
	on_exit_reset();

	/*
2605
	 * Note we do exit(2) not exit(0).	This is to force the postmaster into a
B
Bruce Momjian 已提交
2606 2607
	 * system reset cycle if some idiot DBA sends a manual SIGQUIT to a random
	 * backend.  This is necessary precisely because we don't clean up our
2608
	 * shared memory state.  (The "dead man switch" mechanism in pmsignal.c
2609 2610
	 * should ensure the postmaster sees this as a crash, too, but no harm in
	 * being doubly sure.)
2611
	 */
2612
	exit(2);
2613 2614
}

2615
/*
2616 2617
 * Shutdown signal from postmaster: abort transaction and exit
 * at soonest convenient time
2618
 */
2619
void
2620
die(SIGNAL_ARGS)
2621
{
2622 2623 2624
	int			save_errno = errno;

	/* Don't joggle the elbow of proc_exit */
B
Bruce Momjian 已提交
2625
	if (!proc_exit_inprogress)
2626
	{
2627
		InterruptPending = true;
2628
		ProcDiePending = true;
B
Bruce Momjian 已提交
2629

2630
		/*
B
Bruce Momjian 已提交
2631 2632
		 * If it's safe to interrupt, and we're waiting for input or a lock,
		 * service the interrupt immediately
2633
		 */
2634 2635
		if (ImmediateInterruptOK && InterruptHoldoffCount == 0 &&
			CritSectionCount == 0)
2636
		{
2637 2638 2639
			/* bump holdoff count to make ProcessInterrupts() a no-op */
			/* until we are done getting ready for it */
			InterruptHoldoffCount++;
2640
			LockWaitCancel();	/* prevent CheckDeadLock from running */
2641
			DisableNotifyInterrupt();
2642
			DisableCatchupInterrupt();
2643
			InterruptHoldoffCount--;
2644 2645
			ProcessInterrupts();
		}
2646 2647 2648

		/* Interrupt any sync rep wait which is currently in progress. */
		SetLatch(&(MyProc->waitLatch));
2649
	}
2650 2651

	errno = save_errno;
2652 2653
}

2654
/*
2655 2656
 * Query-cancel signal from postmaster: abort current transaction
 * at soonest convenient time
2657
 */
2658
void
2659
StatementCancelHandler(SIGNAL_ARGS)
2660
{
2661 2662
	int			save_errno = errno;

B
Bruce Momjian 已提交
2663
	/*
2664
	 * Don't joggle the elbow of proc_exit
B
Bruce Momjian 已提交
2665
	 */
2666
	if (!proc_exit_inprogress)
2667
	{
2668 2669
		InterruptPending = true;
		QueryCancelPending = true;
B
Bruce Momjian 已提交
2670

2671
		/*
2672 2673
		 * If it's safe to interrupt, and we're waiting for input or a lock,
		 * service the interrupt immediately
2674
		 */
2675 2676
		if (ImmediateInterruptOK && InterruptHoldoffCount == 0 &&
			CritSectionCount == 0)
2677
		{
2678 2679 2680
			/* bump holdoff count to make ProcessInterrupts() a no-op */
			/* until we are done getting ready for it */
			InterruptHoldoffCount++;
2681 2682 2683 2684 2685
			LockWaitCancel();	/* prevent CheckDeadLock from running */
			DisableNotifyInterrupt();
			DisableCatchupInterrupt();
			InterruptHoldoffCount--;
			ProcessInterrupts();
2686
		}
2687 2688 2689

		/* Interrupt any sync rep wait which is currently in progress. */
		SetLatch(&(MyProc->waitLatch));
2690 2691
	}

2692
	errno = save_errno;
2693 2694
}

2695
/* signal handler for floating point exception */
2696
void
2697 2698
FloatExceptionHandler(SIGNAL_ARGS)
{
2699 2700 2701
	ereport(ERROR,
			(errcode(ERRCODE_FLOATING_POINT_EXCEPTION),
			 errmsg("floating-point exception"),
B
Bruce Momjian 已提交
2702 2703 2704
			 errdetail("An invalid floating-point operation was signaled. "
					   "This probably means an out-of-range result or an "
					   "invalid operation, such as division by zero.")));
2705 2706
}

2707
/* SIGHUP: set flag to re-read config file at next convenient time */
2708
static void
2709
SigHupHandler(SIGNAL_ARGS)
2710
{
2711
	got_SIGHUP = true;
2712 2713
}

2714 2715
/*
 * RecoveryConflictInterrupt: out-of-line portion of recovery conflict
 * handling following receipt of SIGUSR1.  Designed to be similar to die()
 * and StatementCancelHandler().  Called only by a normal user backend
 * that begins a transaction during recovery.
 *
 * Depending on the conflict reason and the transaction state, the conflict
 * is ignored, turned into a query cancel, or turned into session
 * termination.  The switch below relies on deliberate fall-through from the
 * more specific reasons into the more general handling.
 */
void
RecoveryConflictInterrupt(ProcSignalReason reason)
{
	int			save_errno = errno;

	/* Don't joggle the elbow of proc_exit */
	if (proc_exit_inprogress)
	{
		errno = save_errno;
		return;
	}

	RecoveryConflictReason = reason;

	switch (reason)
	{
		case PROCSIG_RECOVERY_CONFLICT_STARTUP_DEADLOCK:

			/* Not waiting for a lock means we cannot be deadlocked */
			if (!IsWaitingForLock())
				return;

			/* Intentional drop through to check wait for pin */

		case PROCSIG_RECOVERY_CONFLICT_BUFFERPIN:

			/* Nothing more to do unless we block the Startup process */
			if (!HoldingBufferPinThatDelaysRecovery())
				return;

			MyProc->recoveryConflictPending = true;

			/* Intentional drop through to error handling */

		case PROCSIG_RECOVERY_CONFLICT_LOCK:
		case PROCSIG_RECOVERY_CONFLICT_TABLESPACE:
		case PROCSIG_RECOVERY_CONFLICT_SNAPSHOT:

			/* Ignore the conflict if we are no longer in a transaction */
			if (!IsTransactionOrTransactionBlock())
				return;

			/*
			 * When only the current (top-level) transaction needs to be
			 * aborted, an ERROR is enough to resolve the conflict.
			 * Otherwise control drops through to the FATAL case.
			 *
			 * XXX there *may* be further situations where an ERROR would
			 * suffice:
			 *
			 * PROCSIG_RECOVERY_CONFLICT_LOCK if no locks are held in parent
			 * transactions
			 *
			 * PROCSIG_RECOVERY_CONFLICT_SNAPSHOT if no snapshots are held by
			 * parent transactions and the transaction is not
			 * transaction-snapshot mode
			 *
			 * PROCSIG_RECOVERY_CONFLICT_TABLESPACE if no temp files or
			 * cursors open in parent transactions
			 */
			if (!IsSubTransaction())
			{
				/*
				 * An already-aborted transaction needs no cancel.  The test
				 * is made here, not earlier, because aborted subtransactions
				 * must not be ignored: they currently have to cause FATAL.
				 */
				if (IsAbortedTransactionBlockState())
					return;

				RecoveryConflictPending = true;
				QueryCancelPending = true;
				InterruptPending = true;
				break;
			}

			/* Intentional drop through to session cancel */

		case PROCSIG_RECOVERY_CONFLICT_DATABASE:
			RecoveryConflictPending = true;
			ProcDiePending = true;
			InterruptPending = true;
			break;

		default:
			elog(FATAL, "unrecognized conflict mode: %d",
				 (int) reason);
	}

	Assert(RecoveryConflictPending && (QueryCancelPending || ProcDiePending));

	/*
	 * Every conflict except the database one is a dynamic error: the command
	 * or transaction can be retried later with some chance of success.  The
	 * flag never needs resetting, because non-retryable conflict errors are
	 * currently FATAL.
	 */
	if (reason == PROCSIG_RECOVERY_CONFLICT_DATABASE)
		RecoveryConflictRetryable = false;

	/*
	 * If it's safe to interrupt, and we're waiting for input or a lock,
	 * service the interrupt immediately
	 */
	if (ImmediateInterruptOK && InterruptHoldoffCount == 0 &&
		CritSectionCount == 0)
	{
		/*
		 * Raise the holdoff count so ProcessInterrupts() stays a no-op until
		 * the preparations below are complete.
		 */
		InterruptHoldoffCount++;
		LockWaitCancel();		/* prevent CheckDeadLock from running */
		DisableNotifyInterrupt();
		DisableCatchupInterrupt();
		InterruptHoldoffCount--;
		ProcessInterrupts();
	}

	errno = save_errno;
}
2842

2843 2844 2845 2846 2847 2848 2849 2850 2851 2852
/*
 * ProcessInterrupts: out-of-line portion of CHECK_FOR_INTERRUPTS() macro
 *
 * If an interrupt condition is pending, and it's safe to service it,
 * then clear the flag and accept the interrupt.  Called only when
 * InterruptPending is true.
 */
void
ProcessInterrupts(void)
{
2853 2854
	/* OK to accept interrupt now? */
	if (InterruptHoldoffCount != 0 || CritSectionCount != 0)
2855 2856 2857 2858 2859
		return;
	InterruptPending = false;
	if (ProcDiePending)
	{
		ProcDiePending = false;
B
Bruce Momjian 已提交
2860 2861
		QueryCancelPending = false;		/* ProcDie trumps QueryCancel */
		ImmediateInterruptOK = false;	/* not idle anymore */
2862
		DisableNotifyInterrupt();
2863
		DisableCatchupInterrupt();
2864 2865 2866
		/* As in quickdie, don't risk sending to client during auth */
		if (ClientAuthInProgress && whereToSendOutput == DestRemote)
			whereToSendOutput = DestNone;
2867 2868 2869 2870
		if (IsAutoVacuumWorkerProcess())
			ereport(FATAL,
					(errcode(ERRCODE_ADMIN_SHUTDOWN),
					 errmsg("terminating autovacuum process due to administrator command")));
2871
		else if (RecoveryConflictPending && RecoveryConflictRetryable)
2872 2873
		{
			pgstat_report_recovery_conflict(RecoveryConflictReason);
2874 2875 2876 2877
			ereport(FATAL,
					(errcode(ERRCODE_T_R_SERIALIZATION_FAILURE),
			  errmsg("terminating connection due to conflict with recovery"),
					 errdetail_recovery_conflict()));
2878
		}
2879
		else if (RecoveryConflictPending)
2880
		{
2881 2882
			/* Currently there is only one non-retryable recovery conflict */
			Assert(RecoveryConflictReason == PROCSIG_RECOVERY_CONFLICT_DATABASE);
2883
			pgstat_report_recovery_conflict(RecoveryConflictReason);
2884
			ereport(FATAL,
2885
					(errcode(ERRCODE_DATABASE_DROPPED),
B
Bruce Momjian 已提交
2886
			  errmsg("terminating connection due to conflict with recovery"),
2887
					 errdetail_recovery_conflict()));
2888
		}
2889 2890 2891
		else
			ereport(FATAL,
					(errcode(ERRCODE_ADMIN_SHUTDOWN),
B
Bruce Momjian 已提交
2892
			 errmsg("terminating connection due to administrator command")));
2893 2894 2895 2896
	}
	if (QueryCancelPending)
	{
		QueryCancelPending = false;
2897
		if (ClientAuthInProgress)
2898
		{
B
Bruce Momjian 已提交
2899
			ImmediateInterruptOK = false;		/* not idle anymore */
2900 2901 2902 2903 2904
			DisableNotifyInterrupt();
			DisableCatchupInterrupt();
			/* As in quickdie, don't risk sending to client during auth */
			if (whereToSendOutput == DestRemote)
				whereToSendOutput = DestNone;
2905 2906 2907
			ereport(ERROR,
					(errcode(ERRCODE_QUERY_CANCELED),
					 errmsg("canceling authentication due to timeout")));
2908 2909 2910
		}
		if (cancel_from_timeout)
		{
B
Bruce Momjian 已提交
2911
			ImmediateInterruptOK = false;		/* not idle anymore */
2912 2913
			DisableNotifyInterrupt();
			DisableCatchupInterrupt();
2914 2915 2916
			ereport(ERROR,
					(errcode(ERRCODE_QUERY_CANCELED),
					 errmsg("canceling statement due to statement timeout")));
2917 2918 2919
		}
		if (IsAutoVacuumWorkerProcess())
		{
B
Bruce Momjian 已提交
2920
			ImmediateInterruptOK = false;		/* not idle anymore */
2921 2922
			DisableNotifyInterrupt();
			DisableCatchupInterrupt();
2923 2924 2925
			ereport(ERROR,
					(errcode(ERRCODE_QUERY_CANCELED),
					 errmsg("canceling autovacuum task")));
2926
		}
2927
		if (RecoveryConflictPending)
2928
		{
B
Bruce Momjian 已提交
2929
			ImmediateInterruptOK = false;		/* not idle anymore */
2930
			RecoveryConflictPending = false;
2931 2932
			DisableNotifyInterrupt();
			DisableCatchupInterrupt();
2933
			pgstat_report_recovery_conflict(RecoveryConflictReason);
2934 2935
			if (DoingCommandRead)
				ereport(FATAL,
2936
						(errcode(ERRCODE_T_R_SERIALIZATION_FAILURE),
2937 2938
						 errmsg("terminating connection due to conflict with recovery"),
						 errdetail_recovery_conflict(),
B
Bruce Momjian 已提交
2939 2940
				 errhint("In a moment you should be able to reconnect to the"
						 " database and repeat your command.")));
2941 2942
			else
				ereport(ERROR,
2943
						(errcode(ERRCODE_T_R_SERIALIZATION_FAILURE),
B
Bruce Momjian 已提交
2944
				 errmsg("canceling statement due to conflict with recovery"),
2945
						 errdetail_recovery_conflict()));
2946
		}
2947

2948
		/*
B
Bruce Momjian 已提交
2949 2950 2951
		 * If we are reading a command from the client, just ignore the cancel
		 * request --- sending an extra error message won't accomplish
		 * anything.  Otherwise, go ahead and throw the error.
2952 2953 2954
		 */
		if (!DoingCommandRead)
		{
B
Bruce Momjian 已提交
2955
			ImmediateInterruptOK = false;		/* not idle anymore */
2956 2957
			DisableNotifyInterrupt();
			DisableCatchupInterrupt();
2958 2959 2960
			ereport(ERROR,
					(errcode(ERRCODE_QUERY_CANCELED),
					 errmsg("canceling statement due to user request")));
2961
		}
2962 2963 2964 2965
	}
	/* If we get here, do nothing (probably, QueryCancelPending was reset) */
}

2966

2967 2968 2969
/*
 * IA64-specific code to fetch the AR.BSP register for stack depth checks.
 *
 * Three variants are provided: a macro built on _Asm_mov_from_ar for HP-UX
 * when neither gcc nor the Intel compiler is in use, __getReg for the Intel
 * compiler, and gcc-style inline assembly for everything else.
 */
#if defined(__ia64__) || defined(__ia64)

#if defined(__hpux) && !defined(__GNUC__) && !defined __INTEL_COMPILER
#include <ia64/sys/inline.h>
#define ia64_get_bsp() ((char *) (_Asm_mov_from_ar(_AREG_BSP, _NO_FENCE)))
#else

#ifdef __INTEL_COMPILER
#include <asm/ia64regs.h>
#endif

static __inline__ char *
ia64_get_bsp(void)
{
	char	   *bsp;

#ifdef __INTEL_COMPILER
	bsp = (char *) __getReg(_IA64_REG_AR_BSP);
#else
	/* the ;; is a "stop", seems to be required before fetching BSP */
	__asm__ __volatile__(
						 ";;\n"
						 "	mov	%0=ar.bsp	\n"
						 : "=r"(bsp));
#endif
	return bsp;
}
#endif
#endif   /* IA64 */
3001 3002


3003 3004 3005 3006 3007 3008
/*
 * check_stack_depth: check for excessively deep recursion
 *
 * This should be called someplace in any recursive routine that might possibly
 * recurse deep enough to overflow the stack.  Most Unixen treat stack
 * overflow as an unrecoverable SIGSEGV, so we want to error out ourselves
3009
 * before hitting the hardware limit.
3010 3011 3012 3013
 */
void
check_stack_depth(void)
{
B
Bruce Momjian 已提交
3014
	char		stack_top_loc;
3015
	long		stack_depth;
3016 3017 3018 3019

	/*
	 * Compute distance from PostgresMain's local variables to my own
	 */
3020
	stack_depth = (long) (stack_base_ptr - &stack_top_loc);
B
Bruce Momjian 已提交
3021

3022
	/*
B
Bruce Momjian 已提交
3023
	 * Take abs value, since stacks grow up on some machines, down on others
3024 3025 3026
	 */
	if (stack_depth < 0)
		stack_depth = -stack_depth;
B
Bruce Momjian 已提交
3027

3028 3029 3030
	/*
	 * Trouble?
	 *
3031 3032 3033 3034
	 * The test on stack_base_ptr prevents us from erroring out if called
	 * during process setup or in a non-backend process.  Logically it should
	 * be done first, but putting it here avoids wasting cycles during normal
	 * cases.
3035 3036 3037 3038 3039 3040 3041
	 */
	if (stack_depth > max_stack_depth_bytes &&
		stack_base_ptr != NULL)
	{
		ereport(ERROR,
				(errcode(ERRCODE_STATEMENT_TOO_COMPLEX),
				 errmsg("stack depth limit exceeded"),
3042
				 errhint("Increase the configuration parameter \"max_stack_depth\" (currently %dkB), "
3043
			  "after ensuring the platform's stack depth limit is adequate.",
3044
						 max_stack_depth)));
3045
	}
3046 3047 3048 3049 3050 3051 3052 3053 3054 3055 3056 3057 3058 3059 3060 3061 3062 3063 3064

	/*
	 * On IA64 there is a separate "register" stack that requires its own
	 * independent check.  For this, we have to measure the change in the
	 * "BSP" pointer from PostgresMain to here.  Logic is just as above,
	 * except that we know IA64's register stack grows up.
	 *
	 * Note we assume that the same max_stack_depth applies to both stacks.
	 */
#if defined(__ia64__) || defined(__ia64)
	stack_depth = (long) (ia64_get_bsp() - register_stack_base_ptr);

	if (stack_depth > max_stack_depth_bytes &&
		register_stack_base_ptr != NULL)
	{
		ereport(ERROR,
				(errcode(ERRCODE_STATEMENT_TOO_COMPLEX),
				 errmsg("stack depth limit exceeded"),
				 errhint("Increase the configuration parameter \"max_stack_depth\" (currently %dkB), "
3065
			  "after ensuring the platform's stack depth limit is adequate.",
3066 3067
						 max_stack_depth)));
	}
3068
#endif   /* IA64 */
3069 3070
}

3071
/* GUC check hook for max_stack_depth */
3072
bool
3073
check_max_stack_depth(int *newval, void **extra, GucSource source)
3074
{
3075
	long		newval_bytes = *newval * 1024L;
3076 3077 3078 3079
	long		stack_rlimit = get_stack_depth_rlimit();

	if (stack_rlimit > 0 && newval_bytes > stack_rlimit - STACK_DEPTH_SLOP)
	{
3080 3081 3082
		GUC_check_errdetail("\"max_stack_depth\" must not exceed %ldkB.",
							(stack_rlimit - STACK_DEPTH_SLOP) / 1024L);
		GUC_check_errhint("Increase the platform's stack depth limit via \"ulimit -s\" or local equivalent.");
3083 3084
		return false;
	}
3085 3086 3087
	return true;
}

3088 3089 3090 3091 3092 3093 3094 3095 3096
/*
 * assign_max_stack_depth --- GUC assign hook for max_stack_depth
 *
 * newval is given in kilobytes; the byte-denominated copy kept in
 * max_stack_depth_bytes is updated to match.  extra is unused.
 */
void
assign_max_stack_depth(int newval, void *extra)
{
	/* 1024L forces the multiplication to be done in long arithmetic */
	max_stack_depth_bytes = newval * 1024L;
}

3097

3098 3099 3100 3101 3102 3103 3104 3105 3106 3107 3108 3109 3110 3111 3112 3113 3114 3115 3116 3117 3118 3119 3120 3121 3122 3123 3124 3125 3126 3127 3128 3129 3130 3131 3132
/*
 * set_debug_options --- apply "-d N" command line option
 *
 * Setting -d differs from simply setting log_min_messages, because higher
 * levels also switch on additional logging and debug-print settings.
 *
 * debug_flag is the requested level; context and source are passed through
 * unchanged to every SetConfigOption() call.
 */
void
set_debug_options(int debug_flag, GucContext context, GucSource source)
{
	/* Settings that are switched on once debug_flag reaches min_level */
	static const struct
	{
		int			min_level;
		const char *name;
		const char *value;
	}			level_settings[] =
	{
		{2, "log_statement", "all"},
		{3, "debug_print_parse", "true"},
		{4, "debug_print_plan", "true"},
		{5, "debug_print_rewritten", "true"}
	};
	const int	nsettings = (int) (sizeof(level_settings) / sizeof(level_settings[0]));
	char		levelbuf[64];
	const char *min_messages = "notice";
	int			idx;

	/* A positive level maps to "debugN"; anything else means "notice" */
	if (debug_flag > 0)
	{
		snprintf(levelbuf, sizeof(levelbuf), "debug%d", debug_flag);
		min_messages = levelbuf;
	}
	SetConfigOption("log_min_messages", min_messages, context, source);

	/* Connection logging is only touched in postmaster context */
	if (debug_flag >= 1 && context == PGC_POSTMASTER)
	{
		SetConfigOption("log_connections", "true", context, source);
		SetConfigOption("log_disconnections", "true", context, source);
	}

	for (idx = 0; idx < nsettings; idx++)
	{
		if (debug_flag >= level_settings[idx].min_level)
			SetConfigOption(level_settings[idx].name,
							level_settings[idx].value,
							context, source);
	}
}


3133 3134 3135
/*
 * set_plan_disabling_options --- apply a plan-type-disabling switch
 *
 * The first character of arg selects one of the enable_* settings, which
 * is then set to "false" using the given context and source.
 *
 * Returns true if the letter was recognized and the setting applied;
 * returns false, without changing anything, for any other letter.
 */
bool
set_plan_disabling_options(const char *arg, GucContext context, GucSource source)
{
	const char *guc_name;

	switch (arg[0])
	{
		case 's':				/* seqscan */
			guc_name = "enable_seqscan";
			break;
		case 'i':				/* indexscan */
			guc_name = "enable_indexscan";
			break;
		case 'b':				/* bitmapscan */
			guc_name = "enable_bitmapscan";
			break;
		case 't':				/* tidscan */
			guc_name = "enable_tidscan";
			break;
		case 'n':				/* nestloop */
			guc_name = "enable_nestloop";
			break;
		case 'm':				/* mergejoin */
			guc_name = "enable_mergejoin";
			break;
		case 'h':				/* hashjoin */
			guc_name = "enable_hashjoin";
			break;
		default:				/* unrecognized plan type letter */
			return false;
	}

	SetConfigOption(guc_name, "false", context, source);
	return true;
}


/*
 * get_stats_option_name --- map a statistics switch argument to a GUC name
 *
 * Only the leading characters of arg are examined:
 *		"pa..."		-> log_parser_stats
 *		"pl..."		-> log_planner_stats
 *		"e..."		-> log_executor_stats
 *
 * Returns the setting name, or NULL if arg is not recognized.
 *
 * The decision is based solely on the arg parameter.  (Looking at getopt's
 * global optarg here would give wrong answers, or crash, whenever the
 * caller passes a string other than the current optarg.)
 */
const char *
get_stats_option_name(const char *arg)
{
	switch (arg[0])
	{
		case 'p':
			/* arg[1] is at worst the terminating NUL, so this is safe */
			if (arg[1] == 'a')	/* "parser" */
				return "log_parser_stats";
			else if (arg[1] == 'l')		/* "planner" */
				return "log_planner_stats";
			break;

		case 'e':				/* "executor" */
			return "log_executor_stats";

		default:
			break;
	}

	return NULL;
}


3193
/* ----------------------------------------------------------------
3194 3195
 * process_postgres_switches
 *	   Parse command line arguments for PostgresMain
3196
 *
3197 3198 3199 3200 3201
 * This is called twice, once for the "secure" options coming from the
 * postmaster or command line, and once for the "insecure" options coming
 * from the client's startup packet.  The latter have the same syntax but
 * may be restricted in what they can do.
 *
3202
 * argv[0] is ignored in either case (it's assumed to be the program name).
3203 3204 3205 3206 3207 3208
 *
 * ctx is PGC_POSTMASTER for secure options, PGC_BACKEND for insecure options
 * coming from the client, or PGC_SUSET for insecure options coming from
 * a superuser client.
 *
 * Returns the database name extracted from the command line, if any.
3209 3210
 * ----------------------------------------------------------------
 */
3211
const char *
3212
process_postgres_switches(int argc, char *argv[], GucContext ctx)
3213
{
3214 3215
	const char *dbname;
	bool		secure = (ctx == PGC_POSTMASTER);
3216
	int			errs = 0;
3217
	GucSource	gucsource;
3218
	int			flag;
3219

3220
	if (secure)
3221
	{
B
Bruce Momjian 已提交
3222
		gucsource = PGC_S_ARGV; /* switches came from command line */
3223

3224 3225 3226 3227 3228 3229 3230 3231
		/* Ignore the initial --single argument, if present */
		if (argc > 1 && strcmp(argv[1], "--single") == 0)
		{
			argv++;
			argc--;
		}
	}
	else
3232
	{
3233
		gucsource = PGC_S_CLIENT;		/* switches came from client */
3234 3235
	}

3236
	/*
B
Bruce Momjian 已提交
3237 3238 3239
	 * Parse command-line options.	CAUTION: keep this in sync with
	 * postmaster/postmaster.c (the option sets should not conflict) and with
	 * the common help() function in main/main.c.
3240
	 */
3241
	while ((flag = getopt(argc, argv, "A:B:bc:D:d:EeFf:h:ijk:lN:nOo:Pp:r:S:sTt:v:W:-:")) != -1)
3242
	{
3243 3244
		switch (flag)
		{
M
 
Marc G. Fournier 已提交
3245
			case 'A':
3246
				SetConfigOption("debug_assertions", optarg, ctx, gucsource);
M
 
Marc G. Fournier 已提交
3247
				break;
3248

3249
			case 'B':
3250
				SetConfigOption("shared_buffers", optarg, ctx, gucsource);
3251
				break;
3252

3253 3254 3255 3256 3257
			case 'b':
				/* Undocumented flag used for binary upgrades */
				IsBinaryUpgrade = true;
				break;

3258
			case 'D':
3259
				if (secure)
3260
					userDoption = strdup(optarg);
M
 
Marc G. Fournier 已提交
3261
				break;
3262

3263
			case 'd':
3264
				set_debug_options(atoi(optarg), ctx, gucsource);
3265
				break;
3266 3267

			case 'E':
3268
				EchoQuery = true;
3269
				break;
3270 3271

			case 'e':
3272
				SetConfigOption("datestyle", "euro", ctx, gucsource);
3273
				break;
3274 3275

			case 'F':
3276
				SetConfigOption("fsync", "false", ctx, gucsource);
3277
				break;
3278 3279

			case 'f':
3280 3281 3282
				if (!set_plan_disabling_options(optarg, ctx, gucsource))
					errs++;
				break;
3283

3284 3285
			case 'h':
				SetConfigOption("listen_addresses", optarg, ctx, gucsource);
3286 3287
				break;

3288 3289 3290
			case 'i':
				SetConfigOption("listen_addresses", "*", ctx, gucsource);
				break;
3291

3292
			case 'j':
3293 3294
				UseNewLine = 0;
				break;
3295

3296 3297 3298
			case 'k':
				SetConfigOption("unix_socket_directory", optarg, ctx, gucsource);
				break;
3299

3300 3301
			case 'l':
				SetConfigOption("ssl", "true", ctx, gucsource);
3302 3303
				break;

3304 3305 3306
			case 'N':
				SetConfigOption("max_connections", optarg, ctx, gucsource);
				break;
3307

3308 3309 3310 3311 3312 3313
			case 'n':
				/* ignored for consistency with postmaster */
				break;

			case 'O':
				SetConfigOption("allow_system_table_mods", "true", ctx, gucsource);
H
Hiroshi Inoue 已提交
3314 3315
				break;

T
Tom Lane 已提交
3316
			case 'o':
3317 3318
				errs++;
				break;
3319

3320 3321
			case 'P':
				SetConfigOption("ignore_system_indexes", "true", ctx, gucsource);
T
Tom Lane 已提交
3322 3323
				break;

3324
			case 'p':
3325 3326
				SetConfigOption("port", optarg, ctx, gucsource);
				break;
B
Bruce Momjian 已提交
3327

3328 3329
			case 'r':
				/* send output (stdout and stderr) to the given file */
3330
				if (secure)
3331
					strlcpy(OutputFileName, optarg, MAXPGPATH);
3332
				break;
3333

3334
			case 'S':
3335
				SetConfigOption("work_mem", optarg, ctx, gucsource);
3336
				break;
3337 3338

			case 's':
3339
				SetConfigOption("log_statement_stats", "true", ctx, gucsource);
M
 
Marc G. Fournier 已提交
3340 3341
				break;

3342 3343 3344 3345
			case 'T':
				/* ignored for consistency with postmaster */
				break;

3346
			case 't':
3347
				{
B
Bruce Momjian 已提交
3348 3349 3350
					const char *tmp = get_stats_option_name(optarg);

					if (tmp)
3351
						SetConfigOption(tmp, "true", ctx, gucsource);
3352
					else
B
Bruce Momjian 已提交
3353 3354
						errs++;
					break;
3355
				}
3356

3357
			case 'v':
B
Bruce Momjian 已提交
3358

3359 3360
				/*
				 * -v is no longer used in normal operation, since
B
Bruce Momjian 已提交
3361 3362 3363 3364
				 * FrontendProtocol is already set before we get here. We keep
				 * the switch only for possible use in standalone operation,
				 * in case we ever support using normal FE/BE protocol with a
				 * standalone backend.
3365
				 */
3366 3367
				if (secure)
					FrontendProtocol = (ProtocolVersion) atoi(optarg);
3368 3369
				break;

M
 
Marc G. Fournier 已提交
3370
			case 'W':
3371 3372
				SetConfigOption("post_auth_delay", optarg, ctx, gucsource);
				break;
3373

3374
			case 'c':
3375
			case '-':
3376
				{
B
Bruce Momjian 已提交
3377 3378
					char	   *name,
							   *value;
3379

B
Bruce Momjian 已提交
3380 3381 3382 3383
					ParseLongOption(optarg, &name, &value);
					if (!value)
					{
						if (flag == '-')
3384 3385 3386 3387
							ereport(ERROR,
									(errcode(ERRCODE_SYNTAX_ERROR),
									 errmsg("--%s requires a value",
											optarg)));
B
Bruce Momjian 已提交
3388
						else
3389 3390 3391 3392
							ereport(ERROR,
									(errcode(ERRCODE_SYNTAX_ERROR),
									 errmsg("-c %s requires a value",
											optarg)));
B
Bruce Momjian 已提交
3393
					}
3394
					SetConfigOption(name, value, ctx, gucsource);
B
Bruce Momjian 已提交
3395 3396 3397 3398 3399
					free(name);
					if (value)
						free(value);
					break;
				}
3400

3401 3402
			default:
				errs++;
T
Tom Lane 已提交
3403
				break;
3404
		}
3405 3406
	}

3407
	/*
3408 3409
	 * Should be no more arguments except an optional database name, and
	 * that's only in the secure case.
3410
	 */
3411
	if (errs || argc - optind > 1 || (argc != optind && !secure))
3412
	{
3413 3414 3415 3416 3417
		/* spell the error message a bit differently depending on context */
		if (IsUnderPostmaster)
			ereport(FATAL,
					(errcode(ERRCODE_SYNTAX_ERROR),
				 errmsg("invalid command-line arguments for server process"),
B
Bruce Momjian 已提交
3418
			  errhint("Try \"%s --help\" for more information.", progname)));
3419 3420 3421 3422
		else
			ereport(FATAL,
					(errcode(ERRCODE_SYNTAX_ERROR),
					 errmsg("%s: invalid command-line arguments",
3423
							progname),
B
Bruce Momjian 已提交
3424
			  errhint("Try \"%s --help\" for more information.", progname)));
3425
	}
3426

3427 3428 3429 3430
	if (argc - optind == 1)
		dbname = strdup(argv[optind]);
	else
		dbname = NULL;
3431

3432 3433 3434 3435 3436
	/*
	 * Reset getopt(3) library so that it will work correctly in subprocesses
	 * or when this function is called a second time with another array.
	 */
	optind = 1;
3437
#ifdef HAVE_INT_OPTRESET
3438 3439
	optreset = 1;				/* some systems need this too */
#endif
3440

3441 3442
	return dbname;
}
3443

3444 3445 3446 3447 3448 3449 3450 3451 3452 3453 3454 3455 3456 3457 3458 3459 3460 3461 3462 3463 3464 3465 3466 3467 3468 3469 3470 3471 3472 3473 3474 3475 3476 3477 3478 3479 3480 3481 3482 3483 3484 3485 3486 3487

/* ----------------------------------------------------------------
 * PostgresMain
 *	   postgres main loop -- all backends, interactive or otherwise start here
 *
 * argc/argv are the command line arguments to be used.  (When being forked
 * by the postmaster, these are not the original argv array of the process.)
 * username is the (possibly authenticated) PostgreSQL user name to be used
 * for the session.
 * ----------------------------------------------------------------
 */
int
PostgresMain(int argc, char *argv[], const char *username)
{
	const char *dbname;
	int			firstchar;
	char		stack_base;
	StringInfoData input_message;
	sigjmp_buf	local_sigjmp_buf;
	volatile bool send_ready_for_query = true;

	/*
	 * Initialize globals (already done if under postmaster, but not if
	 * standalone).
	 */
	if (!IsUnderPostmaster)
	{
		MyProcPid = getpid();

		MyStartTime = time(NULL);
	}

	/*
	 * Fire up essential subsystems: error and memory management
	 *
	 * If we are running under the postmaster, this is done already.
	 */
	if (!IsUnderPostmaster)
		MemoryContextInit();

	SetProcessingMode(InitProcessing);

	/* Set up reference point for stack depth checking */
	stack_base_ptr = &stack_base;
3488 3489 3490
#if defined(__ia64__) || defined(__ia64)
	register_stack_base_ptr = ia64_get_bsp();
#endif
3491 3492 3493 3494 3495 3496 3497 3498 3499 3500 3501 3502 3503 3504 3505 3506 3507 3508 3509 3510 3511 3512 3513 3514 3515 3516 3517 3518 3519

	/* Compute paths, if we didn't inherit them from postmaster */
	if (my_exec_path[0] == '\0')
	{
		if (find_my_exec(argv[0], my_exec_path) < 0)
			elog(FATAL, "%s: could not locate my own executable path",
				 argv[0]);
	}

	if (pkglib_path[0] == '\0')
		get_pkglib_path(my_exec_path, pkglib_path);

	/*
	 * Set default values for command-line options.
	 */
	if (!IsUnderPostmaster)
		InitializeGUCOptions();

	/*
	 * Parse command-line options.
	 */
	dbname = process_postgres_switches(argc, argv, PGC_POSTMASTER);

	/* Must have gotten a database name, or have a default (the username) */
	if (dbname == NULL)
	{
		dbname = username;
		if (dbname == NULL)
			ereport(FATAL,
B
Bruce Momjian 已提交
3520 3521 3522
					(errcode(ERRCODE_INVALID_PARAMETER_VALUE),
					 errmsg("%s: no database nor user name specified",
							progname)));
3523 3524
	}

3525 3526
	/* Acquire configuration parameters, unless inherited from postmaster */
	if (!IsUnderPostmaster)
3527
	{
3528
		if (!SelectConfigFiles(userDoption, progname))
3529
			proc_exit(1);
3530 3531
		/* If timezone is not set, determine what the OS uses */
		pg_timezone_initialize();
3532 3533
		/* If timezone_abbreviations is not set, select default */
		pg_timezone_abbrev_initialize();
3534
	}
3535

3536 3537 3538 3539 3540
	/*
	 * You might expect to see a setsid() call here, but it's not needed,
	 * because if we are under a postmaster then BackendInitialize() did it.
	 */

3541
	/*
3542
	 * Set up signal handlers and masks.
3543
	 *
3544 3545 3546
	 * Note that postmaster blocked all signals before forking child process,
	 * so there is no race condition whereby we might receive a signal before
	 * we have set up the handler.
T
Tom Lane 已提交
3547
	 *
B
Bruce Momjian 已提交
3548 3549 3550 3551 3552 3553
	 * Also note: it's best not to use any signals that are SIG_IGNored in the
	 * postmaster.	If such a signal arrives before we are able to change the
	 * handler to non-SIG_IGN, it'll get dropped.  Instead, make a dummy
	 * handler in the postmaster to reserve the signal. (Of course, this isn't
	 * an issue for signals that are locally generated, such as SIGALRM and
	 * SIGPIPE.)
3554
	 */
3555 3556
	if (am_walsender)
		WalSndSignals();
3557
	else
3558
	{
B
Bruce Momjian 已提交
3559 3560 3561 3562
		pqsignal(SIGHUP, SigHupHandler);		/* set flag to read config
												 * file */
		pqsignal(SIGINT, StatementCancelHandler);		/* cancel current query */
		pqsignal(SIGTERM, die); /* cancel current query and exit */
3563

3564 3565
		/*
		 * In a standalone backend, SIGQUIT can be generated from the keyboard
B
Bruce Momjian 已提交
3566 3567
		 * easily, while SIGTERM cannot, so we make both signals do die()
		 * rather than quickdie().
3568 3569
		 */
		if (IsUnderPostmaster)
B
Bruce Momjian 已提交
3570
			pqsignal(SIGQUIT, quickdie);		/* hard crash time */
3571
		else
B
Bruce Momjian 已提交
3572 3573
			pqsignal(SIGQUIT, die);		/* cancel current query and exit */
		pqsignal(SIGALRM, handle_sig_alarm);	/* timeout conditions */
3574

3575 3576 3577
		/*
		 * Ignore failure to write to frontend. Note: if frontend closes
		 * connection, we will notice it and exit cleanly when control next
B
Bruce Momjian 已提交
3578 3579
		 * returns to outer loop.  This seems safer than forcing exit in the
		 * midst of output during who-knows-what operation...
3580 3581 3582 3583 3584 3585 3586
		 */
		pqsignal(SIGPIPE, SIG_IGN);
		pqsignal(SIGUSR1, procsignal_sigusr1_handler);
		pqsignal(SIGUSR2, SIG_IGN);
		pqsignal(SIGFPE, FloatExceptionHandler);

		/*
B
Bruce Momjian 已提交
3587 3588
		 * Reset some signals that are accepted by postmaster but not by
		 * backend
3589
		 */
B
Bruce Momjian 已提交
3590 3591
		pqsignal(SIGCHLD, SIG_DFL);		/* system() requires this on some
										 * platforms */
3592
	}
3593

3594 3595
	pqinitmask();

3596 3597 3598 3599 3600
	if (IsUnderPostmaster)
	{
		/* We allow SIGQUIT (quickdie) at all times */
		sigdelset(&BlockSig, SIGQUIT);
	}
3601

T
Tom Lane 已提交
3602
	PG_SETMASK(&BlockSig);		/* block everything except SIGQUIT */
3603

3604
	if (!IsUnderPostmaster)
3605
	{
3606
		/*
B
Bruce Momjian 已提交
3607 3608
		 * Validate we have been given a reasonable-looking DataDir (if under
		 * postmaster, assume postmaster did this already).
3609
		 */
3610
		Assert(DataDir);
3611 3612
		ValidatePgVersion(DataDir);

3613 3614 3615
		/* Change into DataDir (if under postmaster, was done already) */
		ChangeToDataDir();

3616
		/*
3617
		 * Create lockfile for data directory.
3618
		 */
3619
		CreateDataDirLockFile(false);
3620 3621
	}

3622 3623 3624
	/* Early initialization */
	BaseInit();

3625
	/*
B
Bruce Momjian 已提交
3626 3627 3628 3629
	 * Create a per-backend PGPROC struct in shared memory, except in the
	 * EXEC_BACKEND case where this was done in SubPostmasterMain. We must do
	 * this before we can use LWLocks (and in the EXEC_BACKEND case we already
	 * had to do some stuff with LWLocks).
3630 3631 3632 3633 3634 3635 3636 3637
	 */
#ifdef EXEC_BACKEND
	if (!IsUnderPostmaster)
		InitProcess();
#else
	InitProcess();
#endif

3638 3639 3640
	/* We need to allow SIGINT, etc during the initial transaction */
	PG_SETMASK(&UnBlockSig);

3641
	/*
3642 3643
	 * General initialization.
	 *
3644 3645 3646
	 * NOTE: if you are tempted to add code in this vicinity, consider putting
	 * it inside InitPostgres() instead.  In particular, anything that
	 * involves database access should be there, not here.
3647
	 */
3648
	InitPostgres(dbname, InvalidOid, username, NULL);
3649

3650 3651 3652 3653 3654 3655 3656 3657 3658 3659 3660 3661 3662
	/*
	 * If the PostmasterContext is still around, recycle the space; we don't
	 * need it anymore after InitPostgres completes.  Note this does not trash
	 * *MyProcPort, because ConnCreate() allocated that space with malloc()
	 * ... else we'd need to copy the Port data first.  Also, subsidiary data
	 * such as the username isn't lost either; see ProcessStartupPacket().
	 */
	if (PostmasterContext)
	{
		MemoryContextDelete(PostmasterContext);
		PostmasterContext = NULL;
	}

3663
	SetProcessingMode(NormalProcessing);
3664

3665 3666 3667 3668 3669 3670
	/*
	 * Now all GUC states are fully set up.  Report them to client if
	 * appropriate.
	 */
	BeginReportingGUCOptions();

3671
	/*
B
Bruce Momjian 已提交
3672 3673
	 * Also set up handler to log session end; we have to wait till now to be
	 * sure Log_disconnections has its final value.
3674 3675 3676 3677
	 */
	if (IsUnderPostmaster && Log_disconnections)
		on_proc_exit(log_disconnections, 0);

3678 3679 3680 3681
	/* If this is a WAL sender process, we're done with initialization. */
	if (am_walsender)
		proc_exit(WalSenderMain());

3682
	/*
B
Bruce Momjian 已提交
3683 3684
	 * process any libraries that should be preloaded at backend start (this
	 * likewise can't be done until GUC settings are complete)
3685 3686 3687
	 */
	process_local_preload_libraries();

3688 3689
	/*
	 * Send this backend's cancellation info to the frontend.
3690
	 */
3691
	if (whereToSendOutput == DestRemote &&
M
 
Marc G. Fournier 已提交
3692 3693
		PG_PROTOCOL_MAJOR(FrontendProtocol) >= 2)
	{
3694
		StringInfoData buf;
B
Bruce Momjian 已提交
3695

3696
		pq_beginmessage(&buf, 'K');
3697 3698 3699
		pq_sendint(&buf, (int32) MyProcPid, sizeof(int32));
		pq_sendint(&buf, (int32) MyCancelKey, sizeof(int32));
		pq_endmessage(&buf);
M
 
Marc G. Fournier 已提交
3700 3701 3702
		/* Need not flush since ReadyForQuery will do it. */
	}

3703
	/* Welcome banner for standalone case */
3704
	if (whereToSendOutput == DestDebug)
3705
		printf("\nPostgreSQL stand-alone backend %s\n", PG_VERSION);
3706

3707 3708 3709
	/*
	 * Create the memory context we will use in the main loop.
	 *
3710 3711
	 * MessageContext is reset once per iteration of the main loop, ie, upon
	 * completion of processing of each command message from the client.
3712
	 */
3713 3714 3715 3716 3717
	MessageContext = AllocSetContextCreate(TopMemoryContext,
										   "MessageContext",
										   ALLOCSET_DEFAULT_MINSIZE,
										   ALLOCSET_DEFAULT_INITSIZE,
										   ALLOCSET_DEFAULT_MAXSIZE);
3718

3719
	/*
3720
	 * Remember stand-alone backend startup time
3721 3722
	 */
	if (!IsUnderPostmaster)
3723
		PgStartTime = GetCurrentTimestamp();
3724

3725 3726
	/*
	 * POSTGRES main processing loop begins here
3727
	 *
B
Bruce Momjian 已提交
3728 3729
	 * If an exception is encountered, processing resumes here so we abort the
	 * current transaction and start a new one.
3730
	 *
3731 3732 3733 3734 3735 3736 3737
	 * You might wonder why this isn't coded as an infinite loop around a
	 * PG_TRY construct.  The reason is that this is the bottom of the
	 * exception stack, and so with PG_TRY there would be no exception handler
	 * in force at all during the CATCH part.  By leaving the outermost setjmp
	 * always active, we have at least some chance of recovering from an error
	 * during error recovery.  (If we get into an infinite loop thereby, it
	 * will soon be stopped by overflow of elog.c's internal state stack.)
3738 3739
	 */

3740
	if (sigsetjmp(local_sigjmp_buf, 1) != 0)
3741
	{
3742
		/*
3743
		 * NOTE: if you are tempted to add more code in this if-block,
3744
		 * consider the high probability that it should be in
B
Bruce Momjian 已提交
3745
		 * AbortTransaction() instead.	The only stuff done directly here
B
Bruce Momjian 已提交
3746 3747
		 * should be stuff that is guaranteed to apply *only* for outer-level
		 * error recovery, such as adjusting the FE/BE protocol status.
3748 3749 3750 3751 3752 3753 3754 3755 3756
		 */

		/* Since not using PG_TRY, must reset error stack by hand */
		error_context_stack = NULL;

		/* Prevent interrupts while cleaning up */
		HOLD_INTERRUPTS();

		/*
B
Bruce Momjian 已提交
3757 3758
		 * Forget any pending QueryCancel request, since we're returning to
		 * the idle loop anyway, and cancel the statement timer if running.
3759 3760
		 */
		QueryCancelPending = false;
3761
		disable_sig_alarm(true);
B
Bruce Momjian 已提交
3762
		QueryCancelPending = false;		/* again in case timeout occurred */
3763 3764

		/*
B
Bruce Momjian 已提交
3765 3766 3767
		 * Turn off these interrupts too.  This is only needed here and not in
		 * other exception-catching places since these interrupts are only
		 * enabled while we wait for client input.
3768
		 */
3769
		DoingCommandRead = false;
3770
		DisableNotifyInterrupt();
3771
		DisableCatchupInterrupt();
3772

3773 3774 3775
		/* Make sure libpq is in a good state */
		pq_comm_reset();

3776 3777
		/* Report the error to the client and/or server log */
		EmitErrorReport();
3778

3779
		/*
B
Bruce Momjian 已提交
3780 3781
		 * Make sure debug_query_string gets reset before we possibly clobber
		 * the storage it points at.
3782
		 */
3783
		debug_query_string = NULL;
3784

3785
		/*
3786
		 * Abort the current transaction in order to recover.
3787
		 */
3788
		AbortCurrentTransaction();
3789 3790

		/*
B
Bruce Momjian 已提交
3791 3792
		 * Now return to normal top-level context and clear ErrorContext for
		 * next time.
3793 3794
		 */
		MemoryContextSwitchTo(TopMemoryContext);
3795
		FlushErrorState();
3796

3797
		/*
B
Bruce Momjian 已提交
3798 3799
		 * If we were handling an extended-query-protocol message, initiate
		 * skip till next Sync.  This also causes us not to issue
B
Bruce Momjian 已提交
3800
		 * ReadyForQuery (until we get Sync).
3801 3802 3803
		 */
		if (doing_extended_query_message)
			ignore_till_sync = true;
3804

3805 3806
		/* We don't have a transaction command open anymore */
		xact_started = false;
3807

3808
		/* Now we can allow interrupts again */
3809
		RESUME_INTERRUPTS();
3810
	}
3811

3812 3813
	/* We can now handle ereport(ERROR) */
	PG_exception_stack = &local_sigjmp_buf;
3814

3815
	if (!ignore_till_sync)
B
Bruce Momjian 已提交
3816
		send_ready_for_query = true;	/* initially, or after error */
3817

3818 3819
	/*
	 * Non-error queries loop here.
3820 3821 3822 3823
	 */

	for (;;)
	{
3824
		/*
B
Bruce Momjian 已提交
3825 3826
		 * At top of loop, reset extended-query-message flag, so that any
		 * errors encountered in "idle" state don't provoke skip.
3827 3828 3829
		 */
		doing_extended_query_message = false;

3830
		/*
B
Bruce Momjian 已提交
3831 3832
		 * Release storage left over from prior query cycle, and create a new
		 * query input buffer in the cleared MessageContext.
3833
		 */
3834 3835
		MemoryContextSwitchTo(MessageContext);
		MemoryContextResetAndDeleteChildren(MessageContext);
3836

3837
		initStringInfo(&input_message);
3838

3839
		/*
B
Bruce Momjian 已提交
3840 3841
		 * (1) If we've reached idle state, tell the frontend we're ready for
		 * a new query.
3842
		 *
3843
		 * Note: this includes fflush()'ing the last of the prior output.
3844 3845 3846
		 *
		 * This is also a good time to send collected statistics to the
		 * collector, and to update the PS stats display.  We avoid doing
B
Bruce Momjian 已提交
3847 3848
		 * those every time through the message loop because it'd slow down
		 * processing of batched messages, and because we don't want to report
B
Bruce Momjian 已提交
3849
		 * uncommitted updates (that confuses autovacuum).	The notification
3850
		 * processor wants a call too, if we are not in a transaction block.
B
Bruce Momjian 已提交
3851
		 */
3852
		if (send_ready_for_query)
3853
		{
3854 3855 3856 3857 3858 3859
			if (IsAbortedTransactionBlockState())
			{
				set_ps_display("idle in transaction (aborted)", false);
				pgstat_report_activity("<IDLE> in transaction (aborted)");
			}
			else if (IsTransactionOrTransactionBlock())
3860
			{
3861
				set_ps_display("idle in transaction", false);
3862 3863 3864 3865
				pgstat_report_activity("<IDLE> in transaction");
			}
			else
			{
3866
				ProcessCompletedNotifies();
3867
				pgstat_report_stat(false);
3868

3869
				set_ps_display("idle", false);
3870 3871
				pgstat_report_activity("<IDLE>");
			}
3872

3873
			ReadyForQuery(whereToSendOutput);
3874
			send_ready_for_query = false;
3875
		}
3876

3877
		/*
B
Bruce Momjian 已提交
3878 3879 3880 3881
		 * (2) Allow asynchronous signals to be executed immediately if they
		 * come in while we are waiting for client input. (This must be
		 * conditional since we don't want, say, reads on behalf of COPY FROM
		 * STDIN doing the same thing.)
3882
		 */
3883
		DoingCommandRead = true;
3884

3885 3886
		/*
		 * (3) read a command (loop blocks here)
3887
		 */
3888
		firstchar = ReadCommand(&input_message);
3889

3890 3891
		/*
		 * (4) disable async signal conditions again.
3892
		 */
3893
		DoingCommandRead = false;
3894

3895
		/*
B
Bruce Momjian 已提交
3896 3897
		 * (5) check for any other interesting events that happened while we
		 * slept.
3898 3899 3900 3901 3902 3903 3904
		 */
		if (got_SIGHUP)
		{
			got_SIGHUP = false;
			ProcessConfigFile(PGC_SIGHUP);
		}

3905
		/*
B
Bruce Momjian 已提交
3906 3907
		 * (6) process the command.  But ignore it if we're skipping till
		 * Sync.
3908
		 */
3909
		if (ignore_till_sync && firstchar != EOF)
3910 3911
			continue;

3912 3913
		switch (firstchar)
		{
3914
			case 'Q':			/* simple query */
3915
				{
3916 3917
					const char *query_string;

3918 3919 3920
					/* Set statement_timestamp() */
					SetCurrentStatementStartTimestamp();

3921 3922
					query_string = pq_getmsgstring(&input_message);
					pq_getmsgend(&input_message);
3923

3924
					exec_simple_query(query_string);
3925

3926
					send_ready_for_query = true;
3927
				}
3928 3929
				break;

3930 3931 3932 3933 3934 3935 3936
			case 'P':			/* parse */
				{
					const char *stmt_name;
					const char *query_string;
					int			numParams;
					Oid		   *paramTypes = NULL;

3937 3938 3939
					/* Set statement_timestamp() */
					SetCurrentStatementStartTimestamp();

3940 3941 3942
					stmt_name = pq_getmsgstring(&input_message);
					query_string = pq_getmsgstring(&input_message);
					numParams = pq_getmsgint(&input_message, 2);
3943 3944
					if (numParams > 0)
					{
B
Bruce Momjian 已提交
3945
						int			i;
3946 3947 3948

						paramTypes = (Oid *) palloc(numParams * sizeof(Oid));
						for (i = 0; i < numParams; i++)
3949
							paramTypes[i] = pq_getmsgint(&input_message, 4);
3950
					}
3951
					pq_getmsgend(&input_message);
3952 3953 3954 3955 3956 3957 3958

					exec_parse_message(query_string, stmt_name,
									   paramTypes, numParams);
				}
				break;

			case 'B':			/* bind */
3959 3960
				/* Set statement_timestamp() */
				SetCurrentStatementStartTimestamp();
B
Bruce Momjian 已提交
3961

3962
				/*
B
Bruce Momjian 已提交
3963 3964
				 * this message is complex enough that it seems best to put
				 * the field extraction out-of-line
3965
				 */
3966
				exec_bind_message(&input_message);
3967 3968 3969 3970 3971
				break;

			case 'E':			/* execute */
				{
					const char *portal_name;
3972
					int			max_rows;
3973

3974 3975 3976
					/* Set statement_timestamp() */
					SetCurrentStatementStartTimestamp();

3977
					portal_name = pq_getmsgstring(&input_message);
3978
					max_rows = pq_getmsgint(&input_message, 4);
3979
					pq_getmsgend(&input_message);
3980

3981
					exec_execute_message(portal_name, max_rows);
3982 3983 3984
				}
				break;

3985
			case 'F':			/* fastpath function call */
3986 3987 3988
				/* Set statement_timestamp() */
				SetCurrentStatementStartTimestamp();

3989
				/* Report query to various monitoring facilities. */
3990
				pgstat_report_activity("<FASTPATH> function call");
3991
				set_ps_display("<FASTPATH>", false);
3992

3993
				/* start an xact for this function invocation */
3994
				start_xact_command();
3995

3996 3997
				/*
				 * Note: we may at this point be inside an aborted
B
Bruce Momjian 已提交
3998 3999
				 * transaction.  We can't throw error for that until we've
				 * finished reading the function-call message, so
4000 4001 4002 4003 4004
				 * HandleFunctionRequest() must check for it after doing so.
				 * Be careful not to do anything that assumes we're inside a
				 * valid transaction here.
				 */

4005 4006 4007
				/* switch back to message context */
				MemoryContextSwitchTo(MessageContext);

4008
				if (HandleFunctionRequest(&input_message) == EOF)
4009 4010
				{
					/* lost frontend connection during F message input */
B
Bruce Momjian 已提交
4011

4012
					/*
4013
					 * Reset whereToSendOutput to prevent ereport from
B
Bruce Momjian 已提交
4014
					 * attempting to send any more messages to client.
4015
					 */
4016 4017
					if (whereToSendOutput == DestRemote)
						whereToSendOutput = DestNone;
4018

4019
					proc_exit(0);
4020
				}
4021 4022

				/* commit the function-invocation transaction */
4023
				finish_xact_command();
4024

4025
				send_ready_for_query = true;
4026 4027
				break;

B
Bruce Momjian 已提交
4028
			case 'C':			/* close */
4029
				{
B
Bruce Momjian 已提交
4030
					int			close_type;
4031 4032
					const char *close_target;

4033 4034 4035
					close_type = pq_getmsgbyte(&input_message);
					close_target = pq_getmsgstring(&input_message);
					pq_getmsgend(&input_message);
4036 4037 4038 4039 4040 4041 4042 4043 4044

					switch (close_type)
					{
						case 'S':
							if (close_target[0] != '\0')
								DropPreparedStatement(close_target, false);
							else
							{
								/* special-case the unnamed statement */
4045
								drop_unnamed_stmt();
4046 4047 4048 4049 4050 4051 4052 4053 4054 4055 4056 4057
							}
							break;
						case 'P':
							{
								Portal		portal;

								portal = GetPortalByName(close_target);
								if (PortalIsValid(portal))
									PortalDrop(portal, false);
							}
							break;
						default:
4058 4059
							ereport(ERROR,
									(errcode(ERRCODE_PROTOCOL_VIOLATION),
B
Bruce Momjian 已提交
4060 4061
								   errmsg("invalid CLOSE message subtype %d",
										  close_type)));
4062 4063 4064
							break;
					}

4065
					if (whereToSendOutput == DestRemote)
B
Bruce Momjian 已提交
4066
						pq_putemptymessage('3');		/* CloseComplete */
4067 4068 4069 4070 4071
				}
				break;

			case 'D':			/* describe */
				{
B
Bruce Momjian 已提交
4072
					int			describe_type;
4073 4074
					const char *describe_target;

4075 4076 4077
					/* Set statement_timestamp() (needed for xact) */
					SetCurrentStatementStartTimestamp();

4078 4079 4080
					describe_type = pq_getmsgbyte(&input_message);
					describe_target = pq_getmsgstring(&input_message);
					pq_getmsgend(&input_message);
4081 4082 4083 4084 4085 4086 4087 4088 4089 4090

					switch (describe_type)
					{
						case 'S':
							exec_describe_statement_message(describe_target);
							break;
						case 'P':
							exec_describe_portal_message(describe_target);
							break;
						default:
4091 4092
							ereport(ERROR,
									(errcode(ERRCODE_PROTOCOL_VIOLATION),
B
Bruce Momjian 已提交
4093 4094
								errmsg("invalid DESCRIBE message subtype %d",
									   describe_type)));
4095 4096 4097 4098 4099
							break;
					}
				}
				break;

B
Bruce Momjian 已提交
4100
			case 'H':			/* flush */
4101
				pq_getmsgend(&input_message);
4102
				if (whereToSendOutput == DestRemote)
4103 4104 4105
					pq_flush();
				break;

B
Bruce Momjian 已提交
4106
			case 'S':			/* sync */
4107
				pq_getmsgend(&input_message);
4108
				finish_xact_command();
4109
				send_ready_for_query = true;
4110 4111
				break;

4112
				/*
B
Bruce Momjian 已提交
4113 4114 4115
				 * 'X' means that the frontend is closing down the socket. EOF
				 * means unexpected loss of frontend connection. Either way,
				 * perform normal shutdown.
4116 4117
				 */
			case 'X':
4118
			case EOF:
B
Bruce Momjian 已提交
4119

4120
				/*
B
Bruce Momjian 已提交
4121 4122
				 * Reset whereToSendOutput to prevent ereport from attempting
				 * to send any more messages to client.
4123
				 */
4124 4125
				if (whereToSendOutput == DestRemote)
					whereToSendOutput = DestNone;
B
Bruce Momjian 已提交
4126

4127 4128
				/*
				 * NOTE: if you are tempted to add more code here, DON'T!
B
Bruce Momjian 已提交
4129
				 * Whatever you had in mind to do should be set up as an
B
Bruce Momjian 已提交
4130 4131 4132
				 * on_proc_exit or on_shmem_exit callback, instead. Otherwise
				 * it will fail to be called during other backend-shutdown
				 * scenarios.
4133
				 */
4134
				proc_exit(0);
4135

B
Bruce Momjian 已提交
4136 4137 4138 4139
			case 'd':			/* copy data */
			case 'c':			/* copy done */
			case 'f':			/* copy fail */

4140
				/*
B
Bruce Momjian 已提交
4141
				 * Accept but ignore these messages, per protocol spec; we
B
Bruce Momjian 已提交
4142 4143
				 * probably got here because a COPY failed, and the frontend
				 * is still sending data.
4144 4145 4146
				 */
				break;

4147
			default:
4148 4149 4150 4151
				ereport(FATAL,
						(errcode(ERRCODE_PROTOCOL_VIOLATION),
						 errmsg("invalid frontend message type %d",
								firstchar)));
4152
		}
4153
	}							/* end of input-reading loop */
4154

4155 4156
	/* can't get here because the above loop never exits */
	Assert(false);
4157

4158
	return 1;					/* keep compiler quiet */
4159 4160
}

4161 4162 4163 4164

/*
 * Obtain platform stack depth limit (in bytes)
 *
 * Return -1 if unknown.
 *
 * When getrlimit() and RLIMIT_STACK are available, the soft limit
 * (rlim_cur) is queried and remembered in a function-local static, so later
 * calls return the remembered value.  A stored value of 0 is the "not yet
 * checked" marker, so a result of 0 would simply be queried again.  An
 * unlimited stack, or a limit too large to represent in a long, is reported
 * as LONG_MAX.
 *
 * Without getrlimit(), Windows/Cygwin builds return the compile-time
 * WIN32_STACK_RLIMIT; every other platform returns -1.
 */
long
get_stack_depth_rlimit(void)
{
#if defined(HAVE_GETRLIMIT) && defined(RLIMIT_STACK)
	static long val = 0;

	/* This won't change after process launch, so check just once */
	if (val == 0)
	{
		struct rlimit rlim;

		if (getrlimit(RLIMIT_STACK, &rlim) < 0)
			val = -1;
		else if (rlim.rlim_cur == RLIM_INFINITY)
			val = LONG_MAX;
		/* rlim_cur is probably of an unsigned type, so check for overflow */
		else if (rlim.rlim_cur >= LONG_MAX)
			val = LONG_MAX;
		else
			val = rlim.rlim_cur;
	}
	return val;
#else							/* no getrlimit */
#if defined(WIN32) || defined(__CYGWIN__)
	/* On Windows we set the backend stack size in src/backend/Makefile */
	return WIN32_STACK_RLIMIT;
#else							/* not windows ... give up */
	return -1;
#endif
#endif
}

4199

4200 4201
static struct rusage Save_r;
static struct timeval Save_t;
4202 4203

void
4204
ResetUsage(void)
4205
{
4206
	getrusage(RUSAGE_SELF, &Save_r);
4207
	gettimeofday(&Save_t, NULL);
4208 4209 4210
}

void
4211
ShowUsage(const char *title)
4212
{
4213
	StringInfoData str;
4214 4215 4216 4217
	struct timeval user,
				sys;
	struct timeval elapse_t;
	struct rusage r;
4218 4219

	getrusage(RUSAGE_SELF, &r);
4220
	gettimeofday(&elapse_t, NULL);
4221 4222
	memcpy((char *) &user, (char *) &r.ru_utime, sizeof(user));
	memcpy((char *) &sys, (char *) &r.ru_stime, sizeof(sys));
4223 4224 4225 4226 4227 4228 4229 4230 4231 4232 4233 4234 4235 4236 4237 4238 4239 4240
	if (elapse_t.tv_usec < Save_t.tv_usec)
	{
		elapse_t.tv_sec--;
		elapse_t.tv_usec += 1000000;
	}
	if (r.ru_utime.tv_usec < Save_r.ru_utime.tv_usec)
	{
		r.ru_utime.tv_sec--;
		r.ru_utime.tv_usec += 1000000;
	}
	if (r.ru_stime.tv_usec < Save_r.ru_stime.tv_usec)
	{
		r.ru_stime.tv_sec--;
		r.ru_stime.tv_usec += 1000000;
	}

	/*
	 * the only stats we don't show here are for memory usage -- i can't
B
Bruce Momjian 已提交
4241 4242 4243 4244
	 * figure out how to interpret the relevant fields in the rusage struct,
	 * and they change names across o/s platforms, anyway. if you can figure
	 * out what the entries mean, you can somehow extract resident set size,
	 * shared text size, and unshared data and stack sizes.
4245
	 */
4246
	initStringInfo(&str);
4247

4248 4249
	appendStringInfo(&str, "! system usage stats:\n");
	appendStringInfo(&str,
B
Bruce Momjian 已提交
4250
				"!\t%ld.%06ld elapsed %ld.%06ld user %ld.%06ld system sec\n",
4251 4252 4253
					 (long) (elapse_t.tv_sec - Save_t.tv_sec),
					 (long) (elapse_t.tv_usec - Save_t.tv_usec),
					 (long) (r.ru_utime.tv_sec - Save_r.ru_utime.tv_sec),
B
Bruce Momjian 已提交
4254
					 (long) (r.ru_utime.tv_usec - Save_r.ru_utime.tv_usec),
4255
					 (long) (r.ru_stime.tv_sec - Save_r.ru_stime.tv_sec),
B
Bruce Momjian 已提交
4256
					 (long) (r.ru_stime.tv_usec - Save_r.ru_stime.tv_usec));
4257
	appendStringInfo(&str,
B
Bruce Momjian 已提交
4258
					 "!\t[%ld.%06ld user %ld.%06ld sys total]\n",
4259 4260 4261 4262
					 (long) user.tv_sec,
					 (long) user.tv_usec,
					 (long) sys.tv_sec,
					 (long) sys.tv_usec);
4263
#if defined(HAVE_GETRUSAGE)
4264
	appendStringInfo(&str,
B
Bruce Momjian 已提交
4265 4266
					 "!\t%ld/%ld [%ld/%ld] filesystem blocks in/out\n",
					 r.ru_inblock - Save_r.ru_inblock,
4267
	/* they only drink coffee at dec */
B
Bruce Momjian 已提交
4268 4269
					 r.ru_oublock - Save_r.ru_oublock,
					 r.ru_inblock, r.ru_oublock);
4270
	appendStringInfo(&str,
B
Bruce Momjian 已提交
4271
			  "!\t%ld/%ld [%ld/%ld] page faults/reclaims, %ld [%ld] swaps\n",
B
Bruce Momjian 已提交
4272 4273 4274 4275 4276
					 r.ru_majflt - Save_r.ru_majflt,
					 r.ru_minflt - Save_r.ru_minflt,
					 r.ru_majflt, r.ru_minflt,
					 r.ru_nswap - Save_r.ru_nswap,
					 r.ru_nswap);
4277
	appendStringInfo(&str,
B
Bruce Momjian 已提交
4278
		 "!\t%ld [%ld] signals rcvd, %ld/%ld [%ld/%ld] messages rcvd/sent\n",
B
Bruce Momjian 已提交
4279 4280 4281 4282 4283
					 r.ru_nsignals - Save_r.ru_nsignals,
					 r.ru_nsignals,
					 r.ru_msgrcv - Save_r.ru_msgrcv,
					 r.ru_msgsnd - Save_r.ru_msgsnd,
					 r.ru_msgrcv, r.ru_msgsnd);
4284
	appendStringInfo(&str,
B
Bruce Momjian 已提交
4285
			 "!\t%ld/%ld [%ld/%ld] voluntary/involuntary context switches\n",
B
Bruce Momjian 已提交
4286 4287 4288
					 r.ru_nvcsw - Save_r.ru_nvcsw,
					 r.ru_nivcsw - Save_r.ru_nivcsw,
					 r.ru_nvcsw, r.ru_nivcsw);
4289
#endif   /* HAVE_GETRUSAGE */
4290 4291

	/* remove trailing newline */
B
Bruce Momjian 已提交
4292
	if (str.data[str.len - 1] == '\n')
4293 4294
		str.data[--str.len] = '\0';

4295 4296 4297
	ereport(LOG,
			(errmsg_internal("%s", title),
			 errdetail("%s", str.data)));
4298 4299

	pfree(str.data);
4300
}
4301 4302 4303 4304

/*
 * on_proc_exit handler to log end of session
 */
B
Bruce Momjian 已提交
4305
static void
4306
log_disconnections(int code, Datum arg)
4307
{
B
Bruce Momjian 已提交
4308
	Port	   *port = MyProcPort;
4309 4310 4311
	long		secs;
	int			usecs;
	int			msecs;
B
Bruce Momjian 已提交
4312 4313 4314
	int			hours,
				minutes,
				seconds;
4315

4316 4317 4318 4319
	TimestampDifference(port->SessionStartTime,
						GetCurrentTimestamp(),
						&secs, &usecs);
	msecs = usecs / 1000;
4320

4321 4322 4323 4324
	hours = secs / SECS_PER_HOUR;
	secs %= SECS_PER_HOUR;
	minutes = secs / SECS_PER_MINUTE;
	seconds = secs % SECS_PER_MINUTE;
4325

4326
	ereport(LOG,
4327
			(errmsg("disconnection: session time: %d:%02d:%02d.%03d "
4328
					"user=%s database=%s host=%s%s%s",
4329
					hours, minutes, seconds, msecs,
4330
					port->user_name, port->database_name, port->remote_host,
B
Bruce Momjian 已提交
4331
				  port->remote_port[0] ? " port=" : "", port->remote_port)));
4332
}