postgres.c 109.9 KB
Newer Older
1 2
/*-------------------------------------------------------------------------
 *
3
 * postgres.c
4
 *	  POSTGRES C Backend Interface
5
 *
6
 * Portions Copyright (c) 1996-2010, PostgreSQL Global Development Group
B
Add:  
Bruce Momjian 已提交
7
 * Portions Copyright (c) 1994, Regents of the University of California
8 9 10
 *
 *
 * IDENTIFICATION
11
 *	  $PostgreSQL: pgsql/src/backend/tcop/postgres.c,v 1.589 2010/02/16 20:15:14 momjian Exp $
12 13
 *
 * NOTES
14 15
 *	  this is the "main" module of the postgres backend and
 *	  hence the main module of the "traffic cop".
16 17 18
 *
 *-------------------------------------------------------------------------
 */
B
Bruce Momjian 已提交
19

20 21
#include "postgres.h"

22
#include <time.h>
B
Bruce Momjian 已提交
23
#include <unistd.h>
24
#include <signal.h>
B
Bruce Momjian 已提交
25
#include <fcntl.h>
26
#include <sys/socket.h>
27
#ifdef HAVE_SYS_SELECT_H
28
#include <sys/select.h>
29
#endif
30
#ifdef HAVE_SYS_RESOURCE_H
31
#include <sys/time.h>
32 33
#include <sys/resource.h>
#endif
34
#ifdef HAVE_GETOPT_H
B
Bruce Momjian 已提交
35
#include <getopt.h>
36
#endif
37

38 39 40 41
#ifndef HAVE_GETRUSAGE
#include "rusagestub.h"
#endif

42
#include "access/printtup.h"
43
#include "access/xact.h"
44
#include "catalog/pg_type.h"
45
#include "commands/async.h"
46
#include "commands/prepare.h"
47
#include "libpq/libpq.h"
48
#include "libpq/pqformat.h"
49
#include "libpq/pqsignal.h"
B
Bruce Momjian 已提交
50
#include "miscadmin.h"
51
#include "nodes/print.h"
52
#include "optimizer/planner.h"
53 54
#include "pgstat.h"
#include "pg_trace.h"
55
#include "parser/analyze.h"
56
#include "parser/parser.h"
57
#include "postmaster/autovacuum.h"
58
#include "postmaster/postmaster.h"
59
#include "replication/walsender.h"
B
Bruce Momjian 已提交
60
#include "rewrite/rewriteHandler.h"
61
#include "storage/bufmgr.h"
62 63
#include "storage/ipc.h"
#include "storage/proc.h"
64
#include "storage/procsignal.h"
65
#include "storage/sinval.h"
66 67
#include "tcop/fastpath.h"
#include "tcop/pquery.h"
B
Bruce Momjian 已提交
68
#include "tcop/tcopprot.h"
69
#include "tcop/utility.h"
70
#include "utils/lsyscache.h"
71
#include "utils/memutils.h"
M
 
Marc G. Fournier 已提交
72
#include "utils/ps_status.h"
73
#include "utils/snapmgr.h"
B
Bruce Momjian 已提交
74
#include "mb/pg_wchar.h"
75

M
 
Marc G. Fournier 已提交
76

77
/* getopt() state, declared here in case the system headers omit it */
extern char *optarg;
extern int	optind;

#ifdef HAVE_INT_OPTRESET
/* optreset is likewise not guaranteed to be declared by system headers */
extern int	optreset;
#endif

84

85
/* ----------------
86
 *		global variables
87 88
 * ----------------
 */
89
const char *debug_query_string; /* client-supplied query string */
90

91
/* Note: whereToSendOutput is initialized for the bootstrap/standalone case */
92
CommandDest whereToSendOutput = DestDebug;
93

94
/* flag for logging end of session */
B
Bruce Momjian 已提交
95
bool		Log_disconnections = false;
96

97
int			log_statement = LOGSTMT_NONE;
98

99
/* GUC variable for maximum stack depth (measured in kilobytes) */
100
int			max_stack_depth = 100;
101

102 103 104 105
/* wait N seconds to allow attach from a debugger */
int			PostAuthDelay = 0;


106

107 108 109 110
/* ----------------
 *		private variables
 * ----------------
 */
111

112
/* max_stack_depth converted to bytes for speed of checking */
113
static long max_stack_depth_bytes = 100 * 1024L;
114

N
Neil Conway 已提交
115 116 117 118
/*
 * Stack base pointer -- initialized by PostgresMain. This is not static
 * so that PL/Java can modify it.
 */
B
Bruce Momjian 已提交
119
char	   *stack_base_ptr = NULL;
120 121


122 123 124 125 126
/*
 * Flag to mark SIGHUP. Whenever the main loop comes around it
 * will reread the configuration file. (Better than doing the
 * reading in the signal handler, ey?)
 */
127
static volatile sig_atomic_t got_SIGHUP = false;
128

129 130 131 132 133 134
/*
 * Flag to keep track of whether we have started a transaction.
 * For extended query protocol this has to be remembered across messages.
 */
static bool xact_started = false;

135 136 137 138 139 140 141
/*
 * Flag to indicate that we are doing the outer loop's read-from-client,
 * as opposed to any random read from client that might happen within
 * commands like COPY FROM STDIN.
 */
static bool DoingCommandRead = false;

142 143 144 145 146 147 148 149 150 151 152 153
/*
 * Flags to implement skip-till-Sync-after-error behavior for messages of
 * the extended query protocol.
 */
static bool doing_extended_query_message = false;
static bool ignore_till_sync = false;

/*
 * If an unnamed prepared statement exists, it's stored here.
 * We keep it separate from the hashtable kept by commands/prepare.c
 * in order to reduce overhead for short-lived queries.
 */
154
static CachedPlanSource *unnamed_stmt_psrc = NULL;
B
Bruce Momjian 已提交
155

156
/* workspace for building a new unnamed statement in */
157 158 159
static MemoryContext unnamed_stmt_context = NULL;


160 161 162 163
/* assorted command-line switches */
static const char *userDoption = NULL;		/* -D switch */

static bool EchoQuery = false;				/* -E switch */
164 165 166 167

/*
 * people who want to use EOF should #define DONTUSENEWLINE in
 * tcop/tcopdebug.h
168 169
 */
#ifndef TCOP_DONTUSENEWLINE
B
Bruce Momjian 已提交
170
static int	UseNewLine = 1;		/* Use newlines query delimiters (the default) */
171
#else
172
static int	UseNewLine = 0;		/* Use EOF as query delimiters */
173
#endif   /* TCOP_DONTUSENEWLINE */
174

175
/* whether or not, and why, we were cancelled by conflict with recovery */
176
static bool RecoveryConflictPending = false;
177
static ProcSignalReason	RecoveryConflictReason;
178 179

/* ----------------------------------------------------------------
180
 *		decls for routines only used in this file
181 182
 * ----------------------------------------------------------------
 */
183
static int	InteractiveBackend(StringInfo inBuf);
184
static int	interactive_getc(void);
185 186
static int	SocketBackend(StringInfo inBuf);
static int	ReadCommand(StringInfo inBuf);
187
static List *pg_rewrite_query(Query *query);
188
static bool check_log_statement(List *stmt_list);
189 190
static int	errdetail_execute(List *raw_parsetree_list);
static int	errdetail_params(ParamListInfo params);
191
static int  errdetail_abort(void);
192
static int  errdetail_recovery_conflict(void);
193
static void start_xact_command(void);
194
static void finish_xact_command(void);
195 196 197
static bool IsTransactionExitStmt(Node *parsetree);
static bool IsTransactionExitStmtList(List *parseTrees);
static bool IsTransactionStmtList(List *parseTrees);
198
static void drop_unnamed_stmt(void);
199
static void SigHupHandler(SIGNAL_ARGS);
200
static void log_disconnections(int code, Datum arg);
201 202 203


/* ----------------------------------------------------------------
204
 *		routines to obtain user input
205 206 207 208
 * ----------------------------------------------------------------
 */

/* ----------------
209
 *	InteractiveBackend() is called for user interactive connections
210 211 212
 *
 *	the string entered by the user is placed in its parameter inBuf,
 *	and we act like a Q message was received.
213
 *
214
 *	EOF is returned if end-of-file input is seen; time to shut down.
215 216 217
 * ----------------
 */

218
static int
219
InteractiveBackend(StringInfo inBuf)
220
{
221 222 223
	int			c;				/* character read from getc() */
	bool		end = false;	/* end-of-input flag */
	bool		backslashSeen = false;	/* have we seen a \ ? */
224

225 226
	/*
	 * display a prompt and obtain input from the user
227
	 */
228
	printf("backend> ");
229
	fflush(stdout);
230

231
	resetStringInfo(inBuf);
232

233
	if (UseNewLine)
234
	{
235
		/*
B
Bruce Momjian 已提交
236 237
		 * if we are using \n as a delimiter, then read characters until the
		 * \n.
238 239
		 */
		while ((c = interactive_getc()) != EOF)
240
		{
241
			if (c == '\n')
242
			{
243
				if (backslashSeen)
244
				{
245 246 247 248
					/* discard backslash from inBuf */
					inBuf->data[--inBuf->len] = '\0';
					backslashSeen = false;
					continue;
249 250
				}
				else
251 252 253 254 255
				{
					/* keep the newline character */
					appendStringInfoChar(inBuf, '\n');
					break;
				}
256
			}
257 258 259 260
			else if (c == '\\')
				backslashSeen = true;
			else
				backslashSeen = false;
261

262
			appendStringInfoChar(inBuf, (char) c);
263 264
		}

265 266 267 268 269
		if (c == EOF)
			end = true;
	}
	else
	{
270
		/*
271
		 * otherwise read characters until EOF.
272
		 */
273 274 275 276 277 278
		while ((c = interactive_getc()) != EOF)
			appendStringInfoChar(inBuf, (char) c);

		/* No input before EOF signal means time to quit. */
		if (inBuf->len == 0)
			end = true;
279 280
	}

281 282 283 284 285 286 287
	if (end)
		return EOF;

	/*
	 * otherwise we have a user query so process it.
	 */

288 289 290
	/* Add '\0' to make it look the same as message case. */
	appendStringInfoChar(inBuf, (char) '\0');

291 292
	/*
	 * if the query echo flag was given, print the query..
293 294
	 */
	if (EchoQuery)
295
		printf("statement: %s\n", inBuf->data);
296
	fflush(stdout);
297

298
	return 'Q';
299 300
}

301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318
/*
 * interactive_getc -- fetch a single character from stdin
 *
 * Although no "client" process is on the other end, signals (SIGTERM and
 * SIGQUIT in particular) should still be responded to while we wait, so
 * the read is bracketed by prepare_for_client_read and client_read_ended.
 *
 * Returns whatever getc() returned.
 */
static int
interactive_getc(void)
{
	int			ch;

	prepare_for_client_read();
	ch = getc(stdin);
	client_read_ended();

	return ch;
}

319
/* ----------------
320
 *	SocketBackend()		Is called for frontend-backend connections
321
 *
322
 *	Returns the message type code, and loads message body data into inBuf.
323
 *
324
 *	EOF is returned if the connection is lost.
325 326
 * ----------------
 */
327
static int
328
SocketBackend(StringInfo inBuf)
329
{
330
	int			qtype;
331

332
	/*
333
	 * Get message type code from the frontend.
334
	 */
335
	qtype = pq_getbyte();
336

337 338
	if (qtype == EOF)			/* frontend disconnected */
	{
339 340 341
		ereport(COMMERROR,
				(errcode(ERRCODE_PROTOCOL_VIOLATION),
				 errmsg("unexpected EOF on client connection")));
342 343 344 345
		return qtype;
	}

	/*
B
Bruce Momjian 已提交
346 347 348
	 * Validate message type code before trying to read body; if we have lost
	 * sync, better to say "command unknown" than to run out of memory because
	 * we used garbage as a length word.
349
	 *
350 351
	 * This also gives us a place to set the doing_extended_query_message flag
	 * as soon as possible.
352
	 */
353
	switch (qtype)
354
	{
355
		case 'Q':				/* simple query */
356
			doing_extended_query_message = false;
357 358 359 360 361
			if (PG_PROTOCOL_MAJOR(FrontendProtocol) < 3)
			{
				/* old style without length word; convert */
				if (pq_getstring(inBuf))
				{
362 363
					ereport(COMMERROR,
							(errcode(ERRCODE_PROTOCOL_VIOLATION),
B
Bruce Momjian 已提交
364
							 errmsg("unexpected EOF on client connection")));
365 366 367
					return EOF;
				}
			}
368 369
			break;

370
		case 'F':				/* fastpath function call */
371 372
			/* we let fastpath.c cope with old-style input of this */
			doing_extended_query_message = false;
373
			break;
374

375
		case 'X':				/* terminate */
376
			doing_extended_query_message = false;
377
			ignore_till_sync = false;
378 379 380 381 382 383 384 385 386 387 388
			break;

		case 'B':				/* bind */
		case 'C':				/* close */
		case 'D':				/* describe */
		case 'E':				/* execute */
		case 'H':				/* flush */
		case 'P':				/* parse */
			doing_extended_query_message = true;
			/* these are only legal in protocol 3 */
			if (PG_PROTOCOL_MAJOR(FrontendProtocol) < 3)
389 390
				ereport(FATAL,
						(errcode(ERRCODE_PROTOCOL_VIOLATION),
B
Bruce Momjian 已提交
391
						 errmsg("invalid frontend message type %d", qtype)));
392 393 394 395 396 397 398 399 400
			break;

		case 'S':				/* sync */
			/* stop any active skip-till-Sync */
			ignore_till_sync = false;
			/* mark not-extended, so that a new error doesn't begin skip */
			doing_extended_query_message = false;
			/* only legal in protocol 3 */
			if (PG_PROTOCOL_MAJOR(FrontendProtocol) < 3)
401 402
				ereport(FATAL,
						(errcode(ERRCODE_PROTOCOL_VIOLATION),
B
Bruce Momjian 已提交
403
						 errmsg("invalid frontend message type %d", qtype)));
404
			break;
405

406 407 408
		case 'd':				/* copy data */
		case 'c':				/* copy done */
		case 'f':				/* copy fail */
409 410 411
			doing_extended_query_message = false;
			/* these are only legal in protocol 3 */
			if (PG_PROTOCOL_MAJOR(FrontendProtocol) < 3)
412 413
				ereport(FATAL,
						(errcode(ERRCODE_PROTOCOL_VIOLATION),
B
Bruce Momjian 已提交
414
						 errmsg("invalid frontend message type %d", qtype)));
415
			break;
416

417
		default:
B
Bruce Momjian 已提交
418

419
			/*
B
Bruce Momjian 已提交
420 421 422
			 * Otherwise we got garbage from the frontend.	We treat this as
			 * fatal because we have probably lost message boundary sync, and
			 * there's no good way to recover.
423
			 */
424 425 426
			ereport(FATAL,
					(errcode(ERRCODE_PROTOCOL_VIOLATION),
					 errmsg("invalid frontend message type %d", qtype)));
427
			break;
428
	}
429

430
	/*
B
Bruce Momjian 已提交
431 432 433
	 * In protocol version 3, all frontend messages have a length word next
	 * after the type code; we can read the message contents independently of
	 * the type.
434 435 436 437 438 439 440
	 */
	if (PG_PROTOCOL_MAJOR(FrontendProtocol) >= 3)
	{
		if (pq_getmessage(inBuf, 0))
			return EOF;			/* suitable message already logged */
	}

441
	return qtype;
442 443 444
}

/* ----------------
445
 *		ReadCommand reads a command from either the frontend or
446 447 448
 *		standard input, places it in inBuf, and returns the
 *		message type code (first byte of the message).
 *		EOF is returned if end of file.
449 450
 * ----------------
 */
451
static int
452
ReadCommand(StringInfo inBuf)
453
{
454
	int			result;
455

456
	if (whereToSendOutput == DestRemote)
457
		result = SocketBackend(inBuf);
458
	else
459 460
		result = InteractiveBackend(inBuf);
	return result;
461 462
}

463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478 479 480 481 482 483
/*
 * prepare_for_client_read -- set up to possibly block on client input
 *
 * This must be called immediately before any low-level read from the
 * client connection.  It is necessary to do it at a sufficiently low level
 * that there won't be any other operations except the read kernel call
 * itself between this call and the subsequent client_read_ended() call.
 * In particular there mustn't be use of malloc() or other potentially
 * non-reentrant libc functions.  This restriction makes it safe for us
 * to allow interrupt service routines to execute nontrivial code while
 * we are waiting for input.
 */
void
prepare_for_client_read(void)
{
	if (DoingCommandRead)
	{
		/* Enable immediate processing of asynchronous signals */
		EnableNotifyInterrupt();
		EnableCatchupInterrupt();

484
		/* Allow cancel/die interrupts to be processed while waiting */
485 486 487 488 489 490 491 492 493 494 495 496 497 498 499 500 501 502 503 504 505 506
		ImmediateInterruptOK = true;

		/* And don't forget to detect one that already arrived */
		CHECK_FOR_INTERRUPTS();
	}
}

/*
 * client_read_ended -- leave the client-input state
 *
 * Reverses what prepare_for_client_read() set up: immediate interrupt
 * processing is switched off first, then the notify and catchup
 * interrupts are disabled.
 */
void
client_read_ended(void)
{
	/* Nothing to undo unless this is the outer loop's command read. */
	if (!DoingCommandRead)
		return;

	ImmediateInterruptOK = false;

	DisableNotifyInterrupt();
	DisableCatchupInterrupt();
}

507 508 509 510 511 512

/*
 * Parse a query string and pass it through the rewriter.
 *
 * A list of Query nodes is returned, since the string might contain
 * multiple queries and/or the rewriter might expand one query to several.
513 514 515
 *
 * NOTE: this routine is no longer used for processing interactive queries,
 * but it is still needed for parsing of SQL function bodies.
516
 */
517
List *
B
Bruce Momjian 已提交
518
pg_parse_and_rewrite(const char *query_string,	/* string to execute */
519
					 Oid *paramTypes,	/* parameter types */
B
Bruce Momjian 已提交
520
					 int numParams)		/* number of parameters */
521
{
522
	List	   *raw_parsetree_list;
523
	List	   *querytree_list;
524
	ListCell   *list_item;
525

526 527
	/*
	 * (1) parse the request string into a list of raw parse trees.
528
	 */
529
	raw_parsetree_list = pg_parse_query(query_string);
530

531 532
	/*
	 * (2) Do parse analysis and rule rewrite.
533 534 535 536
	 */
	querytree_list = NIL;
	foreach(list_item, raw_parsetree_list)
	{
B
Bruce Momjian 已提交
537
		Node	   *parsetree = (Node *) lfirst(list_item);
538

539
		querytree_list = list_concat(querytree_list,
B
Bruce Momjian 已提交
540
									 pg_analyze_and_rewrite(parsetree,
541
															query_string,
B
Bruce Momjian 已提交
542 543
															paramTypes,
															numParams));
544 545 546 547 548 549 550 551 552 553 554 555 556 557 558 559 560 561
	}

	return querytree_list;
}

/*
 * Do raw parsing (only).
 *
 * A list of parsetrees is returned, since there might be multiple
 * commands in the given string.
 *
 * NOTE: for interactive queries, it is important to keep this routine
 * separate from the analysis & rewrite stages.  Analysis and rewriting
 * cannot be done in an aborted transaction, since they require access to
 * database tables.  So, we rely on the raw parser to determine whether
 * we've seen a COMMIT or ABORT command; when we are in abort state, other
 * commands are not processed any further than the raw parse stage.
 */
562
List *
563
pg_parse_query(const char *query_string)
564
{
565
	List	   *raw_parsetree_list;
566

567 568
	TRACE_POSTGRESQL_QUERY_PARSE_START(query_string);

B
Rename:  
Bruce Momjian 已提交
569
	if (log_parser_stats)
570 571
		ResetUsage();

572
	raw_parsetree_list = raw_parser(query_string);
573

574 575 576
	if (log_parser_stats)
		ShowUsage("PARSER STATISTICS");

577 578 579 580 581 582 583 584 585 586 587 588 589
#ifdef COPY_PARSE_PLAN_TREES
	/* Optional debugging check: pass raw parsetrees through copyObject() */
	{
		List	   *new_list = (List *) copyObject(raw_parsetree_list);

		/* This checks both copyObject() and the equal() routines... */
		if (!equal(new_list, raw_parsetree_list))
			elog(WARNING, "copyObject() failed to produce an equal raw parse tree");
		else
			raw_parsetree_list = new_list;
	}
#endif

590 591
	TRACE_POSTGRESQL_QUERY_PARSE_DONE(query_string);

592 593 594
	return raw_parsetree_list;
}

595
/*
596 597
 * Given a raw parsetree (gram.y output), and optionally information about
 * types of parameter symbols ($n), perform parse analysis and rule rewriting.
598 599 600 601 602 603
 *
 * A list of Query nodes is returned, since either the analyzer or the
 * rewriter might expand one query to several.
 *
 * NOTE: for reasons mentioned above, this must be separate from raw parsing.
 */
604
List *
605 606
pg_analyze_and_rewrite(Node *parsetree, const char *query_string,
					   Oid *paramTypes, int numParams)
607
{
608
	Query	   *query;
609 610
	List	   *querytree_list;

611 612
	TRACE_POSTGRESQL_QUERY_REWRITE_START(query_string);

613 614
	/*
	 * (1) Perform parse analysis.
615
	 */
B
Rename:  
Bruce Momjian 已提交
616
	if (log_parser_stats)
617 618
		ResetUsage();

619
	query = parse_analyze(parsetree, query_string, paramTypes, numParams);
620

B
Rename:  
Bruce Momjian 已提交
621
	if (log_parser_stats)
622
		ShowUsage("PARSE ANALYSIS STATISTICS");
623

624 625
	/*
	 * (2) Rewrite the queries, as necessary
626
	 */
627
	querytree_list = pg_rewrite_query(query);
628

629 630
	TRACE_POSTGRESQL_QUERY_REWRITE_DONE(query_string);

631 632 633
	return querytree_list;
}

634 635 636 637 638 639 640 641 642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661 662 663 664 665 666 667 668 669 670 671 672 673 674 675 676 677 678 679
/*
 * Parse analysis and rewriting, with hook-driven parameter resolution.
 *
 * This matches pg_analyze_and_rewrite, except that external parameters
 * are resolved through parser callback hooks rather than from a fixed
 * list of parameter datatypes.
 */
List *
pg_analyze_and_rewrite_params(Node *parsetree,
							  const char *query_string,
							  ParserSetupHook parserSetup,
							  void *parserSetupArg)
{
	ParseState *parse_state;
	Query	   *analyzed;
	List	   *rewritten;

	Assert(query_string != NULL); /* required as of 8.4 */

	TRACE_POSTGRESQL_QUERY_REWRITE_START(query_string);

	/* Step 1: parse analysis. */
	if (log_parser_stats)
		ResetUsage();

	/* Build a parse state and let the caller's hook configure it. */
	parse_state = make_parsestate(NULL);
	parse_state->p_sourcetext = query_string;
	(*parserSetup) (parse_state, parserSetupArg);

	analyzed = transformStmt(parse_state, parsetree);

	free_parsestate(parse_state);

	if (log_parser_stats)
		ShowUsage("PARSE ANALYSIS STATISTICS");

	/* Step 2: rewrite the query as needed. */
	rewritten = pg_rewrite_query(analyzed);

	TRACE_POSTGRESQL_QUERY_REWRITE_DONE(query_string);

	return rewritten;
}

680
/*
681
 * Perform rewriting of a query produced by parse analysis.
682
 *
683 684
 * Note: query must just have come from the parser, because we do not do
 * AcquireRewriteLocks() on it.
685
 */
686
static List *
687
pg_rewrite_query(Query *query)
688
{
689
	List	   *querytree_list;
690

691
	if (Debug_print_parse)
692
		elog_node_display(LOG, "parse tree", query,
693
						  Debug_pretty_print);
694

695 696 697
	if (log_parser_stats)
		ResetUsage();

698 699 700 701 702 703 704 705 706
	if (query->commandType == CMD_UTILITY)
	{
		/* don't rewrite utilities, just dump 'em into result list */
		querytree_list = list_make1(query);
	}
	else
	{
		/* rewrite regular queries */
		querytree_list = QueryRewrite(query);
707 708
	}

B
Rename:  
Bruce Momjian 已提交
709
	if (log_parser_stats)
710
		ShowUsage("REWRITER STATISTICS");
711

712
#ifdef COPY_PARSE_PLAN_TREES
713 714 715
	/* Optional debugging check: pass querytree output through copyObject() */
	{
		List	   *new_list;
B
Bruce Momjian 已提交
716

717 718 719 720 721 722 723
		new_list = (List *) copyObject(querytree_list);
		/* This checks both copyObject() and the equal() routines... */
		if (!equal(new_list, querytree_list))
			elog(WARNING, "copyObject() failed to produce equal parse tree");
		else
			querytree_list = new_list;
	}
724 725
#endif

726
	if (Debug_print_rewritten)
727
		elog_node_display(LOG, "rewritten parse tree", querytree_list,
728
						  Debug_pretty_print);
729

730 731
	return querytree_list;
}
732 733


734 735 736 737
/*
 * Generate a plan for a single already-rewritten query.
 * This is a thin wrapper around planner() and takes the same parameters.
 */
738
PlannedStmt *
739
pg_plan_query(Query *querytree, int cursorOptions, ParamListInfo boundParams)
740
{
741
	PlannedStmt *plan;
742

743 744 745
	/* Utility commands have no plans. */
	if (querytree->commandType == CMD_UTILITY)
		return NULL;
746

747 748 749
	/* Planner must have a snapshot in case it calls user-defined functions. */
	Assert(ActiveSnapshotSet());

750 751
	TRACE_POSTGRESQL_QUERY_PLAN_START();

B
Rename:  
Bruce Momjian 已提交
752
	if (log_planner_stats)
753
		ResetUsage();
754

755
	/* call the optimizer */
756
	plan = planner(querytree, cursorOptions, boundParams);
757

B
Rename:  
Bruce Momjian 已提交
758
	if (log_planner_stats)
759
		ShowUsage("PLANNER STATISTICS");
760

761 762 763
#ifdef COPY_PARSE_PLAN_TREES
	/* Optional debugging check: pass plan output through copyObject() */
	{
764
		PlannedStmt *new_plan = (PlannedStmt *) copyObject(plan);
765

B
Bruce Momjian 已提交
766
		/*
B
Bruce Momjian 已提交
767 768
		 * equal() currently does not have routines to compare Plan nodes, so
		 * don't try to test equality here.  Perhaps fix someday?
769 770 771
		 */
#ifdef NOT_USED
		/* This checks both copyObject() and the equal() routines... */
B
Bruce Momjian 已提交
772
		if (!equal(new_plan, plan))
773
			elog(WARNING, "copyObject() failed to produce an equal plan tree");
774 775 776 777 778 779
		else
#endif
			plan = new_plan;
	}
#endif

780 781
	/*
	 * Print plan if debugging.
782
	 */
783
	if (Debug_print_plan)
784
		elog_node_display(LOG, "plan", plan, Debug_pretty_print);
785

786 787
	TRACE_POSTGRESQL_QUERY_PLAN_DONE();

788
	return plan;
789 790
}

791 792
/*
 * Generate plans for a list of already-rewritten queries.
793
 *
794 795
 * Normal optimizable statements generate PlannedStmt entries in the result
 * list.  Utility statements are simply represented by their statement nodes.
796 797
 */
List *
798
pg_plan_queries(List *querytrees, int cursorOptions, ParamListInfo boundParams)
799
{
800 801
	List	   *stmt_list = NIL;
	ListCell   *query_list;
802

803
	foreach(query_list, querytrees)
804
	{
805 806
		Query	   *query = (Query *) lfirst(query_list);
		Node	   *stmt;
807

808
		if (query->commandType == CMD_UTILITY)
809
		{
810 811 812 813 814
			/* Utility commands have no plans. */
			stmt = query->utilityStmt;
		}
		else
		{
815
			stmt = (Node *) pg_plan_query(query, cursorOptions, boundParams);
816 817
		}

818
		stmt_list = lappend(stmt_list, stmt);
819
	}
820

821
	return stmt_list;
822 823 824 825
}


/*
826
 * exec_simple_query
827
 *
828
 * Execute a "simple Query" protocol message.
829
 */
830
static void
831
exec_simple_query(const char *query_string)
832
{
B
Bruce Momjian 已提交
833
	CommandDest dest = whereToSendOutput;
834
	MemoryContext oldcontext;
835 836
	List	   *parsetree_list;
	ListCell   *parsetree_item;
837
	bool		save_log_statement_stats = log_statement_stats;
838
	bool		was_logged = false;
839
	bool		isTopLevel;
840
	char		msec_str[32];
B
Bruce Momjian 已提交
841

842

843 844 845
	/*
	 * Report query to various monitoring facilities.
	 */
846
	debug_query_string = query_string;
847

848 849
	pgstat_report_activity(query_string);

850 851
	TRACE_POSTGRESQL_QUERY_START(query_string);

852
	/*
853 854
	 * We use save_log_statement_stats so ShowUsage doesn't report incorrect
	 * results because ResetUsage wasn't called.
855
	 */
856 857 858
	if (save_log_statement_stats)
		ResetUsage();

859
	/*
B
Bruce Momjian 已提交
860 861
	 * Start up a transaction command.	All queries generated by the
	 * query_string will be in this same command block, *unless* we find a
B
Bruce Momjian 已提交
862 863 864
	 * BEGIN/COMMIT/ABORT statement; we have to force a new xact command after
	 * one of those, else bad things will happen in xact.c. (Note that this
	 * will normally change current memory context.)
865
	 */
866
	start_xact_command();
867 868

	/*
B
Bruce Momjian 已提交
869 870 871 872
	 * Zap any pre-existing unnamed statement.	(While not strictly necessary,
	 * it seems best to define simple-Query mode as if it used the unnamed
	 * statement and portal; this ensures we recover any storage used by prior
	 * unnamed operations.)
873
	 */
874
	drop_unnamed_stmt();
875

876 877 878
	/*
	 * Switch to appropriate context for constructing parsetrees.
	 */
879
	oldcontext = MemoryContextSwitchTo(MessageContext);
880

B
Bruce Momjian 已提交
881
	/*
B
Bruce Momjian 已提交
882 883
	 * Do basic parsing of the query or queries (this should be safe even if
	 * we are in aborted transaction state!)
884
	 */
885
	parsetree_list = pg_parse_query(query_string);
886

887
	/* Log immediately if dictated by log_statement */
888
	if (check_log_statement(parsetree_list))
889 890 891
	{
		ereport(LOG,
				(errmsg("statement: %s", query_string),
892
				 errhidestmt(true),
893 894 895
				 errdetail_execute(parsetree_list)));
		was_logged = true;
	}
896

897
	/*
898
	 * Switch back to transaction context to enter the loop.
899 900 901
	 */
	MemoryContextSwitchTo(oldcontext);

902
	/*
B
Bruce Momjian 已提交
903 904 905 906
	 * We'll tell PortalRun it's a top-level command iff there's exactly one
	 * raw parsetree.  If more than one, it's effectively a transaction block
	 * and we want PreventTransactionChain to reject unsafe commands. (Note:
	 * we're assuming that query rewrite cannot add commands that are
907 908 909 910
	 * significant to PreventTransactionChain.)
	 */
	isTopLevel = (list_length(parsetree_list) == 1);

911
	/*
912
	 * Run through the raw parsetree(s) and process each one.
913
	 */
914
	foreach(parsetree_item, parsetree_list)
915
	{
B
Bruce Momjian 已提交
916
		Node	   *parsetree = (Node *) lfirst(parsetree_item);
917
		bool		snapshot_set = false;
918 919
		const char *commandTag;
		char		completionTag[COMPLETION_TAG_BUFSIZE];
B
Bruce Momjian 已提交
920
		List	   *querytree_list,
921 922
				   *plantree_list;
		Portal		portal;
923 924
		DestReceiver *receiver;
		int16		format;
925

926
		/*
B
Bruce Momjian 已提交
927 928 929 930
		 * Get the command name for use in status display (it also becomes the
		 * default completion tag, down inside PortalRun).	Set ps_status and
		 * do any special start-of-SQL-command processing needed by the
		 * destination.
931 932 933
		 */
		commandTag = CreateCommandTag(parsetree);

934
		set_ps_display(commandTag, false);
935

936
		BeginCommand(commandTag, dest);
937

938
		/*
939
		 * If we are in an aborted transaction, reject all commands except
B
Bruce Momjian 已提交
940 941 942 943 944
		 * COMMIT/ABORT.  It is important that this test occur before we try
		 * to do parse analysis, rewrite, or planning, since all those phases
		 * try to do database accesses, which may fail in abort state. (It
		 * might be safe to allow some additional utility commands in this
		 * state, but not many...)
945
		 */
946 947 948 949 950
		if (IsAbortedTransactionBlockState() &&
			!IsTransactionExitStmt(parsetree))
			ereport(ERROR,
					(errcode(ERRCODE_IN_FAILED_SQL_TRANSACTION),
					 errmsg("current transaction is aborted, "
951 952
							"commands ignored until end of transaction block"),
					 errdetail_abort()));
953

954
		/* Make sure we are in a transaction command */
955
		start_xact_command();
956

957
		/* If we got a cancel signal in parsing or prior command, quit */
958
		CHECK_FOR_INTERRUPTS();
959

960 961 962 963 964 965 966 967 968
		/*
		 * Set up a snapshot if parse analysis/planning will need one.
		 */
		if (analyze_requires_snapshot(parsetree))
		{
			PushActiveSnapshot(GetTransactionSnapshot());
			snapshot_set = true;
		}

969
		/*
970
		 * OK to analyze, rewrite, and plan this query.
971
		 *
B
Bruce Momjian 已提交
972 973
		 * Switch to appropriate context for constructing querytrees (again,
		 * these must outlive the execution context).
974
		 */
975
		oldcontext = MemoryContextSwitchTo(MessageContext);
976

977 978
		querytree_list = pg_analyze_and_rewrite(parsetree, query_string,
												NULL, 0);
V
Vadim B. Mikheev 已提交
979

980
		plantree_list = pg_plan_queries(querytree_list, 0, NULL);
981 982 983 984

		/* Done with the snapshot used for parsing/planning */
		if (snapshot_set)
			PopActiveSnapshot();
985 986 987 988

		/* If we got a cancel signal in analysis or planning, quit */
		CHECK_FOR_INTERRUPTS();

989
		/*
B
Bruce Momjian 已提交
990 991
		 * Create unnamed portal to run the query or queries in. If there
		 * already is one, silently drop it.
992
		 */
993
		portal = CreatePortal("", true, true);
994 995
		/* Don't display the portal in pg_cursors */
		portal->visible = false;
996

997 998
		/*
		 * We don't have to copy anything into the portal, because everything
999
		 * we are passing here is in MessageContext, which will outlive the
1000 1001
		 * portal anyway.
		 */
1002
		PortalDefineQuery(portal,
1003
						  NULL,
1004 1005 1006
						  query_string,
						  commandTag,
						  plantree_list,
1007
						  NULL);
1008

1009
		/*
1010
		 * Start the portal.  No parameters here.
1011
		 */
1012
		PortalStart(portal, NULL, InvalidSnapshot);
1013

1014
		/*
B
Bruce Momjian 已提交
1015 1016 1017 1018
		 * Select the appropriate output format: text unless we are doing a
		 * FETCH from a binary cursor.	(Pretty grotty to have to do this here
		 * --- but it avoids grottiness in other places.  Ah, the joys of
		 * backward compatibility...)
1019 1020 1021 1022 1023 1024 1025 1026 1027 1028 1029 1030
		 */
		format = 0;				/* TEXT is default */
		if (IsA(parsetree, FetchStmt))
		{
			FetchStmt  *stmt = (FetchStmt *) parsetree;

			if (!stmt->ismove)
			{
				Portal		fportal = GetPortalByName(stmt->portalname);

				if (PortalIsValid(fportal) &&
					(fportal->cursorOptions & CURSOR_OPT_BINARY))
B
Bruce Momjian 已提交
1031
					format = 1; /* BINARY */
1032 1033 1034 1035 1036 1037 1038
			}
		}
		PortalSetResultFormat(portal, 1, &format);

		/*
		 * Now we can create the destination receiver object.
		 */
1039 1040 1041
		receiver = CreateDestReceiver(dest);
		if (dest == DestRemote)
			SetRemoteDestReceiverParams(receiver, portal);
1042 1043 1044 1045 1046 1047 1048

		/*
		 * Switch back to transaction context for execution.
		 */
		MemoryContextSwitchTo(oldcontext);

		/*
B
Bruce Momjian 已提交
1049
		 * Run the portal to completion, and then drop it (and the receiver).
1050
		 */
1051 1052
		(void) PortalRun(portal,
						 FETCH_ALL,
1053
						 isTopLevel,
1054 1055
						 receiver,
						 receiver,
1056
						 completionTag);
1057

1058
		(*receiver->rDestroy) (receiver);
1059

1060
		PortalDrop(portal, false);
1061

1062
		if (IsA(parsetree, TransactionStmt))
1063
		{
1064
			/*
B
Bruce Momjian 已提交
1065 1066
			 * If this was a transaction control statement, commit it. We will
			 * start a new xact command for the next command (if any).
1067
			 */
1068
			finish_xact_command();
1069
		}
1070
		else if (lnext(parsetree_item) == NULL)
1071
		{
1072
			/*
B
Bruce Momjian 已提交
1073 1074 1075 1076 1077 1078 1079 1080
			 * If this is the last parsetree of the query string, close down
			 * transaction statement before reporting command-complete.  This
			 * is so that any end-of-transaction errors are reported before
			 * the command-complete message is issued, to avoid confusing
			 * clients who will expect either a command-complete message or an
			 * error, not one and then the other.  But for compatibility with
			 * historical Postgres behavior, we do not force a transaction
			 * boundary between queries appearing in a single query string.
1081
			 */
1082
			finish_xact_command();
1083
		}
1084
		else
1085
		{
1086
			/*
B
Bruce Momjian 已提交
1087 1088
			 * We need a CommandCounterIncrement after every query, except
			 * those that start or end a transaction block.
1089 1090
			 */
			CommandCounterIncrement();
1091
		}
1092 1093

		/*
B
Bruce Momjian 已提交
1094 1095 1096 1097
		 * Tell client that we're done with this query.  Note we emit exactly
		 * one EndCommand report for each raw parsetree, thus one for each SQL
		 * command the client sent, regardless of rewriting. (But a command
		 * aborted by error will not send an EndCommand report at all.)
1098
		 */
1099
		EndCommand(completionTag, dest);
B
Bruce Momjian 已提交
1100
	}							/* end loop over parsetrees */
1101

1102 1103 1104
	/*
	 * Close down transaction statement, if one is open.
	 */
1105
	finish_xact_command();
1106

1107 1108 1109
	/*
	 * If there were no parsetrees, return EmptyQueryResponse message.
	 */
1110
	if (!parsetree_list)
1111 1112
		NullCommand(dest);

1113
	/*
1114
	 * Emit duration logging if appropriate.
1115
	 */
1116
	switch (check_log_duration(msec_str, was_logged))
1117
	{
1118
		case 1:
1119
			ereport(LOG,
1120 1121
					(errmsg("duration: %s ms", msec_str),
					 errhidestmt(true)));
1122 1123
			break;
		case 2:
1124 1125 1126
			ereport(LOG,
					(errmsg("duration: %s ms  statement: %s",
							msec_str, query_string),
1127
					 errhidestmt(true),
1128
					 errdetail_execute(parsetree_list)));
1129
			break;
1130
	}
1131

1132 1133 1134
	if (save_log_statement_stats)
		ShowUsage("QUERY STATISTICS");

1135 1136
	TRACE_POSTGRESQL_QUERY_DONE(query_string);

1137
	debug_query_string = NULL;
1138 1139
}

1140 1141 1142 1143 1144 1145 1146 1147
/*
 * exec_parse_message
 *
 * Execute a "Parse" protocol message.
 */
static void
exec_parse_message(const char *query_string,	/* string to execute */
				   const char *stmt_name,		/* name for prepared stmt */
B
Bruce Momjian 已提交
1148 1149
				   Oid *paramTypes,		/* parameter types */
				   int numParams)		/* number of parameters */
1150 1151 1152
{
	MemoryContext oldcontext;
	List	   *parsetree_list;
1153
	Node	   *raw_parse_tree;
1154 1155
	const char *commandTag;
	List	   *querytree_list,
1156
			   *stmt_list;
1157
	bool		is_named;
1158
	bool		fully_planned;
1159
	bool		save_log_statement_stats = log_statement_stats;
1160
	char		msec_str[32];
1161 1162 1163 1164 1165 1166 1167 1168

	/*
	 * Report query to various monitoring facilities.
	 */
	debug_query_string = query_string;

	pgstat_report_activity(query_string);

1169
	set_ps_display("PARSE", false);
1170 1171 1172 1173

	if (save_log_statement_stats)
		ResetUsage();

1174 1175 1176 1177
	ereport(DEBUG2,
			(errmsg("parse %s: %s",
					*stmt_name ? stmt_name : "<unnamed>",
					query_string)));
1178

1179
	/*
B
Bruce Momjian 已提交
1180 1181 1182
	 * Start up a transaction command so we can run parse analysis etc. (Note
	 * that this will normally change current memory context.) Nothing happens
	 * if we are already in one.
1183
	 */
1184
	start_xact_command();
1185 1186 1187 1188

	/*
	 * Switch to appropriate context for constructing parsetrees.
	 *
B
Bruce Momjian 已提交
1189 1190 1191
	 * We have two strategies depending on whether the prepared statement is
	 * named or not.  For a named prepared statement, we do parsing in
	 * MessageContext and copy the finished trees into the prepared
1192
	 * statement's plancache entry; then the reset of MessageContext releases
B
Bruce Momjian 已提交
1193 1194 1195
	 * temporary space used by parsing and planning.  For an unnamed prepared
	 * statement, we assume the statement isn't going to hang around long, so
	 * getting rid of temp space quickly is probably not worth the costs of
1196 1197
	 * copying parse/plan trees.  So in this case, we create the plancache
	 * entry's context here, and do all the parsing work therein.
1198 1199 1200 1201 1202 1203 1204 1205 1206 1207
	 */
	is_named = (stmt_name[0] != '\0');
	if (is_named)
	{
		/* Named prepared statement --- parse in MessageContext */
		oldcontext = MemoryContextSwitchTo(MessageContext);
	}
	else
	{
		/* Unnamed prepared statement --- release any prior unnamed stmt */
1208 1209
		drop_unnamed_stmt();
		/* Create context for parsing/planning */
1210
		unnamed_stmt_context =
1211
			AllocSetContextCreate(CacheMemoryContext,
1212 1213 1214 1215 1216 1217 1218 1219
								  "unnamed prepared statement",
								  ALLOCSET_DEFAULT_MINSIZE,
								  ALLOCSET_DEFAULT_INITSIZE,
								  ALLOCSET_DEFAULT_MAXSIZE);
		oldcontext = MemoryContextSwitchTo(unnamed_stmt_context);
	}

	/*
B
Bruce Momjian 已提交
1220 1221
	 * Do basic parsing of the query or queries (this should be safe even if
	 * we are in aborted transaction state!)
1222 1223 1224 1225
	 */
	parsetree_list = pg_parse_query(query_string);

	/*
B
Bruce Momjian 已提交
1226 1227 1228
	 * We only allow a single user statement in a prepared statement. This is
	 * mainly to keep the protocol simple --- otherwise we'd need to worry
	 * about multiple result tupdescs and things like that.
1229
	 */
1230
	if (list_length(parsetree_list) > 1)
1231 1232
		ereport(ERROR,
				(errcode(ERRCODE_SYNTAX_ERROR),
B
Bruce Momjian 已提交
1233
		errmsg("cannot insert multiple commands into a prepared statement")));
1234 1235 1236

	if (parsetree_list != NIL)
	{
1237
		Query	   *query;
1238
		bool		snapshot_set = false;
B
Bruce Momjian 已提交
1239
		int			i;
1240

1241 1242
		raw_parse_tree = (Node *) linitial(parsetree_list);

1243 1244 1245
		/*
		 * Get the command name for possible use in status display.
		 */
1246
		commandTag = CreateCommandTag(raw_parse_tree);
1247 1248 1249

		/*
		 * If we are in an aborted transaction, reject all commands except
B
Bruce Momjian 已提交
1250 1251 1252 1253 1254
		 * COMMIT/ROLLBACK.  It is important that this test occur before we
		 * try to do parse analysis, rewrite, or planning, since all those
		 * phases try to do database accesses, which may fail in abort state.
		 * (It might be safe to allow some additional utility commands in this
		 * state, but not many...)
1255
		 */
1256
		if (IsAbortedTransactionBlockState() &&
1257
			!IsTransactionExitStmt(raw_parse_tree))
1258 1259 1260
			ereport(ERROR,
					(errcode(ERRCODE_IN_FAILED_SQL_TRANSACTION),
					 errmsg("current transaction is aborted, "
1261 1262
							"commands ignored until end of transaction block"),
					 errdetail_abort()));
1263

1264 1265 1266 1267 1268 1269 1270 1271 1272
		/*
		 * Set up a snapshot if parse analysis/planning will need one.
		 */
		if (analyze_requires_snapshot(raw_parse_tree))
		{
			PushActiveSnapshot(GetTransactionSnapshot());
			snapshot_set = true;
		}

1273 1274
		/*
		 * OK to analyze, rewrite, and plan this query.  Note that the
B
Bruce Momjian 已提交
1275 1276
		 * originally specified parameter set is not required to be complete,
		 * so we have to use parse_analyze_varparams().
1277
		 *
B
Bruce Momjian 已提交
1278 1279
		 * XXX must use copyObject here since parse analysis scribbles on its
		 * input, and we need the unmodified raw parse tree for possible
1280
		 * replanning later.
1281 1282 1283 1284
		 */
		if (log_parser_stats)
			ResetUsage();

1285 1286 1287 1288
		query = parse_analyze_varparams(copyObject(raw_parse_tree),
										query_string,
										&paramTypes,
										&numParams);
1289 1290

		/*
1291
		 * Check all parameter types got determined.
1292 1293 1294
		 */
		for (i = 0; i < numParams; i++)
		{
B
Bruce Momjian 已提交
1295
			Oid			ptype = paramTypes[i];
1296 1297

			if (ptype == InvalidOid || ptype == UNKNOWNOID)
1298 1299
				ereport(ERROR,
						(errcode(ERRCODE_INDETERMINATE_DATATYPE),
B
Bruce Momjian 已提交
1300 1301
					 errmsg("could not determine data type of parameter $%d",
							i + 1)));
1302 1303 1304 1305 1306
		}

		if (log_parser_stats)
			ShowUsage("PARSE ANALYSIS STATISTICS");

1307
		querytree_list = pg_rewrite_query(query);
1308

1309
		/*
B
Bruce Momjian 已提交
1310 1311
		 * If this is the unnamed statement and it has parameters, defer query
		 * planning until Bind.  Otherwise do it now.
1312 1313
		 */
		if (!is_named && numParams > 0)
1314 1315 1316 1317
		{
			stmt_list = querytree_list;
			fully_planned = false;
		}
1318
		else
1319
		{
1320
			stmt_list = pg_plan_queries(querytree_list, 0, NULL);
1321 1322
			fully_planned = true;
		}
1323 1324 1325 1326

		/* Done with the snapshot used for parsing/planning */
		if (snapshot_set)
			PopActiveSnapshot();
1327 1328 1329
	}
	else
	{
B
Bruce Momjian 已提交
1330
		/* Empty input string.	This is legal. */
1331
		raw_parse_tree = NULL;
1332
		commandTag = NULL;
1333 1334
		stmt_list = NIL;
		fully_planned = true;
1335 1336 1337 1338 1339 1340 1341 1342 1343 1344 1345
	}

	/* If we got a cancel signal in analysis or planning, quit */
	CHECK_FOR_INTERRUPTS();

	/*
	 * Store the query as a prepared statement.  See above comments.
	 */
	if (is_named)
	{
		StorePreparedStatement(stmt_name,
1346
							   raw_parse_tree,
1347 1348
							   query_string,
							   commandTag,
1349 1350
							   paramTypes,
							   numParams,
B
Bruce Momjian 已提交
1351
							   0,		/* default cursor options */
1352
							   stmt_list,
1353
							   false);
1354 1355 1356
	}
	else
	{
1357 1358 1359 1360
		/*
		 * paramTypes and query_string need to be copied into
		 * unnamed_stmt_context.  The rest is there already
		 */
B
Bruce Momjian 已提交
1361
		Oid		   *newParamTypes;
1362 1363 1364 1365 1366 1367 1368 1369 1370

		if (numParams > 0)
		{
			newParamTypes = (Oid *) palloc(numParams * sizeof(Oid));
			memcpy(newParamTypes, paramTypes, numParams * sizeof(Oid));
		}
		else
			newParamTypes = NULL;

1371 1372 1373
		unnamed_stmt_psrc = FastCreateCachedPlan(raw_parse_tree,
												 pstrdup(query_string),
												 commandTag,
1374
												 newParamTypes,
1375
												 numParams,
B
Bruce Momjian 已提交
1376
												 0,		/* cursor options */
1377 1378 1379 1380 1381 1382
												 stmt_list,
												 fully_planned,
												 true,
												 unnamed_stmt_context);
		/* context now belongs to the plancache entry */
		unnamed_stmt_context = NULL;
1383 1384 1385 1386 1387
	}

	MemoryContextSwitchTo(oldcontext);

	/*
B
Bruce Momjian 已提交
1388 1389 1390
	 * We do NOT close the open transaction command here; that only happens
	 * when the client sends Sync.	Instead, do CommandCounterIncrement just
	 * in case something happened during parse/plan.
1391 1392 1393 1394 1395 1396
	 */
	CommandCounterIncrement();

	/*
	 * Send ParseComplete.
	 */
1397
	if (whereToSendOutput == DestRemote)
1398 1399
		pq_putemptymessage('1');

1400 1401 1402
	/*
	 * Emit duration logging if appropriate.
	 */
1403 1404 1405 1406
	switch (check_log_duration(msec_str, false))
	{
		case 1:
			ereport(LOG,
1407 1408
					(errmsg("duration: %s ms", msec_str),
					 errhidestmt(true)));
1409 1410 1411 1412 1413 1414
			break;
		case 2:
			ereport(LOG,
					(errmsg("duration: %s ms  parse %s: %s",
							msec_str,
							*stmt_name ? stmt_name : "<unnamed>",
1415 1416
							query_string),
					 errhidestmt(true)));
1417 1418
			break;
	}
1419

1420 1421 1422 1423 1424 1425 1426 1427 1428 1429 1430 1431 1432 1433 1434 1435
	if (save_log_statement_stats)
		ShowUsage("PARSE MESSAGE STATISTICS");

	debug_query_string = NULL;
}

/*
 * exec_bind_message
 *
 * Process a "Bind" message to create a portal from a prepared statement
 *
 * The message is read in this order: portal name, statement name, parameter
 * format codes, parameter values, result format codes.  Parameter values
 * are converted with the type's text input or binary receive function and
 * stored in the new portal's memory context.  If the statement was not
 * planned at Parse time, it is planned here using the actual parameter
 * values.  On success a BindComplete message is sent (when output goes to a
 * remote client) and duration logging is emitted if configured.
 */
static void
exec_bind_message(StringInfo input_message)
{
	const char *portal_name;
	const char *stmt_name;
	int			numPFormats;
	int16	   *pformats = NULL;
	int			numParams;
	int			numRFormats;
	int16	   *rformats = NULL;
	CachedPlanSource *psrc;
	CachedPlan *cplan;
	Portal		portal;
	char	   *query_string;
	char	   *saved_stmt_name;
	ParamListInfo params;
	List	   *plan_list;
	MemoryContext oldContext;
	bool		save_log_statement_stats = log_statement_stats;
	bool		snapshot_set = false;
	char		msec_str[32];

	/* Get the fixed part of the message */
	portal_name = pq_getmsgstring(input_message);
	stmt_name = pq_getmsgstring(input_message);

	ereport(DEBUG2,
			(errmsg("bind %s to %s",
					*portal_name ? portal_name : "<unnamed>",
					*stmt_name ? stmt_name : "<unnamed>")));

	/* Find prepared statement */
	if (stmt_name[0] != '\0')
	{
		PreparedStatement *pstmt;

		pstmt = FetchPreparedStatement(stmt_name, true);
		psrc = pstmt->plansource;
	}
	else
	{
		/* Unnamed statements are re-prepared for every bind */
		psrc = unnamed_stmt_psrc;
		if (!psrc)
			ereport(ERROR,
					(errcode(ERRCODE_UNDEFINED_PSTATEMENT),
					 errmsg("unnamed prepared statement does not exist")));
	}

	/*
	 * Report query to various monitoring facilities.
	 */
	debug_query_string = psrc->query_string;

	pgstat_report_activity(psrc->query_string);

	set_ps_display("BIND", false);

	if (save_log_statement_stats)
		ResetUsage();

	/*
	 * Start up a transaction command so we can call functions etc. (Note that
	 * this will normally change current memory context.) Nothing happens if
	 * we are already in one.
	 */
	start_xact_command();

	/* Switch back to message context */
	MemoryContextSwitchTo(MessageContext);

	/* Get the parameter format codes */
	numPFormats = pq_getmsgint(input_message, 2);
	if (numPFormats > 0)
	{
		int			i;

		pformats = (int16 *) palloc(numPFormats * sizeof(int16));
		for (i = 0; i < numPFormats; i++)
			pformats[i] = pq_getmsgint(input_message, 2);
	}

	/* Get the parameter value count */
	numParams = pq_getmsgint(input_message, 2);

	/* Zero or one format code applies to all params; otherwise must match */
	if (numPFormats > 1 && numPFormats != numParams)
		ereport(ERROR,
				(errcode(ERRCODE_PROTOCOL_VIOLATION),
			errmsg("bind message has %d parameter formats but %d parameters",
				   numPFormats, numParams)));

	if (numParams != psrc->num_params)
		ereport(ERROR,
				(errcode(ERRCODE_PROTOCOL_VIOLATION),
				 errmsg("bind message supplies %d parameters, but prepared statement \"%s\" requires %d",
						numParams, stmt_name, psrc->num_params)));

	/*
	 * If we are in aborted transaction state, the only portals we can
	 * actually run are those containing COMMIT or ROLLBACK commands. We
	 * disallow binding anything else to avoid problems with infrastructure
	 * that expects to run inside a valid transaction.  We also disallow
	 * binding any parameters, since we can't risk calling user-defined I/O
	 * functions.
	 */
	if (IsAbortedTransactionBlockState() &&
		(!IsTransactionExitStmt(psrc->raw_parse_tree) ||
		 numParams != 0))
		ereport(ERROR,
				(errcode(ERRCODE_IN_FAILED_SQL_TRANSACTION),
				 errmsg("current transaction is aborted, "
						"commands ignored until end of transaction block"),
				 errdetail_abort()));

	/*
	 * Create the portal.  Allow silent replacement of an existing portal only
	 * if the unnamed portal is specified.
	 */
	if (portal_name[0] == '\0')
		portal = CreatePortal(portal_name, true, true);
	else
		portal = CreatePortal(portal_name, false, false);

	/*
	 * Prepare to copy stuff into the portal's memory context.  We do all this
	 * copying first, because it could possibly fail (out-of-memory) and we
	 * don't want a failure to occur between RevalidateCachedPlan and
	 * PortalDefineQuery; that would result in leaking our plancache refcount.
	 */
	oldContext = MemoryContextSwitchTo(PortalGetHeapMemory(portal));

	/* Copy the plan's query string into the portal */
	query_string = pstrdup(psrc->query_string);

	/* Likewise make a copy of the statement name, unless it's unnamed */
	if (stmt_name[0])
		saved_stmt_name = pstrdup(stmt_name);
	else
		saved_stmt_name = NULL;

	/*
	 * Set a snapshot if we have parameters to fetch (since the input
	 * functions might need it) or the query isn't a utility command (and
	 * hence could require redoing parse analysis and planning).
	 */
	if (numParams > 0 || analyze_requires_snapshot(psrc->raw_parse_tree))
	{
		PushActiveSnapshot(GetTransactionSnapshot());
		snapshot_set = true;
	}

	/*
	 * Fetch parameters, if any, and store in the portal's memory context.
	 */
	if (numParams > 0)
	{
		int			paramno;

		/* sizeof(ParamListInfoData) includes the first array element */
		params = (ParamListInfo) palloc(sizeof(ParamListInfoData) +
								   (numParams - 1) * sizeof(ParamExternData));
		/* we have static list of params, so no hooks needed */
		params->paramFetch = NULL;
		params->paramFetchArg = NULL;
		params->parserSetup = NULL;
		params->parserSetupArg = NULL;
		params->numParams = numParams;

		for (paramno = 0; paramno < numParams; paramno++)
		{
			Oid			ptype = psrc->param_types[paramno];
			int32		plength;
			Datum		pval;
			bool		isNull;
			StringInfoData pbuf;
			char		csave;
			int16		pformat;

			/* A length of -1 denotes a NULL parameter value */
			plength = pq_getmsgint(input_message, 4);
			isNull = (plength == -1);

			if (!isNull)
			{
				const char *pvalue = pq_getmsgbytes(input_message, plength);

				/*
				 * Rather than copying data around, we just set up a phony
				 * StringInfo pointing to the correct portion of the message
				 * buffer.  We assume we can scribble on the message buffer so
				 * as to maintain the convention that StringInfos have a
				 * trailing null.  This is grotty but is a big win when
				 * dealing with very large parameter strings.
				 */
				pbuf.data = (char *) pvalue;
				pbuf.maxlen = plength + 1;
				pbuf.len = plength;
				pbuf.cursor = 0;

				/* Save the byte we overwrite; it is restored further down */
				csave = pbuf.data[plength];
				pbuf.data[plength] = '\0';
			}
			else
			{
				pbuf.data = NULL;		/* keep compiler quiet */
				csave = 0;
			}

			if (numPFormats > 1)
				pformat = pformats[paramno];
			else if (numPFormats > 0)
				pformat = pformats[0];
			else
				pformat = 0;	/* default = text */

			if (pformat == 0)	/* text mode */
			{
				Oid			typinput;
				Oid			typioparam;
				char	   *pstring;

				getTypeInputInfo(ptype, &typinput, &typioparam);

				/*
				 * We have to do encoding conversion before calling the
				 * typinput routine.
				 */
				if (isNull)
					pstring = NULL;
				else
					pstring = pg_client_to_server(pbuf.data, plength);

				pval = OidInputFunctionCall(typinput, pstring, typioparam, -1);

				/* Free result of encoding conversion, if any */
				if (pstring && pstring != pbuf.data)
					pfree(pstring);
			}
			else if (pformat == 1)		/* binary mode */
			{
				Oid			typreceive;
				Oid			typioparam;
				StringInfo	bufptr;

				/*
				 * Call the parameter type's binary input converter
				 */
				getTypeBinaryInputInfo(ptype, &typreceive, &typioparam);

				if (isNull)
					bufptr = NULL;
				else
					bufptr = &pbuf;

				pval = OidReceiveFunctionCall(typreceive, bufptr, typioparam, -1);

				/* Trouble if it didn't eat the whole buffer */
				if (!isNull && pbuf.cursor != pbuf.len)
					ereport(ERROR,
							(errcode(ERRCODE_INVALID_BINARY_REPRESENTATION),
							 errmsg("incorrect binary data format in bind parameter %d",
									paramno + 1)));
			}
			else
			{
				ereport(ERROR,
						(errcode(ERRCODE_INVALID_PARAMETER_VALUE),
						 errmsg("unsupported format code: %d",
								pformat)));
				pval = 0;		/* keep compiler quiet */
			}

			/* Restore message buffer contents */
			if (!isNull)
				pbuf.data[plength] = csave;

			params->params[paramno].value = pval;
			params->params[paramno].isnull = isNull;

			/*
			 * We mark the params as CONST.  This has no effect if we already
			 * did planning, but if we didn't, it licenses the planner to
			 * substitute the parameters directly into the one-shot plan we
			 * will generate below.
			 */
			params->params[paramno].pflags = PARAM_FLAG_CONST;
			params->params[paramno].ptype = ptype;
		}
	}
	else
		params = NULL;

	/* Done storing stuff in portal's context */
	MemoryContextSwitchTo(oldContext);

	/* Get the result format codes */
	numRFormats = pq_getmsgint(input_message, 2);
	if (numRFormats > 0)
	{
		int			i;

		rformats = (int16 *) palloc(numRFormats * sizeof(int16));
		for (i = 0; i < numRFormats; i++)
			rformats[i] = pq_getmsgint(input_message, 2);
	}

	pq_getmsgend(input_message);

	if (psrc->fully_planned)
	{
		/*
		 * Revalidate the cached plan; this may result in replanning.  Any
		 * cruft will be generated in MessageContext.  The plan refcount will
		 * be assigned to the Portal, so it will be released at portal
		 * destruction.
		 */
		cplan = RevalidateCachedPlan(psrc, false);
		plan_list = cplan->stmt_list;
	}
	else
	{
		List	   *query_list;

		/*
		 * Revalidate the cached plan; this may result in redoing parse
		 * analysis and rewriting (but not planning).  Any cruft will be
		 * generated in MessageContext.  The plan refcount is assigned to
		 * CurrentResourceOwner.
		 */
		cplan = RevalidateCachedPlan(psrc, true);

		/*
		 * We didn't plan the query before, so do it now.  This allows the
		 * planner to make use of the concrete parameter values we now have.
		 * Because we use PARAM_FLAG_CONST, the plan is good only for this set
		 * of param values, and so we generate the plan in the portal's own
		 * memory context where it will be thrown away after use. As in
		 * exec_parse_message, we make no attempt to recover planner temporary
		 * memory until the end of the operation.
		 *
		 * XXX because the planner has a bad habit of scribbling on its input,
		 * we have to make a copy of the parse trees.  FIXME someday.
		 */
		oldContext = MemoryContextSwitchTo(PortalGetHeapMemory(portal));
		query_list = copyObject(cplan->stmt_list);
		plan_list = pg_plan_queries(query_list, 0, params);
		MemoryContextSwitchTo(oldContext);

		/* We no longer need the cached plan refcount ... */
		ReleaseCachedPlan(cplan, true);
		/* ... and we don't want the portal to depend on it, either */
		cplan = NULL;
	}

	/*
	 * Now we can define the portal.
	 *
	 * DO NOT put any code that could possibly throw an error between the
	 * above "RevalidateCachedPlan(psrc, false)" call and here.
	 */
	PortalDefineQuery(portal,
					  saved_stmt_name,
					  query_string,
					  psrc->commandTag,
					  plan_list,
					  cplan);

	/* Done with the snapshot used for parameter I/O and parsing/planning */
	if (snapshot_set)
		PopActiveSnapshot();

	/*
	 * And we're ready to start portal execution.
	 */
	PortalStart(portal, params, InvalidSnapshot);

	/*
	 * Apply the result format requests to the portal.
	 */
	PortalSetResultFormat(portal, numRFormats, rformats);

	/*
	 * Send BindComplete.
	 */
	if (whereToSendOutput == DestRemote)
		pq_putemptymessage('2');

	/*
	 * Emit duration logging if appropriate.
	 */
	switch (check_log_duration(msec_str, false))
	{
		case 1:
			ereport(LOG,
					(errmsg("duration: %s ms", msec_str),
					 errhidestmt(true)));
			break;
		case 2:
			ereport(LOG,
					(errmsg("duration: %s ms  bind %s%s%s: %s",
							msec_str,
							*stmt_name ? stmt_name : "<unnamed>",
							*portal_name ? "/" : "",
							*portal_name ? portal_name : "",
							psrc->query_string),
					 errhidestmt(true),
					 errdetail_params(params)));
			break;
	}

	if (save_log_statement_stats)
		ShowUsage("BIND MESSAGE STATISTICS");

	debug_query_string = NULL;
}

/*
 * exec_execute_message
 *
 * Process an "Execute" message for a portal
 */
static void
1852
exec_execute_message(const char *portal_name, long max_rows)
1853
{
B
Bruce Momjian 已提交
1854
	CommandDest dest;
1855
	DestReceiver *receiver;
1856 1857 1858
	Portal		portal;
	bool		completed;
	char		completionTag[COMPLETION_TAG_BUFSIZE];
1859
	const char *sourceText;
1860
	const char *prepStmtName;
1861
	ParamListInfo portalParams;
1862
	bool		save_log_statement_stats = log_statement_stats;
1863 1864
	bool		is_xact_command;
	bool		execute_is_fetch;
1865 1866
	bool		was_logged = false;
	char		msec_str[32];
1867 1868 1869

	/* Adjust destination to tell printtup.c what to do */
	dest = whereToSendOutput;
1870 1871
	if (dest == DestRemote)
		dest = DestRemoteExecute;
1872 1873 1874

	portal = GetPortalByName(portal_name);
	if (!PortalIsValid(portal))
1875 1876 1877
		ereport(ERROR,
				(errcode(ERRCODE_UNDEFINED_CURSOR),
				 errmsg("portal \"%s\" does not exist", portal_name)));
1878 1879

	/*
B
Bruce Momjian 已提交
1880 1881
	 * If the original query was a null string, just return
	 * EmptyQueryResponse.
1882 1883 1884
	 */
	if (portal->commandTag == NULL)
	{
1885
		Assert(portal->stmts == NIL);
1886 1887 1888 1889
		NullCommand(dest);
		return;
	}

1890
	/* Does the portal contain a transaction command? */
1891
	is_xact_command = IsTransactionStmtList(portal->stmts);
1892

1893
	/*
B
Bruce Momjian 已提交
1894 1895 1896
	 * We must copy the sourceText and prepStmtName into MessageContext in
	 * case the portal is destroyed during finish_xact_command. Can avoid the
	 * copy if it's not an xact command, though.
1897 1898
	 */
	if (is_xact_command)
1899
	{
1900
		sourceText = pstrdup(portal->sourceText);
1901 1902 1903 1904
		if (portal->prepStmtName)
			prepStmtName = pstrdup(portal->prepStmtName);
		else
			prepStmtName = "<unnamed>";
B
Bruce Momjian 已提交
1905

1906 1907 1908 1909 1910 1911
		/*
		 * An xact command shouldn't have any parameters, which is a good
		 * thing because they wouldn't be around after finish_xact_command.
		 */
		portalParams = NULL;
	}
1912 1913
	else
	{
1914 1915 1916
		sourceText = portal->sourceText;
		if (portal->prepStmtName)
			prepStmtName = portal->prepStmtName;
1917
		else
1918 1919
			prepStmtName = "<unnamed>";
		portalParams = portal->portalParams;
1920
	}
1921

1922 1923 1924
	/*
	 * Report query to various monitoring facilities.
	 */
1925
	debug_query_string = sourceText;
1926

1927
	pgstat_report_activity(sourceText);
1928 1929 1930 1931 1932 1933

	set_ps_display(portal->commandTag, false);

	if (save_log_statement_stats)
		ResetUsage();

1934 1935
	BeginCommand(portal->commandTag, dest);

1936
	/*
B
Bruce Momjian 已提交
1937 1938
	 * Create dest receiver in MessageContext (we don't want it in transaction
	 * context, because that may get deleted if portal contains VACUUM).
1939
	 */
1940 1941 1942
	receiver = CreateDestReceiver(dest);
	if (dest == DestRemoteExecute)
		SetRemoteDestReceiverParams(receiver, portal);
1943

1944
	/*
B
Bruce Momjian 已提交
1945 1946
	 * Ensure we are in a transaction command (this should normally be the
	 * case already due to prior BIND).
1947
	 */
1948
	start_xact_command();
1949

1950 1951 1952 1953 1954 1955 1956 1957
	/*
	 * If we re-issue an Execute protocol request against an existing portal,
	 * then we are only fetching more rows rather than completely re-executing
	 * the query from the start. atStart is never reset for a v3 portal, so we
	 * are safe to use this check.
	 */
	execute_is_fetch = !portal->atStart;

1958
	/* Log immediately if dictated by log_statement */
1959
	if (check_log_statement(portal->stmts))
1960 1961
	{
		ereport(LOG,
1962
				(errmsg("%s %s%s%s: %s",
1963
						execute_is_fetch ?
1964 1965
						_("execute fetch from") :
						_("execute"),
1966 1967 1968
						prepStmtName,
						*portal_name ? "/" : "",
						*portal_name ? portal_name : "",
1969
						sourceText),
1970
				 errhidestmt(true),
1971 1972 1973 1974
				 errdetail_params(portalParams)));
		was_logged = true;
	}

1975 1976 1977 1978
	/*
	 * If we are in aborted transaction state, the only portals we can
	 * actually run are those containing COMMIT or ROLLBACK commands.
	 */
1979
	if (IsAbortedTransactionBlockState() &&
1980
		!IsTransactionExitStmtList(portal->stmts))
1981 1982 1983
		ereport(ERROR,
				(errcode(ERRCODE_IN_FAILED_SQL_TRANSACTION),
				 errmsg("current transaction is aborted, "
1984 1985
						"commands ignored until end of transaction block"),
				 errdetail_abort()));
1986 1987 1988 1989 1990 1991 1992 1993 1994 1995 1996 1997

	/* Check for cancel signal before we start execution */
	CHECK_FOR_INTERRUPTS();

	/*
	 * Okay to run the portal.
	 */
	if (max_rows <= 0)
		max_rows = FETCH_ALL;

	completed = PortalRun(portal,
						  max_rows,
B
Bruce Momjian 已提交
1998
						  true, /* always top level */
1999 2000
						  receiver,
						  receiver,
2001 2002
						  completionTag);

2003
	(*receiver->rDestroy) (receiver);
2004

2005 2006
	if (completed)
	{
2007
		if (is_xact_command)
2008 2009
		{
			/*
B
Bruce Momjian 已提交
2010
			 * If this was a transaction control statement, commit it.	We
B
Bruce Momjian 已提交
2011
			 * will start a new xact command for the next command (if any).
2012
			 */
2013
			finish_xact_command();
2014 2015 2016 2017
		}
		else
		{
			/*
B
Bruce Momjian 已提交
2018 2019
			 * We need a CommandCounterIncrement after every query, except
			 * those that start or end a transaction block.
2020 2021 2022 2023 2024 2025 2026 2027 2028 2029
			 */
			CommandCounterIncrement();
		}

		/* Send appropriate CommandComplete to client */
		EndCommand(completionTag, dest);
	}
	else
	{
		/* Portal run not complete, so send PortalSuspended */
2030
		if (whereToSendOutput == DestRemote)
2031 2032 2033
			pq_putemptymessage('s');
	}

2034
	/*
2035
	 * Emit duration logging if appropriate.
2036
	 */
2037
	switch (check_log_duration(msec_str, was_logged))
2038
	{
2039
		case 1:
2040
			ereport(LOG,
2041 2042
					(errmsg("duration: %s ms", msec_str),
					 errhidestmt(true)));
2043 2044
			break;
		case 2:
2045
			ereport(LOG,
2046
					(errmsg("duration: %s ms  %s %s%s%s: %s",
2047 2048 2049 2050 2051 2052 2053
							msec_str,
							execute_is_fetch ?
							_("execute fetch from") :
							_("execute"),
							prepStmtName,
							*portal_name ? "/" : "",
							*portal_name ? portal_name : "",
2054
							sourceText),
2055
					 errhidestmt(true),
2056
					 errdetail_params(portalParams)));
2057
			break;
2058 2059 2060 2061 2062 2063 2064 2065 2066
	}

	if (save_log_statement_stats)
		ShowUsage("EXECUTE MESSAGE STATISTICS");

	debug_query_string = NULL;
}

/*
2067
 * check_log_statement
2068 2069
 *		Determine whether command should be logged because of log_statement
 *
2070 2071
 * parsetree_list can be either raw grammar output or a list of planned
 * statements
2072 2073
 */
static bool
2074
check_log_statement(List *stmt_list)
2075
{
2076
	ListCell   *stmt_item;
2077 2078 2079 2080 2081 2082 2083

	if (log_statement == LOGSTMT_NONE)
		return false;
	if (log_statement == LOGSTMT_ALL)
		return true;

	/* Else we have to inspect the statement(s) to see whether to log */
2084
	foreach(stmt_item, stmt_list)
2085
	{
2086
		Node	   *stmt = (Node *) lfirst(stmt_item);
2087

2088
		if (GetCommandLogLevel(stmt) <= log_statement)
2089 2090 2091 2092 2093 2094 2095 2096 2097 2098
			return true;
	}

	return false;
}

/*
 * check_log_duration
 *		Determine whether current command's duration should be logged
 *
2099 2100 2101 2102 2103
 * Returns:
 *		0 if no logging is needed
 *		1 if just the duration should be logged
 *		2 if duration and query details should be logged
 *
2104 2105
 * If logging is needed, the duration in msec is formatted into msec_str[],
 * which must be a 32-byte buffer.
2106 2107 2108
 *
 * was_logged should be TRUE if caller already logged query details (this
 * essentially prevents 2 from being returned).
2109
 */
2110 2111
int
check_log_duration(char *msec_str, bool was_logged)
2112
{
2113
	if (log_duration || log_min_duration_statement >= 0)
2114
	{
2115 2116 2117
		long		secs;
		int			usecs;
		int			msecs;
2118
		bool		exceeded;
2119

2120 2121 2122 2123
		TimestampDifference(GetCurrentStatementStartTimestamp(),
							GetCurrentTimestamp(),
							&secs, &usecs);
		msecs = usecs / 1000;
2124 2125

		/*
B
Bruce Momjian 已提交
2126 2127 2128
		 * This odd-looking test for log_min_duration_statement being exceeded
		 * is designed to avoid integer overflow with very long durations:
		 * don't compute secs * 1000 until we've verified it will fit in int.
2129
		 */
2130 2131 2132 2133 2134 2135
		exceeded = (log_min_duration_statement == 0 ||
					(log_min_duration_statement > 0 &&
					 (secs > log_min_duration_statement / 1000 ||
					  secs * 1000 + msecs >= log_min_duration_statement)));

		if (exceeded || log_duration)
2136
		{
2137 2138
			snprintf(msec_str, 32, "%ld.%03d",
					 secs * 1000 + msecs, usecs % 1000);
2139 2140 2141 2142
			if (exceeded && !was_logged)
				return 2;
			else
				return 1;
2143
		}
2144 2145
	}

2146
	return 0;
2147
}
2148

2149 2150 2151 2152 2153 2154 2155 2156 2157 2158 2159 2160 2161 2162 2163 2164 2165 2166 2167 2168 2169
/*
 * errdetail_execute
 *
 * Add an errdetail() line showing the query referenced by an EXECUTE, if any.
 * The argument is the raw parsetree list.
 *
 * Only the first ExecuteStmt whose prepared statement can be found is
 * reported.  The return value is always 0; it exists only so that the
 * function can be used inside an ereport() argument list.
 */
static int
errdetail_execute(List *raw_parsetree_list)
{
	ListCell   *parsetree_item;

	foreach(parsetree_item, raw_parsetree_list)
	{
		Node	   *parsetree = (Node *) lfirst(parsetree_item);

		if (IsA(parsetree, ExecuteStmt))
		{
			ExecuteStmt *stmt = (ExecuteStmt *) parsetree;
			PreparedStatement *pstmt;

			/* "false" = don't throw an error if the statement is missing */
			pstmt = FetchPreparedStatement(stmt->name, false);
			if (pstmt)
			{
				errdetail("prepare: %s", pstmt->plansource->query_string);
				return 0;
			}
		}
	}

	return 0;
}

/*
 * errdetail_params
 *
 * Attach an errdetail() line listing the bind-parameter values, when there
 * are any and it is safe to print them.  Each value is shown as $n = 'text'
 * with embedded single quotes doubled; null parameters and parameters without
 * a valid type are shown as NULL.  Always returns 0.
 */
static int
errdetail_params(ParamListInfo params)
{
	StringInfoData param_str;
	MemoryContext oldcontext;
	int			paramno;

	/* We mustn't call user-defined I/O functions when in an aborted xact */
	if (params == NULL || params->numParams <= 0 ||
		IsAbortedTransactionBlockState())
		return 0;

	/* Make sure any trash is generated in MessageContext */
	oldcontext = MemoryContextSwitchTo(MessageContext);

	initStringInfo(&param_str);

	for (paramno = 0; paramno < params->numParams; paramno++)
	{
		ParamExternData *prm = &params->params[paramno];
		Oid			typoutput;
		bool		typisvarlena;
		char	   *text;
		char	   *ch;

		/* separator between entries, then the "$n = " label */
		if (paramno > 0)
			appendStringInfoString(&param_str, ", ");
		appendStringInfo(&param_str, "$%d = ", paramno + 1);

		if (prm->isnull || !OidIsValid(prm->ptype))
		{
			appendStringInfoString(&param_str, "NULL");
			continue;
		}

		/* convert the value to text with its type's output function */
		getTypeOutputInfo(prm->ptype, &typoutput, &typisvarlena);
		text = OidOutputFunctionCall(typoutput, prm->value);

		/* emit the text as a quoted literal, doubling single quotes */
		appendStringInfoCharMacro(&param_str, '\'');
		for (ch = text; *ch != '\0'; ch++)
		{
			if (*ch == '\'')
				appendStringInfoCharMacro(&param_str, *ch);
			appendStringInfoCharMacro(&param_str, *ch);
		}
		appendStringInfoCharMacro(&param_str, '\'');

		pfree(text);
	}

	errdetail("parameters: %s", param_str.data);

	pfree(param_str.data);

	MemoryContextSwitchTo(oldcontext);

	return 0;
}

2245 2246 2247 2248 2249 2250 2251 2252 2253 2254 2255 2256 2257 2258
/*
 * errdetail_abort
 *
 * Attach an errdetail() line naming the abort reason.  The only reason
 * reported here is a pending recovery conflict on MyProc; otherwise no
 * detail is added.  Always returns 0.
 */
static int
errdetail_abort(void)
{
	if (!MyProc->recoveryConflictPending)
		return 0;

	errdetail("abort reason: recovery conflict");
	return 0;
}

2259 2260 2261 2262 2263 2264 2265 2266 2267 2268 2269 2270 2271 2272 2273 2274 2275 2276 2277 2278 2279 2280
/*
 * errdetail_recovery_conflict
 *
 * Add an errdetail() line showing conflict source.
 */
static int
errdetail_recovery_conflict(void)
{
	switch (RecoveryConflictReason)
	{
		case PROCSIG_RECOVERY_CONFLICT_BUFFERPIN:
				errdetail("User was holding shared buffer pin for too long.");
				break;
		case PROCSIG_RECOVERY_CONFLICT_LOCK:
				errdetail("User was holding a relation lock for too long.");
				break;
		case PROCSIG_RECOVERY_CONFLICT_TABLESPACE:
				errdetail("User was or may have been using tablespace that must be dropped.");
				break;
		case PROCSIG_RECOVERY_CONFLICT_SNAPSHOT:
				errdetail("User query might have needed to see row versions that must be removed.");
				break;
2281 2282 2283
		case PROCSIG_RECOVERY_CONFLICT_STARTUP_DEADLOCK:
				errdetail("User transaction caused buffer deadlock with recovery.");
				break;
2284 2285 2286 2287 2288 2289 2290 2291 2292 2293 2294
		case PROCSIG_RECOVERY_CONFLICT_DATABASE:
				errdetail("User was connected to a database that must be dropped.");
				break;
		default:
				break;
				/* no errdetail */
	}

	return 0;
}

2295 2296 2297 2298 2299 2300 2301 2302
/*
 * exec_describe_statement_message
 *
 * Process a "Describe" message for a prepared statement
 */
static void
exec_describe_statement_message(const char *stmt_name)
{
2303
	CachedPlanSource *psrc;
2304
	StringInfoData buf;
2305
	int			i;
2306

2307 2308 2309 2310
	/*
	 * Start up a transaction command. (Note that this will normally change
	 * current memory context.) Nothing happens if we are already in one.
	 */
2311
	start_xact_command();
2312 2313 2314 2315

	/* Switch back to message context */
	MemoryContextSwitchTo(MessageContext);

2316 2317
	/* Find prepared statement */
	if (stmt_name[0] != '\0')
2318 2319 2320
	{
		PreparedStatement *pstmt;

2321
		pstmt = FetchPreparedStatement(stmt_name, true);
2322 2323
		psrc = pstmt->plansource;
	}
2324 2325 2326
	else
	{
		/* special-case the unnamed statement */
2327 2328
		psrc = unnamed_stmt_psrc;
		if (!psrc)
2329 2330
			ereport(ERROR,
					(errcode(ERRCODE_UNDEFINED_PSTATEMENT),
B
Bruce Momjian 已提交
2331
					 errmsg("unnamed prepared statement does not exist")));
2332 2333
	}

2334 2335 2336
	/* Prepared statements shouldn't have changeable result descs */
	Assert(psrc->fixed_result);

2337
	/*
2338
	 * If we are in aborted transaction state, we can't run
B
Bruce Momjian 已提交
2339 2340
	 * SendRowDescriptionMessage(), because that needs catalog accesses. (We
	 * can't do RevalidateCachedPlan, either, but that's a lesser problem.)
2341 2342 2343 2344 2345
	 * Hence, refuse to Describe statements that return data.  (We shouldn't
	 * just refuse all Describes, since that might break the ability of some
	 * clients to issue COMMIT or ROLLBACK commands, if they use code that
	 * blindly Describes whatever it does.)  We can Describe parameters
	 * without doing anything dangerous, so we don't restrict that.
2346 2347
	 */
	if (IsAbortedTransactionBlockState() &&
2348
		psrc->resultDesc)
2349 2350 2351
		ereport(ERROR,
				(errcode(ERRCODE_IN_FAILED_SQL_TRANSACTION),
				 errmsg("current transaction is aborted, "
2352 2353
						"commands ignored until end of transaction block"),
				 errdetail_abort()));
2354

2355
	if (whereToSendOutput != DestRemote)
2356 2357
		return;					/* can't actually do anything... */

2358 2359 2360
	/*
	 * First describe the parameters...
	 */
B
Bruce Momjian 已提交
2361
	pq_beginmessage(&buf, 't'); /* parameter description message type */
2362
	pq_sendint(&buf, psrc->num_params, 2);
2363

2364
	for (i = 0; i < psrc->num_params; i++)
2365
	{
2366
		Oid			ptype = psrc->param_types[i];
2367 2368 2369 2370

		pq_sendint(&buf, (int) ptype, 4);
	}
	pq_endmessage(&buf);
2371 2372 2373 2374

	/*
	 * Next send RowDescription or NoData to describe the result...
	 */
2375 2376 2377 2378 2379 2380 2381 2382 2383 2384 2385 2386 2387 2388 2389
	if (psrc->resultDesc)
	{
		CachedPlan *cplan;
		List	   *tlist;

		/* Make sure the plan is up to date */
		cplan = RevalidateCachedPlan(psrc, true);

		/* Get the primary statement and find out what it returns */
		tlist = FetchStatementTargetList(PortalListGetPrimaryStmt(cplan->stmt_list));

		SendRowDescriptionMessage(psrc->resultDesc, tlist, NULL);

		ReleaseCachedPlan(cplan, true);
	}
2390 2391 2392
	else
		pq_putemptymessage('n');	/* NoData */

2393 2394 2395 2396 2397 2398 2399 2400 2401 2402 2403 2404
}

/*
 * exec_describe_portal_message
 *
 * Process a "Describe" message for a portal
 */
static void
exec_describe_portal_message(const char *portal_name)
{
	Portal		portal;

2405 2406 2407 2408
	/*
	 * Start up a transaction command. (Note that this will normally change
	 * current memory context.) Nothing happens if we are already in one.
	 */
2409
	start_xact_command();
2410 2411 2412 2413

	/* Switch back to message context */
	MemoryContextSwitchTo(MessageContext);

2414 2415
	portal = GetPortalByName(portal_name);
	if (!PortalIsValid(portal))
2416 2417 2418
		ereport(ERROR,
				(errcode(ERRCODE_UNDEFINED_CURSOR),
				 errmsg("portal \"%s\" does not exist", portal_name)));
2419

2420 2421 2422
	/*
	 * If we are in aborted transaction state, we can't run
	 * SendRowDescriptionMessage(), because that needs catalog accesses.
B
Bruce Momjian 已提交
2423
	 * Hence, refuse to Describe portals that return data.	(We shouldn't just
2424 2425 2426 2427 2428 2429 2430 2431 2432
	 * refuse all Describes, since that might break the ability of some
	 * clients to issue COMMIT or ROLLBACK commands, if they use code that
	 * blindly Describes whatever it does.)
	 */
	if (IsAbortedTransactionBlockState() &&
		portal->tupDesc)
		ereport(ERROR,
				(errcode(ERRCODE_IN_FAILED_SQL_TRANSACTION),
				 errmsg("current transaction is aborted, "
2433 2434
						"commands ignored until end of transaction block"),
				 errdetail_abort()));
2435

2436
	if (whereToSendOutput != DestRemote)
2437 2438 2439
		return;					/* can't actually do anything... */

	if (portal->tupDesc)
2440 2441
		SendRowDescriptionMessage(portal->tupDesc,
								  FetchPortalTargetList(portal),
2442
								  portal->formats);
2443 2444 2445 2446 2447
	else
		pq_putemptymessage('n');	/* NoData */
}


2448
/*
2449
 * Convenience routines for starting/committing a single command.
2450 2451
 */
static void
2452
start_xact_command(void)
2453
{
2454
	if (!xact_started)
2455
	{
2456 2457 2458
		ereport(DEBUG3,
				(errmsg_internal("StartTransactionCommand")));
		StartTransactionCommand();
2459 2460

		/* Set statement timeout running, if any */
2461
		/* NB: this mustn't be enabled until we are within an xact */
2462 2463
		if (StatementTimeout > 0)
			enable_sig_alarm(StatementTimeout, true);
2464 2465
		else
			cancel_from_timeout = false;
B
Bruce Momjian 已提交
2466

2467 2468 2469 2470 2471 2472 2473 2474 2475
		xact_started = true;
	}
}

static void
finish_xact_command(void)
{
	if (xact_started)
	{
2476 2477 2478 2479
		/* Cancel any active statement timeout before committing */
		disable_sig_alarm(true);

		/* Now commit the command */
2480 2481
		ereport(DEBUG3,
				(errmsg_internal("CommitTransactionCommand")));
2482

2483
		CommitTransactionCommand();
2484

2485 2486 2487 2488 2489 2490
#ifdef MEMORY_CONTEXT_CHECKING
		/* Check all memory contexts that weren't freed during commit */
		/* (those that were, were checked before being deleted) */
		MemoryContextCheck(TopMemoryContext);
#endif

2491
#ifdef SHOW_MEMORY_STATS
2492
		/* Print mem stats after each commit for leak tracking */
2493
		MemoryContextStats(TopMemoryContext);
2494
#endif
2495 2496 2497

		xact_started = false;
	}
2498 2499 2500
}


2501 2502 2503 2504 2505
/*
 * Convenience routines for checking whether a statement is one of the
 * ones that we allow in transaction-aborted state.
 */

2506
/* Test a bare parsetree */
2507 2508 2509 2510 2511 2512 2513 2514 2515 2516 2517 2518 2519 2520 2521 2522
static bool
IsTransactionExitStmt(Node *parsetree)
{
	if (parsetree && IsA(parsetree, TransactionStmt))
	{
		TransactionStmt *stmt = (TransactionStmt *) parsetree;

		if (stmt->kind == TRANS_STMT_COMMIT ||
			stmt->kind == TRANS_STMT_PREPARE ||
			stmt->kind == TRANS_STMT_ROLLBACK ||
			stmt->kind == TRANS_STMT_ROLLBACK_TO)
			return true;
	}
	return false;
}

2523
/* Test a list that might contain Query nodes or bare parsetrees */
2524 2525 2526 2527 2528
static bool
IsTransactionExitStmtList(List *parseTrees)
{
	if (list_length(parseTrees) == 1)
	{
2529 2530 2531 2532 2533
		Node	   *stmt = (Node *) linitial(parseTrees);

		if (IsA(stmt, Query))
		{
			Query	   *query = (Query *) stmt;
2534

2535 2536 2537 2538 2539
			if (query->commandType == CMD_UTILITY &&
				IsTransactionExitStmt(query->utilityStmt))
				return true;
		}
		else if (IsTransactionExitStmt(stmt))
2540 2541 2542 2543 2544
			return true;
	}
	return false;
}

2545
/* Test a list that might contain Query nodes or bare parsetrees */
2546 2547 2548 2549 2550
static bool
IsTransactionStmtList(List *parseTrees)
{
	if (list_length(parseTrees) == 1)
	{
2551
		Node	   *stmt = (Node *) linitial(parseTrees);
2552

2553 2554 2555 2556 2557 2558 2559 2560 2561
		if (IsA(stmt, Query))
		{
			Query	   *query = (Query *) stmt;

			if (query->commandType == CMD_UTILITY &&
				IsA(query->utilityStmt, TransactionStmt))
				return true;
		}
		else if (IsA(stmt, TransactionStmt))
2562 2563 2564 2565 2566
			return true;
	}
	return false;
}

2567 2568 2569 2570 2571 2572 2573 2574
/*
 * Release any existing unnamed prepared statement, along with any leftover
 * memory context from a failed attempt to build one.
 */
static void
drop_unnamed_stmt(void)
{
	/* Release any completed unnamed statement */
	if (unnamed_stmt_psrc != NULL)
	{
		DropCachedPlan(unnamed_stmt_psrc);
		unnamed_stmt_psrc = NULL;
	}

	/*
	 * A failure while building a prior unnamed statement can leave behind a
	 * memory context that was never assigned to a completed plancache
	 * entry.  Drop it here to avoid a permanent memory leak.
	 */
	if (unnamed_stmt_context != NULL)
	{
		MemoryContextDelete(unnamed_stmt_context);
		unnamed_stmt_context = NULL;
	}
}

2586

2587
/* --------------------------------
 *		signal handler routines used in PostgresMain()
 * --------------------------------
 */

2592
/*
T
Tom Lane 已提交
2593
 * quickdie() occurs when signalled SIGQUIT by the postmaster.
2594 2595 2596 2597
 *
 * Some backend has bought the farm,
 * so we need to stop what we're doing and exit.
 */
T
Tom Lane 已提交
2598
void
2599
quickdie(SIGNAL_ARGS)
2600
{
2601
	sigaddset(&BlockSig, SIGQUIT); /* prevent nested calls */
2602
	PG_SETMASK(&BlockSig);
B
Bruce Momjian 已提交
2603

2604 2605 2606 2607 2608 2609 2610 2611 2612
	/*
	 * If we're aborting out of client auth, don't risk trying to send
	 * anything to the client; we will likely violate the protocol,
	 * not to mention that we may have interrupted the guts of OpenSSL
	 * or some authentication library.
	 */
	if (ClientAuthInProgress && whereToSendOutput == DestRemote)
		whereToSendOutput = DestNone;

2613
	/*
B
Bruce Momjian 已提交
2614 2615
	 * Ideally this should be ereport(FATAL), but then we'd not get control
	 * back...
2616 2617 2618
	 */
	ereport(WARNING,
			(errcode(ERRCODE_CRASH_SHUTDOWN),
B
Bruce Momjian 已提交
2619
			 errmsg("terminating connection because of crash of another server process"),
B
Bruce Momjian 已提交
2620 2621 2622 2623
	errdetail("The postmaster has commanded this server process to roll back"
			  " the current transaction and exit, because another"
			  " server process exited abnormally and possibly corrupted"
			  " shared memory."),
2624
			 errhint("In a moment you should be able to reconnect to the"
2625
					 " database and repeat your command.")));
B
Bruce Momjian 已提交
2626

2627
	/*
2628 2629 2630 2631 2632 2633 2634 2635 2636 2637
	 * We DO NOT want to run proc_exit() callbacks -- we're here because
	 * shared memory may be corrupted, so we don't want to try to clean up our
	 * transaction.  Just nail the windows shut and get out of town.  Now that
	 * there's an atexit callback to prevent third-party code from breaking
	 * things by calling exit() directly, we have to reset the callbacks
	 * explicitly to make this work as intended.
	 */
	on_exit_reset();

	/*
2638
	 * Note we do exit(2) not exit(0).	This is to force the postmaster into a
B
Bruce Momjian 已提交
2639 2640
	 * system reset cycle if some idiot DBA sends a manual SIGQUIT to a random
	 * backend.  This is necessary precisely because we don't clean up our
2641
	 * shared memory state.  (The "dead man switch" mechanism in pmsignal.c
2642 2643
	 * should ensure the postmaster sees this as a crash, too, but no harm in
	 * being doubly sure.)
2644
	 */
2645
	exit(2);
2646 2647
}

2648
/*
2649 2650
 * Shutdown signal from postmaster: abort transaction and exit
 * at soonest convenient time
2651
 */
2652
void
2653
die(SIGNAL_ARGS)
2654
{
2655 2656 2657
	int			save_errno = errno;

	/* Don't joggle the elbow of proc_exit */
B
Bruce Momjian 已提交
2658
	if (!proc_exit_inprogress)
2659
	{
2660
		InterruptPending = true;
2661
		ProcDiePending = true;
B
Bruce Momjian 已提交
2662

2663
		/*
B
Bruce Momjian 已提交
2664 2665
		 * If it's safe to interrupt, and we're waiting for input or a lock,
		 * service the interrupt immediately
2666
		 */
2667 2668
		if (ImmediateInterruptOK && InterruptHoldoffCount == 0 &&
			CritSectionCount == 0)
2669
		{
2670 2671 2672
			/* bump holdoff count to make ProcessInterrupts() a no-op */
			/* until we are done getting ready for it */
			InterruptHoldoffCount++;
2673
			LockWaitCancel();	/* prevent CheckDeadLock from running */
2674
			DisableNotifyInterrupt();
2675
			DisableCatchupInterrupt();
2676
			InterruptHoldoffCount--;
2677 2678
			ProcessInterrupts();
		}
2679
	}
2680 2681

	errno = save_errno;
2682 2683
}

2684
/*
2685 2686
 * Query-cancel signal from postmaster: abort current transaction
 * at soonest convenient time
2687
 */
2688
void
2689
StatementCancelHandler(SIGNAL_ARGS)
2690
{
2691 2692
	int			save_errno = errno;

B
Bruce Momjian 已提交
2693
	/*
2694
	 * Don't joggle the elbow of proc_exit
B
Bruce Momjian 已提交
2695
	 */
2696
	if (!proc_exit_inprogress)
2697
	{
2698 2699
		InterruptPending = true;
		QueryCancelPending = true;
B
Bruce Momjian 已提交
2700

2701
		/*
2702 2703
		 * If it's safe to interrupt, and we're waiting for input or a lock,
		 * service the interrupt immediately
2704
		 */
2705 2706
		if (ImmediateInterruptOK && InterruptHoldoffCount == 0 &&
			CritSectionCount == 0)
2707
		{
2708 2709 2710
			/* bump holdoff count to make ProcessInterrupts() a no-op */
			/* until we are done getting ready for it */
			InterruptHoldoffCount++;
2711 2712 2713 2714 2715
			LockWaitCancel();	/* prevent CheckDeadLock from running */
			DisableNotifyInterrupt();
			DisableCatchupInterrupt();
			InterruptHoldoffCount--;
			ProcessInterrupts();
2716
		}
2717 2718
	}

2719
	errno = save_errno;
2720 2721
}

2722
/* signal handler for floating point exception */
2723
void
2724 2725
FloatExceptionHandler(SIGNAL_ARGS)
{
2726 2727 2728
	ereport(ERROR,
			(errcode(ERRCODE_FLOATING_POINT_EXCEPTION),
			 errmsg("floating-point exception"),
B
Bruce Momjian 已提交
2729 2730 2731
			 errdetail("An invalid floating-point operation was signaled. "
					   "This probably means an out-of-range result or an "
					   "invalid operation, such as division by zero.")));
2732 2733
}

2734
/* SIGHUP: set flag to re-read config file at next convenient time */
2735
static void
2736
SigHupHandler(SIGNAL_ARGS)
2737
{
2738
	got_SIGHUP = true;
2739 2740
}

2741 2742 2743 2744 2745 2746 2747 2748 2749 2750 2751 2752 2753 2754 2755 2756
/*
 * RecoveryConflictInterrupt: out-of-line portion of recovery conflict
 * handling following receipt of SIGUSR1.  Designed to be similar to die()
 * and StatementCancelHandler().  Called only by a normal user backend that
 * begins a transaction during recovery.
 *
 * Depending on the reason and the backend's state, the conflict is either
 * ignored (plain return), turned into a pending query cancel, or turned into
 * a pending session termination.
 */
void
RecoveryConflictInterrupt(ProcSignalReason reason)
{
	int			saved_errno = errno;

	/* Don't joggle the elbow of proc_exit */
	if (!proc_exit_inprogress)
	{
		RecoveryConflictReason = reason;

		switch (reason)
		{
			case PROCSIG_RECOVERY_CONFLICT_STARTUP_DEADLOCK:

				/* If we aren't waiting for a lock we can never deadlock */
				if (!IsWaitingForLock())
					return;

				/* Intentional drop through to check wait for pin */

			case PROCSIG_RECOVERY_CONFLICT_BUFFERPIN:

				/*
				 * If we aren't blocking the Startup process there is nothing
				 * more to do.
				 */
				if (!HoldingBufferPinThatDelaysRecovery())
					return;

				MyProc->recoveryConflictPending = true;

				/* Intentional drop through to error handling */

			case PROCSIG_RECOVERY_CONFLICT_LOCK:
			case PROCSIG_RECOVERY_CONFLICT_TABLESPACE:
			case PROCSIG_RECOVERY_CONFLICT_SNAPSHOT:

				/* If we aren't in a transaction any longer then ignore */
				if (!IsTransactionOrTransactionBlock())
					return;

				/*
				 * If we can abort just the current subtransaction then we
				 * are OK to throw an ERROR to resolve the conflict.
				 * Otherwise drop through to the FATAL case.
				 *
				 * XXX other times that we can throw just an ERROR *may* be
				 *   PROCSIG_RECOVERY_CONFLICT_LOCK
				 *		if no locks are held in parent transactions
				 *
				 *   PROCSIG_RECOVERY_CONFLICT_SNAPSHOT
				 *		if no snapshots are held by parent transactions
				 *		and the transaction is not serializable
				 *
				 *   PROCSIG_RECOVERY_CONFLICT_TABLESPACE
				 *		if no temp files or cursors open in parent
				 *		transactions
				 */
				if (!IsSubTransaction())
				{
					/*
					 * If we already aborted then we no longer need to
					 * cancel.  We do this here since we do not wish to
					 * ignore aborted subtransactions, which must cause
					 * FATAL, currently.
					 */
					if (IsAbortedTransactionBlockState())
						return;

					/* request a query cancel */
					RecoveryConflictPending = true;
					QueryCancelPending = true;
					InterruptPending = true;
					break;
				}

				/* Intentional drop through to session cancel */

			case PROCSIG_RECOVERY_CONFLICT_DATABASE:
				/* request termination of the whole session */
				RecoveryConflictPending = true;
				ProcDiePending = true;
				InterruptPending = true;
				break;

			default:
				elog(FATAL, "Unknown conflict mode");
		}

		Assert(RecoveryConflictPending && (QueryCancelPending || ProcDiePending));

		/*
		 * If it's safe to interrupt, and we're waiting for input or a lock,
		 * service the interrupt immediately.
		 */
		if (ImmediateInterruptOK &&
			InterruptHoldoffCount == 0 &&
			CritSectionCount == 0)
		{
			/*
			 * Bump the holdoff count so that ProcessInterrupts() is a no-op
			 * until we are done getting ready for it.
			 */
			InterruptHoldoffCount++;
			LockWaitCancel();	/* prevent CheckDeadLock from running */
			DisableNotifyInterrupt();
			DisableCatchupInterrupt();
			InterruptHoldoffCount--;

			ProcessInterrupts();
		}
	}

	errno = saved_errno;
}
2856

2857 2858 2859 2860 2861 2862 2863 2864 2865 2866
/*
 * ProcessInterrupts: out-of-line portion of CHECK_FOR_INTERRUPTS() macro
 *
 * If an interrupt condition is pending, and it's safe to service it,
 * then clear the flag and accept the interrupt.  Called only when
 * InterruptPending is true.
 */
void
ProcessInterrupts(void)
{
2867 2868
	/* OK to accept interrupt now? */
	if (InterruptHoldoffCount != 0 || CritSectionCount != 0)
2869 2870 2871 2872 2873
		return;
	InterruptPending = false;
	if (ProcDiePending)
	{
		ProcDiePending = false;
B
Bruce Momjian 已提交
2874 2875
		QueryCancelPending = false;		/* ProcDie trumps QueryCancel */
		ImmediateInterruptOK = false;	/* not idle anymore */
2876
		DisableNotifyInterrupt();
2877
		DisableCatchupInterrupt();
2878 2879 2880
		/* As in quickdie, don't risk sending to client during auth */
		if (ClientAuthInProgress && whereToSendOutput == DestRemote)
			whereToSendOutput = DestNone;
2881 2882 2883 2884
		if (IsAutoVacuumWorkerProcess())
			ereport(FATAL,
					(errcode(ERRCODE_ADMIN_SHUTDOWN),
					 errmsg("terminating autovacuum process due to administrator command")));
2885 2886 2887
		else if (RecoveryConflictPending)
			ereport(FATAL,
					(errcode(ERRCODE_ADMIN_SHUTDOWN),
2888 2889
					 errmsg("terminating connection due to conflict with recovery"),
					 errdetail_recovery_conflict()));
2890 2891 2892
		else
			ereport(FATAL,
					(errcode(ERRCODE_ADMIN_SHUTDOWN),
B
Bruce Momjian 已提交
2893
			 errmsg("terminating connection due to administrator command")));
2894 2895 2896 2897
	}
	if (QueryCancelPending)
	{
		QueryCancelPending = false;
2898
		if (ClientAuthInProgress)
2899 2900 2901 2902 2903 2904 2905
		{
			ImmediateInterruptOK = false;	/* not idle anymore */
			DisableNotifyInterrupt();
			DisableCatchupInterrupt();
			/* As in quickdie, don't risk sending to client during auth */
			if (whereToSendOutput == DestRemote)
				whereToSendOutput = DestNone;
2906 2907 2908
			ereport(ERROR,
					(errcode(ERRCODE_QUERY_CANCELED),
					 errmsg("canceling authentication due to timeout")));
2909 2910 2911 2912 2913 2914
		}
		if (cancel_from_timeout)
		{
			ImmediateInterruptOK = false;	/* not idle anymore */
			DisableNotifyInterrupt();
			DisableCatchupInterrupt();
2915 2916 2917
			ereport(ERROR,
					(errcode(ERRCODE_QUERY_CANCELED),
					 errmsg("canceling statement due to statement timeout")));
2918 2919 2920 2921 2922 2923
		}
		if (IsAutoVacuumWorkerProcess())
		{
			ImmediateInterruptOK = false;	/* not idle anymore */
			DisableNotifyInterrupt();
			DisableCatchupInterrupt();
2924 2925 2926
			ereport(ERROR,
					(errcode(ERRCODE_QUERY_CANCELED),
					 errmsg("canceling autovacuum task")));
2927
		}
2928
		if (RecoveryConflictPending)
2929
		{
2930
			ImmediateInterruptOK = false;	/* not idle anymore */
2931
			RecoveryConflictPending = false;
2932 2933 2934 2935 2936
			DisableNotifyInterrupt();
			DisableCatchupInterrupt();
			if (DoingCommandRead)
				ereport(FATAL,
						(errcode(ERRCODE_ADMIN_SHUTDOWN),
2937 2938 2939 2940
						 errmsg("terminating connection due to conflict with recovery"),
						 errdetail_recovery_conflict(),
						 errhint("In a moment you should be able to reconnect to the"
								 " database and repeat your command.")));
2941 2942 2943
			else
				ereport(ERROR,
						(errcode(ERRCODE_QUERY_CANCELED),
2944 2945
						 errmsg("canceling statement due to conflict with recovery"),
						 errdetail_recovery_conflict()));
2946
		}
2947

2948 2949 2950 2951 2952 2953 2954 2955 2956 2957
		/*
		 * If we are reading a command from the client, just ignore the
		 * cancel request --- sending an extra error message won't
		 * accomplish anything.  Otherwise, go ahead and throw the error.
		 */
		if (!DoingCommandRead)
		{
			ImmediateInterruptOK = false;	/* not idle anymore */
			DisableNotifyInterrupt();
			DisableCatchupInterrupt();
2958 2959 2960
			ereport(ERROR,
					(errcode(ERRCODE_QUERY_CANCELED),
					 errmsg("canceling statement due to user request")));
2961
		}
2962 2963 2964 2965
	}
	/* If we get here, do nothing (probably, QueryCancelPending was reset) */
}

2966

2967 2968 2969 2970 2971 2972
/*
 * check_stack_depth: check for excessively deep recursion
 *
 * This should be called someplace in any recursive routine that might possibly
 * recurse deep enough to overflow the stack.  Most Unixen treat stack
 * overflow as an unrecoverable SIGSEGV, so we want to error out ourselves
2973
 * before hitting the hardware limit.
2974 2975 2976 2977
 */
void
check_stack_depth(void)
{
B
Bruce Momjian 已提交
2978
	char		stack_top_loc;
2979
	long		stack_depth;
2980 2981 2982 2983

	/*
	 * Compute distance from PostgresMain's local variables to my own
	 */
2984
	stack_depth = (long) (stack_base_ptr - &stack_top_loc);
B
Bruce Momjian 已提交
2985

2986
	/*
B
Bruce Momjian 已提交
2987
	 * Take abs value, since stacks grow up on some machines, down on others
2988 2989 2990
	 */
	if (stack_depth < 0)
		stack_depth = -stack_depth;
B
Bruce Momjian 已提交
2991

2992 2993 2994
	/*
	 * Trouble?
	 *
2995 2996 2997 2998
	 * The test on stack_base_ptr prevents us from erroring out if called
	 * during process setup or in a non-backend process.  Logically it should
	 * be done first, but putting it here avoids wasting cycles during normal
	 * cases.
2999 3000 3001 3002 3003 3004 3005
	 */
	if (stack_depth > max_stack_depth_bytes &&
		stack_base_ptr != NULL)
	{
		ereport(ERROR,
				(errcode(ERRCODE_STATEMENT_TOO_COMPLEX),
				 errmsg("stack depth limit exceeded"),
B
Bruce Momjian 已提交
3006 3007
		 errhint("Increase the configuration parameter \"max_stack_depth\", "
		   "after ensuring the platform's stack depth limit is adequate.")));
3008 3009 3010
	}
}

3011
/* GUC assign hook for max_stack_depth */
3012 3013 3014
bool
assign_max_stack_depth(int newval, bool doit, GucSource source)
{
3015 3016 3017 3018 3019
	long		newval_bytes = newval * 1024L;
	long		stack_rlimit = get_stack_depth_rlimit();

	if (stack_rlimit > 0 && newval_bytes > stack_rlimit - STACK_DEPTH_SLOP)
	{
3020
		ereport(GUC_complaint_elevel(source),
3021 3022 3023 3024 3025 3026
				(errcode(ERRCODE_INVALID_PARAMETER_VALUE),
				 errmsg("\"max_stack_depth\" must not exceed %ldkB",
						(stack_rlimit - STACK_DEPTH_SLOP) / 1024L),
				 errhint("Increase the platform's stack depth limit via \"ulimit -s\" or local equivalent.")));
		return false;
	}
3027
	if (doit)
3028
		max_stack_depth_bytes = newval_bytes;
3029 3030 3031 3032
	return true;
}


3033 3034 3035 3036 3037 3038 3039 3040 3041 3042 3043 3044 3045 3046 3047 3048 3049 3050 3051 3052 3053 3054 3055 3056 3057 3058 3059 3060 3061 3062 3063 3064 3065 3066 3067
/*
 * set_debug_options --- apply "-d N" command line option
 *
 * -d is not quite the same as setting log_min_messages because it enables
 * other output options as well:
 *		N <= 0	log_min_messages = notice
 *		N >= 1	log_min_messages = debugN; with context PGC_POSTMASTER also
 *				log_connections and log_disconnections
 *		N >= 2	log_statement = all
 *		N >= 3	debug_print_parse
 *		N >= 4	debug_print_plan
 *		N >= 5	debug_print_rewritten
 */
void
set_debug_options(int debug_flag, GucContext context, GucSource source)
{
	char		debugstr[64];
	const char *min_messages = "notice";

	if (debug_flag > 0)
	{
		sprintf(debugstr, "debug%d", debug_flag);
		min_messages = debugstr;
	}
	SetConfigOption("log_min_messages", min_messages, context, source);

	/* every further option needs a level of at least 1 */
	if (debug_flag < 1)
		return;

	if (context == PGC_POSTMASTER)
	{
		SetConfigOption("log_connections", "true", context, source);
		SetConfigOption("log_disconnections", "true", context, source);
	}

	/* each higher level adds one more option on top of the previous ones */
	if (debug_flag < 2)
		return;
	SetConfigOption("log_statement", "all", context, source);

	if (debug_flag < 3)
		return;
	SetConfigOption("debug_print_parse", "true", context, source);

	if (debug_flag < 4)
		return;
	SetConfigOption("debug_print_plan", "true", context, source);

	if (debug_flag < 5)
		return;
	SetConfigOption("debug_print_rewritten", "true", context, source);
}


3068 3069 3070
/*
 * set_plan_disabling_options
 *
 * Turn off one planner method, selected by the first character of arg:
 *		s = seqscan, i = indexscan, b = bitmapscan, t = tidscan,
 *		n = nestloop, m = mergejoin, h = hashjoin
 *
 * Returns true after setting the matching enable_* option to "false", or
 * false (having set nothing) when the character is not recognized.
 */
bool
set_plan_disabling_options(const char *arg, GucContext context, GucSource source)
{
	const char *guc_name;

	switch (arg[0])
	{
		case 's':
			guc_name = "enable_seqscan";
			break;
		case 'i':
			guc_name = "enable_indexscan";
			break;
		case 'b':
			guc_name = "enable_bitmapscan";
			break;
		case 't':
			guc_name = "enable_tidscan";
			break;
		case 'n':
			guc_name = "enable_nestloop";
			break;
		case 'm':
			guc_name = "enable_mergejoin";
			break;
		case 'h':
			guc_name = "enable_hashjoin";
			break;
		default:
			/* unrecognized selector: report failure to the caller */
			return false;
	}

	SetConfigOption(guc_name, "false", context, source);
	return true;
}


/*
 * get_stats_option_name
 *		Map a statistics-switch argument to the name of the option it selects.
 *
 * Only the first two characters of arg are examined:
 *		"pa..."	-> "log_parser_stats"
 *		"pl..."	-> "log_planner_stats"
 *		"e..."	-> "log_executor_stats"
 *
 * Returns the option name as a string constant, or NULL when arg matches
 * none of the above.
 */
const char *
get_stats_option_name(const char *arg)
{
	switch (arg[0])
	{
		case 'p':

			/*
			 * Look at the argument we were handed, not at getopt's global
			 * optarg, so that the result depends only on the parameter.  A
			 * bare "p" is safe here: arg[1] is then the string terminator
			 * and matches neither letter.
			 */
			if (arg[1] == 'a')	/* "parser" */
				return "log_parser_stats";
			else if (arg[1] == 'l')		/* "planner" */
				return "log_planner_stats";
			break;

		case 'e':				/* "executor" */
			return "log_executor_stats";

		default:
			break;
	}

	return NULL;
}


3128
/* ----------------------------------------------------------------
3129 3130
 * process_postgres_switches
 *	   Parse command line arguments for PostgresMain
3131
 *
3132 3133 3134 3135 3136
 * This is called twice, once for the "secure" options coming from the
 * postmaster or command line, and once for the "insecure" options coming
 * from the client's startup packet.  The latter have the same syntax but
 * may be restricted in what they can do.
 *
3137
 * argv[0] is ignored in either case (it's assumed to be the program name).
3138 3139 3140 3141 3142 3143
 *
 * ctx is PGC_POSTMASTER for secure options, PGC_BACKEND for insecure options
 * coming from the client, or PGC_SUSET for insecure options coming from
 * a superuser client.
 *
 * Returns the database name extracted from the command line, if any.
3144 3145
 * ----------------------------------------------------------------
 */
3146
const char *
3147
process_postgres_switches(int argc, char *argv[], GucContext ctx)
3148
{
3149 3150
	const char *dbname;
	bool		secure = (ctx == PGC_POSTMASTER);
3151
	int			errs = 0;
3152
	GucSource	gucsource;
3153
	int			flag;
3154

3155
	if (secure)
3156
	{
3157
		gucsource = PGC_S_ARGV;			/* switches came from command line */
3158

3159 3160 3161 3162 3163 3164 3165 3166
		/* Ignore the initial --single argument, if present */
		if (argc > 1 && strcmp(argv[1], "--single") == 0)
		{
			argv++;
			argc--;
		}
	}
	else
3167
	{
3168
		gucsource = PGC_S_CLIENT;		/* switches came from client */
3169 3170
	}

3171
	/*
B
Bruce Momjian 已提交
3172 3173 3174
	 * Parse command-line options.	CAUTION: keep this in sync with
	 * postmaster/postmaster.c (the option sets should not conflict) and with
	 * the common help() function in main/main.c.
3175
	 */
3176
	while ((flag = getopt(argc, argv, "A:B:c:D:d:EeFf:h:ijk:lN:nOo:Pp:r:S:sTt:v:W:-:")) != -1)
3177
	{
3178 3179
		switch (flag)
		{
M
 
Marc G. Fournier 已提交
3180
			case 'A':
3181
				SetConfigOption("debug_assertions", optarg, ctx, gucsource);
M
 
Marc G. Fournier 已提交
3182
				break;
3183

3184
			case 'B':
3185
				SetConfigOption("shared_buffers", optarg, ctx, gucsource);
3186
				break;
3187

3188
			case 'D':
3189
				if (secure)
3190
					userDoption = strdup(optarg);
M
 
Marc G. Fournier 已提交
3191
				break;
3192

3193
			case 'd':
3194
				set_debug_options(atoi(optarg), ctx, gucsource);
3195
				break;
3196 3197

			case 'E':
3198
				EchoQuery = true;
3199
				break;
3200 3201

			case 'e':
3202
				SetConfigOption("datestyle", "euro", ctx, gucsource);
3203
				break;
3204 3205

			case 'F':
3206
				SetConfigOption("fsync", "false", ctx, gucsource);
3207
				break;
3208 3209

			case 'f':
3210 3211 3212
				if (!set_plan_disabling_options(optarg, ctx, gucsource))
					errs++;
				break;
3213

3214 3215
			case 'h':
				SetConfigOption("listen_addresses", optarg, ctx, gucsource);
3216 3217
				break;

3218 3219 3220
			case 'i':
				SetConfigOption("listen_addresses", "*", ctx, gucsource);
				break;
3221

3222
			case 'j':
3223 3224
				UseNewLine = 0;
				break;
3225

3226 3227 3228
			case 'k':
				SetConfigOption("unix_socket_directory", optarg, ctx, gucsource);
				break;
3229

3230 3231
			case 'l':
				SetConfigOption("ssl", "true", ctx, gucsource);
3232 3233
				break;

3234 3235 3236
			case 'N':
				SetConfigOption("max_connections", optarg, ctx, gucsource);
				break;
3237

3238 3239 3240 3241 3242 3243
			case 'n':
				/* ignored for consistency with postmaster */
				break;

			case 'O':
				SetConfigOption("allow_system_table_mods", "true", ctx, gucsource);
H
Hiroshi Inoue 已提交
3244 3245
				break;

T
Tom Lane 已提交
3246
			case 'o':
3247 3248
				errs++;
				break;
3249

3250 3251
			case 'P':
				SetConfigOption("ignore_system_indexes", "true", ctx, gucsource);
T
Tom Lane 已提交
3252 3253
				break;

3254
			case 'p':
3255 3256
				SetConfigOption("port", optarg, ctx, gucsource);
				break;
B
Bruce Momjian 已提交
3257

3258 3259
			case 'r':
				/* send output (stdout and stderr) to the given file */
3260
				if (secure)
3261
					strlcpy(OutputFileName, optarg, MAXPGPATH);
3262
				break;
3263

3264
			case 'S':
3265
				SetConfigOption("work_mem", optarg, ctx, gucsource);
3266
				break;
3267 3268

			case 's':
3269
				SetConfigOption("log_statement_stats", "true", ctx, gucsource);
M
 
Marc G. Fournier 已提交
3270 3271
				break;

3272 3273 3274 3275
			case 'T':
				/* ignored for consistency with postmaster */
				break;

3276
			case 't':
3277
				{
B
Bruce Momjian 已提交
3278 3279 3280
					const char *tmp = get_stats_option_name(optarg);

					if (tmp)
3281
						SetConfigOption(tmp, "true", ctx, gucsource);
3282
					else
B
Bruce Momjian 已提交
3283 3284
						errs++;
					break;
3285
				}
3286

3287
			case 'v':
3288 3289 3290 3291 3292 3293 3294
				/*
				 * -v is no longer used in normal operation, since
				 * FrontendProtocol is already set before we get here.
				 * We keep the switch only for possible use in standalone
				 * operation, in case we ever support using normal FE/BE
				 * protocol with a standalone backend.
				 */
3295 3296
				if (secure)
					FrontendProtocol = (ProtocolVersion) atoi(optarg);
3297 3298
				break;

M
 
Marc G. Fournier 已提交
3299
			case 'W':
3300 3301
				SetConfigOption("post_auth_delay", optarg, ctx, gucsource);
				break;
3302

3303
			case 'c':
3304
			case '-':
3305
				{
B
Bruce Momjian 已提交
3306 3307
					char	   *name,
							   *value;
3308

B
Bruce Momjian 已提交
3309 3310 3311 3312
					ParseLongOption(optarg, &name, &value);
					if (!value)
					{
						if (flag == '-')
3313 3314 3315 3316
							ereport(ERROR,
									(errcode(ERRCODE_SYNTAX_ERROR),
									 errmsg("--%s requires a value",
											optarg)));
B
Bruce Momjian 已提交
3317
						else
3318 3319 3320 3321
							ereport(ERROR,
									(errcode(ERRCODE_SYNTAX_ERROR),
									 errmsg("-c %s requires a value",
											optarg)));
B
Bruce Momjian 已提交
3322
					}
3323
					SetConfigOption(name, value, ctx, gucsource);
B
Bruce Momjian 已提交
3324 3325 3326 3327 3328
					free(name);
					if (value)
						free(value);
					break;
				}
3329

3330 3331
			default:
				errs++;
T
Tom Lane 已提交
3332
				break;
3333
		}
3334 3335
	}

3336
	/*
3337 3338
	 * Should be no more arguments except an optional database name, and
	 * that's only in the secure case.
3339
	 */
3340
	if (errs || argc - optind > 1 || (argc != optind && !secure))
3341
	{
3342 3343 3344 3345 3346
		/* spell the error message a bit differently depending on context */
		if (IsUnderPostmaster)
			ereport(FATAL,
					(errcode(ERRCODE_SYNTAX_ERROR),
				 errmsg("invalid command-line arguments for server process"),
3347
			   errhint("Try \"%s --help\" for more information.", progname)));
3348 3349 3350 3351
		else
			ereport(FATAL,
					(errcode(ERRCODE_SYNTAX_ERROR),
					 errmsg("%s: invalid command-line arguments",
3352 3353
							progname),
			   errhint("Try \"%s --help\" for more information.", progname)));
3354
	}
3355

3356 3357 3358 3359
	if (argc - optind == 1)
		dbname = strdup(argv[optind]);
	else
		dbname = NULL;
3360

3361 3362 3363 3364 3365 3366 3367 3368
	/*
	 * Reset getopt(3) library so that it will work correctly in subprocesses
	 * or when this function is called a second time with another array.
	 */
	optind = 1;
#ifdef HAVE_INT_OPTRESET
	optreset = 1;				/* some systems need this too */
#endif
3369

3370 3371
	return dbname;
}
3372

3373 3374 3375 3376 3377 3378 3379 3380 3381 3382 3383 3384 3385 3386 3387 3388 3389 3390 3391 3392 3393 3394 3395 3396 3397 3398 3399 3400 3401 3402 3403 3404 3405 3406 3407 3408 3409 3410 3411 3412 3413 3414 3415 3416 3417 3418 3419 3420 3421 3422 3423 3424 3425 3426 3427 3428 3429 3430 3431 3432 3433 3434 3435 3436 3437 3438 3439 3440 3441 3442 3443 3444 3445 3446 3447

/* ----------------------------------------------------------------
 * PostgresMain
 *	   postgres main loop -- all backends, interactive or otherwise start here
 *
 * argc/argv are the command line arguments to be used.  (When being forked
 * by the postmaster, these are not the original argv array of the process.)
 * username is the (possibly authenticated) PostgreSQL user name to be used
 * for the session.
 * ----------------------------------------------------------------
 */
int
PostgresMain(int argc, char *argv[], const char *username)
{
	const char *dbname;
	int			firstchar;
	char		stack_base;
	StringInfoData input_message;
	sigjmp_buf	local_sigjmp_buf;
	volatile bool send_ready_for_query = true;

	/*
	 * Initialize globals (already done if under postmaster, but not if
	 * standalone).
	 */
	if (!IsUnderPostmaster)
	{
		MyProcPid = getpid();

		MyStartTime = time(NULL);
	}

	/*
	 * Fire up essential subsystems: error and memory management
	 *
	 * If we are running under the postmaster, this is done already.
	 */
	if (!IsUnderPostmaster)
		MemoryContextInit();

	SetProcessingMode(InitProcessing);

	/* Set up reference point for stack depth checking */
	stack_base_ptr = &stack_base;

	/* Compute paths, if we didn't inherit them from postmaster */
	if (my_exec_path[0] == '\0')
	{
		if (find_my_exec(argv[0], my_exec_path) < 0)
			elog(FATAL, "%s: could not locate my own executable path",
				 argv[0]);
	}

	if (pkglib_path[0] == '\0')
		get_pkglib_path(my_exec_path, pkglib_path);

	/*
	 * Set default values for command-line options.
	 */
	if (!IsUnderPostmaster)
		InitializeGUCOptions();

	/*
	 * Parse command-line options.
	 */
	dbname = process_postgres_switches(argc, argv, PGC_POSTMASTER);

	/* Must have gotten a database name, or have a default (the username) */
	if (dbname == NULL)
	{
		dbname = username;
		if (dbname == NULL)
			ereport(FATAL,
				(errcode(ERRCODE_INVALID_PARAMETER_VALUE),
				 errmsg("%s: no database nor user name specified",
3448
						progname)));
3449 3450
	}

3451 3452
	/* Acquire configuration parameters, unless inherited from postmaster */
	if (!IsUnderPostmaster)
3453
	{
3454
		if (!SelectConfigFiles(userDoption, progname))
3455
			proc_exit(1);
3456 3457
		/* If timezone is not set, determine what the OS uses */
		pg_timezone_initialize();
3458 3459
		/* If timezone_abbreviations is not set, select default */
		pg_timezone_abbrev_initialize();
3460
	}
3461

3462 3463 3464 3465 3466
	/*
	 * You might expect to see a setsid() call here, but it's not needed,
	 * because if we are under a postmaster then BackendInitialize() did it.
	 */

3467
	/*
3468
	 * Set up signal handlers and masks.
3469
	 *
3470 3471 3472
	 * Note that postmaster blocked all signals before forking child process,
	 * so there is no race condition whereby we might receive a signal before
	 * we have set up the handler.
T
Tom Lane 已提交
3473
	 *
B
Bruce Momjian 已提交
3474 3475 3476 3477 3478 3479
	 * Also note: it's best not to use any signals that are SIG_IGNored in the
	 * postmaster.	If such a signal arrives before we are able to change the
	 * handler to non-SIG_IGN, it'll get dropped.  Instead, make a dummy
	 * handler in the postmaster to reserve the signal. (Of course, this isn't
	 * an issue for signals that are locally generated, such as SIGALRM and
	 * SIGPIPE.)
3480
	 */
3481 3482
	if (am_walsender)
		WalSndSignals();
3483
	else
3484 3485 3486 3487
	{
		pqsignal(SIGHUP, SigHupHandler);	/* set flag to read config file */
		pqsignal(SIGINT, StatementCancelHandler);	/* cancel current query */
		pqsignal(SIGTERM, die);		/* cancel current query and exit */
3488

3489 3490 3491 3492 3493 3494 3495 3496 3497 3498
		/*
		 * In a standalone backend, SIGQUIT can be generated from the keyboard
		 * easily, while SIGTERM cannot, so we make both signals do die() rather
		 * than quickdie().
		 */
		if (IsUnderPostmaster)
			pqsignal(SIGQUIT, quickdie);	/* hard crash time */
		else
			pqsignal(SIGQUIT, die); /* cancel current query and exit */
		pqsignal(SIGALRM, handle_sig_alarm);		/* timeout conditions */
3499

3500 3501 3502 3503 3504 3505 3506 3507 3508 3509 3510 3511 3512 3513 3514 3515
		/*
		 * Ignore failure to write to frontend. Note: if frontend closes
		 * connection, we will notice it and exit cleanly when control next
		 * returns to outer loop.  This seems safer than forcing exit in the midst
		 * of output during who-knows-what operation...
		 */
		pqsignal(SIGPIPE, SIG_IGN);
		pqsignal(SIGUSR1, procsignal_sigusr1_handler);
		pqsignal(SIGUSR2, SIG_IGN);
		pqsignal(SIGFPE, FloatExceptionHandler);

		/*
		 * Reset some signals that are accepted by postmaster but not by backend
		 */
		pqsignal(SIGCHLD, SIG_DFL); /* system() requires this on some platforms */
	}
3516

3517 3518
	pqinitmask();

3519 3520 3521 3522 3523
	if (IsUnderPostmaster)
	{
		/* We allow SIGQUIT (quickdie) at all times */
		sigdelset(&BlockSig, SIGQUIT);
	}
3524

T
Tom Lane 已提交
3525
	PG_SETMASK(&BlockSig);		/* block everything except SIGQUIT */
3526

3527
	if (IsUnderPostmaster)
3528
	{
3529
		BaseInit();
3530
	}
3531
	else
3532
	{
3533
		/*
B
Bruce Momjian 已提交
3534 3535
		 * Validate we have been given a reasonable-looking DataDir (if under
		 * postmaster, assume postmaster did this already).
3536
		 */
3537
		Assert(DataDir);
3538 3539
		ValidatePgVersion(DataDir);

3540 3541 3542
		/* Change into DataDir (if under postmaster, was done already) */
		ChangeToDataDir();

3543
		/*
3544
		 * Create lockfile for data directory.
3545
		 */
3546
		CreateDataDirLockFile(false);
3547

3548
		BaseInit();
3549 3550 3551 3552 3553

		/*
		 * Start up xlog for standalone backend, and register to have it
		 * closed down at exit.
		 */
3554
		StartupXLOG();
3555
		on_shmem_exit(ShutdownXLOG, 0);
3556 3557
	}

3558
	/*
B
Bruce Momjian 已提交
3559 3560 3561 3562
	 * Create a per-backend PGPROC struct in shared memory, except in the
	 * EXEC_BACKEND case where this was done in SubPostmasterMain. We must do
	 * this before we can use LWLocks (and in the EXEC_BACKEND case we already
	 * had to do some stuff with LWLocks).
3563 3564 3565 3566 3567 3568 3569 3570
	 */
#ifdef EXEC_BACKEND
	if (!IsUnderPostmaster)
		InitProcess();
#else
	InitProcess();
#endif

3571 3572 3573
	/* We need to allow SIGINT, etc during the initial transaction */
	PG_SETMASK(&UnBlockSig);

3574
	/*
3575 3576
	 * General initialization.
	 *
3577 3578 3579
	 * NOTE: if you are tempted to add code in this vicinity, consider putting
	 * it inside InitPostgres() instead.  In particular, anything that
	 * involves database access should be there, not here.
3580
	 */
3581
	InitPostgres(dbname, InvalidOid, username, NULL);
3582

3583 3584 3585 3586 3587 3588 3589 3590 3591 3592 3593 3594 3595
	/*
	 * If the PostmasterContext is still around, recycle the space; we don't
	 * need it anymore after InitPostgres completes.  Note this does not trash
	 * *MyProcPort, because ConnCreate() allocated that space with malloc()
	 * ... else we'd need to copy the Port data first.  Also, subsidiary data
	 * such as the username isn't lost either; see ProcessStartupPacket().
	 */
	if (PostmasterContext)
	{
		MemoryContextDelete(PostmasterContext);
		PostmasterContext = NULL;
	}

3596
	SetProcessingMode(NormalProcessing);
3597

3598 3599 3600 3601 3602 3603
	/*
	 * Now all GUC states are fully set up.  Report them to client if
	 * appropriate.
	 */
	BeginReportingGUCOptions();

3604
	/*
B
Bruce Momjian 已提交
3605 3606
	 * Also set up handler to log session end; we have to wait till now to be
	 * sure Log_disconnections has its final value.
3607 3608 3609 3610
	 */
	if (IsUnderPostmaster && Log_disconnections)
		on_proc_exit(log_disconnections, 0);

3611 3612 3613 3614
	/* If this is a WAL sender process, we're done with initialization. */
	if (am_walsender)
		proc_exit(WalSenderMain());

3615
	/*
B
Bruce Momjian 已提交
3616 3617
	 * process any libraries that should be preloaded at backend start (this
	 * likewise can't be done until GUC settings are complete)
3618 3619 3620
	 */
	process_local_preload_libraries();

3621 3622
	/*
	 * Send this backend's cancellation info to the frontend.
3623
	 */
3624
	if (whereToSendOutput == DestRemote &&
M
 
Marc G. Fournier 已提交
3625 3626
		PG_PROTOCOL_MAJOR(FrontendProtocol) >= 2)
	{
3627
		StringInfoData buf;
B
Bruce Momjian 已提交
3628

3629
		pq_beginmessage(&buf, 'K');
3630 3631 3632
		pq_sendint(&buf, (int32) MyProcPid, sizeof(int32));
		pq_sendint(&buf, (int32) MyCancelKey, sizeof(int32));
		pq_endmessage(&buf);
M
 
Marc G. Fournier 已提交
3633 3634 3635
		/* Need not flush since ReadyForQuery will do it. */
	}

3636
	/* Welcome banner for standalone case */
3637
	if (whereToSendOutput == DestDebug)
3638
		printf("\nPostgreSQL stand-alone backend %s\n", PG_VERSION);
3639

3640 3641 3642
	/*
	 * Create the memory context we will use in the main loop.
	 *
3643 3644
	 * MessageContext is reset once per iteration of the main loop, ie, upon
	 * completion of processing of each command message from the client.
3645
	 */
3646 3647 3648 3649 3650
	MessageContext = AllocSetContextCreate(TopMemoryContext,
										   "MessageContext",
										   ALLOCSET_DEFAULT_MINSIZE,
										   ALLOCSET_DEFAULT_INITSIZE,
										   ALLOCSET_DEFAULT_MAXSIZE);
3651

3652
	/*
3653
	 * Remember stand-alone backend startup time
3654 3655
	 */
	if (!IsUnderPostmaster)
3656
		PgStartTime = GetCurrentTimestamp();
3657

3658 3659
	/*
	 * POSTGRES main processing loop begins here
3660
	 *
B
Bruce Momjian 已提交
3661 3662
	 * If an exception is encountered, processing resumes here so we abort the
	 * current transaction and start a new one.
3663
	 *
3664 3665 3666 3667 3668 3669 3670
	 * You might wonder why this isn't coded as an infinite loop around a
	 * PG_TRY construct.  The reason is that this is the bottom of the
	 * exception stack, and so with PG_TRY there would be no exception handler
	 * in force at all during the CATCH part.  By leaving the outermost setjmp
	 * always active, we have at least some chance of recovering from an error
	 * during error recovery.  (If we get into an infinite loop thereby, it
	 * will soon be stopped by overflow of elog.c's internal state stack.)
3671 3672
	 */

3673
	if (sigsetjmp(local_sigjmp_buf, 1) != 0)
3674
	{
3675
		/*
3676
		 * NOTE: if you are tempted to add more code in this if-block,
3677
		 * consider the high probability that it should be in
B
Bruce Momjian 已提交
3678
		 * AbortTransaction() instead.	The only stuff done directly here
B
Bruce Momjian 已提交
3679 3680
		 * should be stuff that is guaranteed to apply *only* for outer-level
		 * error recovery, such as adjusting the FE/BE protocol status.
3681 3682 3683 3684 3685 3686 3687 3688 3689
		 */

		/* Since not using PG_TRY, must reset error stack by hand */
		error_context_stack = NULL;

		/* Prevent interrupts while cleaning up */
		HOLD_INTERRUPTS();

		/*
B
Bruce Momjian 已提交
3690 3691
		 * Forget any pending QueryCancel request, since we're returning to
		 * the idle loop anyway, and cancel the statement timer if running.
3692 3693
		 */
		QueryCancelPending = false;
3694
		disable_sig_alarm(true);
B
Bruce Momjian 已提交
3695
		QueryCancelPending = false;		/* again in case timeout occurred */
3696 3697

		/*
B
Bruce Momjian 已提交
3698 3699 3700
		 * Turn off these interrupts too.  This is only needed here and not in
		 * other exception-catching places since these interrupts are only
		 * enabled while we wait for client input.
3701
		 */
3702
		DoingCommandRead = false;
3703
		DisableNotifyInterrupt();
3704
		DisableCatchupInterrupt();
3705

3706 3707 3708
		/* Make sure libpq is in a good state */
		pq_comm_reset();

3709 3710
		/* Report the error to the client and/or server log */
		EmitErrorReport();
3711

3712
		/*
B
Bruce Momjian 已提交
3713 3714
		 * Make sure debug_query_string gets reset before we possibly clobber
		 * the storage it points at.
3715
		 */
3716
		debug_query_string = NULL;
3717

3718
		/*
3719
		 * Abort the current transaction in order to recover.
3720
		 */
3721
		AbortCurrentTransaction();
3722 3723

		/*
B
Bruce Momjian 已提交
3724 3725
		 * Now return to normal top-level context and clear ErrorContext for
		 * next time.
3726 3727
		 */
		MemoryContextSwitchTo(TopMemoryContext);
3728
		FlushErrorState();
3729

3730
		/*
B
Bruce Momjian 已提交
3731 3732
		 * If we were handling an extended-query-protocol message, initiate
		 * skip till next Sync.  This also causes us not to issue
B
Bruce Momjian 已提交
3733
		 * ReadyForQuery (until we get Sync).
3734 3735 3736
		 */
		if (doing_extended_query_message)
			ignore_till_sync = true;
3737

3738 3739
		/* We don't have a transaction command open anymore */
		xact_started = false;
3740

3741
		/* Now we can allow interrupts again */
3742
		RESUME_INTERRUPTS();
3743
	}
3744

3745 3746
	/* We can now handle ereport(ERROR) */
	PG_exception_stack = &local_sigjmp_buf;
3747

3748
	if (!ignore_till_sync)
B
Bruce Momjian 已提交
3749
		send_ready_for_query = true;	/* initially, or after error */
3750

3751 3752
	/*
	 * Non-error queries loop here.
3753 3754 3755 3756
	 */

	for (;;)
	{
3757
		/*
B
Bruce Momjian 已提交
3758 3759
		 * At top of loop, reset extended-query-message flag, so that any
		 * errors encountered in "idle" state don't provoke skip.
3760 3761 3762
		 */
		doing_extended_query_message = false;

3763
		/*
B
Bruce Momjian 已提交
3764 3765
		 * Release storage left over from prior query cycle, and create a new
		 * query input buffer in the cleared MessageContext.
3766
		 */
3767 3768
		MemoryContextSwitchTo(MessageContext);
		MemoryContextResetAndDeleteChildren(MessageContext);
3769

3770
		initStringInfo(&input_message);
3771

3772
		/*
B
Bruce Momjian 已提交
3773 3774
		 * (1) If we've reached idle state, tell the frontend we're ready for
		 * a new query.
3775
		 *
3776
		 * Note: this includes fflush()'ing the last of the prior output.
3777 3778 3779
		 *
		 * This is also a good time to send collected statistics to the
		 * collector, and to update the PS stats display.  We avoid doing
B
Bruce Momjian 已提交
3780 3781 3782
		 * those every time through the message loop because it'd slow down
		 * processing of batched messages, and because we don't want to report
		 * uncommitted updates (that confuses autovacuum).
B
Bruce Momjian 已提交
3783
		 */
3784
		if (send_ready_for_query)
3785
		{
3786 3787 3788 3789 3790 3791
			if (IsAbortedTransactionBlockState())
			{
				set_ps_display("idle in transaction (aborted)", false);
				pgstat_report_activity("<IDLE> in transaction (aborted)");
			}
			else if (IsTransactionOrTransactionBlock())
3792
			{
3793
				set_ps_display("idle in transaction", false);
3794 3795 3796 3797
				pgstat_report_activity("<IDLE> in transaction");
			}
			else
			{
3798
				pgstat_report_stat(false);
3799

3800
				set_ps_display("idle", false);
3801 3802
				pgstat_report_activity("<IDLE>");
			}
3803

3804
			ReadyForQuery(whereToSendOutput);
3805
			send_ready_for_query = false;
3806
		}
3807

3808
		/*
B
Bruce Momjian 已提交
3809 3810 3811 3812
		 * (2) Allow asynchronous signals to be executed immediately if they
		 * come in while we are waiting for client input. (This must be
		 * conditional since we don't want, say, reads on behalf of COPY FROM
		 * STDIN doing the same thing.)
3813
		 */
3814
		DoingCommandRead = true;
3815

3816 3817
		/*
		 * (3) read a command (loop blocks here)
3818
		 */
3819
		firstchar = ReadCommand(&input_message);
3820

3821 3822
		/*
		 * (4) disable async signal conditions again.
3823
		 */
3824
		DoingCommandRead = false;
3825

3826
		/*
B
Bruce Momjian 已提交
3827 3828
		 * (5) check for any other interesting events that happened while we
		 * slept.
3829 3830 3831 3832 3833 3834 3835
		 */
		if (got_SIGHUP)
		{
			got_SIGHUP = false;
			ProcessConfigFile(PGC_SIGHUP);
		}

3836
		/*
B
Bruce Momjian 已提交
3837 3838
		 * (6) process the command.  But ignore it if we're skipping till
		 * Sync.
3839
		 */
3840
		if (ignore_till_sync && firstchar != EOF)
3841 3842
			continue;

3843 3844
		switch (firstchar)
		{
3845
			case 'Q':			/* simple query */
3846
				{
3847 3848
					const char *query_string;

3849 3850 3851
					/* Set statement_timestamp() */
					SetCurrentStatementStartTimestamp();

3852 3853
					query_string = pq_getmsgstring(&input_message);
					pq_getmsgend(&input_message);
3854

3855
					exec_simple_query(query_string);
3856

3857
					send_ready_for_query = true;
3858
				}
3859 3860
				break;

3861 3862 3863 3864 3865 3866 3867
			case 'P':			/* parse */
				{
					const char *stmt_name;
					const char *query_string;
					int			numParams;
					Oid		   *paramTypes = NULL;

3868 3869 3870
					/* Set statement_timestamp() */
					SetCurrentStatementStartTimestamp();

3871 3872 3873
					stmt_name = pq_getmsgstring(&input_message);
					query_string = pq_getmsgstring(&input_message);
					numParams = pq_getmsgint(&input_message, 2);
3874 3875
					if (numParams > 0)
					{
B
Bruce Momjian 已提交
3876
						int			i;
3877 3878 3879

						paramTypes = (Oid *) palloc(numParams * sizeof(Oid));
						for (i = 0; i < numParams; i++)
3880
							paramTypes[i] = pq_getmsgint(&input_message, 4);
3881
					}
3882
					pq_getmsgend(&input_message);
3883 3884 3885 3886 3887 3888 3889

					exec_parse_message(query_string, stmt_name,
									   paramTypes, numParams);
				}
				break;

			case 'B':			/* bind */
3890 3891
				/* Set statement_timestamp() */
				SetCurrentStatementStartTimestamp();
B
Bruce Momjian 已提交
3892

3893
				/*
B
Bruce Momjian 已提交
3894 3895
				 * this message is complex enough that it seems best to put
				 * the field extraction out-of-line
3896
				 */
3897
				exec_bind_message(&input_message);
3898 3899 3900 3901 3902
				break;

			case 'E':			/* execute */
				{
					const char *portal_name;
3903
					int			max_rows;
3904

3905 3906 3907
					/* Set statement_timestamp() */
					SetCurrentStatementStartTimestamp();

3908
					portal_name = pq_getmsgstring(&input_message);
3909
					max_rows = pq_getmsgint(&input_message, 4);
3910
					pq_getmsgend(&input_message);
3911

3912
					exec_execute_message(portal_name, max_rows);
3913 3914 3915
				}
				break;

3916
			case 'F':			/* fastpath function call */
3917 3918 3919
				/* Set statement_timestamp() */
				SetCurrentStatementStartTimestamp();

3920
				/* Tell the collector what we're doing */
3921 3922
				pgstat_report_activity("<FASTPATH> function call");

3923
				/* start an xact for this function invocation */
3924
				start_xact_command();
3925

3926 3927
				/*
				 * Note: we may at this point be inside an aborted
B
Bruce Momjian 已提交
3928 3929
				 * transaction.  We can't throw error for that until we've
				 * finished reading the function-call message, so
3930 3931 3932 3933 3934
				 * HandleFunctionRequest() must check for it after doing so.
				 * Be careful not to do anything that assumes we're inside a
				 * valid transaction here.
				 */

3935 3936 3937
				/* switch back to message context */
				MemoryContextSwitchTo(MessageContext);

3938
				if (HandleFunctionRequest(&input_message) == EOF)
3939 3940
				{
					/* lost frontend connection during F message input */
B
Bruce Momjian 已提交
3941

3942
					/*
3943
					 * Reset whereToSendOutput to prevent ereport from
B
Bruce Momjian 已提交
3944
					 * attempting to send any more messages to client.
3945
					 */
3946 3947
					if (whereToSendOutput == DestRemote)
						whereToSendOutput = DestNone;
3948

3949
					proc_exit(0);
3950
				}
3951 3952

				/* commit the function-invocation transaction */
3953
				finish_xact_command();
3954

3955
				send_ready_for_query = true;
3956 3957
				break;

B
Bruce Momjian 已提交
3958
			case 'C':			/* close */
3959
				{
B
Bruce Momjian 已提交
3960
					int			close_type;
3961 3962
					const char *close_target;

3963 3964 3965
					close_type = pq_getmsgbyte(&input_message);
					close_target = pq_getmsgstring(&input_message);
					pq_getmsgend(&input_message);
3966 3967 3968 3969 3970 3971 3972 3973 3974

					switch (close_type)
					{
						case 'S':
							if (close_target[0] != '\0')
								DropPreparedStatement(close_target, false);
							else
							{
								/* special-case the unnamed statement */
3975
								drop_unnamed_stmt();
3976 3977 3978 3979 3980 3981 3982 3983 3984 3985 3986 3987
							}
							break;
						case 'P':
							{
								Portal		portal;

								portal = GetPortalByName(close_target);
								if (PortalIsValid(portal))
									PortalDrop(portal, false);
							}
							break;
						default:
3988 3989
							ereport(ERROR,
									(errcode(ERRCODE_PROTOCOL_VIOLATION),
B
Bruce Momjian 已提交
3990 3991
								   errmsg("invalid CLOSE message subtype %d",
										  close_type)));
3992 3993 3994
							break;
					}

3995
					if (whereToSendOutput == DestRemote)
B
Bruce Momjian 已提交
3996
						pq_putemptymessage('3');		/* CloseComplete */
3997 3998 3999 4000 4001
				}
				break;

			case 'D':			/* describe */
				{
B
Bruce Momjian 已提交
4002
					int			describe_type;
4003 4004
					const char *describe_target;

4005 4006 4007
					/* Set statement_timestamp() (needed for xact) */
					SetCurrentStatementStartTimestamp();

4008 4009 4010
					describe_type = pq_getmsgbyte(&input_message);
					describe_target = pq_getmsgstring(&input_message);
					pq_getmsgend(&input_message);
4011 4012 4013 4014 4015 4016 4017 4018 4019 4020

					switch (describe_type)
					{
						case 'S':
							exec_describe_statement_message(describe_target);
							break;
						case 'P':
							exec_describe_portal_message(describe_target);
							break;
						default:
4021 4022
							ereport(ERROR,
									(errcode(ERRCODE_PROTOCOL_VIOLATION),
B
Bruce Momjian 已提交
4023 4024
								errmsg("invalid DESCRIBE message subtype %d",
									   describe_type)));
4025 4026 4027 4028 4029
							break;
					}
				}
				break;

B
Bruce Momjian 已提交
4030
			case 'H':			/* flush */
4031
				pq_getmsgend(&input_message);
4032
				if (whereToSendOutput == DestRemote)
4033 4034 4035
					pq_flush();
				break;

B
Bruce Momjian 已提交
4036
			case 'S':			/* sync */
4037
				pq_getmsgend(&input_message);
4038
				finish_xact_command();
4039
				send_ready_for_query = true;
4040 4041
				break;

4042
				/*
B
Bruce Momjian 已提交
4043 4044 4045
				 * 'X' means that the frontend is closing down the socket. EOF
				 * means unexpected loss of frontend connection. Either way,
				 * perform normal shutdown.
4046 4047
				 */
			case 'X':
4048
			case EOF:
B
Bruce Momjian 已提交
4049

4050
				/*
B
Bruce Momjian 已提交
4051 4052
				 * Reset whereToSendOutput to prevent ereport from attempting
				 * to send any more messages to client.
4053
				 */
4054 4055
				if (whereToSendOutput == DestRemote)
					whereToSendOutput = DestNone;
B
Bruce Momjian 已提交
4056

4057 4058
				/*
				 * NOTE: if you are tempted to add more code here, DON'T!
B
Bruce Momjian 已提交
4059
				 * Whatever you had in mind to do should be set up as an
B
Bruce Momjian 已提交
4060 4061 4062
				 * on_proc_exit or on_shmem_exit callback, instead. Otherwise
				 * it will fail to be called during other backend-shutdown
				 * scenarios.
4063
				 */
4064
				proc_exit(0);
4065

B
Bruce Momjian 已提交
4066 4067 4068 4069
			case 'd':			/* copy data */
			case 'c':			/* copy done */
			case 'f':			/* copy fail */

4070
				/*
B
Bruce Momjian 已提交
4071
				 * Accept but ignore these messages, per protocol spec; we
B
Bruce Momjian 已提交
4072 4073
				 * probably got here because a COPY failed, and the frontend
				 * is still sending data.
4074 4075 4076
				 */
				break;

4077
			default:
4078 4079 4080 4081
				ereport(FATAL,
						(errcode(ERRCODE_PROTOCOL_VIOLATION),
						 errmsg("invalid frontend message type %d",
								firstchar)));
4082
		}
4083
	}							/* end of input-reading loop */
4084

4085 4086
	/* can't get here because the above loop never exits */
	Assert(false);
4087

4088
	return 1;					/* keep compiler quiet */
4089 4090
}

4091 4092 4093 4094 4095 4096 4097 4098 4099 4100 4101 4102 4103 4104 4105 4106 4107 4108 4109 4110 4111 4112 4113 4114 4115

/*
 * Obtain platform stack depth limit (in bytes)
 *
 * Return -1 if unlimited or not known.
 *
 * Where getrlimit() is available the answer is computed on the first call
 * and cached in a function-local static.  A limit too large to fit in a
 * long is clamped to the largest positive long instead of being allowed to
 * wrap around.
 */
long
get_stack_depth_rlimit(void)
{
#if defined(HAVE_GETRLIMIT) && defined(RLIMIT_STACK)
	static long val = 0;

	/* This won't change after process launch, so check just once */
	if (val == 0)
	{
		/* largest value a long can hold, computed without <limits.h> */
		const unsigned long max_long = ~0UL >> 1;
		struct rlimit rlim;

		if (getrlimit(RLIMIT_STACK, &rlim) < 0)
			val = -1;
		else if (rlim.rlim_cur == RLIM_INFINITY)
			val = -1;
		/* rlim_cur is probably of an unsigned type, so check for overflow */
		else if (rlim.rlim_cur >= max_long)
			val = (long) max_long;
		else
			val = rlim.rlim_cur;
	}
	return val;
#else							/* no getrlimit */
#if defined(WIN32) || defined(__CYGWIN__)
	/* On Windows we set the backend stack size in src/backend/Makefile */
	return WIN32_STACK_RLIMIT;
#else							/* not windows ... give up */
	return -1;
#endif
#endif
}

4126

4127 4128
/*
 * Baseline snapshots taken by ResetUsage(): process resource usage and
 * wall-clock time.  ShowUsage() reports its figures relative to these.
 */
static struct rusage Save_r;
static struct timeval Save_t;

/*
 * ResetUsage
 *	   Record the current resource usage of this process and the current
 *	   time of day as the new baseline in Save_r and Save_t.
 */
void
ResetUsage(void)
{
	getrusage(RUSAGE_SELF, &Save_r);
	gettimeofday(&Save_t, NULL);
}

void
4138
ShowUsage(const char *title)
4139
{
4140
	StringInfoData str;
4141 4142 4143 4144
	struct timeval user,
				sys;
	struct timeval elapse_t;
	struct rusage r;
4145 4146

	getrusage(RUSAGE_SELF, &r);
4147
	gettimeofday(&elapse_t, NULL);
4148 4149
	memcpy((char *) &user, (char *) &r.ru_utime, sizeof(user));
	memcpy((char *) &sys, (char *) &r.ru_stime, sizeof(sys));
4150 4151 4152 4153 4154 4155 4156 4157 4158 4159 4160 4161 4162 4163 4164 4165 4166 4167
	if (elapse_t.tv_usec < Save_t.tv_usec)
	{
		elapse_t.tv_sec--;
		elapse_t.tv_usec += 1000000;
	}
	if (r.ru_utime.tv_usec < Save_r.ru_utime.tv_usec)
	{
		r.ru_utime.tv_sec--;
		r.ru_utime.tv_usec += 1000000;
	}
	if (r.ru_stime.tv_usec < Save_r.ru_stime.tv_usec)
	{
		r.ru_stime.tv_sec--;
		r.ru_stime.tv_usec += 1000000;
	}

	/*
	 * the only stats we don't show here are for memory usage -- i can't
B
Bruce Momjian 已提交
4168 4169 4170 4171
	 * figure out how to interpret the relevant fields in the rusage struct,
	 * and they change names across o/s platforms, anyway. if you can figure
	 * out what the entries mean, you can somehow extract resident set size,
	 * shared text size, and unshared data and stack sizes.
4172
	 */
4173
	initStringInfo(&str);
4174

4175 4176
	appendStringInfo(&str, "! system usage stats:\n");
	appendStringInfo(&str,
B
Bruce Momjian 已提交
4177
				"!\t%ld.%06ld elapsed %ld.%06ld user %ld.%06ld system sec\n",
4178 4179 4180
					 (long) (elapse_t.tv_sec - Save_t.tv_sec),
					 (long) (elapse_t.tv_usec - Save_t.tv_usec),
					 (long) (r.ru_utime.tv_sec - Save_r.ru_utime.tv_sec),
B
Bruce Momjian 已提交
4181
					 (long) (r.ru_utime.tv_usec - Save_r.ru_utime.tv_usec),
4182
					 (long) (r.ru_stime.tv_sec - Save_r.ru_stime.tv_sec),
B
Bruce Momjian 已提交
4183
					 (long) (r.ru_stime.tv_usec - Save_r.ru_stime.tv_usec));
4184
	appendStringInfo(&str,
B
Bruce Momjian 已提交
4185
					 "!\t[%ld.%06ld user %ld.%06ld sys total]\n",
4186 4187 4188 4189
					 (long) user.tv_sec,
					 (long) user.tv_usec,
					 (long) sys.tv_sec,
					 (long) sys.tv_usec);
4190
#if defined(HAVE_GETRUSAGE)
4191
	appendStringInfo(&str,
B
Bruce Momjian 已提交
4192 4193
					 "!\t%ld/%ld [%ld/%ld] filesystem blocks in/out\n",
					 r.ru_inblock - Save_r.ru_inblock,
4194
	/* they only drink coffee at dec */
B
Bruce Momjian 已提交
4195 4196
					 r.ru_oublock - Save_r.ru_oublock,
					 r.ru_inblock, r.ru_oublock);
4197
	appendStringInfo(&str,
B
Bruce Momjian 已提交
4198
			  "!\t%ld/%ld [%ld/%ld] page faults/reclaims, %ld [%ld] swaps\n",
B
Bruce Momjian 已提交
4199 4200 4201 4202 4203
					 r.ru_majflt - Save_r.ru_majflt,
					 r.ru_minflt - Save_r.ru_minflt,
					 r.ru_majflt, r.ru_minflt,
					 r.ru_nswap - Save_r.ru_nswap,
					 r.ru_nswap);
4204
	appendStringInfo(&str,
B
Bruce Momjian 已提交
4205
		 "!\t%ld [%ld] signals rcvd, %ld/%ld [%ld/%ld] messages rcvd/sent\n",
B
Bruce Momjian 已提交
4206 4207 4208 4209 4210
					 r.ru_nsignals - Save_r.ru_nsignals,
					 r.ru_nsignals,
					 r.ru_msgrcv - Save_r.ru_msgrcv,
					 r.ru_msgsnd - Save_r.ru_msgsnd,
					 r.ru_msgrcv, r.ru_msgsnd);
4211
	appendStringInfo(&str,
B
Bruce Momjian 已提交
4212
			 "!\t%ld/%ld [%ld/%ld] voluntary/involuntary context switches\n",
B
Bruce Momjian 已提交
4213 4214 4215
					 r.ru_nvcsw - Save_r.ru_nvcsw,
					 r.ru_nivcsw - Save_r.ru_nivcsw,
					 r.ru_nvcsw, r.ru_nivcsw);
4216
#endif   /* HAVE_GETRUSAGE */
4217 4218

	/* remove trailing newline */
B
Bruce Momjian 已提交
4219
	if (str.data[str.len - 1] == '\n')
4220 4221
		str.data[--str.len] = '\0';

4222 4223 4224
	ereport(LOG,
			(errmsg_internal("%s", title),
			 errdetail("%s", str.data)));
4225 4226

	pfree(str.data);
4227
}
4228 4229 4230 4231

/*
 * on_proc_exit handler to log end of session
 */
B
Bruce Momjian 已提交
4232
static void
4233
log_disconnections(int code, Datum arg)
4234
{
B
Bruce Momjian 已提交
4235
	Port	   *port = MyProcPort;
4236 4237 4238
	long		secs;
	int			usecs;
	int			msecs;
B
Bruce Momjian 已提交
4239 4240 4241
	int			hours,
				minutes,
				seconds;
4242

4243 4244 4245 4246
	TimestampDifference(port->SessionStartTime,
						GetCurrentTimestamp(),
						&secs, &usecs);
	msecs = usecs / 1000;
4247

4248 4249 4250 4251
	hours = secs / SECS_PER_HOUR;
	secs %= SECS_PER_HOUR;
	minutes = secs / SECS_PER_MINUTE;
	seconds = secs % SECS_PER_MINUTE;
4252

4253
	ereport(LOG,
4254
			(errmsg("disconnection: session time: %d:%02d:%02d.%03d "
4255
					"user=%s database=%s host=%s%s%s",
4256
					hours, minutes, seconds, msecs,
4257
					port->user_name, port->database_name, port->remote_host,
B
Bruce Momjian 已提交
4258
				  port->remote_port[0] ? " port=" : "", port->remote_port)));
4259
}