postgres.c 87.0 KB
Newer Older
1 2
/*-------------------------------------------------------------------------
 *
3
 * postgres.c
4
 *	  POSTGRES C Backend Interface
5
 *
P
 
PostgreSQL Daemon 已提交
6
 * Portions Copyright (c) 1996-2005, PostgreSQL Global Development Group
B
Add:  
Bruce Momjian 已提交
7
 * Portions Copyright (c) 1994, Regents of the University of California
8 9 10
 *
 *
 * IDENTIFICATION
11
 *	  $PostgreSQL: pgsql/src/backend/tcop/postgres.c,v 1.443 2005/04/21 19:18:13 tgl Exp $
12 13
 *
 * NOTES
14 15
 *	  this is the "main" module of the postgres backend and
 *	  hence the main module of the "traffic cop".
16 17 18
 *
 *-------------------------------------------------------------------------
 */
B
Bruce Momjian 已提交
19

20 21
#include "postgres.h"

B
Bruce Momjian 已提交
22
#include <unistd.h>
23
#include <signal.h>
B
Bruce Momjian 已提交
24
#include <fcntl.h>
25
#include <sys/socket.h>
26
#if HAVE_SYS_SELECT_H
27
#include <sys/select.h>
28
#endif
29
#ifdef HAVE_GETOPT_H
B
Bruce Momjian 已提交
30
#include <getopt.h>
31
#endif
32

33
#include "access/printtup.h"
34
#include "access/xlog.h"
35
#include "catalog/pg_type.h"
36
#include "commands/async.h"
37
#include "commands/prepare.h"
38
#include "commands/trigger.h"
39
#include "libpq/libpq.h"
40
#include "libpq/pqformat.h"
41
#include "libpq/pqsignal.h"
B
Bruce Momjian 已提交
42
#include "miscadmin.h"
43 44
#include "nodes/print.h"
#include "optimizer/cost.h"
45
#include "optimizer/planner.h"
46
#include "parser/analyze.h"
47
#include "parser/parser.h"
B
Bruce Momjian 已提交
48
#include "rewrite/rewriteHandler.h"
49
#include "storage/freespace.h"
50
#include "storage/ipc.h"
51
#include "storage/pg_shmem.h"
52
#include "storage/proc.h"
53
#include "storage/sinval.h"
54 55
#include "tcop/fastpath.h"
#include "tcop/pquery.h"
B
Bruce Momjian 已提交
56
#include "tcop/tcopprot.h"
57
#include "tcop/utility.h"
58
#include "utils/flatfiles.h"
59
#include "utils/guc.h"
60
#include "utils/lsyscache.h"
61
#include "utils/memutils.h"
M
 
Marc G. Fournier 已提交
62
#include "utils/ps_status.h"
B
Bruce Momjian 已提交
63
#include "mb/pg_wchar.h"
64

65
#include "pgstat.h"
M
 
Marc G. Fournier 已提交
66

67 68 69
extern int	optind;
extern char *optarg;

70
/* ----------------
71
 *		global variables
72 73
 * ----------------
 */
74
const char *debug_query_string; /* for pgmonitor and
B
Bruce Momjian 已提交
75
								 * log_min_error_statement */
76

77
/* Note: whereToSendOutput is initialized for the bootstrap/standalone case */
78
CommandDest whereToSendOutput = Debug;
79

80
/* flag for logging end of session */
B
Bruce Momjian 已提交
81
bool		Log_disconnections = false;
82

83 84
LogStmtLevel log_statement = LOGSTMT_NONE;

85 86 87
/* flag indicating if the statement satisfies log_statement */
bool		statement_logged;

88 89 90 91
/* GUC variable for maximum stack depth (measured in kilobytes) */
int			max_stack_depth = 2048;


92 93 94 95
/* ----------------
 *		private variables
 * ----------------
 */
96

97
/* max_stack_depth converted to bytes for speed of checking */
B
Bruce Momjian 已提交
98
static int	max_stack_depth_bytes = 2048 * 1024;
99 100 101 102 103

/* stack base pointer (initialized by PostgresMain) */
static char *stack_base_ptr = NULL;


104 105 106 107 108
/*
 * Flag to mark SIGHUP. Whenever the main loop comes around it
 * will reread the configuration file. (Better than doing the
 * reading in the signal handler, ey?)
 */
109
static volatile sig_atomic_t got_SIGHUP = false;
110

111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137
/*
 * Flag to keep track of whether we have started a transaction.
 * For extended query protocol this has to be remembered across messages.
 */
static bool xact_started = false;

/*
 * Flags to implement skip-till-Sync-after-error behavior for messages of
 * the extended query protocol.
 */
static bool doing_extended_query_message = false;
static bool ignore_till_sync = false;

/*
 * If an unnamed prepared statement exists, it's stored here.
 * We keep it separate from the hashtable kept by commands/prepare.c
 * in order to reduce overhead for short-lived queries.
 */
static MemoryContext unnamed_stmt_context = NULL;
static PreparedStatement *unnamed_stmt_pstmt = NULL;


static bool EchoQuery = false;	/* default don't echo */

/*
 * people who want to use EOF should #define DONTUSENEWLINE in
 * tcop/tcopdebug.h
138 139
 */
#ifndef TCOP_DONTUSENEWLINE
140
static int	UseNewLine = 1;		/* Use newlines query delimiters (the
141
								 * default) */
B
Bruce Momjian 已提交
142

143
#else
144
static int	UseNewLine = 0;		/* Use EOF as query delimiters */
145
#endif   /* TCOP_DONTUSENEWLINE */
146 147 148


/* ----------------------------------------------------------------
149
 *		decls for routines only used in this file
150 151
 * ----------------------------------------------------------------
 */
152 153 154
static int	InteractiveBackend(StringInfo inBuf);
static int	SocketBackend(StringInfo inBuf);
static int	ReadCommand(StringInfo inBuf);
155
static void start_xact_command(void);
156
static void finish_xact_command(void);
157 158
static void SigHupHandler(SIGNAL_ARGS);
static void FloatExceptionHandler(SIGNAL_ARGS);
159
static void log_disconnections(int code, Datum arg);
160 161 162


/* ----------------------------------------------------------------
163
 *		routines to obtain user input
164 165 166 167
 * ----------------------------------------------------------------
 */

/* ----------------
168
 *	InteractiveBackend() is called for user interactive connections
169 170 171
 *
 *	the string entered by the user is placed in its parameter inBuf,
 *	and we act like a Q message was received.
172
 *
173
 *	EOF is returned if end-of-file input is seen; time to shut down.
174 175 176
 * ----------------
 */

177
static int
178
InteractiveBackend(StringInfo inBuf)
179
{
180 181 182
	int			c;				/* character read from getc() */
	bool		end = false;	/* end-of-input flag */
	bool		backslashSeen = false;	/* have we seen a \ ? */
183

184 185
	/*
	 * display a prompt and obtain input from the user
186
	 */
187
	printf("backend> ");
188
	fflush(stdout);
189

190 191 192
	/* Reset inBuf to empty */
	inBuf->len = 0;
	inBuf->data[0] = '\0';
193
	inBuf->cursor = 0;
194

195 196 197 198
	for (;;)
	{
		if (UseNewLine)
		{
199 200 201
			/*
			 * if we are using \n as a delimiter, then read characters
			 * until the \n.
202 203 204 205 206 207 208
			 */
			while ((c = getc(stdin)) != EOF)
			{
				if (c == '\n')
				{
					if (backslashSeen)
					{
209 210 211
						/* discard backslash from inBuf */
						inBuf->data[--inBuf->len] = '\0';
						backslashSeen = false;
212 213 214 215 216
						continue;
					}
					else
					{
						/* keep the newline character */
217
						appendStringInfoChar(inBuf, '\n');
218 219 220 221 222 223 224 225
						break;
					}
				}
				else if (c == '\\')
					backslashSeen = true;
				else
					backslashSeen = false;

226
				appendStringInfoChar(inBuf, (char) c);
227 228 229 230 231 232 233
			}

			if (c == EOF)
				end = true;
		}
		else
		{
234 235
			/*
			 * otherwise read characters until EOF.
236 237
			 */
			while ((c = getc(stdin)) != EOF)
238
				appendStringInfoChar(inBuf, (char) c);
239

240
			if (inBuf->len == 0)
241 242 243 244
				end = true;
		}

		if (end)
245
			return EOF;
246

247 248
		/*
		 * otherwise we have a user query so process it.
249 250 251 252
		 */
		break;
	}

253 254 255
	/* Add '\0' to make it look the same as message case. */
	appendStringInfoChar(inBuf, (char) '\0');

256 257
	/*
	 * if the query echo flag was given, print the query..
258 259
	 */
	if (EchoQuery)
260
		printf("statement: %s\n", inBuf->data);
261
	fflush(stdout);
262

263
	return 'Q';
264 265 266
}

/* ----------------
267
 *	SocketBackend()		Is called for frontend-backend connections
268
 *
269
 *	Returns the message type code, and loads message body data into inBuf.
270
 *
271
 *	EOF is returned if the connection is lost.
272 273
 * ----------------
 */
274
static int
275
SocketBackend(StringInfo inBuf)
276
{
277
	int			qtype;
278

279
	/*
280
	 * Get message type code from the frontend.
281
	 */
282
	qtype = pq_getbyte();
283

284 285
	if (qtype == EOF)			/* frontend disconnected */
	{
286 287 288
		ereport(COMMERROR,
				(errcode(ERRCODE_PROTOCOL_VIOLATION),
				 errmsg("unexpected EOF on client connection")));
289 290 291 292 293
		return qtype;
	}

	/*
	 * Validate message type code before trying to read body; if we have
B
Bruce Momjian 已提交
294 295
	 * lost sync, better to say "command unknown" than to run out of
	 * memory because we used garbage as a length word.
296 297 298
	 *
	 * This also gives us a place to set the doing_extended_query_message
	 * flag as soon as possible.
299
	 */
300
	switch (qtype)
301
	{
302
		case 'Q':				/* simple query */
303
			doing_extended_query_message = false;
304 305 306 307 308
			if (PG_PROTOCOL_MAJOR(FrontendProtocol) < 3)
			{
				/* old style without length word; convert */
				if (pq_getstring(inBuf))
				{
309 310
					ereport(COMMERROR,
							(errcode(ERRCODE_PROTOCOL_VIOLATION),
B
Bruce Momjian 已提交
311
						 errmsg("unexpected EOF on client connection")));
312 313 314
					return EOF;
				}
			}
315 316
			break;

317
		case 'F':				/* fastpath function call */
318 319
			/* we let fastpath.c cope with old-style input of this */
			doing_extended_query_message = false;
320
			break;
321

322
		case 'X':				/* terminate */
323
			doing_extended_query_message = false;
324
			ignore_till_sync = false;
325 326 327 328 329 330 331 332 333 334 335
			break;

		case 'B':				/* bind */
		case 'C':				/* close */
		case 'D':				/* describe */
		case 'E':				/* execute */
		case 'H':				/* flush */
		case 'P':				/* parse */
			doing_extended_query_message = true;
			/* these are only legal in protocol 3 */
			if (PG_PROTOCOL_MAJOR(FrontendProtocol) < 3)
336 337
				ereport(FATAL,
						(errcode(ERRCODE_PROTOCOL_VIOLATION),
B
Bruce Momjian 已提交
338
					 errmsg("invalid frontend message type %d", qtype)));
339 340 341 342 343 344 345 346 347
			break;

		case 'S':				/* sync */
			/* stop any active skip-till-Sync */
			ignore_till_sync = false;
			/* mark not-extended, so that a new error doesn't begin skip */
			doing_extended_query_message = false;
			/* only legal in protocol 3 */
			if (PG_PROTOCOL_MAJOR(FrontendProtocol) < 3)
348 349
				ereport(FATAL,
						(errcode(ERRCODE_PROTOCOL_VIOLATION),
B
Bruce Momjian 已提交
350
					 errmsg("invalid frontend message type %d", qtype)));
351
			break;
352

353 354 355
		case 'd':				/* copy data */
		case 'c':				/* copy done */
		case 'f':				/* copy fail */
356 357 358
			doing_extended_query_message = false;
			/* these are only legal in protocol 3 */
			if (PG_PROTOCOL_MAJOR(FrontendProtocol) < 3)
359 360
				ereport(FATAL,
						(errcode(ERRCODE_PROTOCOL_VIOLATION),
B
Bruce Momjian 已提交
361
					 errmsg("invalid frontend message type %d", qtype)));
362
			break;
363

364
		default:
B
Bruce Momjian 已提交
365

366
			/*
B
Bruce Momjian 已提交
367 368 369
			 * Otherwise we got garbage from the frontend.	We treat this
			 * as fatal because we have probably lost message boundary
			 * sync, and there's no good way to recover.
370
			 */
371 372 373
			ereport(FATAL,
					(errcode(ERRCODE_PROTOCOL_VIOLATION),
					 errmsg("invalid frontend message type %d", qtype)));
374
			break;
375
	}
376

377 378 379 380 381 382 383 384 385 386 387
	/*
	 * In protocol version 3, all frontend messages have a length word
	 * next after the type code; we can read the message contents
	 * independently of the type.
	 */
	if (PG_PROTOCOL_MAJOR(FrontendProtocol) >= 3)
	{
		if (pq_getmessage(inBuf, 0))
			return EOF;			/* suitable message already logged */
	}

388
	return qtype;
389 390 391
}

/* ----------------
392
 *		ReadCommand reads a command from either the frontend or
393 394 395
 *		standard input, places it in inBuf, and returns the
 *		message type code (first byte of the message).
 *		EOF is returned if end of file.
396 397
 * ----------------
 */
398
static int
399
ReadCommand(StringInfo inBuf)
400
{
401
	int			result;
402

403
	if (whereToSendOutput == Remote)
404
		result = SocketBackend(inBuf);
405
	else
406 407
		result = InteractiveBackend(inBuf);
	return result;
408 409
}

410 411 412 413 414 415

/*
 * Parse a query string and pass it through the rewriter.
 *
 * A list of Query nodes is returned, since the string might contain
 * multiple queries and/or the rewriter might expand one query to several.
416 417 418
 *
 * NOTE: this routine is no longer used for processing interactive queries,
 * but it is still needed for parsing of SQL function bodies.
419
 */
420
List *
B
Bruce Momjian 已提交
421
pg_parse_and_rewrite(const char *query_string,	/* string to execute */
422
					 Oid *paramTypes,	/* parameter types */
B
Bruce Momjian 已提交
423
					 int numParams)		/* number of parameters */
424
{
425
	List	   *raw_parsetree_list;
426
	List	   *querytree_list;
427
	ListCell   *list_item;
428

429 430
	/*
	 * (1) parse the request string into a list of raw parse trees.
431
	 */
432
	raw_parsetree_list = pg_parse_query(query_string);
433

434 435
	/*
	 * (2) Do parse analysis and rule rewrite.
436 437 438 439
	 */
	querytree_list = NIL;
	foreach(list_item, raw_parsetree_list)
	{
B
Bruce Momjian 已提交
440
		Node	   *parsetree = (Node *) lfirst(list_item);
441

442
		querytree_list = list_concat(querytree_list,
B
Bruce Momjian 已提交
443 444 445
									 pg_analyze_and_rewrite(parsetree,
															paramTypes,
															numParams));
446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463
	}

	return querytree_list;
}

/*
 * Do raw parsing (only).
 *
 * A list of parsetrees is returned, since there might be multiple
 * commands in the given string.
 *
 * NOTE: for interactive queries, it is important to keep this routine
 * separate from the analysis & rewrite stages.  Analysis and rewriting
 * cannot be done in an aborted transaction, since they require access to
 * database tables.  So, we rely on the raw parser to determine whether
 * we've seen a COMMIT or ABORT command; when we are in abort state, other
 * commands are not processed any further than the raw parse stage.
 */
464
List *
465
pg_parse_query(const char *query_string)
466
{
467 468
	List	   *raw_parsetree_list;
	ListCell   *parsetree_item;
469

470
	statement_logged = false;
471
	if (log_statement == LOGSTMT_ALL)
472
	{
473
		ereport(LOG,
B
Bruce Momjian 已提交
474
				(errmsg("statement: %s", query_string)));
475 476
		statement_logged = true;
	}
477

B
Rename:  
Bruce Momjian 已提交
478
	if (log_parser_stats)
479 480
		ResetUsage();

481
	raw_parsetree_list = raw_parser(query_string);
482

483 484 485 486 487 488 489 490
	/* do log_statement tests for mod and ddl */
	if (log_statement == LOGSTMT_MOD ||
		log_statement == LOGSTMT_DDL)
	{
		foreach(parsetree_item, raw_parsetree_list)
		{
			Node	   *parsetree = (Node *) lfirst(parsetree_item);
			const char *commandTag;
B
Bruce Momjian 已提交
491

492
			if (IsA(parsetree, ExplainStmt) &&
B
Bruce Momjian 已提交
493 494 495
				((ExplainStmt *) parsetree)->analyze)
				parsetree = (Node *) (((ExplainStmt *) parsetree)->query);

496
			if (IsA(parsetree, PrepareStmt))
B
Bruce Momjian 已提交
497 498
				parsetree = (Node *) (((PrepareStmt *) parsetree)->query);

499
			if (IsA(parsetree, SelectStmt))
B
Bruce Momjian 已提交
500 501
				continue;		/* optimization for frequent command */

502 503 504 505 506 507
			if (log_statement == LOGSTMT_MOD &&
				(IsA(parsetree, InsertStmt) ||
				 IsA(parsetree, UpdateStmt) ||
				 IsA(parsetree, DeleteStmt) ||
				 IsA(parsetree, TruncateStmt) ||
				 (IsA(parsetree, CopyStmt) &&
B
Bruce Momjian 已提交
508
				  ((CopyStmt *) parsetree)->is_from)))	/* COPY FROM */
509 510 511
			{
				ereport(LOG,
						(errmsg("statement: %s", query_string)));
512
				statement_logged = true;
513 514 515 516 517 518 519 520 521 522 523
				break;
			}
			commandTag = CreateCommandTag(parsetree);
			if (strncmp(commandTag, "CREATE ", strlen("CREATE ")) == 0 ||
				strncmp(commandTag, "ALTER ", strlen("ALTER ")) == 0 ||
				strncmp(commandTag, "DROP ", strlen("DROP ")) == 0 ||
				IsA(parsetree, GrantStmt) ||	/* GRANT or REVOKE */
				IsA(parsetree, CommentStmt))
			{
				ereport(LOG,
						(errmsg("statement: %s", query_string)));
524
				statement_logged = true;
525 526 527 528 529
				break;
			}
		}
	}

B
Rename:  
Bruce Momjian 已提交
530
	if (log_parser_stats)
531
		ShowUsage("PARSER STATISTICS");
532 533 534 535 536

	return raw_parsetree_list;
}

/*
537 538
 * Given a raw parsetree (gram.y output), and optionally information about
 * types of parameter symbols ($n), perform parse analysis and rule rewriting.
539 540 541 542 543 544
 *
 * A list of Query nodes is returned, since either the analyzer or the
 * rewriter might expand one query to several.
 *
 * NOTE: for reasons mentioned above, this must be separate from raw parsing.
 */
545
List *
546
pg_analyze_and_rewrite(Node *parsetree, Oid *paramTypes, int numParams)
547 548 549
{
	List	   *querytree_list;

550 551
	/*
	 * (1) Perform parse analysis.
552
	 */
B
Rename:  
Bruce Momjian 已提交
553
	if (log_parser_stats)
554 555
		ResetUsage();

556
	querytree_list = parse_analyze(parsetree, paramTypes, numParams);
557

B
Rename:  
Bruce Momjian 已提交
558
	if (log_parser_stats)
559
		ShowUsage("PARSE ANALYSIS STATISTICS");
560

561 562
	/*
	 * (2) Rewrite the queries, as necessary
563 564 565 566 567 568 569 570 571 572 573 574 575
	 */
	querytree_list = pg_rewrite_queries(querytree_list);

	return querytree_list;
}

/*
 * Perform rewriting of a list of queries produced by parse analysis.
 *
 * Returns a new list of Query nodes; it may hold more or fewer entries
 * than the input list.  Utility statements are passed through unchanged.
 */
List *
pg_rewrite_queries(List *querytree_list)
{
	List	   *rewritten_list = NIL;
	ListCell   *cell;

	if (log_parser_stats)
		ResetUsage();

	foreach(cell, querytree_list)
	{
		Query	   *query = (Query *) lfirst(cell);

		if (Debug_print_parse)
			elog_node_display(DEBUG1, "parse tree", query,
							  Debug_pretty_print);

		if (query->commandType != CMD_UTILITY)
		{
			/* rewrite regular queries */
			rewritten_list = list_concat(rewritten_list,
										 QueryRewrite(query));
		}
		else
		{
			/* don't rewrite utilities, just pass 'em through */
			rewritten_list = lappend(rewritten_list, query);
		}
	}

	querytree_list = rewritten_list;

	if (log_parser_stats)
		ShowUsage("REWRITER STATISTICS");

#ifdef COPY_PARSE_PLAN_TREES

	/*
	 * Optional debugging check: pass querytree output through copyObject().
	 * The copy replaces the original only if equal() agrees they match, so
	 * this exercises both copyObject() and the equal() routines.
	 */
	{
		List	   *copied = (List *) copyObject(querytree_list);

		if (equal(copied, querytree_list))
			querytree_list = copied;
		else
			elog(WARNING, "copyObject() failed to produce an equal parse tree");
	}
#endif

	if (Debug_print_rewritten)
		elog_node_display(DEBUG1, "rewritten parse tree", querytree_list,
						  Debug_pretty_print);

	return querytree_list;
}
632 633


634
/* Generate a plan for a single already-rewritten query. */
635
Plan *
636
pg_plan_query(Query *querytree, ParamListInfo boundParams)
637 638
{
	Plan	   *plan;
639

640 641 642
	/* Utility commands have no plans. */
	if (querytree->commandType == CMD_UTILITY)
		return NULL;
643

B
Rename:  
Bruce Momjian 已提交
644
	if (log_planner_stats)
645
		ResetUsage();
646

647
	/* call the optimizer */
648
	plan = planner(querytree, false, 0, boundParams);
649

B
Rename:  
Bruce Momjian 已提交
650
	if (log_planner_stats)
651
		ShowUsage("PLANNER STATISTICS");
652

653 654 655
#ifdef COPY_PARSE_PLAN_TREES
	/* Optional debugging check: pass plan output through copyObject() */
	{
B
Bruce Momjian 已提交
656
		Plan	   *new_plan = (Plan *) copyObject(plan);
657

B
Bruce Momjian 已提交
658 659
		/*
		 * equal() currently does not have routines to compare Plan nodes,
660 661 662 663
		 * so don't try to test equality here.  Perhaps fix someday?
		 */
#ifdef NOT_USED
		/* This checks both copyObject() and the equal() routines... */
B
Bruce Momjian 已提交
664
		if (!equal(new_plan, plan))
665
			elog(WARNING, "copyObject() failed to produce an equal plan tree");
666 667 668 669 670 671
		else
#endif
			plan = new_plan;
	}
#endif

672 673
	/*
	 * Print plan if debugging.
674
	 */
675
	if (Debug_print_plan)
676
		elog_node_display(DEBUG1, "plan", plan, Debug_pretty_print);
677

678
	return plan;
679 680
}

681 682
/*
 * Generate plans for a list of already-rewritten queries.
683
 *
684 685 686 687 688 689 690 691 692
 * If needSnapshot is TRUE, we haven't yet set a snapshot for the current
 * query.  A snapshot must be set before invoking the planner, since it
 * might try to evaluate user-defined functions.  But we must not set a
 * snapshot if the list contains only utility statements, because some
 * utility statements depend on not having frozen the snapshot yet.
 * (We assume that such statements cannot appear together with plannable
 * statements in the rewriter's output.)
 */
List *
693 694
pg_plan_queries(List *querytrees, ParamListInfo boundParams,
				bool needSnapshot)
695 696
{
	List	   *plan_list = NIL;
697
	ListCell   *query_list;
698 699 700 701 702 703 704 705 706 707 708 709 710 711 712

	foreach(query_list, querytrees)
	{
		Query	   *query = (Query *) lfirst(query_list);
		Plan	   *plan;

		if (query->commandType == CMD_UTILITY)
		{
			/* Utility commands have no plans. */
			plan = NULL;
		}
		else
		{
			if (needSnapshot)
			{
713
				ActiveSnapshot = CopySnapshot(GetTransactionSnapshot());
714 715
				needSnapshot = false;
			}
716
			plan = pg_plan_query(query, boundParams);
717 718 719 720 721 722 723 724 725 726
		}

		plan_list = lappend(plan_list, plan);
	}

	return plan_list;
}


/*
727
 * exec_simple_query
728
 *
729
 * Execute a "simple Query" protocol message.
730
 */
731
static void
732
exec_simple_query(const char *query_string)
733
{
B
Bruce Momjian 已提交
734
	CommandDest dest = whereToSendOutput;
735
	MemoryContext oldcontext;
736 737
	List	   *parsetree_list;
	ListCell   *parsetree_item;
B
Bruce Momjian 已提交
738 739
	struct timeval start_t,
				stop_t;
B
Rename:  
Bruce Momjian 已提交
740
	bool		save_log_duration = log_duration;
B
Bruce Momjian 已提交
741
	int			save_log_min_duration_statement = log_min_duration_statement;
742
	bool		save_log_statement_stats = log_statement_stats;
743

744 745 746
	/*
	 * Report query to various monitoring facilities.
	 */
747
	debug_query_string = query_string;
748

749 750
	pgstat_report_activity(query_string);

751
	/*
B
Bruce Momjian 已提交
752 753 754 755
	 * We use save_log_* so "SET log_duration = true"  and "SET
	 * log_min_duration_statement = true" don't report incorrect time
	 * because gettimeofday() wasn't called. Similarly,
	 * log_statement_stats has to be captured once.
756
	 */
757
	if (save_log_duration || save_log_min_duration_statement != -1)
758
		gettimeofday(&start_t, NULL);
759

760 761 762
	if (save_log_statement_stats)
		ResetUsage();

763
	/*
B
Bruce Momjian 已提交
764 765 766 767
	 * Start up a transaction command.	All queries generated by the
	 * query_string will be in this same command block, *unless* we find a
	 * BEGIN/COMMIT/ABORT statement; we have to force a new xact command
	 * after one of those, else bad things will happen in xact.c. (Note
768
	 * that this will normally change current memory context.)
769 770
	 */
	start_xact_command();
771 772

	/*
B
Bruce Momjian 已提交
773 774 775 776
	 * Zap any pre-existing unnamed statement.	(While not strictly
	 * necessary, it seems best to define simple-Query mode as if it used
	 * the unnamed statement and portal; this ensures we recover any
	 * storage used by prior unnamed operations.)
777 778 779 780 781 782 783 784
	 */
	unnamed_stmt_pstmt = NULL;
	if (unnamed_stmt_context)
	{
		DropDependentPortals(unnamed_stmt_context);
		MemoryContextDelete(unnamed_stmt_context);
	}
	unnamed_stmt_context = NULL;
785

786 787 788
	/*
	 * Switch to appropriate context for constructing parsetrees.
	 */
789
	oldcontext = MemoryContextSwitchTo(MessageContext);
790

791 792
	QueryContext = CurrentMemoryContext;

B
Bruce Momjian 已提交
793
	/*
B
Bruce Momjian 已提交
794 795
	 * Do basic parsing of the query or queries (this should be safe even
	 * if we are in aborted transaction state!)
796
	 */
797
	parsetree_list = pg_parse_query(query_string);
798

799
	/*
800
	 * Switch back to transaction context to enter the loop.
801 802 803 804
	 */
	MemoryContextSwitchTo(oldcontext);

	/*
805
	 * Run through the raw parsetree(s) and process each one.
806
	 */
807
	foreach(parsetree_item, parsetree_list)
808
	{
B
Bruce Momjian 已提交
809
		Node	   *parsetree = (Node *) lfirst(parsetree_item);
810 811
		const char *commandTag;
		char		completionTag[COMPLETION_TAG_BUFSIZE];
B
Bruce Momjian 已提交
812
		List	   *querytree_list,
813 814
				   *plantree_list;
		Portal		portal;
815 816
		DestReceiver *receiver;
		int16		format;
817

818
		/*
B
Bruce Momjian 已提交
819 820 821 822
		 * Get the command name for use in status display (it also becomes
		 * the default completion tag, down inside PortalRun).	Set
		 * ps_status and do any special start-of-SQL-command processing
		 * needed by the destination.
823 824 825 826 827
		 */
		commandTag = CreateCommandTag(parsetree);

		set_ps_display(commandTag);

828
		BeginCommand(commandTag, dest);
829

830
		/*
831
		 * If we are in an aborted transaction, reject all commands except
832 833
		 * COMMIT/ABORT.  It is important that this test occur before we
		 * try to do parse analysis, rewrite, or planning, since all those
B
Bruce Momjian 已提交
834 835 836
		 * phases try to do database accesses, which may fail in abort
		 * state. (It might be safe to allow some additional utility
		 * commands in this state, but not many...)
837 838
		 */
		if (IsAbortedTransactionBlockState())
839
		{
B
Bruce Momjian 已提交
840
			bool		allowit = false;
841

842
			if (IsA(parsetree, TransactionStmt))
843 844 845
			{
				TransactionStmt *stmt = (TransactionStmt *) parsetree;

846
				if (stmt->kind == TRANS_STMT_COMMIT ||
847 848
					stmt->kind == TRANS_STMT_ROLLBACK ||
					stmt->kind == TRANS_STMT_ROLLBACK_TO)
849
					allowit = true;
850
			}
851

B
Bruce Momjian 已提交
852
			if (!allowit)
853 854 855
				ereport(ERROR,
						(errcode(ERRCODE_IN_FAILED_SQL_TRANSACTION),
						 errmsg("current transaction is aborted, "
B
Bruce Momjian 已提交
856
					"commands ignored until end of transaction block")));
857
		}
858

859
		/* Make sure we are in a transaction command */
860
		start_xact_command();
861

862
		/* If we got a cancel signal in parsing or prior command, quit */
863
		CHECK_FOR_INTERRUPTS();
864 865

		/*
866
		 * OK to analyze, rewrite, and plan this query.
867
		 *
B
Bruce Momjian 已提交
868 869
		 * Switch to appropriate context for constructing querytrees (again,
		 * these must outlive the execution context).
870
		 */
871
		oldcontext = MemoryContextSwitchTo(MessageContext);
872

873
		querytree_list = pg_analyze_and_rewrite(parsetree, NULL, 0);
V
Vadim B. Mikheev 已提交
874

875
		plantree_list = pg_plan_queries(querytree_list, NULL, true);
876 877 878 879

		/* If we got a cancel signal in analysis or planning, quit */
		CHECK_FOR_INTERRUPTS();

880
		/*
B
Bruce Momjian 已提交
881 882
		 * Create unnamed portal to run the query or queries in. If there
		 * already is one, silently drop it.
883
		 */
884
		portal = CreatePortal("", true, true);
885

886 887 888 889 890 891
		PortalDefineQuery(portal,
						  query_string,
						  commandTag,
						  querytree_list,
						  plantree_list,
						  MessageContext);
892

893
		/*
894
		 * Start the portal.  No parameters here.
895
		 */
896
		PortalStart(portal, NULL, InvalidSnapshot);
897

898 899
		/*
		 * Select the appropriate output format: text unless we are doing
B
Bruce Momjian 已提交
900 901 902
		 * a FETCH from a binary cursor.  (Pretty grotty to have to do
		 * this here --- but it avoids grottiness in other places.	Ah,
		 * the joys of backward compatibility...)
903 904 905 906 907 908 909 910 911 912 913 914
		 */
		format = 0;				/* TEXT is default */
		if (IsA(parsetree, FetchStmt))
		{
			FetchStmt  *stmt = (FetchStmt *) parsetree;

			if (!stmt->ismove)
			{
				Portal		fportal = GetPortalByName(stmt->portalname);

				if (PortalIsValid(fportal) &&
					(fportal->cursorOptions & CURSOR_OPT_BINARY))
B
Bruce Momjian 已提交
915
					format = 1; /* BINARY */
916 917 918 919 920 921 922 923 924 925 926 927 928 929 930
			}
		}
		PortalSetResultFormat(portal, 1, &format);

		/*
		 * Now we can create the destination receiver object.
		 */
		receiver = CreateDestReceiver(dest, portal);

		/*
		 * Switch back to transaction context for execution.
		 */
		MemoryContextSwitchTo(oldcontext);

		/*
B
Bruce Momjian 已提交
931 932
		 * Run the portal to completion, and then drop it (and the
		 * receiver).
933
		 */
934 935
		(void) PortalRun(portal,
						 FETCH_ALL,
936 937
						 receiver,
						 receiver,
938
						 completionTag);
939

940
		(*receiver->rDestroy) (receiver);
941

942
		PortalDrop(portal, false);
943

944
		if (IsA(parsetree, TransactionStmt))
945
		{
946
			/*
B
Bruce Momjian 已提交
947 948 949
			 * If this was a transaction control statement, commit it. We
			 * will start a new xact command for the next command (if
			 * any).
950
			 */
951
			finish_xact_command();
952
		}
953
		else if (lnext(parsetree_item) == NULL)
954
		{
955
			/*
B
Bruce Momjian 已提交
956 957 958 959 960 961 962 963 964
			 * If this is the last parsetree of the query string, close
			 * down transaction statement before reporting
			 * command-complete.  This is so that any end-of-transaction
			 * errors are reported before the command-complete message is
			 * issued, to avoid confusing clients who will expect either a
			 * command-complete message or an error, not one and then the
			 * other.  But for compatibility with historical Postgres
			 * behavior, we do not force a transaction boundary between
			 * queries appearing in a single query string.
965
			 */
966
			finish_xact_command();
967
		}
968
		else
969
		{
970
			/*
B
Bruce Momjian 已提交
971 972
			 * We need a CommandCounterIncrement after every query, except
			 * those that start or end a transaction block.
973 974
			 */
			CommandCounterIncrement();
975
		}
976 977 978

		/*
		 * Tell client that we're done with this query.  Note we emit
B
Bruce Momjian 已提交
979 980 981 982
		 * exactly one EndCommand report for each raw parsetree, thus one
		 * for each SQL command the client sent, regardless of rewriting.
		 * (But a command aborted by error will not send an EndCommand
		 * report at all.)
983
		 */
984
		EndCommand(completionTag, dest);
B
Bruce Momjian 已提交
985
	}							/* end loop over parsetrees */
986

987 988 989 990 991
	/*
	 * Close down transaction statement, if one is open.
	 */
	finish_xact_command();

992 993 994
	/*
	 * If there were no parsetrees, return EmptyQueryResponse message.
	 */
995
	if (!parsetree_list)
996 997
		NullCommand(dest);

998
	QueryContext = NULL;
999

1000
	/*
B
Bruce Momjian 已提交
1001 1002
	 * Combine processing here as we need to calculate the query duration
	 * in both instances.
1003
	 */
1004
	if (save_log_duration || save_log_min_duration_statement != -1)
1005
	{
B
Bruce Momjian 已提交
1006 1007
		long		usecs;

1008
		gettimeofday(&stop_t, NULL);
1009 1010 1011 1012 1013
		if (stop_t.tv_usec < start_t.tv_usec)
		{
			stop_t.tv_sec--;
			stop_t.tv_usec += 1000000;
		}
B
Bruce Momjian 已提交
1014 1015
		usecs = (long) (stop_t.tv_sec - start_t.tv_sec) * 1000000 + (long) (stop_t.tv_usec - start_t.tv_usec);

1016 1017
		/* Only print duration if we previously printed the statement. */
		if (statement_logged && save_log_duration)
B
Bruce Momjian 已提交
1018 1019
			ereport(LOG,
					(errmsg("duration: %ld.%03ld ms",
B
Bruce Momjian 已提交
1020 1021 1022
						(long) ((stop_t.tv_sec - start_t.tv_sec) * 1000 +
							  (stop_t.tv_usec - start_t.tv_usec) / 1000),
					 (long) (stop_t.tv_usec - start_t.tv_usec) % 1000)));
B
Bruce Momjian 已提交
1023

B
Bruce Momjian 已提交
1024
		/*
B
Bruce Momjian 已提交
1025 1026
		 * Output a duration_statement to the log if the query has
		 * exceeded the min duration, or if we are to print all durations.
B
Bruce Momjian 已提交
1027
		 */
B
Bruce Momjian 已提交
1028 1029 1030
		if (save_log_min_duration_statement == 0 ||
			(save_log_min_duration_statement > 0 &&
			 usecs >= save_log_min_duration_statement * 1000))
1031
			ereport(LOG,
B
Bruce Momjian 已提交
1032
					(errmsg("duration: %ld.%03ld ms  statement: %s",
B
Bruce Momjian 已提交
1033 1034 1035
						(long) ((stop_t.tv_sec - start_t.tv_sec) * 1000 +
							  (stop_t.tv_usec - start_t.tv_usec) / 1000),
						(long) (stop_t.tv_usec - start_t.tv_usec) % 1000,
B
Bruce Momjian 已提交
1036
							query_string)));
1037
	}
1038

1039 1040 1041
	if (save_log_statement_stats)
		ShowUsage("QUERY STATISTICS");

1042
	debug_query_string = NULL;
1043 1044
}

1045 1046 1047 1048 1049 1050 1051 1052
/*
 * exec_parse_message
 *
 * Execute a "Parse" protocol message.
 */
static void
exec_parse_message(const char *query_string,	/* string to execute */
				   const char *stmt_name,		/* name for prepared stmt */
B
Bruce Momjian 已提交
1053 1054
				   Oid *paramTypes,		/* parameter types */
				   int numParams)		/* number of parameters */
1055 1056 1057 1058 1059 1060 1061 1062 1063 1064 1065 1066 1067 1068 1069 1070 1071 1072 1073 1074 1075 1076 1077 1078 1079 1080 1081 1082 1083 1084 1085 1086
{
	MemoryContext oldcontext;
	List	   *parsetree_list;
	const char *commandTag;
	List	   *querytree_list,
			   *plantree_list,
			   *param_list;
	bool		is_named;
	bool		save_log_statement_stats = log_statement_stats;

	/*
	 * Report query to various monitoring facilities.
	 */
	debug_query_string = query_string;

	pgstat_report_activity(query_string);

	set_ps_display("PARSE");

	if (save_log_statement_stats)
		ResetUsage();

	/*
	 * Start up a transaction command so we can run parse analysis etc.
	 * (Note that this will normally change current memory context.)
	 * Nothing happens if we are already in one.
	 */
	start_xact_command();

	/*
	 * Switch to appropriate context for constructing parsetrees.
	 *
B
Bruce Momjian 已提交
1087 1088 1089 1090 1091 1092 1093 1094 1095 1096
	 * We have two strategies depending on whether the prepared statement is
	 * named or not.  For a named prepared statement, we do parsing in
	 * MessageContext and copy the finished trees into the prepared
	 * statement's private context; then the reset of MessageContext
	 * releases temporary space used by parsing and planning.  For an
	 * unnamed prepared statement, we assume the statement isn't going to
	 * hang around long, so getting rid of temp space quickly is probably
	 * not worth the costs of copying parse/plan trees.  So in this case,
	 * we set up a special context for the unnamed statement, and do all
	 * the parsing/planning therein.
1097 1098 1099 1100 1101 1102 1103 1104 1105 1106 1107 1108 1109 1110 1111 1112 1113 1114 1115 1116 1117 1118 1119 1120 1121 1122 1123 1124 1125 1126 1127 1128 1129 1130 1131 1132
	 */
	is_named = (stmt_name[0] != '\0');
	if (is_named)
	{
		/* Named prepared statement --- parse in MessageContext */
		oldcontext = MemoryContextSwitchTo(MessageContext);
	}
	else
	{
		/* Unnamed prepared statement --- release any prior unnamed stmt */
		unnamed_stmt_pstmt = NULL;
		if (unnamed_stmt_context)
		{
			DropDependentPortals(unnamed_stmt_context);
			MemoryContextDelete(unnamed_stmt_context);
		}
		unnamed_stmt_context = NULL;
		/* create context for parsing/planning */
		unnamed_stmt_context =
			AllocSetContextCreate(TopMemoryContext,
								  "unnamed prepared statement",
								  ALLOCSET_DEFAULT_MINSIZE,
								  ALLOCSET_DEFAULT_INITSIZE,
								  ALLOCSET_DEFAULT_MAXSIZE);
		oldcontext = MemoryContextSwitchTo(unnamed_stmt_context);
	}

	QueryContext = CurrentMemoryContext;

	/*
	 * Do basic parsing of the query or queries (this should be safe even
	 * if we are in aborted transaction state!)
	 */
	parsetree_list = pg_parse_query(query_string);

	/*
B
Bruce Momjian 已提交
1133 1134 1135
	 * We only allow a single user statement in a prepared statement. This
	 * is mainly to keep the protocol simple --- otherwise we'd need to
	 * worry about multiple result tupdescs and things like that.
1136
	 */
1137
	if (list_length(parsetree_list) > 1)
1138 1139 1140
		ereport(ERROR,
				(errcode(ERRCODE_SYNTAX_ERROR),
				 errmsg("cannot insert multiple commands into a prepared statement")));
1141 1142 1143

	if (parsetree_list != NIL)
	{
1144
		Node	   *parsetree = (Node *) linitial(parsetree_list);
B
Bruce Momjian 已提交
1145
		int			i;
1146 1147 1148 1149 1150 1151 1152 1153

		/*
		 * Get the command name for possible use in status display.
		 */
		commandTag = CreateCommandTag(parsetree);

		/*
		 * If we are in an aborted transaction, reject all commands except
B
Bruce Momjian 已提交
1154 1155 1156 1157
		 * COMMIT/ROLLBACK.  It is important that this test occur before
		 * we try to do parse analysis, rewrite, or planning, since all
		 * those phases try to do database accesses, which may fail in
		 * abort state. (It might be safe to allow some additional utility
1158 1159 1160 1161 1162 1163 1164 1165 1166 1167 1168
		 * commands in this state, but not many...)
		 */
		if (IsAbortedTransactionBlockState())
		{
			bool		allowit = false;

			if (IsA(parsetree, TransactionStmt))
			{
				TransactionStmt *stmt = (TransactionStmt *) parsetree;

				if (stmt->kind == TRANS_STMT_COMMIT ||
1169 1170
					stmt->kind == TRANS_STMT_ROLLBACK ||
					stmt->kind == TRANS_STMT_ROLLBACK_TO)
1171 1172 1173 1174
					allowit = true;
			}

			if (!allowit)
1175 1176 1177
				ereport(ERROR,
						(errcode(ERRCODE_IN_FAILED_SQL_TRANSACTION),
						 errmsg("current transaction is aborted, "
B
Bruce Momjian 已提交
1178
					"commands ignored until end of transaction block")));
1179 1180 1181 1182 1183 1184 1185 1186 1187 1188 1189 1190 1191 1192 1193 1194 1195 1196 1197 1198 1199
		}

		/*
		 * OK to analyze, rewrite, and plan this query.  Note that the
		 * originally specified parameter set is not required to be
		 * complete, so we have to use parse_analyze_varparams().
		 */
		if (log_parser_stats)
			ResetUsage();

		querytree_list = parse_analyze_varparams(parsetree,
												 &paramTypes,
												 &numParams);

		/*
		 * Check all parameter types got determined, and convert array
		 * representation to a list for storage.
		 */
		param_list = NIL;
		for (i = 0; i < numParams; i++)
		{
B
Bruce Momjian 已提交
1200
			Oid			ptype = paramTypes[i];
1201 1202

			if (ptype == InvalidOid || ptype == UNKNOWNOID)
1203 1204
				ereport(ERROR,
						(errcode(ERRCODE_INDETERMINATE_DATATYPE),
B
Bruce Momjian 已提交
1205 1206
				 errmsg("could not determine data type of parameter $%d",
						i + 1)));
1207
			param_list = lappend_oid(param_list, ptype);
1208 1209 1210 1211 1212 1213 1214
		}

		if (log_parser_stats)
			ShowUsage("PARSE ANALYSIS STATISTICS");

		querytree_list = pg_rewrite_queries(querytree_list);

1215 1216 1217 1218 1219 1220 1221 1222
		/*
		 * If this is the unnamed statement and it has parameters, defer
		 * query planning until Bind.  Otherwise do it now.
		 */
		if (!is_named && numParams > 0)
			plantree_list = NIL;
		else
			plantree_list = pg_plan_queries(querytree_list, NULL, true);
1223 1224 1225
	}
	else
	{
B
Bruce Momjian 已提交
1226
		/* Empty input string.	This is legal. */
1227 1228 1229 1230 1231 1232 1233 1234 1235 1236 1237 1238 1239 1240 1241 1242 1243 1244 1245 1246 1247 1248 1249 1250 1251 1252 1253 1254 1255 1256 1257 1258 1259 1260 1261 1262 1263 1264 1265 1266 1267 1268 1269
		commandTag = NULL;
		querytree_list = NIL;
		plantree_list = NIL;
		param_list = NIL;
	}

	/* If we got a cancel signal in analysis or planning, quit */
	CHECK_FOR_INTERRUPTS();

	/*
	 * Store the query as a prepared statement.  See above comments.
	 */
	if (is_named)
	{
		StorePreparedStatement(stmt_name,
							   query_string,
							   commandTag,
							   querytree_list,
							   plantree_list,
							   param_list);
	}
	else
	{
		PreparedStatement *pstmt;

		pstmt = (PreparedStatement *) palloc0(sizeof(PreparedStatement));
		/* query_string needs to be copied into unnamed_stmt_context */
		pstmt->query_string = pstrdup(query_string);
		/* the rest is there already */
		pstmt->commandTag = commandTag;
		pstmt->query_list = querytree_list;
		pstmt->plan_list = plantree_list;
		pstmt->argtype_list = param_list;
		pstmt->context = unnamed_stmt_context;
		/* Now the unnamed statement is complete and valid */
		unnamed_stmt_pstmt = pstmt;
	}

	MemoryContextSwitchTo(oldcontext);

	QueryContext = NULL;

	/*
B
Bruce Momjian 已提交
1270 1271 1272 1273
	 * We do NOT close the open transaction command here; that only
	 * happens when the client sends Sync.	Instead, do
	 * CommandCounterIncrement just in case something happened during
	 * parse/plan.
1274 1275 1276 1277 1278 1279 1280 1281 1282 1283 1284 1285 1286 1287 1288 1289 1290 1291 1292 1293 1294 1295 1296 1297 1298
	 */
	CommandCounterIncrement();

	/*
	 * Send ParseComplete.
	 */
	if (whereToSendOutput == Remote)
		pq_putemptymessage('1');

	if (save_log_statement_stats)
		ShowUsage("PARSE MESSAGE STATISTICS");

	debug_query_string = NULL;
}

/*
 * exec_bind_message
 *
 * Handle a "Bind" message: read the parameter formats, parameter values
 * and result formats from input_message, build a portal for the named
 * (or unnamed) prepared statement, start it, and send BindComplete.
 */
static void
exec_bind_message(StringInfo input_message)
{
	const char *portal_name;
	const char *stmt_name;
	int			n_param_formats;
	int16	   *param_formats = NULL;
	int			n_params;
	int			n_result_formats;
	int16	   *result_formats = NULL;
	int			idx;
	PreparedStatement *stmt;
	Portal		portal;
	ParamListInfo bound_params;
	bool		unnamed_portal;
	bool		xact_aborted = IsAbortedTransactionBlockState();

	pgstat_report_activity("<BIND>");

	set_ps_display("BIND");

	/*
	 * We need a transaction command to be able to call functions etc.
	 * Nothing happens if one is already open; otherwise this normally
	 * changes the current memory context.
	 */
	start_xact_command();

	/* ... so go back to the message context */
	MemoryContextSwitchTo(MessageContext);

	/* Fixed-size leading part of the message */
	portal_name = pq_getmsgstring(input_message);
	stmt_name = pq_getmsgstring(input_message);

	/* Parameter format codes */
	n_param_formats = pq_getmsgint(input_message, 2);
	if (n_param_formats > 0)
	{
		param_formats = (int16 *) palloc(n_param_formats * sizeof(int16));
		for (idx = 0; idx < n_param_formats; idx++)
			param_formats[idx] = pq_getmsgint(input_message, 2);
	}

	/* Number of parameter values that follow */
	n_params = pq_getmsgint(input_message, 2);

	/* Zero or one format code is always fine; more must match the count */
	if (n_param_formats > 1 && n_param_formats != n_params)
		ereport(ERROR,
				(errcode(ERRCODE_PROTOCOL_VIOLATION),
				 errmsg("bind message has %d parameter formats but %d parameters",
						n_param_formats, n_params)));

	/* Look up the prepared statement; the unnamed one is special-cased */
	if (stmt_name[0] == '\0')
	{
		stmt = unnamed_stmt_pstmt;
		if (!stmt)
			ereport(ERROR,
					(errcode(ERRCODE_UNDEFINED_PSTATEMENT),
					 errmsg("unnamed prepared statement does not exist")));
	}
	else
		stmt = FetchPreparedStatement(stmt_name, true);

	if (n_params != list_length(stmt->argtype_list))
		ereport(ERROR,
				(errcode(ERRCODE_PROTOCOL_VIOLATION),
				 errmsg("bind message supplies %d parameters, but prepared statement \"%s\" requires %d",
						n_params, stmt_name, list_length(stmt->argtype_list))));

	/*
	 * Create the portal.  Only the unnamed portal may silently replace an
	 * existing portal of the same name.
	 */
	unnamed_portal = (portal_name[0] == '\0');
	if (unnamed_portal)
		portal = CreatePortal(portal_name, true, true);
	else
		portal = CreatePortal(portal_name, false, false);

	/*
	 * Read the parameter values, if any, into the portal's memory
	 * context.
	 *
	 * In an aborted transaction we cannot risk running user-defined
	 * functions, yet Bind must not fail either; every parameter is then
	 * bound as NULL.
	 */
	if (n_params <= 0)
		bound_params = NULL;
	else
	{
		ListCell   *cell;
		MemoryContext saved_context;

		saved_context = MemoryContextSwitchTo(PortalGetHeapMemory(portal));

		/* one extra, zeroed slot for the terminator entry */
		bound_params = (ParamListInfo)
			palloc0((n_params + 1) * sizeof(ParamListInfoData));

		idx = 0;
		foreach(cell, stmt->argtype_list)
		{
			Oid			ptype = lfirst_oid(cell);
			int32		plength;
			bool		isNull;
			const char *pvalue = NULL;

			/* a length of -1 denotes a NULL parameter */
			plength = pq_getmsgint(input_message, 4);
			isNull = (plength == -1);

			if (!isNull)
			{
				/* always consume the value bytes from the message */
				pvalue = pq_getmsgbytes(input_message, plength);

				/* aborted: bind as NULL, format is not even checked */
				if (xact_aborted)
					isNull = true;
			}

			if (!isNull)
			{
				int16		pformat;
				StringInfoData pbuf;
				char		saved_byte;

				/* per-parameter code, one shared code, or default text */
				if (n_param_formats > 1)
					pformat = param_formats[idx];
				else if (n_param_formats > 0)
					pformat = param_formats[0];
				else
					pformat = 0;

				/*
				 * Instead of copying the value, point a phony StringInfo
				 * at the right piece of the message buffer.  We assume it
				 * is OK to scribble on that buffer in order to keep the
				 * convention that a StringInfo has a trailing null.
				 * Grotty, but a big win for very large parameter strings.
				 */
				pbuf.data = (char *) pvalue;
				pbuf.maxlen = plength + 1;
				pbuf.len = plength;
				pbuf.cursor = 0;

				saved_byte = pbuf.data[plength];
				pbuf.data[plength] = '\0';

				switch (pformat)
				{
					case 0:
						{
							/* text: run the type's input function */
							Oid			typinput;
							Oid			typioparam;
							char	   *pstring;

							getTypeInputInfo(ptype, &typinput, &typioparam);

							/*
							 * Encoding conversion has to happen before
							 * the typinput routine is called.
							 */
							pstring = (char *)
								pg_client_to_server((unsigned char *) pbuf.data,
													plength);
							bound_params[idx].value =
								OidFunctionCall3(typinput,
												 CStringGetDatum(pstring),
												 ObjectIdGetDatum(typioparam),
												 Int32GetDatum(-1));
							/* release the converted copy, if one was made */
							if (pstring != pbuf.data)
								pfree(pstring);
						}
						break;

					case 1:
						{
							/* binary: run the type's receive function */
							Oid			typreceive;
							Oid			typioparam;

							getTypeBinaryInputInfo(ptype, &typreceive, &typioparam);

							bound_params[idx].value =
								OidFunctionCall2(typreceive,
												 PointerGetDatum(&pbuf),
												 ObjectIdGetDatum(typioparam));

							/* it must have consumed the entire value */
							if (pbuf.cursor != pbuf.len)
								ereport(ERROR,
										(errcode(ERRCODE_INVALID_BINARY_REPRESENTATION),
										 errmsg("incorrect binary data format in bind parameter %d",
												idx + 1)));
						}
						break;

					default:
						ereport(ERROR,
								(errcode(ERRCODE_INVALID_PARAMETER_VALUE),
								 errmsg("unsupported format code: %d",
										pformat)));
						break;
				}

				/* put back the byte we overwrote in the message buffer */
				pbuf.data[plength] = saved_byte;
			}

			bound_params[idx].kind = PARAM_NUM;
			bound_params[idx].id = idx + 1;
			bound_params[idx].ptype = ptype;
			bound_params[idx].isnull = isNull;

			idx++;
		}

		/* mark the end of the parameter array */
		bound_params[idx].kind = PARAM_INVALID;

		MemoryContextSwitchTo(saved_context);
	}

	/* Result format codes */
	n_result_formats = pq_getmsgint(input_message, 2);
	if (n_result_formats > 0)
	{
		result_formats = (int16 *) palloc(n_result_formats * sizeof(int16));
		for (idx = 0; idx < n_result_formats; idx++)
			result_formats[idx] = pq_getmsgint(input_message, 2);
	}

	pq_getmsgend(input_message);

	/*
	 * If planning was put off at Parse time, do it now so the planner can
	 * use the concrete parameter values.
	 *
	 * That only happens for unnamed statements, which is why switching
	 * into the statement's own context for planning is correct (see the
	 * notes in exec_parse_message).
	 */
	if (stmt->plan_list == NIL && stmt->query_list != NIL &&
		!xact_aborted)
	{
		MemoryContext saved_context = MemoryContextSwitchTo(stmt->context);

		stmt->plan_list = pg_plan_queries(stmt->query_list, bound_params, true);
		MemoryContextSwitchTo(saved_context);
	}

	/* Attach the statement to the portal and start execution. */
	PortalDefineQuery(portal,
					  stmt->query_string,
					  stmt->commandTag,
					  stmt->query_list,
					  stmt->plan_list,
					  stmt->context);

	PortalStart(portal, bound_params, InvalidSnapshot);

	/* Hand the requested result formats to the portal. */
	PortalSetResultFormat(portal, n_result_formats, result_formats);

	/* Tell the client we are done: BindComplete. */
	if (whereToSendOutput == Remote)
		pq_putemptymessage('2');
}

/*
 * exec_execute_message
 *
 * Process an "Execute" message for a portal
 */
static void
1573
exec_execute_message(const char *portal_name, long max_rows)
1574
{
B
Bruce Momjian 已提交
1575
	CommandDest dest;
1576
	DestReceiver *receiver;
1577 1578 1579 1580 1581 1582 1583 1584 1585
	Portal		portal;
	bool		is_trans_stmt = false;
	bool		is_trans_exit = false;
	bool		completed;
	char		completionTag[COMPLETION_TAG_BUFSIZE];

	/* Adjust destination to tell printtup.c what to do */
	dest = whereToSendOutput;
	if (dest == Remote)
1586
		dest = RemoteExecute;
1587 1588 1589

	portal = GetPortalByName(portal_name);
	if (!PortalIsValid(portal))
1590 1591 1592
		ereport(ERROR,
				(errcode(ERRCODE_UNDEFINED_CURSOR),
				 errmsg("portal \"%s\" does not exist", portal_name)));
1593 1594

	/*
B
Bruce Momjian 已提交
1595 1596
	 * If the original query was a null string, just return
	 * EmptyQueryResponse.
1597 1598 1599 1600 1601 1602 1603 1604 1605 1606 1607 1608 1609 1610 1611 1612 1613 1614 1615 1616 1617 1618 1619 1620
	 */
	if (portal->commandTag == NULL)
	{
		Assert(portal->parseTrees == NIL);
		NullCommand(dest);
		return;
	}

	if (portal->sourceText)
	{
		debug_query_string = portal->sourceText;
		pgstat_report_activity(portal->sourceText);
	}
	else
	{
		debug_query_string = "execute message";
		pgstat_report_activity("<EXECUTE>");
	}

	set_ps_display(portal->commandTag);

	BeginCommand(portal->commandTag, dest);

	/* Check for transaction-control commands */
1621
	if (list_length(portal->parseTrees) == 1)
1622
	{
1623
		Query	   *query = (Query *) linitial(portal->parseTrees);
1624 1625 1626 1627 1628 1629 1630 1631 1632

		if (query->commandType == CMD_UTILITY &&
			query->utilityStmt != NULL &&
			IsA(query->utilityStmt, TransactionStmt))
		{
			TransactionStmt *stmt = (TransactionStmt *) query->utilityStmt;

			is_trans_stmt = true;
			if (stmt->kind == TRANS_STMT_COMMIT ||
1633 1634
				stmt->kind == TRANS_STMT_ROLLBACK ||
				stmt->kind == TRANS_STMT_ROLLBACK_TO)
1635 1636 1637 1638
				is_trans_exit = true;
		}
	}

1639
	/*
B
Bruce Momjian 已提交
1640 1641 1642
	 * Create dest receiver in MessageContext (we don't want it in
	 * transaction context, because that may get deleted if portal
	 * contains VACUUM).
1643 1644 1645
	 */
	receiver = CreateDestReceiver(dest, portal);

1646
	/*
B
Bruce Momjian 已提交
1647 1648
	 * Ensure we are in a transaction command (this should normally be the
	 * case already due to prior BIND).
1649 1650 1651 1652 1653 1654 1655 1656 1657 1658
	 */
	start_xact_command();

	/*
	 * If we are in aborted transaction state, the only portals we can
	 * actually run are those containing COMMIT or ROLLBACK commands.
	 */
	if (IsAbortedTransactionBlockState())
	{
		if (!is_trans_exit)
1659 1660 1661
			ereport(ERROR,
					(errcode(ERRCODE_IN_FAILED_SQL_TRANSACTION),
					 errmsg("current transaction is aborted, "
B
Bruce Momjian 已提交
1662
					"commands ignored until end of transaction block")));
1663 1664 1665 1666 1667 1668 1669 1670 1671 1672 1673 1674 1675
	}

	/* Check for cancel signal before we start execution */
	CHECK_FOR_INTERRUPTS();

	/*
	 * Okay to run the portal.
	 */
	if (max_rows <= 0)
		max_rows = FETCH_ALL;

	completed = PortalRun(portal,
						  max_rows,
1676 1677
						  receiver,
						  receiver,
1678 1679
						  completionTag);

1680
	(*receiver->rDestroy) (receiver);
1681

1682 1683 1684 1685 1686
	if (completed)
	{
		if (is_trans_stmt)
		{
			/*
B
Bruce Momjian 已提交
1687 1688 1689
			 * If this was a transaction control statement, commit it.	We
			 * will start a new xact command for the next command (if
			 * any).
1690
			 */
1691
			finish_xact_command();
1692 1693 1694 1695
		}
		else
		{
			/*
B
Bruce Momjian 已提交
1696 1697
			 * We need a CommandCounterIncrement after every query, except
			 * those that start or end a transaction block.
1698 1699 1700 1701 1702 1703 1704 1705 1706 1707 1708 1709 1710 1711 1712 1713 1714 1715 1716 1717 1718 1719 1720 1721 1722 1723
			 */
			CommandCounterIncrement();
		}

		/* Send appropriate CommandComplete to client */
		EndCommand(completionTag, dest);
	}
	else
	{
		/* Portal run not complete, so send PortalSuspended */
		if (whereToSendOutput == Remote)
			pq_putemptymessage('s');
	}

	debug_query_string = NULL;
}

/*
 * exec_describe_statement_message
 *
 * Process a "Describe" message for a prepared statement
 */
static void
exec_describe_statement_message(const char *stmt_name)
{
	PreparedStatement *pstmt;
1724
	TupleDesc	tupdesc;
1725
	ListCell   *l;
1726 1727 1728 1729 1730 1731 1732 1733 1734 1735
	StringInfoData buf;

	/* Find prepared statement */
	if (stmt_name[0] != '\0')
		pstmt = FetchPreparedStatement(stmt_name, true);
	else
	{
		/* special-case the unnamed statement */
		pstmt = unnamed_stmt_pstmt;
		if (!pstmt)
1736 1737
			ereport(ERROR,
					(errcode(ERRCODE_UNDEFINED_PSTATEMENT),
B
Bruce Momjian 已提交
1738
				   errmsg("unnamed prepared statement does not exist")));
1739 1740 1741 1742 1743
	}

	if (whereToSendOutput != Remote)
		return;					/* can't actually do anything... */

1744 1745 1746
	/*
	 * First describe the parameters...
	 */
B
Bruce Momjian 已提交
1747
	pq_beginmessage(&buf, 't'); /* parameter description message type */
1748
	pq_sendint(&buf, list_length(pstmt->argtype_list), 2);
1749 1750 1751

	foreach(l, pstmt->argtype_list)
	{
1752
		Oid			ptype = lfirst_oid(l);
1753 1754 1755 1756

		pq_sendint(&buf, (int) ptype, 4);
	}
	pq_endmessage(&buf);
1757 1758 1759 1760 1761 1762 1763

	/*
	 * Next send RowDescription or NoData to describe the result...
	 */
	tupdesc = FetchPreparedStatementResultDesc(pstmt);
	if (tupdesc)
	{
B
Bruce Momjian 已提交
1764
		List	   *targetlist;
1765 1766

		if (ChoosePortalStrategy(pstmt->query_list) == PORTAL_ONE_SELECT)
1767
			targetlist = ((Query *) linitial(pstmt->query_list))->targetList;
1768 1769
		else
			targetlist = NIL;
1770
		SendRowDescriptionMessage(tupdesc, targetlist, NULL);
1771 1772 1773 1774
	}
	else
		pq_putemptymessage('n');	/* NoData */

1775 1776 1777 1778 1779 1780 1781 1782 1783 1784 1785 1786 1787 1788
}

/*
 * exec_describe_portal_message
 *
 * Process a "Describe" message for a portal
 */
static void
exec_describe_portal_message(const char *portal_name)
{
	Portal		portal;

	portal = GetPortalByName(portal_name);
	if (!PortalIsValid(portal))
1789 1790 1791
		ereport(ERROR,
				(errcode(ERRCODE_UNDEFINED_CURSOR),
				 errmsg("portal \"%s\" does not exist", portal_name)));
1792 1793 1794 1795 1796

	if (whereToSendOutput != Remote)
		return;					/* can't actually do anything... */

	if (portal->tupDesc)
1797
	{
B
Bruce Momjian 已提交
1798
		List	   *targetlist;
1799 1800

		if (portal->strategy == PORTAL_ONE_SELECT)
1801
			targetlist = ((Query *) linitial(portal->parseTrees))->targetList;
1802 1803
		else
			targetlist = NIL;
1804 1805
		SendRowDescriptionMessage(portal->tupDesc, targetlist,
								  portal->formats);
1806
	}
1807 1808 1809 1810 1811
	else
		pq_putemptymessage('n');	/* NoData */
}


1812 1813 1814 1815 1816 1817
/*
 * Convenience routines for starting/committing a single command.
 */
static void
start_xact_command(void)
{
1818 1819
	if (!xact_started)
	{
1820 1821
		ereport(DEBUG3,
				(errmsg_internal("StartTransactionCommand")));
1822
		StartTransactionCommand();
1823 1824 1825 1826

		/* Set statement timeout running, if any */
		if (StatementTimeout > 0)
			enable_sig_alarm(StatementTimeout, true);
1827

1828 1829
		xact_started = true;
	}
1830 1831 1832
}

static void
1833
finish_xact_command(void)
1834
{
1835 1836 1837 1838
	if (xact_started)
	{
		/* Cancel any active statement timeout before committing */
		disable_sig_alarm(true);
1839

1840
		/* Now commit the command */
1841 1842
		ereport(DEBUG3,
				(errmsg_internal("CommitTransactionCommand")));
1843

1844
		CommitTransactionCommand();
1845

1846 1847 1848 1849 1850 1851
#ifdef MEMORY_CONTEXT_CHECKING
		/* Check all memory contexts that weren't freed during commit */
		/* (those that were, were checked before being deleted) */
		MemoryContextCheck(TopMemoryContext);
#endif

1852
#ifdef SHOW_MEMORY_STATS
1853
		/* Print mem stats after each commit for leak tracking */
1854 1855
		if (ShowStats)
			MemoryContextStats(TopMemoryContext);
1856
#endif
1857 1858 1859

		xact_started = false;
	}
1860 1861 1862
}


1863
/* --------------------------------
 *		signal handler routines used in PostgresMain()
 * --------------------------------
 */

1868
/*
T
Tom Lane 已提交
1869
 * quickdie() occurs when signalled SIGQUIT by the postmaster.
1870 1871 1872 1873
 *
 * Some backend has bought the farm,
 * so we need to stop what we're doing and exit.
 */
T
Tom Lane 已提交
1874
void
1875
quickdie(SIGNAL_ARGS)
1876
{
1877
	PG_SETMASK(&BlockSig);
B
Bruce Momjian 已提交
1878

1879
	/*
B
Bruce Momjian 已提交
1880
	 * Ideally this should be ereport(FATAL), but then we'd not get
1881
	 * control back...
1882 1883 1884
	 */
	ereport(WARNING,
			(errcode(ERRCODE_CRASH_SHUTDOWN),
B
Bruce Momjian 已提交
1885 1886 1887 1888 1889
			 errmsg("terminating connection because of crash of another server process"),
			 errdetail("The postmaster has commanded this server process to roll back"
					 " the current transaction and exit, because another"
			   " server process exited abnormally and possibly corrupted"
					   " shared memory."),
1890
			 errhint("In a moment you should be able to reconnect to the"
1891
					 " database and repeat your command.")));
B
Bruce Momjian 已提交
1892

1893
	/*
1894 1895 1896 1897
	 * DO NOT proc_exit() -- we're here because shared memory may be
	 * corrupted, so we don't want to try to clean up our transaction.
	 * Just nail the windows shut and get out of town.
	 *
B
Bruce Momjian 已提交
1898 1899 1900 1901
	 * Note we do exit(1) not exit(0).	This is to force the postmaster into
	 * a system reset cycle if some idiot DBA sends a manual SIGQUIT to a
	 * random backend.	This is necessary precisely because we don't clean
	 * up our shared memory state.
1902
	 */
1903
	exit(1);
1904 1905
}

1906
/*
1907 1908
 * Shutdown signal from postmaster: abort transaction and exit
 * at soonest convenient time
1909
 */
1910
void
1911
die(SIGNAL_ARGS)
1912
{
1913 1914 1915
	int			save_errno = errno;

	/* Don't joggle the elbow of proc_exit */
B
Bruce Momjian 已提交
1916
	if (!proc_exit_inprogress)
1917
	{
1918
		InterruptPending = true;
1919
		ProcDiePending = true;
B
Bruce Momjian 已提交
1920

1921
		/*
B
Bruce Momjian 已提交
1922 1923
		 * If it's safe to interrupt, and we're waiting for input or a
		 * lock, service the interrupt immediately
1924
		 */
1925 1926
		if (ImmediateInterruptOK && InterruptHoldoffCount == 0 &&
			CritSectionCount == 0)
1927
		{
1928 1929 1930
			/* bump holdoff count to make ProcessInterrupts() a no-op */
			/* until we are done getting ready for it */
			InterruptHoldoffCount++;
1931
			DisableNotifyInterrupt();
1932
			DisableCatchupInterrupt();
1933
			/* Make sure CheckDeadLock won't run while shutting down... */
1934
			LockWaitCancel();
1935
			InterruptHoldoffCount--;
1936 1937
			ProcessInterrupts();
		}
1938
	}
1939 1940

	errno = save_errno;
1941 1942
}

1943
/*
 * authdie() handles a timeout or a shutdown signal from the postmaster
 * that arrives during client authentication.  It simply does exit(0).
 *
 * XXX: a possible future improvement would be to try to send a message
 * saying why we are disconnecting.  The difficulty is making sure that
 * doing so neither blocks nor disturbs the authentication message
 * exchange.
 */
void
authdie(SIGNAL_ARGS)
{
	exit(0);
}

1957
/*
1958 1959
 * Query-cancel signal from postmaster: abort current transaction
 * at soonest convenient time
1960
 */
1961
static void
1962
StatementCancelHandler(SIGNAL_ARGS)
1963
{
1964 1965
	int			save_errno = errno;

B
Bruce Momjian 已提交
1966
	/*
1967
	 * Don't joggle the elbow of proc_exit
B
Bruce Momjian 已提交
1968
	 */
1969
	if (!proc_exit_inprogress)
1970
	{
1971 1972
		InterruptPending = true;
		QueryCancelPending = true;
B
Bruce Momjian 已提交
1973

1974
		/*
1975
		 * If it's safe to interrupt, and we're waiting for a lock,
B
Bruce Momjian 已提交
1976 1977
		 * service the interrupt immediately.  No point in interrupting if
		 * we're waiting for input, however.
1978
		 */
1979
		if (ImmediateInterruptOK && InterruptHoldoffCount == 0 &&
1980
			CritSectionCount == 0)
1981
		{
1982 1983 1984 1985 1986 1987
			/* bump holdoff count to make ProcessInterrupts() a no-op */
			/* until we are done getting ready for it */
			InterruptHoldoffCount++;
			if (LockWaitCancel())
			{
				DisableNotifyInterrupt();
1988
				DisableCatchupInterrupt();
T
Tom Lane 已提交
1989
				InterruptHoldoffCount--;
1990 1991 1992 1993
				ProcessInterrupts();
			}
			else
				InterruptHoldoffCount--;
1994
		}
1995 1996
	}

1997
	errno = save_errno;
1998 1999
}

2000 2001 2002 2003
/* signal handler for floating point exception */
static void
FloatExceptionHandler(SIGNAL_ARGS)
{
2004 2005 2006
	ereport(ERROR,
			(errcode(ERRCODE_FLOATING_POINT_EXCEPTION),
			 errmsg("floating-point exception"),
B
Bruce Momjian 已提交
2007 2008 2009
		   errdetail("An invalid floating-point operation was signaled. "
					 "This probably means an out-of-range result or an "
					 "invalid operation, such as division by zero.")));
2010 2011
}

2012
/* SIGHUP: set flag to re-read config file at next convenient time */
2013
static void
2014
SigHupHandler(SIGNAL_ARGS)
2015
{
2016
	got_SIGHUP = true;
2017 2018
}

2019

2020 2021 2022 2023 2024 2025 2026 2027 2028 2029
/*
 * ProcessInterrupts: out-of-line portion of CHECK_FOR_INTERRUPTS() macro
 *
 * If an interrupt condition is pending, and it's safe to service it,
 * then clear the flag and accept the interrupt.  Called only when
 * InterruptPending is true.
 */
void
ProcessInterrupts(void)
{
2030 2031
	/* OK to accept interrupt now? */
	if (InterruptHoldoffCount != 0 || CritSectionCount != 0)
2032 2033 2034 2035 2036
		return;
	InterruptPending = false;
	if (ProcDiePending)
	{
		ProcDiePending = false;
B
Bruce Momjian 已提交
2037 2038
		QueryCancelPending = false;		/* ProcDie trumps QueryCancel */
		ImmediateInterruptOK = false;	/* not idle anymore */
2039
		DisableNotifyInterrupt();
2040
		DisableCatchupInterrupt();
2041 2042
		ereport(FATAL,
				(errcode(ERRCODE_ADMIN_SHUTDOWN),
B
Bruce Momjian 已提交
2043
		 errmsg("terminating connection due to administrator command")));
2044 2045 2046 2047
	}
	if (QueryCancelPending)
	{
		QueryCancelPending = false;
B
Bruce Momjian 已提交
2048
		ImmediateInterruptOK = false;	/* not idle anymore */
2049
		DisableNotifyInterrupt();
2050
		DisableCatchupInterrupt();
2051 2052 2053
		ereport(ERROR,
				(errcode(ERRCODE_QUERY_CANCELED),
				 errmsg("canceling query due to user request")));
2054 2055 2056 2057
	}
	/* If we get here, do nothing (probably, QueryCancelPending was reset) */
}

2058

2059 2060 2061 2062 2063 2064 2065 2066 2067 2068 2069 2070 2071
/*
 * check_stack_depth: check for excessively deep recursion
 *
 * This should be called someplace in any recursive routine that might possibly
 * recurse deep enough to overflow the stack.  Most Unixen treat stack
 * overflow as an unrecoverable SIGSEGV, so we want to error out ourselves
 * before hitting the hardware limit.  Unfortunately we have no direct way
 * to detect the hardware limit, so we have to rely on the admin to set a
 * GUC variable for it ...
 */
void
check_stack_depth(void)
{
B
Bruce Momjian 已提交
2072 2073
	char		stack_top_loc;
	int			stack_depth;
2074 2075 2076 2077 2078

	/*
	 * Compute distance from PostgresMain's local variables to my own
	 *
	 * Note: in theory stack_depth should be ptrdiff_t or some such, but
B
Bruce Momjian 已提交
2079 2080
	 * since the whole point of this code is to bound the value to
	 * something much less than integer-sized, int should work fine.
2081 2082
	 */
	stack_depth = (int) (stack_base_ptr - &stack_top_loc);
B
Bruce Momjian 已提交
2083

2084
	/*
B
Bruce Momjian 已提交
2085 2086
	 * Take abs value, since stacks grow up on some machines, down on
	 * others
2087 2088 2089
	 */
	if (stack_depth < 0)
		stack_depth = -stack_depth;
B
Bruce Momjian 已提交
2090

2091 2092 2093 2094
	/*
	 * Trouble?
	 *
	 * The test on stack_base_ptr prevents us from erroring out if called
B
Bruce Momjian 已提交
2095 2096 2097
	 * during process setup or in a non-backend process.  Logically it
	 * should be done first, but putting it here avoids wasting cycles
	 * during normal cases.
2098 2099 2100 2101 2102 2103 2104 2105 2106 2107 2108 2109 2110 2111 2112 2113 2114 2115 2116 2117 2118 2119
	 */
	if (stack_depth > max_stack_depth_bytes &&
		stack_base_ptr != NULL)
	{
		ereport(ERROR,
				(errcode(ERRCODE_STATEMENT_TOO_COMPLEX),
				 errmsg("stack depth limit exceeded"),
				 errhint("Increase the configuration parameter \"max_stack_depth\".")));
	}
}

/*
 * assign_max_stack_depth: GUC assign hook for max_stack_depth.
 *
 * Keeps max_stack_depth_bytes in step with the setting by storing
 * newval * 1024 when "doit" is true.  Always returns true; the range check
 * on newval was already handled by guc.c.
 */
bool
assign_max_stack_depth(int newval, bool doit, GucSource source)
{
	if (!doit)
		return true;

	max_stack_depth_bytes = newval * 1024;
	return true;
}


2120
/*
 * usage: print the command-line help text for the stand-alone backend
 * to stdout.
 *
 * progname is the program name to show in the banner and usage line.
 *
 * The letters listed for -f must stay in step with the plan types that the
 * -f option parser in PostgresMain accepts: s (seqscan), i (indexscan),
 * b (bitmapscan), t (tidscan), n (nestloop), m (mergejoin), h (hashjoin).
 */
static void
usage(const char *progname)
{
	printf(_("%s is the PostgreSQL stand-alone backend.  It is not\nintended to be used by normal users.\n\n"), progname);

	printf(_("Usage:\n  %s [OPTION]... [DBNAME]\n\n"), progname);
	printf(_("Options:\n"));
#ifdef USE_ASSERT_CHECKING
	printf(_("  -A 1|0          enable/disable run-time assert checking\n"));
#endif
	printf(_("  -B NBUFFERS     number of shared buffers\n"));
	printf(_("  -c NAME=VALUE   set run-time parameter\n"));
	printf(_("  -d 0-5          debugging level (0 is off)\n"));
	printf(_("  -D DATADIR      database directory\n"));
	printf(_("  -e              use European date input format (DMY)\n"));
	printf(_("  -E              echo query before execution\n"));
	printf(_("  -F              turn fsync off\n"));
	printf(_("  -N              do not use newline as interactive query delimiter\n"));
	printf(_("  -o FILENAME     send stdout and stderr to given file\n"));
	printf(_("  -P              disable system indexes\n"));
	printf(_("  -s              show statistics after each query\n"));
	printf(_("  -S WORK-MEM     set amount of memory for sorts (in kB)\n"));
	printf(_("  --describe-config  describe configuration parameters, then exit\n"));
	printf(_("  --help          show this help, then exit\n"));
	printf(_("  --version       output version information, then exit\n"));
	printf(_("\nDeveloper options:\n"));
	/* previously omitted the accepted 'b' and 't' plan-type letters */
	printf(_("  -f s|i|b|t|n|m|h  forbid use of some plan types\n"));
	printf(_("  -i              do not execute queries\n"));
	printf(_("  -O              allow system table structure changes\n"));
	printf(_("  -t pa|pl|ex     show timings after each query\n"));
	printf(_("  -W NUM          wait NUM seconds to allow attach from a debugger\n"));
	printf(_("\nReport bugs to <pgsql-bugs@postgresql.org>.\n"));
}

2154

2155 2156 2157 2158 2159 2160 2161 2162 2163 2164 2165 2166 2167 2168 2169 2170 2171 2172 2173 2174 2175 2176 2177 2178 2179 2180 2181 2182 2183 2184 2185 2186 2187 2188 2189
/*
 * set_debug_options --- apply "-d N" command line option
 *
 * This differs from simply setting log_min_messages, because higher debug
 * levels also switch on additional output options.
 *
 * debug_flag is the requested level; context and source are handed through
 * unchanged to every SetConfigOption() call.
 */
void
set_debug_options(int debug_flag, GucContext context, GucSource source)
{
	/* Options turned on once debug_flag reaches min_level, in this order */
	static const struct
	{
		int			min_level;
		const char *name;
		const char *value;
	}			extras[] =
	{
		{2, "log_statement", "all"},
		{3, "debug_print_parse", "true"},
		{4, "debug_print_plan", "true"},
		{5, "debug_print_rewritten", "true"}
	};
	char		levelname[64];
	const char *min_messages = "notice";
	int			i;

	/* A positive level maps to "debugN"; anything else falls back to notice */
	if (debug_flag > 0)
	{
		sprintf(levelname, "debug%d", debug_flag);
		min_messages = levelname;
	}
	SetConfigOption("log_min_messages", min_messages, context, source);

	/* Connection logging is only switched on in postmaster context */
	if (debug_flag >= 1 && context == PGC_POSTMASTER)
	{
		SetConfigOption("log_connections", "true", context, source);
		SetConfigOption("log_disconnections", "true", context, source);
	}

	for (i = 0; i < (int) (sizeof(extras) / sizeof(extras[0])); i++)
	{
		if (debug_flag >= extras[i].min_level)
			SetConfigOption(extras[i].name, extras[i].value, context, source);
	}
}


2190
/* ----------------------------------------------------------------
2191
 * PostgresMain
B
Bruce Momjian 已提交
2192
 *	   postgres main loop -- all backends, interactive or otherwise start here
2193
 *
2194 2195 2196 2197
 * argc/argv are the command line arguments to be used.  (When being forked
 * by the postmaster, these are not the original argv array of the process.)
 * username is the (possibly authenticated) PostgreSQL user name to be used
 * for the session.
2198 2199 2200
 * ----------------------------------------------------------------
 */
int
2201
PostgresMain(int argc, char *argv[], const char *username)
2202
{
2203
	int			flag;
2204
	const char *dbname = NULL;
2205
	char	   *userDoption = NULL;
2206
	bool		secure;
2207
	int			errs = 0;
2208
	int			debug_flag = -1;		/* -1 means not given */
2209
	List	   *guc_names = NIL;		/* for SUSET options */
2210 2211
	List	   *guc_values = NIL;
	GucContext	ctx;
2212
	GucSource	gucsource;
2213
	bool		am_superuser;
2214
	char	   *tmp;
2215
	int			firstchar;
2216
	char		stack_base;
B
Bruce Momjian 已提交
2217
	StringInfoData input_message;
2218
	sigjmp_buf	local_sigjmp_buf;
2219
	volatile bool send_rfq = true;
B
Bruce Momjian 已提交
2220

2221 2222 2223 2224
#define PendingConfigOption(name,val) \
	(guc_names = lappend(guc_names, pstrdup(name)), \
	 guc_values = lappend(guc_values, pstrdup(val)))

2225
	/*
B
Bruce Momjian 已提交
2226 2227
	 * Catch standard options before doing much else.  This even works on
	 * systems without getopt_long.
2228 2229 2230
	 */
	if (!IsUnderPostmaster && argc > 1)
	{
B
Bruce Momjian 已提交
2231
		if (strcmp(argv[1], "--help") == 0 || strcmp(argv[1], "-?") == 0)
2232 2233 2234 2235
		{
			usage(argv[0]);
			exit(0);
		}
B
Bruce Momjian 已提交
2236
		if (strcmp(argv[1], "--version") == 0 || strcmp(argv[1], "-V") == 0)
2237
		{
2238
			puts(PG_VERSIONSTR);
2239 2240
			exit(0);
		}
B
Bruce Momjian 已提交
2241
	}
2242

2243 2244 2245 2246 2247 2248
	/*
	 * initialize globals (already done if under postmaster, but not if
	 * standalone; cheap enough to do over)
	 */
	MyProcPid = getpid();

2249 2250 2251 2252 2253
	/*
	 * Fire up essential subsystems: error and memory management
	 *
	 * If we are running under the postmaster, this is done already.
	 */
2254
	if (!IsUnderPostmaster)
2255 2256
		MemoryContextInit();

2257 2258
	set_ps_display("startup");

2259 2260
	SetProcessingMode(InitProcessing);

2261 2262 2263
	/* Set up reference point for stack depth checking */
	stack_base_ptr = &stack_base;

2264 2265 2266 2267 2268 2269 2270
	/* Compute paths, if we didn't inherit them from postmaster */
	if (my_exec_path[0] == '\0')
	{
		if (find_my_exec(argv[0], my_exec_path) < 0)
			elog(FATAL, "%s: could not locate my own executable path",
				 argv[0]);
	}
B
Bruce Momjian 已提交
2271

B
Bruce Momjian 已提交
2272 2273
	if (pkglib_path[0] == '\0')
		get_pkglib_path(my_exec_path, pkglib_path);
2274

2275
	/*
2276
	 * Set default values for command-line options.
2277
	 */
2278
	EchoQuery = false;
2279

2280
	if (!IsUnderPostmaster)
2281
		InitializeGUCOptions();
2282

2283 2284 2285 2286 2287 2288 2289 2290 2291 2292 2293 2294 2295 2296 2297 2298 2299
	/* ----------------
	 *	parse command line arguments
	 *
	 *	There are now two styles of command line layout for the backend:
	 *
	 *	For interactive use (not started from postmaster) the format is
	 *		postgres [switches] [databasename]
	 *	If the databasename is omitted it is taken to be the user name.
	 *
	 *	When started from the postmaster, the format is
	 *		postgres [secure switches] -p databasename [insecure switches]
	 *	Switches appearing after -p came from the client (via "options"
	 *	field of connection request).  For security reasons we restrict
	 *	what these switches can do.
	 * ----------------
	 */

2300 2301
	/* all options are allowed until '-p' */
	secure = true;
2302
	ctx = PGC_POSTMASTER;
2303
	gucsource = PGC_S_ARGV;		/* initial switches came from command line */
2304

2305
	while ((flag = getopt(argc, argv, "A:B:c:D:d:Eef:FiNOPo:p:S:st:v:W:-:")) != -1)
2306
	{
2307 2308
		switch (flag)
		{
M
 
Marc G. Fournier 已提交
2309 2310
			case 'A':
#ifdef USE_ASSERT_CHECKING
2311
				SetConfigOption("debug_assertions", optarg, ctx, gucsource);
M
 
Marc G. Fournier 已提交
2312
#else
2313 2314 2315
				ereport(WARNING,
						(errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
						 errmsg("assert checking is not compiled in")));
M
 
Marc G. Fournier 已提交
2316 2317
#endif
				break;
2318

2319
			case 'B':
2320 2321 2322

				/*
				 * specify the size of buffer pool
2323
				 */
2324
				SetConfigOption("shared_buffers", optarg, ctx, gucsource);
2325
				break;
2326

2327
			case 'D':			/* PGDATA or config directory */
2328
				if (secure)
2329
					userDoption = optarg;
M
 
Marc G. Fournier 已提交
2330
				break;
2331

2332
			case 'd':			/* debug level */
2333
				debug_flag = atoi(optarg);
2334
				break;
2335 2336

			case 'E':
2337 2338 2339

				/*
				 * E - echo the query the user entered
2340
				 */
2341
				EchoQuery = true;
2342
				break;
2343 2344

			case 'e':
2345 2346

				/*
2347
				 * Use European date input format (DMY)
2348
				 */
2349
				SetConfigOption("datestyle", "euro", ctx, gucsource);
2350
				break;
2351 2352

			case 'F':
2353 2354 2355

				/*
				 * turn off fsync
2356
				 */
2357
				SetConfigOption("fsync", "false", ctx, gucsource);
2358
				break;
2359 2360

			case 'f':
2361 2362 2363

				/*
				 * f - forbid generation of certain plans
2364
				 */
2365
				tmp = NULL;
2366 2367 2368
				switch (optarg[0])
				{
					case 's':	/* seqscan */
2369
						tmp = "enable_seqscan";
2370 2371
						break;
					case 'i':	/* indexscan */
2372
						tmp = "enable_indexscan";
2373
						break;
2374 2375 2376
					case 'b':	/* bitmapscan */
						tmp = "enable_bitmapscan";
						break;
2377
					case 't':	/* tidscan */
2378
						tmp = "enable_tidscan";
2379 2380
						break;
					case 'n':	/* nestloop */
2381
						tmp = "enable_nestloop";
2382 2383
						break;
					case 'm':	/* mergejoin */
2384
						tmp = "enable_mergejoin";
2385 2386
						break;
					case 'h':	/* hashjoin */
2387
						tmp = "enable_hashjoin";
2388 2389 2390 2391
						break;
					default:
						errs++;
				}
2392
				if (tmp)
2393
					SetConfigOption(tmp, "false", ctx, gucsource);
2394 2395
				break;

2396
			case 'N':
2397 2398 2399

				/*
				 * N - Don't use newline as a query delimiter
2400 2401 2402
				 */
				UseNewLine = 0;
				break;
2403

2404
			case 'O':
2405 2406 2407

				/*
				 * allow system table structure modifications
2408
				 */
2409 2410
				if (secure)		/* XXX safe to allow from client??? */
					allowSystemTableMods = true;
2411 2412
				break;

H
Hiroshi Inoue 已提交
2413
			case 'P':
2414 2415 2416

				/*
				 * ignore system indexes
2417
				 *
B
Bruce Momjian 已提交
2418 2419 2420
				 * As of PG 7.4 this is safe to allow from the client, since
				 * it only disables reading the system indexes, not
				 * writing them.  Worst case consequence is slowness.
H
Hiroshi Inoue 已提交
2421
				 */
2422
				IgnoreSystemIndexes(true);
H
Hiroshi Inoue 已提交
2423 2424
				break;

T
Tom Lane 已提交
2425
			case 'o':
2426 2427 2428

				/*
				 * o - send output (stdout and stderr) to the given file
T
Tom Lane 已提交
2429
				 */
2430 2431
				if (secure)
					StrNCpy(OutputFileName, optarg, MAXPGPATH);
T
Tom Lane 已提交
2432 2433
				break;

2434
			case 'p':
B
Bruce Momjian 已提交
2435

2436 2437 2438
				/*
				 * p - special flag passed if backend was forked by a
				 * postmaster.
2439
				 */
2440 2441
				if (secure)
				{
2442
					dbname = strdup(optarg);
2443

B
Bruce Momjian 已提交
2444 2445
					secure = false;		/* subsequent switches are NOT
										 * secure */
2446
					ctx = PGC_BACKEND;
2447
					gucsource = PGC_S_CLIENT;
2448
				}
2449
				break;
2450

2451
			case 'S':
2452 2453 2454

				/*
				 * S - amount of sort memory to use in 1k bytes
2455
				 */
2456
				SetConfigOption("work_mem", optarg, ctx, gucsource);
2457
				break;
2458 2459

			case 's':
2460 2461 2462

				/*
				 * s - report usage statistics (timings) after each query
2463 2464 2465
				 *
				 * Since log options are SUSET, we need to postpone unless
				 * still in secure context
2466
				 */
2467 2468 2469 2470 2471
				if (ctx == PGC_BACKEND)
					PendingConfigOption("log_statement_stats", "true");
				else
					SetConfigOption("log_statement_stats", "true",
									ctx, gucsource);
M
 
Marc G. Fournier 已提交
2472 2473
				break;

2474
			case 't':
2475
				/* ---------------
2476 2477 2478 2479 2480 2481 2482 2483 2484
				 *	tell postgres to report usage statistics (timings) for
				 *	each query
				 *
				 *	-tpa[rser] = print stats for parser time of each query
				 *	-tpl[anner] = print stats for planner time of each query
				 *	-te[xecutor] = print stats for executor time of each query
				 *	caution: -s can not be used together with -t.
				 * ----------------
				 */
2485
				tmp = NULL;
2486 2487 2488 2489
				switch (optarg[0])
				{
					case 'p':
						if (optarg[1] == 'a')
B
Rename:  
Bruce Momjian 已提交
2490
							tmp = "log_parser_stats";
2491
						else if (optarg[1] == 'l')
B
Rename:  
Bruce Momjian 已提交
2492
							tmp = "log_planner_stats";
2493 2494 2495 2496
						else
							errs++;
						break;
					case 'e':
2497
						tmp = "log_executor_stats";
2498 2499 2500 2501 2502
						break;
					default:
						errs++;
						break;
				}
2503
				if (tmp)
2504 2505 2506 2507 2508 2509
				{
					if (ctx == PGC_BACKEND)
						PendingConfigOption(tmp, "true");
					else
						SetConfigOption(tmp, "true", ctx, gucsource);
				}
2510 2511
				break;

2512
			case 'v':
2513 2514
				if (secure)
					FrontendProtocol = (ProtocolVersion) atoi(optarg);
2515 2516
				break;

M
 
Marc G. Fournier 已提交
2517
			case 'W':
2518 2519 2520

				/*
				 * wait N seconds to allow attach from a debugger
M
 
Marc G. Fournier 已提交
2521
				 */
B
Bruce Momjian 已提交
2522
				pg_usleep(atoi(optarg) * 1000000L);
M
 
Marc G. Fournier 已提交
2523 2524
				break;

2525
			case 'c':
2526
			case '-':
2527
				{
B
Bruce Momjian 已提交
2528 2529
					char	   *name,
							   *value;
2530

B
Bruce Momjian 已提交
2531 2532 2533 2534
					ParseLongOption(optarg, &name, &value);
					if (!value)
					{
						if (flag == '-')
2535 2536 2537 2538
							ereport(ERROR,
									(errcode(ERRCODE_SYNTAX_ERROR),
									 errmsg("--%s requires a value",
											optarg)));
B
Bruce Momjian 已提交
2539
						else
2540 2541 2542 2543
							ereport(ERROR,
									(errcode(ERRCODE_SYNTAX_ERROR),
									 errmsg("-c %s requires a value",
											optarg)));
B
Bruce Momjian 已提交
2544 2545
					}

2546 2547 2548 2549 2550 2551 2552 2553
					/*
					 * If a SUSET option, must postpone evaluation, unless
					 * we are still reading secure switches.
					 */
					if (ctx == PGC_BACKEND && IsSuperuserConfigOption(name))
						PendingConfigOption(name, value);
					else
						SetConfigOption(name, value, ctx, gucsource);
B
Bruce Momjian 已提交
2554 2555 2556 2557 2558
					free(name);
					if (value)
						free(value);
					break;
				}
2559

2560 2561
			default:
				errs++;
T
Tom Lane 已提交
2562
				break;
2563
		}
2564 2565
	}

2566 2567 2568 2569 2570 2571 2572 2573 2574 2575 2576 2577 2578 2579 2580 2581 2582 2583 2584 2585 2586 2587 2588 2589 2590 2591
	/*
	 * Process any additional GUC variable settings passed in startup
	 * packet.  These are handled exactly like command-line variables.
	 */
	if (MyProcPort != NULL)
	{
		ListCell   *gucopts = list_head(MyProcPort->guc_options);

		while (gucopts)
		{
			char	   *name;
			char	   *value;

			name = lfirst(gucopts);
			gucopts = lnext(gucopts);

			value = lfirst(gucopts);
			gucopts = lnext(gucopts);

			if (IsSuperuserConfigOption(name))
				PendingConfigOption(name, value);
			else
				SetConfigOption(name, value, PGC_BACKEND, PGC_S_CLIENT);
		}
	}

2592 2593
	/* Acquire configuration parameters, unless inherited from postmaster */
	if (!IsUnderPostmaster)
2594
	{
2595 2596
		if (!SelectConfigFiles(userDoption, argv[0]))
			proc_exit(1);
2597
	}
2598

2599
	/*
2600
	 * Set up signal handlers and masks.
2601
	 *
2602
	 * Note that postmaster blocked all signals before forking child process,
B
Bruce Momjian 已提交
2603 2604
	 * so there is no race condition whereby we might receive a signal
	 * before we have set up the handler.
T
Tom Lane 已提交
2605 2606
	 *
	 * Also note: it's best not to use any signals that are SIG_IGNored in
B
Bruce Momjian 已提交
2607
	 * the postmaster.	If such a signal arrives before we are able to
2608
	 * change the handler to non-SIG_IGN, it'll get dropped.  Instead,
B
Bruce Momjian 已提交
2609 2610
	 * make a dummy handler in the postmaster to reserve the signal. (Of
	 * course, this isn't an issue for signals that are locally generated,
2611
	 * such as SIGALRM and SIGPIPE.)
2612
	 */
2613
	pqsignal(SIGHUP, SigHupHandler);	/* set flag to read config file */
B
Bruce Momjian 已提交
2614
	pqsignal(SIGINT, StatementCancelHandler);	/* cancel current query */
2615
	pqsignal(SIGTERM, die);		/* cancel current query and exit */
2616
	pqsignal(SIGQUIT, quickdie);	/* hard crash time */
B
Bruce Momjian 已提交
2617
	pqsignal(SIGALRM, handle_sig_alarm);		/* timeout conditions */
2618 2619 2620 2621 2622

	/*
	 * Ignore failure to write to frontend. Note: if frontend closes
	 * connection, we will notice it and exit cleanly when control next
	 * returns to outer loop.  This seems safer than forcing exit in the
2623 2624 2625
	 * midst of output during who-knows-what operation...
	 */
	pqsignal(SIGPIPE, SIG_IGN);
2626 2627
	pqsignal(SIGUSR1, CatchupInterruptHandler);
	pqsignal(SIGUSR2, NotifyInterruptHandler);
2628
	pqsignal(SIGFPE, FloatExceptionHandler);
2629 2630

	/*
B
Bruce Momjian 已提交
2631 2632
	 * Reset some signals that are accepted by postmaster but not by
	 * backend
2633
	 */
2634 2635
	pqsignal(SIGCHLD, SIG_DFL); /* system() requires this on some
								 * platforms */
2636

2637 2638
	pqinitmask();

T
Tom Lane 已提交
2639
	/* We allow SIGQUIT (quickdie) at all times */
2640
#ifdef HAVE_SIGPROCMASK
T
Tom Lane 已提交
2641
	sigdelset(&BlockSig, SIGQUIT);
2642
#else
T
Tom Lane 已提交
2643
	BlockSig &= ~(sigmask(SIGQUIT));
2644 2645
#endif

T
Tom Lane 已提交
2646
	PG_SETMASK(&BlockSig);		/* block everything except SIGQUIT */
2647

2648

2649
	if (IsUnderPostmaster)
2650
	{
2651
		/* noninteractive case: nothing should be left after switches */
2652
		if (errs || argc != optind || dbname == NULL)
2653
		{
2654 2655
			ereport(FATAL,
					(errcode(ERRCODE_SYNTAX_ERROR),
B
Bruce Momjian 已提交
2656 2657
			 errmsg("invalid command-line arguments for server process"),
			errhint("Try \"%s --help\" for more information.", argv[0])));
2658
		}
2659

2660 2661 2662
		XLOGPathInit();

		BaseInit();
2663
	}
2664
	else
2665
	{
2666 2667 2668
		/* interactive case: database name can be last arg on command line */
		if (errs || argc - optind > 1)
		{
2669 2670 2671 2672
			ereport(FATAL,
					(errcode(ERRCODE_SYNTAX_ERROR),
					 errmsg("%s: invalid command-line arguments",
							argv[0]),
B
Bruce Momjian 已提交
2673
			errhint("Try \"%s --help\" for more information.", argv[0])));
2674 2675
		}
		else if (argc - optind == 1)
2676 2677
			dbname = argv[optind];
		else if ((dbname = username) == NULL)
2678
		{
2679 2680 2681 2682
			ereport(FATAL,
					(errcode(ERRCODE_INVALID_PARAMETER_VALUE),
					 errmsg("%s: no database nor user name specified",
							argv[0])));
2683
		}
2684

2685
		/*
2686 2687
		 * Validate we have been given a reasonable-looking DataDir (if
		 * under postmaster, assume postmaster did this already).
2688
		 */
2689
		Assert(DataDir);
2690 2691
		ValidatePgVersion(DataDir);

2692
		/*
2693
		 * Create lockfile for data directory.
2694
		 */
2695
		CreateDataDirLockFile(DataDir, false);
2696

2697
		XLOGPathInit();
2698
		BaseInit();
2699 2700 2701 2702 2703

		/*
		 * Start up xlog for standalone backend, and register to have it
		 * closed down at exit.
		 */
2704
		StartupXLOG();
2705
		on_shmem_exit(ShutdownXLOG, 0);
2706 2707 2708 2709 2710 2711 2712

		/*
		 * Read any existing FSM cache file, and register to write one out
		 * at exit.
		 */
		LoadFreeSpaceMap();
		on_shmem_exit(DumpFreeSpaceMap, 0);
2713 2714 2715 2716 2717 2718

		/*
		 * We have to build the flat file for pg_database, but not for
		 * the user and group tables, since we won't try to do authentication.
		 */
		BuildFlatFiles(true);
2719 2720
	}

2721
	/*
2722 2723 2724 2725 2726
	 * General initialization.
	 *
	 * NOTE: if you are tempted to add code in this vicinity, consider
	 * putting it inside InitPostgres() instead.  In particular, anything
	 * that involves database access should be there, not here.
2727
	 */
2728 2729
	ereport(DEBUG3,
			(errmsg_internal("InitPostgres")));
2730
	am_superuser = InitPostgres(dbname, username);
2731

2732
	SetProcessingMode(NormalProcessing);
2733

2734
	/*
2735 2736
	 * Now that we know if client is a superuser, we can try to apply SUSET
	 * GUC options that came from the client.
2737 2738 2739 2740 2741 2742 2743 2744 2745 2746 2747 2748 2749 2750 2751 2752 2753 2754 2755 2756 2757 2758 2759 2760 2761 2762 2763 2764
	 */
	ctx = am_superuser ? PGC_SUSET : PGC_USERSET;

	if (debug_flag >= 0)
		set_debug_options(debug_flag, ctx, PGC_S_CLIENT);

	if (guc_names != NIL)
	{
		ListCell   *namcell,
				   *valcell;

		forboth(namcell, guc_names, valcell, guc_values)
		{
			char	   *name = (char *) lfirst(namcell);
			char	   *value = (char *) lfirst(valcell);

			SetConfigOption(name, value, ctx, PGC_S_CLIENT);
			pfree(name);
			pfree(value);
		}
	}

	/*
	 * Now all GUC states are fully set up.  Report them to client if
	 * appropriate.
	 */
	BeginReportingGUCOptions();

2765 2766 2767 2768 2769 2770 2771
	/*
	 * Also set up handler to log session end; we have to wait till now
	 * to be sure Log_disconnections has its final value.
	 */
	if (IsUnderPostmaster && Log_disconnections)
		on_proc_exit(log_disconnections, 0);

2772 2773
	/*
	 * Send this backend's cancellation info to the frontend.
2774
	 */
M
 
Marc G. Fournier 已提交
2775 2776 2777
	if (whereToSendOutput == Remote &&
		PG_PROTOCOL_MAJOR(FrontendProtocol) >= 2)
	{
2778
		StringInfoData buf;
B
Bruce Momjian 已提交
2779

2780
		pq_beginmessage(&buf, 'K');
2781 2782 2783
		pq_sendint(&buf, (int32) MyProcPid, sizeof(int32));
		pq_sendint(&buf, (int32) MyCancelKey, sizeof(int32));
		pq_endmessage(&buf);
M
 
Marc G. Fournier 已提交
2784 2785 2786
		/* Need not flush since ReadyForQuery will do it. */
	}

2787 2788
	/* Welcome banner for standalone case */
	if (whereToSendOutput == Debug)
2789
		printf("\nPostgreSQL stand-alone backend %s\n", PG_VERSION);
2790

2791 2792 2793
	/*
	 * Create the memory context we will use in the main loop.
	 *
2794 2795
	 * MessageContext is reset once per iteration of the main loop, ie, upon
	 * completion of processing of each command message from the client.
2796
	 */
2797 2798 2799 2800 2801
	MessageContext = AllocSetContextCreate(TopMemoryContext,
										   "MessageContext",
										   ALLOCSET_DEFAULT_MINSIZE,
										   ALLOCSET_DEFAULT_INITSIZE,
										   ALLOCSET_DEFAULT_MAXSIZE);
2802

2803 2804 2805 2806 2807 2808 2809
	/* ----------
	 * Tell the statistics collector that we're alive and
	 * to which database we belong.
	 * ----------
	 */
	pgstat_bestart();

2810 2811
	/*
	 * POSTGRES main processing loop begins here
2812
	 *
2813 2814
	 * If an exception is encountered, processing resumes here so we abort
	 * the current transaction and start a new one.
2815
	 *
B
Bruce Momjian 已提交
2816 2817
	 * You might wonder why this isn't coded as an infinite loop around a
	 * PG_TRY construct.  The reason is that this is the bottom of the
2818 2819 2820
	 * exception stack, and so with PG_TRY there would be no exception
	 * handler in force at all during the CATCH part.  By leaving the
	 * outermost setjmp always active, we have at least some chance of
B
Bruce Momjian 已提交
2821 2822
	 * recovering from an error during error recovery.	(If we get into an
	 * infinite loop thereby, it will soon be stopped by overflow of
2823
	 * elog.c's internal state stack.)
2824 2825
	 */

2826
	if (sigsetjmp(local_sigjmp_buf, 1) != 0)
2827
	{
2828
		/*
2829
		 * NOTE: if you are tempted to add more code in this if-block,
2830
		 * consider the high probability that it should be in
B
Bruce Momjian 已提交
2831 2832 2833 2834
		 * AbortTransaction() instead.	The only stuff done directly here
		 * should be stuff that is guaranteed to apply *only* for
		 * outer-level error recovery, such as adjusting the FE/BE
		 * protocol status.
2835 2836 2837 2838 2839 2840 2841 2842 2843 2844
		 */

		/* Since not using PG_TRY, must reset error stack by hand */
		error_context_stack = NULL;

		/* Prevent interrupts while cleaning up */
		HOLD_INTERRUPTS();

		/*
		 * Forget any pending QueryCancel request, since we're returning
B
Bruce Momjian 已提交
2845 2846
		 * to the idle loop anyway, and cancel the statement timer if
		 * running.
2847 2848
		 */
		QueryCancelPending = false;
2849
		disable_sig_alarm(true);
B
Bruce Momjian 已提交
2850
		QueryCancelPending = false;		/* again in case timeout occurred */
2851 2852

		/*
B
Bruce Momjian 已提交
2853 2854 2855
		 * Turn off these interrupts too.  This is only needed here and
		 * not in other exception-catching places since these interrupts
		 * are only enabled while we wait for client input.
2856
		 */
2857
		DisableNotifyInterrupt();
2858
		DisableCatchupInterrupt();
2859

2860 2861 2862
		/* Make sure libpq is in a good state */
		pq_comm_reset();

2863 2864
		/* Report the error to the client and/or server log */
		EmitErrorReport();
2865

2866
		/*
B
Bruce Momjian 已提交
2867 2868
		 * Make sure debug_query_string gets reset before we possibly
		 * clobber the storage it points at.
2869
		 */
2870
		debug_query_string = NULL;
2871

2872
		/*
2873
		 * Abort the current transaction in order to recover.
2874
		 */
2875
		AbortCurrentTransaction();
2876 2877

		/*
2878 2879
		 * Now return to normal top-level context and clear ErrorContext
		 * for next time.
2880 2881
		 */
		MemoryContextSwitchTo(TopMemoryContext);
2882
		FlushErrorState();
2883
		QueryContext = NULL;
2884

2885 2886
		/*
		 * If we were handling an extended-query-protocol message,
B
Bruce Momjian 已提交
2887 2888
		 * initiate skip till next Sync.  This also causes us not to issue
		 * ReadyForQuery (until we get Sync).
2889 2890 2891
		 */
		if (doing_extended_query_message)
			ignore_till_sync = true;
2892

2893 2894 2895 2896
		/* We don't have a transaction command open anymore */
		xact_started = false;

		/* Now we can allow interrupts again */
2897
		RESUME_INTERRUPTS();
2898
	}
2899

2900 2901
	/* We can now handle ereport(ERROR) */
	PG_exception_stack = &local_sigjmp_buf;
2902

2903
	PG_SETMASK(&UnBlockSig);
2904

2905 2906
	if (!ignore_till_sync)
		send_rfq = true;		/* initially, or after error */
2907

2908 2909
	/*
	 * Non-error queries loop here.
2910 2911 2912 2913
	 */

	for (;;)
	{
2914
		/*
B
Bruce Momjian 已提交
2915 2916
		 * At top of loop, reset extended-query-message flag, so that any
		 * errors encountered in "idle" state don't provoke skip.
2917 2918 2919
		 */
		doing_extended_query_message = false;

2920
		/*
B
Bruce Momjian 已提交
2921
		 * Release storage left over from prior query cycle, and create a
2922
		 * new query input buffer in the cleared MessageContext.
2923
		 */
2924 2925
		MemoryContextSwitchTo(MessageContext);
		MemoryContextResetAndDeleteChildren(MessageContext);
2926

2927
		initStringInfo(&input_message);
2928

2929
		/*
2930 2931
		 * (1) If we've reached idle state, tell the frontend we're ready
		 * for a new query.
2932
		 *
2933
		 * Note: this includes fflush()'ing the last of the prior output.
2934 2935 2936
		 *
		 * This is also a good time to send collected statistics to the
		 * collector, and to update the PS stats display.  We avoid doing
B
Bruce Momjian 已提交
2937
		 * those every time through the message loop because it'd slow
2938 2939
		 * down processing of batched messages, and because we don't want
		 * to report uncommitted updates (that confuses autovacuum).
B
Bruce Momjian 已提交
2940
		 */
2941 2942
		if (send_rfq)
		{
2943
			if (IsTransactionOrTransactionBlock())
2944 2945 2946 2947 2948 2949
			{
				set_ps_display("idle in transaction");
				pgstat_report_activity("<IDLE> in transaction");
			}
			else
			{
2950 2951
				pgstat_report_tabstat();

2952 2953 2954
				set_ps_display("idle");
				pgstat_report_activity("<IDLE>");
			}
2955

2956 2957
			ReadyForQuery(whereToSendOutput);
			send_rfq = false;
2958
		}
2959

2960 2961 2962 2963
		/*
		 * (2) deal with pending asynchronous NOTIFY from other backends,
		 * and enable async.c's signal handler to execute NOTIFY directly.
		 * Then set up other stuff needed before blocking for input.
2964
		 */
B
Bruce Momjian 已提交
2965 2966
		QueryCancelPending = false;		/* forget any earlier CANCEL
										 * signal */
2967 2968

		EnableNotifyInterrupt();
2969
		EnableCatchupInterrupt();
2970

2971 2972 2973 2974 2975 2976
		/* Allow "die" interrupt to be processed while waiting */
		ImmediateInterruptOK = true;
		/* and don't forget to detect one that already arrived */
		QueryCancelPending = false;
		CHECK_FOR_INTERRUPTS();

2977 2978
		/*
		 * (3) read a command (loop blocks here)
2979
		 */
2980
		firstchar = ReadCommand(&input_message);
2981

2982 2983
		/*
		 * (4) disable async signal conditions again.
2984
		 */
2985
		ImmediateInterruptOK = false;
B
Bruce Momjian 已提交
2986
		QueryCancelPending = false;		/* forget any CANCEL signal */
2987

2988
		DisableNotifyInterrupt();
2989
		DisableCatchupInterrupt();
2990

2991 2992 2993
		/*
		 * (5) check for any other interesting events that happened while
		 * we slept.
2994 2995 2996 2997 2998 2999 3000
		 */
		if (got_SIGHUP)
		{
			got_SIGHUP = false;
			ProcessConfigFile(PGC_SIGHUP);
		}

3001
		/*
B
Bruce Momjian 已提交
3002 3003
		 * (6) process the command.  But ignore it if we're skipping till
		 * Sync.
3004
		 */
3005
		if (ignore_till_sync && firstchar != EOF)
3006 3007
			continue;

3008 3009
		switch (firstchar)
		{
3010
			case 'Q':			/* simple query */
3011
				{
3012 3013
					const char *query_string;

3014 3015
					query_string = pq_getmsgstring(&input_message);
					pq_getmsgend(&input_message);
3016

3017
					exec_simple_query(query_string);
3018

3019 3020
					send_rfq = true;
				}
3021 3022
				break;

3023 3024 3025 3026 3027 3028 3029
			case 'P':			/* parse */
				{
					const char *stmt_name;
					const char *query_string;
					int			numParams;
					Oid		   *paramTypes = NULL;

3030 3031 3032
					stmt_name = pq_getmsgstring(&input_message);
					query_string = pq_getmsgstring(&input_message);
					numParams = pq_getmsgint(&input_message, 2);
3033 3034
					if (numParams > 0)
					{
B
Bruce Momjian 已提交
3035
						int			i;
3036 3037 3038

						paramTypes = (Oid *) palloc(numParams * sizeof(Oid));
						for (i = 0; i < numParams; i++)
3039
							paramTypes[i] = pq_getmsgint(&input_message, 4);
3040
					}
3041
					pq_getmsgend(&input_message);
3042 3043 3044 3045 3046 3047 3048

					exec_parse_message(query_string, stmt_name,
									   paramTypes, numParams);
				}
				break;

			case 'B':			/* bind */
B
Bruce Momjian 已提交
3049

3050
				/*
B
Bruce Momjian 已提交
3051 3052
				 * this message is complex enough that it seems best to
				 * put the field extraction out-of-line
3053
				 */
3054
				exec_bind_message(&input_message);
3055 3056 3057 3058 3059
				break;

			case 'E':			/* execute */
				{
					const char *portal_name;
B
Bruce Momjian 已提交
3060
					int			max_rows;
3061

3062 3063 3064
					portal_name = pq_getmsgstring(&input_message);
					max_rows = pq_getmsgint(&input_message, 4);
					pq_getmsgend(&input_message);
3065

3066
					exec_execute_message(portal_name, max_rows);
3067 3068 3069
				}
				break;

3070 3071
			case 'F':			/* fastpath function call */
				/* Tell the collector what we're doing */
3072 3073
				pgstat_report_activity("<FASTPATH> function call");

3074
				/* start an xact for this function invocation */
3075
				start_xact_command();
3076

3077 3078 3079
				/* switch back to message context */
				MemoryContextSwitchTo(MessageContext);

3080 3081 3082
				/* set snapshot in case function needs one */
				ActiveSnapshot = CopySnapshot(GetTransactionSnapshot());

3083
				if (HandleFunctionRequest(&input_message) == EOF)
3084 3085
				{
					/* lost frontend connection during F message input */
B
Bruce Momjian 已提交
3086

3087
					/*
3088
					 * Reset whereToSendOutput to prevent ereport from
B
Bruce Momjian 已提交
3089
					 * attempting to send any more messages to client.
3090 3091 3092 3093
					 */
					if (whereToSendOutput == Remote)
						whereToSendOutput = None;

3094
					proc_exit(0);
3095
				}
3096 3097

				/* commit the function-invocation transaction */
3098
				finish_xact_command();
3099

3100
				send_rfq = true;
3101 3102
				break;

B
Bruce Momjian 已提交
3103
			case 'C':			/* close */
3104
				{
B
Bruce Momjian 已提交
3105
					int			close_type;
3106 3107
					const char *close_target;

3108 3109 3110
					close_type = pq_getmsgbyte(&input_message);
					close_target = pq_getmsgstring(&input_message);
					pq_getmsgend(&input_message);
3111 3112 3113 3114 3115 3116 3117 3118 3119 3120 3121 3122 3123 3124 3125 3126 3127 3128 3129 3130 3131 3132 3133 3134 3135 3136 3137 3138

					switch (close_type)
					{
						case 'S':
							if (close_target[0] != '\0')
								DropPreparedStatement(close_target, false);
							else
							{
								/* special-case the unnamed statement */
								unnamed_stmt_pstmt = NULL;
								if (unnamed_stmt_context)
								{
									DropDependentPortals(unnamed_stmt_context);
									MemoryContextDelete(unnamed_stmt_context);
								}
								unnamed_stmt_context = NULL;
							}
							break;
						case 'P':
							{
								Portal		portal;

								portal = GetPortalByName(close_target);
								if (PortalIsValid(portal))
									PortalDrop(portal, false);
							}
							break;
						default:
3139 3140
							ereport(ERROR,
									(errcode(ERRCODE_PROTOCOL_VIOLATION),
B
Bruce Momjian 已提交
3141 3142
							   errmsg("invalid CLOSE message subtype %d",
									  close_type)));
3143 3144 3145 3146
							break;
					}

					if (whereToSendOutput == Remote)
B
Bruce Momjian 已提交
3147
						pq_putemptymessage('3');		/* CloseComplete */
3148 3149 3150 3151 3152
				}
				break;

			case 'D':			/* describe */
				{
B
Bruce Momjian 已提交
3153
					int			describe_type;
3154 3155
					const char *describe_target;

3156 3157 3158
					describe_type = pq_getmsgbyte(&input_message);
					describe_target = pq_getmsgstring(&input_message);
					pq_getmsgend(&input_message);
3159 3160 3161 3162 3163 3164 3165 3166 3167 3168

					switch (describe_type)
					{
						case 'S':
							exec_describe_statement_message(describe_target);
							break;
						case 'P':
							exec_describe_portal_message(describe_target);
							break;
						default:
3169 3170
							ereport(ERROR,
									(errcode(ERRCODE_PROTOCOL_VIOLATION),
B
Bruce Momjian 已提交
3171 3172
							errmsg("invalid DESCRIBE message subtype %d",
								   describe_type)));
3173 3174 3175 3176 3177
							break;
					}
				}
				break;

B
Bruce Momjian 已提交
3178
			case 'H':			/* flush */
3179
				pq_getmsgend(&input_message);
3180 3181 3182 3183
				if (whereToSendOutput == Remote)
					pq_flush();
				break;

B
Bruce Momjian 已提交
3184
			case 'S':			/* sync */
3185
				pq_getmsgend(&input_message);
3186
				finish_xact_command();
3187 3188 3189
				send_rfq = true;
				break;

3190
				/*
B
Bruce Momjian 已提交
3191 3192 3193
				 * 'X' means that the frontend is closing down the socket.
				 * EOF means unexpected loss of frontend connection.
				 * Either way, perform normal shutdown.
3194 3195
				 */
			case 'X':
3196
			case EOF:
B
Bruce Momjian 已提交
3197

3198
				/*
B
Bruce Momjian 已提交
3199 3200
				 * Reset whereToSendOutput to prevent ereport from
				 * attempting to send any more messages to client.
3201 3202 3203
				 */
				if (whereToSendOutput == Remote)
					whereToSendOutput = None;
B
Bruce Momjian 已提交
3204

3205 3206
				/*
				 * NOTE: if you are tempted to add more code here, DON'T!
B
Bruce Momjian 已提交
3207 3208
				 * Whatever you had in mind to do should be set up as an
				 * on_proc_exit or on_shmem_exit callback, instead.
3209 3210 3211
				 * Otherwise it will fail to be called during other
				 * backend-shutdown scenarios.
				 */
3212
				proc_exit(0);
3213

B
Bruce Momjian 已提交
3214 3215 3216 3217
			case 'd':			/* copy data */
			case 'c':			/* copy done */
			case 'f':			/* copy fail */

3218
				/*
B
Bruce Momjian 已提交
3219 3220
				 * Accept but ignore these messages, per protocol spec; we
				 * probably got here because a COPY failed, and the
3221 3222 3223 3224
				 * frontend is still sending data.
				 */
				break;

3225
			default:
3226 3227 3228 3229
				ereport(FATAL,
						(errcode(ERRCODE_PROTOCOL_VIOLATION),
						 errmsg("invalid frontend message type %d",
								firstchar)));
3230
		}
3231
	}							/* end of input-reading loop */
3232

3233 3234
	/* can't get here because the above loop never exits */
	Assert(false);
3235

3236
	return 1;					/* keep compiler quiet */
3237 3238
}

3239
#ifndef HAVE_GETRUSAGE
B
Bruce Momjian 已提交
3240 3241
#include "rusagestub.h"
#else
3242
#include <sys/resource.h>
3243
#endif   /* HAVE_GETRUSAGE */
3244

3245 3246
/*
 * Baseline for resource-usage reporting: ResetUsage() fills these in and
 * ShowUsage() reports the difference between them and the current values.
 */
static struct rusage Save_r;	/* getrusage(RUSAGE_SELF) snapshot */
static struct timeval Save_t;	/* gettimeofday() snapshot */
3247 3248

void
3249
ResetUsage(void)
3250
{
3251
	getrusage(RUSAGE_SELF, &Save_r);
3252
	gettimeofday(&Save_t, NULL);
3253
	ResetBufferUsage();
3254
	/* ResetTupleCount(); */
3255 3256 3257
}

void
3258
ShowUsage(const char *title)
3259
{
3260
	StringInfoData str;
3261 3262 3263 3264
	struct timeval user,
				sys;
	struct timeval elapse_t;
	struct rusage r;
B
Bruce Momjian 已提交
3265
	char	   *bufusage;
3266 3267

	getrusage(RUSAGE_SELF, &r);
3268
	gettimeofday(&elapse_t, NULL);
3269 3270
	memcpy((char *) &user, (char *) &r.ru_utime, sizeof(user));
	memcpy((char *) &sys, (char *) &r.ru_stime, sizeof(sys));
3271 3272 3273 3274 3275 3276 3277 3278 3279 3280 3281 3282 3283 3284 3285 3286 3287 3288 3289 3290 3291 3292 3293 3294
	if (elapse_t.tv_usec < Save_t.tv_usec)
	{
		elapse_t.tv_sec--;
		elapse_t.tv_usec += 1000000;
	}
	if (r.ru_utime.tv_usec < Save_r.ru_utime.tv_usec)
	{
		r.ru_utime.tv_sec--;
		r.ru_utime.tv_usec += 1000000;
	}
	if (r.ru_stime.tv_usec < Save_r.ru_stime.tv_usec)
	{
		r.ru_stime.tv_sec--;
		r.ru_stime.tv_usec += 1000000;
	}

	/*
	 * the only stats we don't show here are for memory usage -- i can't
	 * figure out how to interpret the relevant fields in the rusage
	 * struct, and they change names across o/s platforms, anyway. if you
	 * can figure out what the entries mean, you can somehow extract
	 * resident set size, shared text size, and unshared data and stack
	 * sizes.
	 */
3295
	initStringInfo(&str);
3296

3297 3298
	appendStringInfo(&str, "! system usage stats:\n");
	appendStringInfo(&str,
3299
			"!\t%ld.%06ld elapsed %ld.%06ld user %ld.%06ld system sec\n",
3300 3301 3302
					 (long) (elapse_t.tv_sec - Save_t.tv_sec),
					 (long) (elapse_t.tv_usec - Save_t.tv_usec),
					 (long) (r.ru_utime.tv_sec - Save_r.ru_utime.tv_sec),
B
Bruce Momjian 已提交
3303
				   (long) (r.ru_utime.tv_usec - Save_r.ru_utime.tv_usec),
3304
					 (long) (r.ru_stime.tv_sec - Save_r.ru_stime.tv_sec),
B
Bruce Momjian 已提交
3305
				  (long) (r.ru_stime.tv_usec - Save_r.ru_stime.tv_usec));
3306
	appendStringInfo(&str,
B
Bruce Momjian 已提交
3307
					 "!\t[%ld.%06ld user %ld.%06ld sys total]\n",
3308 3309 3310 3311
					 (long) user.tv_sec,
					 (long) user.tv_usec,
					 (long) sys.tv_sec,
					 (long) sys.tv_usec);
3312
/* BeOS has rusage but only has some fields, and not these... */
3313
#if defined(HAVE_GETRUSAGE)
3314
	appendStringInfo(&str,
B
Bruce Momjian 已提交
3315 3316
					 "!\t%ld/%ld [%ld/%ld] filesystem blocks in/out\n",
					 r.ru_inblock - Save_r.ru_inblock,
3317
	/* they only drink coffee at dec */
B
Bruce Momjian 已提交
3318 3319
					 r.ru_oublock - Save_r.ru_oublock,
					 r.ru_inblock, r.ru_oublock);
3320
	appendStringInfo(&str,
3321
		  "!\t%ld/%ld [%ld/%ld] page faults/reclaims, %ld [%ld] swaps\n",
B
Bruce Momjian 已提交
3322 3323 3324 3325 3326
					 r.ru_majflt - Save_r.ru_majflt,
					 r.ru_minflt - Save_r.ru_minflt,
					 r.ru_majflt, r.ru_minflt,
					 r.ru_nswap - Save_r.ru_nswap,
					 r.ru_nswap);
3327
	appendStringInfo(&str,
3328
	 "!\t%ld [%ld] signals rcvd, %ld/%ld [%ld/%ld] messages rcvd/sent\n",
B
Bruce Momjian 已提交
3329 3330 3331 3332 3333
					 r.ru_nsignals - Save_r.ru_nsignals,
					 r.ru_nsignals,
					 r.ru_msgrcv - Save_r.ru_msgrcv,
					 r.ru_msgsnd - Save_r.ru_msgsnd,
					 r.ru_msgrcv, r.ru_msgsnd);
3334
	appendStringInfo(&str,
3335
		 "!\t%ld/%ld [%ld/%ld] voluntary/involuntary context switches\n",
B
Bruce Momjian 已提交
3336 3337 3338
					 r.ru_nvcsw - Save_r.ru_nvcsw,
					 r.ru_nivcsw - Save_r.ru_nivcsw,
					 r.ru_nvcsw, r.ru_nivcsw);
3339
#endif   /* HAVE_GETRUSAGE */
3340 3341

	bufusage = ShowBufferUsage();
3342
	appendStringInfo(&str, "! buffer usage stats:\n%s", bufusage);
3343 3344 3345
	pfree(bufusage);

	/* remove trailing newline */
B
Bruce Momjian 已提交
3346
	if (str.data[str.len - 1] == '\n')
3347 3348
		str.data[--str.len] = '\0';

3349 3350 3351
	ereport(LOG,
			(errmsg_internal("%s", title),
			 errdetail("%s", str.data)));
3352 3353

	pfree(str.data);
3354
}
3355 3356 3357 3358

/*
 * on_proc_exit handler to log end of session
 */
B
Bruce Momjian 已提交
3359
static void
3360
log_disconnections(int code, Datum arg)
3361
{
B
Bruce Momjian 已提交
3362
	Port	   *port = MyProcPort;
3363
	struct timeval end;
B
Bruce Momjian 已提交
3364 3365 3366 3367 3368 3369 3370 3371 3372 3373 3374 3375 3376
	int			hours,
				minutes,
				seconds;

	char		session_time[20];
	char		uname[6 + NAMEDATALEN];
	char		dbname[10 + NAMEDATALEN];
	char		remote_host[7 + NI_MAXHOST];
	char		remote_port[7 + NI_MAXSERV];

	snprintf(uname, sizeof(uname), " user=%s", port->user_name);
	snprintf(dbname, sizeof(dbname), " database=%s", port->database_name);
	snprintf(remote_host, sizeof(remote_host), " host=%s",
3377
			 port->remote_host);
B
Bruce Momjian 已提交
3378
	snprintf(remote_port, sizeof(remote_port), " port=%s", port->remote_port);
3379 3380


B
Bruce Momjian 已提交
3381
	gettimeofday(&end, NULL);
3382 3383 3384 3385 3386 3387 3388 3389 3390 3391 3392 3393 3394 3395 3396 3397 3398

	if (end.tv_usec < port->session_start.tv_usec)
	{
		end.tv_sec--;
		end.tv_usec += 1000000;
	}
	end.tv_sec -= port->session_start.tv_sec;
	end.tv_usec -= port->session_start.tv_usec;

	hours = end.tv_sec / 3600;
	end.tv_sec %= 3600;
	minutes = end.tv_sec / 60;
	seconds = end.tv_sec % 60;

	/* if time has gone backwards for some reason say so, or print time */

	if (end.tv_sec < 0)
B
Bruce Momjian 已提交
3399
		snprintf(session_time, sizeof(session_time), "negative!");
3400
	else
B
Bruce Momjian 已提交
3401 3402 3403 3404 3405

		/*
		 * for stricter accuracy here we could round - this is close
		 * enough
		 */
3406
		snprintf(session_time, sizeof(session_time),
B
Bruce Momjian 已提交
3407 3408 3409
				 "%d:%02d:%02d.%02d",
				 hours, minutes, seconds, (int) (end.tv_usec / 10000));

3410
	ereport(
B
Bruce Momjian 已提交
3411 3412 3413
			LOG,
			(errmsg("disconnection: session time: %s%s%s%s%s",
				session_time, uname, dbname, remote_host, remote_port)));
3414 3415

}