execMain.c 52.5 KB
Newer Older
1 2
/*-------------------------------------------------------------------------
 *
 * execMain.c
 *	  top level executor interface routines
 *
 * INTERFACE ROUTINES
 *	ExecutorStart()
 *	ExecutorRun()
 *	ExecutorEnd()
 *
 *	The old ExecutorMain() has been replaced by ExecutorStart(),
 *	ExecutorRun() and ExecutorEnd()
 *
 *	These three procedures are the external interfaces to the executor.
 *	In each case, the query descriptor is required as an argument.
 *
 *	ExecutorStart() must be called at the beginning of execution of any
 *	query plan and ExecutorEnd() should always be called at the end of
 *	execution of a plan.
 *
 *	ExecutorRun accepts direction and count arguments that specify whether
 *	the plan is to be executed forwards, backwards, and for how many tuples.
 *
 * Portions Copyright (c) 1996-2002, PostgreSQL Global Development Group
 * Portions Copyright (c) 1994, Regents of the University of California
 *
 *
 * IDENTIFICATION
 *	  $Header: /cvsroot/pgsql/src/backend/executor/execMain.c,v 1.201 2003/03/10 03:53:49 tgl Exp $
 *
 *-------------------------------------------------------------------------
 */
33 34
#include "postgres.h"

35 36
#include "access/heapam.h"
#include "catalog/heap.h"
37
#include "catalog/namespace.h"
38
#include "commands/tablecmds.h"
39
#include "commands/trigger.h"
B
Bruce Momjian 已提交
40 41 42 43 44 45
#include "executor/execdebug.h"
#include "executor/execdefs.h"
#include "miscadmin.h"
#include "optimizer/var.h"
#include "parser/parsetree.h"
#include "utils/acl.h"
46
#include "utils/lsyscache.h"
47

48

49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64
/*
 * execRowMark: one entry per relation listed in the query's rowMarks
 * (relations selected FOR UPDATE).  InitPlan builds these and appends them
 * to estate->es_rowMark; ExecEndPlan closes each relation again while
 * keeping its lock.
 */
typedef struct execRowMark
{
	Relation	relation;		/* the relation, opened with RowShareLock */
	Index		rti;			/* its range table index */
	char		resname[32];	/* "ctid%u" formatted with rti */
} execRowMark;

/*
 * evalPlanQual: state for one PlanQual plan.  Entries are chained to each
 * other through the next/free pointers below; estate->es_evalPlanQual is
 * NULL while EvalPlanQual is not active.
 */
typedef struct evalPlanQual
{
	Index		rti;			/* NOTE(review): presumably the range table
								 * index this entry was started for --
								 * confirm against EvalPlanQual */
	EState	   *estate;			/* NOTE(review): presumably the executor
								 * state used to run this PlanQual plan */
	PlanState  *planstate;		/* NOTE(review): presumably the plan state
								 * tree executed under that estate */
	struct evalPlanQual *next;	/* stack of active PlanQual plans */
	struct evalPlanQual *free;	/* list of free PlanQual plans */
} evalPlanQual;

65
/* decls for local routines only used within this module */
66
static void InitPlan(QueryDesc *queryDesc);
67
static void initResultRelInfo(ResultRelInfo *resultRelInfo,
B
Bruce Momjian 已提交
68 69 70
				  Index resultRelationIndex,
				  List *rangeTable,
				  CmdType operation);
71
static TupleTableSlot *ExecutePlan(EState *estate, PlanState *planstate,
B
Bruce Momjian 已提交
72 73 74 75
			CmdType operation,
			long numberTuples,
			ScanDirection direction,
			DestReceiver *destfunc);
76
static void ExecSelect(TupleTableSlot *slot,
B
Bruce Momjian 已提交
77 78
		   DestReceiver *destfunc,
		   EState *estate);
79
static void ExecInsert(TupleTableSlot *slot, ItemPointer tupleid,
B
Bruce Momjian 已提交
80
		   EState *estate);
81
static void ExecDelete(TupleTableSlot *slot, ItemPointer tupleid,
B
Bruce Momjian 已提交
82
		   EState *estate);
83
static void ExecUpdate(TupleTableSlot *slot, ItemPointer tupleid,
B
Bruce Momjian 已提交
84
		   EState *estate);
85
static TupleTableSlot *EvalPlanQualNext(EState *estate);
86
static void EndEvalPlanQual(EState *estate);
87
static void ExecCheckRTEPerms(RangeTblEntry *rte, CmdType operation);
88
static void ExecCheckXactReadOnly(Query *parsetree, CmdType operation);
89 90 91
static void EvalPlanQualStart(evalPlanQual *epq, EState *estate,
							  evalPlanQual *priorepq);
static void EvalPlanQualStop(evalPlanQual *epq);
92

93 94
/* end of local decls */

95

96
/* ----------------------------------------------------------------
97 98 99 100 101
 *		ExecutorStart
 *
 *		This routine must be called at the beginning of any execution of any
 *		query plan
 *
102 103 104 105
 * Takes a QueryDesc previously created by CreateQueryDesc (it's not real
 * clear why we bother to separate the two functions, but...).  The tupDesc
 * field of the QueryDesc is filled in to describe the tuples that will be
 * returned, and the internal fields (estate and planstate) are set up.
106
 *
107 108
 * NB: the CurrentMemoryContext when this is called will become the parent
 * of the per-query context used for this Executor invocation.
109 110
 * ----------------------------------------------------------------
 */
111 112
void
ExecutorStart(QueryDesc *queryDesc)
113
{
114
	EState	   *estate;
115
	MemoryContext oldcontext;
116

117
	/* sanity checks: queryDesc must not be started already */
118
	Assert(queryDesc != NULL);
119 120 121
	Assert(queryDesc->estate == NULL);

	/*
122
	 * Build EState, switch into per-query memory context for startup.
123 124 125 126
	 */
	estate = CreateExecutorState();
	queryDesc->estate = estate;

127 128 129 130 131
	oldcontext = MemoryContextSwitchTo(estate->es_query_cxt);

	/*
	 * Fill in parameters, if any, from queryDesc
	 */
132
	estate->es_param_list_info = queryDesc->params;
133

V
Vadim B. Mikheev 已提交
134
	if (queryDesc->plantree->nParamExec > 0)
135
		estate->es_param_exec_vals = (ParamExecData *)
136
			palloc0(queryDesc->plantree->nParamExec * sizeof(ParamExecData));
137

138 139
	estate->es_instrument = queryDesc->doInstrument;

140
	/*
141 142
	 * Make our own private copy of the current query snapshot data.
	 *
B
Bruce Momjian 已提交
143 144 145
	 * This "freezes" our idea of which tuples are good and which are not for
	 * the life of this query, even if it outlives the current command and
	 * current snapshot.
146
	 */
147
	estate->es_snapshot = CopyQuerySnapshot();
148

149
	/*
150
	 * Initialize the plan state tree
151
	 */
152
	InitPlan(queryDesc);
153 154

	MemoryContextSwitchTo(oldcontext);
155 156 157
}

/* ----------------------------------------------------------------
158 159 160 161 162 163 164
 *		ExecutorRun
 *
 *		This is the main routine of the executor module. It accepts
 *		the query descriptor from the traffic cop and executes the
 *		query plan.
 *
 *		ExecutorStart must have been called already.
165
 *
166 167 168
 *		If direction is NoMovementScanDirection then nothing is done
 *		except to start up/shut down the destination.  Otherwise,
 *		we retrieve up to 'count' tuples in the specified direction.
169
 *
170
 *		Note: count = 0 is interpreted as no portal limit, i.e., run to
171
 *		completion.
172
 *
173 174
 * ----------------------------------------------------------------
 */
175
TupleTableSlot *
176
ExecutorRun(QueryDesc *queryDesc,
177
			ScanDirection direction, long count)
178
{
179
	EState	   *estate;
180
	CmdType		operation;
B
Bruce Momjian 已提交
181 182
	CommandDest dest;
	DestReceiver *destfunc;
183
	TupleTableSlot *result;
184 185 186 187 188 189 190 191
	MemoryContext oldcontext;

	/* sanity checks */
	Assert(queryDesc != NULL);

	estate = queryDesc->estate;

	Assert(estate != NULL);
192

B
Bruce Momjian 已提交
193
	/*
194
	 * Switch into per-query memory context
195
	 */
196
	oldcontext = MemoryContextSwitchTo(estate->es_query_cxt);
197

B
Bruce Momjian 已提交
198
	/*
B
Bruce Momjian 已提交
199 200
	 * extract information from the query descriptor and the query
	 * feature.
201
	 */
202 203 204
	operation = queryDesc->operation;
	dest = queryDesc->dest;

205 206 207 208 209 210 211 212
	/*
	 * If the transaction is read-only, we need to check if any writes
	 * are planned to non-temporary tables.  This is done here at this
	 * rather late stage so that we can handle EXPLAIN vs. EXPLAIN
	 * ANALYZE easily.
	 */
	ExecCheckXactReadOnly(queryDesc->parsetree, operation);

B
Bruce Momjian 已提交
213
	/*
214
	 * startup tuple receiver
215
	 */
216 217
	estate->es_processed = 0;
	estate->es_lastoid = InvalidOid;
218

219 220 221
	destfunc = DestToFunction(dest);
	(*destfunc->setup) (destfunc, (int) operation,
						queryDesc->portalName, queryDesc->tupDesc);
222

223 224 225 226 227 228 229
	/*
	 * run plan
	 */
	if (direction == NoMovementScanDirection)
		result = NULL;
	else
		result = ExecutePlan(estate,
230
							 queryDesc->planstate,
231 232 233 234
							 operation,
							 count,
							 direction,
							 destfunc);
235

236 237 238
	/*
	 * shutdown receiver
	 */
239 240
	(*destfunc->cleanup) (destfunc);

241 242
	MemoryContextSwitchTo(oldcontext);

243
	return result;
244 245 246
}

/* ----------------------------------------------------------------
247 248
 *		ExecutorEnd
 *
249
 *		This routine must be called at the end of execution of any
250
 *		query plan
251 252 253
 * ----------------------------------------------------------------
 */
void
254
ExecutorEnd(QueryDesc *queryDesc)
255
{
256
	EState	   *estate;
257
	MemoryContext oldcontext;
258

259 260
	/* sanity checks */
	Assert(queryDesc != NULL);
261

262 263
	estate = queryDesc->estate;

264
	Assert(estate != NULL);
265

266
	/*
267
	 * Switch into per-query memory context to run ExecEndPlan
268
	 */
269 270 271
	oldcontext = MemoryContextSwitchTo(estate->es_query_cxt);

	ExecEndPlan(queryDesc->planstate, estate);
272

273
	/*
274
	 * Must switch out of context before destroying it
275
	 */
276
	MemoryContextSwitchTo(oldcontext);
277

278
	/*
279 280
	 * Release EState and per-query memory context.  This should release
	 * everything the executor has allocated.
281
	 */
282 283 284 285 286 287
	FreeExecutorState(estate);

	/* Reset queryDesc fields that no longer point to anything */
	queryDesc->tupDesc = NULL;
	queryDesc->estate = NULL;
	queryDesc->planstate = NULL;
288
}
289

290

291 292 293 294
/*
 * ExecCheckRTPerms
 *		Check access permissions for all relations listed in a range table.
 */
295
void
296
ExecCheckRTPerms(List *rangeTable, CmdType operation)
297 298 299 300
{
	List	   *lp;

	foreach(lp, rangeTable)
301
	{
302 303
		RangeTblEntry *rte = lfirst(lp);

304
		ExecCheckRTEPerms(rte, operation);
305 306 307 308 309 310 311 312
	}
}

/*
 * ExecCheckRTEPerms
 *		Check access permissions for a single RTE.
 */
static void
313
ExecCheckRTEPerms(RangeTblEntry *rte, CmdType operation)
314
{
315
	Oid			relOid;
316
	AclId		userid;
317
	AclResult	aclcheck_result;
318

B
Bruce Momjian 已提交
319
	/*
320 321 322 323 324 325 326 327 328 329 330 331
	 * If it's a subquery, recursively examine its rangetable.
	 */
	if (rte->rtekind == RTE_SUBQUERY)
	{
		ExecCheckRTPerms(rte->subquery->rtable, operation);
		return;
	}

	/*
	 * Otherwise, only plain-relation RTEs need to be checked here.
	 * Function RTEs are checked by init_fcache when the function is prepared
	 * for execution. Join and special RTEs need no checks.
B
Bruce Momjian 已提交
332
	 */
333
	if (rte->rtekind != RTE_RELATION)
334 335
		return;

336
	relOid = rte->relid;
337 338

	/*
B
Bruce Momjian 已提交
339 340
	 * userid to check as: current user unless we have a setuid
	 * indication.
341
	 *
B
Bruce Momjian 已提交
342 343
	 * Note: GetUserId() is presently fast enough that there's no harm in
	 * calling it separately for each RTE.	If that stops being true, we
344
	 * could call it once in ExecCheckRTPerms and pass the userid down
B
Bruce Momjian 已提交
345
	 * from there.	But for now, no need for the extra clutter.
346
	 */
347
	userid = rte->checkAsUser ? rte->checkAsUser : GetUserId();
348

349
#define CHECK(MODE)		pg_class_aclcheck(relOid, userid, MODE)
350

351
	if (rte->checkForRead)
352
	{
353
		aclcheck_result = CHECK(ACL_SELECT);
354
		if (aclcheck_result != ACLCHECK_OK)
355
			aclcheck_error(aclcheck_result, get_rel_name(relOid));
356 357 358 359 360 361 362 363 364
	}

	if (rte->checkForWrite)
	{
		/*
		 * Note: write access in a SELECT context means SELECT FOR UPDATE.
		 * Right now we don't distinguish that from true update as far as
		 * permissions checks are concerned.
		 */
365 366 367
		switch (operation)
		{
			case CMD_INSERT:
368
				aclcheck_result = CHECK(ACL_INSERT);
369
				break;
370
			case CMD_SELECT:
371
			case CMD_UPDATE:
372 373 374 375
				aclcheck_result = CHECK(ACL_UPDATE);
				break;
			case CMD_DELETE:
				aclcheck_result = CHECK(ACL_DELETE);
376 377 378 379
				break;
			default:
				elog(ERROR, "ExecCheckRTEPerms: bogus operation %d",
					 operation);
380
				aclcheck_result = ACLCHECK_OK;	/* keep compiler quiet */
381 382
				break;
		}
383
		if (aclcheck_result != ACLCHECK_OK)
384
			aclcheck_error(aclcheck_result, get_rel_name(relOid));
385
	}
386 387
}

388

389 390 391 392 393 394 395
/* ===============================================================
 * ===============================================================
						 static routines follow
 * ===============================================================
 * ===============================================================
 */

396

397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421
/*
 * ExecCheckXactReadOnly
 *		When XactReadOnly is set, raise an error if the query would write:
 *		either a SELECT with an INTO target, or an INSERT/UPDATE/DELETE
 *		whose range table holds a plain relation marked checkForWrite
 *		that is not in a temp namespace.  Does nothing otherwise.
 */
static void
ExecCheckXactReadOnly(Query *parsetree, CmdType operation)
{
	bool		writesPermanentData = false;

	if (!XactReadOnly)
		return;

	if (operation == CMD_SELECT && parsetree->into != NULL)
	{
		/* CREATE TABLE AS or SELECT INTO */
		writesPermanentData = true;
	}
	else if (operation == CMD_DELETE ||
			 operation == CMD_INSERT ||
			 operation == CMD_UPDATE)
	{
		List	   *cell;

		foreach(cell, parsetree->rtable)
		{
			RangeTblEntry *entry = lfirst(cell);

			/* only a written-to, non-temp plain relation is a violation */
			if (entry->rtekind == RTE_RELATION &&
				entry->checkForWrite &&
				!isTempNamespace(get_rel_namespace(entry->relid)))
			{
				writesPermanentData = true;
				break;
			}
		}
	}

	if (writesPermanentData)
		elog(ERROR, "transaction is read-only");
}


436
/* ----------------------------------------------------------------
437 438 439 440
 *		InitPlan
 *
 *		Initializes the query plan: open files, allocate storage
 *		and start up the rule manager
441 442
 * ----------------------------------------------------------------
 */
443 444
static void
InitPlan(QueryDesc *queryDesc)
445
{
446 447 448 449 450
	CmdType		operation = queryDesc->operation;
	Query *parseTree = queryDesc->parsetree;
	Plan *plan = queryDesc->plantree;
	EState *estate = queryDesc->estate;
	PlanState  *planstate;
B
Bruce Momjian 已提交
451 452
	List	   *rangeTable;
	Relation	intoRelationDesc;
453
	bool		do_select_into;
B
Bruce Momjian 已提交
454
	TupleDesc	tupType;
455

456
	/*
457 458 459
	 * Do permissions checks.  It's sufficient to examine the query's
	 * top rangetable here --- subplan RTEs will be checked during
	 * ExecInitSubPlan().
460
	 */
461
	ExecCheckRTPerms(parseTree->rtable, operation);
462

B
Bruce Momjian 已提交
463
	/*
B
Bruce Momjian 已提交
464
	 * get information from query descriptor
465
	 */
466
	rangeTable = parseTree->rtable;
467

B
Bruce Momjian 已提交
468
	/*
B
Bruce Momjian 已提交
469
	 * initialize the node's execution state
470
	 */
471 472
	estate->es_range_table = rangeTable;

B
Bruce Momjian 已提交
473
	/*
474
	 * if there is a result relation, initialize result relation stuff
475
	 */
476
	if (parseTree->resultRelation != 0 && operation != CMD_SELECT)
477
	{
478 479 480
		List	   *resultRelations = parseTree->resultRelations;
		int			numResultRelations;
		ResultRelInfo *resultRelInfos;
B
Bruce Momjian 已提交
481

482 483 484 485 486 487 488
		if (resultRelations != NIL)
		{
			/*
			 * Multiple result relations (due to inheritance)
			 * parseTree->resultRelations identifies them all
			 */
			ResultRelInfo *resultRelInfo;
489

490 491 492 493 494 495 496 497 498 499 500 501 502 503 504 505 506
			numResultRelations = length(resultRelations);
			resultRelInfos = (ResultRelInfo *)
				palloc(numResultRelations * sizeof(ResultRelInfo));
			resultRelInfo = resultRelInfos;
			while (resultRelations != NIL)
			{
				initResultRelInfo(resultRelInfo,
								  lfirsti(resultRelations),
								  rangeTable,
								  operation);
				resultRelInfo++;
				resultRelations = lnext(resultRelations);
			}
		}
		else
		{
			/*
B
Bruce Momjian 已提交
507 508
			 * Single result relation identified by
			 * parseTree->resultRelation
509 510 511 512 513 514 515 516
			 */
			numResultRelations = 1;
			resultRelInfos = (ResultRelInfo *) palloc(sizeof(ResultRelInfo));
			initResultRelInfo(resultRelInfos,
							  parseTree->resultRelation,
							  rangeTable,
							  operation);
		}
517

518 519 520 521
		estate->es_result_relations = resultRelInfos;
		estate->es_num_result_relations = numResultRelations;
		/* Initialize to first or only result rel */
		estate->es_result_relation_info = resultRelInfos;
522
	}
523 524
	else
	{
B
Bruce Momjian 已提交
525
		/*
B
Bruce Momjian 已提交
526
		 * if no result relation, then set state appropriately
527
		 */
528 529
		estate->es_result_relations = NULL;
		estate->es_num_result_relations = 0;
530 531 532
		estate->es_result_relation_info = NULL;
	}

533 534 535 536 537 538 539
	/*
	 * Detect whether we're doing SELECT INTO.  If so, set the force_oids
	 * flag appropriately so that the plan tree will be initialized with
	 * the correct tuple descriptors.
	 */
	do_select_into = false;

540
	if (operation == CMD_SELECT && parseTree->into != NULL)
541 542 543 544 545 546 547 548 549 550
	{
		do_select_into = true;
		/*
		 * For now, always create OIDs in SELECT INTO; this is for backwards
		 * compatibility with pre-7.3 behavior.  Eventually we might want
		 * to allow the user to choose.
		 */
		estate->es_force_oids = true;
	}

551 552 553
	/*
	 * Have to lock relations selected for update
	 */
554 555
	estate->es_rowMark = NIL;
	if (parseTree->rowMarks != NIL)
556
	{
B
Bruce Momjian 已提交
557
		List	   *l;
558

559
		foreach(l, parseTree->rowMarks)
560
		{
561 562
			Index		rti = lfirsti(l);
			Oid			relid = getrelid(rti, rangeTable);
563 564 565 566
			Relation	relation;
			execRowMark *erm;

			relation = heap_open(relid, RowShareLock);
B
Bruce Momjian 已提交
567
			erm = (execRowMark *) palloc(sizeof(execRowMark));
568
			erm->relation = relation;
569
			erm->rti = rti;
570
			snprintf(erm->resname, 32, "ctid%u", rti);
571 572 573
			estate->es_rowMark = lappend(estate->es_rowMark, erm);
		}
	}
574

B
Bruce Momjian 已提交
575
	/*
576
	 * initialize the executor "tuple" table.  We need slots for all the
577 578 579
	 * plan nodes, plus possibly output slots for the junkfilter(s). At
	 * this point we aren't sure if we need junkfilters, so just add slots
	 * for them unconditionally.
580 581
	 */
	{
582
		int			nSlots = ExecCountSlotsNode(plan);
583

584 585 586 587 588
		if (parseTree->resultRelations != NIL)
			nSlots += length(parseTree->resultRelations);
		else
			nSlots += 1;
		estate->es_tupleTable = ExecCreateTupleTable(nSlots);
589
	}
590

591
	/* mark EvalPlanQual not active */
592
	estate->es_topPlan = plan;
593 594
	estate->es_evalPlanQual = NULL;
	estate->es_evTupleNull = NULL;
595
	estate->es_evTuple = NULL;
596 597
	estate->es_useEvalPlan = false;

B
Bruce Momjian 已提交
598
	/*
B
Bruce Momjian 已提交
599 600
	 * initialize the private state information for all the nodes in the
	 * query tree.	This opens files, allocates storage and leaves us
601
	 * ready to start processing tuples.
602
	 */
603
	planstate = ExecInitNode(plan, estate);
604

B
Bruce Momjian 已提交
605
	/*
606
	 * Get the tuple descriptor describing the type of tuples to return.
B
Bruce Momjian 已提交
607
	 * (this is especially important if we are creating a relation with
608
	 * "SELECT INTO")
609
	 */
610
	tupType = ExecGetTupType(planstate);
611

B
Bruce Momjian 已提交
612
	/*
613 614 615 616 617
	 * Initialize the junk filter if needed.  SELECT and INSERT queries need a
	 * filter if there are any junk attrs in the tlist.  INSERT and SELECT
	 * INTO also need a filter if the top plan node is a scan node that's not
	 * doing projection (else we'll be scribbling on the scan tuple!)  UPDATE
	 * and DELETE always need a filter, since there's always a junk 'ctid'
B
Bruce Momjian 已提交
618
	 * attribute present --- no need to look first.
619 620
	 */
	{
621 622 623
		bool		junk_filter_needed = false;
		List	   *tlist;

624
		switch (operation)
625
		{
626 627
			case CMD_SELECT:
			case CMD_INSERT:
628
				foreach(tlist, plan->targetlist)
629
				{
630 631 632 633 634 635 636
					TargetEntry *tle = (TargetEntry *) lfirst(tlist);

					if (tle->resdom->resjunk)
					{
						junk_filter_needed = true;
						break;
					}
637
				}
638 639 640 641 642 643 644 645 646 647 648 649 650
				if (!junk_filter_needed &&
					(operation == CMD_INSERT || do_select_into))
				{
					if (IsA(planstate, SeqScanState) ||
						IsA(planstate, IndexScanState) ||
						IsA(planstate, TidScanState) ||
						IsA(planstate, SubqueryScanState) ||
						IsA(planstate, FunctionScanState))
					{
						if (planstate->ps_ProjInfo == NULL)
							junk_filter_needed = true;
					}
				}
651 652 653 654 655 656 657
				break;
			case CMD_UPDATE:
			case CMD_DELETE:
				junk_filter_needed = true;
				break;
			default:
				break;
658 659
		}

660
		if (junk_filter_needed)
661
		{
662
			/*
B
Bruce Momjian 已提交
663 664 665 666
			 * If there are multiple result relations, each one needs its
			 * own junk filter.  Note this is only possible for
			 * UPDATE/DELETE, so we can't be fooled by some needing a
			 * filter and some not.
667 668 669
			 */
			if (parseTree->resultRelations != NIL)
			{
670 671
				PlanState **appendplans;
				int			as_nplans;
672
				ResultRelInfo *resultRelInfo;
673
				int			i;
674 675 676 677

				/* Top plan had better be an Append here. */
				Assert(IsA(plan, Append));
				Assert(((Append *) plan)->isTarget);
678 679 680 681
				Assert(IsA(planstate, AppendState));
				appendplans = ((AppendState *) planstate)->appendplans;
				as_nplans = ((AppendState *) planstate)->as_nplans;
				Assert(as_nplans == estate->es_num_result_relations);
682
				resultRelInfo = estate->es_result_relations;
683
				for (i = 0; i < as_nplans; i++)
684
				{
685
					PlanState  *subplan = appendplans[i];
686 687
					JunkFilter *j;

688
					j = ExecInitJunkFilter(subplan->plan->targetlist,
689
										   ExecGetTupType(subplan),
690
							  ExecAllocTableSlot(estate->es_tupleTable));
691 692 693
					resultRelInfo->ri_junkFilter = j;
					resultRelInfo++;
				}
B
Bruce Momjian 已提交
694

695 696 697 698 699 700 701 702 703 704
				/*
				 * Set active junkfilter too; at this point ExecInitAppend
				 * has already selected an active result relation...
				 */
				estate->es_junkFilter =
					estate->es_result_relation_info->ri_junkFilter;
			}
			else
			{
				/* Normal case with just one JunkFilter */
705
				JunkFilter *j;
706

707
				j = ExecInitJunkFilter(planstate->plan->targetlist,
708
									   tupType,
709
							  ExecAllocTableSlot(estate->es_tupleTable));
710 711 712
				estate->es_junkFilter = j;
				if (estate->es_result_relation_info)
					estate->es_result_relation_info->ri_junkFilter = j;
713

714 715 716 717
				/* For SELECT, want to return the cleaned tuple type */
				if (operation == CMD_SELECT)
					tupType = j->jf_cleanTupType;
			}
718 719 720 721
		}
		else
			estate->es_junkFilter = NULL;
	}
722

B
Bruce Momjian 已提交
723
	/*
724 725 726
	 * If doing SELECT INTO, initialize the "into" relation.  We must wait
	 * till now so we have the "clean" result tuple type to create the
	 * new table from.
727 728 729
	 */
	intoRelationDesc = (Relation) NULL;

730
	if (do_select_into)
731
	{
732 733 734 735 736
		char	   *intoName;
		Oid			namespaceId;
		AclResult	aclresult;
		Oid			intoRelationId;
		TupleDesc	tupdesc;
737

738 739 740 741 742
		/*
		 * find namespace to create in, check permissions
		 */
		intoName = parseTree->into->relname;
		namespaceId = RangeVarGetCreationNamespace(parseTree->into);
743

744 745 746 747
		aclresult = pg_namespace_aclcheck(namespaceId, GetUserId(),
										  ACL_CREATE);
		if (aclresult != ACLCHECK_OK)
			aclcheck_error(aclresult, get_namespace_name(namespaceId));
748

749 750 751 752
		/*
		 * have to copy tupType to get rid of constraints
		 */
		tupdesc = CreateTupleDescCopy(tupType);
753

754 755 756 757 758 759 760
		intoRelationId = heap_create_with_catalog(intoName,
												  namespaceId,
												  tupdesc,
												  RELKIND_RELATION,
												  false,
												  ONCOMMIT_NOOP,
												  allowSystemTableMods);
761

762
		FreeTupleDesc(tupdesc);
763

764 765 766 767 768
		/*
		 * Advance command counter so that the newly-created
		 * relation's catalog tuples will be visible to heap_open.
		 */
		CommandCounterIncrement();
769

770 771 772 773 774 775 776
		/*
		 * If necessary, create a TOAST table for the into
		 * relation. Note that AlterTableCreateToastTable ends
		 * with CommandCounterIncrement(), so that the TOAST table
		 * will be visible for insertion.
		 */
		AlterTableCreateToastTable(intoRelationId, true);
777

778 779 780 781
		/*
		 * And open the constructed table for writing.
		 */
		intoRelationDesc = heap_open(intoRelationId, AccessExclusiveLock);
782 783 784 785
	}

	estate->es_into_relation_descriptor = intoRelationDesc;

786 787
	queryDesc->tupDesc = tupType;
	queryDesc->planstate = planstate;
788 789
}

790 791 792 793 794 795 796 797 798 799 800 801 802 803 804 805 806 807 808 809 810 811 812 813 814 815 816 817 818 819 820 821 822 823 824 825 826 827
/*
 * initResultRelInfo
 *		Fill in *resultRelInfo for the result relation found at
 *		resultRelationIndex in rangeTable.
 *
 * The relation is opened with RowExclusiveLock.  Sequences, toast
 * relations and views are rejected with an error.  Indexes are opened
 * only when the relation has any and the operation is not a DELETE.
 */
static void
initResultRelInfo(ResultRelInfo *resultRelInfo,
				  Index resultRelationIndex,
				  List *rangeTable,
				  CmdType operation)
{
	Oid			relid = getrelid(resultRelationIndex, rangeTable);
	Relation	rel = heap_open(relid, RowExclusiveLock);

	/* Refuse relation kinds that may not be the target of a change. */
	if (rel->rd_rel->relkind == RELKIND_SEQUENCE)
		elog(ERROR, "You can't change sequence relation %s",
			 RelationGetRelationName(rel));
	else if (rel->rd_rel->relkind == RELKIND_TOASTVALUE)
		elog(ERROR, "You can't change toast relation %s",
			 RelationGetRelationName(rel));
	else if (rel->rd_rel->relkind == RELKIND_VIEW)
		elog(ERROR, "You can't change view relation %s",
			 RelationGetRelationName(rel));

	/* Start from an all-zero struct, then set each field explicitly. */
	MemSet(resultRelInfo, 0, sizeof(ResultRelInfo));
	resultRelInfo->type = T_ResultRelInfo;
	resultRelInfo->ri_RangeTableIndex = resultRelationIndex;
	resultRelInfo->ri_RelationDesc = rel;

	/* no index information until ExecOpenIndices is called below */
	resultRelInfo->ri_NumIndices = 0;
	resultRelInfo->ri_IndexRelationDescs = NULL;
	resultRelInfo->ri_IndexRelationInfo = NULL;

	/* make a copy so as not to depend on relcache info not changing... */
	resultRelInfo->ri_TrigDesc = CopyTriggerDesc(rel->trigdesc);
	resultRelInfo->ri_TrigFunctions = NULL;
	resultRelInfo->ri_ConstraintExprs = NULL;
	resultRelInfo->ri_junkFilter = NULL;

	/*
	 * If the relation has indices, open them and save their descriptors in
	 * the result relation info, so that index entries can be added for the
	 * tuples we add/update.  A DELETE does not need this, since deletion
	 * doesn't affect indexes.
	 */
	if (rel->rd_rel->relhasindex && operation != CMD_DELETE)
		ExecOpenIndices(resultRelInfo);
}

845
/* ----------------------------------------------------------------
846
 *		ExecEndPlan
847
 *
848
 *		Cleans up the query plan -- closes files and frees up storage
849 850 851 852 853 854
 *
 * NOTE: we are no longer very worried about freeing storage per se
 * in this code; FreeExecutorState should be guaranteed to release all
 * memory that needs to be released.  What we are worried about doing
 * is closing relations and dropping buffer pins.  Thus, for example,
 * tuple tables must be cleared or dropped to ensure pins are released.
855 856
 * ----------------------------------------------------------------
 */
857 858
void
ExecEndPlan(PlanState *planstate, EState *estate)
859
{
860 861
	ResultRelInfo *resultRelInfo;
	int			i;
862
	List	   *l;
863

864 865 866 867 868 869
	/*
	 * shut down any PlanQual processing we were doing
	 */
	if (estate->es_evalPlanQual != NULL)
		EndEvalPlanQual(estate);

B
Bruce Momjian 已提交
870
	/*
871
	 * shut down the node-type-specific query processing
872
	 */
873
	ExecEndNode(planstate);
874

B
Bruce Momjian 已提交
875
	/*
B
Bruce Momjian 已提交
876
	 * destroy the executor "tuple" table.
877
	 */
878 879
	ExecDropTupleTable(estate->es_tupleTable, true);
	estate->es_tupleTable = NULL;
880

B
Bruce Momjian 已提交
881
	/*
B
Bruce Momjian 已提交
882
	 * close the result relation(s) if any, but hold locks until xact
883
	 * commit.
884
	 */
885 886
	resultRelInfo = estate->es_result_relations;
	for (i = estate->es_num_result_relations; i > 0; i--)
887
	{
888 889 890 891
		/* Close indices and then the relation itself */
		ExecCloseIndices(resultRelInfo);
		heap_close(resultRelInfo->ri_RelationDesc, NoLock);
		resultRelInfo++;
892 893
	}

B
Bruce Momjian 已提交
894
	/*
895
	 * close the "into" relation if necessary, again keeping lock
896
	 */
897 898
	if (estate->es_into_relation_descriptor != NULL)
		heap_close(estate->es_into_relation_descriptor, NoLock);
899 900 901 902 903 904 905 906 907 908

	/*
	 * close any relations selected FOR UPDATE, again keeping locks
	 */
	foreach(l, estate->es_rowMark)
	{
		execRowMark *erm = lfirst(l);

		heap_close(erm->relation, NoLock);
	}
909 910 911
}

/* ----------------------------------------------------------------
912 913
 *		ExecutePlan
 *
914
 *		processes the query plan to retrieve 'numberTuples' tuples in the
915
 *		direction specified.
916
 *
917
 *		Retrieves all tuples if numberTuples is 0
918
 *
919
 *		result is either a slot containing the last tuple in the case
920
 *		of a SELECT or NULL otherwise.
921
 *
922 923
 * Note: the ctid attribute is a 'junk' attribute that is removed before the
 * user can see it
924 925 926
 * ----------------------------------------------------------------
 */
static TupleTableSlot *
927
ExecutePlan(EState *estate,
928
			PlanState *planstate,
929
			CmdType operation,
930
			long numberTuples,
931
			ScanDirection direction,
932
			DestReceiver *destfunc)
933
{
934 935 936 937 938 939
	JunkFilter			*junkfilter;
	TupleTableSlot		*slot;
	ItemPointer			 tupleid = NULL;
	ItemPointerData		 tuple_ctid;
	long				 current_tuple_count;
	TupleTableSlot		*result;
940

B
Bruce Momjian 已提交
941
	/*
B
Bruce Momjian 已提交
942
	 * initialize local variables
943
	 */
944 945 946 947
	slot = NULL;
	current_tuple_count = 0;
	result = NULL;

B
Bruce Momjian 已提交
948 949
	/*
	 * Set the direction.
950
	 */
951 952
	estate->es_direction = direction;

953 954 955 956 957 958 959 960 961 962 963 964 965 966 967 968
	/*
	 * Process BEFORE EACH STATEMENT triggers
	 */
	switch (operation)
	{
		case CMD_UPDATE:
			ExecBSUpdateTriggers(estate, estate->es_result_relation_info);
			break;
		case CMD_DELETE:
			ExecBSDeleteTriggers(estate, estate->es_result_relation_info);
			break;
		case CMD_INSERT:
			ExecBSInsertTriggers(estate, estate->es_result_relation_info);
			break;
		default:
			/* do nothing */
969
			break;
970 971
	}

B
Bruce Momjian 已提交
972
	/*
B
Bruce Momjian 已提交
973
	 * Loop until we've processed the proper number of tuples from the
974
	 * plan.
975 976 977 978
	 */

	for (;;)
	{
979 980
		/* Reset the per-output-tuple exprcontext */
		ResetPerTupleExprContext(estate);
B
Bruce Momjian 已提交
981

B
Bruce Momjian 已提交
982
		/*
B
Bruce Momjian 已提交
983
		 * Execute the plan and obtain a tuple
984
		 */
B
Bruce Momjian 已提交
985
lnext:	;
986 987 988 989
		if (estate->es_useEvalPlan)
		{
			slot = EvalPlanQualNext(estate);
			if (TupIsNull(slot))
990
				slot = ExecProcNode(planstate);
991 992
		}
		else
993
			slot = ExecProcNode(planstate);
994

B
Bruce Momjian 已提交
995
		/*
B
Bruce Momjian 已提交
996 997
		 * if the tuple is null, then we assume there is nothing more to
		 * process so we just return null...
998 999 1000 1001 1002
		 */
		if (TupIsNull(slot))
		{
			result = NULL;
			break;
1003 1004
		}

B
Bruce Momjian 已提交
1005
		/*
B
Bruce Momjian 已提交
1006 1007
		 * if we have a junk filter, then project a new tuple with the
		 * junk removed.
1008
		 *
1009 1010 1011
		 * Store this new "clean" tuple in the junkfilter's resultSlot.
		 * (Formerly, we stored it back over the "dirty" tuple, which is
		 * WRONG because that tuple slot has the wrong descriptor.)
1012
		 *
B
Bruce Momjian 已提交
1013
		 * Also, extract all the junk information we need.
1014 1015 1016
		 */
		if ((junkfilter = estate->es_junkFilter) != (JunkFilter *) NULL)
		{
1017 1018 1019
			Datum		datum;
			HeapTuple	newTuple;
			bool		isNull;
1020

B
Bruce Momjian 已提交
1021
			/*
1022 1023 1024 1025 1026 1027 1028 1029 1030
			 * extract the 'ctid' junk attribute.
			 */
			if (operation == CMD_UPDATE || operation == CMD_DELETE)
			{
				if (!ExecGetJunkAttribute(junkfilter,
										  slot,
										  "ctid",
										  &datum,
										  &isNull))
1031
					elog(ERROR, "ExecutePlan: NO (junk) `ctid' was found!");
1032

1033
				/* shouldn't ever get a null result... */
1034
				if (isNull)
1035
					elog(ERROR, "ExecutePlan: (junk) `ctid' is NULL!");
1036 1037 1038 1039 1040 1041

				tupleid = (ItemPointer) DatumGetPointer(datum);
				tuple_ctid = *tupleid;	/* make sure we don't free the
										 * ctid!! */
				tupleid = &tuple_ctid;
			}
1042
			else if (estate->es_rowMark != NIL)
1043
			{
B
Bruce Momjian 已提交
1044
				List	   *l;
1045

B
Bruce Momjian 已提交
1046 1047
		lmark:	;
				foreach(l, estate->es_rowMark)
1048
				{
1049 1050 1051 1052 1053 1054
					execRowMark *erm = lfirst(l);
					Buffer		buffer;
					HeapTupleData tuple;
					TupleTableSlot *newSlot;
					int			test;

1055 1056 1057 1058 1059
					if (!ExecGetJunkAttribute(junkfilter,
											  slot,
											  erm->resname,
											  &datum,
											  &isNull))
1060 1061
						elog(ERROR, "ExecutePlan: NO (junk) `%s' was found!",
							 erm->resname);
1062

1063
					/* shouldn't ever get a null result... */
1064
					if (isNull)
1065 1066
						elog(ERROR, "ExecutePlan: (junk) `%s' is NULL!",
							 erm->resname);
1067 1068

					tuple.t_self = *((ItemPointer) DatumGetPointer(datum));
1069 1070
					test = heap_mark4update(erm->relation, &tuple, &buffer,
											estate->es_snapshot->curcid);
1071 1072 1073 1074
					ReleaseBuffer(buffer);
					switch (test)
					{
						case HeapTupleSelfUpdated:
1075 1076 1077
							/* treat it as deleted; do not process */
							goto lnext;

1078 1079 1080 1081 1082 1083
						case HeapTupleMayBeUpdated:
							break;

						case HeapTupleUpdated:
							if (XactIsoLevel == XACT_SERIALIZABLE)
								elog(ERROR, "Can't serialize access due to concurrent update");
1084
							if (!(ItemPointerEquals(&(tuple.t_self),
B
Bruce Momjian 已提交
1085
								  (ItemPointer) DatumGetPointer(datum))))
1086
							{
B
Bruce Momjian 已提交
1087
								newSlot = EvalPlanQual(estate, erm->rti, &(tuple.t_self));
1088 1089 1090 1091 1092 1093 1094
								if (!(TupIsNull(newSlot)))
								{
									slot = newSlot;
									estate->es_useEvalPlan = true;
									goto lmark;
								}
							}
B
Bruce Momjian 已提交
1095 1096 1097

							/*
							 * if tuple was deleted or PlanQual failed for
1098
							 * updated tuple - we must not return this
B
Bruce Momjian 已提交
1099
							 * tuple!
1100 1101
							 */
							goto lnext;
1102 1103 1104

						default:
							elog(ERROR, "Unknown status %u from heap_mark4update", test);
B
Bruce Momjian 已提交
1105
							return (NULL);
1106 1107 1108
					}
				}
			}
1109

B
Bruce Momjian 已提交
1110
			/*
1111 1112 1113 1114 1115 1116
			 * Finally create a new "clean" tuple with all junk attributes
			 * removed
			 */
			newTuple = ExecRemoveJunk(junkfilter, slot);

			slot = ExecStoreTuple(newTuple,		/* tuple to store */
1117
								  junkfilter->jf_resultSlot,	/* dest slot */
B
Bruce Momjian 已提交
1118 1119
								  InvalidBuffer,		/* this tuple has no
														 * buffer */
1120
								  true);		/* tuple should be pfreed */
1121
		}
1122

B
Bruce Momjian 已提交
1123
		/*
B
Bruce Momjian 已提交
1124 1125
		 * now that we have a tuple, do the appropriate thing with it..
		 * either return it to the user, add it to a relation someplace,
B
Bruce Momjian 已提交
1126
		 * delete it from a relation, or modify some of its attributes.
1127 1128 1129
		 */
		switch (operation)
		{
1130
			case CMD_SELECT:
B
Bruce Momjian 已提交
1131 1132 1133
				ExecSelect(slot,	/* slot containing tuple */
						   destfunc,	/* destination's tuple-receiver
										 * obj */
1134
						   estate);
1135 1136
				result = slot;
				break;
1137

1138
			case CMD_INSERT:
1139
				ExecInsert(slot, tupleid, estate);
1140 1141
				result = NULL;
				break;
1142

1143 1144 1145 1146
			case CMD_DELETE:
				ExecDelete(slot, tupleid, estate);
				result = NULL;
				break;
1147

1148
			case CMD_UPDATE:
1149
				ExecUpdate(slot, tupleid, estate);
1150 1151
				result = NULL;
				break;
1152

1153
			default:
1154
				elog(LOG, "ExecutePlan: unknown operation in queryDesc");
1155
				result = NULL;
1156
				break;
1157
		}
B
Bruce Momjian 已提交
1158

B
Bruce Momjian 已提交
1159
		/*
1160
		 * check our tuple count.. if we've processed the proper number
1161
		 * then quit, else loop again and process more tuples.  Zero
1162
		 * numberTuples means no limit.
1163
		 */
1164
		current_tuple_count++;
1165
		if (numberTuples && numberTuples == current_tuple_count)
1166
			break;
1167
	}
1168

1169 1170 1171 1172 1173 1174 1175 1176 1177 1178 1179 1180 1181 1182 1183 1184
	/*
	 * Process AFTER EACH STATEMENT triggers
	 */
	switch (operation)
	{
		case CMD_UPDATE:
			ExecASUpdateTriggers(estate, estate->es_result_relation_info);
			break;
		case CMD_DELETE:
			ExecASDeleteTriggers(estate, estate->es_result_relation_info);
			break;
		case CMD_INSERT:
			ExecASInsertTriggers(estate, estate->es_result_relation_info);
			break;
		default:
			/* do nothing */
1185
			break;
1186 1187
	}

B
Bruce Momjian 已提交
1188
	/*
B
Bruce Momjian 已提交
1189
	 * here, result is either a slot containing a tuple in the case of a
1190
	 * SELECT or NULL otherwise.
1191
	 */
1192
	return result;
1193 1194 1195
}

/* ----------------------------------------------------------------
1196
 *		ExecSelect
1197
 *
1198
 *		SELECTs are easy.. we just pass the tuple to the appropriate
1199
 *		print function.  The only complexity is when we do a
1200
 *		"SELECT INTO", in which case we insert the tuple into
1201 1202
 *		the appropriate relation (note: this is a newly created relation
 *		so we don't need to worry about indices or locks.)
1203 1204 1205
 * ----------------------------------------------------------------
 */
static void
1206 1207 1208
ExecSelect(TupleTableSlot *slot,
		   DestReceiver *destfunc,
		   EState *estate)
1209
{
1210 1211
	HeapTuple	tuple;
	TupleDesc	attrtype;
1212

B
Bruce Momjian 已提交
1213
	/*
B
Bruce Momjian 已提交
1214
	 * get the heap tuple out of the tuple table slot
1215 1216 1217 1218
	 */
	tuple = slot->val;
	attrtype = slot->ttc_tupleDescriptor;

B
Bruce Momjian 已提交
1219
	/*
B
Bruce Momjian 已提交
1220
	 * insert the tuple into the "into relation"
1221 1222 1223
	 */
	if (estate->es_into_relation_descriptor != NULL)
	{
1224 1225
		heap_insert(estate->es_into_relation_descriptor, tuple,
					estate->es_snapshot->curcid);
1226 1227 1228
		IncrAppended();
	}

B
Bruce Momjian 已提交
1229
	/*
B
Bruce Momjian 已提交
1230
	 * send the tuple to the front end (or the screen)
1231
	 */
1232
	(*destfunc->receiveTuple) (tuple, attrtype, destfunc);
1233 1234
	IncrRetrieved();
	(estate->es_processed)++;
1235 1236 1237
}

/* ----------------------------------------------------------------
1238
 *		ExecInsert
1239
 *
1240
 *		INSERTs are trickier.. we have to insert the tuple into
1241 1242
 *		the base relation and insert appropriate tuples into the
 *		index relations.
1243 1244 1245
 * ----------------------------------------------------------------
 */
static void
1246
ExecInsert(TupleTableSlot *slot,
1247
		   ItemPointer tupleid,
1248
		   EState *estate)
1249
{
1250
	HeapTuple	tuple;
1251
	ResultRelInfo *resultRelInfo;
1252 1253 1254
	Relation	resultRelationDesc;
	int			numIndices;
	Oid			newId;
1255

B
Bruce Momjian 已提交
1256
	/*
B
Bruce Momjian 已提交
1257
	 * get the heap tuple out of the tuple table slot
1258 1259 1260
	 */
	tuple = slot->val;

B
Bruce Momjian 已提交
1261
	/*
1262
	 * get information on the (current) result relation
1263
	 */
1264 1265
	resultRelInfo = estate->es_result_relation_info;
	resultRelationDesc = resultRelInfo->ri_RelationDesc;
1266 1267

	/* BEFORE ROW INSERT Triggers */
1268
	if (resultRelInfo->ri_TrigDesc &&
1269
		resultRelInfo->ri_TrigDesc->n_before_row[TRIGGER_EVENT_INSERT] > 0)
1270
	{
1271
		HeapTuple	newtuple;
1272

1273
		newtuple = ExecBRInsertTriggers(estate, resultRelInfo, tuple);
1274 1275 1276 1277 1278 1279

		if (newtuple == NULL)	/* "do nothing" */
			return;

		if (newtuple != tuple)	/* modified by Trigger(s) */
		{
1280 1281 1282
			/*
			 * Insert modified tuple into tuple table slot, replacing the
			 * original.  We assume that it was allocated in per-tuple
B
Bruce Momjian 已提交
1283 1284
			 * memory context, and therefore will go away by itself. The
			 * tuple table slot should not try to clear it.
1285 1286 1287
			 */
			ExecStoreTuple(newtuple, slot, InvalidBuffer, false);
			tuple = newtuple;
1288 1289 1290
		}
	}

B
Bruce Momjian 已提交
1291
	/*
1292
	 * Check the constraints of the tuple
1293 1294
	 */
	if (resultRelationDesc->rd_att->constr)
1295
		ExecConstraints("ExecInsert", resultRelInfo, slot, estate);
1296

B
Bruce Momjian 已提交
1297
	/*
B
Bruce Momjian 已提交
1298
	 * insert the tuple
1299
	 */
1300 1301
	newId = heap_insert(resultRelationDesc, tuple,
						estate->es_snapshot->curcid);
1302

1303
	IncrAppended();
1304 1305
	(estate->es_processed)++;
	estate->es_lastoid = newId;
T
Tom Lane 已提交
1306
	setLastTid(&(tuple->t_self));
1307

B
Bruce Momjian 已提交
1308
	/*
B
Bruce Momjian 已提交
1309
	 * process indices
1310
	 *
B
Bruce Momjian 已提交
1311 1312 1313
	 * Note: heap_insert adds a new tuple to a relation.  As a side effect,
	 * the tupleid of the new tuple is placed in the new tuple's t_ctid
	 * field.
1314
	 */
1315
	numIndices = resultRelInfo->ri_NumIndices;
1316
	if (numIndices > 0)
1317
		ExecInsertIndexTuples(slot, &(tuple->t_self), estate, false);
1318 1319

	/* AFTER ROW INSERT Triggers */
1320
	ExecARInsertTriggers(estate, resultRelInfo, tuple);
1321 1322 1323
}

/* ----------------------------------------------------------------
1324
 *		ExecDelete
1325
 *
1326
 *		DELETE is like UPDATE, we delete the tuple and its
1327
 *		index tuples.
1328 1329 1330
 * ----------------------------------------------------------------
 */
static void
1331
ExecDelete(TupleTableSlot *slot,
1332
		   ItemPointer tupleid,
1333
		   EState *estate)
1334
{
1335
	ResultRelInfo *resultRelInfo;
B
Bruce Momjian 已提交
1336 1337 1338
	Relation	resultRelationDesc;
	ItemPointerData ctid;
	int			result;
1339

B
Bruce Momjian 已提交
1340
	/*
1341
	 * get information on the (current) result relation
1342
	 */
1343 1344
	resultRelInfo = estate->es_result_relation_info;
	resultRelationDesc = resultRelInfo->ri_RelationDesc;
1345 1346

	/* BEFORE ROW DELETE Triggers */
1347
	if (resultRelInfo->ri_TrigDesc &&
1348
	  resultRelInfo->ri_TrigDesc->n_before_row[TRIGGER_EVENT_DELETE] > 0)
1349
	{
1350
		bool		dodelete;
1351

1352
		dodelete = ExecBRDeleteTriggers(estate, resultRelInfo, tupleid);
1353 1354 1355 1356 1357

		if (!dodelete)			/* "do nothing" */
			return;
	}

V
Vadim B. Mikheev 已提交
1358
	/*
B
Bruce Momjian 已提交
1359
	 * delete the tuple
1360
	 */
1361
ldelete:;
1362 1363 1364
	result = heap_delete(resultRelationDesc, tupleid,
						 &ctid,
						 estate->es_snapshot->curcid);
V
Vadim B. Mikheev 已提交
1365 1366 1367
	switch (result)
	{
		case HeapTupleSelfUpdated:
1368
			/* already deleted by self; nothing to do */
V
Vadim B. Mikheev 已提交
1369 1370 1371 1372 1373 1374
			return;

		case HeapTupleMayBeUpdated:
			break;

		case HeapTupleUpdated:
1375 1376
			if (XactIsoLevel == XACT_SERIALIZABLE)
				elog(ERROR, "Can't serialize access due to concurrent update");
1377 1378
			else if (!(ItemPointerEquals(tupleid, &ctid)))
			{
B
Bruce Momjian 已提交
1379
				TupleTableSlot *epqslot = EvalPlanQual(estate,
B
Bruce Momjian 已提交
1380
							   resultRelInfo->ri_RangeTableIndex, &ctid);
1381

V
Vadim B. Mikheev 已提交
1382
				if (!TupIsNull(epqslot))
1383 1384 1385 1386 1387
				{
					*tupleid = ctid;
					goto ldelete;
				}
			}
1388
			/* tuple already deleted; nothing to do */
V
Vadim B. Mikheev 已提交
1389 1390 1391 1392 1393 1394
			return;

		default:
			elog(ERROR, "Unknown status %u from heap_delete", result);
			return;
	}
1395 1396 1397 1398

	IncrDeleted();
	(estate->es_processed)++;

B
Bruce Momjian 已提交
1399
	/*
B
Bruce Momjian 已提交
1400 1401
	 * Note: Normally one would think that we have to delete index tuples
	 * associated with the heap tuple now..
1402
	 *
B
Bruce Momjian 已提交
1403 1404 1405
	 * ... but in POSTGRES, we have no need to do this because the vacuum
	 * daemon automatically opens an index scan and deletes index tuples
	 * when it finds deleted heap tuples. -cim 9/27/89
1406 1407 1408
	 */

	/* AFTER ROW DELETE Triggers */
1409
	ExecARDeleteTriggers(estate, resultRelInfo, tupleid);
1410 1411 1412
}

/* ----------------------------------------------------------------
1413
 *		ExecUpdate
1414
 *
1415 1416 1417 1418
 *		note: we can't run UPDATE queries with transactions
 *		off because UPDATEs are actually INSERTs and our
 *		scan will mistakenly loop forever, updating the tuple
 *		it just inserted..	This should be fixed but until it
1419 1420
 *		is, we don't want to get stuck in an infinite loop
 *		which corrupts your database..
1421 1422 1423
 * ----------------------------------------------------------------
 */
static void
1424
ExecUpdate(TupleTableSlot *slot,
B
Bruce Momjian 已提交
1425 1426
		   ItemPointer tupleid,
		   EState *estate)
1427
{
B
Bruce Momjian 已提交
1428
	HeapTuple	tuple;
1429
	ResultRelInfo *resultRelInfo;
B
Bruce Momjian 已提交
1430 1431 1432 1433
	Relation	resultRelationDesc;
	ItemPointerData ctid;
	int			result;
	int			numIndices;
1434

B
Bruce Momjian 已提交
1435
	/*
B
Bruce Momjian 已提交
1436
	 * abort the operation if not running transactions
1437 1438 1439
	 */
	if (IsBootstrapProcessingMode())
	{
1440
		elog(WARNING, "ExecUpdate: UPDATE can't run without transactions");
1441 1442 1443
		return;
	}

B
Bruce Momjian 已提交
1444
	/*
B
Bruce Momjian 已提交
1445
	 * get the heap tuple out of the tuple table slot
1446 1447 1448
	 */
	tuple = slot->val;

B
Bruce Momjian 已提交
1449
	/*
1450
	 * get information on the (current) result relation
1451
	 */
1452 1453
	resultRelInfo = estate->es_result_relation_info;
	resultRelationDesc = resultRelInfo->ri_RelationDesc;
1454 1455

	/* BEFORE ROW UPDATE Triggers */
1456
	if (resultRelInfo->ri_TrigDesc &&
1457
	  resultRelInfo->ri_TrigDesc->n_before_row[TRIGGER_EVENT_UPDATE] > 0)
1458
	{
1459
		HeapTuple	newtuple;
1460

1461 1462
		newtuple = ExecBRUpdateTriggers(estate, resultRelInfo,
										tupleid, tuple);
1463 1464 1465 1466 1467 1468

		if (newtuple == NULL)	/* "do nothing" */
			return;

		if (newtuple != tuple)	/* modified by Trigger(s) */
		{
1469 1470 1471
			/*
			 * Insert modified tuple into tuple table slot, replacing the
			 * original.  We assume that it was allocated in per-tuple
B
Bruce Momjian 已提交
1472 1473
			 * memory context, and therefore will go away by itself. The
			 * tuple table slot should not try to clear it.
1474 1475 1476
			 */
			ExecStoreTuple(newtuple, slot, InvalidBuffer, false);
			tuple = newtuple;
1477 1478 1479
		}
	}

B
Bruce Momjian 已提交
1480
	/*
1481
	 * Check the constraints of the tuple
1482
	 *
1483 1484 1485 1486 1487
	 * If we generate a new candidate tuple after EvalPlanQual testing, we
	 * must loop back here and recheck constraints.  (We don't need to
	 * redo triggers, however.	If there are any BEFORE triggers then
	 * trigger.c will have done mark4update to lock the correct tuple, so
	 * there's no need to do them again.)
1488
	 */
1489
lreplace:;
1490
	if (resultRelationDesc->rd_att->constr)
1491
		ExecConstraints("ExecUpdate", resultRelInfo, slot, estate);
1492

V
Vadim B. Mikheev 已提交
1493
	/*
B
Bruce Momjian 已提交
1494
	 * replace the heap tuple
1495
	 */
1496 1497 1498
	result = heap_update(resultRelationDesc, tupleid, tuple,
						 &ctid,
						 estate->es_snapshot->curcid);
V
Vadim B. Mikheev 已提交
1499 1500 1501
	switch (result)
	{
		case HeapTupleSelfUpdated:
1502
			/* already deleted by self; nothing to do */
V
Vadim B. Mikheev 已提交
1503 1504 1505 1506 1507 1508
			return;

		case HeapTupleMayBeUpdated:
			break;

		case HeapTupleUpdated:
1509 1510
			if (XactIsoLevel == XACT_SERIALIZABLE)
				elog(ERROR, "Can't serialize access due to concurrent update");
1511 1512
			else if (!(ItemPointerEquals(tupleid, &ctid)))
			{
B
Bruce Momjian 已提交
1513
				TupleTableSlot *epqslot = EvalPlanQual(estate,
B
Bruce Momjian 已提交
1514
							   resultRelInfo->ri_RangeTableIndex, &ctid);
1515

V
Vadim B. Mikheev 已提交
1516
				if (!TupIsNull(epqslot))
1517 1518
				{
					*tupleid = ctid;
V
Vadim B. Mikheev 已提交
1519
					tuple = ExecRemoveJunk(estate->es_junkFilter, epqslot);
1520
					slot = ExecStoreTuple(tuple,
1521
									estate->es_junkFilter->jf_resultSlot,
1522
										  InvalidBuffer, true);
1523 1524 1525
					goto lreplace;
				}
			}
1526
			/* tuple already deleted; nothing to do */
V
Vadim B. Mikheev 已提交
1527 1528 1529
			return;

		default:
1530
			elog(ERROR, "Unknown status %u from heap_update", result);
V
Vadim B. Mikheev 已提交
1531
			return;
1532 1533 1534 1535 1536
	}

	IncrReplaced();
	(estate->es_processed)++;

B
Bruce Momjian 已提交
1537
	/*
B
Bruce Momjian 已提交
1538
	 * Note: instead of having to update the old index tuples associated
B
Bruce Momjian 已提交
1539
	 * with the heap tuple, all we do is form and insert new index tuples.
1540
	 * This is because UPDATEs are actually DELETEs and INSERTs and index
B
Bruce Momjian 已提交
1541 1542
	 * tuple deletion is done automagically by the vacuum daemon. All we
	 * do is insert new index tuples.  -cim 9/27/89
1543 1544
	 */

B
Bruce Momjian 已提交
1545
	/*
B
Bruce Momjian 已提交
1546
	 * process indices
1547
	 *
1548
	 * heap_update updates a tuple in the base relation by invalidating it
1549
	 * and then inserting a new tuple to the relation.	As a side effect,
B
Bruce Momjian 已提交
1550 1551 1552
	 * the tupleid of the new tuple is placed in the new tuple's t_ctid
	 * field.  So we now insert index tuples using the new tupleid stored
	 * there.
1553 1554
	 */

1555
	numIndices = resultRelInfo->ri_NumIndices;
1556
	if (numIndices > 0)
1557
		ExecInsertIndexTuples(slot, &(tuple->t_self), estate, false);
1558 1559

	/* AFTER ROW UPDATE Triggers */
1560
	ExecARUpdateTriggers(estate, resultRelInfo, tupleid, tuple);
1561
}
V
Vadim B. Mikheev 已提交
1562

1563
static char *
1564 1565
ExecRelCheck(ResultRelInfo *resultRelInfo,
			 TupleTableSlot *slot, EState *estate)
V
Vadim B. Mikheev 已提交
1566
{
1567
	Relation	rel = resultRelInfo->ri_RelationDesc;
1568 1569
	int			ncheck = rel->rd_att->constr->num_check;
	ConstrCheck *check = rel->rd_att->constr->check;
1570
	ExprContext *econtext;
1571
	MemoryContext oldContext;
1572 1573
	List	   *qual;
	int			i;
1574

1575 1576 1577 1578 1579 1580 1581 1582 1583 1584 1585 1586 1587
	/*
	 * If first time through for this result relation, build expression
	 * nodetrees for rel's constraint expressions.  Keep them in the
	 * per-query memory context so they'll survive throughout the query.
	 */
	if (resultRelInfo->ri_ConstraintExprs == NULL)
	{
		oldContext = MemoryContextSwitchTo(estate->es_query_cxt);
		resultRelInfo->ri_ConstraintExprs =
			(List **) palloc(ncheck * sizeof(List *));
		for (i = 0; i < ncheck; i++)
		{
			qual = (List *) stringToNode(check[i].ccbin);
1588
			resultRelInfo->ri_ConstraintExprs[i] = (List *)
1589
				ExecPrepareExpr((Expr *) qual, estate);
1590 1591 1592 1593
		}
		MemoryContextSwitchTo(oldContext);
	}

1594
	/*
B
Bruce Momjian 已提交
1595 1596
	 * We will use the EState's per-tuple context for evaluating
	 * constraint expressions (creating it if it's not already there).
1597
	 */
1598
	econtext = GetPerTupleExprContext(estate);
1599

1600 1601 1602 1603
	/* Arrange for econtext's scan tuple to be the tuple under test */
	econtext->ecxt_scantuple = slot;

	/* And evaluate the constraints */
1604 1605
	for (i = 0; i < ncheck; i++)
	{
1606
		qual = resultRelInfo->ri_ConstraintExprs[i];
1607

1608 1609
		/*
		 * NOTE: SQL92 specifies that a NULL result from a constraint
1610 1611
		 * expression is not to be treated as a failure.  Therefore, tell
		 * ExecQual to return TRUE for NULL.
1612
		 */
1613
		if (!ExecQual(qual, econtext, true))
1614
			return check[i].ccname;
1615 1616
	}

1617
	/* NULL result means no error */
1618
	return (char *) NULL;
V
Vadim B. Mikheev 已提交
1619 1620
}

1621
void
1622
ExecConstraints(const char *caller, ResultRelInfo *resultRelInfo,
1623
				TupleTableSlot *slot, EState *estate)
V
Vadim B. Mikheev 已提交
1624
{
1625
	Relation	rel = resultRelInfo->ri_RelationDesc;
1626 1627 1628 1629
	HeapTuple	tuple = slot->val;
	TupleConstr *constr = rel->rd_att->constr;

	Assert(constr);
1630

1631
	if (constr->has_not_null)
V
Vadim B. Mikheev 已提交
1632
	{
1633
		int			natts = rel->rd_att->natts;
1634
		int			attrChk;
1635

1636
		for (attrChk = 1; attrChk <= natts; attrChk++)
1637
		{
B
Bruce Momjian 已提交
1638
			if (rel->rd_att->attrs[attrChk - 1]->attnotnull &&
1639
				heap_attisnull(tuple, attrChk))
1640
				elog(ERROR, "%s: Fail to add null value in not null attribute %s",
B
Bruce Momjian 已提交
1641
					 caller, NameStr(rel->rd_att->attrs[attrChk - 1]->attname));
1642 1643 1644
		}
	}

1645
	if (constr->num_check > 0)
1646
	{
1647
		char	   *failed;
1648

1649
		if ((failed = ExecRelCheck(resultRelInfo, slot, estate)) != NULL)
B
Bruce Momjian 已提交
1650 1651
			elog(ERROR, "%s: rejected due to CHECK constraint \"%s\" on \"%s\"",
				 caller, failed, RelationGetRelationName(rel));
1652
	}
V
Vadim B. Mikheev 已提交
1653
}
1654

1655 1656 1657 1658 1659 1660
/*
 * Check a modified tuple to see if we want to process its updated version
 * under READ COMMITTED rules.
 *
 * See backend/executor/README for some info about how this works.
 */
B
Bruce Momjian 已提交
1661
TupleTableSlot *
1662 1663
EvalPlanQual(EState *estate, Index rti, ItemPointer tid)
{
1664 1665
	evalPlanQual *epq;
	EState	   *epqstate;
B
Bruce Momjian 已提交
1666 1667
	Relation	relation;
	HeapTupleData tuple;
1668 1669
	HeapTuple	copyTuple = NULL;
	bool		endNode;
1670 1671 1672

	Assert(rti != 0);

1673 1674 1675 1676 1677 1678 1679 1680 1681 1682 1683 1684 1685 1686 1687 1688 1689 1690 1691 1692 1693 1694 1695 1696 1697 1698 1699 1700 1701 1702 1703 1704 1705
	/*
	 * find relation containing target tuple
	 */
	if (estate->es_result_relation_info != NULL &&
		estate->es_result_relation_info->ri_RangeTableIndex == rti)
		relation = estate->es_result_relation_info->ri_RelationDesc;
	else
	{
		List	   *l;

		relation = NULL;
		foreach(l, estate->es_rowMark)
		{
			if (((execRowMark *) lfirst(l))->rti == rti)
			{
				relation = ((execRowMark *) lfirst(l))->relation;
				break;
			}
		}
		if (relation == NULL)
			elog(ERROR, "EvalPlanQual: can't find RTE %d", (int) rti);
	}

	/*
	 * fetch tid tuple
	 *
	 * Loop here to deal with updated or busy tuples
	 */
	tuple.t_self = *tid;
	for (;;)
	{
		Buffer		buffer;

1706
		if (heap_fetch(relation, SnapshotDirty, &tuple, &buffer, false, NULL))
1707 1708 1709 1710 1711 1712 1713 1714 1715 1716 1717 1718 1719 1720 1721 1722 1723 1724 1725 1726 1727 1728 1729 1730 1731 1732 1733 1734 1735 1736 1737 1738 1739 1740 1741 1742 1743 1744 1745 1746 1747 1748 1749 1750 1751 1752 1753 1754 1755 1756 1757
		{
			TransactionId xwait = SnapshotDirty->xmax;

			if (TransactionIdIsValid(SnapshotDirty->xmin))
				elog(ERROR, "EvalPlanQual: t_xmin is uncommitted ?!");

			/*
			 * If tuple is being updated by other transaction then we have
			 * to wait for its commit/abort.
			 */
			if (TransactionIdIsValid(xwait))
			{
				ReleaseBuffer(buffer);
				XactLockTableWait(xwait);
				continue;
			}

			/*
			 * We got tuple - now copy it for use by recheck query.
			 */
			copyTuple = heap_copytuple(&tuple);
			ReleaseBuffer(buffer);
			break;
		}

		/*
		 * Oops! Invalid tuple. Have to check is it updated or deleted.
		 * Note that it's possible to get invalid SnapshotDirty->tid if
		 * tuple updated by this transaction. Have we to check this ?
		 */
		if (ItemPointerIsValid(&(SnapshotDirty->tid)) &&
			!(ItemPointerEquals(&(tuple.t_self), &(SnapshotDirty->tid))))
		{
			/* updated, so look at the updated copy */
			tuple.t_self = SnapshotDirty->tid;
			continue;
		}

		/*
		 * Deleted or updated by this transaction; forget it.
		 */
		return NULL;
	}

	/*
	 * For UPDATE/DELETE we have to return tid of actual row we're
	 * executing PQ for.
	 */
	*tid = tuple.t_self;

	/*
1758
	 * Need to run a recheck subquery.	Find or create a PQ stack entry.
1759
	 */
1760
	epq = estate->es_evalPlanQual;
1761 1762
	endNode = true;

1763 1764
	if (epq != NULL && epq->rti == 0)
	{
1765
		/* Top PQ stack entry is idle, so re-use it */
1766
		Assert(!(estate->es_useEvalPlan) && epq->next == NULL);
1767 1768 1769 1770 1771 1772
		epq->rti = rti;
		endNode = false;
	}

	/*
	 * If this is request for another RTE - Ra, - then we have to check
B
Bruce Momjian 已提交
1773 1774 1775
	 * wasn't PlanQual requested for Ra already and if so then Ra' row was
	 * updated again and we have to re-start old execution for Ra and
	 * forget all what we done after Ra was suspended. Cool? -:))
1776
	 */
B
Bruce Momjian 已提交
1777
	if (epq != NULL && epq->rti != rti &&
1778
		epq->estate->es_evTuple[rti - 1] != NULL)
1779 1780 1781
	{
		do
		{
1782 1783
			evalPlanQual *oldepq;

1784
			/* stop execution */
1785 1786 1787 1788
			EvalPlanQualStop(epq);
			/* pop previous PlanQual from the stack */
			oldepq = epq->next;
			Assert(oldepq && oldepq->rti != 0);
1789 1790 1791
			/* push current PQ to freePQ stack */
			oldepq->free = epq;
			epq = oldepq;
1792
			estate->es_evalPlanQual = epq;
1793 1794 1795
		} while (epq->rti != rti);
	}

B
Bruce Momjian 已提交
1796
	/*
1797 1798 1799 1800 1801 1802
	 * If we are requested for another RTE then we have to suspend
	 * execution of current PlanQual and start execution for new one.
	 */
	if (epq == NULL || epq->rti != rti)
	{
		/* try to reuse plan used previously */
B
Bruce Momjian 已提交
1803
		evalPlanQual *newepq = (epq != NULL) ? epq->free : NULL;
1804

1805
		if (newepq == NULL)		/* first call or freePQ stack is empty */
1806
		{
1807
			newepq = (evalPlanQual *) palloc0(sizeof(evalPlanQual));
1808
			newepq->free = NULL;
1809 1810
			newepq->estate = NULL;
			newepq->planstate = NULL;
1811 1812
		}
		else
1813
		{
1814 1815 1816
			/* recycle previously used PlanQual */
			Assert(newepq->estate == NULL);
			epq->free = NULL;
1817
		}
1818
		/* push current PQ to the stack */
1819
		newepq->next = epq;
1820
		epq = newepq;
1821
		estate->es_evalPlanQual = epq;
1822 1823 1824 1825
		epq->rti = rti;
		endNode = false;
	}

1826
	Assert(epq->rti == rti);
1827 1828

	/*
1829 1830
	 * Ok - we're requested for the same RTE.  Unfortunately we still have
	 * to end and restart execution of the plan, because ExecReScan
1831
	 * wouldn't ensure that upper plan nodes would reset themselves.  We
1832 1833 1834
	 * could make that work if insertion of the target tuple were
	 * integrated with the Param mechanism somehow, so that the upper plan
	 * nodes know that their children's outputs have changed.
1835 1836 1837 1838 1839
	 *
	 * Note that the stack of free evalPlanQual nodes is quite useless at
	 * the moment, since it only saves us from pallocing/releasing the
	 * evalPlanQual nodes themselves.  But it will be useful once we
	 * implement ReScan instead of end/restart for re-using PlanQual nodes.
1840 1841
	 */
	if (endNode)
1842
	{
1843
		/* stop execution */
1844
		EvalPlanQualStop(epq);
1845
	}
1846

1847 1848 1849 1850 1851 1852 1853 1854 1855 1856
	/*
	 * Initialize new recheck query.
	 *
	 * Note: if we were re-using PlanQual plans via ExecReScan, we'd need
	 * to instead copy down changeable state from the top plan (including
	 * es_result_relation_info, es_junkFilter) and reset locally changeable
	 * state in the epq (including es_param_exec_vals, es_evTupleNull).
	 */
	EvalPlanQualStart(epq, estate, epq->next);

1857
	/*
1858 1859
	 * free old RTE' tuple, if any, and store target tuple where
	 * relation's scan node will see it
1860
	 */
1861
	epqstate = epq->estate;
1862 1863 1864
	if (epqstate->es_evTuple[rti - 1] != NULL)
		heap_freetuple(epqstate->es_evTuple[rti - 1]);
	epqstate->es_evTuple[rti - 1] = copyTuple;
1865

1866
	return EvalPlanQualNext(estate);
1867 1868
}

B
Bruce Momjian 已提交
1869
static TupleTableSlot *
1870 1871
EvalPlanQualNext(EState *estate)
{
1872 1873
	evalPlanQual *epq = estate->es_evalPlanQual;
	MemoryContext oldcontext;
B
Bruce Momjian 已提交
1874
	TupleTableSlot *slot;
1875 1876 1877 1878

	Assert(epq->rti != 0);

lpqnext:;
1879
	oldcontext = MemoryContextSwitchTo(epq->estate->es_query_cxt);
1880
	slot = ExecProcNode(epq->planstate);
1881
	MemoryContextSwitchTo(oldcontext);
1882 1883 1884 1885 1886 1887

	/*
	 * No more tuples for this PQ. Continue previous one.
	 */
	if (TupIsNull(slot))
	{
1888 1889
		evalPlanQual *oldepq;

1890
		/* stop execution */
1891
		EvalPlanQualStop(epq);
1892
		/* pop old PQ from the stack */
1893 1894
		oldepq = epq->next;
		if (oldepq == NULL)
1895
		{
1896 1897 1898 1899 1900
			/* this is the first (oldest) PQ - mark as free */
			epq->rti = 0;
			estate->es_useEvalPlan = false;
			/* and continue Query execution */
			return (NULL);
1901 1902 1903 1904 1905
		}
		Assert(oldepq->rti != 0);
		/* push current PQ to freePQ stack */
		oldepq->free = epq;
		epq = oldepq;
1906
		estate->es_evalPlanQual = epq;
1907 1908 1909 1910 1911
		goto lpqnext;
	}

	return (slot);
}
1912 1913 1914 1915

/*
 * EndEvalPlanQual
 *		Shut down every PlanQual entry still active on the stack.
 *
 * Does nothing if the stack is already idle (top entry has rti == 0).
 * Otherwise each entry is stopped and popped in turn, newest first; popped
 * entries are linked onto the free-PQ stack of the entry beneath them.
 * The oldest entry stays in place but is marked free, and es_useEvalPlan
 * is cleared.
 */
static void
EndEvalPlanQual(EState *estate)
{
	evalPlanQual *curepq = estate->es_evalPlanQual;
	evalPlanQual *outerepq;

	if (curepq->rti == 0)
	{
		/* all plans have been shut down already */
		Assert(curepq->next == NULL);
		return;
	}

	/* stop the newest PQ, then keep unwinding while older ones remain */
	EvalPlanQualStop(curepq);

	while ((outerepq = curepq->next) != NULL)
	{
		Assert(outerepq->rti != 0);

		/* move the finished PQ to the free-PQ stack and pop it */
		outerepq->free = curepq;
		curepq = outerepq;
		estate->es_evalPlanQual = curepq;

		EvalPlanQualStop(curepq);
	}

	/* curepq is now the first (oldest) PQ: mark it as free */
	curepq->rti = 0;
	estate->es_useEvalPlan = false;
}

/*
 * EvalPlanQualStart
 *		Begin execution of one level of PlanQual.
 *
 * A trimmed-down ExecutorStart(): rather than building everything from
 * scratch, a new executor state is created for this level and a good part
 * of its contents is copied from the top-level estate.  The new state and
 * the initialized plan state tree are stored into *epq.
 *
 *	epq			stack entry to set up
 *	estate		top-level executor state to copy from
 *	priorepq	next-older stack entry, or NULL if epq is the first one
 */
static void
EvalPlanQualStart(evalPlanQual *epq, EState *estate, evalPlanQual *priorepq)
{
	int			nrels = length(estate->es_range_table);
	EState	   *child;
	MemoryContext savedcxt;

	child = CreateExecutorState();
	epq->estate = child;

	/* everything allocated below belongs to the new state's context */
	savedcxt = MemoryContextSwitchTo(child->es_query_cxt);

	/*
	 * Unchanging state (snapshot, rangetable, result-rel info, external
	 * Param info, ...) is simply shared with the top query.  Local state,
	 * such as the tuple table and es_param_exec_vals, must be private to
	 * this level.
	 */
	child->es_direction = ForwardScanDirection;
	child->es_snapshot = estate->es_snapshot;
	child->es_range_table = estate->es_range_table;
	child->es_result_relations = estate->es_result_relations;
	child->es_num_result_relations = estate->es_num_result_relations;
	child->es_result_relation_info = estate->es_result_relation_info;
	child->es_junkFilter = estate->es_junkFilter;
	child->es_into_relation_descriptor = estate->es_into_relation_descriptor;
	child->es_param_list_info = estate->es_param_list_info;

	/* private, zeroed exec-Param array, only if the plan uses any */
	if (estate->es_topPlan->nParamExec > 0)
	{
		child->es_param_exec_vals = (ParamExecData *)
			palloc0(estate->es_topPlan->nParamExec * sizeof(ParamExecData));
	}

	child->es_rowMark = estate->es_rowMark;
	child->es_instrument = estate->es_instrument;
	child->es_force_oids = estate->es_force_oids;
	child->es_topPlan = estate->es_topPlan;

	/*
	 * es_evTupleNull is per-level, whereas es_evTuple is one array shared
	 * by the whole stack; that way a sub-recheck inherits the tuple being
	 * examined by an outer recheck.
	 */
	child->es_evTupleNull = (bool *) palloc0(nrels * sizeof(bool));

	if (priorepq != NULL)
	{
		/* not the first entry: reuse the storage already in place */
		child->es_evTuple = priorepq->estate->es_evTuple;
	}
	else
	{
		/* first PQ stack entry: create the shared array */
		child->es_evTuple = (HeapTuple *)
			palloc0(nrels * sizeof(HeapTuple));
	}

	/* private tuple table, sized like the top query's */
	child->es_tupleTable =
		ExecCreateTupleTable(estate->es_tupleTable->size);

	/* initialize a fresh plan state tree for the top plan */
	epq->planstate = ExecInitNode(estate->es_topPlan, child);

	MemoryContextSwitchTo(savedcxt);
}

/*
 * EvalPlanQualStop
 *		Finish execution of one level of PlanQual.
 *
 * A trimmed-down ExecutorEnd(): most of the usual cleanup is performed,
 * but the result relations are *not* closed, since they are merely shared
 * from the outer query.  On return epq->estate and epq->planstate are
 * both NULL.
 */
static void
EvalPlanQualStop(evalPlanQual *epq)
{
	EState	   *child = epq->estate;
	MemoryContext savedcxt;

	savedcxt = MemoryContextSwitchTo(child->es_query_cxt);

	/* shut down the plan state tree of this level */
	ExecEndNode(epq->planstate);

	/* release this level's private tuple table */
	ExecDropTupleTable(child->es_tupleTable, true);
	child->es_tupleTable = NULL;

	/* discard the recheck tuple stored for this level's relation, if any */
	if (child->es_evTuple[epq->rti - 1] != NULL)
	{
		heap_freetuple(child->es_evTuple[epq->rti - 1]);
		child->es_evTuple[epq->rti - 1] = NULL;
	}

	MemoryContextSwitchTo(savedcxt);

	/* switch back before freeing the executor state itself */
	FreeExecutorState(child);

	epq->estate = NULL;
	epq->planstate = NULL;
}