/*-------------------------------------------------------------------------
 *
 * execMain.c
 *	  top level executor interface routines
 *
 * INTERFACE ROUTINES
 *	ExecutorStart()
 *	ExecutorRun()
 *	ExecutorEnd()
 *
 *	The old ExecutorMain() has been replaced by ExecutorStart(),
 *	ExecutorRun() and ExecutorEnd().
 *
 *	These three procedures are the external interfaces to the executor.
 *	In each case, the query descriptor is required as an argument.
 *
 *	ExecutorStart() must be called at the beginning of execution of any
 *	query plan and ExecutorEnd() should always be called at the end of
 *	execution of a plan.
 *
 *	ExecutorRun accepts direction and count arguments that specify whether
 *	the plan is to be executed forwards, backwards, and for how many tuples.
 *
 * Portions Copyright (c) 1996-2002, PostgreSQL Global Development Group
 * Portions Copyright (c) 1994, Regents of the University of California
 *
 *
 * IDENTIFICATION
 *	  $Header: /cvsroot/pgsql/src/backend/executor/execMain.c,v 1.200 2003/02/03 15:07:06 tgl Exp $
 *
 *-------------------------------------------------------------------------
 */
33 34
#include "postgres.h"

35 36
#include "access/heapam.h"
#include "catalog/heap.h"
37
#include "catalog/namespace.h"
38
#include "commands/tablecmds.h"
39
#include "commands/trigger.h"
B
Bruce Momjian 已提交
40 41 42 43 44 45
#include "executor/execdebug.h"
#include "executor/execdefs.h"
#include "miscadmin.h"
#include "optimizer/var.h"
#include "parser/parsetree.h"
#include "utils/acl.h"
46
#include "utils/lsyscache.h"
47

48

49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64
/*
 * execRowMark
 *		Bookkeeping for one relation named in the query's rowMarks list.
 *		InitPlan builds one entry per rowMarks member and appends it to
 *		estate->es_rowMark; ExecEndPlan closes the relation again while
 *		keeping its lock.
 */
typedef struct execRowMark
{
	Relation	relation;		/* relation opened by InitPlan with RowShareLock */
	Index		rti;			/* range table index taken from the rowMarks list */
	char		resname[32];	/* "ctid" followed by rti, as formatted by InitPlan */
} execRowMark;

/*
 * evalPlanQual
 *		One PlanQual plan entry.  Entries are chained through "next" and
 *		"free"; estate->es_evalPlanQual is reset to NULL by InitPlan and
 *		checked by ExecEndPlan to decide whether EndEvalPlanQual must run.
 *
 * NOTE(review): the code that fills in and consumes these fields is not in
 * this part of the file; the rti/estate/planstate notes below are inferred
 * from the field types only and should be confirmed.
 */
typedef struct evalPlanQual
{
	Index		rti;			/* presumably a range table index -- confirm */
	EState	   *estate;			/* executor state associated with this entry */
	PlanState  *planstate;		/* plan state tree associated with this entry */
	struct evalPlanQual *next;	/* stack of active PlanQual plans */
	struct evalPlanQual *free;	/* list of free PlanQual plans */
} evalPlanQual;

65
/* decls for local routines only used within this module */
66
static void InitPlan(QueryDesc *queryDesc);
67
static void initResultRelInfo(ResultRelInfo *resultRelInfo,
B
Bruce Momjian 已提交
68 69 70
				  Index resultRelationIndex,
				  List *rangeTable,
				  CmdType operation);
71
static TupleTableSlot *ExecutePlan(EState *estate, PlanState *planstate,
B
Bruce Momjian 已提交
72 73 74 75
			CmdType operation,
			long numberTuples,
			ScanDirection direction,
			DestReceiver *destfunc);
76
static void ExecSelect(TupleTableSlot *slot,
B
Bruce Momjian 已提交
77 78
		   DestReceiver *destfunc,
		   EState *estate);
79
static void ExecInsert(TupleTableSlot *slot, ItemPointer tupleid,
B
Bruce Momjian 已提交
80
		   EState *estate);
81
static void ExecDelete(TupleTableSlot *slot, ItemPointer tupleid,
B
Bruce Momjian 已提交
82
		   EState *estate);
83
static void ExecUpdate(TupleTableSlot *slot, ItemPointer tupleid,
B
Bruce Momjian 已提交
84
		   EState *estate);
85
static TupleTableSlot *EvalPlanQualNext(EState *estate);
86
static void EndEvalPlanQual(EState *estate);
87
static void ExecCheckRTEPerms(RangeTblEntry *rte, CmdType operation);
88
static void ExecCheckXactReadOnly(Query *parsetree, CmdType operation);
89 90 91
static void EvalPlanQualStart(evalPlanQual *epq, EState *estate,
							  evalPlanQual *priorepq);
static void EvalPlanQualStop(evalPlanQual *epq);
92

93 94
/* end of local decls */

95

96
/* ----------------------------------------------------------------
97 98 99 100 101
 *		ExecutorStart
 *
 *		This routine must be called at the beginning of any execution of any
 *		query plan
 *
102 103 104 105
 * Takes a QueryDesc previously created by CreateQueryDesc (it's not real
 * clear why we bother to separate the two functions, but...).  The tupDesc
 * field of the QueryDesc is filled in to describe the tuples that will be
 * returned, and the internal fields (estate and planstate) are set up.
106
 *
107 108
 * NB: the CurrentMemoryContext when this is called will become the parent
 * of the per-query context used for this Executor invocation.
109 110
 * ----------------------------------------------------------------
 */
111 112
void
ExecutorStart(QueryDesc *queryDesc)
113
{
114
	EState	   *estate;
115
	MemoryContext oldcontext;
116

117
	/* sanity checks: queryDesc must not be started already */
118
	Assert(queryDesc != NULL);
119 120 121
	Assert(queryDesc->estate == NULL);

	/*
122
	 * Build EState, switch into per-query memory context for startup.
123 124 125 126
	 */
	estate = CreateExecutorState();
	queryDesc->estate = estate;

127 128 129 130 131
	oldcontext = MemoryContextSwitchTo(estate->es_query_cxt);

	/*
	 * Fill in parameters, if any, from queryDesc
	 */
132
	estate->es_param_list_info = queryDesc->params;
133

V
Vadim B. Mikheev 已提交
134
	if (queryDesc->plantree->nParamExec > 0)
135
		estate->es_param_exec_vals = (ParamExecData *)
136
			palloc0(queryDesc->plantree->nParamExec * sizeof(ParamExecData));
137

138 139
	estate->es_instrument = queryDesc->doInstrument;

140
	/*
141 142
	 * Make our own private copy of the current query snapshot data.
	 *
B
Bruce Momjian 已提交
143 144 145
	 * This "freezes" our idea of which tuples are good and which are not for
	 * the life of this query, even if it outlives the current command and
	 * current snapshot.
146
	 */
147
	estate->es_snapshot = CopyQuerySnapshot();
148

149
	/*
150
	 * Initialize the plan state tree
151
	 */
152
	InitPlan(queryDesc);
153 154

	MemoryContextSwitchTo(oldcontext);
155 156 157
}

/* ----------------------------------------------------------------
158 159 160 161 162 163 164
 *		ExecutorRun
 *
 *		This is the main routine of the executor module. It accepts
 *		the query descriptor from the traffic cop and executes the
 *		query plan.
 *
 *		ExecutorStart must have been called already.
165
 *
166 167 168
 *		If direction is NoMovementScanDirection then nothing is done
 *		except to start up/shut down the destination.  Otherwise,
 *		we retrieve up to 'count' tuples in the specified direction.
169
 *
170
 *		Note: count = 0 is interpreted as no portal limit, i.e., run to
171
 *		completion.
172
 *
173 174
 * ----------------------------------------------------------------
 */
175
TupleTableSlot *
176
ExecutorRun(QueryDesc *queryDesc,
177
			ScanDirection direction, long count)
178
{
179
	EState	   *estate;
180
	CmdType		operation;
B
Bruce Momjian 已提交
181 182
	CommandDest dest;
	DestReceiver *destfunc;
183
	TupleTableSlot *result;
184 185 186 187 188 189 190 191
	MemoryContext oldcontext;

	/* sanity checks */
	Assert(queryDesc != NULL);

	estate = queryDesc->estate;

	Assert(estate != NULL);
192

B
Bruce Momjian 已提交
193
	/*
194
	 * Switch into per-query memory context
195
	 */
196
	oldcontext = MemoryContextSwitchTo(estate->es_query_cxt);
197

B
Bruce Momjian 已提交
198
	/*
B
Bruce Momjian 已提交
199 200
	 * extract information from the query descriptor and the query
	 * feature.
201
	 */
202 203 204
	operation = queryDesc->operation;
	dest = queryDesc->dest;

205 206 207 208 209 210 211 212
	/*
	 * If the transaction is read-only, we need to check if any writes
	 * are planned to non-temporary tables.  This is done here at this
	 * rather late stage so that we can handle EXPLAIN vs. EXPLAIN
	 * ANALYZE easily.
	 */
	ExecCheckXactReadOnly(queryDesc->parsetree, operation);

B
Bruce Momjian 已提交
213
	/*
214
	 * startup tuple receiver
215
	 */
216 217
	estate->es_processed = 0;
	estate->es_lastoid = InvalidOid;
218

219 220 221
	destfunc = DestToFunction(dest);
	(*destfunc->setup) (destfunc, (int) operation,
						queryDesc->portalName, queryDesc->tupDesc);
222

223 224 225 226 227 228 229
	/*
	 * run plan
	 */
	if (direction == NoMovementScanDirection)
		result = NULL;
	else
		result = ExecutePlan(estate,
230
							 queryDesc->planstate,
231 232 233 234
							 operation,
							 count,
							 direction,
							 destfunc);
235

236 237 238
	/*
	 * shutdown receiver
	 */
239 240
	(*destfunc->cleanup) (destfunc);

241 242
	MemoryContextSwitchTo(oldcontext);

243
	return result;
244 245 246
}

/* ----------------------------------------------------------------
247 248
 *		ExecutorEnd
 *
249
 *		This routine must be called at the end of execution of any
250
 *		query plan
251 252 253
 * ----------------------------------------------------------------
 */
void
254
ExecutorEnd(QueryDesc *queryDesc)
255
{
256
	EState	   *estate;
257
	MemoryContext oldcontext;
258

259 260
	/* sanity checks */
	Assert(queryDesc != NULL);
261

262 263
	estate = queryDesc->estate;

264
	Assert(estate != NULL);
265

266
	/*
267
	 * Switch into per-query memory context to run ExecEndPlan
268
	 */
269 270 271
	oldcontext = MemoryContextSwitchTo(estate->es_query_cxt);

	ExecEndPlan(queryDesc->planstate, estate);
272

273
	/*
274
	 * Must switch out of context before destroying it
275
	 */
276
	MemoryContextSwitchTo(oldcontext);
277

278
	/*
279 280
	 * Release EState and per-query memory context.  This should release
	 * everything the executor has allocated.
281
	 */
282 283 284 285 286 287
	FreeExecutorState(estate);

	/* Reset queryDesc fields that no longer point to anything */
	queryDesc->tupDesc = NULL;
	queryDesc->estate = NULL;
	queryDesc->planstate = NULL;
288
}
289

290

291 292 293 294
/*
 * ExecCheckRTPerms
 *		Check access permissions for all relations listed in a range table.
 */
295
void
296
ExecCheckRTPerms(List *rangeTable, CmdType operation)
297 298 299 300
{
	List	   *lp;

	foreach(lp, rangeTable)
301
	{
302 303
		RangeTblEntry *rte = lfirst(lp);

304
		ExecCheckRTEPerms(rte, operation);
305 306 307 308 309 310 311 312
	}
}

/*
 * ExecCheckRTEPerms
 *		Check access permissions for a single RTE.
 */
static void
313
ExecCheckRTEPerms(RangeTblEntry *rte, CmdType operation)
314
{
315
	Oid			relOid;
316
	AclId		userid;
317
	AclResult	aclcheck_result;
318

B
Bruce Momjian 已提交
319
	/*
320 321 322 323 324 325 326 327 328 329 330 331
	 * If it's a subquery, recursively examine its rangetable.
	 */
	if (rte->rtekind == RTE_SUBQUERY)
	{
		ExecCheckRTPerms(rte->subquery->rtable, operation);
		return;
	}

	/*
	 * Otherwise, only plain-relation RTEs need to be checked here.
	 * Function RTEs are checked by init_fcache when the function is prepared
	 * for execution. Join and special RTEs need no checks.
B
Bruce Momjian 已提交
332
	 */
333
	if (rte->rtekind != RTE_RELATION)
334 335
		return;

336
	relOid = rte->relid;
337 338

	/*
B
Bruce Momjian 已提交
339 340
	 * userid to check as: current user unless we have a setuid
	 * indication.
341
	 *
B
Bruce Momjian 已提交
342 343
	 * Note: GetUserId() is presently fast enough that there's no harm in
	 * calling it separately for each RTE.	If that stops being true, we
344
	 * could call it once in ExecCheckRTPerms and pass the userid down
B
Bruce Momjian 已提交
345
	 * from there.	But for now, no need for the extra clutter.
346
	 */
347
	userid = rte->checkAsUser ? rte->checkAsUser : GetUserId();
348

349
#define CHECK(MODE)		pg_class_aclcheck(relOid, userid, MODE)
350

351
	if (rte->checkForRead)
352
	{
353
		aclcheck_result = CHECK(ACL_SELECT);
354
		if (aclcheck_result != ACLCHECK_OK)
355
			aclcheck_error(aclcheck_result, get_rel_name(relOid));
356 357 358 359 360 361 362 363 364
	}

	if (rte->checkForWrite)
	{
		/*
		 * Note: write access in a SELECT context means SELECT FOR UPDATE.
		 * Right now we don't distinguish that from true update as far as
		 * permissions checks are concerned.
		 */
365 366 367
		switch (operation)
		{
			case CMD_INSERT:
368
				aclcheck_result = CHECK(ACL_INSERT);
369
				break;
370
			case CMD_SELECT:
371
			case CMD_UPDATE:
372 373 374 375
				aclcheck_result = CHECK(ACL_UPDATE);
				break;
			case CMD_DELETE:
				aclcheck_result = CHECK(ACL_DELETE);
376 377 378 379
				break;
			default:
				elog(ERROR, "ExecCheckRTEPerms: bogus operation %d",
					 operation);
380
				aclcheck_result = ACLCHECK_OK;	/* keep compiler quiet */
381 382
				break;
		}
383
		if (aclcheck_result != ACLCHECK_OK)
384
			aclcheck_error(aclcheck_result, get_rel_name(relOid));
385
	}
386 387
}

388

389 390 391 392 393 394 395
/* ===============================================================
 * ===============================================================
						 static routines follow
 * ===============================================================
 * ===============================================================
 */

396

397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421
/*
 * ExecCheckXactReadOnly
 *		When XactReadOnly is set, raise "transaction is read-only" if the
 *		query would write: either a SELECT with an INTO target, or an
 *		INSERT/UPDATE/DELETE whose range table has a plain-relation entry
 *		marked checkForWrite that is not in a temp namespace.
 */
static void
ExecCheckXactReadOnly(Query *parsetree, CmdType operation)
{
	bool		writes_planned = false;
	List	   *cell;

	if (!XactReadOnly)
		return;

	switch (operation)
	{
		case CMD_SELECT:
			/* CREATE TABLE AS or SELECT INTO */
			writes_planned = (parsetree->into != NULL);
			break;

		case CMD_INSERT:
		case CMD_UPDATE:
		case CMD_DELETE:
			foreach(cell, parsetree->rtable)
			{
				RangeTblEntry *rte = (RangeTblEntry *) lfirst(cell);

				/* stop at the first written, non-temporary plain relation */
				if (rte->rtekind == RTE_RELATION &&
					rte->checkForWrite &&
					!isTempNamespace(get_rel_namespace(rte->relid)))
				{
					writes_planned = true;
					break;
				}
			}
			break;

		default:
			break;
	}

	if (writes_planned)
		elog(ERROR, "transaction is read-only");
}


436
/* ----------------------------------------------------------------
437 438 439 440
 *		InitPlan
 *
 *		Initializes the query plan: open files, allocate storage
 *		and start up the rule manager
441 442
 * ----------------------------------------------------------------
 */
443 444
static void
InitPlan(QueryDesc *queryDesc)
445
{
446 447 448 449 450
	CmdType		operation = queryDesc->operation;
	Query *parseTree = queryDesc->parsetree;
	Plan *plan = queryDesc->plantree;
	EState *estate = queryDesc->estate;
	PlanState  *planstate;
B
Bruce Momjian 已提交
451 452
	List	   *rangeTable;
	Relation	intoRelationDesc;
453
	bool		do_select_into;
B
Bruce Momjian 已提交
454
	TupleDesc	tupType;
455

456
	/*
457 458 459
	 * Do permissions checks.  It's sufficient to examine the query's
	 * top rangetable here --- subplan RTEs will be checked during
	 * ExecInitSubPlan().
460
	 */
461
	ExecCheckRTPerms(parseTree->rtable, operation);
462

B
Bruce Momjian 已提交
463
	/*
B
Bruce Momjian 已提交
464
	 * get information from query descriptor
465
	 */
466
	rangeTable = parseTree->rtable;
467

B
Bruce Momjian 已提交
468
	/*
B
Bruce Momjian 已提交
469
	 * initialize the node's execution state
470
	 */
471 472
	estate->es_range_table = rangeTable;

B
Bruce Momjian 已提交
473
	/*
474
	 * if there is a result relation, initialize result relation stuff
475
	 */
476
	if (parseTree->resultRelation != 0 && operation != CMD_SELECT)
477
	{
478 479 480
		List	   *resultRelations = parseTree->resultRelations;
		int			numResultRelations;
		ResultRelInfo *resultRelInfos;
B
Bruce Momjian 已提交
481

482 483 484 485 486 487 488
		if (resultRelations != NIL)
		{
			/*
			 * Multiple result relations (due to inheritance)
			 * parseTree->resultRelations identifies them all
			 */
			ResultRelInfo *resultRelInfo;
489

490 491 492 493 494 495 496 497 498 499 500 501 502 503 504 505 506
			numResultRelations = length(resultRelations);
			resultRelInfos = (ResultRelInfo *)
				palloc(numResultRelations * sizeof(ResultRelInfo));
			resultRelInfo = resultRelInfos;
			while (resultRelations != NIL)
			{
				initResultRelInfo(resultRelInfo,
								  lfirsti(resultRelations),
								  rangeTable,
								  operation);
				resultRelInfo++;
				resultRelations = lnext(resultRelations);
			}
		}
		else
		{
			/*
B
Bruce Momjian 已提交
507 508
			 * Single result relation identified by
			 * parseTree->resultRelation
509 510 511 512 513 514 515 516
			 */
			numResultRelations = 1;
			resultRelInfos = (ResultRelInfo *) palloc(sizeof(ResultRelInfo));
			initResultRelInfo(resultRelInfos,
							  parseTree->resultRelation,
							  rangeTable,
							  operation);
		}
517

518 519 520 521
		estate->es_result_relations = resultRelInfos;
		estate->es_num_result_relations = numResultRelations;
		/* Initialize to first or only result rel */
		estate->es_result_relation_info = resultRelInfos;
522
	}
523 524
	else
	{
B
Bruce Momjian 已提交
525
		/*
B
Bruce Momjian 已提交
526
		 * if no result relation, then set state appropriately
527
		 */
528 529
		estate->es_result_relations = NULL;
		estate->es_num_result_relations = 0;
530 531 532
		estate->es_result_relation_info = NULL;
	}

533 534 535 536 537 538 539 540 541 542 543 544 545 546 547 548 549 550 551 552
	/*
	 * Detect whether we're doing SELECT INTO.  If so, set the force_oids
	 * flag appropriately so that the plan tree will be initialized with
	 * the correct tuple descriptors.
	 */
	do_select_into = false;

	if (operation == CMD_SELECT &&
		!parseTree->isPortal &&
		parseTree->into != NULL)
	{
		do_select_into = true;
		/*
		 * For now, always create OIDs in SELECT INTO; this is for backwards
		 * compatibility with pre-7.3 behavior.  Eventually we might want
		 * to allow the user to choose.
		 */
		estate->es_force_oids = true;
	}

553 554 555
	/*
	 * Have to lock relations selected for update
	 */
556 557
	estate->es_rowMark = NIL;
	if (parseTree->rowMarks != NIL)
558
	{
B
Bruce Momjian 已提交
559
		List	   *l;
560

561
		foreach(l, parseTree->rowMarks)
562
		{
563 564
			Index		rti = lfirsti(l);
			Oid			relid = getrelid(rti, rangeTable);
565 566 567 568
			Relation	relation;
			execRowMark *erm;

			relation = heap_open(relid, RowShareLock);
B
Bruce Momjian 已提交
569
			erm = (execRowMark *) palloc(sizeof(execRowMark));
570
			erm->relation = relation;
571
			erm->rti = rti;
572
			snprintf(erm->resname, 32, "ctid%u", rti);
573 574 575
			estate->es_rowMark = lappend(estate->es_rowMark, erm);
		}
	}
576

B
Bruce Momjian 已提交
577
	/*
578
	 * initialize the executor "tuple" table.  We need slots for all the
579 580 581
	 * plan nodes, plus possibly output slots for the junkfilter(s). At
	 * this point we aren't sure if we need junkfilters, so just add slots
	 * for them unconditionally.
582 583
	 */
	{
584
		int			nSlots = ExecCountSlotsNode(plan);
585

586 587 588 589 590
		if (parseTree->resultRelations != NIL)
			nSlots += length(parseTree->resultRelations);
		else
			nSlots += 1;
		estate->es_tupleTable = ExecCreateTupleTable(nSlots);
591
	}
592

593
	/* mark EvalPlanQual not active */
594
	estate->es_topPlan = plan;
595 596
	estate->es_evalPlanQual = NULL;
	estate->es_evTupleNull = NULL;
597
	estate->es_evTuple = NULL;
598 599
	estate->es_useEvalPlan = false;

B
Bruce Momjian 已提交
600
	/*
B
Bruce Momjian 已提交
601 602
	 * initialize the private state information for all the nodes in the
	 * query tree.	This opens files, allocates storage and leaves us
603
	 * ready to start processing tuples.
604
	 */
605
	planstate = ExecInitNode(plan, estate);
606

B
Bruce Momjian 已提交
607
	/*
608
	 * Get the tuple descriptor describing the type of tuples to return.
B
Bruce Momjian 已提交
609
	 * (this is especially important if we are creating a relation with
610
	 * "SELECT INTO")
611
	 */
612
	tupType = ExecGetTupType(planstate);
613

B
Bruce Momjian 已提交
614
	/*
615 616 617 618 619
	 * Initialize the junk filter if needed.  SELECT and INSERT queries need a
	 * filter if there are any junk attrs in the tlist.  INSERT and SELECT
	 * INTO also need a filter if the top plan node is a scan node that's not
	 * doing projection (else we'll be scribbling on the scan tuple!)  UPDATE
	 * and DELETE always need a filter, since there's always a junk 'ctid'
B
Bruce Momjian 已提交
620
	 * attribute present --- no need to look first.
621 622
	 */
	{
623 624 625
		bool		junk_filter_needed = false;
		List	   *tlist;

626
		switch (operation)
627
		{
628 629
			case CMD_SELECT:
			case CMD_INSERT:
630
				foreach(tlist, plan->targetlist)
631
				{
632 633 634 635 636 637 638
					TargetEntry *tle = (TargetEntry *) lfirst(tlist);

					if (tle->resdom->resjunk)
					{
						junk_filter_needed = true;
						break;
					}
639
				}
640 641 642 643 644 645 646 647 648 649 650 651 652
				if (!junk_filter_needed &&
					(operation == CMD_INSERT || do_select_into))
				{
					if (IsA(planstate, SeqScanState) ||
						IsA(planstate, IndexScanState) ||
						IsA(planstate, TidScanState) ||
						IsA(planstate, SubqueryScanState) ||
						IsA(planstate, FunctionScanState))
					{
						if (planstate->ps_ProjInfo == NULL)
							junk_filter_needed = true;
					}
				}
653 654 655 656 657 658 659
				break;
			case CMD_UPDATE:
			case CMD_DELETE:
				junk_filter_needed = true;
				break;
			default:
				break;
660 661
		}

662
		if (junk_filter_needed)
663
		{
664
			/*
B
Bruce Momjian 已提交
665 666 667 668
			 * If there are multiple result relations, each one needs its
			 * own junk filter.  Note this is only possible for
			 * UPDATE/DELETE, so we can't be fooled by some needing a
			 * filter and some not.
669 670 671
			 */
			if (parseTree->resultRelations != NIL)
			{
672 673
				PlanState **appendplans;
				int			as_nplans;
674
				ResultRelInfo *resultRelInfo;
675
				int			i;
676 677 678 679

				/* Top plan had better be an Append here. */
				Assert(IsA(plan, Append));
				Assert(((Append *) plan)->isTarget);
680 681 682 683
				Assert(IsA(planstate, AppendState));
				appendplans = ((AppendState *) planstate)->appendplans;
				as_nplans = ((AppendState *) planstate)->as_nplans;
				Assert(as_nplans == estate->es_num_result_relations);
684
				resultRelInfo = estate->es_result_relations;
685
				for (i = 0; i < as_nplans; i++)
686
				{
687
					PlanState  *subplan = appendplans[i];
688 689
					JunkFilter *j;

690
					j = ExecInitJunkFilter(subplan->plan->targetlist,
691
										   ExecGetTupType(subplan),
692
							  ExecAllocTableSlot(estate->es_tupleTable));
693 694 695
					resultRelInfo->ri_junkFilter = j;
					resultRelInfo++;
				}
B
Bruce Momjian 已提交
696

697 698 699 700 701 702 703 704 705 706
				/*
				 * Set active junkfilter too; at this point ExecInitAppend
				 * has already selected an active result relation...
				 */
				estate->es_junkFilter =
					estate->es_result_relation_info->ri_junkFilter;
			}
			else
			{
				/* Normal case with just one JunkFilter */
707
				JunkFilter *j;
708

709
				j = ExecInitJunkFilter(planstate->plan->targetlist,
710
									   tupType,
711
							  ExecAllocTableSlot(estate->es_tupleTable));
712 713 714
				estate->es_junkFilter = j;
				if (estate->es_result_relation_info)
					estate->es_result_relation_info->ri_junkFilter = j;
715

716 717 718 719
				/* For SELECT, want to return the cleaned tuple type */
				if (operation == CMD_SELECT)
					tupType = j->jf_cleanTupType;
			}
720 721 722 723
		}
		else
			estate->es_junkFilter = NULL;
	}
724

B
Bruce Momjian 已提交
725
	/*
726 727 728
	 * If doing SELECT INTO, initialize the "into" relation.  We must wait
	 * till now so we have the "clean" result tuple type to create the
	 * new table from.
729 730 731
	 */
	intoRelationDesc = (Relation) NULL;

732
	if (do_select_into)
733
	{
734 735 736 737 738
		char	   *intoName;
		Oid			namespaceId;
		AclResult	aclresult;
		Oid			intoRelationId;
		TupleDesc	tupdesc;
739

740 741 742 743 744
		/*
		 * find namespace to create in, check permissions
		 */
		intoName = parseTree->into->relname;
		namespaceId = RangeVarGetCreationNamespace(parseTree->into);
745

746 747 748 749
		aclresult = pg_namespace_aclcheck(namespaceId, GetUserId(),
										  ACL_CREATE);
		if (aclresult != ACLCHECK_OK)
			aclcheck_error(aclresult, get_namespace_name(namespaceId));
750

751 752 753 754
		/*
		 * have to copy tupType to get rid of constraints
		 */
		tupdesc = CreateTupleDescCopy(tupType);
755

756 757 758 759 760 761 762
		intoRelationId = heap_create_with_catalog(intoName,
												  namespaceId,
												  tupdesc,
												  RELKIND_RELATION,
												  false,
												  ONCOMMIT_NOOP,
												  allowSystemTableMods);
763

764
		FreeTupleDesc(tupdesc);
765

766 767 768 769 770
		/*
		 * Advance command counter so that the newly-created
		 * relation's catalog tuples will be visible to heap_open.
		 */
		CommandCounterIncrement();
771

772 773 774 775 776 777 778
		/*
		 * If necessary, create a TOAST table for the into
		 * relation. Note that AlterTableCreateToastTable ends
		 * with CommandCounterIncrement(), so that the TOAST table
		 * will be visible for insertion.
		 */
		AlterTableCreateToastTable(intoRelationId, true);
779

780 781 782 783
		/*
		 * And open the constructed table for writing.
		 */
		intoRelationDesc = heap_open(intoRelationId, AccessExclusiveLock);
784 785 786 787
	}

	estate->es_into_relation_descriptor = intoRelationDesc;

788 789
	queryDesc->tupDesc = tupType;
	queryDesc->planstate = planstate;
790 791
}

792 793 794 795 796 797 798 799 800 801 802 803 804 805 806 807 808 809 810 811 812 813 814 815 816 817 818 819 820 821 822 823 824 825 826 827 828 829
/*
 * initResultRelInfo
 *		Open one result relation with RowExclusiveLock and fill in the
 *		caller-supplied ResultRelInfo for it.
 *
 * Sequences, toast relations and views are rejected with an error.
 * Indexes of the relation are opened too, except for DELETE.
 */
static void
initResultRelInfo(ResultRelInfo *resultRelInfo,
				  Index resultRelationIndex,
				  List *rangeTable,
				  CmdType operation)
{
	Relation	rel;

	rel = heap_open(getrelid(resultRelationIndex, rangeTable),
					RowExclusiveLock);

	/* Refuse relation kinds that must not be the target of a change. */
	if (rel->rd_rel->relkind == RELKIND_SEQUENCE)
		elog(ERROR, "You can't change sequence relation %s",
			 RelationGetRelationName(rel));
	else if (rel->rd_rel->relkind == RELKIND_TOASTVALUE)
		elog(ERROR, "You can't change toast relation %s",
			 RelationGetRelationName(rel));
	else if (rel->rd_rel->relkind == RELKIND_VIEW)
		elog(ERROR, "You can't change view relation %s",
			 RelationGetRelationName(rel));

	/* Start from an all-zero struct, then fill in each field. */
	MemSet(resultRelInfo, 0, sizeof(ResultRelInfo));
	resultRelInfo->type = T_ResultRelInfo;
	resultRelInfo->ri_RangeTableIndex = resultRelationIndex;
	resultRelInfo->ri_RelationDesc = rel;

	/* no index information yet; ExecOpenIndices is called below if needed */
	resultRelInfo->ri_NumIndices = 0;
	resultRelInfo->ri_IndexRelationDescs = NULL;
	resultRelInfo->ri_IndexRelationInfo = NULL;

	/* make a copy so as not to depend on relcache info not changing... */
	resultRelInfo->ri_TrigDesc = CopyTriggerDesc(rel->trigdesc);
	resultRelInfo->ri_TrigFunctions = NULL;

	resultRelInfo->ri_ConstraintExprs = NULL;
	resultRelInfo->ri_junkFilter = NULL;

	/*
	 * When the result relation has indices, open them and keep their
	 * descriptors in the result relation info, so that new index entries
	 * can be added for the tuples we add/update.  A DELETE can skip this,
	 * since deletion doesn't affect indexes.
	 */
	if (operation != CMD_DELETE && rel->rd_rel->relhasindex)
		ExecOpenIndices(resultRelInfo);
}

847
/* ----------------------------------------------------------------
848
 *		ExecEndPlan
849
 *
850
 *		Cleans up the query plan -- closes files and frees up storage
851 852 853 854 855 856
 *
 * NOTE: we are no longer very worried about freeing storage per se
 * in this code; FreeExecutorState should be guaranteed to release all
 * memory that needs to be released.  What we are worried about doing
 * is closing relations and dropping buffer pins.  Thus, for example,
 * tuple tables must be cleared or dropped to ensure pins are released.
857 858
 * ----------------------------------------------------------------
 */
859 860
void
ExecEndPlan(PlanState *planstate, EState *estate)
861
{
862 863
	ResultRelInfo *resultRelInfo;
	int			i;
864
	List	   *l;
865

866 867 868 869 870 871
	/*
	 * shut down any PlanQual processing we were doing
	 */
	if (estate->es_evalPlanQual != NULL)
		EndEvalPlanQual(estate);

B
Bruce Momjian 已提交
872
	/*
873
	 * shut down the node-type-specific query processing
874
	 */
875
	ExecEndNode(planstate);
876

B
Bruce Momjian 已提交
877
	/*
B
Bruce Momjian 已提交
878
	 * destroy the executor "tuple" table.
879
	 */
880 881
	ExecDropTupleTable(estate->es_tupleTable, true);
	estate->es_tupleTable = NULL;
882

B
Bruce Momjian 已提交
883
	/*
B
Bruce Momjian 已提交
884
	 * close the result relation(s) if any, but hold locks until xact
885
	 * commit.
886
	 */
887 888
	resultRelInfo = estate->es_result_relations;
	for (i = estate->es_num_result_relations; i > 0; i--)
889
	{
890 891 892 893
		/* Close indices and then the relation itself */
		ExecCloseIndices(resultRelInfo);
		heap_close(resultRelInfo->ri_RelationDesc, NoLock);
		resultRelInfo++;
894 895
	}

B
Bruce Momjian 已提交
896
	/*
897
	 * close the "into" relation if necessary, again keeping lock
898
	 */
899 900
	if (estate->es_into_relation_descriptor != NULL)
		heap_close(estate->es_into_relation_descriptor, NoLock);
901 902 903 904 905 906 907 908 909 910

	/*
	 * close any relations selected FOR UPDATE, again keeping locks
	 */
	foreach(l, estate->es_rowMark)
	{
		execRowMark *erm = lfirst(l);

		heap_close(erm->relation, NoLock);
	}
911 912 913
}

/* ----------------------------------------------------------------
 *		ExecutePlan
 *
 *		processes the query plan to retrieve 'numberTuples' tuples in the
 *		direction specified.
 *
 *		Retrieves all tuples if numberTuples is 0
 *
 *		result is either a slot containing the last tuple in the case
 *		of a SELECT or NULL otherwise.
 *
 * Note: the ctid attribute is a 'junk' attribute that is removed before the
 * user can see it
 * ----------------------------------------------------------------
 */
static TupleTableSlot *
929
ExecutePlan(EState *estate,
930
			PlanState *planstate,
931
			CmdType operation,
932
			long numberTuples,
933
			ScanDirection direction,
934
			DestReceiver *destfunc)
935
{
936 937 938 939 940 941
	JunkFilter			*junkfilter;
	TupleTableSlot		*slot;
	ItemPointer			 tupleid = NULL;
	ItemPointerData		 tuple_ctid;
	long				 current_tuple_count;
	TupleTableSlot		*result;
942

B
Bruce Momjian 已提交
943
	/*
B
Bruce Momjian 已提交
944
	 * initialize local variables
945
	 */
946 947 948 949
	slot = NULL;
	current_tuple_count = 0;
	result = NULL;

B
Bruce Momjian 已提交
950 951
	/*
	 * Set the direction.
952
	 */
953 954
	estate->es_direction = direction;

955 956 957 958 959 960 961 962 963 964 965 966 967 968 969 970
	/*
	 * Process BEFORE EACH STATEMENT triggers
	 */
	switch (operation)
	{
		case CMD_UPDATE:
			ExecBSUpdateTriggers(estate, estate->es_result_relation_info);
			break;
		case CMD_DELETE:
			ExecBSDeleteTriggers(estate, estate->es_result_relation_info);
			break;
		case CMD_INSERT:
			ExecBSInsertTriggers(estate, estate->es_result_relation_info);
			break;
		default:
			/* do nothing */
971
			break;
972 973
	}

B
Bruce Momjian 已提交
974
	/*
B
Bruce Momjian 已提交
975
	 * Loop until we've processed the proper number of tuples from the
976
	 * plan.
977 978 979 980
	 */

	for (;;)
	{
981 982
		/* Reset the per-output-tuple exprcontext */
		ResetPerTupleExprContext(estate);
B
Bruce Momjian 已提交
983

B
Bruce Momjian 已提交
984
		/*
B
Bruce Momjian 已提交
985
		 * Execute the plan and obtain a tuple
986
		 */
B
Bruce Momjian 已提交
987
lnext:	;
988 989 990 991
		if (estate->es_useEvalPlan)
		{
			slot = EvalPlanQualNext(estate);
			if (TupIsNull(slot))
992
				slot = ExecProcNode(planstate);
993 994
		}
		else
995
			slot = ExecProcNode(planstate);
996

B
Bruce Momjian 已提交
997
		/*
B
Bruce Momjian 已提交
998 999
		 * if the tuple is null, then we assume there is nothing more to
		 * process so we just return null...
1000 1001 1002 1003 1004
		 */
		if (TupIsNull(slot))
		{
			result = NULL;
			break;
1005 1006
		}

B
Bruce Momjian 已提交
1007
		/*
B
Bruce Momjian 已提交
1008 1009
		 * if we have a junk filter, then project a new tuple with the
		 * junk removed.
1010
		 *
1011 1012 1013
		 * Store this new "clean" tuple in the junkfilter's resultSlot.
		 * (Formerly, we stored it back over the "dirty" tuple, which is
		 * WRONG because that tuple slot has the wrong descriptor.)
1014
		 *
B
Bruce Momjian 已提交
1015
		 * Also, extract all the junk information we need.
1016 1017 1018
		 */
		if ((junkfilter = estate->es_junkFilter) != (JunkFilter *) NULL)
		{
1019 1020 1021
			Datum		datum;
			HeapTuple	newTuple;
			bool		isNull;
1022

B
Bruce Momjian 已提交
1023
			/*
1024 1025 1026 1027 1028 1029 1030 1031 1032
			 * extract the 'ctid' junk attribute.
			 */
			if (operation == CMD_UPDATE || operation == CMD_DELETE)
			{
				if (!ExecGetJunkAttribute(junkfilter,
										  slot,
										  "ctid",
										  &datum,
										  &isNull))
1033
					elog(ERROR, "ExecutePlan: NO (junk) `ctid' was found!");
1034

1035
				/* shouldn't ever get a null result... */
1036
				if (isNull)
1037
					elog(ERROR, "ExecutePlan: (junk) `ctid' is NULL!");
1038 1039 1040 1041 1042 1043

				tupleid = (ItemPointer) DatumGetPointer(datum);
				tuple_ctid = *tupleid;	/* make sure we don't free the
										 * ctid!! */
				tupleid = &tuple_ctid;
			}
1044
			else if (estate->es_rowMark != NIL)
1045
			{
B
Bruce Momjian 已提交
1046
				List	   *l;
1047

B
Bruce Momjian 已提交
1048 1049
		lmark:	;
				foreach(l, estate->es_rowMark)
1050
				{
1051 1052 1053 1054 1055 1056
					execRowMark *erm = lfirst(l);
					Buffer		buffer;
					HeapTupleData tuple;
					TupleTableSlot *newSlot;
					int			test;

1057 1058 1059 1060 1061
					if (!ExecGetJunkAttribute(junkfilter,
											  slot,
											  erm->resname,
											  &datum,
											  &isNull))
1062 1063
						elog(ERROR, "ExecutePlan: NO (junk) `%s' was found!",
							 erm->resname);
1064

1065
					/* shouldn't ever get a null result... */
1066
					if (isNull)
1067 1068
						elog(ERROR, "ExecutePlan: (junk) `%s' is NULL!",
							 erm->resname);
1069 1070

					tuple.t_self = *((ItemPointer) DatumGetPointer(datum));
1071 1072
					test = heap_mark4update(erm->relation, &tuple, &buffer,
											estate->es_snapshot->curcid);
1073 1074 1075 1076
					ReleaseBuffer(buffer);
					switch (test)
					{
						case HeapTupleSelfUpdated:
1077 1078 1079
							/* treat it as deleted; do not process */
							goto lnext;

1080 1081 1082 1083 1084 1085
						case HeapTupleMayBeUpdated:
							break;

						case HeapTupleUpdated:
							if (XactIsoLevel == XACT_SERIALIZABLE)
								elog(ERROR, "Can't serialize access due to concurrent update");
1086
							if (!(ItemPointerEquals(&(tuple.t_self),
B
Bruce Momjian 已提交
1087
								  (ItemPointer) DatumGetPointer(datum))))
1088
							{
B
Bruce Momjian 已提交
1089
								newSlot = EvalPlanQual(estate, erm->rti, &(tuple.t_self));
1090 1091 1092 1093 1094 1095 1096
								if (!(TupIsNull(newSlot)))
								{
									slot = newSlot;
									estate->es_useEvalPlan = true;
									goto lmark;
								}
							}
B
Bruce Momjian 已提交
1097 1098 1099

							/*
							 * if tuple was deleted or PlanQual failed for
1100
							 * updated tuple - we must not return this
B
Bruce Momjian 已提交
1101
							 * tuple!
1102 1103
							 */
							goto lnext;
1104 1105 1106

						default:
							elog(ERROR, "Unknown status %u from heap_mark4update", test);
B
Bruce Momjian 已提交
1107
							return (NULL);
1108 1109 1110
					}
				}
			}
1111

B
Bruce Momjian 已提交
1112
			/*
1113 1114 1115 1116 1117 1118
			 * Finally create a new "clean" tuple with all junk attributes
			 * removed
			 */
			newTuple = ExecRemoveJunk(junkfilter, slot);

			slot = ExecStoreTuple(newTuple,		/* tuple to store */
1119
								  junkfilter->jf_resultSlot,	/* dest slot */
B
Bruce Momjian 已提交
1120 1121
								  InvalidBuffer,		/* this tuple has no
														 * buffer */
1122
								  true);		/* tuple should be pfreed */
1123
		}
1124

B
Bruce Momjian 已提交
1125
		/*
B
Bruce Momjian 已提交
1126 1127
		 * now that we have a tuple, do the appropriate thing with it..
		 * either return it to the user, add it to a relation someplace,
B
Bruce Momjian 已提交
1128
		 * delete it from a relation, or modify some of its attributes.
1129 1130 1131
		 */
		switch (operation)
		{
1132
			case CMD_SELECT:
B
Bruce Momjian 已提交
1133 1134 1135
				ExecSelect(slot,	/* slot containing tuple */
						   destfunc,	/* destination's tuple-receiver
										 * obj */
1136
						   estate);
1137 1138
				result = slot;
				break;
1139

1140
			case CMD_INSERT:
1141
				ExecInsert(slot, tupleid, estate);
1142 1143
				result = NULL;
				break;
1144

1145 1146 1147 1148
			case CMD_DELETE:
				ExecDelete(slot, tupleid, estate);
				result = NULL;
				break;
1149

1150
			case CMD_UPDATE:
1151
				ExecUpdate(slot, tupleid, estate);
1152 1153
				result = NULL;
				break;
1154

1155
			default:
1156
				elog(LOG, "ExecutePlan: unknown operation in queryDesc");
1157
				result = NULL;
1158
				break;
1159
		}
B
Bruce Momjian 已提交
1160

B
Bruce Momjian 已提交
1161
		/*
1162
		 * check our tuple count.. if we've processed the proper number
1163
		 * then quit, else loop again and process more tuples.  Zero
1164
		 * numberTuples means no limit.
1165
		 */
1166
		current_tuple_count++;
1167
		if (numberTuples && numberTuples == current_tuple_count)
1168
			break;
1169
	}
1170

1171 1172 1173 1174 1175 1176 1177 1178 1179 1180 1181 1182 1183 1184 1185 1186
	/*
	 * Process AFTER EACH STATEMENT triggers
	 */
	switch (operation)
	{
		case CMD_UPDATE:
			ExecASUpdateTriggers(estate, estate->es_result_relation_info);
			break;
		case CMD_DELETE:
			ExecASDeleteTriggers(estate, estate->es_result_relation_info);
			break;
		case CMD_INSERT:
			ExecASInsertTriggers(estate, estate->es_result_relation_info);
			break;
		default:
			/* do nothing */
1187
			break;
1188 1189
	}

B
Bruce Momjian 已提交
1190
	/*
B
Bruce Momjian 已提交
1191
	 * here, result is either a slot containing a tuple in the case of a
1192
	 * SELECT or NULL otherwise.
1193
	 */
1194
	return result;
1195 1196 1197
}

/* ----------------------------------------------------------------
1198
 *		ExecSelect
1199
 *
1200
 *		SELECTs are easy.. we just pass the tuple to the appropriate
1201
 *		print function.  The only complexity is when we do a
1202
 *		"SELECT INTO", in which case we insert the tuple into
1203 1204
 *		the appropriate relation (note: this is a newly created relation
 *		so we don't need to worry about indices or locks.)
1205 1206 1207
 * ----------------------------------------------------------------
 */
static void
1208 1209 1210
ExecSelect(TupleTableSlot *slot,
		   DestReceiver *destfunc,
		   EState *estate)
1211
{
1212 1213
	HeapTuple	tuple;
	TupleDesc	attrtype;
1214

B
Bruce Momjian 已提交
1215
	/*
B
Bruce Momjian 已提交
1216
	 * get the heap tuple out of the tuple table slot
1217 1218 1219 1220
	 */
	tuple = slot->val;
	attrtype = slot->ttc_tupleDescriptor;

B
Bruce Momjian 已提交
1221
	/*
B
Bruce Momjian 已提交
1222
	 * insert the tuple into the "into relation"
1223 1224 1225
	 */
	if (estate->es_into_relation_descriptor != NULL)
	{
1226 1227
		heap_insert(estate->es_into_relation_descriptor, tuple,
					estate->es_snapshot->curcid);
1228 1229 1230
		IncrAppended();
	}

B
Bruce Momjian 已提交
1231
	/*
B
Bruce Momjian 已提交
1232
	 * send the tuple to the front end (or the screen)
1233
	 */
1234
	(*destfunc->receiveTuple) (tuple, attrtype, destfunc);
1235 1236
	IncrRetrieved();
	(estate->es_processed)++;
1237 1238 1239
}

/* ----------------------------------------------------------------
1240
 *		ExecInsert
1241
 *
1242
 *		INSERTs are trickier.. we have to insert the tuple into
1243 1244
 *		the base relation and insert appropriate tuples into the
 *		index relations.
1245 1246 1247
 * ----------------------------------------------------------------
 */
static void
1248
ExecInsert(TupleTableSlot *slot,
1249
		   ItemPointer tupleid,
1250
		   EState *estate)
1251
{
1252
	HeapTuple	tuple;
1253
	ResultRelInfo *resultRelInfo;
1254 1255 1256
	Relation	resultRelationDesc;
	int			numIndices;
	Oid			newId;
1257

B
Bruce Momjian 已提交
1258
	/*
B
Bruce Momjian 已提交
1259
	 * get the heap tuple out of the tuple table slot
1260 1261 1262
	 */
	tuple = slot->val;

B
Bruce Momjian 已提交
1263
	/*
1264
	 * get information on the (current) result relation
1265
	 */
1266 1267
	resultRelInfo = estate->es_result_relation_info;
	resultRelationDesc = resultRelInfo->ri_RelationDesc;
1268 1269

	/* BEFORE ROW INSERT Triggers */
1270
	if (resultRelInfo->ri_TrigDesc &&
1271
		resultRelInfo->ri_TrigDesc->n_before_row[TRIGGER_EVENT_INSERT] > 0)
1272
	{
1273
		HeapTuple	newtuple;
1274

1275
		newtuple = ExecBRInsertTriggers(estate, resultRelInfo, tuple);
1276 1277 1278 1279 1280 1281

		if (newtuple == NULL)	/* "do nothing" */
			return;

		if (newtuple != tuple)	/* modified by Trigger(s) */
		{
1282 1283 1284
			/*
			 * Insert modified tuple into tuple table slot, replacing the
			 * original.  We assume that it was allocated in per-tuple
B
Bruce Momjian 已提交
1285 1286
			 * memory context, and therefore will go away by itself. The
			 * tuple table slot should not try to clear it.
1287 1288 1289
			 */
			ExecStoreTuple(newtuple, slot, InvalidBuffer, false);
			tuple = newtuple;
1290 1291 1292
		}
	}

B
Bruce Momjian 已提交
1293
	/*
1294
	 * Check the constraints of the tuple
1295 1296
	 */
	if (resultRelationDesc->rd_att->constr)
1297
		ExecConstraints("ExecInsert", resultRelInfo, slot, estate);
1298

B
Bruce Momjian 已提交
1299
	/*
B
Bruce Momjian 已提交
1300
	 * insert the tuple
1301
	 */
1302 1303
	newId = heap_insert(resultRelationDesc, tuple,
						estate->es_snapshot->curcid);
1304

1305
	IncrAppended();
1306 1307
	(estate->es_processed)++;
	estate->es_lastoid = newId;
T
Tom Lane 已提交
1308
	setLastTid(&(tuple->t_self));
1309

B
Bruce Momjian 已提交
1310
	/*
B
Bruce Momjian 已提交
1311
	 * process indices
1312
	 *
B
Bruce Momjian 已提交
1313 1314 1315
	 * Note: heap_insert adds a new tuple to a relation.  As a side effect,
	 * the tupleid of the new tuple is placed in the new tuple's t_ctid
	 * field.
1316
	 */
1317
	numIndices = resultRelInfo->ri_NumIndices;
1318
	if (numIndices > 0)
1319
		ExecInsertIndexTuples(slot, &(tuple->t_self), estate, false);
1320 1321

	/* AFTER ROW INSERT Triggers */
1322
	ExecARInsertTriggers(estate, resultRelInfo, tuple);
1323 1324 1325
}

/* ----------------------------------------------------------------
1326
 *		ExecDelete
1327
 *
1328
 *		DELETE is like UPDATE, we delete the tuple and its
1329
 *		index tuples.
1330 1331 1332
 * ----------------------------------------------------------------
 */
static void
1333
ExecDelete(TupleTableSlot *slot,
1334
		   ItemPointer tupleid,
1335
		   EState *estate)
1336
{
1337
	ResultRelInfo *resultRelInfo;
B
Bruce Momjian 已提交
1338 1339 1340
	Relation	resultRelationDesc;
	ItemPointerData ctid;
	int			result;
1341

B
Bruce Momjian 已提交
1342
	/*
1343
	 * get information on the (current) result relation
1344
	 */
1345 1346
	resultRelInfo = estate->es_result_relation_info;
	resultRelationDesc = resultRelInfo->ri_RelationDesc;
1347 1348

	/* BEFORE ROW DELETE Triggers */
1349
	if (resultRelInfo->ri_TrigDesc &&
1350
	  resultRelInfo->ri_TrigDesc->n_before_row[TRIGGER_EVENT_DELETE] > 0)
1351
	{
1352
		bool		dodelete;
1353

1354
		dodelete = ExecBRDeleteTriggers(estate, resultRelInfo, tupleid);
1355 1356 1357 1358 1359

		if (!dodelete)			/* "do nothing" */
			return;
	}

V
Vadim B. Mikheev 已提交
1360
	/*
B
Bruce Momjian 已提交
1361
	 * delete the tuple
1362
	 */
1363
ldelete:;
1364 1365 1366
	result = heap_delete(resultRelationDesc, tupleid,
						 &ctid,
						 estate->es_snapshot->curcid);
V
Vadim B. Mikheev 已提交
1367 1368 1369
	switch (result)
	{
		case HeapTupleSelfUpdated:
1370
			/* already deleted by self; nothing to do */
V
Vadim B. Mikheev 已提交
1371 1372 1373 1374 1375 1376
			return;

		case HeapTupleMayBeUpdated:
			break;

		case HeapTupleUpdated:
1377 1378
			if (XactIsoLevel == XACT_SERIALIZABLE)
				elog(ERROR, "Can't serialize access due to concurrent update");
1379 1380
			else if (!(ItemPointerEquals(tupleid, &ctid)))
			{
B
Bruce Momjian 已提交
1381
				TupleTableSlot *epqslot = EvalPlanQual(estate,
B
Bruce Momjian 已提交
1382
							   resultRelInfo->ri_RangeTableIndex, &ctid);
1383

V
Vadim B. Mikheev 已提交
1384
				if (!TupIsNull(epqslot))
1385 1386 1387 1388 1389
				{
					*tupleid = ctid;
					goto ldelete;
				}
			}
1390
			/* tuple already deleted; nothing to do */
V
Vadim B. Mikheev 已提交
1391 1392 1393 1394 1395 1396
			return;

		default:
			elog(ERROR, "Unknown status %u from heap_delete", result);
			return;
	}
1397 1398 1399 1400

	IncrDeleted();
	(estate->es_processed)++;

B
Bruce Momjian 已提交
1401
	/*
B
Bruce Momjian 已提交
1402 1403
	 * Note: Normally one would think that we have to delete index tuples
	 * associated with the heap tuple now..
1404
	 *
B
Bruce Momjian 已提交
1405 1406 1407
	 * ... but in POSTGRES, we have no need to do this because the vacuum
	 * daemon automatically opens an index scan and deletes index tuples
	 * when it finds deleted heap tuples. -cim 9/27/89
1408 1409 1410
	 */

	/* AFTER ROW DELETE Triggers */
1411
	ExecARDeleteTriggers(estate, resultRelInfo, tupleid);
1412 1413 1414
}

/* ----------------------------------------------------------------
1415
 *		ExecUpdate
1416
 *
1417 1418 1419 1420
 *		note: we can't run UPDATE queries with transactions
 *		off because UPDATEs are actually INSERTs and our
 *		scan will mistakenly loop forever, updating the tuple
 *		it just inserted..	This should be fixed but until it
1421 1422
 *		is, we don't want to get stuck in an infinite loop
 *		which corrupts your database..
1423 1424 1425
 * ----------------------------------------------------------------
 */
static void
1426
ExecUpdate(TupleTableSlot *slot,
B
Bruce Momjian 已提交
1427 1428
		   ItemPointer tupleid,
		   EState *estate)
1429
{
B
Bruce Momjian 已提交
1430
	HeapTuple	tuple;
1431
	ResultRelInfo *resultRelInfo;
B
Bruce Momjian 已提交
1432 1433 1434 1435
	Relation	resultRelationDesc;
	ItemPointerData ctid;
	int			result;
	int			numIndices;
1436

B
Bruce Momjian 已提交
1437
	/*
B
Bruce Momjian 已提交
1438
	 * abort the operation if not running transactions
1439 1440 1441
	 */
	if (IsBootstrapProcessingMode())
	{
1442
		elog(WARNING, "ExecUpdate: UPDATE can't run without transactions");
1443 1444 1445
		return;
	}

B
Bruce Momjian 已提交
1446
	/*
B
Bruce Momjian 已提交
1447
	 * get the heap tuple out of the tuple table slot
1448 1449 1450
	 */
	tuple = slot->val;

B
Bruce Momjian 已提交
1451
	/*
1452
	 * get information on the (current) result relation
1453
	 */
1454 1455
	resultRelInfo = estate->es_result_relation_info;
	resultRelationDesc = resultRelInfo->ri_RelationDesc;
1456 1457

	/* BEFORE ROW UPDATE Triggers */
1458
	if (resultRelInfo->ri_TrigDesc &&
1459
	  resultRelInfo->ri_TrigDesc->n_before_row[TRIGGER_EVENT_UPDATE] > 0)
1460
	{
1461
		HeapTuple	newtuple;
1462

1463 1464
		newtuple = ExecBRUpdateTriggers(estate, resultRelInfo,
										tupleid, tuple);
1465 1466 1467 1468 1469 1470

		if (newtuple == NULL)	/* "do nothing" */
			return;

		if (newtuple != tuple)	/* modified by Trigger(s) */
		{
1471 1472 1473
			/*
			 * Insert modified tuple into tuple table slot, replacing the
			 * original.  We assume that it was allocated in per-tuple
B
Bruce Momjian 已提交
1474 1475
			 * memory context, and therefore will go away by itself. The
			 * tuple table slot should not try to clear it.
1476 1477 1478
			 */
			ExecStoreTuple(newtuple, slot, InvalidBuffer, false);
			tuple = newtuple;
1479 1480 1481
		}
	}

B
Bruce Momjian 已提交
1482
	/*
1483
	 * Check the constraints of the tuple
1484
	 *
1485 1486 1487 1488 1489
	 * If we generate a new candidate tuple after EvalPlanQual testing, we
	 * must loop back here and recheck constraints.  (We don't need to
	 * redo triggers, however.	If there are any BEFORE triggers then
	 * trigger.c will have done mark4update to lock the correct tuple, so
	 * there's no need to do them again.)
1490
	 */
1491
lreplace:;
1492
	if (resultRelationDesc->rd_att->constr)
1493
		ExecConstraints("ExecUpdate", resultRelInfo, slot, estate);
1494

V
Vadim B. Mikheev 已提交
1495
	/*
B
Bruce Momjian 已提交
1496
	 * replace the heap tuple
1497
	 */
1498 1499 1500
	result = heap_update(resultRelationDesc, tupleid, tuple,
						 &ctid,
						 estate->es_snapshot->curcid);
V
Vadim B. Mikheev 已提交
1501 1502 1503
	switch (result)
	{
		case HeapTupleSelfUpdated:
1504
			/* already deleted by self; nothing to do */
V
Vadim B. Mikheev 已提交
1505 1506 1507 1508 1509 1510
			return;

		case HeapTupleMayBeUpdated:
			break;

		case HeapTupleUpdated:
1511 1512
			if (XactIsoLevel == XACT_SERIALIZABLE)
				elog(ERROR, "Can't serialize access due to concurrent update");
1513 1514
			else if (!(ItemPointerEquals(tupleid, &ctid)))
			{
B
Bruce Momjian 已提交
1515
				TupleTableSlot *epqslot = EvalPlanQual(estate,
B
Bruce Momjian 已提交
1516
							   resultRelInfo->ri_RangeTableIndex, &ctid);
1517

V
Vadim B. Mikheev 已提交
1518
				if (!TupIsNull(epqslot))
1519 1520
				{
					*tupleid = ctid;
V
Vadim B. Mikheev 已提交
1521
					tuple = ExecRemoveJunk(estate->es_junkFilter, epqslot);
1522
					slot = ExecStoreTuple(tuple,
1523
									estate->es_junkFilter->jf_resultSlot,
1524
										  InvalidBuffer, true);
1525 1526 1527
					goto lreplace;
				}
			}
1528
			/* tuple already deleted; nothing to do */
V
Vadim B. Mikheev 已提交
1529 1530 1531
			return;

		default:
1532
			elog(ERROR, "Unknown status %u from heap_update", result);
V
Vadim B. Mikheev 已提交
1533
			return;
1534 1535 1536 1537 1538
	}

	IncrReplaced();
	(estate->es_processed)++;

B
Bruce Momjian 已提交
1539
	/*
B
Bruce Momjian 已提交
1540
	 * Note: instead of having to update the old index tuples associated
B
Bruce Momjian 已提交
1541
	 * with the heap tuple, all we do is form and insert new index tuples.
1542
	 * This is because UPDATEs are actually DELETEs and INSERTs and index
B
Bruce Momjian 已提交
1543 1544
	 * tuple deletion is done automagically by the vacuum daemon. All we
	 * do is insert new index tuples.  -cim 9/27/89
1545 1546
	 */

B
Bruce Momjian 已提交
1547
	/*
B
Bruce Momjian 已提交
1548
	 * process indices
1549
	 *
1550
	 * heap_update updates a tuple in the base relation by invalidating it
1551
	 * and then inserting a new tuple to the relation.	As a side effect,
B
Bruce Momjian 已提交
1552 1553 1554
	 * the tupleid of the new tuple is placed in the new tuple's t_ctid
	 * field.  So we now insert index tuples using the new tupleid stored
	 * there.
1555 1556
	 */

1557
	numIndices = resultRelInfo->ri_NumIndices;
1558
	if (numIndices > 0)
1559
		ExecInsertIndexTuples(slot, &(tuple->t_self), estate, false);
1560 1561

	/* AFTER ROW UPDATE Triggers */
1562
	ExecARUpdateTriggers(estate, resultRelInfo, tupleid, tuple);
1563
}
V
Vadim B. Mikheev 已提交
1564

1565
static char *
1566 1567
ExecRelCheck(ResultRelInfo *resultRelInfo,
			 TupleTableSlot *slot, EState *estate)
V
Vadim B. Mikheev 已提交
1568
{
1569
	Relation	rel = resultRelInfo->ri_RelationDesc;
1570 1571
	int			ncheck = rel->rd_att->constr->num_check;
	ConstrCheck *check = rel->rd_att->constr->check;
1572
	ExprContext *econtext;
1573
	MemoryContext oldContext;
1574 1575
	List	   *qual;
	int			i;
1576

1577 1578 1579 1580 1581 1582 1583 1584 1585 1586 1587 1588 1589
	/*
	 * If first time through for this result relation, build expression
	 * nodetrees for rel's constraint expressions.  Keep them in the
	 * per-query memory context so they'll survive throughout the query.
	 */
	if (resultRelInfo->ri_ConstraintExprs == NULL)
	{
		oldContext = MemoryContextSwitchTo(estate->es_query_cxt);
		resultRelInfo->ri_ConstraintExprs =
			(List **) palloc(ncheck * sizeof(List *));
		for (i = 0; i < ncheck; i++)
		{
			qual = (List *) stringToNode(check[i].ccbin);
1590
			resultRelInfo->ri_ConstraintExprs[i] = (List *)
1591
				ExecPrepareExpr((Expr *) qual, estate);
1592 1593 1594 1595
		}
		MemoryContextSwitchTo(oldContext);
	}

1596
	/*
B
Bruce Momjian 已提交
1597 1598
	 * We will use the EState's per-tuple context for evaluating
	 * constraint expressions (creating it if it's not already there).
1599
	 */
1600
	econtext = GetPerTupleExprContext(estate);
1601

1602 1603 1604 1605
	/* Arrange for econtext's scan tuple to be the tuple under test */
	econtext->ecxt_scantuple = slot;

	/* And evaluate the constraints */
1606 1607
	for (i = 0; i < ncheck; i++)
	{
1608
		qual = resultRelInfo->ri_ConstraintExprs[i];
1609

1610 1611
		/*
		 * NOTE: SQL92 specifies that a NULL result from a constraint
1612 1613
		 * expression is not to be treated as a failure.  Therefore, tell
		 * ExecQual to return TRUE for NULL.
1614
		 */
1615
		if (!ExecQual(qual, econtext, true))
1616
			return check[i].ccname;
1617 1618
	}

1619
	/* NULL result means no error */
1620
	return (char *) NULL;
V
Vadim B. Mikheev 已提交
1621 1622
}

1623
void
1624
ExecConstraints(const char *caller, ResultRelInfo *resultRelInfo,
1625
				TupleTableSlot *slot, EState *estate)
V
Vadim B. Mikheev 已提交
1626
{
1627
	Relation	rel = resultRelInfo->ri_RelationDesc;
1628 1629 1630 1631
	HeapTuple	tuple = slot->val;
	TupleConstr *constr = rel->rd_att->constr;

	Assert(constr);
1632

1633
	if (constr->has_not_null)
V
Vadim B. Mikheev 已提交
1634
	{
1635
		int			natts = rel->rd_att->natts;
1636
		int			attrChk;
1637

1638
		for (attrChk = 1; attrChk <= natts; attrChk++)
1639
		{
B
Bruce Momjian 已提交
1640
			if (rel->rd_att->attrs[attrChk - 1]->attnotnull &&
1641
				heap_attisnull(tuple, attrChk))
1642
				elog(ERROR, "%s: Fail to add null value in not null attribute %s",
B
Bruce Momjian 已提交
1643
					 caller, NameStr(rel->rd_att->attrs[attrChk - 1]->attname));
1644 1645 1646
		}
	}

1647
	if (constr->num_check > 0)
1648
	{
1649
		char	   *failed;
1650

1651
		if ((failed = ExecRelCheck(resultRelInfo, slot, estate)) != NULL)
B
Bruce Momjian 已提交
1652 1653
			elog(ERROR, "%s: rejected due to CHECK constraint \"%s\" on \"%s\"",
				 caller, failed, RelationGetRelationName(rel));
1654
	}
V
Vadim B. Mikheev 已提交
1655
}
1656

1657 1658 1659 1660 1661 1662
/*
 * Check a modified tuple to see if we want to process its updated version
 * under READ COMMITTED rules.
 *
 * See backend/executor/README for some info about how this works.
 */
B
Bruce Momjian 已提交
1663
TupleTableSlot *
1664 1665
EvalPlanQual(EState *estate, Index rti, ItemPointer tid)
{
1666 1667
	evalPlanQual *epq;
	EState	   *epqstate;
B
Bruce Momjian 已提交
1668 1669
	Relation	relation;
	HeapTupleData tuple;
1670 1671
	HeapTuple	copyTuple = NULL;
	bool		endNode;
1672 1673 1674

	Assert(rti != 0);

1675 1676 1677 1678 1679 1680 1681 1682 1683 1684 1685 1686 1687 1688 1689 1690 1691 1692 1693 1694 1695 1696 1697 1698 1699 1700 1701 1702 1703 1704 1705 1706 1707
	/*
	 * find relation containing target tuple
	 */
	if (estate->es_result_relation_info != NULL &&
		estate->es_result_relation_info->ri_RangeTableIndex == rti)
		relation = estate->es_result_relation_info->ri_RelationDesc;
	else
	{
		List	   *l;

		relation = NULL;
		foreach(l, estate->es_rowMark)
		{
			if (((execRowMark *) lfirst(l))->rti == rti)
			{
				relation = ((execRowMark *) lfirst(l))->relation;
				break;
			}
		}
		if (relation == NULL)
			elog(ERROR, "EvalPlanQual: can't find RTE %d", (int) rti);
	}

	/*
	 * fetch tid tuple
	 *
	 * Loop here to deal with updated or busy tuples
	 */
	tuple.t_self = *tid;
	for (;;)
	{
		Buffer		buffer;

1708
		if (heap_fetch(relation, SnapshotDirty, &tuple, &buffer, false, NULL))
1709 1710 1711 1712 1713 1714 1715 1716 1717 1718 1719 1720 1721 1722 1723 1724 1725 1726 1727 1728 1729 1730 1731 1732 1733 1734 1735 1736 1737 1738 1739 1740 1741 1742 1743 1744 1745 1746 1747 1748 1749 1750 1751 1752 1753 1754 1755 1756 1757 1758 1759
		{
			TransactionId xwait = SnapshotDirty->xmax;

			if (TransactionIdIsValid(SnapshotDirty->xmin))
				elog(ERROR, "EvalPlanQual: t_xmin is uncommitted ?!");

			/*
			 * If tuple is being updated by other transaction then we have
			 * to wait for its commit/abort.
			 */
			if (TransactionIdIsValid(xwait))
			{
				ReleaseBuffer(buffer);
				XactLockTableWait(xwait);
				continue;
			}

			/*
			 * We got tuple - now copy it for use by recheck query.
			 */
			copyTuple = heap_copytuple(&tuple);
			ReleaseBuffer(buffer);
			break;
		}

		/*
		 * Oops! Invalid tuple. Have to check is it updated or deleted.
		 * Note that it's possible to get invalid SnapshotDirty->tid if
		 * tuple updated by this transaction. Have we to check this ?
		 */
		if (ItemPointerIsValid(&(SnapshotDirty->tid)) &&
			!(ItemPointerEquals(&(tuple.t_self), &(SnapshotDirty->tid))))
		{
			/* updated, so look at the updated copy */
			tuple.t_self = SnapshotDirty->tid;
			continue;
		}

		/*
		 * Deleted or updated by this transaction; forget it.
		 */
		return NULL;
	}

	/*
	 * For UPDATE/DELETE we have to return tid of actual row we're
	 * executing PQ for.
	 */
	*tid = tuple.t_self;

	/*
1760
	 * Need to run a recheck subquery.	Find or create a PQ stack entry.
1761
	 */
1762
	epq = estate->es_evalPlanQual;
1763 1764
	endNode = true;

1765 1766
	if (epq != NULL && epq->rti == 0)
	{
1767
		/* Top PQ stack entry is idle, so re-use it */
1768
		Assert(!(estate->es_useEvalPlan) && epq->next == NULL);
1769 1770 1771 1772 1773 1774
		epq->rti = rti;
		endNode = false;
	}

	/*
	 * If this is request for another RTE - Ra, - then we have to check
B
Bruce Momjian 已提交
1775 1776 1777
	 * wasn't PlanQual requested for Ra already and if so then Ra' row was
	 * updated again and we have to re-start old execution for Ra and
	 * forget all what we done after Ra was suspended. Cool? -:))
1778
	 */
B
Bruce Momjian 已提交
1779
	if (epq != NULL && epq->rti != rti &&
1780
		epq->estate->es_evTuple[rti - 1] != NULL)
1781 1782 1783
	{
		do
		{
1784 1785
			evalPlanQual *oldepq;

1786
			/* stop execution */
1787 1788 1789 1790
			EvalPlanQualStop(epq);
			/* pop previous PlanQual from the stack */
			oldepq = epq->next;
			Assert(oldepq && oldepq->rti != 0);
1791 1792 1793
			/* push current PQ to freePQ stack */
			oldepq->free = epq;
			epq = oldepq;
1794
			estate->es_evalPlanQual = epq;
1795 1796 1797
		} while (epq->rti != rti);
	}

B
Bruce Momjian 已提交
1798
	/*
1799 1800 1801 1802 1803 1804
	 * If we are requested for another RTE then we have to suspend
	 * execution of current PlanQual and start execution for new one.
	 */
	if (epq == NULL || epq->rti != rti)
	{
		/* try to reuse plan used previously */
B
Bruce Momjian 已提交
1805
		evalPlanQual *newepq = (epq != NULL) ? epq->free : NULL;
1806

1807
		if (newepq == NULL)		/* first call or freePQ stack is empty */
1808
		{
1809
			newepq = (evalPlanQual *) palloc0(sizeof(evalPlanQual));
1810
			newepq->free = NULL;
1811 1812
			newepq->estate = NULL;
			newepq->planstate = NULL;
1813 1814
		}
		else
1815
		{
1816 1817 1818
			/* recycle previously used PlanQual */
			Assert(newepq->estate == NULL);
			epq->free = NULL;
1819
		}
1820
		/* push current PQ to the stack */
1821
		newepq->next = epq;
1822
		epq = newepq;
1823
		estate->es_evalPlanQual = epq;
1824 1825 1826 1827
		epq->rti = rti;
		endNode = false;
	}

1828
	Assert(epq->rti == rti);
1829 1830

	/*
1831 1832
	 * Ok - we're requested for the same RTE.  Unfortunately we still have
	 * to end and restart execution of the plan, because ExecReScan
1833
	 * wouldn't ensure that upper plan nodes would reset themselves.  We
1834 1835 1836
	 * could make that work if insertion of the target tuple were
	 * integrated with the Param mechanism somehow, so that the upper plan
	 * nodes know that their children's outputs have changed.
1837 1838 1839 1840 1841
	 *
	 * Note that the stack of free evalPlanQual nodes is quite useless at
	 * the moment, since it only saves us from pallocing/releasing the
	 * evalPlanQual nodes themselves.  But it will be useful once we
	 * implement ReScan instead of end/restart for re-using PlanQual nodes.
1842 1843
	 */
	if (endNode)
1844
	{
1845
		/* stop execution */
1846
		EvalPlanQualStop(epq);
1847
	}
1848

1849 1850 1851 1852 1853 1854 1855 1856 1857 1858
	/*
	 * Initialize new recheck query.
	 *
	 * Note: if we were re-using PlanQual plans via ExecReScan, we'd need
	 * to instead copy down changeable state from the top plan (including
	 * es_result_relation_info, es_junkFilter) and reset locally changeable
	 * state in the epq (including es_param_exec_vals, es_evTupleNull).
	 */
	EvalPlanQualStart(epq, estate, epq->next);

1859
	/*
1860 1861
	 * free old RTE' tuple, if any, and store target tuple where
	 * relation's scan node will see it
1862
	 */
1863
	epqstate = epq->estate;
1864 1865 1866
	if (epqstate->es_evTuple[rti - 1] != NULL)
		heap_freetuple(epqstate->es_evTuple[rti - 1]);
	epqstate->es_evTuple[rti - 1] = copyTuple;
1867

1868
	return EvalPlanQualNext(estate);
1869 1870
}

B
Bruce Momjian 已提交
1871
static TupleTableSlot *
1872 1873
EvalPlanQualNext(EState *estate)
{
1874 1875
	evalPlanQual *epq = estate->es_evalPlanQual;
	MemoryContext oldcontext;
B
Bruce Momjian 已提交
1876
	TupleTableSlot *slot;
1877 1878 1879 1880

	Assert(epq->rti != 0);

lpqnext:;
1881
	oldcontext = MemoryContextSwitchTo(epq->estate->es_query_cxt);
1882
	slot = ExecProcNode(epq->planstate);
1883
	MemoryContextSwitchTo(oldcontext);
1884 1885 1886 1887 1888 1889

	/*
	 * No more tuples for this PQ. Continue previous one.
	 */
	if (TupIsNull(slot))
	{
1890 1891
		evalPlanQual *oldepq;

1892
		/* stop execution */
1893
		EvalPlanQualStop(epq);
1894
		/* pop old PQ from the stack */
1895 1896
		oldepq = epq->next;
		if (oldepq == NULL)
1897
		{
1898 1899 1900 1901 1902
			/* this is the first (oldest) PQ - mark as free */
			epq->rti = 0;
			estate->es_useEvalPlan = false;
			/* and continue Query execution */
			return (NULL);
1903 1904 1905 1906 1907
		}
		Assert(oldepq->rti != 0);
		/* push current PQ to freePQ stack */
		oldepq->free = epq;
		epq = oldepq;
1908
		estate->es_evalPlanQual = epq;
1909 1910 1911 1912 1913
		goto lpqnext;
	}

	return (slot);
}
1914 1915 1916 1917

/*
 * Shut down all PlanQual plans that are still active.
 *
 * Walks the stack from the current entry down to the oldest one, stopping
 * each plan and chaining the finished entry onto the older entry's free
 * link.  The oldest entry is finally marked free (rti = 0) and
 * es_useEvalPlan is cleared.
 */
static void
EndEvalPlanQual(EState *estate)
{
	evalPlanQual *cur = estate->es_evalPlanQual;

	/* rti == 0 means the plans have already been shut down */
	if (cur->rti == 0)
	{
		Assert(cur->next == NULL);
		return;
	}

	/* stop execution of the current (newest) PQ */
	EvalPlanQualStop(cur);

	while (cur->next != NULL)
	{
		evalPlanQual *older = cur->next;

		Assert(older->rti != 0);

		/* push the finished PQ onto the free stack, then pop to the older one */
		older->free = cur;
		cur = older;
		estate->es_evalPlanQual = cur;

		/* and stop that one as well */
		EvalPlanQualStop(cur);
	}

	/* cur is now the first (oldest) PQ: mark it as free */
	cur->rti = 0;
	estate->es_useEvalPlan = false;
}

/*
 * Begin execution of one PlanQual level.
 *
 * Acts as a reduced ExecutorStart(): a new executor state is created for
 * the recheck, but much of its content is copied from the top-level
 * estate instead of being built from scratch.
 *
 *	epq			stack entry to set up; receives the new estate and planstate
 *	estate		top-level executor state to copy shared state from
 *	priorepq	next-older stack entry, or NULL if epq is the first one
 */
static void
EvalPlanQualStart(evalPlanQual *epq, EState *estate, evalPlanQual *priorepq)
{
	int			nrels = length(estate->es_range_table);
	EState	   *child = CreateExecutorState();
	MemoryContext savedcxt;

	epq->estate = child;

	/* everything allocated below goes into the new estate's query context */
	savedcxt = MemoryContextSwitchTo(child->es_query_cxt);

	/*
	 * State that does not change during the recheck (snapshot, rangetable,
	 * result-rel info, external Param info, ...) is simply shared with the
	 * top query.  Local state such as the tuple table and
	 * es_param_exec_vals is private to this level.
	 */
	child->es_direction = ForwardScanDirection;
	child->es_snapshot = estate->es_snapshot;
	child->es_range_table = estate->es_range_table;
	child->es_result_relations = estate->es_result_relations;
	child->es_num_result_relations = estate->es_num_result_relations;
	child->es_result_relation_info = estate->es_result_relation_info;
	child->es_junkFilter = estate->es_junkFilter;
	child->es_into_relation_descriptor = estate->es_into_relation_descriptor;
	child->es_param_list_info = estate->es_param_list_info;

	/* private, zeroed exec-Param array, sized from the top plan */
	if (estate->es_topPlan->nParamExec > 0)
	{
		child->es_param_exec_vals = (ParamExecData *)
			palloc0(estate->es_topPlan->nParamExec * sizeof(ParamExecData));
	}

	child->es_rowMark = estate->es_rowMark;
	child->es_instrument = estate->es_instrument;
	child->es_force_oids = estate->es_force_oids;
	child->es_topPlan = estate->es_topPlan;

	/*
	 * es_evTupleNull is per-level, whereas the es_evTuple array is common
	 * to every entry on the stack, so that a sub-recheck sees the tuple an
	 * outer recheck is examining.
	 */
	child->es_evTupleNull = (bool *) palloc0(nrels * sizeof(bool));
	if (priorepq != NULL)
	{
		/* later stack entries reuse the storage of the prior entry */
		child->es_evTuple = priorepq->estate->es_evTuple;
	}
	else
	{
		/* first PQ stack entry: allocate the shared array */
		child->es_evTuple = (HeapTuple *)
			palloc0(nrels * sizeof(HeapTuple));
	}

	/* tuple table of the same size as the top query's */
	child->es_tupleTable =
		ExecCreateTupleTable(estate->es_tupleTable->size);

	/* initialize a fresh plan state tree for the top plan */
	epq->planstate = ExecInitNode(estate->es_topPlan, child);

	MemoryContextSwitchTo(savedcxt);
}

/*
 * Finish execution of one PlanQual level.
 *
 * Acts as a reduced ExecutorEnd(): most of the usual cleanup is done, but
 * the result relations are *not* closed, because they are only borrowed
 * from the outer query.
 *
 * On return, epq->estate and epq->planstate are both NULL.
 */
static void
EvalPlanQualStop(evalPlanQual *epq)
{
	EState	   *child = epq->estate;
	HeapTuple  *tupslot;
	MemoryContext savedcxt;

	savedcxt = MemoryContextSwitchTo(child->es_query_cxt);

	/* shut down the plan state tree */
	ExecEndNode(epq->planstate);

	/* release the tuple table belonging to this level */
	ExecDropTupleTable(child->es_tupleTable, true);
	child->es_tupleTable = NULL;

	/* free the tuple stored for this level's rti, if any, and clear the entry */
	tupslot = &child->es_evTuple[epq->rti - 1];
	if (*tupslot != NULL)
	{
		heap_freetuple(*tupslot);
		*tupslot = NULL;
	}

	MemoryContextSwitchTo(savedcxt);

	/* the estate is released only after switching back out of its context */
	FreeExecutorState(child);

	epq->estate = NULL;
	epq->planstate = NULL;
}