PostgreSQL Source Code git master
Loading...
Searching...
No Matches
prepjointree.c
Go to the documentation of this file.
1/*-------------------------------------------------------------------------
2 *
3 * prepjointree.c
4 * Planner preprocessing for subqueries and join tree manipulation.
5 *
6 * NOTE: the intended sequence for invoking these operations is
7 * preprocess_relation_rtes
8 * replace_empty_jointree
9 * pull_up_sublinks
10 * preprocess_function_rtes
11 * pull_up_subqueries
12 * flatten_simple_union_all
13 * do expression preprocessing (including flattening JOIN alias vars)
14 * reduce_outer_joins
15 * remove_useless_result_rtes
16 *
17 *
18 * Portions Copyright (c) 1996-2026, PostgreSQL Global Development Group
19 * Portions Copyright (c) 1994, Regents of the University of California
20 *
21 *
22 * IDENTIFICATION
23 * src/backend/optimizer/prep/prepjointree.c
24 *
25 *-------------------------------------------------------------------------
26 */
27#include "postgres.h"
28
29#include "access/table.h"
30#include "catalog/pg_type.h"
31#include "funcapi.h"
32#include "miscadmin.h"
33#include "nodes/makefuncs.h"
35#include "nodes/nodeFuncs.h"
36#include "optimizer/clauses.h"
37#include "optimizer/optimizer.h"
39#include "optimizer/plancat.h"
40#include "optimizer/prep.h"
41#include "optimizer/subselect.h"
42#include "optimizer/tlist.h"
44#include "parser/parsetree.h"
47#include "utils/rel.h"
48
49
50typedef struct nullingrel_info
51{
52 /*
53 * For each leaf RTE, nullingrels[rti] is the set of relids of outer joins
54 * that potentially null that RTE.
55 */
57 /* Length of range table (maximum index in nullingrels[]) */
58 int rtlength; /* used only for assertion checks */
60
61/* Options for wrapping an expression for identification purposes */
63{
64 REPLACE_WRAP_NONE, /* no expressions need to be wrapped */
65 REPLACE_WRAP_ALL, /* all expressions need to be wrapped */
66 REPLACE_WRAP_VARFREE, /* variable-free expressions need to be
67 * wrapped */
69
71{
73 List *targetlist; /* tlist of subquery being pulled up */
74 RangeTblEntry *target_rte; /* RTE of subquery */
75 int result_relation; /* the index of the result relation in the
76 * rewritten query */
77 Relids relids; /* relids within subquery, as numbered after
78 * pullup (set only if target_rte->lateral) */
79 nullingrel_info *nullinfo; /* per-RTE nullingrel info (set only if
80 * target_rte->lateral) */
81 bool *outer_hasSubLinks; /* -> outer query's hasSubLinks */
82 int varno; /* varno of subquery */
83 ReplaceWrapOption wrap_option; /* do we need certain outputs to be PHVs? */
84 Node **rv_cache; /* cache for results with PHVs */
86
88{
89 Relids relids; /* base relids within this subtree */
90 bool contains_outer; /* does subtree contain outer join(s)? */
91 Relids nullable_rels; /* base relids that are nullable within this
92 * subtree */
93 List *sub_states; /* List of states for subtree components */
95
97{
98 Relids inner_reduced; /* OJ relids reduced to plain inner joins */
99 List *partial_reduced; /* List of partially reduced FULL joins */
101
103{
104 int full_join_rti; /* RT index of a formerly-FULL join */
105 Relids unreduced_side; /* relids in its still-nullable side */
107
109 RangeTblEntry *rte, int rt_index,
110 Relation relation);
112 Relids *relids);
127 int childRToffset);
128static void make_setop_translation_list(Query *query, int newvarno,
130static bool is_simple_subquery(PlannerInfo *root, Query *subquery,
139static bool is_simple_union_all(Query *subquery);
141 List *colTypes);
142static bool is_safe_append_member(Query *subquery);
144 Node *jtnode, bool restricted,
149static void replace_vars_in_jointree(Node *jtnode,
151static Node *pullup_replace_vars(Node *expr,
153static Node *pullup_replace_vars_callback(const Var *var,
158static void reduce_outer_joins_pass2(Node *jtnode,
162 Relids nonnullable_rels,
165 int rtindex, Relids relids);
171static int get_result_relid(PlannerInfo *root, Node *jtnode);
172static void remove_result_refs(PlannerInfo *root, int varno, Node *newjtloc);
173static bool find_dependent_phvs(PlannerInfo *root, int varno);
175 Node *node, int varno);
176static void substitute_phv_relids(Node *node,
177 int varno, Relids subrelids);
178static void fix_append_rel_relids(PlannerInfo *root, int varno,
179 Relids subrelids);
180static Node *find_jointree_node_for_rel(Node *jtnode, int relid);
183 nullingrel_info *info);
184
185
186/*
187 * transform_MERGE_to_join
188 * Replace a MERGE's jointree to also include the target relation.
189 */
190void
192{
196 JoinType jointype;
197 int joinrti;
198 List *vars;
200 FromExpr *target;
201 Node *source;
202 int sourcerti;
203
204 if (parse->commandType != CMD_MERGE)
205 return;
206
207 /* XXX probably bogus */
208 vars = NIL;
209
210 /*
211 * Work out what kind of join is required. If there any WHEN NOT MATCHED
212 * BY SOURCE/TARGET actions, an outer join is required so that we process
213 * all unmatched tuples from the source and/or target relations.
214 * Otherwise, we can use an inner join.
215 */
219
220 foreach_node(MergeAction, action, parse->mergeActionList)
221 {
222 if (action->commandType != CMD_NOTHING)
223 have_action[action->matchKind] = true;
224 }
225
228 jointype = JOIN_FULL;
230 jointype = JOIN_LEFT;
232 jointype = JOIN_RIGHT;
233 else
234 jointype = JOIN_INNER;
235
236 /* Manufacture a join RTE to use. */
238 joinrte->rtekind = RTE_JOIN;
239 joinrte->jointype = jointype;
240 joinrte->joinmergedcols = 0;
241 joinrte->joinaliasvars = vars;
242 joinrte->joinleftcols = NIL; /* MERGE does not allow JOIN USING */
243 joinrte->joinrightcols = NIL; /* ditto */
244 joinrte->join_using_alias = NULL;
245
246 joinrte->alias = NULL;
247 joinrte->eref = makeAlias("*MERGE*", NIL);
248 joinrte->lateral = false;
249 joinrte->inh = false;
250 joinrte->inFromCl = true;
251
252 /*
253 * Add completed RTE to pstate's range table list, so that we know its
254 * index.
255 */
256 parse->rtable = lappend(parse->rtable, joinrte);
257 joinrti = list_length(parse->rtable);
258
259 /*
260 * Create a JOIN between the target and the source relation.
261 *
262 * Here the target is identified by parse->mergeTargetRelation. For a
263 * regular table, this will equal parse->resultRelation, but for a
264 * trigger-updatable view, it will be the expanded view subquery that we
265 * need to pull data from.
266 *
267 * The source relation is in parse->jointree->fromlist, but any quals in
268 * parse->jointree->quals are restrictions on the target relation (if the
269 * target relation is an auto-updatable view).
270 */
271 /* target rel, with any quals */
273 rtr->rtindex = parse->mergeTargetRelation;
274 target = makeFromExpr(list_make1(rtr), parse->jointree->quals);
275
276 /* source rel (expect exactly one -- see transformMergeStmt()) */
277 Assert(list_length(parse->jointree->fromlist) == 1);
278 source = linitial(parse->jointree->fromlist);
279
280 /*
281 * index of source rel (expect either a RangeTblRef or a JoinExpr -- see
282 * transformFromClauseItem()).
283 */
284 if (IsA(source, RangeTblRef))
285 sourcerti = ((RangeTblRef *) source)->rtindex;
286 else if (IsA(source, JoinExpr))
287 sourcerti = ((JoinExpr *) source)->rtindex;
288 else
289 {
290 elog(ERROR, "unrecognized source node type: %d",
291 (int) nodeTag(source));
292 sourcerti = 0; /* keep compiler quiet */
293 }
294
295 /* Join the source and target */
297 joinexpr->jointype = jointype;
298 joinexpr->isNatural = false;
299 joinexpr->larg = (Node *) target;
300 joinexpr->rarg = source;
301 joinexpr->usingClause = NIL;
302 joinexpr->join_using_alias = NULL;
303 joinexpr->quals = parse->mergeJoinCondition;
304 joinexpr->alias = NULL;
305 joinexpr->rtindex = joinrti;
306
307 /* Make the new join be the sole entry in the query's jointree */
308 parse->jointree->fromlist = list_make1(joinexpr);
309 parse->jointree->quals = NULL;
310
311 /*
312 * If necessary, mark parse->targetlist entries that refer to the target
313 * as nullable by the join. Normally the targetlist will be empty for a
314 * MERGE, but if the target is a trigger-updatable view, it will contain a
315 * whole-row Var referring to the expanded view query.
316 */
317 if (parse->targetList != NIL &&
318 (jointype == JOIN_RIGHT || jointype == JOIN_FULL))
319 parse->targetList = (List *)
320 add_nulling_relids((Node *) parse->targetList,
321 bms_make_singleton(parse->mergeTargetRelation),
323
324 /*
325 * If the source relation is on the outer side of the join, mark any
326 * source relation Vars in the join condition, actions, and RETURNING list
327 * as nullable by the join. These Vars will be added to the targetlist by
328 * preprocess_targetlist(), so it's important to mark them correctly here.
329 *
330 * It might seem that this is not necessary for Vars in the join
331 * condition, since it is inside the join, but it is also needed above the
332 * join (in the ModifyTable node) to distinguish between the MATCHED and
333 * NOT MATCHED BY SOURCE cases -- see ExecMergeMatched(). Note that this
334 * creates a modified copy of the join condition, for use above the join,
335 * without modifying the original join condition, inside the join.
336 */
337 if (jointype == JOIN_LEFT || jointype == JOIN_FULL)
338 {
339 parse->mergeJoinCondition =
340 add_nulling_relids(parse->mergeJoinCondition,
343
344 foreach_node(MergeAction, action, parse->mergeActionList)
345 {
346 action->qual =
347 add_nulling_relids(action->qual,
350
351 action->targetList = (List *)
352 add_nulling_relids((Node *) action->targetList,
355 }
356
357 parse->returningList = (List *)
358 add_nulling_relids((Node *) parse->returningList,
361 }
362
363 /*
364 * If there are any WHEN NOT MATCHED BY SOURCE actions, the executor will
365 * use the join condition to distinguish between MATCHED and NOT MATCHED
366 * BY SOURCE cases. Otherwise, it's no longer needed, and we set it to
367 * NULL, saving cycles during planning and execution.
368 *
369 * We need to be careful though: the executor evaluates this condition
370 * using the output of the join subplan node, which nulls the output from
371 * the source relation when the join condition doesn't match. That risks
372 * producing incorrect results when rechecking using a "non-strict" join
373 * condition, such as "src.col IS NOT DISTINCT FROM tgt.col". To guard
374 * against that, we add an additional "src IS NOT NULL" check to the join
375 * condition, so that it does the right thing when performing a recheck
376 * based on the output of the join subplan.
377 */
379 {
380 Var *var;
382
383 /* source wholerow Var (nullable by the new join) */
384 var = makeWholeRowVar(rt_fetch(sourcerti, parse->rtable),
385 sourcerti, 0, false);
386 var->varnullingrels = bms_make_singleton(joinrti);
387
388 /* "src IS NOT NULL" check */
390 ntest->arg = (Expr *) var;
391 ntest->nulltesttype = IS_NOT_NULL;
392 ntest->argisrow = false;
393 ntest->location = -1;
394
395 /* combine it with the original join condition */
396 parse->mergeJoinCondition =
397 (Node *) make_and_qual((Node *) ntest, parse->mergeJoinCondition);
398 }
399 else
400 parse->mergeJoinCondition = NULL; /* join condition not needed */
401}
402
403/*
404 * preprocess_relation_rtes
405 * Do the preprocessing work for any relation RTEs in the FROM clause.
406 *
407 * This scans the rangetable for relation RTEs and retrieves the necessary
408 * catalog information for each relation. Using this information, it clears
409 * the inh flag for any relation that has no children, collects not-null
410 * attribute numbers for any relation that has column not-null constraints, and
411 * expands virtual generated columns for any relation that contains them.
412 *
413 * Note that expanding virtual generated columns may cause the query tree to
414 * have new copies of rangetable entries. Therefore, we have to use list_nth
415 * instead of foreach when iterating over the query's rangetable.
416 *
417 * Returns a modified copy of the query tree, if any relations with virtual
418 * generated columns are present.
419 */
420Query *
422{
423 Query *parse = root->parse;
424 int rtable_size;
425 int rt_index;
426
427 rtable_size = list_length(parse->rtable);
428
429 for (rt_index = 0; rt_index < rtable_size; rt_index++)
430 {
431 RangeTblEntry *rte = rt_fetch(rt_index + 1, parse->rtable);
432 Relation relation;
433
434 /* We only care about relation RTEs. */
435 if (rte->rtekind != RTE_RELATION)
436 continue;
437
438 /*
439 * We need not lock the relation since it was already locked by the
440 * rewriter.
441 */
442 relation = table_open(rte->relid, NoLock);
443
444 /*
445 * Check to see if the relation actually has any children; if not,
446 * clear the inh flag so we can treat it as a plain base relation.
447 *
448 * Note: this could give a false-positive result, if the rel once had
449 * children but no longer does. We used to be able to clear rte->inh
450 * later on when we discovered that, but no more; we have to handle
451 * such cases as full-fledged inheritance.
452 */
453 if (rte->inh)
454 rte->inh = relation->rd_rel->relhassubclass;
455
456 /*
457 * Check to see if the relation has any column not-null constraints;
458 * if so, retrieve the constraint information and store it in a
459 * relation OID based hash table.
460 */
462
463 /*
464 * Check to see if the relation has any virtual generated columns; if
465 * so, replace all Var nodes in the query that reference these columns
466 * with the generation expressions.
467 */
469 rte, rt_index + 1,
470 relation);
471
472 table_close(relation, NoLock);
473 }
474
475 return parse;
476}
477
478/*
479 * expand_virtual_generated_columns
480 * Expand virtual generated columns for the given relation.
481 *
482 * This checks whether the given relation has any virtual generated columns,
483 * and if so, replaces all Var nodes in the query that reference those columns
484 * with their generation expressions.
485 *
486 * Returns a modified copy of the query tree if the relation contains virtual
487 * generated columns.
488 */
489static Query *
491 RangeTblEntry *rte, int rt_index,
492 Relation relation)
493{
494 TupleDesc tupdesc;
495
496 /* Only normal relations can have virtual generated columns */
497 Assert(rte->rtekind == RTE_RELATION);
498
499 tupdesc = RelationGetDescr(relation);
500 if (tupdesc->constr && tupdesc->constr->has_generated_virtual)
501 {
502 List *tlist = NIL;
504
505 for (int i = 0; i < tupdesc->natts; i++)
506 {
507 Form_pg_attribute attr = TupleDescAttr(tupdesc, i);
509
510 if (attr->attgenerated == ATTRIBUTE_GENERATED_VIRTUAL)
511 {
512 Node *defexpr;
513
514 defexpr = build_generation_expression(relation, i + 1);
515 ChangeVarNodes(defexpr, 1, rt_index, 0);
516
517 tle = makeTargetEntry((Expr *) defexpr, i + 1, 0, false);
518 tlist = lappend(tlist, tle);
519 }
520 else
521 {
522 Var *var;
523
524 var = makeVar(rt_index,
525 i + 1,
526 attr->atttypid,
527 attr->atttypmod,
528 attr->attcollation,
529 0);
530
531 tle = makeTargetEntry((Expr *) var, i + 1, 0, false);
532 tlist = lappend(tlist, tle);
533 }
534 }
535
536 Assert(list_length(tlist) > 0);
537 Assert(!rte->lateral);
538
539 /*
540 * The relation's targetlist items are now in the appropriate form to
541 * insert into the query, except that we may need to wrap them in
542 * PlaceHolderVars. Set up required context data for
543 * pullup_replace_vars.
544 */
545 rvcontext.root = root;
546 rvcontext.targetlist = tlist;
547 rvcontext.target_rte = rte;
548 rvcontext.result_relation = parse->resultRelation;
549 /* won't need these values */
550 rvcontext.relids = NULL;
551 rvcontext.nullinfo = NULL;
552 /* pass NULL for outer_hasSubLinks */
553 rvcontext.outer_hasSubLinks = NULL;
554 rvcontext.varno = rt_index;
555 /* this flag will be set below, if needed */
556 rvcontext.wrap_option = REPLACE_WRAP_NONE;
557 /* initialize cache array with indexes 0 .. length(tlist) */
558 rvcontext.rv_cache = palloc0((list_length(tlist) + 1) *
559 sizeof(Node *));
560
561 /*
562 * If the query uses grouping sets, we need a PlaceHolderVar for each
563 * expression of the relation's targetlist items. (See comments in
564 * pull_up_simple_subquery().)
565 */
566 if (parse->groupingSets)
567 rvcontext.wrap_option = REPLACE_WRAP_ALL;
568
569 /*
570 * Apply pullup variable replacement throughout the query tree.
571 */
573 }
574
575 return parse;
576}
577
578/*
579 * replace_empty_jointree
580 * If the Query's jointree is empty, replace it with a dummy RTE_RESULT
581 * relation.
582 *
583 * By doing this, we can avoid a bunch of corner cases that formerly existed
584 * for SELECTs with omitted FROM clauses. An example is that a subquery
585 * with empty jointree previously could not be pulled up, because that would
586 * have resulted in an empty relid set, making the subquery not uniquely
587 * identifiable for join or PlaceHolderVar processing.
588 *
589 * Unlike most other functions in this file, this function doesn't recurse;
590 * we rely on other processing to invoke it on sub-queries at suitable times.
591 */
592void
594{
596 Index rti;
598
599 /* Nothing to do if jointree is already nonempty */
600 if (parse->jointree->fromlist != NIL)
601 return;
602
603 /* We mustn't change it in the top level of a setop tree, either */
604 if (parse->setOperations)
605 return;
606
607 /* Create suitable RTE */
609 rte->rtekind = RTE_RESULT;
610 rte->eref = makeAlias("*RESULT*", NIL);
611
612 /* Add it to rangetable */
613 parse->rtable = lappend(parse->rtable, rte);
614 rti = list_length(parse->rtable);
615
616 /* And jam a reference into the jointree */
618 rtr->rtindex = rti;
619 parse->jointree->fromlist = list_make1(rtr);
620}
621
622/*
623 * pull_up_sublinks
624 * Attempt to pull up ANY and EXISTS SubLinks to be treated as
625 * semijoins or anti-semijoins.
626 *
627 * A clause "foo op ANY (sub-SELECT)" can be processed by pulling the
628 * sub-SELECT up to become a rangetable entry and treating the implied
629 * comparisons as quals of a semijoin. However, this optimization *only*
630 * works at the top level of WHERE or a JOIN/ON clause, because we cannot
631 * distinguish whether the ANY ought to return FALSE or NULL in cases
632 * involving NULL inputs. Also, in an outer join's ON clause we can only
633 * do this if the sublink is degenerate (ie, references only the nullable
634 * side of the join). In that case it is legal to push the semijoin
635 * down into the nullable side of the join. If the sublink references any
636 * nonnullable-side variables then it would have to be evaluated as part
637 * of the outer join, which makes things way too complicated.
638 *
639 * Under similar conditions, EXISTS and NOT EXISTS clauses can be handled
640 * by pulling up the sub-SELECT and creating a semijoin or anti-semijoin.
641 *
642 * This routine searches for such clauses and does the necessary parsetree
643 * transformations if any are found.
644 *
645 * This routine has to run before preprocess_expression(), so the quals
646 * clauses are not yet reduced to implicit-AND format, and are not guaranteed
647 * to be AND/OR-flat either. That means we need to recursively search through
648 * explicit AND clauses. We stop as soon as we hit a non-AND item.
649 */
650void
652{
653 Node *jtnode;
654 Relids relids;
655
656 /* Begin recursion through the jointree */
658 (Node *) root->parse->jointree,
659 &relids);
660
661 /*
662 * root->parse->jointree must always be a FromExpr, so insert a dummy one
663 * if we got a bare RangeTblRef or JoinExpr out of the recursion.
664 */
665 if (IsA(jtnode, FromExpr))
666 root->parse->jointree = (FromExpr *) jtnode;
667 else
668 root->parse->jointree = makeFromExpr(list_make1(jtnode), NULL);
669}
670
671/*
672 * Recurse through jointree nodes for pull_up_sublinks()
673 *
674 * In addition to returning the possibly-modified jointree node, we return
675 * a relids set of the contained rels into *relids.
676 */
677static Node *
679 Relids *relids)
680{
681 /* Since this function recurses, it could be driven to stack overflow. */
683
684 if (jtnode == NULL)
685 {
686 *relids = NULL;
687 }
688 else if (IsA(jtnode, RangeTblRef))
689 {
690 int varno = ((RangeTblRef *) jtnode)->rtindex;
691
692 *relids = bms_make_singleton(varno);
693 /* jtnode is returned unmodified */
694 }
695 else if (IsA(jtnode, FromExpr))
696 {
697 FromExpr *f = (FromExpr *) jtnode;
700 FromExpr *newf;
701 Node *jtlink;
702 ListCell *l;
703
704 /* First, recurse to process children and collect their relids */
705 foreach(l, f->fromlist)
706 {
707 Node *newchild;
709
711 lfirst(l),
712 &childrelids);
715 }
716 /* Build the replacement FromExpr; no quals yet */
718 /* Set up a link representing the rebuilt jointree */
719 jtlink = (Node *) newf;
720 /* Now process qual --- all children are available for use */
722 &jtlink, frelids,
723 NULL, NULL);
724
725 /*
726 * Note that the result will be either newf, or a stack of JoinExprs
727 * with newf at the base. We rely on subsequent optimization steps to
728 * flatten this and rearrange the joins as needed.
729 *
730 * Although we could include the pulled-up subqueries in the returned
731 * relids, there's no need since upper quals couldn't refer to their
732 * outputs anyway.
733 */
734 *relids = frelids;
735 jtnode = jtlink;
736 }
737 else if (IsA(jtnode, JoinExpr))
738 {
739 JoinExpr *j;
742 Node *jtlink;
743
744 /*
745 * Make a modifiable copy of join node, but don't bother copying its
746 * subnodes (yet).
747 */
749 memcpy(j, jtnode, sizeof(JoinExpr));
750 jtlink = (Node *) j;
751
752 /* Recurse to process children and collect their relids */
754 &leftrelids);
756 &rightrelids);
757
758 /*
759 * Now process qual, showing appropriate child relids as available,
760 * and attach any pulled-up jointree items at the right place. In the
761 * inner-join case we put new JoinExprs above the existing one (much
762 * as for a FromExpr-style join). In outer-join cases the new
763 * JoinExprs must go into the nullable side of the outer join. The
764 * point of the available_rels machinations is to ensure that we only
765 * pull up quals for which that's okay.
766 *
767 * We don't expect to see any pre-existing JOIN_SEMI, JOIN_ANTI,
768 * JOIN_RIGHT_SEMI, or JOIN_RIGHT_ANTI jointypes here.
769 */
770 switch (j->jointype)
771 {
772 case JOIN_INNER:
773 j->quals = pull_up_sublinks_qual_recurse(root, j->quals,
774 &jtlink,
777 NULL, NULL);
778 break;
779 case JOIN_LEFT:
780 j->quals = pull_up_sublinks_qual_recurse(root, j->quals,
781 &j->rarg,
783 NULL, NULL);
784 break;
785 case JOIN_FULL:
786 /* can't do anything with full-join quals */
787 break;
788 case JOIN_RIGHT:
789 j->quals = pull_up_sublinks_qual_recurse(root, j->quals,
790 &j->larg,
792 NULL, NULL);
793 break;
794 default:
795 elog(ERROR, "unrecognized join type: %d",
796 (int) j->jointype);
797 break;
798 }
799
800 /*
801 * Although we could include the pulled-up subqueries in the returned
802 * relids, there's no need since upper quals couldn't refer to their
803 * outputs anyway. But we *do* need to include the join's own rtindex
804 * because we haven't yet collapsed join alias variables, so upper
805 * levels would mistakenly think they couldn't use references to this
806 * join.
807 */
808 *relids = bms_join(leftrelids, rightrelids);
809 if (j->rtindex)
810 *relids = bms_add_member(*relids, j->rtindex);
811 jtnode = jtlink;
812 }
813 else
814 elog(ERROR, "unrecognized node type: %d",
815 (int) nodeTag(jtnode));
816 return jtnode;
817}
818
819/*
820 * Recurse through top-level qual nodes for pull_up_sublinks()
821 *
822 * jtlink1 points to the link in the jointree where any new JoinExprs should
823 * be inserted if they reference available_rels1 (i.e., available_rels1
824 * denotes the relations present underneath jtlink1). Optionally, jtlink2 can
825 * point to a second link where new JoinExprs should be inserted if they
826 * reference available_rels2 (pass NULL for both those arguments if not used).
827 * Note that SubLinks referencing both sets of variables cannot be optimized.
828 * If we find multiple pull-up-able SubLinks, they'll get stacked onto jtlink1
829 * and/or jtlink2 in the order we encounter them. We rely on subsequent
830 * optimization to rearrange the stack if appropriate.
831 *
832 * Returns the replacement qual node, or NULL if the qual should be removed.
833 */
834static Node *
838{
839 if (node == NULL)
840 return NULL;
841 if (IsA(node, SubLink))
842 {
843 SubLink *sublink = (SubLink *) node;
844 JoinExpr *j;
846
847 /* Is it a convertible ANY or EXISTS clause? */
848 if (sublink->subLinkType == ANY_SUBLINK)
849 {
850 ScalarArrayOpExpr *saop;
851
852 if ((saop = convert_VALUES_to_ANY(root,
853 sublink->testexpr,
854 (Query *) sublink->subselect)) != NULL)
855 {
856 /*
857 * The VALUES sequence was simplified. Nothing more to do
858 * here.
859 */
860 return (Node *) saop;
861 }
862
865 {
866 /* Yes; insert the new join node into the join tree */
867 j->larg = *jtlink1;
868 *jtlink1 = (Node *) j;
869 /* Recursively process pulled-up jointree nodes */
871 j->rarg,
872 &child_rels);
873
874 /*
875 * Now recursively process the pulled-up quals. Any inserted
876 * joins can get stacked onto either j->larg or j->rarg,
877 * depending on which rels they reference.
878 */
880 j->quals,
881 &j->larg,
883 &j->rarg,
884 child_rels);
885 /* Return NULL representing constant TRUE */
886 return NULL;
887 }
888 if (available_rels2 != NULL &&
891 {
892 /* Yes; insert the new join node into the join tree */
893 j->larg = *jtlink2;
894 *jtlink2 = (Node *) j;
895 /* Recursively process pulled-up jointree nodes */
897 j->rarg,
898 &child_rels);
899
900 /*
901 * Now recursively process the pulled-up quals. Any inserted
902 * joins can get stacked onto either j->larg or j->rarg,
903 * depending on which rels they reference.
904 */
906 j->quals,
907 &j->larg,
909 &j->rarg,
910 child_rels);
911 /* Return NULL representing constant TRUE */
912 return NULL;
913 }
914 }
915 else if (sublink->subLinkType == EXISTS_SUBLINK)
916 {
919 {
920 /* Yes; insert the new join node into the join tree */
921 j->larg = *jtlink1;
922 *jtlink1 = (Node *) j;
923 /* Recursively process pulled-up jointree nodes */
925 j->rarg,
926 &child_rels);
927
928 /*
929 * Now recursively process the pulled-up quals. Any inserted
930 * joins can get stacked onto either j->larg or j->rarg,
931 * depending on which rels they reference.
932 */
934 j->quals,
935 &j->larg,
937 &j->rarg,
938 child_rels);
939 /* Return NULL representing constant TRUE */
940 return NULL;
941 }
942 if (available_rels2 != NULL &&
945 {
946 /* Yes; insert the new join node into the join tree */
947 j->larg = *jtlink2;
948 *jtlink2 = (Node *) j;
949 /* Recursively process pulled-up jointree nodes */
951 j->rarg,
952 &child_rels);
953
954 /*
955 * Now recursively process the pulled-up quals. Any inserted
956 * joins can get stacked onto either j->larg or j->rarg,
957 * depending on which rels they reference.
958 */
960 j->quals,
961 &j->larg,
963 &j->rarg,
964 child_rels);
965 /* Return NULL representing constant TRUE */
966 return NULL;
967 }
968 }
969 /* Else return it unmodified */
970 return node;
971 }
972 if (is_notclause(node))
973 {
974 /* If the immediate argument of NOT is ANY or EXISTS, try to convert */
976 JoinExpr *j;
978
979 if (sublink && IsA(sublink, SubLink))
980 {
981 if (sublink->subLinkType == ANY_SUBLINK)
982 {
985 {
986 /* Yes; insert the new join node into the join tree */
987 j->larg = *jtlink1;
988 *jtlink1 = (Node *) j;
989 /* Recursively process pulled-up jointree nodes */
991 j->rarg,
992 &child_rels);
993
994 /*
995 * Now recursively process the pulled-up quals. Because
996 * we are underneath a NOT, we can't pull up sublinks that
997 * reference the left-hand stuff, but it's still okay to
998 * pull up sublinks referencing j->rarg.
999 */
1001 j->quals,
1002 &j->rarg,
1003 child_rels,
1004 NULL, NULL);
1005 /* Return NULL representing constant TRUE */
1006 return NULL;
1007 }
1008 if (available_rels2 != NULL &&
1010 available_rels2)) != NULL)
1011 {
1012 /* Yes; insert the new join node into the join tree */
1013 j->larg = *jtlink2;
1014 *jtlink2 = (Node *) j;
1015 /* Recursively process pulled-up jointree nodes */
1017 j->rarg,
1018 &child_rels);
1019
1020 /*
1021 * Now recursively process the pulled-up quals. Because
1022 * we are underneath a NOT, we can't pull up sublinks that
1023 * reference the left-hand stuff, but it's still okay to
1024 * pull up sublinks referencing j->rarg.
1025 */
1027 j->quals,
1028 &j->rarg,
1029 child_rels,
1030 NULL, NULL);
1031 /* Return NULL representing constant TRUE */
1032 return NULL;
1033 }
1034 }
1035 else if (sublink->subLinkType == EXISTS_SUBLINK)
1036 {
1038 available_rels1)) != NULL)
1039 {
1040 /* Yes; insert the new join node into the join tree */
1041 j->larg = *jtlink1;
1042 *jtlink1 = (Node *) j;
1043 /* Recursively process pulled-up jointree nodes */
1045 j->rarg,
1046 &child_rels);
1047
1048 /*
1049 * Now recursively process the pulled-up quals. Because
1050 * we are underneath a NOT, we can't pull up sublinks that
1051 * reference the left-hand stuff, but it's still okay to
1052 * pull up sublinks referencing j->rarg.
1053 */
1055 j->quals,
1056 &j->rarg,
1057 child_rels,
1058 NULL, NULL);
1059 /* Return NULL representing constant TRUE */
1060 return NULL;
1061 }
1062 if (available_rels2 != NULL &&
1064 available_rels2)) != NULL)
1065 {
1066 /* Yes; insert the new join node into the join tree */
1067 j->larg = *jtlink2;
1068 *jtlink2 = (Node *) j;
1069 /* Recursively process pulled-up jointree nodes */
1071 j->rarg,
1072 &child_rels);
1073
1074 /*
1075 * Now recursively process the pulled-up quals. Because
1076 * we are underneath a NOT, we can't pull up sublinks that
1077 * reference the left-hand stuff, but it's still okay to
1078 * pull up sublinks referencing j->rarg.
1079 */
1081 j->quals,
1082 &j->rarg,
1083 child_rels,
1084 NULL, NULL);
1085 /* Return NULL representing constant TRUE */
1086 return NULL;
1087 }
1088 }
1089 }
1090 /* Else return it unmodified */
1091 return node;
1092 }
1093 if (is_andclause(node))
1094 {
1095 /* Recurse into AND clause */
1096 List *newclauses = NIL;
1097 ListCell *l;
1098
1099 foreach(l, ((BoolExpr *) node)->args)
1100 {
1101 Node *oldclause = (Node *) lfirst(l);
1102 Node *newclause;
1103
1105 oldclause,
1106 jtlink1,
1108 jtlink2,
1110 if (newclause)
1112 }
1113 /* We might have got back fewer clauses than we started with */
1114 if (newclauses == NIL)
1115 return NULL;
1116 else if (list_length(newclauses) == 1)
1117 return (Node *) linitial(newclauses);
1118 else
1119 return (Node *) make_andclause(newclauses);
1120 }
1121 /* Stop if not an AND */
1122 return node;
1123}
1124
1125/*
1126 * preprocess_function_rtes
1127 * Constant-simplify any FUNCTION RTEs in the FROM clause, and then
1128 * attempt to "inline" any that can be converted to simple subqueries.
1129 *
1130 * If an RTE_FUNCTION rtable entry invokes a set-returning SQL function that
1131 * contains just a simple SELECT, we can convert the rtable entry to an
1132 * RTE_SUBQUERY entry exposing the SELECT directly. Other sorts of functions
1133 * are also inline-able if they have a support function that can generate
1134 * the replacement sub-Query. This is especially useful if the subquery can
1135 * then be "pulled up" for further optimization, but we do it even if not,
1136 * to reduce executor overhead.
1137 *
1138 * This has to be done before we have started to do any optimization of
1139 * subqueries, else any such steps wouldn't get applied to subqueries
1140 * obtained via inlining. However, we do it after pull_up_sublinks
1141 * so that we can inline any functions used in SubLink subselects.
1142 *
1143 * The reason for applying const-simplification at this stage is that
1144 * (a) we'd need to do it anyway to inline a SRF, and (b) by doing it now,
1145 * we can be sure that pull_up_constant_function() will see constants
1146 * if there are constants to be seen. This approach also guarantees
1147 * that every FUNCTION RTE has been const-simplified, allowing planner.c's
1148 * preprocess_expression() to skip doing it again.
1149 *
1150 * Like most of the planner, this feels free to scribble on its input data
1151 * structure.
1152 */
1153void
1155{
1156 ListCell *rt;
1157
1158 foreach(rt, root->parse->rtable)
1159 {
1161
1162 if (rte->rtekind == RTE_FUNCTION)
1163 {
1165
1166 /* Apply const-simplification */
1167 rte->functions = (List *)
1168 eval_const_expressions(root, (Node *) rte->functions);
1169
1170 /* Check safety of expansion, and expand if possible */
1172 if (funcquery)
1173 {
1174 /* Successful expansion, convert the RTE to a subquery */
1175 rte->rtekind = RTE_SUBQUERY;
1176 rte->subquery = funcquery;
1177 rte->security_barrier = false;
1178
1179 /*
1180 * Clear fields that should not be set in a subquery RTE.
1181 * However, we leave rte->functions filled in for the moment,
1182 * in case makeWholeRowVar needs to consult it. We'll clear
1183 * it in setrefs.c (see add_rte_to_flat_rtable) so that this
1184 * abuse of the data structure doesn't escape the planner.
1185 */
1186 rte->funcordinality = false;
1187 }
1188 }
1189 }
1190}
1191
1192/*
1193 * pull_up_subqueries
1194 * Look for subqueries in the rangetable that can be pulled up into
1195 * the parent query. If the subquery has no special features like
1196 * grouping/aggregation then we can merge it into the parent's jointree.
1197 * Also, subqueries that are simple UNION ALL structures can be
1198 * converted into "append relations".
1199 */
1200void
1202{
1203 /* Top level of jointree must always be a FromExpr */
1204 Assert(IsA(root->parse->jointree, FromExpr));
1205 /* Recursion starts with no containing join nor appendrel */
1206 root->parse->jointree = (FromExpr *)
1207 pull_up_subqueries_recurse(root, (Node *) root->parse->jointree,
1208 NULL, NULL);
1209 /* We should still have a FromExpr */
1210 Assert(IsA(root->parse->jointree, FromExpr));
1211}
1212
1213/*
1214 * pull_up_subqueries_recurse
1215 * Recursive guts of pull_up_subqueries.
1216 *
1217 * This recursively processes the jointree and returns a modified jointree.
1218 *
1219 * If this jointree node is within either side of an outer join, then
1220 * lowest_outer_join references the lowest such JoinExpr node; otherwise
1221 * it is NULL. We use this to constrain the effects of LATERAL subqueries.
1222 *
1223 * If we are looking at a member subquery of an append relation,
1224 * containing_appendrel describes that relation; else it is NULL.
1225 * This forces use of the PlaceHolderVar mechanism for all non-Var targetlist
1226 * items, and puts some additional restrictions on what can be pulled up.
1227 *
1228 * A tricky aspect of this code is that if we pull up a subquery we have
1229 * to replace Vars that reference the subquery's outputs throughout the
1230 * parent query, including quals attached to jointree nodes above the one
1231 * we are currently processing! We handle this by being careful to maintain
1232 * validity of the jointree structure while recursing, in the following sense:
1233 * whenever we recurse, all qual expressions in the tree must be reachable
1234 * from the top level, in case the recursive call needs to modify them.
1235 *
1236 * Notice also that we can't turn pullup_replace_vars loose on the whole
1237 * jointree, because it'd return a mutated copy of the tree; we have to
1238 * invoke it just on the quals, instead. This behavior is what makes it
1239 * reasonable to pass lowest_outer_join as a pointer rather than some
1240 * more-indirect way of identifying the lowest OJ. Likewise, we don't
1241 * replace append_rel_list members but only their substructure, so the
1242 * containing_appendrel reference is safe to use.
1243 */
1244static Node *
1248{
1249 /* Since this function recurses, it could be driven to stack overflow. */
1251 /* Also, since it's a bit expensive, let's check for query cancel. */
1253
1254 Assert(jtnode != NULL);
1255 if (IsA(jtnode, RangeTblRef))
1256 {
1257 int varno = ((RangeTblRef *) jtnode)->rtindex;
1258 RangeTblEntry *rte = rt_fetch(varno, root->parse->rtable);
1259
1260 /*
1261 * Is this a subquery RTE, and if so, is the subquery simple enough to
1262 * pull up?
1263 *
1264 * If we are looking at an append-relation member, we can't pull it up
1265 * unless is_safe_append_member says so.
1266 */
1267 if (rte->rtekind == RTE_SUBQUERY &&
1270 is_safe_append_member(rte->subquery)))
1271 return pull_up_simple_subquery(root, jtnode, rte,
1274
1275 /*
1276 * Alternatively, is it a simple UNION ALL subquery? If so, flatten
1277 * into an "append relation".
1278 *
1279 * It's safe to do this regardless of whether this query is itself an
1280 * appendrel member. (If you're thinking we should try to flatten the
1281 * two levels of appendrel together, you're right; but we handle that
1282 * in set_append_rel_pathlist, not here.)
1283 */
1284 if (rte->rtekind == RTE_SUBQUERY &&
1285 is_simple_union_all(rte->subquery))
1286 return pull_up_simple_union_all(root, jtnode, rte);
1287
1288 /*
1289 * Or perhaps it's a simple VALUES RTE?
1290 *
1291 * We don't allow VALUES pullup below an outer join nor into an
1292 * appendrel (such cases are impossible anyway at the moment).
1293 */
1294 if (rte->rtekind == RTE_VALUES &&
1298 return pull_up_simple_values(root, jtnode, rte);
1299
1300 /*
1301 * Or perhaps it's a FUNCTION RTE that we could inline?
1302 */
1303 if (rte->rtekind == RTE_FUNCTION)
1304 return pull_up_constant_function(root, jtnode, rte,
1306
1307 /* Otherwise, do nothing at this node. */
1308 }
1309 else if (IsA(jtnode, FromExpr))
1310 {
1311 FromExpr *f = (FromExpr *) jtnode;
1312 ListCell *l;
1313
1315 /* Recursively transform all the child nodes */
1316 foreach(l, f->fromlist)
1317 {
1320 NULL);
1321 }
1322 }
1323 else if (IsA(jtnode, JoinExpr))
1324 {
1325 JoinExpr *j = (JoinExpr *) jtnode;
1326
1328 /* Recurse, being careful to tell myself when inside outer join */
1329 switch (j->jointype)
1330 {
1331 case JOIN_INNER:
1332 j->larg = pull_up_subqueries_recurse(root, j->larg,
1334 NULL);
1335 j->rarg = pull_up_subqueries_recurse(root, j->rarg,
1337 NULL);
1338 break;
1339 case JOIN_LEFT:
1340 case JOIN_SEMI:
1341 case JOIN_ANTI:
1342 j->larg = pull_up_subqueries_recurse(root, j->larg,
1343 j,
1344 NULL);
1345 j->rarg = pull_up_subqueries_recurse(root, j->rarg,
1346 j,
1347 NULL);
1348 break;
1349 case JOIN_FULL:
1350 j->larg = pull_up_subqueries_recurse(root, j->larg,
1351 j,
1352 NULL);
1353 j->rarg = pull_up_subqueries_recurse(root, j->rarg,
1354 j,
1355 NULL);
1356 break;
1357 case JOIN_RIGHT:
1358 j->larg = pull_up_subqueries_recurse(root, j->larg,
1359 j,
1360 NULL);
1361 j->rarg = pull_up_subqueries_recurse(root, j->rarg,
1362 j,
1363 NULL);
1364 break;
1365 default:
1366 elog(ERROR, "unrecognized join type: %d",
1367 (int) j->jointype);
1368 break;
1369 }
1370 }
1371 else
1372 elog(ERROR, "unrecognized node type: %d",
1373 (int) nodeTag(jtnode));
1374 return jtnode;
1375}
1376
1377/*
1378 * pull_up_simple_subquery
1379 * Attempt to pull up a single simple subquery.
1380 *
1381 * jtnode is a RangeTblRef that has been tentatively identified as a simple
1382 * subquery by pull_up_subqueries. We return the replacement jointree node,
1383 * or jtnode itself if we determine that the subquery can't be pulled up
1384 * after all.
1385 *
1386 * rte is the RangeTblEntry referenced by jtnode. Remaining parameters are
1387 * as for pull_up_subqueries_recurse.
1388 */
1389static Node *
1393{
1394 Query *parse = root->parse;
1395 int varno = ((RangeTblRef *) jtnode)->rtindex;
1396 Query *subquery;
1397 PlannerInfo *subroot;
1398 int rtoffset;
1400 ListCell *lc;
1401
1402 /*
1403 * Make a modifiable copy of the subquery to hack on, so that the RTE will
1404 * be left unchanged in case we decide below that we can't pull it up
1405 * after all.
1406 */
1407 subquery = copyObject(rte->subquery);
1408
1409 /*
1410 * Create a PlannerInfo data structure for this subquery.
1411 *
1412 * NOTE: the next few steps should match the first processing in
1413 * subquery_planner(). Can we refactor to avoid code duplication, or
1414 * would that just make things uglier?
1415 */
1416 subroot = makeNode(PlannerInfo);
1417 subroot->parse = subquery;
1418 subroot->glob = root->glob;
1419 subroot->query_level = root->query_level;
1420 subroot->plan_name = root->plan_name;
1421 subroot->alternative_plan_name = root->alternative_plan_name;
1422 subroot->parent_root = root->parent_root;
1423 subroot->plan_params = NIL;
1424 subroot->outer_params = NULL;
1425 subroot->planner_cxt = CurrentMemoryContext;
1426 subroot->init_plans = NIL;
1427 subroot->cte_plan_ids = NIL;
1428 subroot->multiexpr_params = NIL;
1429 subroot->join_domains = NIL;
1430 subroot->eq_classes = NIL;
1431 subroot->ec_merging_done = false;
1432 subroot->last_rinfo_serial = 0;
1433 subroot->all_result_relids = NULL;
1434 subroot->leaf_result_relids = NULL;
1435 subroot->append_rel_list = NIL;
1436 subroot->row_identity_vars = NIL;
1437 subroot->rowMarks = NIL;
1438 memset(subroot->upper_rels, 0, sizeof(subroot->upper_rels));
1439 memset(subroot->upper_targets, 0, sizeof(subroot->upper_targets));
1440 subroot->processed_groupClause = NIL;
1441 subroot->processed_distinctClause = NIL;
1442 subroot->processed_tlist = NIL;
1443 subroot->update_colnos = NIL;
1444 subroot->grouping_map = NULL;
1445 subroot->minmax_aggs = NIL;
1446 subroot->qual_security_level = 0;
1447 subroot->placeholdersFrozen = false;
1448 subroot->hasRecursion = false;
1449 subroot->assumeReplanning = false;
1450 subroot->wt_param_id = -1;
1451 subroot->non_recursive_path = NULL;
1452 /* We don't currently need a top JoinDomain for the subroot */
1453
1454 /* No CTEs to worry about */
1455 Assert(subquery->cteList == NIL);
1456
1457 /*
1458 * Scan the rangetable for relation RTEs and retrieve the necessary
1459 * catalog information for each relation. Using this information, clear
1460 * the inh flag for any relation that has no children, collect not-null
1461 * attribute numbers for any relation that has column not-null
1462 * constraints, and expand virtual generated columns for any relation that
1463 * contains them.
1464 */
1465 subquery = subroot->parse = preprocess_relation_rtes(subroot);
1466
1467 /*
1468 * If the FROM clause is empty, replace it with a dummy RTE_RESULT RTE, so
1469 * that we don't need so many special cases to deal with that situation.
1470 */
1471 replace_empty_jointree(subquery);
1472
1473 /*
1474 * Pull up any SubLinks within the subquery's quals, so that we don't
1475 * leave unoptimized SubLinks behind.
1476 */
1477 if (subquery->hasSubLinks)
1478 pull_up_sublinks(subroot);
1479
1480 /*
1481 * Similarly, preprocess its function RTEs to inline any set-returning
1482 * functions in its rangetable.
1483 */
1484 preprocess_function_rtes(subroot);
1485
1486 /*
1487 * Recursively pull up the subquery's subqueries, so that
1488 * pull_up_subqueries' processing is complete for its jointree and
1489 * rangetable.
1490 *
1491 * Note: it's okay that the subquery's recursion starts with NULL for
1492 * containing-join info, even if we are within an outer join in the upper
1493 * query; the lower query starts with a clean slate for outer-join
1494 * semantics. Likewise, we needn't pass down appendrel state.
1495 */
1496 pull_up_subqueries(subroot);
1497
1498 /*
1499 * Now we must recheck whether the subquery is still simple enough to pull
1500 * up. If not, abandon processing it.
1501 *
1502 * We don't really need to recheck all the conditions involved, but it's
1503 * easier just to keep this "if" looking the same as the one in
1504 * pull_up_subqueries_recurse.
1505 */
1506 if (is_simple_subquery(root, subquery, rte, lowest_outer_join) &&
1508 {
1509 /* good to go */
1510 }
1511 else
1512 {
1513 /*
1514 * Give up, return unmodified RangeTblRef.
1515 *
1516 * Note: The work we just did will be redone when the subquery gets
1517 * planned on its own. Perhaps we could avoid that by storing the
1518 * modified subquery back into the rangetable, but I'm not gonna risk
1519 * it now.
1520 */
1521 return jtnode;
1522 }
1523
1524 /*
1525 * We must flatten any join alias Vars in the subquery's targetlist,
1526 * because pulling up the subquery's subqueries might have changed their
1527 * expansions into arbitrary expressions, which could affect
1528 * pullup_replace_vars' decisions about whether PlaceHolderVar wrappers
1529 * are needed for tlist entries. (Likely it'd be better to do
1530 * flatten_join_alias_vars on the whole query tree at some earlier stage,
1531 * maybe even in the rewriter; but for now let's just fix this case here.)
1532 */
1533 subquery->targetList = (List *)
1534 flatten_join_alias_vars(subroot, subroot->parse,
1535 (Node *) subquery->targetList);
1536
1537 /*
1538 * Adjust level-0 varnos in subquery so that we can append its rangetable
1539 * to upper query's. We have to fix the subquery's append_rel_list as
1540 * well.
1541 */
1542 rtoffset = list_length(parse->rtable);
1543 OffsetVarNodes((Node *) subquery, rtoffset, 0);
1544 OffsetVarNodes((Node *) subroot->append_rel_list, rtoffset, 0);
1545
1546 /*
1547 * Upper-level vars in subquery are now one level closer to their parent
1548 * than before.
1549 */
1550 IncrementVarSublevelsUp((Node *) subquery, -1, 1);
1551 IncrementVarSublevelsUp((Node *) subroot->append_rel_list, -1, 1);
1552
1553 /*
1554 * The subquery's targetlist items are now in the appropriate form to
1555 * insert into the top query, except that we may need to wrap them in
1556 * PlaceHolderVars. Set up required context data for pullup_replace_vars.
1557 * (Note that we should include the subquery's inner joins in relids,
1558 * since it may include join alias vars referencing them.)
1559 */
1560 rvcontext.root = root;
1561 rvcontext.targetlist = subquery->targetList;
1562 rvcontext.target_rte = rte;
1563 rvcontext.result_relation = 0;
1564 if (rte->lateral)
1565 {
1566 rvcontext.relids = get_relids_in_jointree((Node *) subquery->jointree,
1567 true, true);
1568 rvcontext.nullinfo = get_nullingrels(parse);
1569 }
1570 else /* won't need these values */
1571 {
1572 rvcontext.relids = NULL;
1573 rvcontext.nullinfo = NULL;
1574 }
1575 rvcontext.outer_hasSubLinks = &parse->hasSubLinks;
1576 rvcontext.varno = varno;
1577 /* this flag will be set below, if needed */
1578 rvcontext.wrap_option = REPLACE_WRAP_NONE;
1579 /* initialize cache array with indexes 0 .. length(tlist) */
1580 rvcontext.rv_cache = palloc0((list_length(subquery->targetList) + 1) *
1581 sizeof(Node *));
1582
1583 /*
1584 * If the parent query uses grouping sets, we need a PlaceHolderVar for
1585 * each expression of the subquery's targetlist items. This ensures that
1586 * expressions retain their separate identity so that they will match
1587 * grouping set columns when appropriate. (It'd be sufficient to wrap
1588 * values used in grouping set columns, and do so only in non-aggregated
1589 * portions of the tlist and havingQual, but that would require a lot of
1590 * infrastructure that pullup_replace_vars hasn't currently got.)
1591 */
1592 if (parse->groupingSets)
1593 rvcontext.wrap_option = REPLACE_WRAP_ALL;
1594
1595 /*
1596 * Replace all of the top query's references to the subquery's outputs
1597 * with copies of the adjusted subtlist items, being careful not to
1598 * replace any of the jointree structure.
1599 */
1602
1603 /*
1604 * If the subquery had a LATERAL marker, propagate that to any of its
1605 * child RTEs that could possibly now contain lateral cross-references.
1606 * The children might or might not contain any actual lateral
1607 * cross-references, but we have to mark the pulled-up child RTEs so that
1608 * later planner stages will check for such.
1609 */
1610 if (rte->lateral)
1611 {
1612 foreach(lc, subquery->rtable)
1613 {
1615
1616 switch (child_rte->rtekind)
1617 {
1618 case RTE_RELATION:
1619 if (child_rte->tablesample)
1620 child_rte->lateral = true;
1621 break;
1622 case RTE_SUBQUERY:
1623 case RTE_FUNCTION:
1624 case RTE_VALUES:
1625 case RTE_TABLEFUNC:
1626 child_rte->lateral = true;
1627 break;
1628 case RTE_JOIN:
1629 case RTE_CTE:
1631 case RTE_RESULT:
1632 case RTE_GROUP:
1633 /* these can't contain any lateral references */
1634 break;
1635 case RTE_GRAPH_TABLE:
1636 /* shouldn't happen here */
1637 Assert(false);
1638 break;
1639 }
1640 }
1641 }
1642
1643 /*
1644 * Now append the adjusted rtable entries and their perminfos to upper
1645 * query. (We hold off until after fixing the upper rtable entries; no
1646 * point in running that code on the subquery ones too.)
1647 */
1648 CombineRangeTables(&parse->rtable, &parse->rteperminfos,
1649 subquery->rtable, subquery->rteperminfos);
1650
1651 /*
1652 * Pull up any FOR UPDATE/SHARE markers, too. (OffsetVarNodes already
1653 * adjusted the marker rtindexes, so just concat the lists.)
1654 */
1655 parse->rowMarks = list_concat(parse->rowMarks, subquery->rowMarks);
1656
1657 /*
1658 * We also have to fix the relid sets of any PlaceHolderVar nodes in the
1659 * parent query. (This could perhaps be done by pullup_replace_vars(),
1660 * but it seems cleaner to use two passes.) Note in particular that any
1661 * PlaceHolderVar nodes just created by pullup_replace_vars() will be
1662 * adjusted, so having created them with the subquery's varno is correct.
1663 *
1664 * Likewise, relids appearing in AppendRelInfo nodes have to be fixed. We
1665 * already checked that this won't require introducing multiple subrelids
1666 * into the single-slot AppendRelInfo structs.
1667 */
1668 if (root->glob->lastPHId != 0 || root->append_rel_list)
1669 {
1670 Relids subrelids;
1671
1672 subrelids = get_relids_in_jointree((Node *) subquery->jointree,
1673 true, false);
1674 if (root->glob->lastPHId != 0)
1675 substitute_phv_relids((Node *) parse, varno, subrelids);
1676 fix_append_rel_relids(root, varno, subrelids);
1677 }
1678
1679 /*
1680 * And now add subquery's AppendRelInfos to our list.
1681 */
1682 root->append_rel_list = list_concat(root->append_rel_list,
1683 subroot->append_rel_list);
1684
1685 /*
1686 * We don't have to do the equivalent bookkeeping for outer-join info,
1687 * because that hasn't been set up yet. placeholder_list likewise.
1688 */
1689 Assert(root->join_info_list == NIL);
1690 Assert(subroot->join_info_list == NIL);
1691 Assert(root->placeholder_list == NIL);
1692 Assert(subroot->placeholder_list == NIL);
1693
1694 /*
1695 * We no longer need the RTE's copy of the subquery's query tree. Getting
1696 * rid of it saves nothing in particular so far as this level of query is
1697 * concerned; but if this query level is in turn pulled up into a parent,
1698 * we'd waste cycles copying the now-unused query tree.
1699 */
1700 rte->subquery = NULL;
1701
1702 /*
1703 * Miscellaneous housekeeping.
1704 *
1705 * Although replace_rte_variables() faithfully updated parse->hasSubLinks
1706 * if it copied any SubLinks out of the subquery's targetlist, we still
1707 * could have SubLinks added to the query in the expressions of FUNCTION
1708 * and VALUES RTEs copied up from the subquery. So it's necessary to copy
1709 * subquery->hasSubLinks anyway. Perhaps this can be improved someday.
1710 */
1711 parse->hasSubLinks |= subquery->hasSubLinks;
1712
1713 /* If subquery had any RLS conditions, now main query does too */
1714 parse->hasRowSecurity |= subquery->hasRowSecurity;
1715
1716 /*
1717 * subquery won't be pulled up if it hasAggs, hasWindowFuncs, or
1718 * hasTargetSRFs, so no work needed on those flags
1719 */
1720
1721 /*
1722 * Return the adjusted subquery jointree to replace the RangeTblRef entry
1723 * in parent's jointree; or, if the FromExpr is degenerate, just return
1724 * its single member.
1725 */
1726 Assert(IsA(subquery->jointree, FromExpr));
1727 Assert(subquery->jointree->fromlist != NIL);
1728 if (subquery->jointree->quals == NULL &&
1729 list_length(subquery->jointree->fromlist) == 1)
1730 return (Node *) linitial(subquery->jointree->fromlist);
1731
1732 return (Node *) subquery->jointree;
1733}
1734
1735/*
1736 * pull_up_simple_union_all
1737 * Pull up a single simple UNION ALL subquery.
1738 *
1739 * jtnode is a RangeTblRef that has been identified as a simple UNION ALL
1740 * subquery by pull_up_subqueries. We pull up the leaf subqueries and
1741 * build an "append relation" for the union set. The result value is just
1742 * jtnode, since we don't actually need to change the query jointree.
1743 */
1744static Node *
1746{
1747 int varno = ((RangeTblRef *) jtnode)->rtindex;
1748 Query *subquery = rte->subquery;
1749 int rtoffset = list_length(root->parse->rtable);
1750 List *rtable;
1751
1752 /*
1753 * Make a modifiable copy of the subquery's rtable, so we can adjust
1754 * upper-level Vars in it. There are no such Vars in the setOperations
1755 * tree proper, so fixing the rtable should be sufficient.
1756 */
1757 rtable = copyObject(subquery->rtable);
1758
1759 /*
1760 * Upper-level vars in subquery are now one level closer to their parent
1761 * than before. We don't have to worry about offsetting varnos, though,
1762 * because the UNION leaf queries can't cross-reference each other.
1763 */
1764 IncrementVarSublevelsUp_rtable(rtable, -1, 1);
1765
1766 /*
1767 * If the UNION ALL subquery had a LATERAL marker, propagate that to all
1768 * its children. The individual children might or might not contain any
1769 * actual lateral cross-references, but we have to mark the pulled-up
1770 * child RTEs so that later planner stages will check for such.
1771 */
1772 if (rte->lateral)
1773 {
1774 ListCell *rt;
1775
1776 foreach(rt, rtable)
1777 {
1779
1780 Assert(child_rte->rtekind == RTE_SUBQUERY);
1781 child_rte->lateral = true;
1782 }
1783 }
1784
1785 /*
1786 * Append child RTEs (and their perminfos) to parent rtable.
1787 */
1788 CombineRangeTables(&root->parse->rtable, &root->parse->rteperminfos,
1789 rtable, subquery->rteperminfos);
1790
1791 /*
1792 * Recursively scan the subquery's setOperations tree and add
1793 * AppendRelInfo nodes for leaf subqueries to the parent's
1794 * append_rel_list. Also apply pull_up_subqueries to the leaf subqueries.
1795 */
1796 Assert(subquery->setOperations);
1797 pull_up_union_leaf_queries(subquery->setOperations, root, varno, subquery,
1798 rtoffset);
1799
1800 /*
1801 * Mark the parent as an append relation.
1802 */
1803 rte->inh = true;
1804
1805 return jtnode;
1806}
1807
1808/*
1809 * pull_up_union_leaf_queries -- recursive guts of pull_up_simple_union_all
1810 *
1811 * Build an AppendRelInfo for each leaf query in the setop tree, and then
1812 * apply pull_up_subqueries to the leaf query.
1813 *
1814 * Note that setOpQuery is the Query containing the setOp node, whose tlist
1815 * contains references to all the setop output columns. When called from
1816 * pull_up_simple_union_all, this is *not* the same as root->parse, which is
1817 * the parent Query we are pulling up into.
1818 *
1819 * parentRTindex is the appendrel parent's index in root->parse->rtable.
1820 *
1821 * The child RTEs have already been copied to the parent. childRToffset
1822 * tells us where in the parent's range table they were copied. When called
1823 * from flatten_simple_union_all, childRToffset is 0 since the child RTEs
1824 * were already in root->parse->rtable and no RT index adjustment is needed.
1825 */
1826static void
1829{
1830 if (IsA(setOp, RangeTblRef))
1831 {
1833 int childRTindex;
1835
1836 /*
1837 * Calculate the index in the parent's range table
1838 */
1839 childRTindex = childRToffset + rtr->rtindex;
1840
1841 /*
1842 * Build a suitable AppendRelInfo, and attach to parent's list.
1843 */
1845 appinfo->parent_relid = parentRTindex;
1846 appinfo->child_relid = childRTindex;
1847 appinfo->parent_reltype = InvalidOid;
1848 appinfo->child_reltype = InvalidOid;
1850 appinfo->parent_reloid = InvalidOid;
1851 root->append_rel_list = lappend(root->append_rel_list, appinfo);
1852
1853 /*
1854 * Recursively apply pull_up_subqueries to the new child RTE. (We
1855 * must build the AppendRelInfo first, because this will modify it;
1856 * indeed, that's the only part of the upper query where Vars
1857 * referencing childRTindex can exist at this point.)
1858 *
1859 * Note that we can pass NULL for containing-join info even if we're
1860 * actually under an outer join, because the child's expressions
1861 * aren't going to propagate up to the join. Also, we ignore the
1862 * possibility that pull_up_subqueries_recurse() returns a different
1863 * jointree node than what we pass it; if it does, the important thing
1864 * is that it replaced the child relid in the AppendRelInfo node.
1865 */
1867 rtr->rtindex = childRTindex;
1869 NULL, appinfo);
1870 }
1871 else if (IsA(setOp, SetOperationStmt))
1872 {
1874
1875 /* Recurse to reach leaf queries */
1880 }
1881 else
1882 {
1883 elog(ERROR, "unrecognized node type: %d",
1884 (int) nodeTag(setOp));
1885 }
1886}
1887
1888/*
1889 * make_setop_translation_list
1890 * Build the list of translations from parent Vars to child Vars for
1891 * a UNION ALL member. (At this point it's just a simple list of
1892 * referencing Vars, but if we succeed in pulling up the member
1893 * subquery, the Vars will get replaced by pulled-up expressions.)
1894 * Also create the rather trivial reverse-translation array.
1895 */
1896static void
1899{
1900 List *vars = NIL;
1902 ListCell *l;
1903
1904 /* Initialize reverse-translation array with all entries zero */
1905 /* (entries for resjunk columns will stay that way) */
1906 appinfo->num_child_cols = list_length(query->targetList);
1907 appinfo->parent_colnos = pcolnos =
1908 (AttrNumber *) palloc0(appinfo->num_child_cols * sizeof(AttrNumber));
1909
1910 foreach(l, query->targetList)
1911 {
1913
1914 if (tle->resjunk)
1915 continue;
1916
1918 pcolnos[tle->resno - 1] = tle->resno;
1919 }
1920
1921 appinfo->translated_vars = vars;
1922}
1923
1924/*
1925 * is_simple_subquery
1926 * Check a subquery in the range table to see if it's simple enough
1927 * to pull up into the parent query.
1928 *
1929 * rte is the RTE_SUBQUERY RangeTblEntry that contained the subquery.
1930 * (Note subquery is not necessarily equal to rte->subquery; it could be a
1931 * processed copy of that.)
1932 * lowest_outer_join is the lowest outer join above the subquery, or NULL.
1933 */
1934static bool
1937{
1938 /*
1939 * Let's just make sure it's a valid subselect ...
1940 */
1941 if (!IsA(subquery, Query) ||
1942 subquery->commandType != CMD_SELECT)
1943 elog(ERROR, "subquery is bogus");
1944
1945 /*
1946 * Can't currently pull up a query with setops (unless it's simple UNION
1947 * ALL, which is handled by a different code path). Maybe after querytree
1948 * redesign...
1949 */
1950 if (subquery->setOperations)
1951 return false;
1952
1953 /*
1954 * Can't pull up a subquery involving grouping, aggregation, SRFs,
1955 * sorting, limiting, or WITH. (XXX WITH could possibly be allowed later)
1956 *
1957 * We also don't pull up a subquery that has explicit FOR UPDATE/SHARE
1958 * clauses, because pullup would cause the locking to occur semantically
1959 * higher than it should. Implicit FOR UPDATE/SHARE is okay because in
1960 * that case the locking was originally declared in the upper query
1961 * anyway.
1962 */
1963 if (subquery->hasAggs ||
1964 subquery->hasWindowFuncs ||
1965 subquery->hasTargetSRFs ||
1966 subquery->groupClause ||
1967 subquery->groupingSets ||
1968 subquery->havingQual ||
1969 subquery->sortClause ||
1970 subquery->distinctClause ||
1971 subquery->limitOffset ||
1972 subquery->limitCount ||
1973 subquery->hasForUpdate ||
1974 subquery->cteList)
1975 return false;
1976
1977 /*
1978 * Don't pull up if the RTE represents a security-barrier view; we
1979 * couldn't prevent information leakage once the RTE's Vars are scattered
1980 * about in the upper query.
1981 */
1982 if (rte->security_barrier)
1983 return false;
1984
1985 /*
1986 * If the subquery is LATERAL, check for pullup restrictions from that.
1987 */
1988 if (rte->lateral)
1989 {
1990 bool restricted;
1992
1993 /*
1994 * The subquery's WHERE and JOIN/ON quals mustn't contain any lateral
1995 * references to rels outside a higher outer join (including the case
1996 * where the outer join is within the subquery itself). In such a
1997 * case, pulling up would result in a situation where we need to
1998 * postpone quals from below an outer join to above it, which is
1999 * probably completely wrong and in any case is a complication that
2000 * doesn't seem worth addressing at the moment.
2001 */
2002 if (lowest_outer_join != NULL)
2003 {
2004 restricted = true;
2006 true, true);
2007 }
2008 else
2009 {
2010 restricted = false;
2011 safe_upper_varnos = NULL; /* doesn't matter */
2012 }
2013
2015 (Node *) subquery->jointree,
2017 return false;
2018
2019 /*
2020 * If there's an outer join above the LATERAL subquery, also disallow
2021 * pullup if the subquery's targetlist has any references to rels
2022 * outside the outer join, since these might get pulled into quals
2023 * above the subquery (but in or below the outer join) and then lead
2024 * to qual-postponement issues similar to the case checked for above.
2025 * (We wouldn't need to prevent pullup if no such references appear in
2026 * outer-query quals, but we don't have enough info here to check
2027 * that. Also, maybe this restriction could be removed if we forced
2028 * such refs to be wrapped in PlaceHolderVars, even when they're below
2029 * the nearest outer join? But it's a pretty hokey usage, so not
2030 * clear this is worth sweating over.)
2031 *
2032 * If you change this, see also the comments about lateral references
2033 * in pullup_replace_vars_callback().
2034 */
2035 if (lowest_outer_join != NULL)
2036 {
2038 (Node *) subquery->targetList,
2039 1);
2040
2042 return false;
2043 }
2044 }
2045
2046 /*
2047 * Don't pull up a subquery that has any volatile functions in its
2048 * targetlist. Otherwise we might introduce multiple evaluations of these
2049 * functions, if they get copied to multiple places in the upper query,
2050 * leading to surprising results. (Note: the PlaceHolderVar mechanism
2051 * doesn't quite guarantee single evaluation; else we could pull up anyway
2052 * and just wrap such items in PlaceHolderVars ...)
2053 */
2054 if (contain_volatile_functions((Node *) subquery->targetList))
2055 return false;
2056
2057 return true;
2058}
2059
2060/*
2061 * pull_up_simple_values
2062 * Pull up a single simple VALUES RTE.
2063 *
2064 * jtnode is a RangeTblRef that has been identified as a simple VALUES RTE
2065 * by pull_up_subqueries. We always return a RangeTblRef representing a
2066 * RESULT RTE to replace it (all failure cases should have been detected by
2067 * is_simple_values()). Actually, what we return is just jtnode, because
2068 * we replace the VALUES RTE in the rangetable with the RESULT RTE.
2069 *
2070 * rte is the RangeTblEntry referenced by jtnode. Because of the limited
2071 * possible usage of VALUES RTEs, we do not need the remaining parameters
2072 * of pull_up_subqueries_recurse.
2073 */
2074static Node *
2076{
2077 Query *parse = root->parse;
2078 int varno = ((RangeTblRef *) jtnode)->rtindex;
2080 List *tlist;
2083 ListCell *lc;
2084
2085 Assert(rte->rtekind == RTE_VALUES);
2086 Assert(list_length(rte->values_lists) == 1);
2087
2088 /*
2089 * Need a modifiable copy of the VALUES list to hack on, just in case it's
2090 * multiply referenced.
2091 */
2092 values_list = copyObject(linitial(rte->values_lists));
2093
2094 /*
2095 * The VALUES RTE can't contain any Vars of level zero, let alone any that
2096 * are join aliases, so no need to flatten join alias Vars.
2097 */
2099
2100 /*
2101 * Set up required context data for pullup_replace_vars. In particular,
2102 * we have to make the VALUES list look like a subquery targetlist.
2103 */
2104 tlist = NIL;
2105 attrno = 1;
2106 foreach(lc, values_list)
2107 {
2108 tlist = lappend(tlist,
2110 attrno,
2111 NULL,
2112 false));
2113 attrno++;
2114 }
2115 rvcontext.root = root;
2116 rvcontext.targetlist = tlist;
2117 rvcontext.target_rte = rte;
2118 rvcontext.result_relation = 0;
2119 rvcontext.relids = NULL; /* can't be any lateral references here */
2120 rvcontext.nullinfo = NULL;
2121 rvcontext.outer_hasSubLinks = &parse->hasSubLinks;
2122 rvcontext.varno = varno;
2123 rvcontext.wrap_option = REPLACE_WRAP_NONE;
2124 /* initialize cache array with indexes 0 .. length(tlist) */
2125 rvcontext.rv_cache = palloc0((list_length(tlist) + 1) *
2126 sizeof(Node *));
2127
2128 /*
2129 * Replace all of the top query's references to the RTE's outputs with
2130 * copies of the adjusted VALUES expressions, being careful not to replace
2131 * any of the jointree structure. We can assume there's no outer joins or
2132 * appendrels in the dummy Query that surrounds a VALUES RTE.
2133 */
2135
2136 /*
2137 * There should be no appendrels to fix, nor any outer joins and hence no
2138 * PlaceHolderVars.
2139 */
2140 Assert(root->append_rel_list == NIL);
2141 Assert(root->join_info_list == NIL);
2142 Assert(root->placeholder_list == NIL);
2143
2144 /*
2145 * Replace the VALUES RTE with a RESULT RTE. The VALUES RTE is the only
2146 * rtable entry in the current query level, so this is easy.
2147 */
2148 Assert(list_length(parse->rtable) == 1);
2149
2150 /* Create suitable RTE */
2152 rte->rtekind = RTE_RESULT;
2153 rte->eref = makeAlias("*RESULT*", NIL);
2154
2155 /* Replace rangetable */
2156 parse->rtable = list_make1(rte);
2157
2158 /* We could manufacture a new RangeTblRef, but the one we have is fine */
2159 Assert(varno == 1);
2160
2161 return jtnode;
2162}
2163
2164/*
2165 * is_simple_values
2166 * Check a VALUES RTE in the range table to see if it's simple enough
2167 * to pull up into the parent query.
2168 *
2169 * rte is the RTE_VALUES RangeTblEntry to check.
2170 */
2171static bool
2173{
2174 Assert(rte->rtekind == RTE_VALUES);
2175
2176 /*
2177 * There must be exactly one VALUES list, else it's not semantically
2178 * correct to replace the VALUES RTE with a RESULT RTE, nor would we have
2179 * a unique set of expressions to substitute into the parent query.
2180 */
2181 if (list_length(rte->values_lists) != 1)
2182 return false;
2183
2184 /*
2185 * Because VALUES can't appear under an outer join (or at least, we won't
2186 * try to pull it up if it does), we need not worry about LATERAL, nor
2187 * about validity of PHVs for the VALUES' outputs.
2188 */
2189
2190 /*
2191 * Don't pull up a VALUES that contains any set-returning or volatile
2192 * functions. The considerations here are basically identical to the
2193 * restrictions on a pull-able subquery's targetlist.
2194 */
2195 if (expression_returns_set((Node *) rte->values_lists) ||
2196 contain_volatile_functions((Node *) rte->values_lists))
2197 return false;
2198
2199 /*
2200 * Do not pull up a VALUES that's not the only RTE in its parent query.
2201 * This is actually the only case that the parser will generate at the
2202 * moment, and assuming this is true greatly simplifies
2203 * pull_up_simple_values().
2204 */
2205 if (list_length(root->parse->rtable) != 1 ||
2206 rte != (RangeTblEntry *) linitial(root->parse->rtable))
2207 return false;
2208
2209 return true;
2210}
2211
2212/*
2213 * pull_up_constant_function
2214 * Pull up an RTE_FUNCTION expression that was simplified to a constant.
2215 *
2216 * jtnode is a RangeTblRef that has been identified as a FUNCTION RTE by
2217 * pull_up_subqueries. If its expression is just a Const, hoist that value
2218 * up into the parent query, and replace the RTE_FUNCTION with RTE_RESULT.
2219 *
2220 * In principle we could pull up any immutable expression, but we don't.
2221 * That might result in multiple evaluations of the expression, which could
2222 * be costly if it's not just a Const. Also, the main value of this is
2223 * to let the constant participate in further const-folding, and of course
2224 * that won't happen for a non-Const.
2225 *
2226 * The pulled-up value might need to be wrapped in a PlaceHolderVar if the
2227 * RTE is below an outer join or is part of an appendrel; the extra
2228 * parameters show whether that's needed.
2229 */
2230static Node *
2234{
2235 Query *parse = root->parse;
2239 TupleDesc tupdesc;
2241
2242 /* Fail if the RTE has ORDINALITY - we don't implement that here. */
2243 if (rte->funcordinality)
2244 return jtnode;
2245
2246 /* Fail if RTE isn't a single, simple Const expr */
2247 if (list_length(rte->functions) != 1)
2248 return jtnode;
2249 rtf = linitial_node(RangeTblFunction, rte->functions);
2250 if (!IsA(rtf->funcexpr, Const))
2251 return jtnode;
2252
2253 /*
2254 * If the function's result is not a scalar, we punt. In principle we
2255 * could break the composite constant value apart into per-column
2256 * constants, but for now it seems not worth the work.
2257 */
2258 if (rtf->funccolcount != 1)
2259 return jtnode; /* definitely composite */
2260
2261 /* If it has a coldeflist, it certainly returns RECORD */
2262 if (rtf->funccolnames != NIL)
2263 return jtnode; /* must be a one-column RECORD type */
2264
2266 &funcrettype,
2267 &tupdesc);
2269 return jtnode; /* must be a one-column composite type */
2270
2271 /* Create context for applying pullup_replace_vars */
2272 rvcontext.root = root;
2273 rvcontext.targetlist = list_make1(makeTargetEntry((Expr *) rtf->funcexpr,
2274 1, /* resno */
2275 NULL, /* resname */
2276 false)); /* resjunk */
2277 rvcontext.target_rte = rte;
2278 rvcontext.result_relation = 0;
2279
2280 /*
2281 * Since this function was reduced to a Const, it doesn't contain any
2282 * lateral references, even if it's marked as LATERAL. This means we
2283 * don't need to fill relids or nullinfo.
2284 */
2285 rvcontext.relids = NULL;
2286 rvcontext.nullinfo = NULL;
2287
2288 rvcontext.outer_hasSubLinks = &parse->hasSubLinks;
2289 rvcontext.varno = ((RangeTblRef *) jtnode)->rtindex;
2290 /* this flag will be set below, if needed */
2291 rvcontext.wrap_option = REPLACE_WRAP_NONE;
2292 /* initialize cache array with indexes 0 .. length(tlist) */
2293 rvcontext.rv_cache = palloc0((list_length(rvcontext.targetlist) + 1) *
2294 sizeof(Node *));
2295
2296 /*
2297 * If the parent query uses grouping sets, we need a PlaceHolderVar for
2298 * each expression of the subquery's targetlist items. (See comments in
2299 * pull_up_simple_subquery().)
2300 */
2301 if (parse->groupingSets)
2302 rvcontext.wrap_option = REPLACE_WRAP_ALL;
2303
2304 /*
2305 * Replace all of the top query's references to the RTE's output with
2306 * copies of the funcexpr, being careful not to replace any of the
2307 * jointree structure.
2308 */
2311
2312 /*
2313 * We don't need to bother with changing PlaceHolderVars in the parent
2314 * query. Their references to the RT index are still good for now, and
2315 * will get removed later if we're able to drop the RTE_RESULT.
2316 */
2317
2318 /*
2319 * Convert the RTE to be RTE_RESULT type, signifying that we don't need to
2320 * scan it anymore, and zero out RTE_FUNCTION-specific fields. Also make
2321 * sure the RTE is not marked LATERAL, since elsewhere we don't expect
2322 * RTE_RESULTs to be LATERAL.
2323 */
2324 rte->rtekind = RTE_RESULT;
2325 rte->functions = NIL;
2326 rte->lateral = false;
2327
2328 /*
2329 * We can reuse the RangeTblRef node.
2330 */
2331 return jtnode;
2332}
2333
2334/*
2335 * is_simple_union_all
2336 * Check a subquery to see if it's a simple UNION ALL.
2337 *
2338 * We require all the setops to be UNION ALL (no mixing) and there can't be
2339 * any datatype coercions involved, ie, all the leaf queries must emit the
2340 * same datatypes.
2341 */
2342static bool
2344{
2346
2347 /* Let's just make sure it's a valid subselect ... */
2348 if (!IsA(subquery, Query) ||
2349 subquery->commandType != CMD_SELECT)
2350 elog(ERROR, "subquery is bogus");
2351
2352 /* Is it a set-operation query at all? */
2354 if (!topop)
2355 return false;
2356
2357 /* Can't handle ORDER BY, LIMIT/OFFSET, locking, or WITH */
2358 if (subquery->sortClause ||
2359 subquery->limitOffset ||
2360 subquery->limitCount ||
2361 subquery->rowMarks ||
2362 subquery->cteList)
2363 return false;
2364
2365 /* Recursively check the tree of set operations */
2366 return is_simple_union_all_recurse((Node *) topop, subquery,
2367 topop->colTypes);
2368}
2369
2370static bool
2372{
2373 /* Since this function recurses, it could be driven to stack overflow. */
2375
2376 if (IsA(setOp, RangeTblRef))
2377 {
2379 RangeTblEntry *rte = rt_fetch(rtr->rtindex, setOpQuery->rtable);
2380 Query *subquery = rte->subquery;
2381
2382 Assert(subquery != NULL);
2383
2384 /* Leaf nodes are OK if they match the toplevel column types */
2385 /* We don't have to compare typmods or collations here */
2386 return tlist_same_datatypes(subquery->targetList, colTypes, true);
2387 }
2388 else if (IsA(setOp, SetOperationStmt))
2389 {
2391
2392 /* Must be UNION ALL */
2393 if (op->op != SETOP_UNION || !op->all)
2394 return false;
2395
2396 /* Recurse to check inputs */
2399 }
2400 else
2401 {
2402 elog(ERROR, "unrecognized node type: %d",
2403 (int) nodeTag(setOp));
2404 return false; /* keep compiler quiet */
2405 }
2406}
2407
2408/*
2409 * is_safe_append_member
2410 * Check a subquery that is a leaf of a UNION ALL appendrel to see if it's
2411 * safe to pull up.
2412 */
2413static bool
2415{
2416 FromExpr *jtnode;
2417
2418 /*
2419 * It's only safe to pull up the child if its jointree contains exactly
2420 * one RTE, else the AppendRelInfo data structure breaks. The one base RTE
2421 * could be buried in several levels of FromExpr, however. Also, if the
2422 * child's jointree is completely empty, we can pull up because
2423 * pull_up_simple_subquery will insert a single RTE_RESULT RTE instead.
2424 *
2425 * Also, the child can't have any WHERE quals because there's no place to
2426 * put them in an appendrel. (This is a bit annoying...) If we didn't
2427 * need to check this, we'd just test whether get_relids_in_jointree()
2428 * yields a singleton set, to be more consistent with the coding of
2429 * fix_append_rel_relids().
2430 */
2431 jtnode = subquery->jointree;
2432 Assert(IsA(jtnode, FromExpr));
2433 /* Check the completely-empty case */
2434 if (jtnode->fromlist == NIL && jtnode->quals == NULL)
2435 return true;
2436 /* Check the more general case */
2437 while (IsA(jtnode, FromExpr))
2438 {
2439 if (jtnode->quals != NULL)
2440 return false;
2441 if (list_length(jtnode->fromlist) != 1)
2442 return false;
2443 jtnode = linitial(jtnode->fromlist);
2444 }
2445 if (!IsA(jtnode, RangeTblRef))
2446 return false;
2447
2448 return true;
2449}
2450
2451/*
2452 * jointree_contains_lateral_outer_refs
2453 * Check for disallowed lateral references in a jointree's quals
2454 *
2455 * If restricted is false, all level-1 Vars are allowed (but we still must
2456 * search the jointree, since it might contain outer joins below which there
2457 * will be restrictions). If restricted is true, return true when any qual
2458 * in the jointree contains level-1 Vars coming from outside the rels listed
2459 * in safe_upper_varnos.
2460 */
2461static bool
2463 bool restricted,
2465{
2466 if (jtnode == NULL)
2467 return false;
2468 if (IsA(jtnode, RangeTblRef))
2469 return false;
2470 else if (IsA(jtnode, FromExpr))
2471 {
2472 FromExpr *f = (FromExpr *) jtnode;
2473 ListCell *l;
2474
2475 /* First, recurse to check child joins */
2476 foreach(l, f->fromlist)
2477 {
2479 lfirst(l),
2480 restricted,
2482 return true;
2483 }
2484
2485 /* Then check the top-level quals */
2486 if (restricted &&
2489 return true;
2490 }
2491 else if (IsA(jtnode, JoinExpr))
2492 {
2493 JoinExpr *j = (JoinExpr *) jtnode;
2494
2495 /*
2496 * If this is an outer join, we mustn't allow any upper lateral
2497 * references in or below it.
2498 */
2499 if (j->jointype != JOIN_INNER)
2500 {
2501 restricted = true;
2503 }
2504
2505 /* Check the child joins */
2507 j->larg,
2508 restricted,
2510 return true;
2512 j->rarg,
2513 restricted,
2515 return true;
2516
2517 /* Check the JOIN's qual clauses */
2518 if (restricted &&
2521 return true;
2522 }
2523 else
2524 elog(ERROR, "unrecognized node type: %d",
2525 (int) nodeTag(jtnode));
2526 return false;
2527}
2528
2529/*
2530 * Perform pullup_replace_vars everyplace it's needed in the query tree.
2531 *
2532 * Caller has already filled *rvcontext with data describing what to
2533 * substitute for Vars referencing the target subquery. In addition
2534 * we need the identity of the containing appendrel if any.
2535 */
2536static void
2540{
2541 Query *parse = root->parse;
2542 ListCell *lc;
2543
2544 /*
2545 * If we are considering an appendrel child subquery (that is, a UNION ALL
2546 * member query that we're pulling up), then the only part of the upper
2547 * query that could reference the child yet is the translated_vars list of
2548 * the associated AppendRelInfo. Furthermore, we do not want to force use
2549 * of PHVs in the AppendRelInfo --- there isn't any outer join between.
2550 */
2552 {
2554
2555 rvcontext->wrap_option = REPLACE_WRAP_NONE;
2556 containing_appendrel->translated_vars = (List *)
2557 pullup_replace_vars((Node *) containing_appendrel->translated_vars,
2558 rvcontext);
2559 rvcontext->wrap_option = save_wrap_option;
2560 return;
2561 }
2562
2563 /*
2564 * Replace all of the top query's references to the subquery's outputs
2565 * with copies of the adjusted subtlist items, being careful not to
2566 * replace any of the jointree structure. (This'd be a lot cleaner if we
2567 * could use query_tree_mutator.) We have to use PHVs in the targetList,
2568 * returningList, and havingQual, since those are certainly above any
2569 * outer join. replace_vars_in_jointree tracks its location in the
2570 * jointree and uses PHVs or not appropriately.
2571 */
2572 parse->targetList = (List *)
2573 pullup_replace_vars((Node *) parse->targetList, rvcontext);
2574 parse->returningList = (List *)
2575 pullup_replace_vars((Node *) parse->returningList, rvcontext);
2576
2577 if (parse->onConflict)
2578 {
2579 parse->onConflict->onConflictSet = (List *)
2580 pullup_replace_vars((Node *) parse->onConflict->onConflictSet,
2581 rvcontext);
2582 parse->onConflict->onConflictWhere =
2583 pullup_replace_vars(parse->onConflict->onConflictWhere,
2584 rvcontext);
2585
2586 /*
2587 * We assume ON CONFLICT's arbiterElems, arbiterWhere, exclRelTlist
2588 * can't contain any references to a subquery.
2589 */
2590 }
2591 if (parse->mergeActionList)
2592 {
2593 foreach(lc, parse->mergeActionList)
2594 {
2595 MergeAction *action = lfirst(lc);
2596
2597 action->qual = pullup_replace_vars(action->qual, rvcontext);
2598 action->targetList = (List *)
2599 pullup_replace_vars((Node *) action->targetList, rvcontext);
2600 }
2601 }
2602 parse->mergeJoinCondition = pullup_replace_vars(parse->mergeJoinCondition,
2603 rvcontext);
2605 Assert(parse->setOperations == NULL);
2606 parse->havingQual = pullup_replace_vars(parse->havingQual, rvcontext);
2607
2608 /*
2609 * Replace references in the translated_vars lists of appendrels.
2610 */
2611 foreach(lc, root->append_rel_list)
2612 {
2614
2616 pullup_replace_vars((Node *) appinfo->translated_vars, rvcontext);
2617 }
2618
2619 /*
2620 * Replace references in the joinaliasvars lists of join RTEs and the
2621 * groupexprs list of group RTE.
2622 */
2623 foreach(lc, parse->rtable)
2624 {
2626
2627 if (otherrte->rtekind == RTE_JOIN)
2628 otherrte->joinaliasvars = (List *)
2629 pullup_replace_vars((Node *) otherrte->joinaliasvars,
2630 rvcontext);
2631 else if (otherrte->rtekind == RTE_GROUP)
2632 otherrte->groupexprs = (List *)
2633 pullup_replace_vars((Node *) otherrte->groupexprs,
2634 rvcontext);
2635 }
2636}
2637
2638/*
2639 * Helper routine for perform_pullup_replace_vars: do pullup_replace_vars on
2640 * every expression in the jointree, without changing the jointree structure
2641 * itself. Ugly, but there's no other way...
2642 */
2643static void
2646{
2647 if (jtnode == NULL)
2648 return;
2649 if (IsA(jtnode, RangeTblRef))
2650 {
2651 /*
2652 * If the RangeTblRef refers to a LATERAL subquery (that isn't the
2653 * same subquery we're pulling up), it might contain references to the
2654 * target subquery, which we must replace. We drive this from the
2655 * jointree scan, rather than a scan of the rtable, so that we can
2656 * avoid processing no-longer-referenced RTEs.
2657 */
2658 int varno = ((RangeTblRef *) jtnode)->rtindex;
2659
2660 if (varno != context->varno) /* ignore target subquery itself */
2661 {
2662 RangeTblEntry *rte = rt_fetch(varno, context->root->parse->rtable);
2663
2664 Assert(rte != context->target_rte);
2665 if (rte->lateral)
2666 {
2667 switch (rte->rtekind)
2668 {
2669 case RTE_RELATION:
2670 /* shouldn't be marked LATERAL unless tablesample */
2671 Assert(rte->tablesample);
2672 rte->tablesample = (TableSampleClause *)
2673 pullup_replace_vars((Node *) rte->tablesample,
2674 context);
2675 break;
2676 case RTE_SUBQUERY:
2677 rte->subquery =
2679 context);
2680 break;
2681 case RTE_FUNCTION:
2682 rte->functions = (List *)
2683 pullup_replace_vars((Node *) rte->functions,
2684 context);
2685 break;
2686 case RTE_TABLEFUNC:
2687 rte->tablefunc = (TableFunc *)
2688 pullup_replace_vars((Node *) rte->tablefunc,
2689 context);
2690 break;
2691 case RTE_VALUES:
2692 rte->values_lists = (List *)
2693 pullup_replace_vars((Node *) rte->values_lists,
2694 context);
2695 break;
2696 case RTE_JOIN:
2697 case RTE_CTE:
2699 case RTE_RESULT:
2700 case RTE_GROUP:
2701 /* these shouldn't be marked LATERAL */
2702 Assert(false);
2703 break;
2704 case RTE_GRAPH_TABLE:
2705 /* shouldn't happen here */
2706 Assert(false);
2707 break;
2708 }
2709 }
2710 }
2711 }
2712 else if (IsA(jtnode, FromExpr))
2713 {
2714 FromExpr *f = (FromExpr *) jtnode;
2715 ListCell *l;
2716
2717 foreach(l, f->fromlist)
2718 replace_vars_in_jointree(lfirst(l), context);
2719 f->quals = pullup_replace_vars(f->quals, context);
2720 }
2721 else if (IsA(jtnode, JoinExpr))
2722 {
2723 JoinExpr *j = (JoinExpr *) jtnode;
2725
2726 replace_vars_in_jointree(j->larg, context);
2727 replace_vars_in_jointree(j->rarg, context);
2728
2729 /*
2730 * Use PHVs within the join quals of a full join for variable-free
2731 * expressions. Otherwise, we cannot identify which side of the join
2732 * a pulled-up variable-free expression came from, which can lead to
2733 * failure to make a plan at all because none of the quals appear to
2734 * be mergeable or hashable conditions.
2735 */
2736 if (j->jointype == JOIN_FULL)
2738
2739 j->quals = pullup_replace_vars(j->quals, context);
2740
2741 context->wrap_option = save_wrap_option;
2742 }
2743 else
2744 elog(ERROR, "unrecognized node type: %d",
2745 (int) nodeTag(jtnode));
2746}
2747
2748/*
2749 * Apply pullup variable replacement throughout an expression tree
2750 *
2751 * Returns a modified copy of the tree, so this can't be used where we
2752 * need to do in-place replacement.
2753 */
2754static Node *
2756{
2757 return replace_rte_variables(expr,
2758 context->varno, 0,
2760 context,
2761 context->outer_hasSubLinks);
2762}
2763
2764static Node *
2767{
2769 int varattno = var->varattno;
2770 bool need_phv;
2771 Node *newnode;
2772
2773 /* System columns are not replaced. */
2774 if (varattno < InvalidAttrNumber)
2775 return (Node *) copyObject(var);
2776
2777 /*
2778 * We need a PlaceHolderVar if the Var-to-be-replaced has nonempty
2779 * varnullingrels (unless we find below that the replacement expression is
2780 * a Var or PlaceHolderVar that we can just add the nullingrels to). We
2781 * also need one if the caller has instructed us that certain expression
2782 * replacements need to be wrapped for identification purposes.
2783 */
2784 need_phv = (var->varnullingrels != NULL) ||
2785 (rcon->wrap_option != REPLACE_WRAP_NONE);
2786
2787 /*
2788 * If PlaceHolderVars are needed, we cache the modified expressions in
2789 * rcon->rv_cache[]. This is not in hopes of any material speed gain
2790 * within this function, but to avoid generating identical PHVs with
2791 * different IDs. That would result in duplicate evaluations at runtime,
2792 * and possibly prevent optimizations that rely on recognizing different
2793 * references to the same subquery output as being equal(). So it's worth
2794 * a bit of extra effort to avoid it.
2795 *
2796 * The cached items have phlevelsup = 0 and phnullingrels = NULL; we'll
2797 * copy them and adjust those values for this reference site below.
2798 */
2799 if (need_phv &&
2800 varattno >= InvalidAttrNumber &&
2801 varattno <= list_length(rcon->targetlist) &&
2802 rcon->rv_cache[varattno] != NULL)
2803 {
2804 /* Just copy the entry and fall through to adjust phlevelsup etc */
2805 newnode = copyObject(rcon->rv_cache[varattno]);
2806 }
2807 else
2808 {
2809 /*
2810 * Generate the replacement expression. This takes care of expanding
2811 * wholerow references and dealing with non-default varreturningtype.
2812 */
2814 rcon->target_rte,
2815 rcon->targetlist,
2816 rcon->result_relation,
2818 0);
2819
2820 /* Insert PlaceHolderVar if needed */
2821 if (need_phv)
2822 {
2823 bool wrap;
2824
2825 if (rcon->wrap_option == REPLACE_WRAP_ALL)
2826 {
2827 /* Caller told us to wrap all expressions in a PlaceHolderVar */
2828 wrap = true;
2829 }
2830 else if (varattno == InvalidAttrNumber)
2831 {
2832 /*
2833 * Insert PlaceHolderVar for whole-tuple reference. Notice
2834 * that we are wrapping one PlaceHolderVar around the whole
2835 * RowExpr, rather than putting one around each element of the
2836 * row. This is because we need the expression to yield NULL,
2837 * not ROW(NULL,NULL,...) when it is forced to null by an
2838 * outer join.
2839 */
2840 wrap = true;
2841 }
2842 else if (newnode && IsA(newnode, Var) &&
2843 ((Var *) newnode)->varlevelsup == 0)
2844 {
2845 /*
2846 * Simple Vars always escape being wrapped, unless they are
2847 * lateral references to something outside the subquery being
2848 * pulled up and the referenced rel is not under the same
2849 * lowest nulling outer join.
2850 */
2851 wrap = false;
2852 if (rcon->target_rte->lateral &&
2853 !bms_is_member(((Var *) newnode)->varno, rcon->relids))
2854 {
2855 nullingrel_info *nullinfo = rcon->nullinfo;
2856 int lvarno = ((Var *) newnode)->varno;
2857
2858 Assert(lvarno > 0 && lvarno <= nullinfo->rtlength);
2859 if (!bms_is_subset(nullinfo->nullingrels[rcon->varno],
2860 nullinfo->nullingrels[lvarno]))
2861 wrap = true;
2862 }
2863 }
2864 else if (newnode && IsA(newnode, PlaceHolderVar) &&
2865 ((PlaceHolderVar *) newnode)->phlevelsup == 0)
2866 {
2867 /* The same rules apply for a PlaceHolderVar */
2868 wrap = false;
2869 if (rcon->target_rte->lateral &&
2871 rcon->relids))
2872 {
2873 nullingrel_info *nullinfo = rcon->nullinfo;
2874 Relids lvarnos = ((PlaceHolderVar *) newnode)->phrels;
2875 int lvarno;
2876
2877 lvarno = -1;
2878 while ((lvarno = bms_next_member(lvarnos, lvarno)) >= 0)
2879 {
2880 Assert(lvarno > 0 && lvarno <= nullinfo->rtlength);
2881 if (!bms_is_subset(nullinfo->nullingrels[rcon->varno],
2882 nullinfo->nullingrels[lvarno]))
2883 {
2884 wrap = true;
2885 break;
2886 }
2887 }
2888 }
2889 }
2890 else
2891 {
2892 /*
2893 * If the node contains Var(s) or PlaceHolderVar(s) of the
2894 * subquery being pulled up, or of rels that are under the
2895 * same lowest nulling outer join as the subquery, and does
2896 * not contain any non-strict constructs, then instead of
2897 * adding a PHV on top we can add the required nullingrels to
2898 * those Vars/PHVs. (This is fundamentally a generalization
2899 * of the above cases for bare Vars and PHVs.)
2900 *
2901 * This test is somewhat expensive, but it avoids pessimizing
2902 * the plan in cases where the nullingrels get removed again
2903 * later by outer join reduction.
2904 *
2905 * Note that we don't force wrapping of expressions containing
2906 * lateral references, so long as they also contain Vars/PHVs
2907 * of the subquery, or of rels that are under the same lowest
2908 * nulling outer join as the subquery. This is okay because
2909 * of the restriction to strict constructs: if those Vars/PHVs
2910 * have been forced to NULL by an outer join then the end
2911 * result of the expression will be NULL too, regardless of
2912 * the lateral references. So it's not necessary to force the
2913 * expression to be evaluated below the outer join. This can
2914 * be a very valuable optimization, because it may allow us to
2915 * avoid using a nested loop to pass the lateral reference
2916 * down.
2917 *
2918 * This analysis could be tighter: in particular, a non-strict
2919 * construct hidden within a lower-level PlaceHolderVar is not
2920 * reason to add another PHV. But for now it doesn't seem
2921 * worth the code to be more exact. This is also why it's
2922 * preferable to handle bare PHVs in the above branch, rather
2923 * than this branch. We also prefer to handle bare Vars in a
2924 * separate branch, as it's cheaper this way and parallels the
2925 * handling of PHVs.
2926 *
2927 * For a LATERAL subquery, we have to check the actual var
2928 * membership of the node, but if it's non-lateral then any
2929 * level-zero var must belong to the subquery.
2930 */
2931 bool contain_nullable_vars = false;
2932
2933 if (!rcon->target_rte->lateral)
2934 {
2936 contain_nullable_vars = true;
2937 }
2938 else
2939 {
2941
2943 if (bms_overlap(all_varnos, rcon->relids))
2944 contain_nullable_vars = true;
2945 else
2946 {
2947 nullingrel_info *nullinfo = rcon->nullinfo;
2948 int varno;
2949
2950 varno = -1;
2951 while ((varno = bms_next_member(all_varnos, varno)) >= 0)
2952 {
2953 Assert(varno > 0 && varno <= nullinfo->rtlength);
2954 if (bms_is_subset(nullinfo->nullingrels[rcon->varno],
2955 nullinfo->nullingrels[varno]))
2956 {
2957 contain_nullable_vars = true;
2958 break;
2959 }
2960 }
2961 }
2962 }
2963
2966 {
2967 /* No wrap needed */
2968 wrap = false;
2969 }
2970 else
2971 {
2972 /* Else wrap it in a PlaceHolderVar */
2973 wrap = true;
2974 }
2975 }
2976
2977 if (wrap)
2978 {
2979 newnode = (Node *)
2981 (Expr *) newnode,
2982 bms_make_singleton(rcon->varno));
2983
2984 /*
2985 * Cache it if possible (ie, if the attno is in range, which
2986 * it probably always should be).
2987 */
2988 if (varattno >= InvalidAttrNumber &&
2989 varattno <= list_length(rcon->targetlist))
2990 rcon->rv_cache[varattno] = copyObject(newnode);
2991 }
2992 }
2993 }
2994
2995 /* Propagate any varnullingrels into the replacement expression */
2996 if (var->varnullingrels != NULL)
2997 {
2998 if (IsA(newnode, Var))
2999 {
3000 Var *newvar = (Var *) newnode;
3001
3002 Assert(newvar->varlevelsup == 0);
3003 newvar->varnullingrels = bms_add_members(newvar->varnullingrels,
3004 var->varnullingrels);
3005 }
3006 else if (IsA(newnode, PlaceHolderVar))
3007 {
3009
3010 Assert(newphv->phlevelsup == 0);
3011 newphv->phnullingrels = bms_add_members(newphv->phnullingrels,
3012 var->varnullingrels);
3013 }
3014 else
3015 {
3016 /*
3017 * There should be Vars/PHVs within the expression that we can
3018 * modify. Vars/PHVs of the subquery should have the full
3019 * var->varnullingrels added to them, but if there are lateral
3020 * references within the expression, those must be marked with
3021 * only the nullingrels that potentially apply to them. (This
3022 * corresponds to the fact that the expression will now be
3023 * evaluated at the join level of the Var that we are replacing:
3024 * the lateral references may have bubbled up through fewer outer
3025 * joins than the subquery's Vars have. Per the discussion above,
3026 * we'll still get the right answers.) That relid set could be
3027 * different for different lateral relations, so we have to do
3028 * this work for each one.
3029 *
3030 * (Currently, the restrictions in is_simple_subquery() mean that
3031 * at most we have to remove the lowest outer join's relid from
3032 * the nullingrels of a lateral reference. However, we might
3033 * relax those restrictions someday, so let's do this right.)
3034 */
3035 if (rcon->target_rte->lateral)
3036 {
3037 nullingrel_info *nullinfo = rcon->nullinfo;
3039 int lvarno;
3040
3041 /*
3042 * Identify lateral varnos used within newnode. We must do
3043 * this before injecting var->varnullingrels into the tree.
3044 */
3045 lvarnos = pull_varnos(rcon->root, newnode);
3046 lvarnos = bms_del_members(lvarnos, rcon->relids);
3047 /* For each one, add relevant nullingrels if any */
3048 lvarno = -1;
3049 while ((lvarno = bms_next_member(lvarnos, lvarno)) >= 0)
3050 {
3052
3053 Assert(lvarno > 0 && lvarno <= nullinfo->rtlength);
3054 lnullingrels = bms_intersect(var->varnullingrels,
3055 nullinfo->nullingrels[lvarno]);
3059 lnullingrels);
3060 }
3061 }
3062
3063 /* Finally, deal with Vars/PHVs of the subquery itself */
3065 rcon->relids,
3066 var->varnullingrels);
3067 /* Assert we did put the varnullingrels into the expression */
3068 Assert(bms_is_subset(var->varnullingrels,
3069 pull_varnos(rcon->root, newnode)));
3070 }
3071 }
3072
3073 /* Must adjust varlevelsup if replaced Var is within a subquery */
3074 if (var->varlevelsup > 0)
3076
3077 return newnode;
3078}
3079
3080/*
3081 * Apply pullup variable replacement to a subquery
3082 *
3083 * This needs to be different from pullup_replace_vars() because
3084 * replace_rte_variables will think that it shouldn't increment sublevels_up
3085 * before entering the Query; so we need to call it with sublevels_up == 1.
3086 */
3087static Query *
3090{
3091 Assert(IsA(query, Query));
3092 return (Query *) replace_rte_variables((Node *) query,
3093 context->varno, 1,
3095 context,
3096 NULL);
3097}
3098
3099
3100/*
3101 * flatten_simple_union_all
3102 * Try to optimize top-level UNION ALL structure into an appendrel
3103 *
3104 * If a query's setOperations tree consists entirely of simple UNION ALL
3105 * operations, flatten it into an append relation, which we can process more
3106 * intelligently than the general setops case. Otherwise, do nothing.
3107 *
3108 * In most cases, this can succeed only for a top-level query, because for a
3109 * subquery in FROM, the parent query's invocation of pull_up_subqueries would
3110 * already have flattened the UNION via pull_up_simple_union_all. But there
3111 * are a few cases we can support here but not in that code path, for example
3112 * when the subquery also contains ORDER BY.
3113 */
3114void
3116{
3117 Query *parse = root->parse;
3120 int leftmostRTI;
3122 int childRTI;
3125
3126 /* Shouldn't be called unless query has setops */
3127 topop = castNode(SetOperationStmt, parse->setOperations);
3128 Assert(topop);
3129
3130 /* Can't optimize away a recursive UNION */
3131 if (root->hasRecursion)
3132 return;
3133
3134 /*
3135 * Recursively check the tree of set operations. If not all UNION ALL
3136 * with identical column types, punt.
3137 */
3138 if (!is_simple_union_all_recurse((Node *) topop, parse, topop->colTypes))
3139 return;
3140
3141 /*
3142 * Locate the leftmost leaf query in the setops tree. The upper query's
3143 * Vars all refer to this RTE (see transformSetOperationStmt).
3144 */
3145 leftmostjtnode = topop->larg;
3149 leftmostRTI = ((RangeTblRef *) leftmostjtnode)->rtindex;
3151 Assert(leftmostRTE->rtekind == RTE_SUBQUERY);
3152
3153 /*
3154 * Make a copy of the leftmost RTE and add it to the rtable. This copy
3155 * will represent the leftmost leaf query in its capacity as a member of
3156 * the appendrel. The original will represent the appendrel as a whole.
3157 * (We must do things this way because the upper query's Vars have to be
3158 * seen as referring to the whole appendrel.)
3159 */
3161 parse->rtable = lappend(parse->rtable, childRTE);
3162 childRTI = list_length(parse->rtable);
3163
3164 /* Modify the setops tree to reference the child copy */
3165 ((RangeTblRef *) leftmostjtnode)->rtindex = childRTI;
3166
3167 /* Modify the formerly-leftmost RTE to mark it as an appendrel parent */
3168 leftmostRTE->inh = true;
3169
3170 /*
3171 * Form a RangeTblRef for the appendrel, and insert it into FROM. The top
3172 * Query of a setops tree should have had an empty FromClause initially.
3173 */
3175 rtr->rtindex = leftmostRTI;
3176 Assert(parse->jointree->fromlist == NIL);
3177 parse->jointree->fromlist = list_make1(rtr);
3178
3179 /*
3180 * Now pretend the query has no setops. We must do this before trying to
3181 * do subquery pullup, because of Assert in pull_up_simple_subquery.
3182 */
3183 parse->setOperations = NULL;
3184
3185 /*
3186 * Build AppendRelInfo information, and apply pull_up_subqueries to the
3187 * leaf queries of the UNION ALL. (We must do that now because they
3188 * weren't previously referenced by the jointree, and so were missed by
3189 * the main invocation of pull_up_subqueries.)
3190 */
3192}
3193
3194
3195/*
3196 * reduce_outer_joins
3197 * Attempt to reduce outer joins to plain inner joins.
3198 *
3199 * The idea here is that given a query like
3200 * SELECT ... FROM a LEFT JOIN b ON (...) WHERE b.y = 42;
3201 * we can reduce the LEFT JOIN to a plain JOIN if the "=" operator in WHERE
3202 * is strict. The strict operator will always return NULL, causing the outer
3203 * WHERE to fail, on any row where the LEFT JOIN filled in NULLs for b's
3204 * columns. Therefore, there's no need for the join to produce null-extended
3205 * rows in the first place --- which makes it a plain join not an outer join.
3206 * (This scenario may not be very likely in a query written out by hand, but
3207 * it's reasonably likely when pushing quals down into complex views.)
3208 *
3209 * More generally, an outer join can be reduced in strength if there is a
3210 * strict qual above it in the qual tree that constrains a Var from the
3211 * nullable side of the join to be non-null. (For FULL joins this applies
3212 * to each side separately.)
3213 *
3214 * Another transformation we apply here is to recognize cases like
3215 * SELECT ... FROM a LEFT JOIN b ON (a.x = b.y) WHERE b.z IS NULL;
3216 * If we can prove that b.z must be non-null for any matching row, either
3217 * because the join clause is strict for b.z and b.z happens to be the join
3218 * key b.y, or because b.z is defined NOT NULL by table constraints and is
3219 * not nullable due to lower-level outer joins, then only null-extended rows
3220 * could pass the upper WHERE, and we can conclude that what the query is
3221 * really specifying is an anti-semijoin. We change the join type from
3222 * JOIN_LEFT to JOIN_ANTI. The IS NULL clause then becomes redundant, and
3223 * must be removed to prevent bogus selectivity calculations, but we leave
3224 * it to distribute_qual_to_rels to get rid of such clauses.
3225 *
3226 * Also, we get rid of JOIN_RIGHT cases by flipping them around to become
3227 * JOIN_LEFT. This saves some code here and in some later planner routines;
3228 * the main benefit is to reduce the number of jointypes that can appear in
3229 * SpecialJoinInfo nodes. Note that we can still generate Paths and Plans
3230 * that use JOIN_RIGHT (or JOIN_RIGHT_ANTI) by switching the inputs again.
3231 *
3232 * To ease recognition of strict qual clauses, we require this routine to be
3233 * run after expression preprocessing (i.e., qual canonicalization and JOIN
3234 * alias-var expansion).
3235 */
3236void
3238{
3241 ListCell *lc;
3242
3243 /*
3244 * To avoid doing strictness checks on more quals than necessary, we want
3245 * to stop descending the jointree as soon as there are no outer joins
3246 * below our current point. This consideration forces a two-pass process.
3247 * The first pass gathers information about which base rels appear below
3248 * each side of each join clause, about whether there are outer join(s)
3249 * below each side of each join clause, and about which base rels are from
3250 * the nullable side of those outer join(s). The second pass examines
3251 * qual clauses and changes join types as it descends the tree.
3252 */
3253 state1 = reduce_outer_joins_pass1((Node *) root->parse->jointree);
3254
3255 /* planner.c shouldn't have called me if no outer joins */
3256 if (state1 == NULL || !state1->contains_outer)
3257 elog(ERROR, "so where are the outer joins?");
3258
3259 state2.inner_reduced = NULL;
3260 state2.partial_reduced = NIL;
3261
3262 reduce_outer_joins_pass2((Node *) root->parse->jointree,
3263 state1, &state2,
3264 root, NULL, NIL);
3265
3266 /*
3267 * If we successfully reduced the strength of any outer joins, we must
3268 * remove references to those joins as nulling rels. This is handled as
3269 * an additional pass, for simplicity and because we can handle all
3270 * fully-reduced joins in a single pass over the parse tree.
3271 */
3272 if (!bms_is_empty(state2.inner_reduced))
3273 {
3274 root->parse = (Query *)
3275 remove_nulling_relids((Node *) root->parse,
3276 state2.inner_reduced,
3277 NULL);
3278 /* There could be references in the append_rel_list, too */
3279 root->append_rel_list = (List *)
3280 remove_nulling_relids((Node *) root->append_rel_list,
3281 state2.inner_reduced,
3282 NULL);
3283 }
3284
3285 /*
3286 * Partially-reduced full joins have to be done one at a time, since
3287 * they'll each need a different setting of except_relids.
3288 */
3289 foreach(lc, state2.partial_reduced)
3290 {
3293
3294 root->parse = (Query *)
3295 remove_nulling_relids((Node *) root->parse,
3297 statep->unreduced_side);
3298 root->append_rel_list = (List *)
3299 remove_nulling_relids((Node *) root->append_rel_list,
3301 statep->unreduced_side);
3302 }
3303}
3304
3305/*
3306 * reduce_outer_joins_pass1 - phase 1 data collection
3307 *
3308 * Returns a state node describing the given jointree node.
3309 */
3312{
3314
3316 result->relids = NULL;
3317 result->contains_outer = false;
3318 result->nullable_rels = NULL;
3319 result->sub_states = NIL;
3320
3321 if (jtnode == NULL)
3322 return result;
3323 if (IsA(jtnode, RangeTblRef))
3324 {
3325 int varno = ((RangeTblRef *) jtnode)->rtindex;
3326
3327 result->relids = bms_make_singleton(varno);
3328 }
3329 else if (IsA(jtnode, FromExpr))
3330 {
3331 FromExpr *f = (FromExpr *) jtnode;
3332 ListCell *l;
3333
3334 foreach(l, f->fromlist)
3335 {
3337
3339 result->relids = bms_add_members(result->relids,
3340 sub_state->relids);
3341 result->contains_outer |= sub_state->contains_outer;
3342 result->nullable_rels = bms_add_members(result->nullable_rels,
3343 sub_state->nullable_rels);
3344 result->sub_states = lappend(result->sub_states, sub_state);
3345 }
3346 }
3347 else if (IsA(jtnode, JoinExpr))
3348 {
3349 JoinExpr *j = (JoinExpr *) jtnode;
3352
3353 /* Recurse to children */
3356
3357 /* join's own RT index is not wanted in result->relids */
3358 result->relids = bms_union(left_state->relids, right_state->relids);
3359
3360 /* Store children's states for pass 2 */
3361 result->sub_states = list_make2(left_state, right_state);
3362
3363 /* Collect outer join information */
3364 switch (j->jointype)
3365 {
3366 case JOIN_INNER:
3367 case JOIN_SEMI:
3368 /* No new nullability; propagate state from children */
3369 result->contains_outer = left_state->contains_outer ||
3370 right_state->contains_outer;
3371 result->nullable_rels = bms_union(left_state->nullable_rels,
3372 right_state->nullable_rels);
3373 break;
3374 case JOIN_LEFT:
3375 case JOIN_ANTI:
3376 /* RHS is nullable; LHS keeps existing status */
3377 result->contains_outer = true;
3378 result->nullable_rels = bms_union(left_state->nullable_rels,
3379 right_state->relids);
3380 break;
3381 case JOIN_RIGHT:
3382 /* LHS is nullable; RHS keeps existing status */
3383 result->contains_outer = true;
3384 result->nullable_rels = bms_union(left_state->relids,
3385 right_state->nullable_rels);
3386 break;
3387 case JOIN_FULL:
3388 /* Both sides are nullable */
3389 result->contains_outer = true;
3390 result->nullable_rels = bms_union(left_state->relids,
3391 right_state->relids);
3392 break;
3393 default:
3394 elog(ERROR, "unrecognized join type: %d",
3395 (int) j->jointype);
3396 break;
3397 }
3398 }
3399 else
3400 elog(ERROR, "unrecognized node type: %d",
3401 (int) nodeTag(jtnode));
3402 return result;
3403}
3404
3405/*
3406 * reduce_outer_joins_pass2 - phase 2 processing
3407 *
3408 * jtnode: current jointree node
3409 * state1: state data collected by phase 1 for this node
3410 * state2: where to accumulate info about successfully-reduced joins
3411 * root: toplevel planner state
3412 * nonnullable_rels: set of base relids forced non-null by upper quals
3413 * forced_null_vars: multibitmapset of Vars forced null by upper quals
3414 *
3415 * Returns info in state2 about outer joins that were successfully simplified.
3416 * Joins that were fully reduced to inner joins are all added to
3417 * state2->inner_reduced. If a full join is reduced to a left join,
3418 * it needs its own entry in state2->partial_reduced, since that will
3419 * require custom processing to remove only the correct nullingrel markers.
3420 */
3421static void
3426 Relids nonnullable_rels,
3428{
3429 /*
3430 * pass 2 should never descend as far as an empty subnode or base rel,
3431 * because it's only called on subtrees marked as contains_outer.
3432 */
3433 if (jtnode == NULL)
3434 elog(ERROR, "reached empty jointree");
3435 if (IsA(jtnode, RangeTblRef))
3436 elog(ERROR, "reached base rel");
3437 else if (IsA(jtnode, FromExpr))
3438 {
3439 FromExpr *f = (FromExpr *) jtnode;
3440 ListCell *l;
3441 ListCell *s;
3444
3445 /* Scan quals to see if we can add any constraints */
3448 nonnullable_rels);
3452 /* And recurse --- but only into interesting subtrees */
3453 Assert(list_length(f->fromlist) == list_length(state1->sub_states));
3454 forboth(l, f->fromlist, s, state1->sub_states)
3455 {
3457
3458 if (sub_state->contains_outer)
3460 state2, root,
3463 }
3465 /* can't so easily clean up var lists, unfortunately */
3466 }
3467 else if (IsA(jtnode, JoinExpr))
3468 {
3469 JoinExpr *j = (JoinExpr *) jtnode;
3470 int rtindex = j->rtindex;
3471 JoinType jointype = j->jointype;
3474
3475 /* Can we simplify this join? */
3476 switch (jointype)
3477 {
3478 case JOIN_INNER:
3479 break;
3480 case JOIN_LEFT:
3481 if (bms_overlap(nonnullable_rels, right_state->relids))
3482 jointype = JOIN_INNER;
3483 break;
3484 case JOIN_RIGHT:
3485 if (bms_overlap(nonnullable_rels, left_state->relids))
3486 jointype = JOIN_INNER;
3487 break;
3488 case JOIN_FULL:
3489 if (bms_overlap(nonnullable_rels, left_state->relids))
3490 {
3491 if (bms_overlap(nonnullable_rels, right_state->relids))
3492 jointype = JOIN_INNER;
3493 else
3494 {
3495 jointype = JOIN_LEFT;
3496 /* Also report partial reduction in state2 */
3498 right_state->relids);
3499 }
3500 }
3501 else
3502 {
3503 if (bms_overlap(nonnullable_rels, right_state->relids))
3504 {
3505 jointype = JOIN_RIGHT;
3506 /* Also report partial reduction in state2 */
3508 left_state->relids);
3509 }
3510 }
3511 break;
3512 case JOIN_SEMI:
3513 case JOIN_ANTI:
3514
3515 /*
3516 * These could only have been introduced by pull_up_sublinks,
3517 * so there's no way that upper quals could refer to their
3518 * righthand sides, and no point in checking. We don't expect
3519 * to see JOIN_RIGHT_SEMI or JOIN_RIGHT_ANTI yet.
3520 */
3521 break;
3522 default:
3523 elog(ERROR, "unrecognized join type: %d",
3524 (int) jointype);
3525 break;
3526 }
3527
3528 /*
3529 * Convert JOIN_RIGHT to JOIN_LEFT. Note that in the case where we
3530 * reduced JOIN_FULL to JOIN_RIGHT, this will mean the JoinExpr no
3531 * longer matches the internal ordering of any CoalesceExpr's built to
3532 * represent merged join variables. We don't care about that at
3533 * present, but be wary of it ...
3534 */
3535 if (jointype == JOIN_RIGHT)
3536 {
3537 Node *tmparg;
3538
3539 tmparg = j->larg;
3540 j->larg = j->rarg;
3541 j->rarg = tmparg;
3542 jointype = JOIN_LEFT;
3543 right_state = linitial(state1->sub_states);
3544 left_state = lsecond(state1->sub_states);
3545 }
3546
3547 /*
3548 * See if we can reduce JOIN_LEFT to JOIN_ANTI. This is the case if
3549 * any var from the RHS was forced null by higher qual levels, but is
3550 * known to be non-nullable. We detect this either by seeing if the
3551 * join's own quals are strict for the var, or by checking if the var
3552 * is defined NOT NULL by table constraints (being careful to exclude
3553 * vars that are nullable due to lower-level outer joins). In either
3554 * case, the only way the higher qual clause's requirement for NULL
3555 * can be met is if the join fails to match, producing a null-extended
3556 * row. Thus, we can treat this as an anti-join.
3557 */
3558 if (jointype == JOIN_LEFT && forced_null_vars != NIL)
3559 {
3561 Bitmapset *overlap;
3562
3563 /* Find Vars in j->quals that must be non-null in joined rows */
3565
3566 /*
3567 * It's not sufficient to check whether nonnullable_vars and
3568 * forced_null_vars overlap: we need to know if the overlap
3569 * includes any RHS variables.
3570 *
3571 * Also check if any forced-null var is defined NOT NULL by table
3572 * constraints.
3573 */
3575 if (bms_overlap(overlap, right_state->relids) ||
3577 jointype = JOIN_ANTI;
3578 }
3579
3580 /*
3581 * Apply the jointype change, if any, to both jointree node and RTE.
3582 * Also, if we changed an RTE to INNER, add its RTI to inner_reduced.
3583 */
3584 if (rtindex && jointype != j->jointype)
3585 {
3586 RangeTblEntry *rte = rt_fetch(rtindex, root->parse->rtable);
3587
3588 Assert(rte->rtekind == RTE_JOIN);
3589 Assert(rte->jointype == j->jointype);
3590 rte->jointype = jointype;
3591 if (jointype == JOIN_INNER)
3592 state2->inner_reduced = bms_add_member(state2->inner_reduced,
3593 rtindex);
3594 }
3595 j->jointype = jointype;
3596
3597 /* Only recurse if there's more to do below here */
3598 if (left_state->contains_outer || right_state->contains_outer)
3599 {
3604
3605 /*
3606 * If this join is (now) inner, we can add any constraints its
3607 * quals provide to those we got from above. But if it is outer,
3608 * we can pass down the local constraints only into the nullable
3609 * side, because an outer join never eliminates any rows from its
3610 * non-nullable side. Also, there is no point in passing upper
3611 * constraints into the nullable side, since if there were any
3612 * we'd have been able to reduce the join. (In the case of upper
3613 * forced-null constraints, we *must not* pass them into the
3614 * nullable side --- they either applied here, or not.) The upshot
3615 * is that we pass either the local or the upper constraints,
3616 * never both, to the children of an outer join.
3617 *
3618 * Note that a SEMI join works like an inner join here: it's okay
3619 * to pass down both local and upper constraints. (There can't be
3620 * any upper constraints affecting its inner side, but it's not
3621 * worth having a separate code path to avoid passing them.)
3622 *
3623 * At a FULL join we just punt and pass nothing down --- is it
3624 * possible to be smarter?
3625 */
3626 if (jointype != JOIN_FULL)
3627 {
3630 if (jointype == JOIN_INNER || jointype == JOIN_SEMI)
3631 {
3632 /* OK to merge upper and local constraints */
3634 nonnullable_rels);
3637 }
3638 }
3639 else
3640 {
3641 /* no use in calculating these */
3644 }
3645
3646 if (left_state->contains_outer)
3647 {
3648 if (jointype == JOIN_INNER || jointype == JOIN_SEMI)
3649 {
3650 /* pass union of local and upper constraints */
3653 }
3654 else if (jointype != JOIN_FULL) /* ie, LEFT or ANTI */
3655 {
3656 /* can't pass local constraints to non-nullable side */
3657 pass_nonnullable_rels = nonnullable_rels;
3659 }
3660 else
3661 {
3662 /* no constraints pass through JOIN_FULL */
3665 }
3667 state2, root,
3670 }
3671
3672 if (right_state->contains_outer)
3673 {
3674 if (jointype != JOIN_FULL) /* ie, INNER/LEFT/SEMI/ANTI */
3675 {
3676 /* pass appropriate constraints, per comment above */
3679 }
3680 else
3681 {
3682 /* no constraints pass through JOIN_FULL */
3685 }
3687 state2, root,
3690 }
3692 }
3693 }
3694 else
3695 elog(ERROR, "unrecognized node type: %d",
3696 (int) nodeTag(jtnode));
3697}
3698
3699/* Helper for reduce_outer_joins_pass2 */
3700static void
3702 int rtindex, Relids relids)
3703{
3705
3707 statep->full_join_rti = rtindex;
3708 statep->unreduced_side = relids;
3709 state2->partial_reduced = lappend(state2->partial_reduced, statep);
3710}
3711
3712/*
3713 * has_notnull_forced_var
3714 * Check if "forced_null_vars" contains any Vars belonging to the subtree
3715 * indicated by "right_state" that are known to be non-nullable due to
3716 * table constraints.
3717 *
3718 * Note that we must also consider the situation where a NOT NULL Var can be
3719 * nulled by lower-level outer joins.
3720 *
3721 * Helper for reduce_outer_joins_pass2.
3722 */
3723static bool
3726{
3727 int varno = -1;
3728
3730 {
3732 Bitmapset *notnullattnums;
3734 int attno;
3735
3736 varno++;
3737
3738 /* Skip empty bitmaps */
3739 if (bms_is_empty(attrs))
3740 continue;
3741
3742 /* Skip Vars that do not belong to the target relations */
3743 if (!bms_is_member(varno, right_state->relids))
3744 continue;
3745
3746 /*
3747 * Skip Vars that can be nulled by lower-level outer joins within the
3748 * given subtree. These Vars might be NULL even if the schema defines
3749 * them as NOT NULL.
3750 */
3751 if (bms_is_member(varno, right_state->nullable_rels))
3752 continue;
3753
3754 /*
3755 * Iterate over attributes and adjust the bitmap indexes by
3756 * FirstLowInvalidHeapAttributeNumber to get the actual attribute
3757 * numbers.
3758 */
3759 attno = -1;
3760 while ((attno = bms_next_member(attrs, attno)) >= 0)
3761 {
3763
3764 /* system columns cannot be NULL */
3765 if (real_attno < 0)
3766 return true;
3767
3769 }
3770
3771 rte = rt_fetch(varno, root->parse->rtable);
3772
3773 /* We can only reason about ordinary relations */
3774 if (rte->rtekind != RTE_RELATION)
3775 {
3777 continue;
3778 }
3779
3780 /*
3781 * We must skip inheritance parent tables, as some child tables may
3782 * have a NOT NULL constraint for a column while others may not. This
3783 * cannot happen with partitioned tables, though.
3784 */
3785 if (rte->inh && rte->relkind != RELKIND_PARTITIONED_TABLE)
3786 {
3788 continue;
3789 }
3790
3791 /* Get the column not-null constraint information for this relation */
3792 notnullattnums = find_relation_notnullatts(root, rte->relid);
3793
3794 /*
3795 * Check if any forced-null attributes are defined as NOT NULL by
3796 * table constraints.
3797 */
3798 if (bms_overlap(notnullattnums, forcednullattnums))
3799 {
3801 return true;
3802 }
3803
3805 }
3806
3807 return false;
3808}
3809
3810
3811/*
3812 * remove_useless_result_rtes
3813 * Attempt to remove RTE_RESULT RTEs from the join tree.
3814 * Also, elide single-child FromExprs where possible.
3815 *
3816 * We can remove RTE_RESULT entries from the join tree using the knowledge
3817 * that RTE_RESULT returns exactly one row and has no output columns. Hence,
3818 * if one is inner-joined to anything else, we can delete it. Optimizations
3819 * are also possible for some outer-join cases, as detailed below.
3820 *
3821 * This pass also replaces single-child FromExprs with their child node
3822 * where possible. It's appropriate to do that here and not earlier because
3823 * RTE_RESULT removal might reduce a multiple-child FromExpr to have only one
3824 * child. We can remove such a FromExpr if its quals are empty, or if it's
3825 * semantically valid to merge the quals into those of the parent node.
3826 * While removing unnecessary join tree nodes has some micro-efficiency value,
3827 * the real reason to do this is to eliminate cases where the nullable side of
3828 * an outer join node is a FromExpr whose single child is another outer join.
3829 * To correctly determine whether the two outer joins can commute,
3830 * deconstruct_jointree() must treat any quals of such a FromExpr as being
3831 * degenerate quals of the upper outer join. The best way to do that is to
3832 * make them actually *be* quals of the upper join, by dropping the FromExpr
3833 * and hoisting the quals up into the upper join's quals. (Note that there is
3834 * no hazard when the intermediate FromExpr has multiple children, since then
3835 * it represents an inner join that cannot commute with the upper outer join.)
3836 * As long as we have to do that, we might as well elide such FromExprs
3837 * everywhere.
3838 *
3839 * Some of these optimizations depend on recognizing empty (constant-true)
3840 * quals for FromExprs and JoinExprs. That makes it useful to apply this
3841 * optimization pass after expression preprocessing, since that will have
3842 * eliminated constant-true quals, allowing more cases to be recognized as
3843 * optimizable. What's more, the usual reason for an RTE_RESULT to be present
3844 * is that we pulled up a subquery or VALUES clause, thus very possibly
3845 * replacing Vars with constants, making it more likely that a qual can be
3846 * reduced to constant true. Also, because some optimizations depend on
3847 * the outer-join type, it's best to have done reduce_outer_joins() first.
3848 *
3849 * A PlaceHolderVar referencing an RTE_RESULT RTE poses an obstacle to this
3850 * process: we must remove the RTE_RESULT's relid from the PHV's phrels, but
3851 * we must not reduce the phrels set to empty. If that would happen, and
3852 * the RTE_RESULT is an immediate child of an outer join, we have to give up
3853 * and not remove the RTE_RESULT: there is noplace else to evaluate the
3854 * PlaceHolderVar. (That is, in such cases the RTE_RESULT *does* have output
3855 * columns.) But if the RTE_RESULT is an immediate child of an inner join,
3856 * we can usually change the PlaceHolderVar's phrels so as to evaluate it at
3857 * the inner join instead. This is OK because we really only care that PHVs
3858 * are evaluated above or below the correct outer joins. We can't, however,
3859 * postpone the evaluation of a PHV to above where it is used; so there are
3860 * some checks below on whether output PHVs are laterally referenced in the
3861 * other join input rel(s).
3862 *
3863 * We used to try to do this work as part of pull_up_subqueries() where the
3864 * potentially-optimizable cases get introduced; but it's way simpler, and
3865 * more effective, to do it separately.
3866 */
3867void
3869{
3871 ListCell *cell;
3872
3873 /* Top level of jointree must always be a FromExpr */
3874 Assert(IsA(root->parse->jointree, FromExpr));
3875 /* Recurse ... */
3876 root->parse->jointree = (FromExpr *)
3878 (Node *) root->parse->jointree,
3879 NULL,
3881 /* We should still have a FromExpr */
3882 Assert(IsA(root->parse->jointree, FromExpr));
3883
3884 /*
3885 * If we removed any outer-join nodes from the jointree, run around and
3886 * remove references to those joins as nulling rels. (There could be such
3887 * references in PHVs that we pulled up out of the original subquery that
3888 * the RESULT rel replaced. This is kosher on the grounds that we now
3889 * know that such an outer join wouldn't really have nulled anything.) We
3890 * don't do this during the main recursion, for simplicity and because we
3891 * can handle all such joins in a single pass over the parse tree.
3892 */
3894 {
3895 root->parse = (Query *)
3896 remove_nulling_relids((Node *) root->parse,
3898 NULL);
3899 /* There could be references in the append_rel_list, too */
3900 root->append_rel_list = (List *)
3901 remove_nulling_relids((Node *) root->append_rel_list,
3903 NULL);
3904 }
3905
3906 /*
3907 * Remove any PlanRowMark referencing an RTE_RESULT RTE. We obviously
3908 * must do that for any RTE_RESULT that we just removed. But one for a
3909 * RTE that we did not remove can be dropped anyway: since the RTE has
3910 * only one possible output row, there is no need for EPQ to mark and
3911 * restore that row.
3912 *
3913 * It's necessary, not optional, to remove the PlanRowMark for a surviving
3914 * RTE_RESULT RTE; otherwise we'll generate a whole-row Var for the
3915 * RTE_RESULT, which the executor has no support for.
3916 */
3917 foreach(cell, root->rowMarks)
3918 {
3919 PlanRowMark *rc = (PlanRowMark *) lfirst(cell);
3920
3921 if (rt_fetch(rc->rti, root->parse->rtable)->rtekind == RTE_RESULT)
3922 root->rowMarks = foreach_delete_current(root->rowMarks, cell);
3923 }
3924}
3925
3926/*
3927 * remove_useless_results_recurse
3928 * Recursive guts of remove_useless_result_rtes.
3929 *
3930 * This recursively processes the jointree and returns a modified jointree.
3931 * In addition, the RT indexes of any removed outer-join nodes are added to
3932 * *dropped_outer_joins.
3933 *
3934 * jtnode is the current jointree node. If it could be valid to merge
3935 * its quals into those of the parent node, parent_quals should point to
3936 * the parent's quals list; otherwise, pass NULL for parent_quals.
3937 * (Note that in some cases, parent_quals points to the quals of a parent
3938 * more than one level up in the tree.)
3939 */
3940static Node *
3944{
3945 Assert(jtnode != NULL);
3946 if (IsA(jtnode, RangeTblRef))
3947 {
3948 /* Can't immediately do anything with a RangeTblRef */
3949 }
3950 else if (IsA(jtnode, FromExpr))
3951 {
3952 FromExpr *f = (FromExpr *) jtnode;
3954 ListCell *cell;
3955
3956 /*
3957 * We can drop RTE_RESULT rels from the fromlist so long as at least
3958 * one child remains, since joining to a one-row table changes
3959 * nothing. (But we can't drop a RTE_RESULT that computes PHV(s) that
3960 * are needed by some sibling. The cleanup transformation below would
3961 * reassign the PHVs to be computed at the join, which is too late for
3962 * the sibling's use.) The easiest way to mechanize this rule is to
3963 * modify the list in-place.
3964 */
3965 foreach(cell, f->fromlist)
3966 {
3967 Node *child = (Node *) lfirst(cell);
3968 int varno;
3969
3970 /* Recursively transform child, allowing it to push up quals ... */
3971 child = remove_useless_results_recurse(root, child,
3972 &f->quals,
3974 /* ... and stick it back into the tree */
3975 lfirst(cell) = child;
3976
3977 /*
3978 * If it's an RTE_RESULT with at least one sibling, and no sibling
3979 * references dependent PHVs, we can drop it. We don't yet know
3980 * what the inner join's final relid set will be, so postpone
3981 * cleanup of PHVs etc till after this loop.
3982 */
3983 if (list_length(f->fromlist) > 1 &&
3984 (varno = get_result_relid(root, child)) != 0 &&
3986 {
3987 f->fromlist = foreach_delete_current(f->fromlist, cell);
3989 }
3990 }
3991
3992 /*
3993 * Clean up if we dropped any RTE_RESULT RTEs. This is a bit
3994 * inefficient if there's more than one, but it seems better to
3995 * optimize the support code for the single-relid case.
3996 */
3997 if (result_relids)
3998 {
3999 int varno = -1;
4000
4001 while ((varno = bms_next_member(result_relids, varno)) >= 0)
4002 remove_result_refs(root, varno, (Node *) f);
4003 }
4004
4005 /*
4006 * If the FromExpr now has only one child, see if we can elide it.
4007 * This is always valid if there are no quals, except at the top of
4008 * the jointree (since Query.jointree is required to point to a
4009 * FromExpr). Otherwise, we can do it if we can push the quals up to
4010 * the parent node.
4011 *
4012 * Note: while it would not be terribly hard to generalize this
4013 * transformation to merge multi-child FromExprs into their parent
4014 * FromExpr, that risks making the parent join too expensive to plan.
4015 * We leave it to later processing to decide heuristically whether
4016 * that's a good idea. Pulling up a single child is always OK,
4017 * however.
4018 */
4019 if (list_length(f->fromlist) == 1 &&
4020 f != root->parse->jointree &&
4021 (f->quals == NULL || parent_quals != NULL))
4022 {
4023 /*
4024 * Merge any quals up to parent. They should be in implicit-AND
4025 * format by now, so we just need to concatenate lists. Put the
4026 * child quals at the front, on the grounds that they should
4027 * nominally be evaluated earlier.
4028 */
4029 if (f->quals != NULL)
4030 *parent_quals = (Node *)
4033 return (Node *) linitial(f->fromlist);
4034 }
4035 }
4036 else if (IsA(jtnode, JoinExpr))
4037 {
4038 JoinExpr *j = (JoinExpr *) jtnode;
4039 int varno;
4040
4041 /*
4042 * First, recurse. We can absorb pushed-up FromExpr quals from either
4043 * child into this node if the jointype is INNER, since then this is
4044 * equivalent to a FromExpr. When the jointype is LEFT, we can absorb
4045 * quals from the RHS child into the current node, as they're
4046 * essentially degenerate quals of the outer join. Moreover, if we've
4047 * been passed down a parent_quals pointer then we can allow quals of
4048 * the LHS child to be absorbed into the parent. (This is important
4049 * to ensure we remove single-child FromExprs immediately below
4050 * commutable left joins.) For other jointypes, we can't move child
4051 * quals up, or at least there's no particular reason to.
4052 */
4053 j->larg = remove_useless_results_recurse(root, j->larg,
4054 (j->jointype == JOIN_INNER) ?
4055 &j->quals :
4056 (j->jointype == JOIN_LEFT) ?
4059 j->rarg = remove_useless_results_recurse(root, j->rarg,
4060 (j->jointype == JOIN_INNER ||
4061 j->jointype == JOIN_LEFT) ?
4062 &j->quals : NULL,
4064
4065 /* Apply join-type-specific optimization rules */
4066 switch (j->jointype)
4067 {
4068 case JOIN_INNER:
4069
4070 /*
4071 * An inner join is equivalent to a FromExpr, so if either
4072 * side was simplified to an RTE_RESULT rel, we can replace
4073 * the join with a FromExpr with just the other side.
4074 * Furthermore, we can elide that FromExpr according to the
4075 * same rules as above.
4076 *
4077 * Just as in the FromExpr case, we can't simplify if the
4078 * other input rel references any PHVs that are marked as to
4079 * be evaluated at the RTE_RESULT rel, because we can't
4080 * postpone their evaluation in that case. But we only have
4081 * to check this in cases where it's syntactically legal for
4082 * the other input to have a LATERAL reference to the
4083 * RTE_RESULT rel. Only RHSes of inner and left joins are
4084 * allowed to have such refs.
4085 */
4086 if ((varno = get_result_relid(root, j->larg)) != 0 &&
4087 !find_dependent_phvs_in_jointree(root, j->rarg, varno))
4088 {
4089 remove_result_refs(root, varno, j->rarg);
4090 if (j->quals != NULL && parent_quals == NULL)
4091 jtnode = (Node *)
4092 makeFromExpr(list_make1(j->rarg), j->quals);
4093 else
4094 {
4095 /* Merge any quals up to parent */
4096 if (j->quals != NULL)
4097 *parent_quals = (Node *)
4098 list_concat(castNode(List, j->quals),
4100 jtnode = j->rarg;
4101 }
4102 }
4103 else if ((varno = get_result_relid(root, j->rarg)) != 0)
4104 {
4105 remove_result_refs(root, varno, j->larg);
4106 if (j->quals != NULL && parent_quals == NULL)
4107 jtnode = (Node *)
4108 makeFromExpr(list_make1(j->larg), j->quals);
4109 else
4110 {
4111 /* Merge any quals up to parent */
4112 if (j->quals != NULL)
4113 *parent_quals = (Node *)
4114 list_concat(castNode(List, j->quals),
4116 jtnode = j->larg;
4117 }
4118 }
4119 break;
4120 case JOIN_LEFT:
4121
4122 /*
4123 * We can simplify this case if the RHS is an RTE_RESULT, with
4124 * two different possibilities:
4125 *
4126 * If the qual is empty (JOIN ON TRUE), then the join can be
4127 * strength-reduced to a plain inner join, since each LHS row
4128 * necessarily has exactly one join partner. So we can always
4129 * discard the RHS, much as in the JOIN_INNER case above.
4130 * (Again, the LHS could not contain a lateral reference to
4131 * the RHS.)
4132 *
4133 * Otherwise, it's still true that each LHS row should be
4134 * returned exactly once, and since the RHS returns no columns
4135 * (unless there are PHVs that have to be evaluated there), we
4136 * don't much care if it's null-extended or not. So in this
4137 * case also, we can just ignore the qual and discard the left
4138 * join.
4139 */
4140 if ((varno = get_result_relid(root, j->rarg)) != 0 &&
4141 (j->quals == NULL ||
4142 !find_dependent_phvs(root, varno)))
4143 {
4144 remove_result_refs(root, varno, j->larg);
4146 j->rtindex);
4147 jtnode = j->larg;
4148 }
4149 break;
4150 case JOIN_SEMI:
4151
4152 /*
4153 * We may simplify this case if the RHS is an RTE_RESULT; the
4154 * join qual becomes effectively just a filter qual for the
4155 * LHS, since we should either return the LHS row or not. The
4156 * filter clause must go into a new FromExpr if we can't push
4157 * it up to the parent.
4158 *
4159 * There is a fine point about PHVs that are supposed to be
4160 * evaluated at the RHS. Such PHVs could only appear in the
4161 * semijoin's qual, since the rest of the query cannot
4162 * reference any outputs of the semijoin's RHS. Therefore,
4163 * they can't actually go to null before being examined, and
4164 * it'd be OK to just remove the PHV wrapping. We don't have
4165 * infrastructure for that, but remove_result_refs() will
4166 * relabel them as to be evaluated at the LHS, which is fine.
4167 *
4168 * Also, we don't need to worry about removing traces of the
4169 * join's rtindex, since it hasn't got one.
4170 */
4171 if ((varno = get_result_relid(root, j->rarg)) != 0)
4172 {
4173 Assert(j->rtindex == 0);
4174 remove_result_refs(root, varno, j->larg);
4175 if (j->quals != NULL && parent_quals == NULL)
4176 jtnode = (Node *)
4177 makeFromExpr(list_make1(j->larg), j->quals);
4178 else
4179 {
4180 /* Merge any quals up to parent */
4181 if (j->quals != NULL)
4182 *parent_quals = (Node *)
4183 list_concat(castNode(List, j->quals),
4185 jtnode = j->larg;
4186 }
4187 }
4188 break;
4189 case JOIN_FULL:
4190 case JOIN_ANTI:
4191 /* We have no special smarts for these cases */
4192 break;
4193 default:
4194 /* Note: JOIN_RIGHT should be gone at this point */
4195 elog(ERROR, "unrecognized join type: %d",
4196 (int) j->jointype);
4197 break;
4198 }
4199 }
4200 else
4201 elog(ERROR, "unrecognized node type: %d",
4202 (int) nodeTag(jtnode));
4203 return jtnode;
4204}
4205
4206/*
4207 * get_result_relid
4208 * If jtnode is a RangeTblRef for an RTE_RESULT RTE, return its relid;
4209 * otherwise return 0.
4210 */
4211static int
4213{
4214 int varno;
4215
4216 if (!IsA(jtnode, RangeTblRef))
4217 return 0;
4218 varno = ((RangeTblRef *) jtnode)->rtindex;
4219 if (rt_fetch(varno, root->parse->rtable)->rtekind != RTE_RESULT)
4220 return 0;
4221 return varno;
4222}
4223
4224/*
4225 * remove_result_refs
4226 * Helper routine for dropping an unneeded RTE_RESULT RTE.
4227 *
4228 * This doesn't physically remove the RTE from the jointree, because that's
4229 * more easily handled in remove_useless_results_recurse. What it does do
4230 * is the necessary cleanup in the rest of the tree: we must adjust any PHVs
4231 * that may reference the RTE. Be sure to call this at a point where the
4232 * jointree is valid (no disconnected nodes).
4233 *
4234 * Note that we don't need to process the append_rel_list, since RTEs
4235 * referenced directly in the jointree won't be appendrel members.
4236 *
4237 * varno is the RTE_RESULT's relid.
4238 * newjtloc is the jointree location at which any PHVs referencing the
4239 * RTE_RESULT should be evaluated instead.
4240 */
4241static void
4243{
4244 /* Fix up PlaceHolderVars as needed */
4245 /* If there are no PHVs anywhere, we can skip this bit */
4246 if (root->glob->lastPHId != 0)
4247 {
4248 Relids subrelids;
4249
4250 subrelids = get_relids_in_jointree(newjtloc, true, false);
4251 Assert(!bms_is_empty(subrelids));
4252 substitute_phv_relids((Node *) root->parse, varno, subrelids);
4253 fix_append_rel_relids(root, varno, subrelids);
4254 }
4255
4256 /*
4257 * We also need to remove any PlanRowMark referencing the RTE, but we
4258 * postpone that work until we return to remove_useless_result_rtes.
4259 */
4260}
4261
4262
4263/*
4264 * find_dependent_phvs - are there any PlaceHolderVars whose relids are
4265 * exactly the given varno?
4266 *
4267 * find_dependent_phvs should be used when we want to see if there are
4268 * any such PHVs anywhere in the Query. Another use-case is to see if
4269 * a subtree of the join tree contains such PHVs; but for that, we have
4270 * to look not only at the join tree nodes themselves but at the
4271 * referenced RTEs. For that, use find_dependent_phvs_in_jointree.
4272 */
4273
4279
4280static bool
4283{
4284 if (node == NULL)
4285 return false;
4286 if (IsA(node, PlaceHolderVar))
4287 {
4288 PlaceHolderVar *phv = (PlaceHolderVar *) node;
4289
4290 if (phv->phlevelsup == context->sublevels_up &&
4291 bms_equal(context->relids, phv->phrels))
4292 return true;
4293 /* fall through to examine children */
4294 }
4295 if (IsA(node, Query))
4296 {
4297 /* Recurse into subselects */
4298 bool result;
4299
4300 context->sublevels_up++;
4301 result = query_tree_walker((Query *) node,
4303 context, 0);
4304 context->sublevels_up--;
4305 return result;
4306 }
4307 /* Shouldn't need to handle most planner auxiliary nodes here */
4308 Assert(!IsA(node, SpecialJoinInfo));
4309 Assert(!IsA(node, PlaceHolderInfo));
4310 Assert(!IsA(node, MinMaxAggInfo));
4311
4313}
4314
4315static bool
4317{
4319
4320 /* If there are no PHVs anywhere, we needn't work hard */
4321 if (root->glob->lastPHId == 0)
4322 return false;
4323
4324 context.relids = bms_make_singleton(varno);
4325 context.sublevels_up = 0;
4326
4327 if (query_tree_walker(root->parse, find_dependent_phvs_walker, &context, 0))
4328 return true;
4329 /* The append_rel_list could be populated already, so check it too */
4330 if (expression_tree_walker((Node *) root->append_rel_list,
4332 &context))
4333 return true;
4334 return false;
4335}
4336
4337static bool
4339{
4341 Relids subrelids;
4342 int relid;
4343
4344 /* If there are no PHVs anywhere, we needn't work hard */
4345 if (root->glob->lastPHId == 0)
4346 return false;
4347
4348 context.relids = bms_make_singleton(varno);
4349 context.sublevels_up = 0;
4350
4351 /*
4352 * See if the jointree fragment itself contains references (in join quals)
4353 */
4354 if (find_dependent_phvs_walker(node, &context))
4355 return true;
4356
4357 /*
4358 * Otherwise, identify the set of referenced RTEs (we can ignore joins,
4359 * since they should be flattened already, so their join alias lists no
4360 * longer matter), and tediously check each RTE. We can ignore RTEs that
4361 * are not marked LATERAL, though, since they couldn't possibly contain
4362 * any cross-references to other RTEs.
4363 */
4364 subrelids = get_relids_in_jointree(node, false, false);
4365 relid = -1;
4366 while ((relid = bms_next_member(subrelids, relid)) >= 0)
4367 {
4368 RangeTblEntry *rte = rt_fetch(relid, root->parse->rtable);
4369
4370 if (rte->lateral &&
4372 return true;
4373 }
4374
4375 return false;
4376}
4377
4378/*
4379 * substitute_phv_relids - adjust PlaceHolderVar relid sets after pulling up
4380 * a subquery or removing an RTE_RESULT jointree item
4381 *
4382 * Find any PlaceHolderVar nodes in the given tree that reference the
4383 * pulled-up relid, and change them to reference the replacement relid(s).
4384 *
4385 * NOTE: although this has the form of a walker, we cheat and modify the
4386 * nodes in-place. This should be OK since the tree was copied by
4387 * pullup_replace_vars earlier. Avoid scribbling on the original values of
4388 * the bitmapsets, though, because expression_tree_mutator doesn't copy those.
4389 */
4390
4397
4398static bool
4401{
4402 if (node == NULL)
4403 return false;
4404 if (IsA(node, PlaceHolderVar))
4405 {
4406 PlaceHolderVar *phv = (PlaceHolderVar *) node;
4407
4408 if (phv->phlevelsup == context->sublevels_up &&
4409 bms_is_member(context->varno, phv->phrels))
4410 {
4411 phv->phrels = bms_union(phv->phrels,
4412 context->subrelids);
4413 phv->phrels = bms_del_member(phv->phrels,
4414 context->varno);
4415 /* Assert we haven't broken the PHV */
4416 Assert(!bms_is_empty(phv->phrels));
4417 }
4418 /* fall through to examine children */
4419 }
4420 if (IsA(node, Query))
4421 {
4422 /* Recurse into subselects */
4423 bool result;
4424
4425 context->sublevels_up++;
4426 result = query_tree_walker((Query *) node,
4428 context, 0);
4429 context->sublevels_up--;
4430 return result;
4431 }
4432 /* Shouldn't need to handle planner auxiliary nodes here */
4433 Assert(!IsA(node, SpecialJoinInfo));
4434 Assert(!IsA(node, AppendRelInfo));
4435 Assert(!IsA(node, PlaceHolderInfo));
4436 Assert(!IsA(node, MinMaxAggInfo));
4437
4439}
4440
4441static void
4442substitute_phv_relids(Node *node, int varno, Relids subrelids)
4443{
4445
4446 context.varno = varno;
4447 context.sublevels_up = 0;
4448 context.subrelids = subrelids;
4449
4450 /*
4451 * Must be prepared to start with a Query or a bare expression tree.
4452 */
4455 &context,
4456 0);
4457}
4458
4459/*
4460 * fix_append_rel_relids: update RT-index fields of AppendRelInfo nodes
4461 *
4462 * When we pull up a subquery, any AppendRelInfo references to the subquery's
4463 * RT index have to be replaced by the substituted relid (and there had better
4464 * be only one). We also need to apply substitute_phv_relids to their
4465 * translated_vars lists, since those might contain PlaceHolderVars.
4466 *
4467 * We assume we may modify the AppendRelInfo nodes in-place.
4468 */
4469static void
4471{
4472 ListCell *l;
4473 int subvarno = -1;
4474
4475 /*
4476 * We only want to extract the member relid once, but we mustn't fail
4477 * immediately if there are multiple members; it could be that none of the
4478 * AppendRelInfo nodes refer to it. So compute it on first use. Note that
4479 * bms_singleton_member will complain if set is not singleton.
4480 */
4481 foreach(l, root->append_rel_list)
4482 {
4484
4485 /* The parent_relid shouldn't ever be a pullup target */
4486 Assert(appinfo->parent_relid != varno);
4487
4488 if (appinfo->child_relid == varno)
4489 {
4490 if (subvarno < 0)
4491 subvarno = bms_singleton_member(subrelids);
4492 appinfo->child_relid = subvarno;
4493 }
4494
4495 /* Also fix up any PHVs in its translated vars */
4496 if (root->glob->lastPHId != 0)
4497 substitute_phv_relids((Node *) appinfo->translated_vars,
4498 varno, subrelids);
4499 }
4500}
4501
4502/*
4503 * get_relids_in_jointree: get set of RT indexes present in a jointree
4504 *
4505 * Base-relation relids are always included in the result.
4506 * If include_outer_joins is true, outer-join RT indexes are included.
4507 * If include_inner_joins is true, inner-join RT indexes are included.
4508 *
4509 * Note that for most purposes in the planner, outer joins are included
4510 * in standard relid sets. Setting include_inner_joins true is only
4511 * appropriate for special purposes during subquery flattening.
4512 */
4513Relids
4516{
4517 Relids result = NULL;
4518
4519 if (jtnode == NULL)
4520 return result;
4521 if (IsA(jtnode, RangeTblRef))
4522 {
4523 int varno = ((RangeTblRef *) jtnode)->rtindex;
4524
4525 result = bms_make_singleton(varno);
4526 }
4527 else if (IsA(jtnode, FromExpr))
4528 {
4529 FromExpr *f = (FromExpr *) jtnode;
4530 ListCell *l;
4531
4532 foreach(l, f->fromlist)
4533 {
4538 }
4539 }
4540 else if (IsA(jtnode, JoinExpr))
4541 {
4542 JoinExpr *j = (JoinExpr *) jtnode;
4543
4551 if (j->rtindex)
4552 {
4553 if (j->jointype == JOIN_INNER)
4554 {
4556 result = bms_add_member(result, j->rtindex);
4557 }
4558 else
4559 {
4561 result = bms_add_member(result, j->rtindex);
4562 }
4563 }
4564 }
4565 else
4566 elog(ERROR, "unrecognized node type: %d",
4567 (int) nodeTag(jtnode));
4568 return result;
4569}
4570
4571/*
4572 * get_relids_for_join: get set of base+OJ RT indexes making up a join
4573 */
4574Relids
4576{
4577 Node *jtnode;
4578
4579 jtnode = find_jointree_node_for_rel((Node *) query->jointree,
4580 joinrelid);
4581 if (!jtnode)
4582 elog(ERROR, "could not find join node %d", joinrelid);
4583 return get_relids_in_jointree(jtnode, true, false);
4584}
4585
4586/*
4587 * find_jointree_node_for_rel: locate jointree node for a base or join RT index
4588 *
4589 * Returns NULL if not found
4590 */
4591static Node *
4593{
4594 if (jtnode == NULL)
4595 return NULL;
4596 if (IsA(jtnode, RangeTblRef))
4597 {
4598 int varno = ((RangeTblRef *) jtnode)->rtindex;
4599
4600 if (relid == varno)
4601 return jtnode;
4602 }
4603 else if (IsA(jtnode, FromExpr))
4604 {
4605 FromExpr *f = (FromExpr *) jtnode;
4606 ListCell *l;
4607
4608 foreach(l, f->fromlist)
4609 {
4610 jtnode = find_jointree_node_for_rel(lfirst(l), relid);
4611 if (jtnode)
4612 return jtnode;
4613 }
4614 }
4615 else if (IsA(jtnode, JoinExpr))
4616 {
4617 JoinExpr *j = (JoinExpr *) jtnode;
4618
4619 if (relid == j->rtindex)
4620 return jtnode;
4621 jtnode = find_jointree_node_for_rel(j->larg, relid);
4622 if (jtnode)
4623 return jtnode;
4624 jtnode = find_jointree_node_for_rel(j->rarg, relid);
4625 if (jtnode)
4626 return jtnode;
4627 }
4628 else
4629 elog(ERROR, "unrecognized node type: %d",
4630 (int) nodeTag(jtnode));
4631 return NULL;
4632}
4633
4634/*
4635 * get_nullingrels: collect info about which outer joins null which relations
4636 *
4637 * The result struct contains, for each leaf relation used in the query,
4638 * the set of relids of outer joins that potentially null that rel.
4639 */
4640static nullingrel_info *
4642{
4644
4645 result->rtlength = list_length(parse->rtable);
4646 result->nullingrels = palloc0_array(Relids, result->rtlength + 1);
4647 get_nullingrels_recurse((Node *) parse->jointree, NULL, result);
4648 return result;
4649}
4650
4651/*
4652 * Recursive guts of get_nullingrels().
4653 *
4654 * Note: at any recursion level, the passed-down upper_nullingrels must be
4655 * treated as a constant, but it can be stored directly into *info
4656 * if we're at leaf level. Upper recursion levels do not free their mutated
4657 * copies of the nullingrels, because those are probably referenced by
4658 * at least one leaf rel.
4659 */
4660static void
4662 nullingrel_info *info)
4663{
4664 if (jtnode == NULL)
4665 return;
4666 if (IsA(jtnode, RangeTblRef))
4667 {
4668 int varno = ((RangeTblRef *) jtnode)->rtindex;
4669
4670 Assert(varno > 0 && varno <= info->rtlength);
4671 info->nullingrels[varno] = upper_nullingrels;
4672 }
4673 else if (IsA(jtnode, FromExpr))
4674 {
4675 FromExpr *f = (FromExpr *) jtnode;
4676 ListCell *l;
4677
4678 foreach(l, f->fromlist)
4679 {
4681 }
4682 }
4683 else if (IsA(jtnode, JoinExpr))
4684 {
4685 JoinExpr *j = (JoinExpr *) jtnode;
4687
4688 switch (j->jointype)
4689 {
4690 case JOIN_INNER:
4693 break;
4694 case JOIN_LEFT:
4695 case JOIN_SEMI:
4696 case JOIN_ANTI:
4698 j->rtindex);
4701 break;
4702 case JOIN_FULL:
4704 j->rtindex);
4707 break;
4708 case JOIN_RIGHT:
4710 j->rtindex);
4713 break;
4714 default:
4715 elog(ERROR, "unrecognized join type: %d",
4716 (int) j->jointype);
4717 break;
4718 }
4719 }
4720 else
4721 elog(ERROR, "unrecognized node type: %d",
4722 (int) nodeTag(jtnode));
4723}
int16 AttrNumber
Definition attnum.h:21
#define InvalidAttrNumber
Definition attnum.h:23
Bitmapset * bms_make_singleton(int x)
Definition bitmapset.c:216
Bitmapset * bms_intersect(const Bitmapset *a, const Bitmapset *b)
Definition bitmapset.c:292
bool bms_equal(const Bitmapset *a, const Bitmapset *b)
Definition bitmapset.c:142
int bms_next_member(const Bitmapset *a, int prevbit)
Definition bitmapset.c:1290
Bitmapset * bms_del_members(Bitmapset *a, const Bitmapset *b)
Definition bitmapset.c:1145
Bitmapset * bms_del_member(Bitmapset *a, int x)
Definition bitmapset.c:852
bool bms_is_subset(const Bitmapset *a, const Bitmapset *b)
Definition bitmapset.c:412
int bms_singleton_member(const Bitmapset *a)
Definition bitmapset.c:665
void bms_free(Bitmapset *a)
Definition bitmapset.c:239
bool bms_is_member(int x, const Bitmapset *a)
Definition bitmapset.c:510
Bitmapset * bms_add_member(Bitmapset *a, int x)
Definition bitmapset.c:799
Bitmapset * bms_add_members(Bitmapset *a, const Bitmapset *b)
Definition bitmapset.c:901
Bitmapset * bms_union(const Bitmapset *a, const Bitmapset *b)
Definition bitmapset.c:251
bool bms_overlap(const Bitmapset *a, const Bitmapset *b)
Definition bitmapset.c:575
Bitmapset * bms_join(Bitmapset *a, Bitmapset *b)
Definition bitmapset.c:1214
Bitmapset * bms_copy(const Bitmapset *a)
Definition bitmapset.c:122
#define bms_is_empty(a)
Definition bitmapset.h:118
#define Assert(condition)
Definition c.h:943
unsigned int Index
Definition c.h:698
uint32 result
memcpy(sums, checksumBaseOffsets, sizeof(checksumBaseOffsets))
List * find_forced_null_vars(Node *node)
Definition clauses.c:1934
Query * inline_function_in_from(PlannerInfo *root, RangeTblEntry *rte)
Definition clauses.c:5780
Node * eval_const_expressions(PlannerInfo *root, Node *node)
Definition clauses.c:2498
List * find_nonnullable_vars(Node *clause)
Definition clauses.c:1725
Relids find_nonnullable_rels(Node *clause)
Definition clauses.c:1474
bool contain_nonstrict_functions(Node *clause)
Definition clauses.c:1004
bool contain_volatile_functions(Node *clause)
Definition clauses.c:549
static bool restricted
Definition command.c:199
#define ERROR
Definition elog.h:39
#define elog(elevel,...)
Definition elog.h:227
#define palloc_object(type)
Definition fe_memutils.h:74
#define palloc0_array(type, count)
Definition fe_memutils.h:77
TypeFuncClass get_expr_result_type(Node *expr, Oid *resultTypeId, TupleDesc *resultTupleDesc)
Definition funcapi.c:299
TypeFuncClass
Definition funcapi.h:147
@ TYPEFUNC_SCALAR
Definition funcapi.h:148
void parse(int)
Definition parse.c:49
int j
Definition isn.c:78
int i
Definition isn.c:77
List * lappend(List *list, void *datum)
Definition list.c:339
List * list_concat(List *list1, const List *list2)
Definition list.c:561
#define NoLock
Definition lockdefs.h:34
Alias * makeAlias(const char *aliasname, List *colnames)
Definition makefuncs.c:438
Var * makeVarFromTargetEntry(int varno, TargetEntry *tle)
Definition makefuncs.c:107
FromExpr * makeFromExpr(List *fromlist, Node *quals)
Definition makefuncs.c:336
Var * makeVar(int varno, AttrNumber varattno, Oid vartype, int32 vartypmod, Oid varcollid, Index varlevelsup)
Definition makefuncs.c:66
Var * makeWholeRowVar(RangeTblEntry *rte, int varno, Index varlevelsup, bool allowScalar)
Definition makefuncs.c:137
Expr * make_andclause(List *andclauses)
Definition makefuncs.c:727
TargetEntry * makeTargetEntry(Expr *expr, AttrNumber resno, char *resname, bool resjunk)
Definition makefuncs.c:289
Node * make_and_qual(Node *qual1, Node *qual2)
Definition makefuncs.c:780
void * palloc0(Size size)
Definition mcxt.c:1417
MemoryContext CurrentMemoryContext
Definition mcxt.c:160
#define CHECK_FOR_INTERRUPTS()
Definition miscadmin.h:125
List * mbms_add_members(List *a, const List *b)
Bitmapset * mbms_overlap_sets(const List *a, const List *b)
bool expression_returns_set(Node *clause)
Definition nodeFuncs.c:768
static bool is_andclause(const void *clause)
Definition nodeFuncs.h:107
#define query_tree_walker(q, w, c, f)
Definition nodeFuncs.h:158
#define query_or_expression_tree_walker(n, w, c, f)
Definition nodeFuncs.h:171
#define range_table_entry_walker(r, w, c, f)
Definition nodeFuncs.h:168
#define expression_tree_walker(n, w, c)
Definition nodeFuncs.h:153
static bool is_notclause(const void *clause)
Definition nodeFuncs.h:125
static Expr * get_notclausearg(const void *notclause)
Definition nodeFuncs.h:134
#define IsA(nodeptr, _type_)
Definition nodes.h:164
#define copyObject(obj)
Definition nodes.h:232
#define nodeTag(nodeptr)
Definition nodes.h:139
@ CMD_MERGE
Definition nodes.h:279
@ CMD_SELECT
Definition nodes.h:275
@ CMD_NOTHING
Definition nodes.h:282
#define makeNode(_type_)
Definition nodes.h:161
#define castNode(_type_, nodeptr)
Definition nodes.h:182
JoinType
Definition nodes.h:298
@ JOIN_SEMI
Definition nodes.h:317
@ JOIN_FULL
Definition nodes.h:305
@ JOIN_INNER
Definition nodes.h:303
@ JOIN_RIGHT
Definition nodes.h:306
@ JOIN_LEFT
Definition nodes.h:304
@ JOIN_ANTI
Definition nodes.h:318
@ SETOP_UNION
@ RTE_JOIN
@ RTE_CTE
@ RTE_NAMEDTUPLESTORE
@ RTE_VALUES
@ RTE_SUBQUERY
@ RTE_RESULT
@ RTE_FUNCTION
@ RTE_TABLEFUNC
@ RTE_GROUP
@ RTE_GRAPH_TABLE
@ RTE_RELATION
#define rt_fetch(rangetable_index, rangetable)
Definition parsetree.h:31
FormData_pg_attribute * Form_pg_attribute
#define lfirst(lc)
Definition pg_list.h:172
static int list_length(const List *l)
Definition pg_list.h:152
#define linitial_node(type, l)
Definition pg_list.h:181
#define NIL
Definition pg_list.h:68
#define forboth(cell1, list1, cell2, list2)
Definition pg_list.h:550
#define foreach_delete_current(lst, var_or_cell)
Definition pg_list.h:423
#define list_make1(x1)
Definition pg_list.h:244
#define linitial(l)
Definition pg_list.h:178
#define lsecond(l)
Definition pg_list.h:183
#define foreach_node(type, var, lst)
Definition pg_list.h:528
#define list_make2(x1, x2)
Definition pg_list.h:246
static rewind_source * source
Definition pg_rewind.c:89
PlaceHolderVar * make_placeholder_expr(PlannerInfo *root, Expr *expr, Relids phrels)
Definition placeholder.c:54
void get_relation_notnullatts(PlannerInfo *root, Relation relation)
Definition plancat.c:690
Bitmapset * find_relation_notnullatts(PlannerInfo *root, Oid relid)
Definition plancat.c:763
#define InvalidOid
unsigned int Oid
static Node * pull_up_subqueries_recurse(PlannerInfo *root, Node *jtnode, JoinExpr *lowest_outer_join, AppendRelInfo *containing_appendrel)
static nullingrel_info * get_nullingrels(Query *parse)
static void remove_result_refs(PlannerInfo *root, int varno, Node *newjtloc)
static Node * pull_up_constant_function(PlannerInfo *root, Node *jtnode, RangeTblEntry *rte, AppendRelInfo *containing_appendrel)
void preprocess_function_rtes(PlannerInfo *root)
static bool find_dependent_phvs_walker(Node *node, find_dependent_phvs_context *context)
static Node * pullup_replace_vars_callback(const Var *var, replace_rte_variables_context *context)
static Node * find_jointree_node_for_rel(Node *jtnode, int relid)
static Node * pull_up_simple_union_all(PlannerInfo *root, Node *jtnode, RangeTblEntry *rte)
static void reduce_outer_joins_pass2(Node *jtnode, reduce_outer_joins_pass1_state *state1, reduce_outer_joins_pass2_state *state2, PlannerInfo *root, Relids nonnullable_rels, List *forced_null_vars)
static void pull_up_union_leaf_queries(Node *setOp, PlannerInfo *root, int parentRTindex, Query *setOpQuery, int childRToffset)
static bool is_simple_values(PlannerInfo *root, RangeTblEntry *rte)
static void make_setop_translation_list(Query *query, int newvarno, AppendRelInfo *appinfo)
void flatten_simple_union_all(PlannerInfo *root)
void transform_MERGE_to_join(Query *parse)
static void report_reduced_full_join(reduce_outer_joins_pass2_state *state2, int rtindex, Relids relids)
static void perform_pullup_replace_vars(PlannerInfo *root, pullup_replace_vars_context *rvcontext, AppendRelInfo *containing_appendrel)
void remove_useless_result_rtes(PlannerInfo *root)
static Node * pull_up_sublinks_jointree_recurse(PlannerInfo *root, Node *jtnode, Relids *relids)
static void get_nullingrels_recurse(Node *jtnode, Relids upper_nullingrels, nullingrel_info *info)
ReplaceWrapOption
@ REPLACE_WRAP_VARFREE
@ REPLACE_WRAP_ALL
@ REPLACE_WRAP_NONE
static reduce_outer_joins_pass1_state * reduce_outer_joins_pass1(Node *jtnode)
static void replace_vars_in_jointree(Node *jtnode, pullup_replace_vars_context *context)
static bool is_simple_subquery(PlannerInfo *root, Query *subquery, RangeTblEntry *rte, JoinExpr *lowest_outer_join)
static void substitute_phv_relids(Node *node, int varno, Relids subrelids)
void pull_up_sublinks(PlannerInfo *root)
static Node * pull_up_simple_subquery(PlannerInfo *root, Node *jtnode, RangeTblEntry *rte, JoinExpr *lowest_outer_join, AppendRelInfo *containing_appendrel)
void replace_empty_jointree(Query *parse)
static bool is_simple_union_all_recurse(Node *setOp, Query *setOpQuery, List *colTypes)
static bool substitute_phv_relids_walker(Node *node, substitute_phv_relids_context *context)
static void fix_append_rel_relids(PlannerInfo *root, int varno, Relids subrelids)
static Node * remove_useless_results_recurse(PlannerInfo *root, Node *jtnode, Node **parent_quals, Relids *dropped_outer_joins)
static bool has_notnull_forced_var(PlannerInfo *root, List *forced_null_vars, reduce_outer_joins_pass1_state *right_state)
static Query * pullup_replace_vars_subquery(Query *query, pullup_replace_vars_context *context)
Relids get_relids_for_join(Query *query, int joinrelid)
void pull_up_subqueries(PlannerInfo *root)
Relids get_relids_in_jointree(Node *jtnode, bool include_outer_joins, bool include_inner_joins)
static int get_result_relid(PlannerInfo *root, Node *jtnode)
Query * preprocess_relation_rtes(PlannerInfo *root)
static Node * pull_up_simple_values(PlannerInfo *root, Node *jtnode, RangeTblEntry *rte)
static bool is_safe_append_member(Query *subquery)
static Node * pull_up_sublinks_qual_recurse(PlannerInfo *root, Node *node, Node **jtlink1, Relids available_rels1, Node **jtlink2, Relids available_rels2)
void reduce_outer_joins(PlannerInfo *root)
static Query * expand_virtual_generated_columns(PlannerInfo *root, Query *parse, RangeTblEntry *rte, int rt_index, Relation relation)
static bool find_dependent_phvs(PlannerInfo *root, int varno)
static bool jointree_contains_lateral_outer_refs(PlannerInfo *root, Node *jtnode, bool restricted, Relids safe_upper_varnos)
static Node * pullup_replace_vars(Node *expr, pullup_replace_vars_context *context)
static bool is_simple_union_all(Query *subquery)
static bool find_dependent_phvs_in_jointree(PlannerInfo *root, Node *node, int varno)
static int fb(int x)
@ ANY_SUBLINK
Definition primnodes.h:1032
@ EXISTS_SUBLINK
Definition primnodes.h:1030
#define NUM_MERGE_MATCH_KINDS
Definition primnodes.h:2029
@ IS_NOT_NULL
Definition primnodes.h:1980
@ MERGE_WHEN_NOT_MATCHED_BY_TARGET
Definition primnodes.h:2026
@ MERGE_WHEN_NOT_MATCHED_BY_SOURCE
Definition primnodes.h:2025
@ MERGE_WHEN_MATCHED
Definition primnodes.h:2024
tree ctl root
Definition radixtree.h:1857
#define RelationGetDescr(relation)
Definition rel.h:542
Node * build_generation_expression(Relation rel, int attrno)
void IncrementVarSublevelsUp_rtable(List *rtable, int delta_sublevels_up, int min_sublevels_up)
void ChangeVarNodes(Node *node, int rt_index, int new_index, int sublevels_up)
void OffsetVarNodes(Node *node, int offset, int sublevels_up)
void CombineRangeTables(List **dst_rtable, List **dst_perminfos, List *src_rtable, List *src_perminfos)
Node * add_nulling_relids(Node *node, const Bitmapset *target_relids, const Bitmapset *added_relids)
Node * remove_nulling_relids(Node *node, const Bitmapset *removable_relids, const Bitmapset *except_relids)
Node * replace_rte_variables(Node *node, int target_varno, int sublevels_up, replace_rte_variables_callback callback, void *callback_arg, bool *outer_hasSubLinks)
void IncrementVarSublevelsUp(Node *node, int delta_sublevels_up, int min_sublevels_up)
Node * ReplaceVarFromTargetList(const Var *var, RangeTblEntry *target_rte, List *targetlist, int result_relation, ReplaceVarsNoMatchOption nomatch_option, int nomatch_varno)
@ REPLACEVARS_REPORT_ERROR
void check_stack_depth(void)
Definition stack_depth.c:95
List * translated_vars
Definition pathnodes.h:3329
Node * quals
Definition primnodes.h:2385
List * fromlist
Definition primnodes.h:2384
Definition pg_list.h:54
Definition nodes.h:135
List * minmax_aggs
Definition pathnodes.h:609
List * processed_tlist
Definition pathnodes.h:593
bool hasRecursion
Definition pathnodes.h:641
List * cte_plan_ids
Definition pathnodes.h:427
int last_rinfo_serial
Definition pathnodes.h:465
Index qual_security_level
Definition pathnodes.h:626
List * init_plans
Definition pathnodes.h:421
bool assumeReplanning
Definition pathnodes.h:643
List * multiexpr_params
Definition pathnodes.h:430
List * row_identity_vars
Definition pathnodes.h:490
bool ec_merging_done
Definition pathnodes.h:439
Bitmapset * outer_params
Definition pathnodes.h:343
Index query_level
Definition pathnodes.h:315
List * append_rel_list
Definition pathnodes.h:487
char * alternative_plan_name
Definition pathnodes.h:333
struct Path * non_recursive_path
Definition pathnodes.h:671
List * placeholder_list
Definition pathnodes.h:496
PlannerGlobal * glob
Definition pathnodes.h:312
List * join_domains
Definition pathnodes.h:433
List * eq_classes
Definition pathnodes.h:436
int wt_param_id
Definition pathnodes.h:669
List * plan_params
Definition pathnodes.h:342
List * processed_groupClause
Definition pathnodes.h:570
List * processed_distinctClause
Definition pathnodes.h:582
Query * parse
Definition pathnodes.h:309
List * rowMarks
Definition pathnodes.h:493
List * update_colnos
Definition pathnodes.h:601
bool placeholdersFrozen
Definition pathnodes.h:639
List * join_info_list
Definition pathnodes.h:462
char * plan_name
Definition pathnodes.h:321
Relids all_result_relids
Definition pathnodes.h:476
Relids leaf_result_relids
Definition pathnodes.h:478
List * rowMarks
Definition parsenodes.h:237
Node * limitCount
Definition parsenodes.h:234
FromExpr * jointree
Definition parsenodes.h:185
Node * setOperations
Definition parsenodes.h:239
List * cteList
Definition parsenodes.h:176
List * groupClause
Definition parsenodes.h:219
Node * havingQual
Definition parsenodes.h:225
List * rtable
Definition parsenodes.h:178
Node * limitOffset
Definition parsenodes.h:233
CmdType commandType
Definition parsenodes.h:121
List * targetList
Definition parsenodes.h:201
List * groupingSets
Definition parsenodes.h:223
List * distinctClause
Definition parsenodes.h:229
List * sortClause
Definition parsenodes.h:231
Form_pg_class rd_rel
Definition rel.h:111
SetOperation op
bool has_generated_virtual
Definition tupdesc.h:47
TupleConstr * constr
Definition tupdesc.h:159
ParseLoc location
Definition primnodes.h:311
AttrNumber varattno
Definition primnodes.h:275
Index varlevelsup
Definition primnodes.h:295
Relids * nullingrels
nullingrel_info * nullinfo
ReplaceWrapOption wrap_option
JoinExpr * convert_ANY_sublink_to_join(PlannerInfo *root, SubLink *sublink, bool under_not, Relids available_rels)
Definition subselect.c:1339
ScalarArrayOpExpr * convert_VALUES_to_ANY(PlannerInfo *root, Node *testexpr, Query *values)
Definition subselect.c:1230
JoinExpr * convert_EXISTS_sublink_to_join(PlannerInfo *root, SubLink *sublink, bool under_not, Relids available_rels)
Definition subselect.c:1591
#define FirstLowInvalidHeapAttributeNumber
Definition sysattr.h:27
void table_close(Relation relation, LOCKMODE lockmode)
Definition table.c:126
Relation table_open(Oid relationId, LOCKMODE lockmode)
Definition table.c:40
bool tlist_same_datatypes(List *tlist, List *colTypes, bool junkOK)
Definition tlist.c:257
static FormData_pg_attribute * TupleDescAttr(TupleDesc tupdesc, int i)
Definition tupdesc.h:178
bool contain_vars_of_level(Node *node, int levelsup)
Definition var.c:444
Relids pull_varnos_of_level(PlannerInfo *root, Node *node, int levelsup)
Definition var.c:140
Relids pull_varnos(PlannerInfo *root, Node *node)
Definition var.c:114
Node * flatten_join_alias_vars(PlannerInfo *root, Query *query, Node *node)
Definition var.c:781