Branch data Line data Source code
1 : : /*-------------------------------------------------------------------------
2 : : *
3 : : * prepunion.c
4 : : * Routines to plan set-operation queries. The filename is a leftover
5 : : * from a time when only UNIONs were implemented.
6 : : *
7 : : * There are two code paths in the planner for set-operation queries.
8 : : * If a subquery consists entirely of simple UNION ALL operations, it
9 : : * is converted into an "append relation". Otherwise, it is handled
10 : : * by the general code in this module (plan_set_operations and its
11 : : * subroutines). There is some support code here for the append-relation
12 : : * case, but most of the heavy lifting for that is done elsewhere,
13 : : * notably in prepjointree.c and allpaths.c.
14 : : *
15 : : * Portions Copyright (c) 1996-2026, PostgreSQL Global Development Group
16 : : * Portions Copyright (c) 1994, Regents of the University of California
17 : : *
18 : : *
19 : : * IDENTIFICATION
20 : : * src/backend/optimizer/prep/prepunion.c
21 : : *
22 : : *-------------------------------------------------------------------------
23 : : */
24 : : #include "postgres.h"
25 : :
26 : : #include <math.h>
27 : :
28 : : #include "access/htup_details.h"
29 : : #include "catalog/pg_type.h"
30 : : #include "miscadmin.h"
31 : : #include "nodes/makefuncs.h"
32 : : #include "nodes/nodeFuncs.h"
33 : : #include "optimizer/cost.h"
34 : : #include "optimizer/pathnode.h"
35 : : #include "optimizer/paths.h"
36 : : #include "optimizer/planner.h"
37 : : #include "optimizer/prep.h"
38 : : #include "optimizer/tlist.h"
39 : : #include "parser/parse_coerce.h"
40 : : #include "port/pg_bitutils.h"
41 : : #include "utils/selfuncs.h"
42 : :
43 : :
44 : : static RelOptInfo *recurse_set_operations(Node *setOp, PlannerInfo *root,
45 : : SetOperationStmt *parentOp,
46 : : List *colTypes, List *colCollations,
47 : : List *refnames_tlist,
48 : : List **pTargetList,
49 : : bool *istrivial_tlist);
50 : : static RelOptInfo *generate_recursion_path(SetOperationStmt *setOp,
51 : : PlannerInfo *root,
52 : : List *refnames_tlist,
53 : : List **pTargetList);
54 : : static void build_setop_child_paths(PlannerInfo *root, RelOptInfo *rel,
55 : : bool trivial_tlist, List *child_tlist,
56 : : List *interesting_pathkeys,
57 : : double *pNumGroups);
58 : : static RelOptInfo *generate_union_paths(SetOperationStmt *op, PlannerInfo *root,
59 : : List *refnames_tlist,
60 : : List **pTargetList);
61 : : static RelOptInfo *generate_nonunion_paths(SetOperationStmt *op, PlannerInfo *root,
62 : : List *refnames_tlist,
63 : : List **pTargetList);
64 : : static List *plan_union_children(PlannerInfo *root,
65 : : SetOperationStmt *top_union,
66 : : List *refnames_tlist,
67 : : List **tlist_list,
68 : : List **istrivial_tlist);
69 : : static void postprocess_setop_rel(PlannerInfo *root, RelOptInfo *rel);
70 : : static List *generate_setop_tlist(List *colTypes, List *colCollations,
71 : : Index varno,
72 : : bool hack_constants,
73 : : List *input_tlist,
74 : : List *refnames_tlist,
75 : : bool *trivial_tlist);
76 : : static List *generate_append_tlist(List *colTypes, List *colCollations,
77 : : List *input_tlists,
78 : : List *refnames_tlist);
79 : : static List *generate_setop_grouplist(SetOperationStmt *op, List *targetlist);
80 : : static PathTarget *create_setop_pathtarget(PlannerInfo *root, List *tlist,
81 : : List *child_pathlist);
82 : :
83 : :
84 : : /*
85 : : * plan_set_operations
86 : : *
87 : : * Plans the queries for a tree of set operations (UNION/INTERSECT/EXCEPT)
88 : : *
89 : : * This routine only deals with the setOperations tree of the given query.
90 : : * Any top-level ORDER BY requested in root->parse->sortClause will be handled
91 : : * when we return to grouping_planner; likewise for LIMIT.
92 : : *
93 : : * What we return is an "upperrel" RelOptInfo containing at least one Path
94 : : * that implements the set-operation tree. In addition, root->processed_tlist
95 : : * receives a targetlist representing the output of the topmost setop node.
96 : : */
97 : : RelOptInfo *
98 : 4835 : plan_set_operations(PlannerInfo *root)
99 : : {
100 : 4835 : Query *parse = root->parse;
101 : 4835 : SetOperationStmt *topop = castNode(SetOperationStmt, parse->setOperations);
102 : : Node *node;
103 : : RangeTblEntry *leftmostRTE;
104 : : Query *leftmostQuery;
105 : : RelOptInfo *setop_rel;
106 : : List *top_tlist;
107 : :
108 : : Assert(topop);
109 : :
110 : : /* check for unsupported stuff */
111 : : Assert(parse->jointree->fromlist == NIL);
112 : : Assert(parse->jointree->quals == NULL);
113 : : Assert(parse->groupClause == NIL);
114 : : Assert(parse->havingQual == NULL);
115 : : Assert(parse->windowClause == NIL);
116 : : Assert(parse->distinctClause == NIL);
117 : :
118 : : /*
119 : : * In the outer query level, equivalence classes are limited to classes
120 : : * which define that the top-level target entry is equivalent to the
121 : : * corresponding child target entry. There won't be any equivalence class
122 : : * merging. Mark that merging is complete to allow us to make pathkeys.
123 : : */
124 : : Assert(root->eq_classes == NIL);
125 : 4835 : root->ec_merging_done = true;
126 : :
127 : : /*
128 : : * We'll need to build RelOptInfos for each of the leaf subqueries, which
129 : : * are RTE_SUBQUERY rangetable entries in this Query. Prepare the index
130 : : * arrays for those, and for AppendRelInfos in case they're needed.
131 : : */
132 : 4835 : setup_simple_rel_arrays(root);
133 : :
134 : : /*
135 : : * Find the leftmost component Query. We need to use its column names for
136 : : * all generated tlists (else SELECT INTO won't work right).
137 : : */
138 : 4835 : node = topop->larg;
139 [ + - + + ]: 8062 : while (node && IsA(node, SetOperationStmt))
140 : 3227 : node = ((SetOperationStmt *) node)->larg;
141 : : Assert(node && IsA(node, RangeTblRef));
142 : 4835 : leftmostRTE = root->simple_rte_array[((RangeTblRef *) node)->rtindex];
143 : 4835 : leftmostQuery = leftmostRTE->subquery;
144 : : Assert(leftmostQuery != NULL);
145 : :
146 : : /*
147 : : * If the topmost node is a recursive union, it needs special processing.
148 : : */
149 [ + + ]: 4835 : if (root->hasRecursion)
150 : : {
151 : 637 : setop_rel = generate_recursion_path(topop, root,
152 : : leftmostQuery->targetList,
153 : : &top_tlist);
154 : : }
155 : : else
156 : : {
157 : : bool trivial_tlist;
158 : :
159 : : /*
160 : : * Recurse on setOperations tree to generate paths for set ops. The
161 : : * final output paths should have just the column types shown as the
162 : : * output from the top-level node.
163 : : */
164 : 4198 : setop_rel = recurse_set_operations((Node *) topop, root,
165 : : NULL, /* no parent */
166 : : topop->colTypes, topop->colCollations,
167 : : leftmostQuery->targetList,
168 : : &top_tlist,
169 : : &trivial_tlist);
170 : : }
171 : :
172 : : /* Must return the built tlist into root->processed_tlist. */
173 : 4831 : root->processed_tlist = top_tlist;
174 : :
175 : 4831 : return setop_rel;
176 : : }
177 : :
178 : : /*
179 : : * recurse_set_operations
180 : : * Recursively handle one step in a tree of set operations
181 : : *
182 : : * setOp: current step (could be a SetOperationStmt or a leaf RangeTblRef)
183 : : * parentOp: parent step, or NULL if none (but see below)
184 : : * colTypes: OID list of set-op's result column datatypes
185 : : * colCollations: OID list of set-op's result column collations
186 : : * refnames_tlist: targetlist to take column names from
187 : : *
188 : : * parentOp should be passed as NULL unless that step is interested in
189 : : * getting sorted output from this step. ("Sorted" means "sorted according
190 : : * to the default btree opclasses of the result column datatypes".)
191 : : *
192 : : * Returns a RelOptInfo for the subtree, as well as these output parameters:
193 : : * *pTargetList: receives the fully-fledged tlist for the subtree's top plan
194 : : * *istrivial_tlist: true if, and only if, datatypes between parent and child
195 : : * match.
196 : : *
197 : : * If setOp is a leaf node, this function plans the sub-query but does
198 : : * not populate the pathlist of the returned RelOptInfo. The caller will
199 : : * generate SubqueryScan paths using useful path(s) of the subquery (see
200 : : * build_setop_child_paths). But this function does build the paths for
201 : : * set-operation nodes.
202 : : *
203 : : * The pTargetList output parameter is mostly redundant with the pathtarget
204 : : * of the returned RelOptInfo, but for the moment we need it because much of
205 : : * the logic in this file depends on flag columns being marked resjunk.
206 : : * XXX Now that there are no flag columns and hence no resjunk columns, we
207 : : * could probably refactor this file to deal only in pathtargets.
208 : : *
209 : : * We don't have to care about typmods here: the only allowed difference
210 : : * between set-op input and output typmods is input is a specific typmod
211 : : * and output is -1, and that does not require a coercion.
212 : : */
213 : : static RelOptInfo *
214 : 17300 : recurse_set_operations(Node *setOp, PlannerInfo *root,
215 : : SetOperationStmt *parentOp,
216 : : List *colTypes, List *colCollations,
217 : : List *refnames_tlist,
218 : : List **pTargetList,
219 : : bool *istrivial_tlist)
220 : : {
221 : : RelOptInfo *rel;
222 : :
223 : 17300 : *istrivial_tlist = true; /* for now */
224 : :
225 : : /* Guard against stack overflow due to overly complex setop nests */
226 : 17300 : check_stack_depth();
227 : :
228 [ + + ]: 17300 : if (IsA(setOp, RangeTblRef))
229 : : {
230 : 12957 : RangeTblRef *rtr = (RangeTblRef *) setOp;
231 : 12957 : RangeTblEntry *rte = root->simple_rte_array[rtr->rtindex];
232 : 12957 : Query *subquery = rte->subquery;
233 : : PlannerInfo *subroot;
234 : : List *tlist;
235 : : bool trivial_tlist;
236 : : char *plan_name;
237 : :
238 : : Assert(subquery != NULL);
239 : :
240 : : /* Build a RelOptInfo for this leaf subquery. */
241 : 12957 : rel = build_simple_rel(root, rtr->rtindex, NULL);
242 : :
243 : : /* plan_params should not be in use in current query level */
244 : : Assert(root->plan_params == NIL);
245 : :
246 : : /*
247 : : * Generate a subroot and Paths for the subquery. If we have a
248 : : * parentOp, pass that down to encourage subquery_planner to consider
249 : : * suitably-sorted Paths.
250 : : */
251 : 12957 : plan_name = choose_plan_name(root->glob, "setop", true);
252 : 12957 : subroot = rel->subroot = subquery_planner(root->glob, subquery,
253 : : plan_name, root, NULL,
254 : : false, root->tuple_fraction,
255 : : parentOp);
256 : :
257 : : /*
258 : : * It should not be possible for the primitive query to contain any
259 : : * cross-references to other primitive queries in the setop tree.
260 : : */
261 [ - + ]: 12957 : if (root->plan_params)
262 [ # # ]: 0 : elog(ERROR, "unexpected outer reference in set operation subquery");
263 : :
264 : : /* Figure out the appropriate target list for this subquery. */
265 : 12957 : tlist = generate_setop_tlist(colTypes, colCollations,
266 : 12957 : rtr->rtindex,
267 : : true,
268 : : subroot->processed_tlist,
269 : : refnames_tlist,
270 : : &trivial_tlist);
271 : 12957 : rel->reltarget = create_pathtarget(root, tlist);
272 : :
273 : : /* Return the fully-fledged tlist to caller, too */
274 : 12957 : *pTargetList = tlist;
275 : 12957 : *istrivial_tlist = trivial_tlist;
276 : : }
277 [ + - ]: 4343 : else if (IsA(setOp, SetOperationStmt))
278 : : {
279 : 4343 : SetOperationStmt *op = (SetOperationStmt *) setOp;
280 : :
281 : : /* UNIONs are much different from INTERSECT/EXCEPT */
282 [ + + ]: 4343 : if (op->op == SETOP_UNION)
283 : 3719 : rel = generate_union_paths(op, root,
284 : : refnames_tlist,
285 : : pTargetList);
286 : : else
287 : 624 : rel = generate_nonunion_paths(op, root,
288 : : refnames_tlist,
289 : : pTargetList);
290 : :
291 : : /*
292 : : * If necessary, add a Result node to project the caller-requested
293 : : * output columns.
294 : : *
295 : : * XXX you don't really want to know about this: setrefs.c will apply
296 : : * fix_upper_expr() to the Result node's tlist. This would fail if the
297 : : * Vars generated by generate_setop_tlist() were not exactly equal()
298 : : * to the corresponding tlist entries of the subplan. However, since
299 : : * the subplan was generated by generate_union_paths() or
300 : : * generate_nonunion_paths(), and hence its tlist was generated by
301 : : * generate_append_tlist() or generate_setop_tlist(), this will work.
302 : : * We just tell generate_setop_tlist() to use varno 0.
303 : : */
304 [ + + ]: 4343 : if (!tlist_same_datatypes(*pTargetList, colTypes, false) ||
305 [ - + ]: 4328 : !tlist_same_collations(*pTargetList, colCollations, false))
306 : : {
307 : : PathTarget *target;
308 : : bool trivial_tlist;
309 : : ListCell *lc;
310 : :
311 : 15 : *pTargetList = generate_setop_tlist(colTypes, colCollations,
312 : : 0,
313 : : false,
314 : : *pTargetList,
315 : : refnames_tlist,
316 : : &trivial_tlist);
317 : 15 : *istrivial_tlist = trivial_tlist;
318 : 15 : target = create_pathtarget(root, *pTargetList);
319 : :
320 : : /* Apply projection to each path */
321 [ + - + + : 30 : foreach(lc, rel->pathlist)
+ + ]
322 : : {
323 : 15 : Path *subpath = (Path *) lfirst(lc);
324 : : Path *path;
325 : :
326 : : Assert(subpath->param_info == NULL);
327 : 15 : path = apply_projection_to_path(root, subpath->parent,
328 : : subpath, target);
329 : : /* If we had to add a Result, path is different from subpath */
330 [ + - ]: 15 : if (path != subpath)
331 : 15 : lfirst(lc) = path;
332 : : }
333 : :
334 : : /* Apply projection to each partial path */
335 [ - + - - : 15 : foreach(lc, rel->partial_pathlist)
- + ]
336 : : {
337 : 0 : Path *subpath = (Path *) lfirst(lc);
338 : : Path *path;
339 : :
340 : : Assert(subpath->param_info == NULL);
341 : :
342 : : /* avoid apply_projection_to_path, in case of multiple refs */
343 : 0 : path = (Path *) create_projection_path(root, subpath->parent,
344 : : subpath, target);
345 : 0 : lfirst(lc) = path;
346 : : }
347 : : }
348 : 4343 : postprocess_setop_rel(root, rel);
349 : : }
350 : : else
351 : : {
352 [ # # ]: 0 : elog(ERROR, "unrecognized node type: %d",
353 : : (int) nodeTag(setOp));
354 : : *pTargetList = NIL;
355 : : rel = NULL; /* keep compiler quiet */
356 : : }
357 : :
358 : 17300 : return rel;
359 : : }
360 : :
361 : : /*
362 : : * Generate paths for a recursive UNION node
363 : : */
364 : : static RelOptInfo *
365 : 637 : generate_recursion_path(SetOperationStmt *setOp, PlannerInfo *root,
366 : : List *refnames_tlist,
367 : : List **pTargetList)
368 : : {
369 : : RelOptInfo *result_rel;
370 : : Path *path;
371 : : RelOptInfo *lrel,
372 : : *rrel;
373 : : Path *lpath;
374 : : Path *rpath;
375 : : List *lpath_tlist;
376 : : bool lpath_trivial_tlist;
377 : : List *rpath_tlist;
378 : : bool rpath_trivial_tlist;
379 : : List *tlist;
380 : : List *groupList;
381 : : double dNumGroups;
382 : :
383 : : /* Parser should have rejected other cases */
384 [ - + ]: 637 : if (setOp->op != SETOP_UNION)
385 [ # # ]: 0 : elog(ERROR, "only UNION queries can be recursive");
386 : : /* Worktable ID should be assigned */
387 : : Assert(root->wt_param_id >= 0);
388 : :
389 : : /*
390 : : * Unlike a regular UNION node, process the left and right inputs
391 : : * separately without any intention of combining them into one Append.
392 : : */
393 : 637 : lrel = recurse_set_operations(setOp->larg, root,
394 : : NULL, /* no value in sorted results */
395 : : setOp->colTypes, setOp->colCollations,
396 : : refnames_tlist,
397 : : &lpath_tlist,
398 : : &lpath_trivial_tlist);
399 [ + - ]: 637 : if (lrel->rtekind == RTE_SUBQUERY)
400 : 637 : build_setop_child_paths(root, lrel, lpath_trivial_tlist, lpath_tlist,
401 : : NIL, NULL);
402 : 637 : lpath = lrel->cheapest_total_path;
403 : : /* The right path will want to look at the left one ... */
404 : 637 : root->non_recursive_path = lpath;
405 : 637 : rrel = recurse_set_operations(setOp->rarg, root,
406 : : NULL, /* no value in sorted results */
407 : : setOp->colTypes, setOp->colCollations,
408 : : refnames_tlist,
409 : : &rpath_tlist,
410 : : &rpath_trivial_tlist);
411 [ + + ]: 637 : if (rrel->rtekind == RTE_SUBQUERY)
412 : 632 : build_setop_child_paths(root, rrel, rpath_trivial_tlist, rpath_tlist,
413 : : NIL, NULL);
414 : 637 : rpath = rrel->cheapest_total_path;
415 : 637 : root->non_recursive_path = NULL;
416 : :
417 : : /*
418 : : * Generate tlist for RecursiveUnion path node --- same as in Append cases
419 : : */
420 : 637 : tlist = generate_append_tlist(setOp->colTypes, setOp->colCollations,
421 : : list_make2(lpath_tlist, rpath_tlist),
422 : : refnames_tlist);
423 : :
424 : 637 : *pTargetList = tlist;
425 : :
426 : : /* Build result relation. */
427 : 637 : result_rel = fetch_upper_rel(root, UPPERREL_SETOP,
428 : 637 : bms_union(lrel->relids, rrel->relids));
429 : 637 : result_rel->reltarget = create_pathtarget(root, tlist);
430 : :
431 : : /*
432 : : * If UNION, identify the grouping operators
433 : : */
434 [ + + ]: 637 : if (setOp->all)
435 : : {
436 : 417 : groupList = NIL;
437 : 417 : dNumGroups = 0;
438 : : }
439 : : else
440 : : {
441 : : /* Identify the grouping semantics */
442 : 220 : groupList = generate_setop_grouplist(setOp, tlist);
443 : :
444 : : /* We only support hashing here */
445 [ + + ]: 220 : if (!grouping_is_hashable(groupList))
446 [ + - ]: 4 : ereport(ERROR,
447 : : (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
448 : : errmsg("could not implement recursive UNION"),
449 : : errdetail("All column datatypes must be hashable.")));
450 : :
451 : : /*
452 : : * For the moment, take the number of distinct groups as equal to the
453 : : * total input size, ie, the worst case.
454 : : */
455 : 216 : dNumGroups = lpath->rows + rpath->rows * 10;
456 : : }
457 : :
458 : : /*
459 : : * And make the path node.
460 : : */
461 : 633 : path = (Path *) create_recursiveunion_path(root,
462 : : result_rel,
463 : : lpath,
464 : : rpath,
465 : 633 : result_rel->reltarget,
466 : : groupList,
467 : : root->wt_param_id,
468 : : dNumGroups);
469 : :
470 : 633 : add_path(result_rel, path);
471 : 633 : postprocess_setop_rel(root, result_rel);
472 : 633 : return result_rel;
473 : : }
474 : :
475 : : /*
476 : : * build_setop_child_paths
477 : : * Build paths for the set op child relation denoted by 'rel'.
478 : : *
479 : : * 'rel' is an RTE_SUBQUERY relation. We have already generated paths within
480 : : * the subquery's subroot; the task here is to create SubqueryScan paths for
481 : : * 'rel', representing scans of the useful subquery paths.
482 : : *
483 : : * interesting_pathkeys: if not NIL, also include paths that suit these
484 : : * pathkeys, sorting any unsorted paths as required.
485 : : * *pNumGroups: if not NULL, we estimate the number of distinct groups
486 : : * in the result, and store it there.
487 : : */
488 : : static void
489 : 12957 : build_setop_child_paths(PlannerInfo *root, RelOptInfo *rel,
490 : : bool trivial_tlist, List *child_tlist,
491 : : List *interesting_pathkeys, double *pNumGroups)
492 : : {
493 : : RelOptInfo *final_rel;
494 : 12957 : List *setop_pathkeys = rel->subroot->setop_pathkeys;
495 : : ListCell *lc;
496 : :
497 : : /* it can't be a set op child rel if it's not a subquery */
498 : : Assert(rel->rtekind == RTE_SUBQUERY);
499 : :
500 : : /* when sorting is needed, add child rel equivalences */
501 [ + + ]: 12957 : if (interesting_pathkeys != NIL)
502 : 10208 : add_setop_child_rel_equivalences(root,
503 : : rel,
504 : : child_tlist,
505 : : interesting_pathkeys);
506 : :
507 : : /*
508 : : * Mark rel with estimated output rows, width, etc. Note that we have to
509 : : * do this before generating outer-query paths, else cost_subqueryscan is
510 : : * not happy.
511 : : */
512 : 12957 : set_subquery_size_estimates(root, rel);
513 : :
514 : : /*
515 : : * Since we may want to add a partial path to this relation, we must set
516 : : * its consider_parallel flag correctly.
517 : : */
518 : 12957 : final_rel = fetch_upper_rel(rel->subroot, UPPERREL_FINAL, NULL);
519 : 12957 : rel->consider_parallel = final_rel->consider_parallel;
520 : :
521 : : /* Generate subquery scan paths for any interesting path in final_rel */
522 [ + - + + : 33959 : foreach(lc, final_rel->pathlist)
+ + ]
523 : : {
524 : 21002 : Path *subpath = (Path *) lfirst(lc);
525 : : List *pathkeys;
526 : 21002 : Path *cheapest_input_path = final_rel->cheapest_total_path;
527 : : bool is_sorted;
528 : : int presorted_keys;
529 : :
530 : : /* If the input rel is dummy, propagate that to this query level */
531 [ + + ]: 21002 : if (is_dummy_rel(final_rel))
532 : : {
533 : 68 : mark_dummy_rel(rel);
534 : 2845 : continue;
535 : : }
536 : :
537 : : /*
538 : : * Include the cheapest path as-is so that the set operation can be
539 : : * cheaply implemented using a method which does not require the input
540 : : * to be sorted.
541 : : */
542 [ + + ]: 20934 : if (subpath == cheapest_input_path)
543 : : {
544 : : /* Convert subpath's pathkeys to outer representation */
545 : 12889 : pathkeys = convert_subquery_pathkeys(root, rel, subpath->pathkeys,
546 : : make_tlist_from_pathtarget(subpath->pathtarget));
547 : :
548 : : /* Generate outer path using this subpath */
549 : 12889 : add_path(rel, (Path *) create_subqueryscan_path(root,
550 : : rel,
551 : : subpath,
552 : : trivial_tlist,
553 : : pathkeys,
554 : : NULL));
555 : : }
556 : :
557 : : /* skip dealing with sorted paths if the setop doesn't need them */
558 [ + + ]: 20934 : if (interesting_pathkeys == NIL)
559 : 2767 : continue;
560 : :
561 : : /*
562 : : * Create paths to suit final sort order required for setop_pathkeys.
563 : : * Here we'll sort the cheapest input path (if not sorted already) and
564 : : * incremental sort any paths which are partially sorted.
565 : : */
566 : 18167 : is_sorted = pathkeys_count_contained_in(setop_pathkeys,
567 : : subpath->pathkeys,
568 : : &presorted_keys);
569 : :
570 [ + + ]: 18167 : if (!is_sorted)
571 : : {
572 : 12054 : double limittuples = rel->subroot->limit_tuples;
573 : :
574 : : /*
575 : : * Try at least sorting the cheapest path and also try
576 : : * incrementally sorting any path which is partially sorted
577 : : * already (no need to deal with paths which have presorted keys
578 : : * when incremental sort is disabled unless it's the cheapest
579 : : * input path).
580 : : */
581 [ + + ]: 12054 : if (subpath != cheapest_input_path &&
582 [ + + - + ]: 2676 : (presorted_keys == 0 || !enable_incremental_sort))
583 : 10 : continue;
584 : :
585 : : /*
586 : : * We've no need to consider both a sort and incremental sort.
587 : : * We'll just do a sort if there are no presorted keys and an
588 : : * incremental sort when there are presorted keys.
589 : : */
590 [ + + + + ]: 12044 : if (presorted_keys == 0 || !enable_incremental_sort)
591 : 9378 : subpath = (Path *) create_sort_path(rel->subroot,
592 : : final_rel,
593 : : subpath,
594 : : setop_pathkeys,
595 : : limittuples);
596 : : else
597 : 2666 : subpath = (Path *) create_incremental_sort_path(rel->subroot,
598 : : final_rel,
599 : : subpath,
600 : : setop_pathkeys,
601 : : presorted_keys,
602 : : limittuples);
603 : : }
604 : :
605 : : /*
606 : : * subpath is now sorted, so add it to the pathlist. We already added
607 : : * the cheapest_input_path above, so don't add it again unless we just
608 : : * sorted it.
609 : : */
610 [ + + ]: 18157 : if (subpath != cheapest_input_path)
611 : : {
612 : : /* Convert subpath's pathkeys to outer representation */
613 : 17387 : pathkeys = convert_subquery_pathkeys(root, rel, subpath->pathkeys,
614 : : make_tlist_from_pathtarget(subpath->pathtarget));
615 : :
616 : : /* Generate outer path using this subpath */
617 : 17387 : add_path(rel, (Path *) create_subqueryscan_path(root,
618 : : rel,
619 : : subpath,
620 : : trivial_tlist,
621 : : pathkeys,
622 : : NULL));
623 : : }
624 : : }
625 : :
626 : : /* if consider_parallel is false, there should be no partial paths */
627 : : Assert(final_rel->consider_parallel ||
628 : : final_rel->partial_pathlist == NIL);
629 : :
630 : : /*
631 : : * If we have a partial path for the child relation, we can use that to
632 : : * build a partial path for this relation. But there's no point in
633 : : * considering any path but the cheapest.
634 : : */
635 [ + + + - ]: 12957 : if (rel->consider_parallel && bms_is_empty(rel->lateral_relids) &&
636 [ + + ]: 8961 : final_rel->partial_pathlist != NIL)
637 : : {
638 : : Path *partial_subpath;
639 : : Path *partial_path;
640 : :
641 : 15 : partial_subpath = linitial(final_rel->partial_pathlist);
642 : : partial_path = (Path *)
643 : 15 : create_subqueryscan_path(root, rel, partial_subpath,
644 : : trivial_tlist,
645 : : NIL, NULL);
646 : 15 : add_partial_path(rel, partial_path);
647 : : }
648 : :
649 : 12957 : postprocess_setop_rel(root, rel);
650 : :
651 : : /*
652 : : * Estimate number of groups if caller wants it. If the subquery used
653 : : * grouping or aggregation, its output is probably mostly unique anyway;
654 : : * otherwise do statistical estimation.
655 : : *
656 : : * XXX you don't really want to know about this: we do the estimation
657 : : * using the subroot->parse's original targetlist expressions, not the
658 : : * subroot->processed_tlist which might seem more appropriate. The reason
659 : : * is that if the subquery is itself a setop, it may return a
660 : : * processed_tlist containing "varno 0" Vars generated by
661 : : * generate_append_tlist, and those would confuse estimate_num_groups
662 : : * mightily. We ought to get rid of the "varno 0" hack, but that requires
663 : : * a redesign of the parsetree representation of setops, so that there can
664 : : * be an RTE corresponding to each setop's output. Note, we use this not
665 : : * subquery's targetlist but subroot->parse's targetlist, because it was
666 : : * revised by self-join removal. subquery's targetlist might contain the
667 : : * references to the removed relids.
668 : : */
669 [ + + ]: 12957 : if (pNumGroups)
670 : : {
671 : 10498 : PlannerInfo *subroot = rel->subroot;
672 : 10498 : Query *subquery = subroot->parse;
673 : :
674 [ + - + - ]: 10498 : if (subquery->groupClause || subquery->groupingSets ||
675 [ + + + - ]: 10498 : subquery->distinctClause || subroot->hasHavingQual ||
676 [ - + ]: 10488 : subquery->hasAggs)
677 : 10 : *pNumGroups = rel->cheapest_total_path->rows;
678 : : else
679 : 10488 : *pNumGroups = estimate_num_groups(subroot,
680 : 10488 : get_tlist_exprs(subroot->parse->targetList, false),
681 : 10488 : rel->cheapest_total_path->rows,
682 : : NULL,
683 : : NULL);
684 : : }
685 : 12957 : }
686 : :
687 : : /*
688 : : * Generate paths for a UNION or UNION ALL node
689 : : */
690 : : static RelOptInfo *
691 : 3719 : generate_union_paths(SetOperationStmt *op, PlannerInfo *root,
692 : : List *refnames_tlist,
693 : : List **pTargetList)
694 : : {
695 : 3719 : Relids relids = NULL;
696 : : RelOptInfo *result_rel;
697 : : ListCell *lc;
698 : : ListCell *lc2;
699 : : ListCell *lc3;
700 : 3719 : AppendPathInput cheapest = {0};
701 : 3719 : AppendPathInput ordered = {0};
702 : 3719 : AppendPathInput partial = {0};
703 : 3719 : bool partial_paths_valid = true;
704 : 3719 : bool consider_parallel = true;
705 : : List *rellist;
706 : : List *tlist_list;
707 : : List *trivial_tlist_list;
708 : : List *tlist;
709 : 3719 : List *groupList = NIL;
710 : : Path *apath;
711 : 3719 : Path *gpath = NULL;
712 : 3719 : bool try_sorted = false;
713 : 3719 : List *union_pathkeys = NIL;
714 : 3719 : double dNumChildGroups = 0;
715 : :
716 : : /*
717 : : * If any of my children are identical UNION nodes (same op, all-flag, and
718 : : * colTypes/colCollations) then they can be merged into this node so that
719 : : * we generate only one Append/MergeAppend and unique-ification for the
720 : : * lot. Recurse to find such nodes.
721 : : */
722 : 3719 : rellist = plan_union_children(root,
723 : : op,
724 : : refnames_tlist,
725 : : &tlist_list,
726 : : &trivial_tlist_list);
727 : :
728 : : /*
729 : : * Generate tlist for Append/MergeAppend plan node.
730 : : *
731 : : * The tlist for an Append plan isn't important as far as the Append is
732 : : * concerned, but we must make it look real anyway for the benefit of the
733 : : * next plan level up.
734 : : */
735 : 3719 : tlist = generate_append_tlist(op->colTypes, op->colCollations,
736 : : tlist_list, refnames_tlist);
737 : 3719 : *pTargetList = tlist;
738 : :
739 : : /* For UNIONs (not UNION ALL), try sorting, if sorting is possible */
740 [ + + ]: 3719 : if (!op->all)
741 : : {
742 : : /* Identify the grouping semantics */
743 : 3274 : groupList = generate_setop_grouplist(op, tlist);
744 : :
745 [ + + ]: 3274 : if (grouping_is_sortable(op->groupClauses))
746 : : {
747 : 3214 : try_sorted = true;
748 : : /* Determine the pathkeys for sorting by the whole target list */
749 : 3214 : union_pathkeys = make_pathkeys_for_sortclauses(root, groupList,
750 : : tlist);
751 : :
752 : 3214 : root->query_pathkeys = union_pathkeys;
753 : : }
754 : : }
755 : :
756 : : /*
757 : : * Now that we've got the append target list, we can build the union child
758 : : * paths.
759 : : */
760 [ + - + + : 14299 : forthree(lc, rellist, lc2, trivial_tlist_list, lc3, tlist_list)
+ - + + +
- + + + +
+ - + - +
+ ]
761 : : {
762 : 10580 : RelOptInfo *rel = lfirst(lc);
763 : 10580 : bool trivial_tlist = lfirst_int(lc2);
764 : 10580 : List *child_tlist = lfirst_node(List, lc3);
765 : 10580 : double childGroups = 0;
766 : :
767 : : /* only build paths for the union children */
768 [ + + ]: 10580 : if (rel->rtekind == RTE_SUBQUERY)
769 : 10470 : build_setop_child_paths(root, rel, trivial_tlist, child_tlist,
770 : : union_pathkeys,
771 [ + + ]: 10470 : op->all ? NULL : &childGroups);
772 : : else
773 : 110 : childGroups = rel->rows;
774 : :
775 : : /*
776 : : * For UNION (not UNION ALL), accumulate the per-child distinct-group
777 : : * estimates. This sum is the basis for the UNION's output estimate
778 : : * below: since distinct(A union B) <= distinct(A) + distinct(B), the
779 : : * union cannot have more distinct rows than its children do in total.
780 : : * Children that are known to be empty contribute nothing, so skip
781 : : * them.
782 : : */
783 [ + + + + ]: 10580 : if (!op->all && !is_dummy_rel(rel))
784 : 9260 : dNumChildGroups += childGroups;
785 : : }
786 : :
787 : : /* Build path lists and relid set. */
788 [ + - + + : 14299 : foreach(lc, rellist)
+ + ]
789 : : {
790 : 10580 : RelOptInfo *rel = lfirst(lc);
791 : : Path *ordered_path;
792 : :
793 : : /*
794 : : * Record the relids so that we can identify the correct
795 : : * UPPERREL_SETOP RelOptInfo below.
796 : : */
797 : 10580 : relids = bms_add_members(relids, rel->relids);
798 : :
799 : : /* Skip any UNION children that are proven not to yield any rows */
800 [ + + ]: 10580 : if (is_dummy_rel(rel))
801 : 38 : continue;
802 : :
803 : 21084 : cheapest.subpaths = lappend(cheapest.subpaths,
804 : 10542 : rel->cheapest_total_path);
805 : :
806 [ + + ]: 10542 : if (try_sorted)
807 : : {
808 : 3476 : ordered_path = get_cheapest_path_for_pathkeys(rel->pathlist,
809 : : union_pathkeys,
810 : : NULL,
811 : : TOTAL_COST,
812 : : false);
813 : :
814 [ + + ]: 3476 : if (ordered_path != NULL)
815 : 519 : ordered.subpaths = lappend(ordered.subpaths, ordered_path);
816 : : else
817 : : {
818 : : /*
819 : : * If we can't find a sorted path, just give up trying to
820 : : * generate a list of correctly sorted child paths. This can
821 : : * happen when type coercion was added to the targetlist due
822 : : * to mismatching types from the union children.
823 : : */
824 : 2957 : try_sorted = false;
825 : : }
826 : : }
827 : :
828 [ + + ]: 10542 : if (consider_parallel)
829 : : {
830 [ + + ]: 7602 : if (!rel->consider_parallel)
831 : : {
832 : 2825 : consider_parallel = false;
833 : 2825 : partial_paths_valid = false;
834 : : }
835 [ + + ]: 4777 : else if (rel->partial_pathlist == NIL)
836 : 4767 : partial_paths_valid = false;
837 : : else
838 : 10 : partial.partial_subpaths = lappend(partial.partial_subpaths,
839 : 10 : linitial(rel->partial_pathlist));
840 : : }
841 : : }
842 : :
843 : : /* Build result relation. */
844 : 3719 : result_rel = fetch_upper_rel(root, UPPERREL_SETOP, relids);
845 : 3719 : result_rel->reltarget = create_setop_pathtarget(root, tlist,
846 : : cheapest.subpaths);
847 : 3719 : result_rel->consider_parallel = consider_parallel;
848 : 3719 : result_rel->consider_startup = (root->tuple_fraction > 0);
849 : :
850 : : /* If all UNION children were dummy rels, make the resulting rel dummy */
851 [ + + ]: 3719 : if (cheapest.subpaths == NIL)
852 : : {
853 : 5 : mark_dummy_rel(result_rel);
854 : :
855 : 5 : return result_rel;
856 : : }
857 : :
858 : : /*
859 : : * Append the child results together using the cheapest paths from each
860 : : * union child.
861 : : */
862 : 3714 : apath = (Path *) create_append_path(root, result_rel, cheapest,
863 : : NIL, NULL, 0, false, -1);
864 : :
865 : : /*
866 : : * Initialize the result row estimate to the total input size. This is
867 : : * correct for UNION ALL; for the UNION case it is overwritten below with
868 : : * the estimated number of distinct groups.
869 : : */
870 : 3714 : result_rel->rows = apath->rows;
871 : :
872 : : /*
873 : : * Now consider doing the same thing using the partial paths plus Append
874 : : * plus Gather.
875 : : */
876 [ + + ]: 3714 : if (partial_paths_valid)
877 : : {
878 : : Path *papath;
879 : 5 : int parallel_workers = 0;
880 : :
881 : : /* Find the highest number of workers requested for any subpath. */
882 [ + - + + : 15 : foreach(lc, partial.partial_subpaths)
+ + ]
883 : : {
884 : 10 : Path *subpath = lfirst(lc);
885 : :
886 : 10 : parallel_workers = Max(parallel_workers,
887 : : subpath->parallel_workers);
888 : : }
889 : : Assert(parallel_workers > 0);
890 : :
891 : : /*
892 : : * If the use of parallel append is permitted, always request at least
893 : : * log2(# of children) paths. We assume it can be useful to have
894 : : * extra workers in this case because they will be spread out across
895 : : * the children. The precise formula is just a guess; see
896 : : * add_paths_to_append_rel.
897 : : */
898 [ + - ]: 5 : if (enable_parallel_append)
899 : : {
900 [ + - ]: 5 : parallel_workers = Max(parallel_workers,
901 : : pg_leftmost_one_pos32(list_length(partial.partial_subpaths)) + 1);
902 : 5 : parallel_workers = Min(parallel_workers,
903 : : max_parallel_workers_per_gather);
904 : : }
905 : : Assert(parallel_workers > 0);
906 : :
907 : : papath = (Path *)
908 : 5 : create_append_path(root, result_rel, partial,
909 : : NIL, NULL, parallel_workers,
910 : : enable_parallel_append, -1);
911 : : gpath = (Path *)
912 : 5 : create_gather_path(root, result_rel, papath,
913 : 5 : result_rel->reltarget, NULL, NULL);
914 : : }
915 : :
916 [ + + ]: 3714 : if (!op->all)
917 : : {
918 : 3269 : bool can_sort = grouping_is_sortable(groupList);
919 : 3269 : bool can_hash = grouping_is_hashable(groupList);
920 : :
921 : : /*
922 : : * result_rel->rows was initialized to the total input size above,
923 : : * which is the correct estimate for UNION ALL. A UNION removes
924 : : * duplicates, so override it with the estimated number of distinct
925 : : * groups.
926 : : */
927 : 3269 : result_rel->rows = dNumChildGroups;
928 : :
929 [ + + ]: 3269 : if (can_hash)
930 : : {
931 : : Path *path;
932 : :
933 : : /*
934 : : * Try a hash aggregate plan on 'apath'. This is the cheapest
935 : : * available path containing each append child.
936 : : */
937 : 3209 : path = (Path *) create_agg_path(root,
938 : : result_rel,
939 : : apath,
940 : 3209 : result_rel->reltarget,
941 : : AGG_HASHED,
942 : : AGGSPLIT_SIMPLE,
943 : : groupList,
944 : : NIL,
945 : : NULL,
946 : : dNumChildGroups);
947 : 3209 : add_path(result_rel, path);
948 : :
949 : : /* Try hash aggregate on the Gather path, if valid */
950 [ + + ]: 3209 : if (gpath != NULL)
951 : : {
952 : : /* Hashed aggregate plan --- no sort needed */
953 : 5 : path = (Path *) create_agg_path(root,
954 : : result_rel,
955 : : gpath,
956 : 5 : result_rel->reltarget,
957 : : AGG_HASHED,
958 : : AGGSPLIT_SIMPLE,
959 : : groupList,
960 : : NIL,
961 : : NULL,
962 : : dNumChildGroups);
963 : 5 : add_path(result_rel, path);
964 : : }
965 : : }
966 : :
967 [ + + ]: 3269 : if (can_sort)
968 : : {
969 : 3209 : Path *path = apath;
970 : :
971 : : /* Try Sort -> Unique on the Append path */
972 [ + + ]: 3209 : if (groupList != NIL)
973 : 3184 : path = (Path *) create_sort_path(root, result_rel, path,
974 : : make_pathkeys_for_sortclauses(root, groupList, tlist),
975 : : -1.0);
976 : :
977 : 3209 : path = (Path *) create_unique_path(root,
978 : : result_rel,
979 : : path,
980 : 3209 : list_length(path->pathkeys),
981 : : dNumChildGroups);
982 : :
983 : 3209 : add_path(result_rel, path);
984 : :
985 : : /* Try Sort -> Unique on the Gather path, if set */
986 [ + + ]: 3209 : if (gpath != NULL)
987 : : {
988 : 5 : path = gpath;
989 : :
990 : 5 : path = (Path *) create_sort_path(root, result_rel, path,
991 : : make_pathkeys_for_sortclauses(root, groupList, tlist),
992 : : -1.0);
993 : :
994 : 5 : path = (Path *) create_unique_path(root,
995 : : result_rel,
996 : : path,
997 : 5 : list_length(path->pathkeys),
998 : : dNumChildGroups);
999 : 5 : add_path(result_rel, path);
1000 : : }
1001 : : }
1002 : :
1003 : : /*
1004 : : * Try making a MergeAppend path if we managed to find a path with the
1005 : : * correct pathkeys in each union child query.
1006 : : */
1007 [ + + + + ]: 3269 : if (try_sorted && groupList != NIL)
1008 : : {
1009 : : Path *path;
1010 : :
1011 : 227 : path = (Path *) create_merge_append_path(root,
1012 : : result_rel,
1013 : : ordered.subpaths,
1014 : : NIL,
1015 : : union_pathkeys,
1016 : : NULL);
1017 : :
1018 : : /* and make the MergeAppend unique */
1019 : 227 : path = (Path *) create_unique_path(root,
1020 : : result_rel,
1021 : : path,
1022 : : list_length(tlist),
1023 : : dNumChildGroups);
1024 : :
1025 : 227 : add_path(result_rel, path);
1026 : : }
1027 : : }
1028 : : else
1029 : : {
1030 : : /* UNION ALL */
1031 : 445 : add_path(result_rel, apath);
1032 : :
1033 [ - + ]: 445 : if (gpath != NULL)
1034 : 0 : add_path(result_rel, gpath);
1035 : : }
1036 : :
1037 : 3714 : return result_rel;
1038 : : }
1039 : :
1040 : : /*
1041 : : * Generate paths for an INTERSECT, INTERSECT ALL, EXCEPT, or EXCEPT ALL node
1042 : : */
1043 : : static RelOptInfo *
1044 : 624 : generate_nonunion_paths(SetOperationStmt *op, PlannerInfo *root,
1045 : : List *refnames_tlist,
1046 : : List **pTargetList)
1047 : : {
1048 : : RelOptInfo *result_rel;
1049 : : RelOptInfo *lrel,
1050 : : *rrel;
1051 : 624 : double save_fraction = root->tuple_fraction;
1052 : : Path *lpath,
1053 : : *rpath,
1054 : : *path;
1055 : : List *lpath_tlist,
1056 : : *rpath_tlist,
1057 : : *tlist,
1058 : : *groupList;
1059 : : bool lpath_trivial_tlist,
1060 : : rpath_trivial_tlist,
1061 : : result_trivial_tlist;
1062 : 624 : List *nonunion_pathkeys = NIL;
1063 : : double dLeftGroups,
1064 : : dRightGroups,
1065 : : dNumGroups,
1066 : : dNumOutputRows;
1067 : : bool can_sort;
1068 : : bool can_hash;
1069 : : SetOpCmd cmd;
1070 : :
1071 : : /*
1072 : : * Tell children to fetch all tuples.
1073 : : */
1074 : 624 : root->tuple_fraction = 0.0;
1075 : :
1076 : : /* Recurse on children */
1077 : 624 : lrel = recurse_set_operations(op->larg, root,
1078 : : op,
1079 : : op->colTypes, op->colCollations,
1080 : : refnames_tlist,
1081 : : &lpath_tlist,
1082 : : &lpath_trivial_tlist);
1083 : :
1084 : 624 : rrel = recurse_set_operations(op->rarg, root,
1085 : : op,
1086 : : op->colTypes, op->colCollations,
1087 : : refnames_tlist,
1088 : : &rpath_tlist,
1089 : : &rpath_trivial_tlist);
1090 : :
1091 : : /*
1092 : : * Generate tlist for SetOp plan node.
1093 : : *
1094 : : * The tlist for a SetOp plan isn't important so far as the SetOp is
1095 : : * concerned, but we must make it look real anyway for the benefit of the
1096 : : * next plan level up.
1097 : : */
1098 : 624 : tlist = generate_setop_tlist(op->colTypes, op->colCollations,
1099 : : 0, false, lpath_tlist, refnames_tlist,
1100 : : &result_trivial_tlist);
1101 : :
1102 : : /* We should not have needed any type coercions in the tlist */
1103 : : Assert(result_trivial_tlist);
1104 : :
1105 : 624 : *pTargetList = tlist;
1106 : :
1107 : : /* Identify the grouping semantics */
1108 : 624 : groupList = generate_setop_grouplist(op, tlist);
1109 : :
1110 : : /* Check whether the operators support sorting or hashing */
1111 : 624 : can_sort = grouping_is_sortable(groupList);
1112 : 624 : can_hash = grouping_is_hashable(groupList);
1113 [ - + - - ]: 624 : if (!can_sort && !can_hash)
1114 [ # # # # ]: 0 : ereport(ERROR,
1115 : : (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
1116 : : /* translator: %s is INTERSECT or EXCEPT */
1117 : : errmsg("could not implement %s",
1118 : : (op->op == SETOP_INTERSECT) ? "INTERSECT" : "EXCEPT"),
1119 : : errdetail("Some of the datatypes only support hashing, while others only support sorting.")));
1120 : :
1121 [ + - ]: 624 : if (can_sort)
1122 : : {
1123 : : /* Determine the pathkeys for sorting by the whole target list */
1124 : 624 : nonunion_pathkeys = make_pathkeys_for_sortclauses(root, groupList,
1125 : : tlist);
1126 : :
1127 : 624 : root->query_pathkeys = nonunion_pathkeys;
1128 : : }
1129 : :
1130 : : /*
1131 : : * Now that we've got all that info, we can build the child paths.
1132 : : */
1133 [ + + ]: 624 : if (lrel->rtekind == RTE_SUBQUERY)
1134 : 604 : build_setop_child_paths(root, lrel, lpath_trivial_tlist, lpath_tlist,
1135 : : nonunion_pathkeys, &dLeftGroups);
1136 : : else
1137 : 20 : dLeftGroups = lrel->rows;
1138 [ + + ]: 624 : if (rrel->rtekind == RTE_SUBQUERY)
1139 : 614 : build_setop_child_paths(root, rrel, rpath_trivial_tlist, rpath_tlist,
1140 : : nonunion_pathkeys, &dRightGroups);
1141 : : else
1142 : 10 : dRightGroups = rrel->rows;
1143 : :
1144 : : /* Undo effects of forcing tuple_fraction to 0 */
1145 : 624 : root->tuple_fraction = save_fraction;
1146 : :
1147 : : /*
1148 : : * For EXCEPT, we must put the left input first. For INTERSECT, either
1149 : : * order should give the same results, and we prefer to put the smaller
1150 : : * input first in order to (a) minimize the size of the hash table in the
1151 : : * hashing case, and (b) improve our chances of exploiting the executor's
1152 : : * fast path for empty left-hand input. "Smaller" means the one with the
1153 : : * fewer groups.
1154 : : */
1155 [ + + + + ]: 624 : if (op->op != SETOP_EXCEPT && dLeftGroups > dRightGroups)
1156 : : {
1157 : : /* need to swap the two inputs */
1158 : : RelOptInfo *tmprel;
1159 : : List *tmplist;
1160 : : double tmpd;
1161 : :
1162 : 30 : tmprel = lrel;
1163 : 30 : lrel = rrel;
1164 : 30 : rrel = tmprel;
1165 : 30 : tmplist = lpath_tlist;
1166 : 30 : lpath_tlist = rpath_tlist;
1167 : 30 : rpath_tlist = tmplist;
1168 : 30 : tmpd = dLeftGroups;
1169 : 30 : dLeftGroups = dRightGroups;
1170 : 30 : dRightGroups = tmpd;
1171 : : }
1172 : :
1173 : 624 : lpath = lrel->cheapest_total_path;
1174 : 624 : rpath = rrel->cheapest_total_path;
1175 : :
1176 : : /* Build result relation. */
1177 : 624 : result_rel = fetch_upper_rel(root, UPPERREL_SETOP,
1178 : 624 : bms_union(lrel->relids, rrel->relids));
1179 : :
1180 : : /*
1181 : : * Create the PathTarget and set the width accordingly. For EXCEPT, since
1182 : : * the set op result won't contain rows from the rpath, we only account
1183 : : * for the width of the lpath. For INTERSECT, use both input paths.
1184 : : */
1185 [ + + ]: 624 : if (op->op == SETOP_EXCEPT)
1186 : 419 : result_rel->reltarget = create_setop_pathtarget(root, tlist,
1187 : : list_make1(lpath));
1188 : : else
1189 : 205 : result_rel->reltarget = create_setop_pathtarget(root, tlist,
1190 : : list_make2(lpath, rpath));
1191 : :
1192 : : /* Check for provably empty setop inputs and add short-circuit paths. */
1193 [ + + ]: 624 : if (op->op == SETOP_EXCEPT)
1194 : : {
1195 : : /*
1196 : : * For EXCEPTs, if the left side is dummy then there's no need to
1197 : : * inspect the right-hand side as scanning the right to find tuples to
1198 : : * remove won't make the left-hand input any more empty.
1199 : : */
1200 [ + + ]: 419 : if (is_dummy_rel(lrel))
1201 : : {
1202 : 5 : mark_dummy_rel(result_rel);
1203 : :
1204 : 5 : return result_rel;
1205 : : }
1206 : :
1207 : : /* Handle EXCEPTs with dummy right input */
1208 [ + + ]: 414 : if (is_dummy_rel(rrel))
1209 : : {
1210 [ + - ]: 5 : if (op->all)
1211 : : {
1212 : : Path *apath;
1213 : 5 : AppendPathInput append = {0};
1214 : :
1215 : 5 : append.subpaths = list_make1(lpath);
1216 : :
1217 : : /*
1218 : : * EXCEPT ALL: If the right-hand input is dummy then we can
1219 : : * simply scan the left-hand input. To keep createplan.c
1220 : : * happy, use a single child Append to handle the translation
1221 : : * between the set op targetlist and the targetlist of the
1222 : : * left input. The Append will be removed in setrefs.c.
1223 : : */
1224 : 5 : apath = (Path *) create_append_path(root, result_rel,
1225 : : append, NIL, NULL, 0,
1226 : : false, -1);
1227 : :
1228 : 5 : add_path(result_rel, apath);
1229 : :
1230 : 5 : return result_rel;
1231 : : }
1232 : : else
1233 : : {
1234 : : /*
1235 : : * To make EXCEPT with a dummy RHS work means having to
1236 : : * deduplicate the left input. That could be done with
1237 : : * AggPaths, but it doesn't seem worth the effort. Let the
1238 : : * normal path generation code below handle this one.
1239 : : */
1240 : : }
1241 : : }
1242 : : }
1243 : : else
1244 : : {
1245 : : /*
1246 : : * For INTERSECT, if either input is a dummy rel then we can mark the
1247 : : * result_rel as dummy since intersecting with an empty relation can
1248 : : * never yield any results. This is true regardless of INTERSECT or
1249 : : * INTERSECT ALL.
1250 : : */
1251 [ + + - + ]: 205 : if (is_dummy_rel(lrel) || is_dummy_rel(rrel))
1252 : : {
1253 : 15 : mark_dummy_rel(result_rel);
1254 : :
1255 : 15 : return result_rel;
1256 : : }
1257 : : }
1258 : :
1259 : : /*
1260 : : * Estimate number of distinct groups that we'll need hashtable entries
1261 : : * for; this is the size of the left-hand input for EXCEPT, or the smaller
1262 : : * input for INTERSECT. Also estimate the number of eventual output rows.
1263 : : * In non-ALL cases, we estimate each group produces one output row; in
1264 : : * ALL cases use the relevant relation size. These are worst-case
1265 : : * estimates, of course, but we need to be conservative.
1266 : : */
1267 [ + + ]: 599 : if (op->op == SETOP_EXCEPT)
1268 : : {
1269 : 409 : dNumGroups = dLeftGroups;
1270 [ + + ]: 409 : dNumOutputRows = op->all ? lpath->rows : dNumGroups;
1271 : : }
1272 : : else
1273 : : {
1274 : 190 : dNumGroups = dLeftGroups;
1275 [ + + - + ]: 190 : dNumOutputRows = op->all ? Min(lpath->rows, rpath->rows) : dNumGroups;
1276 : : }
1277 : 599 : result_rel->rows = dNumOutputRows;
1278 : :
1279 : : /* Select the SetOpCmd type */
1280 [ + + - ]: 599 : switch (op->op)
1281 : : {
1282 : 190 : case SETOP_INTERSECT:
1283 : 190 : cmd = op->all ? SETOPCMD_INTERSECT_ALL : SETOPCMD_INTERSECT;
1284 : 190 : break;
1285 : 409 : case SETOP_EXCEPT:
1286 [ + + ]: 409 : cmd = op->all ? SETOPCMD_EXCEPT_ALL : SETOPCMD_EXCEPT;
1287 : 409 : break;
1288 : 0 : default:
1289 [ # # ]: 0 : elog(ERROR, "unrecognized set op: %d", (int) op->op);
1290 : : cmd = SETOPCMD_INTERSECT; /* keep compiler quiet */
1291 : : break;
1292 : : }
1293 : :
1294 : : /*
1295 : : * If we can hash, that just requires a SetOp atop the cheapest inputs.
1296 : : */
1297 [ + + ]: 599 : if (can_hash)
1298 : : {
1299 : 549 : path = (Path *) create_setop_path(root,
1300 : : result_rel,
1301 : : lpath,
1302 : : rpath,
1303 : : cmd,
1304 : : SETOP_HASHED,
1305 : : groupList,
1306 : : dNumGroups,
1307 : : dNumOutputRows);
1308 : 549 : add_path(result_rel, path);
1309 : : }
1310 : :
1311 : : /*
1312 : : * If we can sort, generate the cheapest sorted input paths, and add a
1313 : : * SetOp atop those.
1314 : : */
1315 [ + - ]: 599 : if (can_sort)
1316 : : {
1317 : : List *pathkeys;
1318 : : Path *slpath,
1319 : : *srpath;
1320 : :
1321 : : /* First the left input ... */
1322 : 599 : pathkeys = make_pathkeys_for_sortclauses(root,
1323 : : groupList,
1324 : : lpath_tlist);
1325 [ + + ]: 599 : if (pathkeys_contained_in(pathkeys, lpath->pathkeys))
1326 : 80 : slpath = lpath; /* cheapest path is already sorted */
1327 : : else
1328 : : {
1329 : 519 : slpath = get_cheapest_path_for_pathkeys(lrel->pathlist,
1330 : : nonunion_pathkeys,
1331 : : NULL,
1332 : : TOTAL_COST,
1333 : : false);
1334 : : /* Subquery failed to produce any presorted paths? */
1335 [ + + ]: 519 : if (slpath == NULL)
1336 : 165 : slpath = (Path *) create_sort_path(root,
1337 : : lpath->parent,
1338 : : lpath,
1339 : : pathkeys,
1340 : : -1.0);
1341 : : }
1342 : :
1343 : : /* and now the same for the right. */
1344 : 599 : pathkeys = make_pathkeys_for_sortclauses(root,
1345 : : groupList,
1346 : : rpath_tlist);
1347 [ + + ]: 599 : if (pathkeys_contained_in(pathkeys, rpath->pathkeys))
1348 : 90 : srpath = rpath; /* cheapest path is already sorted */
1349 : : else
1350 : : {
1351 : 509 : srpath = get_cheapest_path_for_pathkeys(rrel->pathlist,
1352 : : nonunion_pathkeys,
1353 : : NULL,
1354 : : TOTAL_COST,
1355 : : false);
1356 : : /* Subquery failed to produce any presorted paths? */
1357 [ + + ]: 509 : if (srpath == NULL)
1358 : 165 : srpath = (Path *) create_sort_path(root,
1359 : : rpath->parent,
1360 : : rpath,
1361 : : pathkeys,
1362 : : -1.0);
1363 : : }
1364 : :
1365 : 599 : path = (Path *) create_setop_path(root,
1366 : : result_rel,
1367 : : slpath,
1368 : : srpath,
1369 : : cmd,
1370 : : SETOP_SORTED,
1371 : : groupList,
1372 : : dNumGroups,
1373 : : dNumOutputRows);
1374 : 599 : add_path(result_rel, path);
1375 : : }
1376 : :
1377 : 599 : return result_rel;
1378 : : }
1379 : :
1380 : : /*
1381 : : * Pull up children of a UNION node that are identically-propertied UNIONs,
1382 : : * and perform planning of the queries underneath the N-way UNION.
1383 : : *
1384 : : * The result is a list of RelOptInfos containing Paths for sub-nodes, with
1385 : : * one entry for each descendant that is a leaf query or non-identical setop.
1386 : : * We also return parallel lists of the childrens' targetlists and
1387 : : * is-trivial-tlist flags.
1388 : : *
1389 : : * NOTE: we can also pull a UNION ALL up into a UNION, since the distinct
1390 : : * output rows will be lost anyway.
1391 : : */
1392 : : static List *
1393 : 3719 : plan_union_children(PlannerInfo *root,
1394 : : SetOperationStmt *top_union,
1395 : : List *refnames_tlist,
1396 : : List **tlist_list,
1397 : : List **istrivial_tlist)
1398 : : {
1399 : 3719 : List *pending_rels = list_make1(top_union);
1400 : 3719 : List *result = NIL;
1401 : : List *child_tlist;
1402 : : bool trivial_tlist;
1403 : :
1404 : 3719 : *tlist_list = NIL;
1405 : 3719 : *istrivial_tlist = NIL;
1406 : :
1407 [ + + ]: 21160 : while (pending_rels != NIL)
1408 : : {
1409 : 17441 : Node *setOp = linitial(pending_rels);
1410 : :
1411 : 17441 : pending_rels = list_delete_first(pending_rels);
1412 : :
1413 [ + + ]: 17441 : if (IsA(setOp, SetOperationStmt))
1414 : : {
1415 : 6971 : SetOperationStmt *op = (SetOperationStmt *) setOp;
1416 : :
1417 [ + + ]: 6971 : if (op->op == top_union->op &&
1418 [ + + + + : 13767 : (op->all == top_union->all || op->all) &&
+ + ]
1419 [ + - ]: 13737 : equal(op->colTypes, top_union->colTypes) &&
1420 : 6861 : equal(op->colCollations, top_union->colCollations))
1421 : : {
1422 : : /* Same UNION, so fold children into parent */
1423 : 6861 : pending_rels = lcons(op->rarg, pending_rels);
1424 : 6861 : pending_rels = lcons(op->larg, pending_rels);
1425 : 6861 : continue;
1426 : : }
1427 : : }
1428 : :
1429 : : /*
1430 : : * Not same, so plan this child separately.
1431 : : *
1432 : : * If top_union isn't a UNION ALL, then we are interested in sorted
1433 : : * output from the child, so pass top_union as parentOp. Note that
1434 : : * this isn't necessarily the child node's immediate SetOperationStmt
1435 : : * parent, but that's fine: it's the effective parent.
1436 : : */
1437 : 10580 : result = lappend(result, recurse_set_operations(setOp, root,
1438 [ + + ]: 10580 : top_union->all ? NULL : top_union,
1439 : : top_union->colTypes,
1440 : : top_union->colCollations,
1441 : : refnames_tlist,
1442 : : &child_tlist,
1443 : : &trivial_tlist));
1444 : 10580 : *tlist_list = lappend(*tlist_list, child_tlist);
1445 : 10580 : *istrivial_tlist = lappend_int(*istrivial_tlist, trivial_tlist);
1446 : : }
1447 : :
1448 : 3719 : return result;
1449 : : }
1450 : :
1451 : : /*
1452 : : * postprocess_setop_rel - perform steps required after adding paths
1453 : : */
1454 : : static void
1455 : 17933 : postprocess_setop_rel(PlannerInfo *root, RelOptInfo *rel)
1456 : : {
1457 : : /*
1458 : : * We don't currently worry about allowing FDWs to contribute paths to
1459 : : * this relation, but give extensions a chance.
1460 : : */
1461 [ - + ]: 17933 : if (create_upper_paths_hook)
1462 : 0 : (*create_upper_paths_hook) (root, UPPERREL_SETOP,
1463 : : NULL, rel, NULL);
1464 : :
1465 : : /* Select cheapest path */
1466 : 17933 : set_cheapest(rel);
1467 : 17933 : }
1468 : :
1469 : : /*
1470 : : * Generate targetlist for a set-operation plan node
1471 : : *
1472 : : * colTypes: OID list of set-op's result column datatypes
1473 : : * colCollations: OID list of set-op's result column collations
1474 : : * varno: varno to use in generated Vars
1475 : : * hack_constants: true to copy up constants (see comments in code)
1476 : : * input_tlist: targetlist of this node's input node
1477 : : * refnames_tlist: targetlist to take column names from
1478 : : * trivial_tlist: output parameter, set to true if targetlist is trivial
1479 : : */
1480 : : static List *
1481 : 13596 : generate_setop_tlist(List *colTypes, List *colCollations,
1482 : : Index varno,
1483 : : bool hack_constants,
1484 : : List *input_tlist,
1485 : : List *refnames_tlist,
1486 : : bool *trivial_tlist)
1487 : : {
1488 : 13596 : List *tlist = NIL;
1489 : 13596 : int resno = 1;
1490 : : ListCell *ctlc,
1491 : : *cclc,
1492 : : *itlc,
1493 : : *rtlc;
1494 : : TargetEntry *tle;
1495 : : Node *expr;
1496 : :
1497 : 13596 : *trivial_tlist = true; /* until proven differently */
1498 : :
1499 [ + + + + : 54379 : forfour(ctlc, colTypes, cclc, colCollations,
+ + + + +
+ + + + +
+ + + + +
- + - + -
+ + ]
1500 : : itlc, input_tlist, rtlc, refnames_tlist)
1501 : : {
1502 : 40783 : Oid colType = lfirst_oid(ctlc);
1503 : 40783 : Oid colColl = lfirst_oid(cclc);
1504 : 40783 : TargetEntry *inputtle = (TargetEntry *) lfirst(itlc);
1505 : 40783 : TargetEntry *reftle = (TargetEntry *) lfirst(rtlc);
1506 : :
1507 : : Assert(inputtle->resno == resno);
1508 : : Assert(reftle->resno == resno);
1509 : : Assert(!inputtle->resjunk);
1510 : : Assert(!reftle->resjunk);
1511 : :
1512 : : /*
1513 : : * Generate columns referencing input columns and having appropriate
1514 : : * data types and column names. Insert datatype coercions where
1515 : : * necessary.
1516 : : *
1517 : : * HACK: constants in the input's targetlist are copied up as-is
1518 : : * rather than being referenced as subquery outputs. This is mainly
1519 : : * to ensure that when we try to coerce them to the output column's
1520 : : * datatype, the right things happen for UNKNOWN constants. But do
1521 : : * this only at the first level of subquery-scan plans; we don't want
1522 : : * phony constants appearing in the output tlists of upper-level
1523 : : * nodes!
1524 : : *
1525 : : * Note that copying a constant doesn't in itself require us to mark
1526 : : * the tlist nontrivial; see trivial_subqueryscan() in setrefs.c.
1527 : : */
1528 [ + + + - : 40783 : if (hack_constants && inputtle->expr && IsA(inputtle->expr, Const))
+ + ]
1529 : 12961 : expr = (Node *) inputtle->expr;
1530 : : else
1531 : 111288 : expr = (Node *) makeVar(varno,
1532 : 27822 : inputtle->resno,
1533 : 27822 : exprType((Node *) inputtle->expr),
1534 : 27822 : exprTypmod((Node *) inputtle->expr),
1535 : 27822 : exprCollation((Node *) inputtle->expr),
1536 : : 0);
1537 : :
1538 [ + + ]: 40783 : if (exprType(expr) != colType)
1539 : : {
1540 : : /*
1541 : : * Note: it's not really cool to be applying coerce_to_common_type
1542 : : * here; one notable point is that assign_expr_collations never
1543 : : * gets run on any generated nodes. For the moment that's not a
1544 : : * problem because we force the correct exposed collation below.
1545 : : * It would likely be best to make the parser generate the correct
1546 : : * output tlist for every set-op to begin with, though.
1547 : : */
1548 : 1124 : expr = coerce_to_common_type(NULL, /* no UNKNOWNs here */
1549 : : expr,
1550 : : colType,
1551 : : "UNION/INTERSECT/EXCEPT");
1552 : 1124 : *trivial_tlist = false; /* the coercion makes it not trivial */
1553 : : }
1554 : :
1555 : : /*
1556 : : * Ensure the tlist entry's exposed collation matches the set-op. This
1557 : : * is necessary because plan_set_operations() reports the result
1558 : : * ordering as a list of SortGroupClauses, which don't carry collation
1559 : : * themselves but just refer to tlist entries. If we don't show the
1560 : : * right collation then planner.c might do the wrong thing in
1561 : : * higher-level queries.
1562 : : *
1563 : : * Note we use RelabelType, not CollateExpr, since this expression
1564 : : * will reach the executor without any further processing.
1565 : : */
1566 [ + + ]: 40783 : if (exprCollation(expr) != colColl)
1567 : : {
1568 : 10915 : expr = applyRelabelType(expr,
1569 : : exprType(expr), exprTypmod(expr), colColl,
1570 : : COERCE_IMPLICIT_CAST, -1, false);
1571 : 10915 : *trivial_tlist = false; /* the relabel makes it not trivial */
1572 : : }
1573 : :
1574 : 81566 : tle = makeTargetEntry((Expr *) expr,
1575 : 40783 : (AttrNumber) resno++,
1576 : 40783 : pstrdup(reftle->resname),
1577 : : false);
1578 : :
1579 : : /*
1580 : : * By convention, all output columns in a setop tree have
1581 : : * ressortgroupref equal to their resno. In some cases the ref isn't
1582 : : * needed, but this is a cleaner way than modifying the tlist later.
1583 : : */
1584 : 40783 : tle->ressortgroupref = tle->resno;
1585 : :
1586 : 40783 : tlist = lappend(tlist, tle);
1587 : : }
1588 : :
1589 : 13596 : return tlist;
1590 : : }
1591 : :
1592 : : /*
1593 : : * Generate targetlist for a set-operation Append node
1594 : : *
1595 : : * colTypes: OID list of set-op's result column datatypes
1596 : : * colCollations: OID list of set-op's result column collations
1597 : : * input_tlists: list of tlists for sub-plans of the Append
1598 : : * refnames_tlist: targetlist to take column names from
1599 : : *
1600 : : * The entries in the Append's targetlist should always be simple Vars;
1601 : : * we just have to make sure they have the right datatypes/typmods/collations.
1602 : : * The Vars are always generated with varno 0.
1603 : : *
1604 : : * XXX a problem with the varno-zero approach is that set_pathtarget_cost_width
1605 : : * cannot figure out a realistic width for the tlist we make here. But we
1606 : : * ought to refactor this code to produce a PathTarget directly, anyway.
1607 : : */
1608 : : static List *
1609 : 4356 : generate_append_tlist(List *colTypes, List *colCollations,
1610 : : List *input_tlists,
1611 : : List *refnames_tlist)
1612 : : {
1613 : 4356 : List *tlist = NIL;
1614 : 4356 : int resno = 1;
1615 : : ListCell *curColType;
1616 : : ListCell *curColCollation;
1617 : : ListCell *ref_tl_item;
1618 : : int colindex;
1619 : : TargetEntry *tle;
1620 : : Node *expr;
1621 : : ListCell *tlistl;
1622 : : int32 *colTypmods;
1623 : :
1624 : : /*
1625 : : * First extract typmods to use.
1626 : : *
1627 : : * If the inputs all agree on type and typmod of a particular column, use
1628 : : * that typmod; else use -1.
1629 : : */
1630 : 4356 : colTypmods = palloc_array(int32, list_length(colTypes));
1631 : :
1632 [ + - + + : 16210 : foreach(tlistl, input_tlists)
+ + ]
1633 : : {
1634 : 11854 : List *subtlist = (List *) lfirst(tlistl);
1635 : : ListCell *subtlistl;
1636 : :
1637 : 11854 : curColType = list_head(colTypes);
1638 : 11854 : colindex = 0;
1639 [ + + + + : 46126 : foreach(subtlistl, subtlist)
+ + ]
1640 : : {
1641 : 34272 : TargetEntry *subtle = (TargetEntry *) lfirst(subtlistl);
1642 : :
1643 : : Assert(!subtle->resjunk);
1644 : : Assert(curColType != NULL);
1645 [ + - ]: 34272 : if (exprType((Node *) subtle->expr) == lfirst_oid(curColType))
1646 : : {
1647 : : /* If first subplan, copy the typmod; else compare */
1648 : 34272 : int32 subtypmod = exprTypmod((Node *) subtle->expr);
1649 : :
1650 [ + + ]: 34272 : if (tlistl == list_head(input_tlists))
1651 : 11840 : colTypmods[colindex] = subtypmod;
1652 [ + + ]: 22432 : else if (subtypmod != colTypmods[colindex])
1653 : 10 : colTypmods[colindex] = -1;
1654 : : }
1655 : : else
1656 : : {
1657 : : /* types disagree, so force typmod to -1 */
1658 : 0 : colTypmods[colindex] = -1;
1659 : : }
1660 : 34272 : curColType = lnext(colTypes, curColType);
1661 : 34272 : colindex++;
1662 : : }
1663 : : Assert(curColType == NULL);
1664 : : }
1665 : :
1666 : : /*
1667 : : * Now we can build the tlist for the Append.
1668 : : */
1669 : 4356 : colindex = 0;
1670 [ + + + + : 16196 : forthree(curColType, colTypes, curColCollation, colCollations,
+ + + + +
+ + + + +
+ - + - +
+ ]
1671 : : ref_tl_item, refnames_tlist)
1672 : : {
1673 : 11840 : Oid colType = lfirst_oid(curColType);
1674 : 11840 : int32 colTypmod = colTypmods[colindex++];
1675 : 11840 : Oid colColl = lfirst_oid(curColCollation);
1676 : 11840 : TargetEntry *reftle = (TargetEntry *) lfirst(ref_tl_item);
1677 : :
1678 : : Assert(reftle->resno == resno);
1679 : : Assert(!reftle->resjunk);
1680 : 11840 : expr = (Node *) makeVar(0,
1681 : : resno,
1682 : : colType,
1683 : : colTypmod,
1684 : : colColl,
1685 : : 0);
1686 : 23680 : tle = makeTargetEntry((Expr *) expr,
1687 : 11840 : (AttrNumber) resno++,
1688 : 11840 : pstrdup(reftle->resname),
1689 : : false);
1690 : :
1691 : : /*
1692 : : * By convention, all output columns in a setop tree have
1693 : : * ressortgroupref equal to their resno. In some cases the ref isn't
1694 : : * needed, but this is a cleaner way than modifying the tlist later.
1695 : : */
1696 : 11840 : tle->ressortgroupref = tle->resno;
1697 : :
1698 : 11840 : tlist = lappend(tlist, tle);
1699 : : }
1700 : :
1701 : 4356 : pfree(colTypmods);
1702 : :
1703 : 4356 : return tlist;
1704 : : }
1705 : :
1706 : : /*
1707 : : * generate_setop_grouplist
1708 : : * Build a SortGroupClause list defining the sort/grouping properties
1709 : : * of the setop's output columns.
1710 : : *
1711 : : * Parse analysis already determined the properties and built a suitable
1712 : : * list, except that the entries do not have sortgrouprefs set because
1713 : : * the parser output representation doesn't include a tlist for each
1714 : : * setop. So what we need to do here is copy that list and install
1715 : : * proper sortgrouprefs into it (copying those from the targetlist).
1716 : : */
1717 : : static List *
1718 : 4118 : generate_setop_grouplist(SetOperationStmt *op, List *targetlist)
1719 : : {
1720 : 4118 : List *grouplist = copyObject(op->groupClauses);
1721 : : ListCell *lg;
1722 : : ListCell *lt;
1723 : :
1724 : 4118 : lg = list_head(grouplist);
1725 [ + + + + : 15825 : foreach(lt, targetlist)
+ + ]
1726 : : {
1727 : 11707 : TargetEntry *tle = (TargetEntry *) lfirst(lt);
1728 : : SortGroupClause *sgc;
1729 : :
1730 : : Assert(!tle->resjunk);
1731 : :
1732 : : /* non-resjunk columns should have sortgroupref = resno */
1733 : : Assert(tle->ressortgroupref == tle->resno);
1734 : :
1735 : : /* non-resjunk columns should have grouping clauses */
1736 : : Assert(lg != NULL);
1737 : 11707 : sgc = (SortGroupClause *) lfirst(lg);
1738 : 11707 : lg = lnext(grouplist, lg);
1739 : : Assert(sgc->tleSortGroupRef == 0);
1740 : :
1741 : 11707 : sgc->tleSortGroupRef = tle->ressortgroupref;
1742 : : }
1743 : : Assert(lg == NULL);
1744 : 4118 : return grouplist;
1745 : : }
1746 : :
1747 : : /*
1748 : : * create_setop_pathtarget
1749 : : * Do the normal create_pathtarget() work, plus set the resulting
1750 : : * PathTarget's width to the average width of the Paths in child_pathlist
1751 : : * weighted using the estimated row count of each path.
1752 : : *
1753 : : * Note: This is required because set op target lists use varno==0, which
1754 : : * results in a type default width estimate rather than one that's based on
1755 : : * statistics of the columns from the set op children.
1756 : : */
1757 : : static PathTarget *
1758 : 4343 : create_setop_pathtarget(PlannerInfo *root, List *tlist, List *child_pathlist)
1759 : : {
1760 : : PathTarget *reltarget;
1761 : : ListCell *lc;
1762 : 4343 : double parent_rows = 0;
1763 : 4343 : double parent_size = 0;
1764 : :
1765 : 4343 : reltarget = create_pathtarget(root, tlist);
1766 : :
1767 : : /* Calculate the total rows and total size. */
1768 [ + + + + : 15714 : foreach(lc, child_pathlist)
+ + ]
1769 : : {
1770 : 11371 : Path *path = (Path *) lfirst(lc);
1771 : :
1772 : 11371 : parent_rows += path->rows;
1773 : 11371 : parent_size += path->parent->reltarget->width * path->rows;
1774 : : }
1775 : :
1776 [ + + ]: 4343 : if (parent_rows > 0)
1777 : 4328 : reltarget->width = rint(parent_size / parent_rows);
1778 : :
1779 : 4343 : return reltarget;
1780 : : }
|