Line data Source code
1 : /*-------------------------------------------------------------------------
2 : *
3 : * allpaths.c
4 : * Routines to find possible search paths for processing a query
5 : *
6 : * Portions Copyright (c) 1996-2026, PostgreSQL Global Development Group
7 : * Portions Copyright (c) 1994, Regents of the University of California
8 : *
9 : *
10 : * IDENTIFICATION
11 : * src/backend/optimizer/path/allpaths.c
12 : *
13 : *-------------------------------------------------------------------------
14 : */
15 :
16 : #include "postgres.h"
17 :
18 : #include <limits.h>
19 : #include <math.h>
20 :
21 : #include "access/sysattr.h"
22 : #include "access/tsmapi.h"
23 : #include "catalog/pg_class.h"
24 : #include "catalog/pg_operator.h"
25 : #include "catalog/pg_proc.h"
26 : #include "foreign/fdwapi.h"
27 : #include "miscadmin.h"
28 : #include "nodes/makefuncs.h"
29 : #include "nodes/nodeFuncs.h"
30 : #include "nodes/supportnodes.h"
31 : #ifdef OPTIMIZER_DEBUG
32 : #include "nodes/print.h"
33 : #endif
34 : #include "optimizer/appendinfo.h"
35 : #include "optimizer/clauses.h"
36 : #include "optimizer/cost.h"
37 : #include "optimizer/geqo.h"
38 : #include "optimizer/optimizer.h"
39 : #include "optimizer/pathnode.h"
40 : #include "optimizer/paths.h"
41 : #include "optimizer/plancat.h"
42 : #include "optimizer/planner.h"
43 : #include "optimizer/prep.h"
44 : #include "optimizer/tlist.h"
45 : #include "parser/parse_clause.h"
46 : #include "parser/parsetree.h"
47 : #include "partitioning/partbounds.h"
48 : #include "port/pg_bitutils.h"
49 : #include "rewrite/rewriteManip.h"
50 : #include "utils/lsyscache.h"
51 : #include "utils/selfuncs.h"
52 :
53 :
54 : /* Bitmask flags for pushdown_safety_info.unsafeFlags */
55 : #define UNSAFE_HAS_VOLATILE_FUNC (1 << 0)
56 : #define UNSAFE_HAS_SET_FUNC (1 << 1)
57 : #define UNSAFE_NOTIN_DISTINCTON_CLAUSE (1 << 2)
58 : #define UNSAFE_NOTIN_PARTITIONBY_CLAUSE (1 << 3)
59 : #define UNSAFE_TYPE_MISMATCH (1 << 4)
60 :
61 : /* results of subquery_is_pushdown_safe */
62 : typedef struct pushdown_safety_info
63 : {
64 : unsigned char *unsafeFlags; /* bitmask of reasons why this target list
65 : * column is unsafe for qual pushdown, or 0 if
66 : * no reason. */
67 : bool unsafeVolatile; /* don't push down volatile quals */
68 : bool unsafeLeaky; /* don't push down leaky quals */
69 : } pushdown_safety_info;
70 :
71 : /* Return type for qual_is_pushdown_safe */
72 : typedef enum pushdown_safe_type
73 : {
74 : PUSHDOWN_UNSAFE, /* unsafe to push qual into subquery */
75 : PUSHDOWN_SAFE, /* safe to push qual into subquery */
76 : PUSHDOWN_WINDOWCLAUSE_RUNCOND, /* unsafe, but may work as WindowClause
77 : * run condition */
78 : } pushdown_safe_type;
79 :
80 : /* These parameters are set by GUC */
81 : bool enable_geqo = false; /* just in case GUC doesn't set it */
82 : bool enable_eager_aggregate = true;
83 : int geqo_threshold;
84 : double min_eager_agg_group_size;
85 : int min_parallel_table_scan_size;
86 : int min_parallel_index_scan_size;
87 :
88 : /* Hook for plugins to get control in set_rel_pathlist() */
89 : set_rel_pathlist_hook_type set_rel_pathlist_hook = NULL;
90 :
91 : /* Hook for plugins to replace standard_join_search() */
92 : join_search_hook_type join_search_hook = NULL;
93 :
94 :
95 : static void set_base_rel_consider_startup(PlannerInfo *root);
96 : static void set_base_rel_sizes(PlannerInfo *root);
97 : static void setup_simple_grouped_rels(PlannerInfo *root);
98 : static void set_base_rel_pathlists(PlannerInfo *root);
99 : static void set_rel_size(PlannerInfo *root, RelOptInfo *rel,
100 : Index rti, RangeTblEntry *rte);
101 : static void set_rel_pathlist(PlannerInfo *root, RelOptInfo *rel,
102 : Index rti, RangeTblEntry *rte);
103 : static void set_plain_rel_size(PlannerInfo *root, RelOptInfo *rel,
104 : RangeTblEntry *rte);
105 : static void create_plain_partial_paths(PlannerInfo *root, RelOptInfo *rel);
106 : static void set_rel_consider_parallel(PlannerInfo *root, RelOptInfo *rel,
107 : RangeTblEntry *rte);
108 : static void set_plain_rel_pathlist(PlannerInfo *root, RelOptInfo *rel,
109 : RangeTblEntry *rte);
110 : static void set_tablesample_rel_size(PlannerInfo *root, RelOptInfo *rel,
111 : RangeTblEntry *rte);
112 : static void set_tablesample_rel_pathlist(PlannerInfo *root, RelOptInfo *rel,
113 : RangeTblEntry *rte);
114 : static void set_foreign_size(PlannerInfo *root, RelOptInfo *rel,
115 : RangeTblEntry *rte);
116 : static void set_foreign_pathlist(PlannerInfo *root, RelOptInfo *rel,
117 : RangeTblEntry *rte);
118 : static void set_append_rel_size(PlannerInfo *root, RelOptInfo *rel,
119 : Index rti, RangeTblEntry *rte);
120 : static void set_append_rel_pathlist(PlannerInfo *root, RelOptInfo *rel,
121 : Index rti, RangeTblEntry *rte);
122 : static void set_grouped_rel_pathlist(PlannerInfo *root, RelOptInfo *rel);
123 : static void generate_orderedappend_paths(PlannerInfo *root, RelOptInfo *rel,
124 : List *live_childrels,
125 : List *all_child_pathkeys);
126 : static Path *get_cheapest_parameterized_child_path(PlannerInfo *root,
127 : RelOptInfo *rel,
128 : Relids required_outer);
129 : static void accumulate_append_subpath(Path *path,
130 : List **subpaths,
131 : List **special_subpaths,
132 : List **child_append_relid_sets);
133 : static Path *get_singleton_append_subpath(Path *path,
134 : List **child_append_relid_sets);
135 : static void set_dummy_rel_pathlist(RelOptInfo *rel);
136 : static void set_subquery_pathlist(PlannerInfo *root, RelOptInfo *rel,
137 : Index rti, RangeTblEntry *rte);
138 : static void set_function_pathlist(PlannerInfo *root, RelOptInfo *rel,
139 : RangeTblEntry *rte);
140 : static void set_values_pathlist(PlannerInfo *root, RelOptInfo *rel,
141 : RangeTblEntry *rte);
142 : static void set_tablefunc_pathlist(PlannerInfo *root, RelOptInfo *rel,
143 : RangeTblEntry *rte);
144 : static void set_cte_pathlist(PlannerInfo *root, RelOptInfo *rel,
145 : RangeTblEntry *rte);
146 : static void set_namedtuplestore_pathlist(PlannerInfo *root, RelOptInfo *rel,
147 : RangeTblEntry *rte);
148 : static void set_result_pathlist(PlannerInfo *root, RelOptInfo *rel,
149 : RangeTblEntry *rte);
150 : static void set_worktable_pathlist(PlannerInfo *root, RelOptInfo *rel,
151 : RangeTblEntry *rte);
152 : static RelOptInfo *make_rel_from_joinlist(PlannerInfo *root, List *joinlist);
153 : static bool subquery_is_pushdown_safe(Query *subquery, Query *topquery,
154 : pushdown_safety_info *safetyInfo);
155 : static bool recurse_pushdown_safe(Node *setOp, Query *topquery,
156 : pushdown_safety_info *safetyInfo);
157 : static void check_output_expressions(Query *subquery,
158 : pushdown_safety_info *safetyInfo);
159 : static void compare_tlist_datatypes(List *tlist, List *colTypes,
160 : pushdown_safety_info *safetyInfo);
161 : static bool targetIsInAllPartitionLists(TargetEntry *tle, Query *query);
162 : static pushdown_safe_type qual_is_pushdown_safe(Query *subquery, Index rti,
163 : RestrictInfo *rinfo,
164 : pushdown_safety_info *safetyInfo);
165 : static void subquery_push_qual(Query *subquery,
166 : RangeTblEntry *rte, Index rti, Node *qual);
167 : static void recurse_push_qual(Node *setOp, Query *topquery,
168 : RangeTblEntry *rte, Index rti, Node *qual);
169 : static void remove_unused_subquery_outputs(Query *subquery, RelOptInfo *rel,
170 : Bitmapset *extra_used_attrs);
171 :
172 :
173 : /*
174 : * make_one_rel
175 : * Finds all possible access paths for executing a query, returning a
176 : * single rel that represents the join of all base rels in the query.
177 : */
178 : RelOptInfo *
179 253299 : make_one_rel(PlannerInfo *root, List *joinlist)
180 : {
181 : RelOptInfo *rel;
182 : Index rti;
183 : double total_pages;
184 :
185 : /* Mark base rels as to whether we care about fast-start plans */
186 253299 : set_base_rel_consider_startup(root);
187 :
188 : /*
189 : * Compute size estimates and consider_parallel flags for each base rel.
190 : */
191 253299 : set_base_rel_sizes(root);
192 :
193 : /*
194 : * Build grouped relations for simple rels (i.e., base or "other" member
195 : * relations) where possible.
196 : */
197 253277 : setup_simple_grouped_rels(root);
198 :
199 : /*
200 : * We should now have size estimates for every actual table involved in
201 : * the query, and we also know which if any have been deleted from the
202 : * query by join removal, pruned by partition pruning, or eliminated by
203 : * constraint exclusion. So we can now compute total_table_pages.
204 : *
205 : * Note that appendrels are not double-counted here, even though we don't
206 : * bother to distinguish RelOptInfos for appendrel parents, because the
207 : * parents will have pages = 0.
208 : *
209 : * XXX if a table is self-joined, we will count it once per appearance,
210 : * which perhaps is the wrong thing ... but that's not completely clear,
211 : * and detecting self-joins here is difficult, so ignore it for now.
212 : */
213 253277 : total_pages = 0;
214 794238 : for (rti = 1; rti < root->simple_rel_array_size; rti++)
215 : {
216 540961 : RelOptInfo *brel = root->simple_rel_array[rti];
217 :
218 : /* there may be empty slots corresponding to non-baserel RTEs */
219 540961 : if (brel == NULL)
220 127684 : continue;
221 :
222 : Assert(brel->relid == rti); /* sanity check on array */
223 :
224 413277 : if (IS_DUMMY_REL(brel))
225 1261 : continue;
226 :
227 412016 : if (IS_SIMPLE_REL(brel))
228 412016 : total_pages += (double) brel->pages;
229 : }
230 253277 : root->total_table_pages = total_pages;
231 :
232 : /*
233 : * Generate access paths for each base rel.
234 : */
235 253277 : set_base_rel_pathlists(root);
236 :
237 : /*
238 : * Generate access paths for the entire join tree.
239 : */
240 253277 : rel = make_rel_from_joinlist(root, joinlist);
241 :
242 : /*
243 : * The result should join all and only the query's base + outer-join rels.
244 : */
245 : Assert(bms_equal(rel->relids, root->all_query_rels));
246 :
247 253277 : return rel;
248 : }
249 :
250 : /*
251 : * set_base_rel_consider_startup
252 : * Set the consider_[param_]startup flags for each base-relation entry.
253 : *
254 : * For the moment, we only deal with consider_param_startup here; because the
255 : * logic for consider_startup is pretty trivial and is the same for every base
256 : * relation, we just let build_simple_rel() initialize that flag correctly to
257 : * start with. If that logic ever gets more complicated it would probably
258 : * be better to move it here.
259 : */
260 : static void
261 253299 : set_base_rel_consider_startup(PlannerInfo *root)
262 : {
263 : /*
264 : * Since parameterized paths can only be used on the inside of a nestloop
265 : * join plan, there is usually little value in considering fast-start
266 : * plans for them. However, for relations that are on the RHS of a SEMI
267 : * or ANTI join, a fast-start plan can be useful because we're only going
268 : * to care about fetching one tuple anyway.
269 : *
270 : * To minimize growth of planning time, we currently restrict this to
271 : * cases where the RHS is a single base relation, not a join; there is no
272 : * provision for consider_param_startup to get set at all on joinrels.
273 : * Also we don't worry about appendrels. costsize.c's costing rules for
274 : * nestloop semi/antijoins don't consider such cases either.
275 : */
276 : ListCell *lc;
277 :
278 288035 : foreach(lc, root->join_info_list)
279 : {
280 34736 : SpecialJoinInfo *sjinfo = (SpecialJoinInfo *) lfirst(lc);
281 : int varno;
282 :
283 44348 : if ((sjinfo->jointype == JOIN_SEMI || sjinfo->jointype == JOIN_ANTI) &&
284 9612 : bms_get_singleton_member(sjinfo->syn_righthand, &varno))
285 : {
286 9433 : RelOptInfo *rel = find_base_rel(root, varno);
287 :
288 9433 : rel->consider_param_startup = true;
289 : }
290 : }
291 253299 : }
292 :
293 : /*
294 : * set_base_rel_sizes
295 : * Set the size estimates (rows and widths) for each base-relation entry.
296 : * Also determine whether to consider parallel paths for base relations.
297 : *
298 : * We do this in a separate pass over the base rels so that rowcount
299 : * estimates are available for parameterized path generation, and also so
300 : * that each rel's consider_parallel flag is set correctly before we begin to
301 : * generate paths.
302 : */
303 : static void
304 253299 : set_base_rel_sizes(PlannerInfo *root)
305 : {
306 : Index rti;
307 :
308 794261 : for (rti = 1; rti < root->simple_rel_array_size; rti++)
309 : {
310 540984 : RelOptInfo *rel = root->simple_rel_array[rti];
311 : RangeTblEntry *rte;
312 :
313 : /* there may be empty slots corresponding to non-baserel RTEs */
314 540984 : if (rel == NULL)
315 127685 : continue;
316 :
317 : Assert(rel->relid == rti); /* sanity check on array */
318 :
319 : /* ignore RTEs that are "other rels" */
320 413299 : if (rel->reloptkind != RELOPT_BASEREL)
321 48600 : continue;
322 :
323 364699 : rte = root->simple_rte_array[rti];
324 :
325 : /*
326 : * If parallelism is allowable for this query in general, see whether
327 : * it's allowable for this rel in particular. We have to do this
328 : * before set_rel_size(), because (a) if this rel is an inheritance
329 : * parent, set_append_rel_size() will use and perhaps change the rel's
330 : * consider_parallel flag, and (b) for some RTE types, set_rel_size()
331 : * goes ahead and makes paths immediately.
332 : */
333 364699 : if (root->glob->parallelModeOK)
334 292890 : set_rel_consider_parallel(root, rel, rte);
335 :
336 364699 : set_rel_size(root, rel, rti, rte);
337 : }
338 253277 : }
339 :
340 : /*
341 : * setup_simple_grouped_rels
342 : * For each simple relation, build a grouped simple relation if eager
343 : * aggregation is possible and if this relation can produce grouped paths.
344 : */
345 : static void
346 253277 : setup_simple_grouped_rels(PlannerInfo *root)
347 : {
348 : Index rti;
349 :
350 : /*
351 : * If there are no aggregate expressions or grouping expressions, eager
352 : * aggregation is not possible.
353 : */
354 253277 : if (root->agg_clause_list == NIL ||
355 551 : root->group_expr_list == NIL)
356 252837 : return;
357 :
358 3761 : for (rti = 1; rti < root->simple_rel_array_size; rti++)
359 : {
360 3321 : RelOptInfo *rel = root->simple_rel_array[rti];
361 :
362 : /* there may be empty slots corresponding to non-baserel RTEs */
363 3321 : if (rel == NULL)
364 1071 : continue;
365 :
366 : Assert(rel->relid == rti); /* sanity check on array */
367 : Assert(IS_SIMPLE_REL(rel)); /* sanity check on rel */
368 :
369 2250 : (void) build_simple_grouped_rel(root, rel);
370 : }
371 : }
372 :
373 : /*
374 : * set_base_rel_pathlists
375 : * Finds all paths available for scanning each base-relation entry.
376 : * Sequential scan and any available indices are considered.
377 : * Each useful path is attached to its relation's 'pathlist' field.
378 : */
379 : static void
380 253277 : set_base_rel_pathlists(PlannerInfo *root)
381 : {
382 : Index rti;
383 :
384 794238 : for (rti = 1; rti < root->simple_rel_array_size; rti++)
385 : {
386 540961 : RelOptInfo *rel = root->simple_rel_array[rti];
387 :
388 : /* there may be empty slots corresponding to non-baserel RTEs */
389 540961 : if (rel == NULL)
390 127684 : continue;
391 :
392 : Assert(rel->relid == rti); /* sanity check on array */
393 :
394 : /* ignore RTEs that are "other rels" */
395 413277 : if (rel->reloptkind != RELOPT_BASEREL)
396 48600 : continue;
397 :
398 364677 : set_rel_pathlist(root, rel, rti, root->simple_rte_array[rti]);
399 : }
400 253277 : }
401 :
402 : /*
403 : * set_rel_size
404 : * Set size estimates for a base relation
405 : */
406 : static void
407 413027 : set_rel_size(PlannerInfo *root, RelOptInfo *rel,
408 : Index rti, RangeTblEntry *rte)
409 : {
410 777726 : if (rel->reloptkind == RELOPT_BASEREL &&
411 364699 : relation_excluded_by_constraints(root, rel, rte))
412 : {
413 : /*
414 : * We proved we don't need to scan the rel via constraint exclusion,
415 : * so set up a single dummy path for it. Here we only check this for
416 : * regular baserels; if it's an otherrel, CE was already checked in
417 : * set_append_rel_size().
418 : *
419 : * In this case, we go ahead and set up the relation's path right away
420 : * instead of leaving it for set_rel_pathlist to do. This is because
421 : * we don't have a convention for marking a rel as dummy except by
422 : * assigning a dummy path to it.
423 : */
424 631 : set_dummy_rel_pathlist(rel);
425 : }
426 412396 : else if (rte->inh)
427 : {
428 : /* It's an "append relation", process accordingly */
429 20787 : set_append_rel_size(root, rel, rti, rte);
430 : }
431 : else
432 : {
433 391609 : switch (rel->rtekind)
434 : {
435 323647 : case RTE_RELATION:
436 323647 : if (rte->relkind == RELKIND_FOREIGN_TABLE)
437 : {
438 : /* Foreign table */
439 1252 : set_foreign_size(root, rel, rte);
440 : }
441 322395 : else if (rte->relkind == RELKIND_PARTITIONED_TABLE)
442 : {
443 : /*
444 : * We could get here if asked to scan a partitioned table
445 : * with ONLY. In that case we shouldn't scan any of the
446 : * partitions, so mark it as a dummy rel.
447 : */
448 26 : set_dummy_rel_pathlist(rel);
449 : }
450 322369 : else if (rte->tablesample != NULL)
451 : {
452 : /* Sampled relation */
453 243 : set_tablesample_rel_size(root, rel, rte);
454 : }
455 : else
456 : {
457 : /* Plain relation */
458 322126 : set_plain_rel_size(root, rel, rte);
459 : }
460 323625 : break;
461 17357 : case RTE_SUBQUERY:
462 :
463 : /*
464 : * Subqueries don't support making a choice between
465 : * parameterized and unparameterized paths, so just go ahead
466 : * and build their paths immediately.
467 : */
468 17357 : set_subquery_pathlist(root, rel, rti, rte);
469 17357 : break;
470 35645 : case RTE_FUNCTION:
471 35645 : set_function_size_estimates(root, rel);
472 35645 : break;
473 519 : case RTE_TABLEFUNC:
474 519 : set_tablefunc_size_estimates(root, rel);
475 519 : break;
476 6793 : case RTE_VALUES:
477 6793 : set_values_size_estimates(root, rel);
478 6793 : break;
479 3620 : case RTE_CTE:
480 :
481 : /*
482 : * CTEs don't support making a choice between parameterized
483 : * and unparameterized paths, so just go ahead and build their
484 : * paths immediately.
485 : */
486 3620 : if (rte->self_reference)
487 692 : set_worktable_pathlist(root, rel, rte);
488 : else
489 2928 : set_cte_pathlist(root, rel, rte);
490 3620 : break;
491 433 : case RTE_NAMEDTUPLESTORE:
492 : /* Might as well just build the path immediately */
493 433 : set_namedtuplestore_pathlist(root, rel, rte);
494 433 : break;
495 3595 : case RTE_RESULT:
496 : /* Might as well just build the path immediately */
497 3595 : set_result_pathlist(root, rel, rte);
498 3595 : break;
499 0 : default:
500 0 : elog(ERROR, "unexpected rtekind: %d", (int) rel->rtekind);
501 : break;
502 : }
503 : }
504 :
505 : /*
506 : * We insist that all non-dummy rels have a nonzero rowcount estimate.
507 : */
508 : Assert(rel->rows > 0 || IS_DUMMY_REL(rel));
509 413004 : }
510 :
511 : /*
512 : * set_rel_pathlist
513 : * Build access paths for a base relation
514 : */
515 : static void
516 413129 : set_rel_pathlist(PlannerInfo *root, RelOptInfo *rel,
517 : Index rti, RangeTblEntry *rte)
518 : {
519 413129 : if (IS_DUMMY_REL(rel))
520 : {
521 : /* We already proved the relation empty, so nothing more to do */
522 : }
523 411986 : else if (rte->inh)
524 : {
525 : /* It's an "append relation", process accordingly */
526 20530 : set_append_rel_pathlist(root, rel, rti, rte);
527 : }
528 : else
529 : {
530 391456 : switch (rel->rtekind)
531 : {
532 323599 : case RTE_RELATION:
533 323599 : if (rte->relkind == RELKIND_FOREIGN_TABLE)
534 : {
535 : /* Foreign table */
536 1250 : set_foreign_pathlist(root, rel, rte);
537 : }
538 322349 : else if (rte->tablesample != NULL)
539 : {
540 : /* Sampled relation */
541 243 : set_tablesample_rel_pathlist(root, rel, rte);
542 : }
543 : else
544 : {
545 : /* Plain relation */
546 322106 : set_plain_rel_pathlist(root, rel, rte);
547 : }
548 323599 : break;
549 17252 : case RTE_SUBQUERY:
550 : /* Subquery --- fully handled during set_rel_size */
551 17252 : break;
552 35645 : case RTE_FUNCTION:
553 : /* RangeFunction */
554 35645 : set_function_pathlist(root, rel, rte);
555 35645 : break;
556 519 : case RTE_TABLEFUNC:
557 : /* Table Function */
558 519 : set_tablefunc_pathlist(root, rel, rte);
559 519 : break;
560 6793 : case RTE_VALUES:
561 : /* Values list */
562 6793 : set_values_pathlist(root, rel, rte);
563 6793 : break;
564 3620 : case RTE_CTE:
565 : /* CTE reference --- fully handled during set_rel_size */
566 3620 : break;
567 433 : case RTE_NAMEDTUPLESTORE:
568 : /* tuplestore reference --- fully handled during set_rel_size */
569 433 : break;
570 3595 : case RTE_RESULT:
571 : /* simple Result --- fully handled during set_rel_size */
572 3595 : break;
573 0 : default:
574 0 : elog(ERROR, "unexpected rtekind: %d", (int) rel->rtekind);
575 : break;
576 : }
577 : }
578 :
579 : /*
580 : * Allow a plugin to editorialize on the set of Paths for this base
581 : * relation. It could add new paths (such as CustomPaths) by calling
582 : * add_path(), or add_partial_path() if parallel aware. It could also
583 : * delete or modify paths added by the core code.
584 : */
585 413129 : if (set_rel_pathlist_hook)
586 0 : (*set_rel_pathlist_hook) (root, rel, rti, rte);
587 :
588 : /*
589 : * If this is a baserel, we should normally consider gathering any partial
590 : * paths we may have created for it. We have to do this after calling the
591 : * set_rel_pathlist_hook, else it cannot add partial paths to be included
592 : * here.
593 : *
594 : * However, if this is an inheritance child, skip it. Otherwise, we could
595 : * end up with a very large number of gather nodes, each trying to grab
596 : * its own pool of workers. Instead, we'll consider gathering partial
597 : * paths for the parent appendrel.
598 : *
599 : * Also, if this is the topmost scan/join rel, we postpone gathering until
600 : * the final scan/join targetlist is available (see grouping_planner).
601 : */
602 413129 : if (rel->reloptkind == RELOPT_BASEREL &&
603 364677 : !bms_equal(rel->relids, root->all_query_rels))
604 192325 : generate_useful_gather_paths(root, rel, false);
605 :
606 : /* Now find the cheapest of the paths for this rel */
607 413129 : set_cheapest(rel);
608 :
609 : /*
610 : * If a grouped relation for this rel exists, build partial aggregation
611 : * paths for it.
612 : *
613 : * Note that this can only happen after we've called set_cheapest() for
614 : * this base rel, because we need its cheapest paths.
615 : */
616 413129 : set_grouped_rel_pathlist(root, rel);
617 :
618 : #ifdef OPTIMIZER_DEBUG
619 : pprint(rel);
620 : #endif
621 413129 : }
622 :
623 : /*
624 : * set_plain_rel_size
625 : * Set size estimates for a plain relation (no subquery, no inheritance)
626 : */
627 : static void
628 322126 : set_plain_rel_size(PlannerInfo *root, RelOptInfo *rel, RangeTblEntry *rte)
629 : {
630 : /*
631 : * Test any partial indexes of rel for applicability. We must do this
632 : * first since partial unique indexes can affect size estimates.
633 : */
634 322126 : check_index_predicates(root, rel);
635 :
636 : /* Mark rel with estimated output rows, width, etc */
637 322126 : set_baserel_size_estimates(root, rel);
638 322106 : }
639 :
640 : /*
641 : * If this relation could possibly be scanned from within a worker, then set
642 : * its consider_parallel flag.
643 : */
644 : static void
645 329174 : set_rel_consider_parallel(PlannerInfo *root, RelOptInfo *rel,
646 : RangeTblEntry *rte)
647 : {
648 : /*
649 : * The flag has previously been initialized to false, so we can just
650 : * return if it becomes clear that we can't safely set it.
651 : */
652 : Assert(!rel->consider_parallel);
653 :
654 : /* Don't call this if parallelism is disallowed for the entire query. */
655 : Assert(root->glob->parallelModeOK);
656 :
657 : /* This should only be called for baserels and appendrel children. */
658 : Assert(IS_SIMPLE_REL(rel));
659 :
660 : /* Assorted checks based on rtekind. */
661 329174 : switch (rte->rtekind)
662 : {
663 283406 : case RTE_RELATION:
664 :
665 : /*
666 : * Currently, parallel workers can't access the leader's temporary
667 : * tables. We could possibly relax this if we wrote all of its
668 : * local buffers at the start of the query and made no changes
669 : * thereafter (maybe we could allow hint bit changes), and if we
670 : * taught the workers to read them. Writing a large number of
671 : * temporary buffers could be expensive, though, and we don't have
672 : * the rest of the necessary infrastructure right now anyway. So
673 : * for now, bail out if we see a temporary table.
674 : */
675 283406 : if (get_rel_persistence(rte->relid) == RELPERSISTENCE_TEMP)
676 7433 : return;
677 :
678 : /*
679 : * Table sampling can be pushed down to workers if the sample
680 : * function and its arguments are safe.
681 : */
682 275973 : if (rte->tablesample != NULL)
683 : {
684 263 : char proparallel = func_parallel(rte->tablesample->tsmhandler);
685 :
686 263 : if (proparallel != PROPARALLEL_SAFE)
687 18 : return;
688 245 : if (!is_parallel_safe(root, (Node *) rte->tablesample->args))
689 10 : return;
690 : }
691 :
692 : /*
693 : * Ask FDWs whether they can support performing a ForeignScan
694 : * within a worker. Most often, the answer will be no. For
695 : * example, if the nature of the FDW is such that it opens a TCP
696 : * connection with a remote server, each parallel worker would end
697 : * up with a separate connection, and these connections might not
698 : * be appropriately coordinated between workers and the leader.
699 : */
700 275945 : if (rte->relkind == RELKIND_FOREIGN_TABLE)
701 : {
702 : Assert(rel->fdwroutine);
703 797 : if (!rel->fdwroutine->IsForeignScanParallelSafe)
704 758 : return;
705 39 : if (!rel->fdwroutine->IsForeignScanParallelSafe(root, rel, rte))
706 0 : return;
707 : }
708 :
709 : /*
710 : * There are additional considerations for appendrels, which we'll
711 : * deal with in set_append_rel_size and set_append_rel_pathlist.
712 : * For now, just set consider_parallel based on the rel's own
713 : * quals and targetlist.
714 : */
715 275187 : break;
716 :
717 16306 : case RTE_SUBQUERY:
718 :
719 : /*
720 : * There's no intrinsic problem with scanning a subquery-in-FROM
721 : * (as distinct from a SubPlan or InitPlan) in a parallel worker.
722 : * If the subquery doesn't happen to have any parallel-safe paths,
723 : * then flagging it as consider_parallel won't change anything,
724 : * but that's true for plain tables, too. We must set
725 : * consider_parallel based on the rel's own quals and targetlist,
726 : * so that if a subquery path is parallel-safe but the quals and
727 : * projection we're sticking onto it are not, we correctly mark
728 : * the SubqueryScanPath as not parallel-safe. (Note that
729 : * set_subquery_pathlist() might push some of these quals down
730 : * into the subquery itself, but that doesn't change anything.)
731 : *
732 : * We can't push sub-select containing LIMIT/OFFSET to workers as
733 : * there is no guarantee that the row order will be fully
734 : * deterministic, and applying LIMIT/OFFSET will lead to
735 : * inconsistent results at the top-level. (In some cases, where
736 : * the result is ordered, we could relax this restriction. But it
737 : * doesn't currently seem worth expending extra effort to do so.)
738 : */
739 : {
740 16306 : Query *subquery = castNode(Query, rte->subquery);
741 :
742 16306 : if (limit_needed(subquery))
743 444 : return;
744 : }
745 15862 : break;
746 :
747 0 : case RTE_JOIN:
748 : /* Shouldn't happen; we're only considering baserels here. */
749 : Assert(false);
750 0 : return;
751 :
752 20137 : case RTE_FUNCTION:
753 : /* Check for parallel-restricted functions. */
754 20137 : if (!is_parallel_safe(root, (Node *) rte->functions))
755 8822 : return;
756 11315 : break;
757 :
758 519 : case RTE_TABLEFUNC:
759 : /* not parallel safe */
760 519 : return;
761 :
762 2381 : case RTE_VALUES:
763 : /* Check for parallel-restricted functions. */
764 2381 : if (!is_parallel_safe(root, (Node *) rte->values_lists))
765 10 : return;
766 2371 : break;
767 :
768 2759 : case RTE_CTE:
769 :
770 : /*
771 : * CTE tuplestores aren't shared among parallel workers, so we
772 : * force all CTE scans to happen in the leader. Also, populating
773 : * the CTE would require executing a subplan that's not available
774 : * in the worker, might be parallel-restricted, and must get
775 : * executed only once.
776 : */
777 2759 : return;
778 :
779 411 : case RTE_NAMEDTUPLESTORE:
780 :
781 : /*
782 : * tuplestore cannot be shared, at least without more
783 : * infrastructure to support that.
784 : */
785 411 : return;
786 :
787 3255 : case RTE_RESULT:
788 : /* RESULT RTEs, in themselves, are no problem. */
789 3255 : break;
790 :
791 0 : case RTE_GRAPH_TABLE:
792 :
793 : /*
794 : * Shouldn't happen since these are replaced by subquery RTEs when
795 : * rewriting queries.
796 : */
797 : Assert(false);
798 0 : return;
799 :
800 0 : case RTE_GROUP:
801 : /* Shouldn't happen; we're only considering baserels here. */
802 : Assert(false);
803 0 : return;
804 : }
805 :
806 : /*
807 : * If there's anything in baserestrictinfo that's parallel-restricted, we
808 : * give up on parallelizing access to this relation. We could consider
809 : * instead postponing application of the restricted quals until we're
810 : * above all the parallelism in the plan tree, but it's not clear that
811 : * that would be a win in very many cases, and it might be tricky to make
812 : * outer join clauses work correctly. It would likely break equivalence
813 : * classes, too.
814 : */
815 307990 : if (!is_parallel_safe(root, (Node *) rel->baserestrictinfo))
816 21830 : return;
817 :
818 : /*
819 : * Likewise, if the relation's outputs are not parallel-safe, give up.
820 : * (Usually, they're just Vars, but sometimes they're not.)
821 : */
822 286160 : if (!is_parallel_safe(root, (Node *) rel->reltarget->exprs))
823 15 : return;
824 :
825 : /* We have a winner. */
826 286145 : rel->consider_parallel = true;
827 : }
828 :
829 : /*
830 : * set_plain_rel_pathlist
831 : * Build access paths for a plain relation (no subquery, no inheritance)
832 : */
833 : static void
834 322106 : set_plain_rel_pathlist(PlannerInfo *root, RelOptInfo *rel, RangeTblEntry *rte)
835 : {
836 : Relids required_outer;
837 :
838 : /*
839 : * We don't support pushing join clauses into the quals of a seqscan, but
840 : * it could still have required parameterization due to LATERAL refs in
841 : * its tlist.
842 : */
843 322106 : required_outer = rel->lateral_relids;
844 :
845 : /*
846 : * Consider TID scans.
847 : *
848 : * If create_tidscan_paths returns true, then a TID scan path is forced.
849 : * This happens when rel->baserestrictinfo contains CurrentOfExpr, because
850 : * the executor can't handle any other type of path for such queries.
851 : * Hence, we return without adding any other paths.
852 : */
853 322106 : if (create_tidscan_paths(root, rel))
854 334 : return;
855 :
856 : /* Consider sequential scan */
857 321772 : add_path(rel, create_seqscan_path(root, rel, required_outer, 0));
858 :
859 : /* If appropriate, consider parallel sequential scan */
860 321772 : if (rel->consider_parallel && required_outer == NULL)
861 242601 : create_plain_partial_paths(root, rel);
862 :
863 : /* Consider index scans */
864 321772 : create_index_paths(root, rel);
865 : }
866 :
867 : /*
868 : * create_plain_partial_paths
869 : * Build partial access paths for parallel scan of a plain relation
870 : */
871 : static void
872 242601 : create_plain_partial_paths(PlannerInfo *root, RelOptInfo *rel)
873 : {
874 : int parallel_workers;
875 :
876 242601 : parallel_workers = compute_parallel_worker(rel, rel->pages, -1,
877 : max_parallel_workers_per_gather);
878 :
879 : /* If any limit was set to zero, the user doesn't want a parallel scan. */
880 242601 : if (parallel_workers <= 0)
881 218441 : return;
882 :
883 : /* Add an unordered partial path based on a parallel sequential scan. */
884 24160 : add_partial_path(rel, create_seqscan_path(root, rel, NULL, parallel_workers));
885 : }
886 :
887 : /*
888 : * set_tablesample_rel_size
889 : * Set size estimates for a sampled relation
890 : */
891 : static void
892 243 : set_tablesample_rel_size(PlannerInfo *root, RelOptInfo *rel, RangeTblEntry *rte)
893 : {
894 243 : TableSampleClause *tsc = rte->tablesample;
895 : TsmRoutine *tsm;
896 : BlockNumber pages;
897 : double tuples;
898 :
899 : /*
900 : * Test any partial indexes of rel for applicability. We must do this
901 : * first since partial unique indexes can affect size estimates.
902 : */
903 243 : check_index_predicates(root, rel);
904 :
905 : /*
906 : * Call the sampling method's estimation function to estimate the number
907 : * of pages it will read and the number of tuples it will return. (Note:
908 : * we assume the function returns sane values.)
909 : */
910 243 : tsm = GetTsmRoutine(tsc->tsmhandler);
911 243 : tsm->SampleScanGetSampleSize(root, rel, tsc->args,
912 : &pages, &tuples);
913 :
914 : /*
915 : * For the moment, because we will only consider a SampleScan path for the
916 : * rel, it's okay to just overwrite the pages and tuples estimates for the
917 : * whole relation. If we ever consider multiple path types for sampled
918 : * rels, we'll need more complication.
919 : */
920 243 : rel->pages = pages;
921 243 : rel->tuples = tuples;
922 :
923 : /* Mark rel with estimated output rows, width, etc */
924 243 : set_baserel_size_estimates(root, rel);
925 243 : }
926 :
927 : /*
928 : * set_tablesample_rel_pathlist
929 : * Build access paths for a sampled relation
930 : */
931 : static void
932 243 : set_tablesample_rel_pathlist(PlannerInfo *root, RelOptInfo *rel, RangeTblEntry *rte)
933 : {
934 : Relids required_outer;
935 : Path *path;
936 :
937 : /*
938 : * We don't support pushing join clauses into the quals of a samplescan,
939 : * but it could still have required parameterization due to LATERAL refs
940 : * in its tlist or TABLESAMPLE arguments.
941 : */
942 243 : required_outer = rel->lateral_relids;
943 :
944 : /* Consider sampled scan */
945 243 : path = create_samplescan_path(root, rel, required_outer);
946 :
947 : /*
948 : * If the sampling method does not support repeatable scans, we must avoid
949 : * plans that would scan the rel multiple times. Ideally, we'd simply
950 : * avoid putting the rel on the inside of a nestloop join; but adding such
951 : * a consideration to the planner seems like a great deal of complication
952 : * to support an uncommon usage of second-rate sampling methods. Instead,
953 : * if there is a risk that the query might perform an unsafe join, just
954 : * wrap the SampleScan in a Materialize node. We can check for joins by
955 : * counting the membership of all_query_rels (note that this correctly
956 : * counts inheritance trees as single rels). If we're inside a subquery,
957 : * we can't easily check whether a join might occur in the outer query, so
958 : * just assume one is possible.
959 : *
960 : * GetTsmRoutine is relatively expensive compared to the other tests here,
961 : * so check repeatable_across_scans last, even though that's a bit odd.
962 : */
963 469 : if ((root->query_level > 1 ||
964 226 : bms_membership(root->all_query_rels) != BMS_SINGLETON) &&
965 77 : !(GetTsmRoutine(rte->tablesample->tsmhandler)->repeatable_across_scans))
966 : {
967 4 : path = (Path *) create_material_path(rel, path, true);
968 : }
969 :
970 243 : add_path(rel, path);
971 :
972 : /* For the moment, at least, there are no other paths to consider */
973 243 : }
974 :
975 : /*
976 : * set_foreign_size
977 : * Set size estimates for a foreign table RTE
978 : */
979 : static void
980 1252 : set_foreign_size(PlannerInfo *root, RelOptInfo *rel, RangeTblEntry *rte)
981 : {
982 : /* Mark rel with estimated output rows, width, etc */
983 1252 : set_foreign_size_estimates(root, rel);
984 :
985 : /* Let FDW adjust the size estimates, if it can */
986 1252 : rel->fdwroutine->GetForeignRelSize(root, rel, rte->relid);
987 :
988 : /* ... but do not let it set the rows estimate to zero */
989 1250 : rel->rows = clamp_row_est(rel->rows);
990 :
991 : /*
992 : * Also, make sure rel->tuples is not insane relative to rel->rows.
993 : * Notably, this ensures sanity if pg_class.reltuples contains -1 and the
994 : * FDW doesn't do anything to replace that.
995 : */
996 1250 : rel->tuples = Max(rel->tuples, rel->rows);
997 1250 : }
998 :
999 : /*
1000 : * set_foreign_pathlist
1001 : * Build access paths for a foreign table RTE
1002 : */
1003 : static void
1004 1250 : set_foreign_pathlist(PlannerInfo *root, RelOptInfo *rel, RangeTblEntry *rte)
1005 : {
1006 : /* Call the FDW's GetForeignPaths function to generate path(s) */
1007 1250 : rel->fdwroutine->GetForeignPaths(root, rel, rte->relid);
1008 1250 : }
1009 :
1010 : /*
1011 : * set_append_rel_size
1012 : * Set size estimates for a simple "append relation"
1013 : *
1014 : * The passed-in rel and RTE represent the entire append relation. The
1015 : * relation's contents are computed by appending together the output of the
1016 : * individual member relations. Note that in the non-partitioned inheritance
1017 : * case, the first member relation is actually the same table as is mentioned
1018 : * in the parent RTE ... but it has a different RTE and RelOptInfo. This is
1019 : * a good thing because their outputs are not the same size.
1020 : */
1021 : static void
1022 20787 : set_append_rel_size(PlannerInfo *root, RelOptInfo *rel,
1023 : Index rti, RangeTblEntry *rte)
1024 : {
1025 20787 : int parentRTindex = rti;
1026 : bool has_live_children;
1027 : double parent_tuples;
1028 : double parent_rows;
1029 : double parent_size;
1030 : double *parent_attrsizes;
1031 : int nattrs;
1032 : ListCell *l;
1033 :
1034 : /* Guard against stack overflow due to overly deep inheritance tree. */
1035 20787 : check_stack_depth();
1036 :
1037 : Assert(IS_SIMPLE_REL(rel));
1038 :
1039 : /*
1040 : * If this is a partitioned baserel, set the consider_partitionwise_join
1041 : * flag; currently, we only consider partitionwise joins with the baserel
1042 : * if its targetlist doesn't contain a whole-row Var.
1043 : */
1044 20787 : if (enable_partitionwise_join &&
1045 4159 : rel->reloptkind == RELOPT_BASEREL &&
1046 3309 : rte->relkind == RELKIND_PARTITIONED_TABLE &&
1047 3309 : bms_is_empty(rel->attr_needed[InvalidAttrNumber - rel->min_attr]))
1048 3251 : rel->consider_partitionwise_join = true;
1049 :
1050 : /*
1051 : * Initialize to compute size estimates for whole append relation.
1052 : *
1053 : * We handle tuples estimates by setting "tuples" to the total number of
1054 : * tuples accumulated from each live child, rather than using "rows".
1055 : * Although an appendrel itself doesn't directly enforce any quals, its
1056 : * child relations may. Therefore, setting "tuples" equal to "rows" for
1057 : * an appendrel isn't always appropriate, and can lead to inaccurate cost
1058 : * estimates. For example, when estimating the number of distinct values
1059 : * from an appendrel, we would be unable to adjust the estimate based on
1060 : * the restriction selectivity (see estimate_num_groups).
1061 : *
1062 : * We handle width estimates by weighting the widths of different child
1063 : * rels proportionally to their number of rows. This is sensible because
1064 : * the use of width estimates is mainly to compute the total relation
1065 : * "footprint" if we have to sort or hash it. To do this, we sum the
1066 : * total equivalent size (in "double" arithmetic) and then divide by the
1067 : * total rowcount estimate. This is done separately for the total rel
1068 : * width and each attribute.
1069 : *
1070 : * Note: if you consider changing this logic, beware that child rels could
1071 : * have zero rows and/or width, if they were excluded by constraints.
1072 : */
1073 20787 : has_live_children = false;
1074 20787 : parent_tuples = 0;
1075 20787 : parent_rows = 0;
1076 20787 : parent_size = 0;
1077 20787 : nattrs = rel->max_attr - rel->min_attr + 1;
1078 20787 : parent_attrsizes = (double *) palloc0(nattrs * sizeof(double));
1079 :
1080 112735 : foreach(l, root->append_rel_list)
1081 : {
1082 91949 : AppendRelInfo *appinfo = (AppendRelInfo *) lfirst(l);
1083 : int childRTindex;
1084 : RangeTblEntry *childRTE;
1085 : RelOptInfo *childrel;
1086 : List *childrinfos;
1087 : ListCell *parentvars;
1088 : ListCell *childvars;
1089 : ListCell *lc;
1090 :
1091 : /* append_rel_list contains all append rels; ignore others */
1092 91949 : if (appinfo->parent_relid != parentRTindex)
1093 43756 : continue;
1094 :
1095 48508 : childRTindex = appinfo->child_relid;
1096 48508 : childRTE = root->simple_rte_array[childRTindex];
1097 :
1098 : /*
1099 : * The child rel's RelOptInfo was already created during
1100 : * add_other_rels_to_query.
1101 : */
1102 48508 : childrel = find_base_rel(root, childRTindex);
1103 : Assert(childrel->reloptkind == RELOPT_OTHER_MEMBER_REL);
1104 :
1105 : /* We may have already proven the child to be dummy. */
1106 48508 : if (IS_DUMMY_REL(childrel))
1107 20 : continue;
1108 :
1109 : /*
1110 : * We have to copy the parent's targetlist and quals to the child,
1111 : * with appropriate substitution of variables. However, the
1112 : * baserestrictinfo quals were already copied/substituted when the
1113 : * child RelOptInfo was built. So we don't need any additional setup
1114 : * before applying constraint exclusion.
1115 : */
1116 48488 : if (relation_excluded_by_constraints(root, childrel, childRTE))
1117 : {
1118 : /*
1119 : * This child need not be scanned, so we can omit it from the
1120 : * appendrel.
1121 : */
1122 160 : set_dummy_rel_pathlist(childrel);
1123 160 : continue;
1124 : }
1125 :
1126 : /*
1127 : * Constraint exclusion failed, so copy the parent's join quals and
1128 : * targetlist to the child, with appropriate variable substitutions.
1129 : *
1130 : * We skip join quals that came from above outer joins that can null
1131 : * this rel, since they would be of no value while generating paths
1132 : * for the child. This saves some effort while processing the child
1133 : * rel, and it also avoids an implementation restriction in
1134 : * adjust_appendrel_attrs (it can't apply nullingrels to a non-Var).
1135 : */
1136 48328 : childrinfos = NIL;
1137 59430 : foreach(lc, rel->joininfo)
1138 : {
1139 11102 : RestrictInfo *rinfo = (RestrictInfo *) lfirst(lc);
1140 :
1141 11102 : if (!bms_overlap(rinfo->clause_relids, rel->nulling_relids))
1142 9167 : childrinfos = lappend(childrinfos,
1143 9167 : adjust_appendrel_attrs(root,
1144 : (Node *) rinfo,
1145 : 1, &appinfo));
1146 : }
1147 48328 : childrel->joininfo = childrinfos;
1148 :
1149 : /*
1150 : * Now for the child's targetlist.
1151 : *
1152 : * NB: the resulting childrel->reltarget->exprs may contain arbitrary
1153 : * expressions, which otherwise would not occur in a rel's targetlist.
1154 : * Code that might be looking at an appendrel child must cope with
1155 : * such. (Normally, a rel's targetlist would only include Vars and
1156 : * PlaceHolderVars.) XXX we do not bother to update the cost or width
1157 : * fields of childrel->reltarget; not clear if that would be useful.
1158 : */
1159 96656 : childrel->reltarget->exprs = (List *)
1160 48328 : adjust_appendrel_attrs(root,
1161 48328 : (Node *) rel->reltarget->exprs,
1162 : 1, &appinfo);
1163 :
1164 : /*
1165 : * We have to make child entries in the EquivalenceClass data
1166 : * structures as well. This is needed either if the parent
1167 : * participates in some eclass joins (because we will want to consider
1168 : * inner-indexscan joins on the individual children) or if the parent
1169 : * has useful pathkeys (because we should try to build MergeAppend
1170 : * paths that produce those sort orderings).
1171 : */
1172 48328 : if (rel->has_eclass_joins || has_useful_pathkeys(root, rel))
1173 29962 : add_child_rel_equivalences(root, appinfo, rel, childrel);
1174 48328 : childrel->has_eclass_joins = rel->has_eclass_joins;
1175 :
1176 : /*
1177 : * Note: we could compute appropriate attr_needed data for the child's
1178 : * variables, by transforming the parent's attr_needed through the
1179 : * translated_vars mapping. However, currently there's no need
1180 : * because attr_needed is only examined for base relations not
1181 : * otherrels. So we just leave the child's attr_needed empty.
1182 : */
1183 :
1184 : /*
1185 : * If we consider partitionwise joins with the parent rel, do the same
1186 : * for partitioned child rels.
1187 : *
1188 : * Note: here we abuse the consider_partitionwise_join flag by setting
1189 : * it for child rels that are not themselves partitioned. We do so to
1190 : * tell try_partitionwise_join() that the child rel is sufficiently
1191 : * valid to be used as a per-partition input, even if it later gets
1192 : * proven to be dummy. (It's not usable until we've set up the
1193 : * reltarget and EC entries, which we just did.)
1194 : */
1195 48328 : if (rel->consider_partitionwise_join)
1196 11007 : childrel->consider_partitionwise_join = true;
1197 :
1198 : /*
1199 : * If parallelism is allowable for this query in general, see whether
1200 : * it's allowable for this childrel in particular. But if we've
1201 : * already decided the appendrel is not parallel-safe as a whole,
1202 : * there's no point in considering parallelism for this child. For
1203 : * consistency, do this before calling set_rel_size() for the child.
1204 : */
1205 48328 : if (root->glob->parallelModeOK && rel->consider_parallel)
1206 36284 : set_rel_consider_parallel(root, childrel, childRTE);
1207 :
1208 : /*
1209 : * Compute the child's size.
1210 : */
1211 48328 : set_rel_size(root, childrel, childRTindex, childRTE);
1212 :
1213 : /*
1214 : * It is possible that constraint exclusion detected a contradiction
1215 : * within a child subquery, even though we didn't prove one above. If
1216 : * so, we can skip this child.
1217 : */
1218 48327 : if (IS_DUMMY_REL(childrel))
1219 135 : continue;
1220 :
1221 : /* We have at least one live child. */
1222 48192 : has_live_children = true;
1223 :
1224 : /*
1225 : * If any live child is not parallel-safe, treat the whole appendrel
1226 : * as not parallel-safe. In future we might be able to generate plans
1227 : * in which some children are farmed out to workers while others are
1228 : * not; but we don't have that today, so it's a waste to consider
1229 : * partial paths anywhere in the appendrel unless it's all safe.
1230 : * (Child rels visited before this one will be unmarked in
1231 : * set_append_rel_pathlist().)
1232 : */
1233 48192 : if (!childrel->consider_parallel)
1234 12426 : rel->consider_parallel = false;
1235 :
1236 : /*
1237 : * Accumulate size information from each live child.
1238 : */
1239 : Assert(childrel->rows > 0);
1240 :
1241 48192 : parent_tuples += childrel->tuples;
1242 48192 : parent_rows += childrel->rows;
1243 48192 : parent_size += childrel->reltarget->width * childrel->rows;
1244 :
1245 : /*
1246 : * Accumulate per-column estimates too. We need not do anything for
1247 : * PlaceHolderVars in the parent list. If child expression isn't a
1248 : * Var, or we didn't record a width estimate for it, we have to fall
1249 : * back on a datatype-based estimate.
1250 : *
1251 : * By construction, child's targetlist is 1-to-1 with parent's.
1252 : */
1253 157519 : forboth(parentvars, rel->reltarget->exprs,
1254 : childvars, childrel->reltarget->exprs)
1255 : {
1256 109327 : Var *parentvar = (Var *) lfirst(parentvars);
1257 109327 : Node *childvar = (Node *) lfirst(childvars);
1258 :
1259 109327 : if (IsA(parentvar, Var) && parentvar->varno == parentRTindex)
1260 : {
1261 98953 : int pndx = parentvar->varattno - rel->min_attr;
1262 98953 : int32 child_width = 0;
1263 :
1264 98953 : if (IsA(childvar, Var) &&
1265 94744 : ((Var *) childvar)->varno == childrel->relid)
1266 : {
1267 94669 : int cndx = ((Var *) childvar)->varattno - childrel->min_attr;
1268 :
1269 94669 : child_width = childrel->attr_widths[cndx];
1270 : }
1271 98953 : if (child_width <= 0)
1272 4284 : child_width = get_typavgwidth(exprType(childvar),
1273 : exprTypmod(childvar));
1274 : Assert(child_width > 0);
1275 98953 : parent_attrsizes[pndx] += child_width * childrel->rows;
1276 : }
1277 : }
1278 : }
1279 :
1280 20786 : if (has_live_children)
1281 : {
1282 : /*
1283 : * Save the finished size estimates.
1284 : */
1285 : int i;
1286 :
1287 : Assert(parent_rows > 0);
1288 20530 : rel->tuples = parent_tuples;
1289 20530 : rel->rows = parent_rows;
1290 20530 : rel->reltarget->width = rint(parent_size / parent_rows);
1291 189086 : for (i = 0; i < nattrs; i++)
1292 168556 : rel->attr_widths[i] = rint(parent_attrsizes[i] / parent_rows);
1293 :
1294 : /*
1295 : * Note that we leave rel->pages as zero; this is important to avoid
1296 : * double-counting the appendrel tree in total_table_pages.
1297 : */
1298 : }
1299 : else
1300 : {
1301 : /*
1302 : * All children were excluded by constraints, so mark the whole
1303 : * appendrel dummy. We must do this in this phase so that the rel's
1304 : * dummy-ness is visible when we generate paths for other rels.
1305 : */
1306 256 : set_dummy_rel_pathlist(rel);
1307 : }
1308 :
1309 20786 : pfree(parent_attrsizes);
1310 20786 : }
1311 :
1312 : /*
1313 : * set_append_rel_pathlist
1314 : * Build access paths for an "append relation"
1315 : */
1316 : static void
1317 20530 : set_append_rel_pathlist(PlannerInfo *root, RelOptInfo *rel,
1318 : Index rti, RangeTblEntry *rte)
1319 : {
1320 20530 : int parentRTindex = rti;
1321 20530 : List *live_childrels = NIL;
1322 : ListCell *l;
1323 :
1324 : /*
1325 : * Generate access paths for each member relation, and remember the
1326 : * non-dummy children.
1327 : */
1328 112073 : foreach(l, root->append_rel_list)
1329 : {
1330 91543 : AppendRelInfo *appinfo = (AppendRelInfo *) lfirst(l);
1331 : int childRTindex;
1332 : RangeTblEntry *childRTE;
1333 : RelOptInfo *childrel;
1334 :
1335 : /* append_rel_list contains all append rels; ignore others */
1336 91543 : if (appinfo->parent_relid != parentRTindex)
1337 43091 : continue;
1338 :
1339 : /* Re-locate the child RTE and RelOptInfo */
1340 48452 : childRTindex = appinfo->child_relid;
1341 48452 : childRTE = root->simple_rte_array[childRTindex];
1342 48452 : childrel = root->simple_rel_array[childRTindex];
1343 :
1344 : /*
1345 : * If set_append_rel_size() decided the parent appendrel was
1346 : * parallel-unsafe at some point after visiting this child rel, we
1347 : * need to propagate the unsafety marking down to the child, so that
1348 : * we don't generate useless partial paths for it.
1349 : */
1350 48452 : if (!rel->consider_parallel)
1351 12595 : childrel->consider_parallel = false;
1352 :
1353 : /*
1354 : * Compute the child's access paths.
1355 : */
1356 48452 : set_rel_pathlist(root, childrel, childRTindex, childRTE);
1357 :
1358 : /*
1359 : * If child is dummy, ignore it.
1360 : */
1361 48452 : if (IS_DUMMY_REL(childrel))
1362 260 : continue;
1363 :
1364 : /*
1365 : * Child is live, so add it to the live_childrels list for use below.
1366 : */
1367 48192 : live_childrels = lappend(live_childrels, childrel);
1368 : }
1369 :
1370 : /* Add paths to the append relation. */
1371 20530 : add_paths_to_append_rel(root, rel, live_childrels);
1372 20530 : }
1373 :
1374 : /*
1375 : * set_grouped_rel_pathlist
1376 : * If a grouped relation for the given 'rel' exists, build partial
1377 : * aggregation paths for it.
1378 : */
1379 : static void
1380 413129 : set_grouped_rel_pathlist(PlannerInfo *root, RelOptInfo *rel)
1381 : {
1382 : RelOptInfo *grouped_rel;
1383 :
1384 : /*
1385 : * If there are no aggregate expressions or grouping expressions, eager
1386 : * aggregation is not possible.
1387 : */
1388 413129 : if (root->agg_clause_list == NIL ||
1389 2774 : root->group_expr_list == NIL)
1390 410879 : return;
1391 :
1392 : /* Add paths to the grouped base relation if one exists. */
1393 2250 : grouped_rel = rel->grouped_rel;
1394 2250 : if (grouped_rel)
1395 : {
1396 : Assert(IS_GROUPED_REL(grouped_rel));
1397 :
1398 467 : generate_grouped_paths(root, grouped_rel, rel);
1399 467 : set_cheapest(grouped_rel);
1400 : }
1401 : }
1402 :
1403 :
1404 : /*
1405 : * add_paths_to_append_rel
1406 : * Generate paths for the given append relation given the set of non-dummy
1407 : * child rels.
1408 : *
1409 : * The function collects all parameterizations and orderings supported by the
1410 : * non-dummy children. For every such parameterization or ordering, it creates
1411 : * an append path collecting one path from each non-dummy child with given
1412 : * parameterization or ordering. Similarly it collects partial paths from
1413 : * non-dummy children to create partial append paths.
1414 : */
1415 : void
1416 37364 : add_paths_to_append_rel(PlannerInfo *root, RelOptInfo *rel,
1417 : List *live_childrels)
1418 : {
1419 37364 : AppendPathInput unparameterized = {0};
1420 37364 : AppendPathInput startup = {0};
1421 37364 : AppendPathInput partial_only = {0};
1422 37364 : AppendPathInput parallel_append = {0};
1423 37364 : bool unparameterized_valid = true;
1424 37364 : bool startup_valid = true;
1425 37364 : bool partial_only_valid = true;
1426 37364 : bool parallel_append_valid = true;
1427 37364 : List *all_child_pathkeys = NIL;
1428 37364 : List *all_child_outers = NIL;
1429 : ListCell *l;
1430 37364 : double partial_rows = -1;
1431 :
1432 : /* If appropriate, consider parallel append */
1433 37364 : parallel_append_valid = enable_parallel_append && rel->consider_parallel;
1434 :
1435 : /*
1436 : * For every non-dummy child, remember the cheapest path. Also, identify
1437 : * all pathkeys (orderings) and parameterizations (required_outer sets)
1438 : * available for the non-dummy member relations.
1439 : */
1440 123118 : foreach(l, live_childrels)
1441 : {
1442 85754 : RelOptInfo *childrel = lfirst(l);
1443 : ListCell *lcp;
1444 85754 : Path *cheapest_partial_path = NULL;
1445 :
1446 : /*
1447 : * If child has an unparameterized cheapest-total path, add that to
1448 : * the unparameterized Append path we are constructing for the parent.
1449 : * If not, there's no workable unparameterized path.
1450 : *
1451 : * With partitionwise aggregates, the child rel's pathlist may be
1452 : * empty, so don't assume that a path exists here.
1453 : */
1454 85754 : if (childrel->pathlist != NIL &&
1455 85754 : childrel->cheapest_total_path->param_info == NULL)
1456 85124 : accumulate_append_subpath(childrel->cheapest_total_path,
1457 : &unparameterized.subpaths, NULL, &unparameterized.child_append_relid_sets);
1458 : else
1459 630 : unparameterized_valid = false;
1460 :
1461 : /*
1462 : * When the planner is considering cheap startup plans, we'll also
1463 : * collect all the cheapest_startup_paths (if set) and build an
1464 : * AppendPath containing those as subpaths.
1465 : */
1466 85754 : if (rel->consider_startup && childrel->cheapest_startup_path != NULL)
1467 1425 : {
1468 : Path *cheapest_path;
1469 :
1470 : /*
1471 : * With an indication of how many tuples the query should provide,
1472 : * the optimizer tries to choose the path optimal for that
1473 : * specific number of tuples.
1474 : */
1475 1425 : if (root->tuple_fraction > 0.0)
1476 : cheapest_path =
1477 1425 : get_cheapest_fractional_path(childrel,
1478 : root->tuple_fraction);
1479 : else
1480 0 : cheapest_path = childrel->cheapest_startup_path;
1481 :
1482 : /* cheapest_startup_path must not be a parameterized path. */
1483 : Assert(cheapest_path->param_info == NULL);
1484 1425 : accumulate_append_subpath(cheapest_path,
1485 : &startup.subpaths,
1486 : NULL,
1487 : &startup.child_append_relid_sets);
1488 : }
1489 : else
1490 84329 : startup_valid = false;
1491 :
1492 :
1493 : /* Same idea, but for a partial plan. */
1494 85754 : if (childrel->partial_pathlist != NIL)
1495 : {
1496 53874 : cheapest_partial_path = linitial(childrel->partial_pathlist);
1497 53874 : accumulate_append_subpath(cheapest_partial_path,
1498 : &partial_only.partial_subpaths, NULL,
1499 : &partial_only.child_append_relid_sets);
1500 : }
1501 : else
1502 31880 : partial_only_valid = false;
1503 :
1504 : /*
1505 : * Same idea, but for a parallel append mixing partial and non-partial
1506 : * paths.
1507 : */
1508 85754 : if (parallel_append_valid)
1509 : {
1510 65339 : Path *nppath = NULL;
1511 :
1512 : nppath =
1513 65339 : get_cheapest_parallel_safe_total_inner(childrel->pathlist);
1514 :
1515 65339 : if (cheapest_partial_path == NULL && nppath == NULL)
1516 : {
1517 : /* Neither a partial nor a parallel-safe path? Forget it. */
1518 413 : parallel_append_valid = false;
1519 : }
1520 64926 : else if (nppath == NULL ||
1521 53499 : (cheapest_partial_path != NULL &&
1522 53499 : cheapest_partial_path->total_cost < nppath->total_cost))
1523 : {
1524 : /* Partial path is cheaper or the only option. */
1525 : Assert(cheapest_partial_path != NULL);
1526 53302 : accumulate_append_subpath(cheapest_partial_path,
1527 : ¶llel_append.partial_subpaths,
1528 : ¶llel_append.subpaths,
1529 : ¶llel_append.child_append_relid_sets);
1530 : }
1531 : else
1532 : {
1533 : /*
1534 : * Either we've got only a non-partial path, or we think that
1535 : * a single backend can execute the best non-partial path
1536 : * faster than all the parallel backends working together can
1537 : * execute the best partial path.
1538 : *
1539 : * It might make sense to be more aggressive here. Even if
1540 : * the best non-partial path is more expensive than the best
1541 : * partial path, it could still be better to choose the
1542 : * non-partial path if there are several such paths that can
1543 : * be given to different workers. For now, we don't try to
1544 : * figure that out.
1545 : */
1546 11624 : accumulate_append_subpath(nppath,
1547 : ¶llel_append.subpaths,
1548 : NULL,
1549 : ¶llel_append.child_append_relid_sets);
1550 : }
1551 : }
1552 :
1553 : /*
1554 : * Collect lists of all the available path orderings and
1555 : * parameterizations for all the children. We use these as a
1556 : * heuristic to indicate which sort orderings and parameterizations we
1557 : * should build Append and MergeAppend paths for.
1558 : */
1559 199892 : foreach(lcp, childrel->pathlist)
1560 : {
1561 114138 : Path *childpath = (Path *) lfirst(lcp);
1562 114138 : List *childkeys = childpath->pathkeys;
1563 114138 : Relids childouter = PATH_REQ_OUTER(childpath);
1564 :
1565 : /* Unsorted paths don't contribute to pathkey list */
1566 114138 : if (childkeys != NIL)
1567 : {
1568 : ListCell *lpk;
1569 28680 : bool found = false;
1570 :
1571 : /* Have we already seen this ordering? */
1572 28833 : foreach(lpk, all_child_pathkeys)
1573 : {
1574 19540 : List *existing_pathkeys = (List *) lfirst(lpk);
1575 :
1576 19540 : if (compare_pathkeys(existing_pathkeys,
1577 : childkeys) == PATHKEYS_EQUAL)
1578 : {
1579 19387 : found = true;
1580 19387 : break;
1581 : }
1582 : }
1583 28680 : if (!found)
1584 : {
1585 : /* No, so add it to all_child_pathkeys */
1586 9293 : all_child_pathkeys = lappend(all_child_pathkeys,
1587 : childkeys);
1588 : }
1589 : }
1590 :
1591 : /* Unparameterized paths don't contribute to param-set list */
1592 114138 : if (childouter)
1593 : {
1594 : ListCell *lco;
1595 5693 : bool found = false;
1596 :
1597 : /* Have we already seen this param set? */
1598 6341 : foreach(lco, all_child_outers)
1599 : {
1600 4149 : Relids existing_outers = (Relids) lfirst(lco);
1601 :
1602 4149 : if (bms_equal(existing_outers, childouter))
1603 : {
1604 3501 : found = true;
1605 3501 : break;
1606 : }
1607 : }
1608 5693 : if (!found)
1609 : {
1610 : /* No, so add it to all_child_outers */
1611 2192 : all_child_outers = lappend(all_child_outers,
1612 : childouter);
1613 : }
1614 : }
1615 : }
1616 : }
1617 :
1618 : /*
1619 : * If we found unparameterized paths for all children, build an unordered,
1620 : * unparameterized Append path for the rel. (Note: this is correct even
1621 : * if we have zero or one live subpath due to constraint exclusion.)
1622 : */
1623 37364 : if (unparameterized_valid)
1624 37094 : add_path(rel, (Path *) create_append_path(root, rel, unparameterized,
1625 : NIL, NULL, 0, false,
1626 : -1));
1627 :
1628 : /* build an AppendPath for the cheap startup paths, if valid */
1629 37364 : if (startup_valid)
1630 575 : add_path(rel, (Path *) create_append_path(root, rel, startup,
1631 : NIL, NULL, 0, false, -1));
1632 :
1633 : /*
1634 : * Consider an append of unordered, unparameterized partial paths. Make
1635 : * it parallel-aware if possible.
1636 : */
1637 37364 : if (partial_only_valid && partial_only.partial_subpaths != NIL)
1638 : {
1639 : AppendPath *appendpath;
1640 : ListCell *lc;
1641 21953 : int parallel_workers = 0;
1642 :
1643 : /* Find the highest number of workers requested for any subpath. */
1644 79485 : foreach(lc, partial_only.partial_subpaths)
1645 : {
1646 57532 : Path *path = lfirst(lc);
1647 :
1648 57532 : parallel_workers = Max(parallel_workers, path->parallel_workers);
1649 : }
1650 : Assert(parallel_workers > 0);
1651 :
1652 : /*
1653 : * If the use of parallel append is permitted, always request at least
1654 : * log2(# of children) workers. We assume it can be useful to have
1655 : * extra workers in this case because they will be spread out across
1656 : * the children. The precise formula is just a guess, but we don't
1657 : * want to end up with a radically different answer for a table with N
1658 : * partitions vs. an unpartitioned table with the same data, so the
1659 : * use of some kind of log-scaling here seems to make some sense.
1660 : */
1661 21953 : if (enable_parallel_append)
1662 : {
1663 21913 : parallel_workers = Max(parallel_workers,
1664 : pg_leftmost_one_pos32(list_length(live_childrels)) + 1);
1665 21913 : parallel_workers = Min(parallel_workers,
1666 : max_parallel_workers_per_gather);
1667 : }
1668 : Assert(parallel_workers > 0);
1669 :
1670 : /* Generate a partial append path. */
1671 21953 : appendpath = create_append_path(root, rel, partial_only,
1672 : NIL, NULL, parallel_workers,
1673 : enable_parallel_append,
1674 : -1);
1675 :
1676 : /*
1677 : * Make sure any subsequent partial paths use the same row count
1678 : * estimate.
1679 : */
1680 21953 : partial_rows = appendpath->path.rows;
1681 :
1682 : /* Add the path. */
1683 21953 : add_partial_path(rel, (Path *) appendpath);
1684 : }
1685 :
1686 : /*
1687 : * Consider a parallel-aware append using a mix of partial and non-partial
1688 : * paths. (This only makes sense if there's at least one child which has
1689 : * a non-partial path that is substantially cheaper than any partial path;
1690 : * otherwise, we should use the append path added in the previous step.)
1691 : */
1692 37364 : if (parallel_append_valid && parallel_append.subpaths != NIL)
1693 : {
1694 : AppendPath *appendpath;
1695 : ListCell *lc;
1696 4257 : int parallel_workers = 0;
1697 :
1698 : /*
1699 : * Find the highest number of workers requested for any partial
1700 : * subpath.
1701 : */
1702 5002 : foreach(lc, parallel_append.partial_subpaths)
1703 : {
1704 745 : Path *path = lfirst(lc);
1705 :
1706 745 : parallel_workers = Max(parallel_workers, path->parallel_workers);
1707 : }
1708 :
1709 : /*
1710 : * Same formula here as above. It's even more important in this
1711 : * instance because the non-partial paths won't contribute anything to
1712 : * the planned number of parallel workers.
1713 : */
1714 4257 : parallel_workers = Max(parallel_workers,
1715 : pg_leftmost_one_pos32(list_length(live_childrels)) + 1);
1716 4257 : parallel_workers = Min(parallel_workers,
1717 : max_parallel_workers_per_gather);
1718 : Assert(parallel_workers > 0);
1719 :
1720 4257 : appendpath = create_append_path(root, rel, parallel_append,
1721 : NIL, NULL, parallel_workers, true,
1722 : partial_rows);
1723 4257 : add_partial_path(rel, (Path *) appendpath);
1724 : }
1725 :
1726 : /*
1727 : * Also build unparameterized ordered append paths based on the collected
1728 : * list of child pathkeys.
1729 : */
1730 37364 : if (unparameterized_valid)
1731 37094 : generate_orderedappend_paths(root, rel, live_childrels,
1732 : all_child_pathkeys);
1733 :
1734 : /*
1735 : * Build Append paths for each parameterization seen among the child rels.
1736 : * (This may look pretty expensive, but in most cases of practical
1737 : * interest, the child rels will expose mostly the same parameterizations,
1738 : * so that not that many cases actually get considered here.)
1739 : *
1740 : * The Append node itself cannot enforce quals, so all qual checking must
1741 : * be done in the child paths. This means that to have a parameterized
1742 : * Append path, we must have the exact same parameterization for each
1743 : * child path; otherwise some children might be failing to check the
1744 : * moved-down quals. To make them match up, we can try to increase the
1745 : * parameterization of lesser-parameterized paths.
1746 : */
1747 39556 : foreach(l, all_child_outers)
1748 : {
1749 2192 : Relids required_outer = (Relids) lfirst(l);
1750 : ListCell *lcr;
1751 2192 : AppendPathInput parameterized = {0};
1752 2192 : bool parameterized_valid = true;
1753 :
1754 : /* Select the child paths for an Append with this parameterization */
1755 7984 : foreach(lcr, live_childrels)
1756 : {
1757 5802 : RelOptInfo *childrel = (RelOptInfo *) lfirst(lcr);
1758 : Path *subpath;
1759 :
1760 5802 : if (childrel->pathlist == NIL)
1761 : {
1762 : /* failed to make a suitable path for this child */
1763 0 : parameterized_valid = false;
1764 0 : break;
1765 : }
1766 :
1767 5802 : subpath = get_cheapest_parameterized_child_path(root,
1768 : childrel,
1769 : required_outer);
1770 5802 : if (subpath == NULL)
1771 : {
1772 : /* failed to make a suitable path for this child */
1773 10 : parameterized_valid = false;
1774 10 : break;
1775 : }
1776 5792 : accumulate_append_subpath(subpath, ¶meterized.subpaths, NULL,
1777 : ¶meterized.child_append_relid_sets);
1778 : }
1779 :
1780 2192 : if (parameterized_valid)
1781 2182 : add_path(rel, (Path *)
1782 2182 : create_append_path(root, rel, parameterized,
1783 : NIL, required_outer, 0, false,
1784 : -1));
1785 : }
1786 :
1787 : /*
1788 : * When there is only a single child relation, the Append path can inherit
1789 : * any ordering available for the child rel's path, so that it's useful to
1790 : * consider ordered partial paths. Above we only considered the cheapest
1791 : * partial path for each child, but let's also make paths using any
1792 : * partial paths that have pathkeys.
1793 : */
1794 37364 : if (list_length(live_childrels) == 1)
1795 : {
1796 10355 : RelOptInfo *childrel = (RelOptInfo *) linitial(live_childrels);
1797 :
1798 : /* skip the cheapest partial path, since we already used that above */
1799 10504 : for_each_from(l, childrel->partial_pathlist, 1)
1800 : {
1801 149 : Path *path = (Path *) lfirst(l);
1802 : AppendPath *appendpath;
1803 149 : AppendPathInput append = {0};
1804 :
1805 : /* skip paths with no pathkeys. */
1806 149 : if (path->pathkeys == NIL)
1807 0 : continue;
1808 :
1809 149 : append.partial_subpaths = list_make1(path);
1810 149 : appendpath = create_append_path(root, rel, append, NIL, NULL,
1811 : path->parallel_workers, true,
1812 : partial_rows);
1813 149 : add_partial_path(rel, (Path *) appendpath);
1814 : }
1815 : }
1816 37364 : }
1817 :
1818 : /*
1819 : * generate_orderedappend_paths
1820 : * Generate ordered append paths for an append relation
1821 : *
1822 : * Usually we generate MergeAppend paths here, but there are some special
1823 : * cases where we can generate simple Append paths, because the subpaths
1824 : * can provide tuples in the required order already.
1825 : *
1826 : * We generate a path for each ordering (pathkey list) appearing in
1827 : * all_child_pathkeys.
1828 : *
1829 : * We consider the cheapest-startup and cheapest-total cases, and also the
1830 : * cheapest-fractional case when not all tuples need to be retrieved. For each
1831 : * interesting ordering, we collect all the cheapest startup subpaths, all the
1832 : * cheapest total paths, and, if applicable, all the cheapest fractional paths,
1833 : * and build a suitable path for each case.
1834 : *
1835 : * We don't currently generate any parameterized ordered paths here. While
1836 : * it would not take much more code here to do so, it's very unclear that it
1837 : * is worth the planning cycles to investigate such paths: there's little
1838 : * use for an ordered path on the inside of a nestloop. In fact, it's likely
1839 : * that the current coding of add_path would reject such paths out of hand,
1840 : * because add_path gives no credit for sort ordering of parameterized paths,
1841 : * and a parameterized MergeAppend is going to be more expensive than the
1842 : * corresponding parameterized Append path. If we ever try harder to support
1843 : * parameterized mergejoin plans, it might be worth adding support for
1844 : * parameterized paths here to feed such joins. (See notes in
1845 : * optimizer/README for why that might not ever happen, though.)
1846 : */
1847 : static void
1848 37094 : generate_orderedappend_paths(PlannerInfo *root, RelOptInfo *rel,
1849 : List *live_childrels,
1850 : List *all_child_pathkeys)
1851 : {
1852 : ListCell *lcp;
1853 37094 : List *partition_pathkeys = NIL;
1854 37094 : List *partition_pathkeys_desc = NIL;
1855 37094 : bool partition_pathkeys_partial = true;
1856 37094 : bool partition_pathkeys_desc_partial = true;
1857 :
1858 : /*
1859 : * Some partitioned table setups may allow us to use an Append node
1860 : * instead of a MergeAppend. This is possible in cases such as RANGE
1861 : * partitioned tables where it's guaranteed that an earlier partition must
1862 : * contain rows which come earlier in the sort order. To detect whether
1863 : * this is relevant, build pathkey descriptions of the partition ordering,
1864 : * for both forward and reverse scans.
1865 : */
1866 59350 : if (rel->part_scheme != NULL && IS_SIMPLE_REL(rel) &&
1867 22256 : partitions_are_ordered(rel->boundinfo, rel->live_parts))
1868 : {
1869 18252 : partition_pathkeys = build_partition_pathkeys(root, rel,
1870 : ForwardScanDirection,
1871 : &partition_pathkeys_partial);
1872 :
1873 18252 : partition_pathkeys_desc = build_partition_pathkeys(root, rel,
1874 : BackwardScanDirection,
1875 : &partition_pathkeys_desc_partial);
1876 :
1877 : /*
1878 : * You might think we should truncate_useless_pathkeys here, but
1879 : * allowing partition keys which are a subset of the query's pathkeys
1880 : * can often be useful. For example, consider a table partitioned by
1881 : * RANGE (a, b), and a query with ORDER BY a, b, c. If we have child
1882 : * paths that can produce the a, b, c ordering (perhaps via indexes on
1883 : * (a, b, c)) then it works to consider the appendrel output as
1884 : * ordered by a, b, c.
1885 : */
1886 : }
1887 :
1888 : /* Now consider each interesting sort ordering */
1889 46337 : foreach(lcp, all_child_pathkeys)
1890 : {
1891 9243 : List *pathkeys = (List *) lfirst(lcp);
1892 9243 : AppendPathInput startup = {0};
1893 9243 : AppendPathInput total = {0};
1894 9243 : AppendPathInput fractional = {0};
1895 9243 : bool startup_neq_total = false;
1896 9243 : bool fraction_neq_total = false;
1897 : bool match_partition_order;
1898 : bool match_partition_order_desc;
1899 : int end_index;
1900 : int first_index;
1901 : int direction;
1902 :
1903 : /*
1904 : * Determine if this sort ordering matches any partition pathkeys we
1905 : * have, for both ascending and descending partition order. If the
1906 : * partition pathkeys happen to be contained in pathkeys then it still
1907 : * works, as described above, providing that the partition pathkeys
1908 : * are complete and not just a prefix of the partition keys. (In such
1909 : * cases we'll be relying on the child paths to have sorted the
1910 : * lower-order columns of the required pathkeys.)
1911 : */
1912 9243 : match_partition_order =
1913 16563 : pathkeys_contained_in(pathkeys, partition_pathkeys) ||
1914 7484 : (!partition_pathkeys_partial &&
1915 164 : pathkeys_contained_in(partition_pathkeys, pathkeys));
1916 :
1917 23681 : match_partition_order_desc = !match_partition_order &&
1918 7234 : (pathkeys_contained_in(pathkeys, partition_pathkeys_desc) ||
1919 7252 : (!partition_pathkeys_desc_partial &&
1920 48 : pathkeys_contained_in(partition_pathkeys_desc, pathkeys)));
1921 :
1922 : /*
1923 : * When the required pathkeys match the reverse of the partition
1924 : * order, we must build the list of paths in reverse starting with the
1925 : * last matching partition first. We can get away without making any
1926 : * special cases for this in the loop below by just looping backward
1927 : * over the child relations in this case.
1928 : */
1929 9243 : if (match_partition_order_desc)
1930 : {
1931 : /* loop backward */
1932 40 : first_index = list_length(live_childrels) - 1;
1933 40 : end_index = -1;
1934 40 : direction = -1;
1935 :
1936 : /*
1937 : * Set this to true to save us having to check for
1938 : * match_partition_order_desc in the loop below.
1939 : */
1940 40 : match_partition_order = true;
1941 : }
1942 : else
1943 : {
1944 : /* for all other case, loop forward */
1945 9203 : first_index = 0;
1946 9203 : end_index = list_length(live_childrels);
1947 9203 : direction = 1;
1948 : }
1949 :
1950 : /* Select the child paths for this ordering... */
1951 33383 : for (int i = first_index; i != end_index; i += direction)
1952 : {
1953 24140 : RelOptInfo *childrel = list_nth_node(RelOptInfo, live_childrels, i);
1954 : Path *cheapest_startup,
1955 : *cheapest_total,
1956 24140 : *cheapest_fractional = NULL;
1957 :
1958 : /* Locate the right paths, if they are available. */
1959 : cheapest_startup =
1960 24140 : get_cheapest_path_for_pathkeys(childrel->pathlist,
1961 : pathkeys,
1962 : NULL,
1963 : STARTUP_COST,
1964 : false);
1965 : cheapest_total =
1966 24140 : get_cheapest_path_for_pathkeys(childrel->pathlist,
1967 : pathkeys,
1968 : NULL,
1969 : TOTAL_COST,
1970 : false);
1971 :
1972 : /*
1973 : * If we can't find any paths with the right order just use the
1974 : * cheapest-total path; we'll have to sort it later.
1975 : */
1976 24140 : if (cheapest_startup == NULL || cheapest_total == NULL)
1977 : {
1978 509 : cheapest_startup = cheapest_total =
1979 : childrel->cheapest_total_path;
1980 : /* Assert we do have an unparameterized path for this child */
1981 : Assert(cheapest_total->param_info == NULL);
1982 : }
1983 :
1984 : /*
1985 : * When building a fractional path, determine a cheapest
1986 : * fractional path for each child relation too. Looking at startup
1987 : * and total costs is not enough, because the cheapest fractional
1988 : * path may be dominated by two separate paths (one for startup,
1989 : * one for total).
1990 : *
1991 : * When needed (building fractional path), determine the cheapest
1992 : * fractional path too.
1993 : */
1994 24140 : if (root->tuple_fraction > 0)
1995 : {
1996 736 : double path_fraction = root->tuple_fraction;
1997 :
1998 : /*
1999 : * We should not have a dummy child relation here. However,
2000 : * we cannot use childrel->rows to compute the tuple fraction,
2001 : * as childrel can be an upper relation with an unset row
2002 : * estimate. Instead, we use the row estimate from the
2003 : * cheapest_total path, which should already have been forced
2004 : * to a sane value.
2005 : */
2006 : Assert(cheapest_total->rows > 0);
2007 :
2008 : /* Convert absolute limit to a path fraction */
2009 736 : if (path_fraction >= 1.0)
2010 736 : path_fraction /= cheapest_total->rows;
2011 :
2012 : cheapest_fractional =
2013 736 : get_cheapest_fractional_path_for_pathkeys(childrel->pathlist,
2014 : pathkeys,
2015 : NULL,
2016 : path_fraction);
2017 :
2018 : /*
2019 : * If we found no path with matching pathkeys, use the
2020 : * cheapest total path instead.
2021 : *
2022 : * XXX We might consider partially sorted paths too (with an
2023 : * incremental sort on top). But we'd have to build all the
2024 : * incremental paths, do the costing etc.
2025 : *
2026 : * Also, notice whether we actually have different paths for
2027 : * the "fractional" and "total" cases. This helps avoid
2028 : * generating two identical ordered append paths.
2029 : */
2030 736 : if (cheapest_fractional == NULL)
2031 34 : cheapest_fractional = cheapest_total;
2032 702 : else if (cheapest_fractional != cheapest_total)
2033 0 : fraction_neq_total = true;
2034 : }
2035 :
2036 : /*
2037 : * Notice whether we actually have different paths for the
2038 : * "cheapest" and "total" cases. This helps avoid generating two
2039 : * identical ordered append paths.
2040 : */
2041 24140 : if (cheapest_startup != cheapest_total)
2042 68 : startup_neq_total = true;
2043 :
2044 : /*
2045 : * Collect the appropriate child paths. The required logic varies
2046 : * for the Append and MergeAppend cases.
2047 : */
2048 24140 : if (match_partition_order)
2049 : {
2050 : /*
2051 : * We're going to make a plain Append path. We don't need
2052 : * most of what accumulate_append_subpath would do, but we do
2053 : * want to cut out child Appends or MergeAppends if they have
2054 : * just a single subpath (and hence aren't doing anything
2055 : * useful).
2056 : */
2057 : cheapest_startup =
2058 5472 : get_singleton_append_subpath(cheapest_startup,
2059 : &startup.child_append_relid_sets);
2060 : cheapest_total =
2061 5472 : get_singleton_append_subpath(cheapest_total,
2062 : &total.child_append_relid_sets);
2063 :
2064 5472 : startup.subpaths = lappend(startup.subpaths, cheapest_startup);
2065 5472 : total.subpaths = lappend(total.subpaths, cheapest_total);
2066 :
2067 5472 : if (cheapest_fractional)
2068 : {
2069 : cheapest_fractional =
2070 120 : get_singleton_append_subpath(cheapest_fractional,
2071 : &fractional.child_append_relid_sets);
2072 120 : fractional.subpaths =
2073 120 : lappend(fractional.subpaths, cheapest_fractional);
2074 : }
2075 : }
2076 : else
2077 : {
2078 : /*
2079 : * Otherwise, rely on accumulate_append_subpath to collect the
2080 : * child paths for the MergeAppend.
2081 : */
2082 18668 : accumulate_append_subpath(cheapest_startup,
2083 : &startup.subpaths, NULL,
2084 : &startup.child_append_relid_sets);
2085 18668 : accumulate_append_subpath(cheapest_total,
2086 : &total.subpaths, NULL,
2087 : &total.child_append_relid_sets);
2088 :
2089 18668 : if (cheapest_fractional)
2090 616 : accumulate_append_subpath(cheapest_fractional,
2091 : &fractional.subpaths, NULL,
2092 : &fractional.child_append_relid_sets);
2093 : }
2094 : }
2095 :
2096 : /* ... and build the Append or MergeAppend paths */
2097 9243 : if (match_partition_order)
2098 : {
2099 : /* We only need Append */
2100 2049 : add_path(rel, (Path *) create_append_path(root,
2101 : rel,
2102 : startup,
2103 : pathkeys,
2104 : NULL,
2105 : 0,
2106 : false,
2107 : -1));
2108 2049 : if (startup_neq_total)
2109 0 : add_path(rel, (Path *) create_append_path(root,
2110 : rel,
2111 : total,
2112 : pathkeys,
2113 : NULL,
2114 : 0,
2115 : false,
2116 : -1));
2117 :
2118 2049 : if (fractional.subpaths && fraction_neq_total)
2119 0 : add_path(rel, (Path *) create_append_path(root,
2120 : rel,
2121 : fractional,
2122 : pathkeys,
2123 : NULL,
2124 : 0,
2125 : false,
2126 : -1));
2127 : }
2128 : else
2129 : {
2130 : /* We need MergeAppend */
2131 7194 : add_path(rel, (Path *) create_merge_append_path(root,
2132 : rel,
2133 : startup.subpaths,
2134 : startup.child_append_relid_sets,
2135 : pathkeys,
2136 : NULL));
2137 7194 : if (startup_neq_total)
2138 44 : add_path(rel, (Path *) create_merge_append_path(root,
2139 : rel,
2140 : total.subpaths,
2141 : total.child_append_relid_sets,
2142 : pathkeys,
2143 : NULL));
2144 :
2145 7194 : if (fractional.subpaths && fraction_neq_total)
2146 0 : add_path(rel, (Path *) create_merge_append_path(root,
2147 : rel,
2148 : fractional.subpaths,
2149 : fractional.child_append_relid_sets,
2150 : pathkeys,
2151 : NULL));
2152 : }
2153 : }
2154 37094 : }
2155 :
2156 : /*
2157 : * get_cheapest_parameterized_child_path
2158 : * Get cheapest path for this relation that has exactly the requested
2159 : * parameterization.
2160 : *
2161 : * Returns NULL if unable to create such a path.
2162 : */
2163 : static Path *
2164 5802 : get_cheapest_parameterized_child_path(PlannerInfo *root, RelOptInfo *rel,
2165 : Relids required_outer)
2166 : {
2167 : Path *cheapest;
2168 : ListCell *lc;
2169 :
2170 : /*
2171 : * Look up the cheapest existing path with no more than the needed
2172 : * parameterization. If it has exactly the needed parameterization, we're
2173 : * done.
2174 : */
2175 5802 : cheapest = get_cheapest_path_for_pathkeys(rel->pathlist,
2176 : NIL,
2177 : required_outer,
2178 : TOTAL_COST,
2179 : false);
2180 : Assert(cheapest != NULL);
2181 5802 : if (bms_equal(PATH_REQ_OUTER(cheapest), required_outer))
2182 4962 : return cheapest;
2183 :
2184 : /*
2185 : * Otherwise, we can "reparameterize" an existing path to match the given
2186 : * parameterization, which effectively means pushing down additional
2187 : * joinquals to be checked within the path's scan. However, some existing
2188 : * paths might check the available joinquals already while others don't;
2189 : * therefore, it's not clear which existing path will be cheapest after
2190 : * reparameterization. We have to go through them all and find out.
2191 : */
2192 840 : cheapest = NULL;
2193 3298 : foreach(lc, rel->pathlist)
2194 : {
2195 2458 : Path *path = (Path *) lfirst(lc);
2196 :
2197 : /* Can't use it if it needs more than requested parameterization */
2198 2458 : if (!bms_is_subset(PATH_REQ_OUTER(path), required_outer))
2199 148 : continue;
2200 :
2201 : /*
2202 : * Reparameterization can only increase the path's cost, so if it's
2203 : * already more expensive than the current cheapest, forget it.
2204 : */
2205 3732 : if (cheapest != NULL &&
2206 1422 : compare_path_costs(cheapest, path, TOTAL_COST) <= 0)
2207 1372 : continue;
2208 :
2209 : /* Reparameterize if needed, then recheck cost */
2210 938 : if (!bms_equal(PATH_REQ_OUTER(path), required_outer))
2211 : {
2212 853 : path = reparameterize_path(root, path, required_outer, 1.0);
2213 853 : if (path == NULL)
2214 58 : continue; /* failed to reparameterize this one */
2215 : Assert(bms_equal(PATH_REQ_OUTER(path), required_outer));
2216 :
2217 795 : if (cheapest != NULL &&
2218 0 : compare_path_costs(cheapest, path, TOTAL_COST) <= 0)
2219 0 : continue;
2220 : }
2221 :
2222 : /* We have a new best path */
2223 880 : cheapest = path;
2224 : }
2225 :
2226 : /* Return the best path, or NULL if we found no suitable candidate */
2227 840 : return cheapest;
2228 : }
2229 :
2230 : /*
2231 : * accumulate_append_subpath
2232 : * Add a subpath to the list being built for an Append or MergeAppend.
2233 : *
2234 : * It's possible that the child is itself an Append or MergeAppend path, in
2235 : * which case we can "cut out the middleman" and just add its child paths to
2236 : * our own list. (We don't try to do this earlier because we need to apply
2237 : * both levels of transformation to the quals.)
2238 : *
2239 : * Note that if we omit a child MergeAppend in this way, we are effectively
2240 : * omitting a sort step, which seems fine: if the parent is to be an Append,
2241 : * its result would be unsorted anyway, while if the parent is to be a
2242 : * MergeAppend, there's no point in a separate sort on a child.
2243 : *
2244 : * Normally, either path is a partial path and subpaths is a list of partial
2245 : * paths, or else path is a non-partial plan and subpaths is a list of those.
2246 : * However, if path is a parallel-aware Append, then we add its partial path
2247 : * children to subpaths and the rest to special_subpaths. If the latter is
2248 : * NULL, we don't flatten the path at all (unless it contains only partial
2249 : * paths).
2250 : */
2251 : static void
2252 249093 : accumulate_append_subpath(Path *path, List **subpaths, List **special_subpaths,
2253 : List **child_append_relid_sets)
2254 : {
2255 249093 : if (IsA(path, AppendPath))
2256 : {
2257 13008 : AppendPath *apath = (AppendPath *) path;
2258 :
2259 13008 : if (!apath->path.parallel_aware || apath->first_partial_path == 0)
2260 : {
2261 12728 : *subpaths = list_concat(*subpaths, apath->subpaths);
2262 12728 : *child_append_relid_sets =
2263 12728 : lappend(*child_append_relid_sets, path->parent->relids);
2264 12728 : *child_append_relid_sets =
2265 12728 : list_concat(*child_append_relid_sets,
2266 12728 : apath->child_append_relid_sets);
2267 12728 : return;
2268 : }
2269 280 : else if (special_subpaths != NULL)
2270 : {
2271 : List *new_special_subpaths;
2272 :
2273 : /* Split Parallel Append into partial and non-partial subpaths */
2274 140 : *subpaths = list_concat(*subpaths,
2275 140 : list_copy_tail(apath->subpaths,
2276 : apath->first_partial_path));
2277 140 : new_special_subpaths = list_copy_head(apath->subpaths,
2278 : apath->first_partial_path);
2279 140 : *special_subpaths = list_concat(*special_subpaths,
2280 : new_special_subpaths);
2281 140 : *child_append_relid_sets =
2282 140 : lappend(*child_append_relid_sets, path->parent->relids);
2283 140 : *child_append_relid_sets =
2284 140 : list_concat(*child_append_relid_sets,
2285 140 : apath->child_append_relid_sets);
2286 140 : return;
2287 : }
2288 : }
2289 236085 : else if (IsA(path, MergeAppendPath))
2290 : {
2291 818 : MergeAppendPath *mpath = (MergeAppendPath *) path;
2292 :
2293 818 : *subpaths = list_concat(*subpaths, mpath->subpaths);
2294 818 : *child_append_relid_sets =
2295 818 : lappend(*child_append_relid_sets, path->parent->relids);
2296 818 : *child_append_relid_sets =
2297 818 : list_concat(*child_append_relid_sets,
2298 818 : mpath->child_append_relid_sets);
2299 818 : return;
2300 : }
2301 :
2302 235407 : *subpaths = lappend(*subpaths, path);
2303 : }
2304 :
2305 : /*
2306 : * get_singleton_append_subpath
2307 : * Returns the single subpath of an Append/MergeAppend, or just
2308 : * return 'path' if it's not a single sub-path Append/MergeAppend.
2309 : *
2310 : * As a side effect, whenever we return a single subpath rather than the
2311 : * original path, add the relid sets for the original path to
2312 : * child_append_relid_sets, so that those relids don't entirely disappear
2313 : * from the final plan.
2314 : *
2315 : * Note: 'path' must not be a parallel-aware path.
2316 : */
2317 : static Path *
2318 11064 : get_singleton_append_subpath(Path *path, List **child_append_relid_sets)
2319 : {
2320 : Assert(!path->parallel_aware);
2321 :
2322 11064 : if (IsA(path, AppendPath))
2323 : {
2324 328 : AppendPath *apath = (AppendPath *) path;
2325 :
2326 328 : if (list_length(apath->subpaths) == 1)
2327 : {
2328 178 : *child_append_relid_sets =
2329 178 : lappend(*child_append_relid_sets, path->parent->relids);
2330 178 : *child_append_relid_sets =
2331 178 : list_concat(*child_append_relid_sets,
2332 178 : apath->child_append_relid_sets);
2333 178 : return (Path *) linitial(apath->subpaths);
2334 : }
2335 : }
2336 10736 : else if (IsA(path, MergeAppendPath))
2337 : {
2338 290 : MergeAppendPath *mpath = (MergeAppendPath *) path;
2339 :
2340 290 : if (list_length(mpath->subpaths) == 1)
2341 : {
2342 0 : *child_append_relid_sets =
2343 0 : lappend(*child_append_relid_sets, path->parent->relids);
2344 0 : *child_append_relid_sets =
2345 0 : list_concat(*child_append_relid_sets,
2346 0 : mpath->child_append_relid_sets);
2347 0 : return (Path *) linitial(mpath->subpaths);
2348 : }
2349 : }
2350 :
2351 10886 : return path;
2352 : }
2353 :
2354 : /*
2355 : * set_dummy_rel_pathlist
2356 : * Build a dummy path for a relation that's been excluded by constraints
2357 : *
2358 : * Rather than inventing a special "dummy" path type, we represent this as an
2359 : * AppendPath with no members (see also IS_DUMMY_APPEND/IS_DUMMY_REL macros).
2360 : *
2361 : * (See also mark_dummy_rel, which does basically the same thing, but is
2362 : * typically used to change a rel into dummy state after we already made
2363 : * paths for it.)
2364 : */
2365 : static void
2366 1178 : set_dummy_rel_pathlist(RelOptInfo *rel)
2367 : {
2368 1178 : AppendPathInput in = {0};
2369 :
2370 : /* Set dummy size estimates --- we leave attr_widths[] as zeroes */
2371 1178 : rel->rows = 0;
2372 1178 : rel->reltarget->width = 0;
2373 :
2374 : /* Discard any pre-existing paths; no further need for them */
2375 1178 : rel->pathlist = NIL;
2376 1178 : rel->partial_pathlist = NIL;
2377 :
2378 : /* Set up the dummy path */
2379 1178 : add_path(rel, (Path *) create_append_path(NULL, rel, in,
2380 : NIL, rel->lateral_relids,
2381 : 0, false, -1));
2382 :
2383 : /*
2384 : * We set the cheapest-path fields immediately, just in case they were
2385 : * pointing at some discarded path. This is redundant in current usage
2386 : * because set_rel_pathlist will do it later, but it's cheap so we keep it
2387 : * for safety and consistency with mark_dummy_rel.
2388 : */
2389 1178 : set_cheapest(rel);
2390 1178 : }
2391 :
2392 : /*
2393 : * find_window_run_conditions
2394 : * Determine if 'wfunc' is really a WindowFunc and call its prosupport
2395 : * function to determine the function's monotonic properties. We then
2396 : * see if 'opexpr' can be used to short-circuit execution.
2397 : *
2398 : * For example row_number() over (order by ...) always produces a value one
2399 : * higher than the previous. If someone has a window function in a subquery
2400 : * and has a WHERE clause in the outer query to filter rows <= 10, then we may
2401 : * as well stop processing the windowagg once the row number reaches 11. Here
2402 : * we check if 'opexpr' might help us to stop doing needless extra processing
2403 : * in WindowAgg nodes.
2404 : *
2405 : * '*keep_original' is set to true if the caller should also use 'opexpr' for
2406 : * its original purpose. This is set to false if the caller can assume that
2407 : * the run condition will handle all of the required filtering.
2408 : *
2409 : * Returns true if 'opexpr' was found to be useful and was added to the
2410 : * WindowFunc's runCondition. We also set *keep_original accordingly and add
2411 : * 'attno' to *run_cond_attrs offset by FirstLowInvalidHeapAttributeNumber.
2412 : * If the 'opexpr' cannot be used then we set *keep_original to true and
2413 : * return false.
2414 : */
2415 : static bool
2416 200 : find_window_run_conditions(Query *subquery, AttrNumber attno,
2417 : WindowFunc *wfunc, OpExpr *opexpr, bool wfunc_left,
2418 : bool *keep_original, Bitmapset **run_cond_attrs)
2419 : {
2420 : Oid prosupport;
2421 : Expr *otherexpr;
2422 : SupportRequestWFuncMonotonic req;
2423 : SupportRequestWFuncMonotonic *res;
2424 : WindowClause *wclause;
2425 : List *opinfos;
2426 : OpExpr *runopexpr;
2427 : Oid runoperator;
2428 : ListCell *lc;
2429 :
2430 200 : *keep_original = true;
2431 :
2432 200 : while (IsA(wfunc, RelabelType))
2433 0 : wfunc = (WindowFunc *) ((RelabelType *) wfunc)->arg;
2434 :
2435 : /* we can only work with window functions */
2436 200 : if (!IsA(wfunc, WindowFunc))
2437 20 : return false;
2438 :
2439 : /* can't use it if there are subplans in the WindowFunc */
2440 180 : if (contain_subplans((Node *) wfunc))
2441 5 : return false;
2442 :
2443 175 : prosupport = get_func_support(wfunc->winfnoid);
2444 :
2445 : /* Check if there's a support function for 'wfunc' */
2446 175 : if (!OidIsValid(prosupport))
2447 15 : return false;
2448 :
2449 : /* get the Expr from the other side of the OpExpr */
2450 160 : if (wfunc_left)
2451 140 : otherexpr = lsecond(opexpr->args);
2452 : else
2453 20 : otherexpr = linitial(opexpr->args);
2454 :
2455 : /*
2456 : * The value being compared must not change during the evaluation of the
2457 : * window partition.
2458 : */
2459 160 : if (!is_pseudo_constant_clause((Node *) otherexpr))
2460 0 : return false;
2461 :
2462 : /* find the window clause belonging to the window function */
2463 160 : wclause = (WindowClause *) list_nth(subquery->windowClause,
2464 160 : wfunc->winref - 1);
2465 :
2466 160 : req.type = T_SupportRequestWFuncMonotonic;
2467 160 : req.window_func = wfunc;
2468 160 : req.window_clause = wclause;
2469 :
2470 : /* call the support function */
2471 : res = (SupportRequestWFuncMonotonic *)
2472 160 : DatumGetPointer(OidFunctionCall1(prosupport,
2473 : PointerGetDatum(&req)));
2474 :
2475 : /*
2476 : * Nothing to do if the function is neither monotonically increasing nor
2477 : * monotonically decreasing.
2478 : */
2479 160 : if (res == NULL || res->monotonic == MONOTONICFUNC_NONE)
2480 0 : return false;
2481 :
2482 160 : runopexpr = NULL;
2483 160 : runoperator = InvalidOid;
2484 160 : opinfos = get_op_index_interpretation(opexpr->opno);
2485 :
2486 160 : foreach(lc, opinfos)
2487 : {
2488 160 : OpIndexInterpretation *opinfo = (OpIndexInterpretation *) lfirst(lc);
2489 160 : CompareType cmptype = opinfo->cmptype;
2490 :
2491 : /* handle < / <= */
2492 160 : if (cmptype == COMPARE_LT || cmptype == COMPARE_LE)
2493 : {
2494 : /*
2495 : * < / <= is supported for monotonically increasing functions in
2496 : * the form <wfunc> op <pseudoconst> and <pseudoconst> op <wfunc>
2497 : * for monotonically decreasing functions.
2498 : */
2499 115 : if ((wfunc_left && (res->monotonic & MONOTONICFUNC_INCREASING)) ||
2500 15 : (!wfunc_left && (res->monotonic & MONOTONICFUNC_DECREASING)))
2501 : {
2502 105 : *keep_original = false;
2503 105 : runopexpr = opexpr;
2504 105 : runoperator = opexpr->opno;
2505 : }
2506 115 : break;
2507 : }
2508 : /* handle > / >= */
2509 45 : else if (cmptype == COMPARE_GT || cmptype == COMPARE_GE)
2510 : {
2511 : /*
2512 : * > / >= is supported for monotonically decreasing functions in
2513 : * the form <wfunc> op <pseudoconst> and <pseudoconst> op <wfunc>
2514 : * for monotonically increasing functions.
2515 : */
2516 15 : if ((wfunc_left && (res->monotonic & MONOTONICFUNC_DECREASING)) ||
2517 10 : (!wfunc_left && (res->monotonic & MONOTONICFUNC_INCREASING)))
2518 : {
2519 15 : *keep_original = false;
2520 15 : runopexpr = opexpr;
2521 15 : runoperator = opexpr->opno;
2522 : }
2523 15 : break;
2524 : }
2525 : /* handle = */
2526 30 : else if (cmptype == COMPARE_EQ)
2527 : {
2528 : CompareType newcmptype;
2529 :
2530 : /*
2531 : * When both monotonically increasing and decreasing then the
2532 : * return value of the window function will be the same each time.
2533 : * We can simply use 'opexpr' as the run condition without
2534 : * modifying it.
2535 : */
2536 30 : if ((res->monotonic & MONOTONICFUNC_BOTH) == MONOTONICFUNC_BOTH)
2537 : {
2538 5 : *keep_original = false;
2539 5 : runopexpr = opexpr;
2540 5 : runoperator = opexpr->opno;
2541 5 : break;
2542 : }
2543 :
2544 : /*
2545 : * When monotonically increasing we make a qual with <wfunc> <=
2546 : * <value> or <value> >= <wfunc> in order to filter out values
2547 : * which are above the value in the equality condition. For
2548 : * monotonically decreasing functions we want to filter values
2549 : * below the value in the equality condition.
2550 : */
2551 25 : if (res->monotonic & MONOTONICFUNC_INCREASING)
2552 25 : newcmptype = wfunc_left ? COMPARE_LE : COMPARE_GE;
2553 : else
2554 0 : newcmptype = wfunc_left ? COMPARE_GE : COMPARE_LE;
2555 :
2556 : /* We must keep the original equality qual */
2557 25 : *keep_original = true;
2558 25 : runopexpr = opexpr;
2559 :
2560 : /* determine the operator to use for the WindowFuncRunCondition */
2561 25 : runoperator = get_opfamily_member_for_cmptype(opinfo->opfamily_id,
2562 : opinfo->oplefttype,
2563 : opinfo->oprighttype,
2564 : newcmptype);
2565 25 : break;
2566 : }
2567 : }
2568 :
2569 160 : if (runopexpr != NULL)
2570 : {
2571 : WindowFuncRunCondition *wfuncrc;
2572 :
2573 150 : wfuncrc = makeNode(WindowFuncRunCondition);
2574 150 : wfuncrc->opno = runoperator;
2575 150 : wfuncrc->inputcollid = runopexpr->inputcollid;
2576 150 : wfuncrc->wfunc_left = wfunc_left;
2577 150 : wfuncrc->arg = copyObject(otherexpr);
2578 :
2579 150 : wfunc->runCondition = lappend(wfunc->runCondition, wfuncrc);
2580 :
2581 : /* record that this attno was used in a run condition */
2582 150 : *run_cond_attrs = bms_add_member(*run_cond_attrs,
2583 : attno - FirstLowInvalidHeapAttributeNumber);
2584 150 : return true;
2585 : }
2586 :
2587 : /* unsupported OpExpr */
2588 10 : return false;
2589 : }
2590 :
2591 : /*
2592 : * check_and_push_window_quals
2593 : * Check if 'clause' is a qual that can be pushed into a WindowFunc
2594 : * as a 'runCondition' qual. These, when present, allow some unnecessary
2595 : * work to be skipped during execution.
2596 : *
2597 : * 'run_cond_attrs' will be populated with all targetlist resnos of subquery
2598 : * targets (offset by FirstLowInvalidHeapAttributeNumber) that we pushed
2599 : * window quals for.
2600 : *
2601 : * Returns true if the caller still must keep the original qual or false if
2602 : * the caller can safely ignore the original qual because the WindowAgg node
2603 : * will use the runCondition to stop returning tuples.
2604 : */
2605 : static bool
2606 210 : check_and_push_window_quals(Query *subquery, Node *clause,
2607 : Bitmapset **run_cond_attrs)
2608 : {
2609 210 : OpExpr *opexpr = (OpExpr *) clause;
2610 210 : bool keep_original = true;
2611 : Var *var1;
2612 : Var *var2;
2613 :
2614 : /* We're only able to use OpExprs with 2 operands */
2615 210 : if (!IsA(opexpr, OpExpr))
2616 15 : return true;
2617 :
2618 195 : if (list_length(opexpr->args) != 2)
2619 0 : return true;
2620 :
2621 : /*
2622 : * Currently, we restrict this optimization to strict OpExprs. The reason
2623 : * for this is that during execution, once the runcondition becomes false,
2624 : * we stop evaluating WindowFuncs. To avoid leaving around stale window
2625 : * function result values, we set them to NULL. Having only strict
2626 : * OpExprs here ensures that we properly filter out the tuples with NULLs
2627 : * in the top-level WindowAgg.
2628 : */
2629 195 : set_opfuncid(opexpr);
2630 195 : if (!func_strict(opexpr->opfuncid))
2631 0 : return true;
2632 :
2633 : /*
2634 : * Check for plain Vars that reference window functions in the subquery.
2635 : * If we find any, we'll ask find_window_run_conditions() if 'opexpr' can
2636 : * be used as part of the run condition.
2637 : */
2638 :
2639 : /* Check the left side of the OpExpr */
2640 195 : var1 = linitial(opexpr->args);
2641 195 : if (IsA(var1, Var) && var1->varattno > 0)
2642 : {
2643 165 : TargetEntry *tle = list_nth(subquery->targetList, var1->varattno - 1);
2644 165 : WindowFunc *wfunc = (WindowFunc *) tle->expr;
2645 :
2646 165 : if (find_window_run_conditions(subquery, tle->resno, wfunc, opexpr,
2647 : true, &keep_original, run_cond_attrs))
2648 135 : return keep_original;
2649 : }
2650 :
2651 : /* and check the right side */
2652 60 : var2 = lsecond(opexpr->args);
2653 60 : if (IsA(var2, Var) && var2->varattno > 0)
2654 : {
2655 35 : TargetEntry *tle = list_nth(subquery->targetList, var2->varattno - 1);
2656 35 : WindowFunc *wfunc = (WindowFunc *) tle->expr;
2657 :
2658 35 : if (find_window_run_conditions(subquery, tle->resno, wfunc, opexpr,
2659 : false, &keep_original, run_cond_attrs))
2660 15 : return keep_original;
2661 : }
2662 :
2663 45 : return true;
2664 : }
2665 :
2666 : /*
2667 : * set_subquery_pathlist
2668 : * Generate SubqueryScan access paths for a subquery RTE
2669 : *
2670 : * We don't currently support generating parameterized paths for subqueries
2671 : * by pushing join clauses down into them; it seems too expensive to re-plan
2672 : * the subquery multiple times to consider different alternatives.
2673 : * (XXX that could stand to be reconsidered, now that we use Paths.)
2674 : * So the paths made here will be parameterized if the subquery contains
2675 : * LATERAL references, otherwise not. As long as that's true, there's no need
2676 : * for a separate set_subquery_size phase: just make the paths right away.
2677 : */
2678 : static void
2679 17357 : set_subquery_pathlist(PlannerInfo *root, RelOptInfo *rel,
2680 : Index rti, RangeTblEntry *rte)
2681 : {
2682 17357 : Query *parse = root->parse;
2683 17357 : Query *subquery = rte->subquery;
2684 : bool trivial_pathtarget;
2685 : Relids required_outer;
2686 : pushdown_safety_info safetyInfo;
2687 : double tuple_fraction;
2688 : RelOptInfo *sub_final_rel;
2689 17357 : Bitmapset *run_cond_attrs = NULL;
2690 : ListCell *lc;
2691 : char *plan_name;
2692 :
2693 : /*
2694 : * Must copy the Query so that planning doesn't mess up the RTE contents
2695 : * (really really need to fix the planner to not scribble on its input,
2696 : * someday ... but see remove_unused_subquery_outputs to start with).
2697 : */
2698 17357 : subquery = copyObject(subquery);
2699 :
2700 : /*
2701 : * If it's a LATERAL subquery, it might contain some Vars of the current
2702 : * query level, requiring it to be treated as parameterized, even though
2703 : * we don't support pushing down join quals into subqueries.
2704 : */
2705 17357 : required_outer = rel->lateral_relids;
2706 :
2707 : /*
2708 : * Zero out result area for subquery_is_pushdown_safe, so that it can set
2709 : * flags as needed while recursing. In particular, we need a workspace
2710 : * for keeping track of the reasons why columns are unsafe to reference.
2711 : * These reasons are stored in the bits inside unsafeFlags[i] when we
2712 : * discover reasons that column i of the subquery is unsafe to be used in
2713 : * a pushed-down qual.
2714 : */
2715 17357 : memset(&safetyInfo, 0, sizeof(safetyInfo));
2716 17357 : safetyInfo.unsafeFlags = (unsigned char *)
2717 17357 : palloc0((list_length(subquery->targetList) + 1) * sizeof(unsigned char));
2718 :
2719 : /*
2720 : * If the subquery has the "security_barrier" flag, it means the subquery
2721 : * originated from a view that must enforce row-level security. Then we
2722 : * must not push down quals that contain leaky functions. (Ideally this
2723 : * would be checked inside subquery_is_pushdown_safe, but since we don't
2724 : * currently pass the RTE to that function, we must do it here.)
2725 : */
2726 17357 : safetyInfo.unsafeLeaky = rte->security_barrier;
2727 :
2728 : /*
2729 : * If there are any restriction clauses that have been attached to the
2730 : * subquery relation, consider pushing them down to become WHERE or HAVING
2731 : * quals of the subquery itself. This transformation is useful because it
2732 : * may allow us to generate a better plan for the subquery than evaluating
2733 : * all the subquery output rows and then filtering them.
2734 : *
2735 : * There are several cases where we cannot push down clauses. Restrictions
2736 : * involving the subquery are checked by subquery_is_pushdown_safe().
2737 : * Restrictions on individual clauses are checked by
2738 : * qual_is_pushdown_safe(). Also, we don't want to push down
2739 : * pseudoconstant clauses; better to have the gating node above the
2740 : * subquery.
2741 : *
2742 : * Non-pushed-down clauses will get evaluated as qpquals of the
2743 : * SubqueryScan node.
2744 : *
2745 : * XXX Are there any cases where we want to make a policy decision not to
2746 : * push down a pushable qual, because it'd result in a worse plan?
2747 : */
2748 19520 : if (rel->baserestrictinfo != NIL &&
2749 2163 : subquery_is_pushdown_safe(subquery, subquery, &safetyInfo))
2750 : {
2751 : /* OK to consider pushing down individual quals */
2752 2042 : List *upperrestrictlist = NIL;
2753 : ListCell *l;
2754 :
2755 5558 : foreach(l, rel->baserestrictinfo)
2756 : {
2757 3516 : RestrictInfo *rinfo = (RestrictInfo *) lfirst(l);
2758 3516 : Node *clause = (Node *) rinfo->clause;
2759 :
2760 3516 : if (rinfo->pseudoconstant)
2761 : {
2762 2 : upperrestrictlist = lappend(upperrestrictlist, rinfo);
2763 2 : continue;
2764 : }
2765 :
2766 3514 : switch (qual_is_pushdown_safe(subquery, rti, rinfo, &safetyInfo))
2767 : {
2768 2664 : case PUSHDOWN_SAFE:
2769 : /* Push it down */
2770 2664 : subquery_push_qual(subquery, rte, rti, clause);
2771 2664 : break;
2772 :
2773 210 : case PUSHDOWN_WINDOWCLAUSE_RUNCOND:
2774 :
2775 : /*
2776 : * Since we can't push the qual down into the subquery,
2777 : * check if it happens to reference a window function. If
2778 : * so then it might be useful to use for the WindowAgg's
2779 : * runCondition.
2780 : */
2781 420 : if (!subquery->hasWindowFuncs ||
2782 210 : check_and_push_window_quals(subquery, clause,
2783 : &run_cond_attrs))
2784 : {
2785 : /*
2786 : * subquery has no window funcs or the clause is not a
2787 : * suitable window run condition qual or it is, but
2788 : * the original must also be kept in the upper query.
2789 : */
2790 85 : upperrestrictlist = lappend(upperrestrictlist, rinfo);
2791 : }
2792 210 : break;
2793 :
2794 640 : case PUSHDOWN_UNSAFE:
2795 640 : upperrestrictlist = lappend(upperrestrictlist, rinfo);
2796 640 : break;
2797 : }
2798 : }
2799 2042 : rel->baserestrictinfo = upperrestrictlist;
2800 : /* We don't bother recomputing baserestrict_min_security */
2801 : }
2802 :
2803 17357 : pfree(safetyInfo.unsafeFlags);
2804 :
2805 : /*
2806 : * The upper query might not use all the subquery's output columns; if
2807 : * not, we can simplify. Pass the attributes that were pushed down into
2808 : * WindowAgg run conditions to ensure we don't accidentally think those
2809 : * are unused.
2810 : */
2811 17357 : remove_unused_subquery_outputs(subquery, rel, run_cond_attrs);
2812 :
2813 : /*
2814 : * We can safely pass the outer tuple_fraction down to the subquery if the
2815 : * outer level has no joining, aggregation, or sorting to do. Otherwise
2816 : * we'd better tell the subquery to plan for full retrieval. (XXX This
2817 : * could probably be made more intelligent ...)
2818 : */
2819 17357 : if (parse->hasAggs ||
2820 13289 : parse->groupClause ||
2821 13274 : parse->groupingSets ||
2822 13274 : root->hasHavingQual ||
2823 13274 : parse->distinctClause ||
2824 18204 : parse->sortClause ||
2825 5264 : bms_membership(root->all_baserels) == BMS_MULTIPLE)
2826 13572 : tuple_fraction = 0.0; /* default case */
2827 : else
2828 3785 : tuple_fraction = root->tuple_fraction;
2829 :
2830 : /* plan_params should not be in use in current query level */
2831 : Assert(root->plan_params == NIL);
2832 :
2833 : /* Generate a subroot and Paths for the subquery */
2834 17357 : plan_name = choose_plan_name(root->glob, rte->eref->aliasname, false);
2835 17357 : rel->subroot = subquery_planner(root->glob, subquery, plan_name,
2836 : root, NULL, false, tuple_fraction, NULL);
2837 :
2838 : /* Isolate the params needed by this specific subplan */
2839 17357 : rel->subplan_params = root->plan_params;
2840 17357 : root->plan_params = NIL;
2841 :
2842 : /*
2843 : * It's possible that constraint exclusion proved the subquery empty. If
2844 : * so, it's desirable to produce an unadorned dummy path so that we will
2845 : * recognize appropriate optimizations at this query level.
2846 : */
2847 17357 : sub_final_rel = fetch_upper_rel(rel->subroot, UPPERREL_FINAL, NULL);
2848 :
2849 17357 : if (IS_DUMMY_REL(sub_final_rel))
2850 : {
2851 105 : set_dummy_rel_pathlist(rel);
2852 105 : return;
2853 : }
2854 :
2855 : /*
2856 : * Mark rel with estimated output rows, width, etc. Note that we have to
2857 : * do this before generating outer-query paths, else cost_subqueryscan is
2858 : * not happy.
2859 : */
2860 17252 : set_subquery_size_estimates(root, rel);
2861 :
2862 : /*
2863 : * Also detect whether the reltarget is trivial, so that we can pass that
2864 : * info to cost_subqueryscan (rather than re-deriving it multiple times).
2865 : * It's trivial if it fetches all the subplan output columns in order.
2866 : */
2867 17252 : if (list_length(rel->reltarget->exprs) != list_length(subquery->targetList))
2868 9561 : trivial_pathtarget = false;
2869 : else
2870 : {
2871 7691 : trivial_pathtarget = true;
2872 21364 : foreach(lc, rel->reltarget->exprs)
2873 : {
2874 13930 : Node *node = (Node *) lfirst(lc);
2875 : Var *var;
2876 :
2877 13930 : if (!IsA(node, Var))
2878 : {
2879 0 : trivial_pathtarget = false;
2880 0 : break;
2881 : }
2882 13930 : var = (Var *) node;
2883 13930 : if (var->varno != rti ||
2884 13930 : var->varattno != foreach_current_index(lc) + 1)
2885 : {
2886 257 : trivial_pathtarget = false;
2887 257 : break;
2888 : }
2889 : }
2890 : }
2891 :
2892 : /*
2893 : * For each Path that subquery_planner produced, make a SubqueryScanPath
2894 : * in the outer query.
2895 : */
2896 35859 : foreach(lc, sub_final_rel->pathlist)
2897 : {
2898 18607 : Path *subpath = (Path *) lfirst(lc);
2899 : List *pathkeys;
2900 :
2901 : /* Convert subpath's pathkeys to outer representation */
2902 18607 : pathkeys = convert_subquery_pathkeys(root,
2903 : rel,
2904 : subpath->pathkeys,
2905 : make_tlist_from_pathtarget(subpath->pathtarget));
2906 :
2907 : /* Generate outer path using this subpath */
2908 18607 : add_path(rel, (Path *)
2909 18607 : create_subqueryscan_path(root, rel, subpath,
2910 : trivial_pathtarget,
2911 : pathkeys, required_outer));
2912 : }
2913 :
2914 : /* If outer rel allows parallelism, do same for partial paths. */
2915 17252 : if (rel->consider_parallel && bms_is_empty(required_outer))
2916 : {
2917 : /* If consider_parallel is false, there should be no partial paths. */
2918 : Assert(sub_final_rel->consider_parallel ||
2919 : sub_final_rel->partial_pathlist == NIL);
2920 :
2921 : /* Same for partial paths. */
2922 10754 : foreach(lc, sub_final_rel->partial_pathlist)
2923 : {
2924 45 : Path *subpath = (Path *) lfirst(lc);
2925 : List *pathkeys;
2926 :
2927 : /* Convert subpath's pathkeys to outer representation */
2928 45 : pathkeys = convert_subquery_pathkeys(root,
2929 : rel,
2930 : subpath->pathkeys,
2931 : make_tlist_from_pathtarget(subpath->pathtarget));
2932 :
2933 : /* Generate outer path using this subpath */
2934 45 : add_partial_path(rel, (Path *)
2935 45 : create_subqueryscan_path(root, rel, subpath,
2936 : trivial_pathtarget,
2937 : pathkeys,
2938 : required_outer));
2939 : }
2940 : }
2941 : }
2942 :
2943 : /*
2944 : * set_function_pathlist
2945 : * Build the (single) access path for a function RTE
2946 : */
2947 : static void
2948 35645 : set_function_pathlist(PlannerInfo *root, RelOptInfo *rel, RangeTblEntry *rte)
2949 : {
2950 : Relids required_outer;
2951 35645 : List *pathkeys = NIL;
2952 :
2953 : /*
2954 : * We don't support pushing join clauses into the quals of a function
2955 : * scan, but it could still have required parameterization due to LATERAL
2956 : * refs in the function expression.
2957 : */
2958 35645 : required_outer = rel->lateral_relids;
2959 :
2960 : /*
2961 : * The result is considered unordered unless ORDINALITY was used, in which
2962 : * case it is ordered by the ordinal column (the last one). See if we
2963 : * care, by checking for uses of that Var in equivalence classes.
2964 : */
2965 35645 : if (rte->funcordinality)
2966 : {
2967 770 : AttrNumber ordattno = rel->max_attr;
2968 770 : Var *var = NULL;
2969 : ListCell *lc;
2970 :
2971 : /*
2972 : * Is there a Var for it in rel's targetlist? If not, the query did
2973 : * not reference the ordinality column, or at least not in any way
2974 : * that would be interesting for sorting.
2975 : */
2976 1787 : foreach(lc, rel->reltarget->exprs)
2977 : {
2978 1782 : Var *node = (Var *) lfirst(lc);
2979 :
2980 : /* checking varno/varlevelsup is just paranoia */
2981 1782 : if (IsA(node, Var) &&
2982 1782 : node->varattno == ordattno &&
2983 765 : node->varno == rel->relid &&
2984 765 : node->varlevelsup == 0)
2985 : {
2986 765 : var = node;
2987 765 : break;
2988 : }
2989 : }
2990 :
2991 : /*
2992 : * Try to build pathkeys for this Var with int8 sorting. We tell
2993 : * build_expression_pathkey not to build any new equivalence class; if
2994 : * the Var isn't already mentioned in some EC, it means that nothing
2995 : * cares about the ordering.
2996 : */
2997 770 : if (var)
2998 765 : pathkeys = build_expression_pathkey(root,
2999 : (Expr *) var,
3000 : Int8LessOperator,
3001 : rel->relids,
3002 : false);
3003 : }
3004 :
3005 : /* Generate appropriate path */
3006 35645 : add_path(rel, create_functionscan_path(root, rel,
3007 : pathkeys, required_outer));
3008 35645 : }
3009 :
3010 : /*
3011 : * set_values_pathlist
3012 : * Build the (single) access path for a VALUES RTE
3013 : */
3014 : static void
3015 6793 : set_values_pathlist(PlannerInfo *root, RelOptInfo *rel, RangeTblEntry *rte)
3016 : {
3017 : Relids required_outer;
3018 :
3019 : /*
3020 : * We don't support pushing join clauses into the quals of a values scan,
3021 : * but it could still have required parameterization due to LATERAL refs
3022 : * in the values expressions.
3023 : */
3024 6793 : required_outer = rel->lateral_relids;
3025 :
3026 : /* Generate appropriate path */
3027 6793 : add_path(rel, create_valuesscan_path(root, rel, required_outer));
3028 6793 : }
3029 :
3030 : /*
3031 : * set_tablefunc_pathlist
3032 : * Build the (single) access path for a table func RTE
3033 : */
3034 : static void
3035 519 : set_tablefunc_pathlist(PlannerInfo *root, RelOptInfo *rel, RangeTblEntry *rte)
3036 : {
3037 : Relids required_outer;
3038 :
3039 : /*
3040 : * We don't support pushing join clauses into the quals of a tablefunc
3041 : * scan, but it could still have required parameterization due to LATERAL
3042 : * refs in the function expression.
3043 : */
3044 519 : required_outer = rel->lateral_relids;
3045 :
3046 : /* Generate appropriate path */
3047 519 : add_path(rel, create_tablefuncscan_path(root, rel,
3048 : required_outer));
3049 519 : }
3050 :
3051 : /*
3052 : * set_cte_pathlist
3053 : * Build the (single) access path for a non-self-reference CTE RTE
3054 : *
3055 : * There's no need for a separate set_cte_size phase, since we don't
3056 : * support join-qual-parameterized paths for CTEs.
3057 : */
3058 : static void
3059 2928 : set_cte_pathlist(PlannerInfo *root, RelOptInfo *rel, RangeTblEntry *rte)
3060 : {
3061 : Path *ctepath;
3062 : Plan *cteplan;
3063 : PlannerInfo *cteroot;
3064 : Index levelsup;
3065 : List *pathkeys;
3066 : int ndx;
3067 : ListCell *lc;
3068 : int plan_id;
3069 : Relids required_outer;
3070 :
3071 : /*
3072 : * Find the referenced CTE, and locate the path and plan previously made
3073 : * for it.
3074 : */
3075 2928 : levelsup = rte->ctelevelsup;
3076 2928 : cteroot = root;
3077 4994 : while (levelsup-- > 0)
3078 : {
3079 2066 : cteroot = cteroot->parent_root;
3080 2066 : if (!cteroot) /* shouldn't happen */
3081 0 : elog(ERROR, "bad levelsup for CTE \"%s\"", rte->ctename);
3082 : }
3083 :
3084 : /*
3085 : * Note: cte_plan_ids can be shorter than cteList, if we are still working
3086 : * on planning the CTEs (ie, this is a side-reference from another CTE).
3087 : * So we mustn't use forboth here.
3088 : */
3089 2928 : ndx = 0;
3090 3884 : foreach(lc, cteroot->parse->cteList)
3091 : {
3092 3884 : CommonTableExpr *cte = (CommonTableExpr *) lfirst(lc);
3093 :
3094 3884 : if (strcmp(cte->ctename, rte->ctename) == 0)
3095 2928 : break;
3096 956 : ndx++;
3097 : }
3098 2928 : if (lc == NULL) /* shouldn't happen */
3099 0 : elog(ERROR, "could not find CTE \"%s\"", rte->ctename);
3100 2928 : if (ndx >= list_length(cteroot->cte_plan_ids))
3101 0 : elog(ERROR, "could not find plan for CTE \"%s\"", rte->ctename);
3102 2928 : plan_id = list_nth_int(cteroot->cte_plan_ids, ndx);
3103 2928 : if (plan_id <= 0)
3104 0 : elog(ERROR, "no plan was made for CTE \"%s\"", rte->ctename);
3105 :
3106 : Assert(list_length(root->glob->subpaths) == list_length(root->glob->subplans));
3107 2928 : ctepath = (Path *) list_nth(root->glob->subpaths, plan_id - 1);
3108 2928 : cteplan = (Plan *) list_nth(root->glob->subplans, plan_id - 1);
3109 :
3110 : /* Mark rel with estimated output rows, width, etc */
3111 2928 : set_cte_size_estimates(root, rel, cteplan->plan_rows);
3112 :
3113 : /* Convert the ctepath's pathkeys to outer query's representation */
3114 2928 : pathkeys = convert_subquery_pathkeys(root,
3115 : rel,
3116 : ctepath->pathkeys,
3117 : cteplan->targetlist);
3118 :
3119 : /*
3120 : * We don't support pushing join clauses into the quals of a CTE scan, but
3121 : * it could still have required parameterization due to LATERAL refs in
3122 : * its tlist.
3123 : */
3124 2928 : required_outer = rel->lateral_relids;
3125 :
3126 : /* Generate appropriate path */
3127 2928 : add_path(rel, create_ctescan_path(root, rel, pathkeys, required_outer));
3128 2928 : }
3129 :
3130 : /*
3131 : * set_namedtuplestore_pathlist
3132 : * Build the (single) access path for a named tuplestore RTE
3133 : *
3134 : * There's no need for a separate set_namedtuplestore_size phase, since we
3135 : * don't support join-qual-parameterized paths for tuplestores.
3136 : */
3137 : static void
3138 433 : set_namedtuplestore_pathlist(PlannerInfo *root, RelOptInfo *rel,
3139 : RangeTblEntry *rte)
3140 : {
3141 : Relids required_outer;
3142 :
3143 : /* Mark rel with estimated output rows, width, etc */
3144 433 : set_namedtuplestore_size_estimates(root, rel);
3145 :
3146 : /*
3147 : * We don't support pushing join clauses into the quals of a tuplestore
3148 : * scan, but it could still have required parameterization due to LATERAL
3149 : * refs in its tlist.
3150 : */
3151 433 : required_outer = rel->lateral_relids;
3152 :
3153 : /* Generate appropriate path */
3154 433 : add_path(rel, create_namedtuplestorescan_path(root, rel, required_outer));
3155 433 : }
3156 :
3157 : /*
3158 : * set_result_pathlist
3159 : * Build the (single) access path for an RTE_RESULT RTE
3160 : *
3161 : * There's no need for a separate set_result_size phase, since we
3162 : * don't support join-qual-parameterized paths for these RTEs.
3163 : */
3164 : static void
3165 3595 : set_result_pathlist(PlannerInfo *root, RelOptInfo *rel,
3166 : RangeTblEntry *rte)
3167 : {
3168 : Relids required_outer;
3169 :
3170 : /* Mark rel with estimated output rows, width, etc */
3171 3595 : set_result_size_estimates(root, rel);
3172 :
3173 : /*
3174 : * We don't support pushing join clauses into the quals of a Result scan,
3175 : * but it could still have required parameterization due to LATERAL refs
3176 : * in its tlist.
3177 : */
3178 3595 : required_outer = rel->lateral_relids;
3179 :
3180 : /* Generate appropriate path */
3181 3595 : add_path(rel, create_resultscan_path(root, rel, required_outer));
3182 3595 : }
3183 :
3184 : /*
3185 : * set_worktable_pathlist
3186 : * Build the (single) access path for a self-reference CTE RTE
3187 : *
3188 : * There's no need for a separate set_worktable_size phase, since we don't
3189 : * support join-qual-parameterized paths for CTEs.
3190 : */
3191 : static void
3192 692 : set_worktable_pathlist(PlannerInfo *root, RelOptInfo *rel, RangeTblEntry *rte)
3193 : {
3194 : Path *ctepath;
3195 : PlannerInfo *cteroot;
3196 : Index levelsup;
3197 : Relids required_outer;
3198 :
3199 : /*
3200 : * We need to find the non-recursive term's path, which is in the plan
3201 : * level that's processing the recursive UNION, which is one level *below*
3202 : * where the CTE comes from.
3203 : */
3204 692 : levelsup = rte->ctelevelsup;
3205 692 : if (levelsup == 0) /* shouldn't happen */
3206 0 : elog(ERROR, "bad levelsup for CTE \"%s\"", rte->ctename);
3207 692 : levelsup--;
3208 692 : cteroot = root;
3209 1626 : while (levelsup-- > 0)
3210 : {
3211 934 : cteroot = cteroot->parent_root;
3212 934 : if (!cteroot) /* shouldn't happen */
3213 0 : elog(ERROR, "bad levelsup for CTE \"%s\"", rte->ctename);
3214 : }
3215 692 : ctepath = cteroot->non_recursive_path;
3216 692 : if (!ctepath) /* shouldn't happen */
3217 0 : elog(ERROR, "could not find path for CTE \"%s\"", rte->ctename);
3218 :
3219 : /* Mark rel with estimated output rows, width, etc */
3220 692 : set_cte_size_estimates(root, rel, ctepath->rows);
3221 :
3222 : /*
3223 : * We don't support pushing join clauses into the quals of a worktable
3224 : * scan, but it could still have required parameterization due to LATERAL
3225 : * refs in its tlist. (I'm not sure this is actually possible given the
3226 : * restrictions on recursive references, but it's easy enough to support.)
3227 : */
3228 692 : required_outer = rel->lateral_relids;
3229 :
3230 : /* Generate appropriate path */
3231 692 : add_path(rel, create_worktablescan_path(root, rel, required_outer));
3232 692 : }
3233 :
3234 : /*
3235 : * generate_gather_paths
3236 : * Generate parallel access paths for a relation by pushing a Gather or
3237 : * Gather Merge on top of a partial path.
3238 : *
3239 : * This must not be called until after we're done creating all partial paths
3240 : * for the specified relation. (Otherwise, add_partial_path might delete a
3241 : * path that some GatherPath or GatherMergePath has a reference to.)
3242 : *
3243 : * If we're generating paths for a scan or join relation, override_rows will
3244 : * be false, and we'll just use the relation's size estimate. When we're
3245 : * being called for a partially-grouped or partially-distinct path, though, we
3246 : * need to override the rowcount estimate. (It's not clear that the
3247 : * particular value we're using here is actually best, but the underlying rel
3248 : * has no estimate so we must do something.)
3249 : */
3250 : void
3251 21875 : generate_gather_paths(PlannerInfo *root, RelOptInfo *rel, bool override_rows)
3252 : {
3253 : Path *cheapest_partial_path;
3254 : Path *simple_gather_path;
3255 : ListCell *lc;
3256 : double rows;
3257 21875 : double *rowsp = NULL;
3258 :
3259 : /* If there are no partial paths, there's nothing to do here. */
3260 21875 : if (rel->partial_pathlist == NIL)
3261 0 : return;
3262 :
3263 : /* Should we override the rel's rowcount estimate? */
3264 21875 : if (override_rows)
3265 5810 : rowsp = &rows;
3266 :
3267 : /*
3268 : * The output of Gather is always unsorted, so there's only one partial
3269 : * path of interest: the cheapest one. That will be the one at the front
3270 : * of partial_pathlist because of the way add_partial_path works.
3271 : */
3272 21875 : cheapest_partial_path = linitial(rel->partial_pathlist);
3273 21875 : rows = compute_gather_rows(cheapest_partial_path);
3274 : simple_gather_path = (Path *)
3275 21875 : create_gather_path(root, rel, cheapest_partial_path, rel->reltarget,
3276 : NULL, rowsp);
3277 21875 : add_path(rel, simple_gather_path);
3278 :
3279 : /*
3280 : * For each useful ordering, we can consider an order-preserving Gather
3281 : * Merge.
3282 : */
3283 48737 : foreach(lc, rel->partial_pathlist)
3284 : {
3285 26862 : Path *subpath = (Path *) lfirst(lc);
3286 : GatherMergePath *path;
3287 :
3288 26862 : if (subpath->pathkeys == NIL)
3289 21316 : continue;
3290 :
3291 5546 : rows = compute_gather_rows(subpath);
3292 5546 : path = create_gather_merge_path(root, rel, subpath, rel->reltarget,
3293 : subpath->pathkeys, NULL, rowsp);
3294 5546 : add_path(rel, &path->path);
3295 : }
3296 : }
3297 :
3298 : /*
3299 : * get_useful_pathkeys_for_relation
3300 : * Determine which orderings of a relation might be useful.
3301 : *
3302 : * Getting data in sorted order can be useful either because the requested
3303 : * order matches the final output ordering for the overall query we're
3304 : * planning, or because it enables an efficient merge join. Here, we try
3305 : * to figure out which pathkeys to consider.
3306 : *
3307 : * This allows us to do incremental sort on top of an index scan under a gather
3308 : * merge node, i.e. parallelized.
3309 : *
3310 : * If the require_parallel_safe is true, we also require the expressions to
3311 : * be parallel safe (which allows pushing the sort below Gather Merge).
3312 : *
3313 : * XXX At the moment this can only ever return a list with a single element,
3314 : * because it looks at query_pathkeys only. So we might return the pathkeys
3315 : * directly, but it seems plausible we'll want to consider other orderings
3316 : * in the future. For example, we might want to consider pathkeys useful for
3317 : * merge joins.
3318 : */
3319 : static List *
3320 21875 : get_useful_pathkeys_for_relation(PlannerInfo *root, RelOptInfo *rel,
3321 : bool require_parallel_safe)
3322 : {
3323 21875 : List *useful_pathkeys_list = NIL;
3324 :
3325 : /*
3326 : * Considering query_pathkeys is always worth it, because it might allow
3327 : * us to avoid a total sort when we have a partially presorted path
3328 : * available or to push the total sort into the parallel portion of the
3329 : * query.
3330 : */
3331 21875 : if (root->query_pathkeys)
3332 : {
3333 : ListCell *lc;
3334 13155 : int npathkeys = 0; /* useful pathkeys */
3335 :
3336 23188 : foreach(lc, root->query_pathkeys)
3337 : {
3338 16962 : PathKey *pathkey = (PathKey *) lfirst(lc);
3339 16962 : EquivalenceClass *pathkey_ec = pathkey->pk_eclass;
3340 :
3341 : /*
3342 : * We can only build a sort for pathkeys that contain a
3343 : * safe-to-compute-early EC member computable from the current
3344 : * relation's reltarget, so ignore the remainder of the list as
3345 : * soon as we find a pathkey without such a member.
3346 : *
3347 : * It's still worthwhile to return any prefix of the pathkeys list
3348 : * that meets this requirement, as we may be able to do an
3349 : * incremental sort.
3350 : *
3351 : * If requested, ensure the sort expression is parallel-safe too.
3352 : */
3353 16962 : if (!relation_can_be_sorted_early(root, rel, pathkey_ec,
3354 : require_parallel_safe))
3355 6929 : break;
3356 :
3357 10033 : npathkeys++;
3358 : }
3359 :
3360 : /*
3361 : * The whole query_pathkeys list matches, so append it directly, to
3362 : * allow comparing pathkeys easily by comparing list pointer. If we
3363 : * have to truncate the pathkeys, we gotta do a copy though.
3364 : */
3365 13155 : if (npathkeys == list_length(root->query_pathkeys))
3366 6226 : useful_pathkeys_list = lappend(useful_pathkeys_list,
3367 6226 : root->query_pathkeys);
3368 6929 : else if (npathkeys > 0)
3369 545 : useful_pathkeys_list = lappend(useful_pathkeys_list,
3370 545 : list_copy_head(root->query_pathkeys,
3371 : npathkeys));
3372 : }
3373 :
3374 21875 : return useful_pathkeys_list;
3375 : }
3376 :
3377 : /*
3378 : * generate_useful_gather_paths
3379 : * Generate parallel access paths for a relation by pushing a Gather or
3380 : * Gather Merge on top of a partial path.
3381 : *
3382 : * Unlike plain generate_gather_paths, this looks both at pathkeys of input
3383 : * paths (aiming to preserve the ordering), but also considers ordering that
3384 : * might be useful for nodes above the gather merge node, and tries to add
3385 : * a sort (regular or incremental) to provide that.
3386 : */
3387 : void
3388 486235 : generate_useful_gather_paths(PlannerInfo *root, RelOptInfo *rel, bool override_rows)
3389 : {
3390 : ListCell *lc;
3391 : double rows;
3392 486235 : double *rowsp = NULL;
3393 486235 : List *useful_pathkeys_list = NIL;
3394 486235 : Path *cheapest_partial_path = NULL;
3395 :
3396 : /* If there are no partial paths, there's nothing to do here. */
3397 486235 : if (rel->partial_pathlist == NIL)
3398 464360 : return;
3399 :
3400 : /* Should we override the rel's rowcount estimate? */
3401 21875 : if (override_rows)
3402 5810 : rowsp = &rows;
3403 :
3404 : /* generate the regular gather (merge) paths */
3405 21875 : generate_gather_paths(root, rel, override_rows);
3406 :
3407 : /* consider incremental sort for interesting orderings */
3408 21875 : useful_pathkeys_list = get_useful_pathkeys_for_relation(root, rel, true);
3409 :
3410 : /* used for explicit (full) sort paths */
3411 21875 : cheapest_partial_path = linitial(rel->partial_pathlist);
3412 :
3413 : /*
3414 : * Consider sorted paths for each interesting ordering. We generate both
3415 : * incremental and full sort.
3416 : */
3417 28646 : foreach(lc, useful_pathkeys_list)
3418 : {
3419 6771 : List *useful_pathkeys = lfirst(lc);
3420 : ListCell *lc2;
3421 : bool is_sorted;
3422 : int presorted_keys;
3423 :
3424 15771 : foreach(lc2, rel->partial_pathlist)
3425 : {
3426 9000 : Path *subpath = (Path *) lfirst(lc2);
3427 : GatherMergePath *path;
3428 :
3429 9000 : is_sorted = pathkeys_count_contained_in(useful_pathkeys,
3430 : subpath->pathkeys,
3431 : &presorted_keys);
3432 :
3433 : /*
3434 : * We don't need to consider the case where a subpath is already
3435 : * fully sorted because generate_gather_paths already creates a
3436 : * gather merge path for every subpath that has pathkeys present.
3437 : *
3438 : * But since the subpath is already sorted, we know we don't need
3439 : * to consider adding a sort (full or incremental) on top of it,
3440 : * so we can continue here.
3441 : */
3442 9000 : if (is_sorted)
3443 2380 : continue;
3444 :
3445 : /*
3446 : * Try at least sorting the cheapest path and also try
3447 : * incrementally sorting any path which is partially sorted
3448 : * already (no need to deal with paths which have presorted keys
3449 : * when incremental sort is disabled unless it's the cheapest
3450 : * input path).
3451 : */
3452 6620 : if (subpath != cheapest_partial_path &&
3453 260 : (presorted_keys == 0 || !enable_incremental_sort))
3454 73 : continue;
3455 :
3456 : /*
3457 : * Consider regular sort for any path that's not presorted or if
3458 : * incremental sort is disabled. We've no need to consider both
3459 : * sort and incremental sort on the same path. We assume that
3460 : * incremental sort is always faster when there are presorted
3461 : * keys.
3462 : *
3463 : * This is not redundant with the gather paths created in
3464 : * generate_gather_paths, because that doesn't generate ordered
3465 : * output. Here we add an explicit sort to match the useful
3466 : * ordering.
3467 : */
3468 6547 : if (presorted_keys == 0 || !enable_incremental_sort)
3469 : {
3470 6349 : subpath = (Path *) create_sort_path(root,
3471 : rel,
3472 : subpath,
3473 : useful_pathkeys,
3474 : -1.0);
3475 : }
3476 : else
3477 198 : subpath = (Path *) create_incremental_sort_path(root,
3478 : rel,
3479 : subpath,
3480 : useful_pathkeys,
3481 : presorted_keys,
3482 : -1);
3483 6547 : rows = compute_gather_rows(subpath);
3484 6547 : path = create_gather_merge_path(root, rel,
3485 : subpath,
3486 6547 : rel->reltarget,
3487 : subpath->pathkeys,
3488 : NULL,
3489 : rowsp);
3490 :
3491 6547 : add_path(rel, &path->path);
3492 : }
3493 : }
3494 : }
3495 :
3496 : /*
3497 : * generate_grouped_paths
3498 : * Generate paths for a grouped relation by adding sorted and hashed
3499 : * partial aggregation paths on top of paths of the ungrouped relation.
3500 : *
3501 : * The information needed is provided by the RelAggInfo structure stored in
3502 : * "grouped_rel".
3503 : */
3504 : void
3505 727 : generate_grouped_paths(PlannerInfo *root, RelOptInfo *grouped_rel,
3506 : RelOptInfo *rel)
3507 : {
3508 727 : RelAggInfo *agg_info = grouped_rel->agg_info;
3509 : AggClauseCosts agg_costs;
3510 : bool can_hash;
3511 : bool can_sort;
3512 727 : Path *cheapest_total_path = NULL;
3513 727 : Path *cheapest_partial_path = NULL;
3514 727 : double dNumGroups = 0;
3515 727 : double dNumPartialGroups = 0;
3516 727 : List *group_pathkeys = NIL;
3517 :
3518 727 : if (IS_DUMMY_REL(rel))
3519 : {
3520 0 : mark_dummy_rel(grouped_rel);
3521 0 : return;
3522 : }
3523 :
3524 : /*
3525 : * We push partial aggregation only to the lowest possible level in the
3526 : * join tree that is deemed useful.
3527 : */
3528 727 : if (!bms_equal(agg_info->apply_agg_at, rel->relids) ||
3529 727 : !agg_info->agg_useful)
3530 0 : return;
3531 :
3532 4362 : MemSet(&agg_costs, 0, sizeof(AggClauseCosts));
3533 727 : get_agg_clause_costs(root, AGGSPLIT_INITIAL_SERIAL, &agg_costs);
3534 :
3535 : /*
3536 : * Determine whether it's possible to perform sort-based implementations
3537 : * of grouping, and generate the pathkeys that represent the grouping
3538 : * requirements in that case.
3539 : */
3540 727 : can_sort = grouping_is_sortable(agg_info->group_clauses);
3541 727 : if (can_sort)
3542 : {
3543 : RelOptInfo *top_grouped_rel;
3544 : List *top_group_tlist;
3545 :
3546 397 : top_grouped_rel = IS_OTHER_REL(rel) ?
3547 1124 : rel->top_parent->grouped_rel : grouped_rel;
3548 : top_group_tlist =
3549 727 : make_tlist_from_pathtarget(top_grouped_rel->agg_info->target);
3550 :
3551 : group_pathkeys =
3552 727 : make_pathkeys_for_sortclauses(root, agg_info->group_clauses,
3553 : top_group_tlist);
3554 : }
3555 :
3556 : /*
3557 : * Determine whether we should consider hash-based implementations of
3558 : * grouping.
3559 : */
3560 : Assert(root->numOrderedAggs == 0);
3561 1454 : can_hash = (agg_info->group_clauses != NIL &&
3562 727 : grouping_is_hashable(agg_info->group_clauses));
3563 :
3564 : /*
3565 : * Consider whether we should generate partially aggregated non-partial
3566 : * paths. We can only do this if we have a non-partial path.
3567 : */
3568 727 : if (rel->pathlist != NIL)
3569 : {
3570 727 : cheapest_total_path = rel->cheapest_total_path;
3571 : Assert(cheapest_total_path != NULL);
3572 : }
3573 :
3574 : /*
3575 : * If parallelism is possible for grouped_rel, then we should consider
3576 : * generating partially-grouped partial paths. However, if the ungrouped
3577 : * rel has no partial paths, then we can't.
3578 : */
3579 727 : if (grouped_rel->consider_parallel && rel->partial_pathlist != NIL)
3580 : {
3581 610 : cheapest_partial_path = linitial(rel->partial_pathlist);
3582 : Assert(cheapest_partial_path != NULL);
3583 : }
3584 :
3585 : /* Estimate number of partial groups. */
3586 727 : if (cheapest_total_path != NULL)
3587 727 : dNumGroups = estimate_num_groups(root,
3588 : agg_info->group_exprs,
3589 : cheapest_total_path->rows,
3590 : NULL, NULL);
3591 727 : if (cheapest_partial_path != NULL)
3592 610 : dNumPartialGroups = estimate_num_groups(root,
3593 : agg_info->group_exprs,
3594 : cheapest_partial_path->rows,
3595 : NULL, NULL);
3596 :
3597 727 : if (can_sort && cheapest_total_path != NULL)
3598 : {
3599 : ListCell *lc;
3600 :
3601 : /*
3602 : * Use any available suitably-sorted path as input, and also consider
3603 : * sorting the cheapest-total path and incremental sort on any paths
3604 : * with presorted keys.
3605 : *
3606 : * To save planning time, we ignore parameterized input paths unless
3607 : * they are the cheapest-total path.
3608 : */
3609 1735 : foreach(lc, rel->pathlist)
3610 : {
3611 1008 : Path *input_path = (Path *) lfirst(lc);
3612 : Path *path;
3613 : bool is_sorted;
3614 : int presorted_keys;
3615 :
3616 : /*
3617 : * Ignore parameterized paths that are not the cheapest-total
3618 : * path.
3619 : */
3620 1008 : if (input_path->param_info &&
3621 : input_path != cheapest_total_path)
3622 23 : continue;
3623 :
3624 1003 : is_sorted = pathkeys_count_contained_in(group_pathkeys,
3625 : input_path->pathkeys,
3626 : &presorted_keys);
3627 :
3628 : /*
3629 : * Ignore paths that are not suitably or partially sorted, unless
3630 : * they are the cheapest total path (no need to deal with paths
3631 : * which have presorted keys when incremental sort is disabled).
3632 : */
3633 1003 : if (!is_sorted && input_path != cheapest_total_path &&
3634 122 : (presorted_keys == 0 || !enable_incremental_sort))
3635 18 : continue;
3636 :
3637 : /*
3638 : * Since the path originates from a non-grouped relation that is
3639 : * not aware of eager aggregation, we must ensure that it provides
3640 : * the correct input for partial aggregation.
3641 : */
3642 985 : path = (Path *) create_projection_path(root,
3643 : grouped_rel,
3644 : input_path,
3645 985 : agg_info->agg_input);
3646 :
3647 985 : if (!is_sorted)
3648 : {
3649 : /*
3650 : * We've no need to consider both a sort and incremental sort.
3651 : * We'll just do a sort if there are no presorted keys and an
3652 : * incremental sort when there are presorted keys.
3653 : */
3654 826 : if (presorted_keys == 0 || !enable_incremental_sort)
3655 716 : path = (Path *) create_sort_path(root,
3656 : grouped_rel,
3657 : path,
3658 : group_pathkeys,
3659 : -1.0);
3660 : else
3661 110 : path = (Path *) create_incremental_sort_path(root,
3662 : grouped_rel,
3663 : path,
3664 : group_pathkeys,
3665 : presorted_keys,
3666 : -1.0);
3667 : }
3668 :
3669 : /*
3670 : * qual is NIL because the HAVING clause cannot be evaluated until
3671 : * the final value of the aggregate is known.
3672 : */
3673 985 : path = (Path *) create_agg_path(root,
3674 : grouped_rel,
3675 : path,
3676 985 : agg_info->target,
3677 : AGG_SORTED,
3678 : AGGSPLIT_INITIAL_SERIAL,
3679 : agg_info->group_clauses,
3680 : NIL,
3681 : &agg_costs,
3682 : dNumGroups);
3683 :
3684 985 : add_path(grouped_rel, path);
3685 : }
3686 : }
3687 :
3688 727 : if (can_sort && cheapest_partial_path != NULL)
3689 : {
3690 : ListCell *lc;
3691 :
3692 : /* Similar to above logic, but for partial paths. */
3693 1394 : foreach(lc, rel->partial_pathlist)
3694 : {
3695 784 : Path *input_path = (Path *) lfirst(lc);
3696 : Path *path;
3697 : bool is_sorted;
3698 : int presorted_keys;
3699 :
3700 784 : is_sorted = pathkeys_count_contained_in(group_pathkeys,
3701 : input_path->pathkeys,
3702 : &presorted_keys);
3703 :
3704 : /*
3705 : * Ignore paths that are not suitably or partially sorted, unless
3706 : * they are the cheapest partial path (no need to deal with paths
3707 : * which have presorted keys when incremental sort is disabled).
3708 : */
3709 784 : if (!is_sorted && input_path != cheapest_partial_path &&
3710 70 : (presorted_keys == 0 || !enable_incremental_sort))
3711 0 : continue;
3712 :
3713 : /*
3714 : * Since the path originates from a non-grouped relation that is
3715 : * not aware of eager aggregation, we must ensure that it provides
3716 : * the correct input for partial aggregation.
3717 : */
3718 784 : path = (Path *) create_projection_path(root,
3719 : grouped_rel,
3720 : input_path,
3721 784 : agg_info->agg_input);
3722 :
3723 784 : if (!is_sorted)
3724 : {
3725 : /*
3726 : * We've no need to consider both a sort and incremental sort.
3727 : * We'll just do a sort if there are no presorted keys and an
3728 : * incremental sort when there are presorted keys.
3729 : */
3730 680 : if (presorted_keys == 0 || !enable_incremental_sort)
3731 610 : path = (Path *) create_sort_path(root,
3732 : grouped_rel,
3733 : path,
3734 : group_pathkeys,
3735 : -1.0);
3736 : else
3737 70 : path = (Path *) create_incremental_sort_path(root,
3738 : grouped_rel,
3739 : path,
3740 : group_pathkeys,
3741 : presorted_keys,
3742 : -1.0);
3743 : }
3744 :
3745 : /*
3746 : * qual is NIL because the HAVING clause cannot be evaluated until
3747 : * the final value of the aggregate is known.
3748 : */
3749 784 : path = (Path *) create_agg_path(root,
3750 : grouped_rel,
3751 : path,
3752 784 : agg_info->target,
3753 : AGG_SORTED,
3754 : AGGSPLIT_INITIAL_SERIAL,
3755 : agg_info->group_clauses,
3756 : NIL,
3757 : &agg_costs,
3758 : dNumPartialGroups);
3759 :
3760 784 : add_partial_path(grouped_rel, path);
3761 : }
3762 : }
3763 :
3764 : /*
3765 : * Add a partially-grouped HashAgg Path where possible
3766 : */
3767 727 : if (can_hash && cheapest_total_path != NULL)
3768 : {
3769 : Path *path;
3770 :
3771 : /*
3772 : * Since the path originates from a non-grouped relation that is not
3773 : * aware of eager aggregation, we must ensure that it provides the
3774 : * correct input for partial aggregation.
3775 : */
3776 727 : path = (Path *) create_projection_path(root,
3777 : grouped_rel,
3778 : cheapest_total_path,
3779 727 : agg_info->agg_input);
3780 :
3781 : /*
3782 : * qual is NIL because the HAVING clause cannot be evaluated until the
3783 : * final value of the aggregate is known.
3784 : */
3785 727 : path = (Path *) create_agg_path(root,
3786 : grouped_rel,
3787 : path,
3788 727 : agg_info->target,
3789 : AGG_HASHED,
3790 : AGGSPLIT_INITIAL_SERIAL,
3791 : agg_info->group_clauses,
3792 : NIL,
3793 : &agg_costs,
3794 : dNumGroups);
3795 :
3796 727 : add_path(grouped_rel, path);
3797 : }
3798 :
3799 : /*
3800 : * Now add a partially-grouped HashAgg partial Path where possible
3801 : */
3802 727 : if (can_hash && cheapest_partial_path != NULL)
3803 : {
3804 : Path *path;
3805 :
3806 : /*
3807 : * Since the path originates from a non-grouped relation that is not
3808 : * aware of eager aggregation, we must ensure that it provides the
3809 : * correct input for partial aggregation.
3810 : */
3811 610 : path = (Path *) create_projection_path(root,
3812 : grouped_rel,
3813 : cheapest_partial_path,
3814 610 : agg_info->agg_input);
3815 :
3816 : /*
3817 : * qual is NIL because the HAVING clause cannot be evaluated until the
3818 : * final value of the aggregate is known.
3819 : */
3820 610 : path = (Path *) create_agg_path(root,
3821 : grouped_rel,
3822 : path,
3823 610 : agg_info->target,
3824 : AGG_HASHED,
3825 : AGGSPLIT_INITIAL_SERIAL,
3826 : agg_info->group_clauses,
3827 : NIL,
3828 : &agg_costs,
3829 : dNumPartialGroups);
3830 :
3831 610 : add_partial_path(grouped_rel, path);
3832 : }
3833 : }
3834 :
3835 : /*
3836 : * make_rel_from_joinlist
3837 : * Build access paths using a "joinlist" to guide the join path search.
3838 : *
3839 : * See comments for deconstruct_jointree() for definition of the joinlist
3840 : * data structure.
3841 : */
3842 : static RelOptInfo *
3843 255965 : make_rel_from_joinlist(PlannerInfo *root, List *joinlist)
3844 : {
3845 : int levels_needed;
3846 : List *initial_rels;
3847 : ListCell *jl;
3848 :
3849 : /*
3850 : * Count the number of child joinlist nodes. This is the depth of the
3851 : * dynamic-programming algorithm we must employ to consider all ways of
3852 : * joining the child nodes.
3853 : */
3854 255965 : levels_needed = list_length(joinlist);
3855 :
3856 255965 : if (levels_needed <= 0)
3857 0 : return NULL; /* nothing to do? */
3858 :
3859 : /*
3860 : * Construct a list of rels corresponding to the child joinlist nodes.
3861 : * This may contain both base rels and rels constructed according to
3862 : * sub-joinlists.
3863 : */
3864 255965 : initial_rels = NIL;
3865 623330 : foreach(jl, joinlist)
3866 : {
3867 367365 : Node *jlnode = (Node *) lfirst(jl);
3868 : RelOptInfo *thisrel;
3869 :
3870 367365 : if (IsA(jlnode, RangeTblRef))
3871 : {
3872 364677 : int varno = ((RangeTblRef *) jlnode)->rtindex;
3873 :
3874 364677 : thisrel = find_base_rel(root, varno);
3875 : }
3876 2688 : else if (IsA(jlnode, List))
3877 : {
3878 : /* Recurse to handle subproblem */
3879 2688 : thisrel = make_rel_from_joinlist(root, (List *) jlnode);
3880 : }
3881 : else
3882 : {
3883 0 : elog(ERROR, "unrecognized joinlist node type: %d",
3884 : (int) nodeTag(jlnode));
3885 : thisrel = NULL; /* keep compiler quiet */
3886 : }
3887 :
3888 367365 : initial_rels = lappend(initial_rels, thisrel);
3889 : }
3890 :
3891 255965 : if (levels_needed == 1)
3892 : {
3893 : /*
3894 : * Single joinlist node, so we're done.
3895 : */
3896 174631 : return (RelOptInfo *) linitial(initial_rels);
3897 : }
3898 : else
3899 : {
3900 : /*
3901 : * Consider the different orders in which we could join the rels,
3902 : * using a plugin, GEQO, or the regular join search code.
3903 : *
3904 : * We put the initial_rels list into a PlannerInfo field because
3905 : * has_legal_joinclause() needs to look at it (ugly :-().
3906 : */
3907 81334 : root->initial_rels = initial_rels;
3908 :
3909 81334 : if (join_search_hook)
3910 0 : return (*join_search_hook) (root, levels_needed, initial_rels);
3911 81334 : else if (enable_geqo && levels_needed >= geqo_threshold)
3912 35 : return geqo(root, levels_needed, initial_rels);
3913 : else
3914 81299 : return standard_join_search(root, levels_needed, initial_rels);
3915 : }
3916 : }
3917 :
3918 : /*
3919 : * standard_join_search
3920 : * Find possible joinpaths for a query by successively finding ways
3921 : * to join component relations into join relations.
3922 : *
3923 : * 'levels_needed' is the number of iterations needed, ie, the number of
3924 : * independent jointree items in the query. This is > 1.
3925 : *
3926 : * 'initial_rels' is a list of RelOptInfo nodes for each independent
3927 : * jointree item. These are the components to be joined together.
3928 : * Note that levels_needed == list_length(initial_rels).
3929 : *
3930 : * Returns the final level of join relations, i.e., the relation that is
3931 : * the result of joining all the original relations together.
3932 : * At least one implementation path must be provided for this relation and
3933 : * all required sub-relations.
3934 : *
3935 : * To support loadable plugins that modify planner behavior by changing the
3936 : * join searching algorithm, we provide a hook variable that lets a plugin
3937 : * replace or supplement this function. Any such hook must return the same
3938 : * final join relation as the standard code would, but it might have a
3939 : * different set of implementation paths attached, and only the sub-joinrels
3940 : * needed for these paths need have been instantiated.
3941 : *
3942 : * Note to plugin authors: the functions invoked during standard_join_search()
3943 : * modify root->join_rel_list and root->join_rel_hash. If you want to do more
3944 : * than one join-order search, you'll probably need to save and restore the
3945 : * original states of those data structures. See geqo_eval() for an example.
3946 : */
3947 : RelOptInfo *
3948 81299 : standard_join_search(PlannerInfo *root, int levels_needed, List *initial_rels)
3949 : {
3950 : int lev;
3951 : RelOptInfo *rel;
3952 :
3953 : /*
3954 : * This function cannot be invoked recursively within any one planning
3955 : * problem, so join_rel_level[] can't be in use already.
3956 : */
3957 : Assert(root->join_rel_level == NULL);
3958 :
3959 : /*
3960 : * We employ a simple "dynamic programming" algorithm: we first find all
3961 : * ways to build joins of two jointree items, then all ways to build joins
3962 : * of three items (from two-item joins and single items), then four-item
3963 : * joins, and so on until we have considered all ways to join all the
3964 : * items into one rel.
3965 : *
3966 : * root->join_rel_level[j] is a list of all the j-item rels. Initially we
3967 : * set root->join_rel_level[1] to represent all the single-jointree-item
3968 : * relations.
3969 : */
3970 81299 : root->join_rel_level = (List **) palloc0((levels_needed + 1) * sizeof(List *));
3971 :
3972 81299 : root->join_rel_level[1] = initial_rels;
3973 :
3974 192649 : for (lev = 2; lev <= levels_needed; lev++)
3975 : {
3976 : ListCell *lc;
3977 :
3978 : /*
3979 : * Determine all possible pairs of relations to be joined at this
3980 : * level, and build paths for making each one from every available
3981 : * pair of lower-level relations.
3982 : */
3983 111350 : join_search_one_level(root, lev);
3984 :
3985 : /*
3986 : * Run generate_partitionwise_join_paths() and
3987 : * generate_useful_gather_paths() for each just-processed joinrel. We
3988 : * could not do this earlier because both regular and partial paths
3989 : * can get added to a particular joinrel at multiple times within
3990 : * join_search_one_level.
3991 : *
3992 : * After that, we're done creating paths for the joinrel, so run
3993 : * set_cheapest().
3994 : *
3995 : * In addition, we also run generate_grouped_paths() for the grouped
3996 : * relation of each just-processed joinrel, and run set_cheapest() for
3997 : * the grouped relation afterwards.
3998 : */
3999 285187 : foreach(lc, root->join_rel_level[lev])
4000 : {
4001 : bool is_top_rel;
4002 :
4003 173837 : rel = (RelOptInfo *) lfirst(lc);
4004 :
4005 173837 : is_top_rel = bms_equal(rel->relids, root->all_query_rels);
4006 :
4007 : /* Create paths for partitionwise joins. */
4008 173837 : generate_partitionwise_join_paths(root, rel);
4009 :
4010 : /*
4011 : * Except for the topmost scan/join rel, consider gathering
4012 : * partial paths. We'll do the same for the topmost scan/join rel
4013 : * once we know the final targetlist (see grouping_planner's and
4014 : * its call to apply_scanjoin_target_to_paths).
4015 : */
4016 173837 : if (!is_top_rel)
4017 92947 : generate_useful_gather_paths(root, rel, false);
4018 :
4019 : /* Find and save the cheapest paths for this rel */
4020 173837 : set_cheapest(rel);
4021 :
4022 : /*
4023 : * Except for the topmost scan/join rel, consider generating
4024 : * partial aggregation paths for the grouped relation on top of
4025 : * the paths of this rel. After that, we're done creating paths
4026 : * for the grouped relation, so run set_cheapest().
4027 : */
4028 173837 : if (rel->grouped_rel != NULL && !is_top_rel)
4029 : {
4030 60 : RelOptInfo *grouped_rel = rel->grouped_rel;
4031 :
4032 : Assert(IS_GROUPED_REL(grouped_rel));
4033 :
4034 60 : generate_grouped_paths(root, grouped_rel, rel);
4035 60 : set_cheapest(grouped_rel);
4036 : }
4037 :
4038 : #ifdef OPTIMIZER_DEBUG
4039 : pprint(rel);
4040 : #endif
4041 : }
4042 : }
4043 :
4044 : /*
4045 : * We should have a single rel at the final level.
4046 : */
4047 81299 : if (root->join_rel_level[levels_needed] == NIL)
4048 0 : elog(ERROR, "failed to build any %d-way joins", levels_needed);
4049 : Assert(list_length(root->join_rel_level[levels_needed]) == 1);
4050 :
4051 81299 : rel = (RelOptInfo *) linitial(root->join_rel_level[levels_needed]);
4052 :
4053 81299 : root->join_rel_level = NULL;
4054 :
4055 81299 : return rel;
4056 : }
4057 :
4058 : /*****************************************************************************
4059 : * PUSHING QUALS DOWN INTO SUBQUERIES
4060 : *****************************************************************************/
4061 :
4062 : /*
4063 : * subquery_is_pushdown_safe - is a subquery safe for pushing down quals?
4064 : *
4065 : * subquery is the particular component query being checked. topquery
4066 : * is the top component of a set-operations tree (the same Query if no
4067 : * set-op is involved).
4068 : *
4069 : * Conditions checked here:
4070 : *
4071 : * 1. If the subquery has a LIMIT clause, we must not push down any quals,
4072 : * since that could change the set of rows returned.
4073 : *
4074 : * 2. If the subquery contains EXCEPT or EXCEPT ALL set ops we cannot push
4075 : * quals into it, because that could change the results.
4076 : *
4077 : * 3. If the subquery uses DISTINCT, we cannot push volatile quals into it.
4078 : * This is because upper-level quals should semantically be evaluated only
4079 : * once per distinct row, not once per original row, and if the qual is
4080 : * volatile then extra evaluations could change the results. (This issue
4081 : * does not apply to other forms of aggregation such as GROUP BY, because
4082 : * when those are present we push into HAVING not WHERE, so that the quals
4083 : * are still applied after aggregation.)
4084 : *
4085 : * 4. If the subquery contains window functions, we cannot push volatile quals
4086 : * into it. The issue here is a bit different from DISTINCT: a volatile qual
4087 : * might succeed for some rows of a window partition and fail for others,
4088 : * thereby changing the partition contents and thus the window functions'
4089 : * results for rows that remain.
4090 : *
4091 : * 5. If the subquery contains any set-returning functions in its targetlist,
4092 : * we cannot push volatile quals into it. That would push them below the SRFs
4093 : * and thereby change the number of times they are evaluated. Also, a
4094 : * volatile qual could succeed for some SRF output rows and fail for others,
4095 : * a behavior that cannot occur if it's evaluated before SRF expansion.
4096 : *
4097 : * 6. If the subquery has nonempty grouping sets, we cannot push down any
4098 : * quals. The concern here is that a qual referencing a "constant" grouping
4099 : * column could get constant-folded, which would be improper because the value
4100 : * is potentially nullable by grouping-set expansion. This restriction could
4101 : * be removed if we had a parsetree representation that shows that such
4102 : * grouping columns are not really constant. (There are other ideas that
4103 : * could be used to relax this restriction, but that's the approach most
4104 : * likely to get taken in the future. Note that there's not much to be gained
4105 : * so long as subquery_planner can't move HAVING clauses to WHERE within such
4106 : * a subquery.)
4107 : *
4108 : * In addition, we make several checks on the subquery's output columns to see
4109 : * if it is safe to reference them in pushed-down quals. If output column k
4110 : * is found to be unsafe to reference, we set the reason for that inside
4111 : * safetyInfo->unsafeFlags[k], but we don't reject the subquery overall since
4112 : * column k might not be referenced by some/all quals. The unsafeFlags[]
4113 : * array will be consulted later by qual_is_pushdown_safe(). It's better to
4114 : * do it this way than to make the checks directly in qual_is_pushdown_safe(),
4115 : * because when the subquery involves set operations we have to check the
4116 : * output expressions in each arm of the set op.
4117 : *
4118 : * Note: pushing quals into a DISTINCT subquery is theoretically dubious:
4119 : * we're effectively assuming that the quals cannot distinguish values that
4120 : * the DISTINCT's equality operator sees as equal, yet there are many
4121 : * counterexamples to that assumption. However use of such a qual with a
4122 : * DISTINCT subquery would be unsafe anyway, since there's no guarantee which
4123 : * "equal" value will be chosen as the output value by the DISTINCT operation.
4124 : * So we don't worry too much about that. Another objection is that if the
4125 : * qual is expensive to evaluate, running it for each original row might cost
4126 : * more than we save by eliminating rows before the DISTINCT step. But it
4127 : * would be very hard to estimate that at this stage, and in practice pushdown
4128 : * seldom seems to make things worse, so we ignore that problem too.
4129 : *
4130 : * Note: likewise, pushing quals into a subquery with window functions is a
4131 : * bit dubious: the quals might remove some rows of a window partition while
4132 : * leaving others, causing changes in the window functions' results for the
4133 : * surviving rows. We insist that such a qual reference only partitioning
4134 : * columns, but again that only protects us if the qual does not distinguish
4135 : * values that the partitioning equality operator sees as equal. The risks
4136 : * here are perhaps larger than for DISTINCT, since no de-duplication of rows
4137 : * occurs and thus there is no theoretical problem with such a qual. But
4138 : * we'll do this anyway because the potential performance benefits are very
4139 : * large, and we've seen no field complaints about the longstanding comparable
4140 : * behavior with DISTINCT.
4141 : */
4142 : static bool
4143 2375 : subquery_is_pushdown_safe(Query *subquery, Query *topquery,
4144 : pushdown_safety_info *safetyInfo)
4145 : {
4146 : SetOperationStmt *topop;
4147 :
4148 : /* Check point 1 */
4149 2375 : if (subquery->limitOffset != NULL || subquery->limitCount != NULL)
4150 111 : return false;
4151 :
4152 : /* Check point 6 */
4153 2264 : if (subquery->groupClause && subquery->groupingSets)
4154 10 : return false;
4155 :
4156 : /* Check points 3, 4, and 5 */
4157 2254 : if (subquery->distinctClause ||
4158 2184 : subquery->hasWindowFuncs ||
4159 1963 : subquery->hasTargetSRFs)
4160 706 : safetyInfo->unsafeVolatile = true;
4161 :
4162 : /*
4163 : * If we're at a leaf query, check for unsafe expressions in its target
4164 : * list, and mark any reasons why they're unsafe in unsafeFlags[].
4165 : * (Non-leaf nodes in setop trees have only simple Vars in their tlists,
4166 : * so no need to check them.)
4167 : */
4168 2254 : if (subquery->setOperations == NULL)
4169 2148 : check_output_expressions(subquery, safetyInfo);
4170 :
4171 : /* Are we at top level, or looking at a setop component? */
4172 2254 : if (subquery == topquery)
4173 : {
4174 : /* Top level, so check any component queries */
4175 2042 : if (subquery->setOperations != NULL)
4176 106 : if (!recurse_pushdown_safe(subquery->setOperations, topquery,
4177 : safetyInfo))
4178 0 : return false;
4179 : }
4180 : else
4181 : {
4182 : /* Setop component must not have more components (too weird) */
4183 212 : if (subquery->setOperations != NULL)
4184 0 : return false;
4185 : /* Check whether setop component output types match top level */
4186 212 : topop = castNode(SetOperationStmt, topquery->setOperations);
4187 : Assert(topop);
4188 212 : compare_tlist_datatypes(subquery->targetList,
4189 : topop->colTypes,
4190 : safetyInfo);
4191 : }
4192 2254 : return true;
4193 : }
4194 :
4195 : /*
4196 : * Helper routine to recurse through setOperations tree
4197 : */
4198 : static bool
4199 318 : recurse_pushdown_safe(Node *setOp, Query *topquery,
4200 : pushdown_safety_info *safetyInfo)
4201 : {
4202 318 : if (IsA(setOp, RangeTblRef))
4203 : {
4204 212 : RangeTblRef *rtr = (RangeTblRef *) setOp;
4205 212 : RangeTblEntry *rte = rt_fetch(rtr->rtindex, topquery->rtable);
4206 212 : Query *subquery = rte->subquery;
4207 :
4208 : Assert(subquery != NULL);
4209 212 : return subquery_is_pushdown_safe(subquery, topquery, safetyInfo);
4210 : }
4211 106 : else if (IsA(setOp, SetOperationStmt))
4212 : {
4213 106 : SetOperationStmt *op = (SetOperationStmt *) setOp;
4214 :
4215 : /* EXCEPT is no good (point 2 for subquery_is_pushdown_safe) */
4216 106 : if (op->op == SETOP_EXCEPT)
4217 0 : return false;
4218 : /* Else recurse */
4219 106 : if (!recurse_pushdown_safe(op->larg, topquery, safetyInfo))
4220 0 : return false;
4221 106 : if (!recurse_pushdown_safe(op->rarg, topquery, safetyInfo))
4222 0 : return false;
4223 : }
4224 : else
4225 : {
4226 0 : elog(ERROR, "unrecognized node type: %d",
4227 : (int) nodeTag(setOp));
4228 : }
4229 106 : return true;
4230 : }
4231 :
4232 : /*
4233 : * check_output_expressions - check subquery's output expressions for safety
4234 : *
4235 : * There are several cases in which it's unsafe to push down an upper-level
4236 : * qual if it references a particular output column of a subquery. We check
4237 : * each output column of the subquery and set flags in unsafeFlags[k] when we
4238 : * see that column is unsafe for a pushed-down qual to reference. The
4239 : * conditions checked here are:
4240 : *
4241 : * 1. We must not push down any quals that refer to subselect outputs that
4242 : * return sets, else we'd introduce functions-returning-sets into the
4243 : * subquery's WHERE/HAVING quals.
4244 : *
4245 : * 2. We must not push down any quals that refer to subselect outputs that
4246 : * contain volatile functions, for fear of introducing strange results due
4247 : * to multiple evaluation of a volatile function.
4248 : *
4249 : * 3. If the subquery uses DISTINCT ON, we must not push down any quals that
4250 : * refer to non-DISTINCT output columns, because that could change the set
4251 : * of rows returned. (This condition is vacuous for DISTINCT, because then
4252 : * there are no non-DISTINCT output columns, so we needn't check. Note that
4253 : * subquery_is_pushdown_safe already reported that we can't use volatile
4254 : * quals if there's DISTINCT or DISTINCT ON.)
4255 : *
4256 : * 4. If the subquery has any window functions, we must not push down quals
4257 : * that reference any output columns that are not listed in all the subquery's
4258 : * window PARTITION BY clauses. We can push down quals that use only
4259 : * partitioning columns because they should succeed or fail identically for
4260 : * every row of any one window partition, and totally excluding some
4261 : * partitions will not change a window function's results for remaining
4262 : * partitions. (Again, this also requires nonvolatile quals, but
4263 : * subquery_is_pushdown_safe handles that.). Subquery columns marked as
4264 : * unsafe for this reason can still have WindowClause run conditions pushed
4265 : * down.
4266 : */
4267 : static void
4268 2148 : check_output_expressions(Query *subquery, pushdown_safety_info *safetyInfo)
4269 : {
4270 2148 : List *flattened_targetList = subquery->targetList;
4271 : ListCell *lc;
4272 :
4273 : /*
4274 : * We must be careful with grouping Vars and join alias Vars in the
4275 : * subquery's outputs, as they hide the underlying expressions.
4276 : *
4277 : * We need to expand grouping Vars to their underlying expressions (the
4278 : * grouping clauses) because the grouping expressions themselves might be
4279 : * volatile or set-returning. However, we do not need to expand join
4280 : * alias Vars, as their underlying structure does not introduce volatile
4281 : * or set-returning functions at the current level.
4282 : *
4283 : * In neither case do we need to recursively examine the Vars contained in
4284 : * these underlying expressions. Even if they reference outputs from
4285 : * lower-level subqueries (at any depth), those references are guaranteed
4286 : * not to expand to volatile or set-returning functions, because
4287 : * subqueries containing such functions in their targetlists are never
4288 : * pulled up.
4289 : */
4290 2148 : if (subquery->hasGroupRTE)
4291 : {
4292 : /*
4293 : * We can safely pass NULL for the root here. This function uses the
4294 : * expanded expressions solely to check for volatile or set-returning
4295 : * functions, which is independent of the Vars' nullingrels.
4296 : */
4297 : flattened_targetList = (List *)
4298 259 : flatten_group_exprs(NULL, subquery, (Node *) subquery->targetList);
4299 : }
4300 :
4301 25331 : foreach(lc, flattened_targetList)
4302 : {
4303 23183 : TargetEntry *tle = (TargetEntry *) lfirst(lc);
4304 :
4305 23183 : if (tle->resjunk)
4306 109 : continue; /* ignore resjunk columns */
4307 :
4308 : /* Functions returning sets are unsafe (point 1) */
4309 23074 : if (subquery->hasTargetSRFs &&
4310 1200 : (safetyInfo->unsafeFlags[tle->resno] &
4311 1200 : UNSAFE_HAS_SET_FUNC) == 0 &&
4312 1200 : expression_returns_set((Node *) tle->expr))
4313 : {
4314 848 : safetyInfo->unsafeFlags[tle->resno] |= UNSAFE_HAS_SET_FUNC;
4315 848 : continue;
4316 : }
4317 :
4318 : /* Volatile functions are unsafe (point 2) */
4319 22226 : if ((safetyInfo->unsafeFlags[tle->resno] &
4320 22216 : UNSAFE_HAS_VOLATILE_FUNC) == 0 &&
4321 22216 : contain_volatile_functions((Node *) tle->expr))
4322 : {
4323 75 : safetyInfo->unsafeFlags[tle->resno] |= UNSAFE_HAS_VOLATILE_FUNC;
4324 75 : continue;
4325 : }
4326 :
4327 : /* If subquery uses DISTINCT ON, check point 3 */
4328 22151 : if (subquery->hasDistinctOn &&
4329 0 : (safetyInfo->unsafeFlags[tle->resno] &
4330 0 : UNSAFE_NOTIN_DISTINCTON_CLAUSE) == 0 &&
4331 0 : !targetIsInSortList(tle, InvalidOid, subquery->distinctClause))
4332 : {
4333 : /* non-DISTINCT column, so mark it unsafe */
4334 0 : safetyInfo->unsafeFlags[tle->resno] |= UNSAFE_NOTIN_DISTINCTON_CLAUSE;
4335 0 : continue;
4336 : }
4337 :
4338 : /* If subquery uses window functions, check point 4 */
4339 22151 : if (subquery->hasWindowFuncs &&
4340 897 : (safetyInfo->unsafeFlags[tle->resno] &
4341 1722 : UNSAFE_NOTIN_DISTINCTON_CLAUSE) == 0 &&
4342 897 : !targetIsInAllPartitionLists(tle, subquery))
4343 : {
4344 : /* not present in all PARTITION BY clauses, so mark it unsafe */
4345 825 : safetyInfo->unsafeFlags[tle->resno] |= UNSAFE_NOTIN_PARTITIONBY_CLAUSE;
4346 825 : continue;
4347 : }
4348 : }
4349 2148 : }
4350 :
4351 : /*
4352 : * For subqueries using UNION/UNION ALL/INTERSECT/INTERSECT ALL, we can
4353 : * push quals into each component query, but the quals can only reference
4354 : * subquery columns that suffer no type coercions in the set operation.
4355 : * Otherwise there are possible semantic gotchas. So, we check the
4356 : * component queries to see if any of them have output types different from
4357 : * the top-level setop outputs. We set the UNSAFE_TYPE_MISMATCH bit in
4358 : * unsafeFlags[k] if column k has different type in any component.
4359 : *
4360 : * We don't have to care about typmods here: the only allowed difference
4361 : * between set-op input and output typmods is input is a specific typmod
4362 : * and output is -1, and that does not require a coercion.
4363 : *
4364 : * tlist is a subquery tlist.
4365 : * colTypes is an OID list of the top-level setop's output column types.
4366 : * safetyInfo is the pushdown_safety_info to set unsafeFlags[] for.
4367 : */
4368 : static void
4369 212 : compare_tlist_datatypes(List *tlist, List *colTypes,
4370 : pushdown_safety_info *safetyInfo)
4371 : {
4372 : ListCell *l;
4373 212 : ListCell *colType = list_head(colTypes);
4374 :
4375 660 : foreach(l, tlist)
4376 : {
4377 448 : TargetEntry *tle = (TargetEntry *) lfirst(l);
4378 :
4379 448 : if (tle->resjunk)
4380 0 : continue; /* ignore resjunk columns */
4381 448 : if (colType == NULL)
4382 0 : elog(ERROR, "wrong number of tlist entries");
4383 448 : if (exprType((Node *) tle->expr) != lfirst_oid(colType))
4384 64 : safetyInfo->unsafeFlags[tle->resno] |= UNSAFE_TYPE_MISMATCH;
4385 448 : colType = lnext(colTypes, colType);
4386 : }
4387 212 : if (colType != NULL)
4388 0 : elog(ERROR, "wrong number of tlist entries");
4389 212 : }
4390 :
4391 : /*
4392 : * targetIsInAllPartitionLists
4393 : * True if the TargetEntry is listed in the PARTITION BY clause
4394 : * of every window defined in the query.
4395 : *
4396 : * It would be safe to ignore windows not actually used by any window
4397 : * function, but it's not easy to get that info at this stage; and it's
4398 : * unlikely to be useful to spend any extra cycles getting it, since
4399 : * unreferenced window definitions are probably infrequent in practice.
4400 : */
4401 : static bool
4402 897 : targetIsInAllPartitionLists(TargetEntry *tle, Query *query)
4403 : {
4404 : ListCell *lc;
4405 :
4406 989 : foreach(lc, query->windowClause)
4407 : {
4408 917 : WindowClause *wc = (WindowClause *) lfirst(lc);
4409 :
4410 917 : if (!targetIsInSortList(tle, InvalidOid, wc->partitionClause))
4411 825 : return false;
4412 : }
4413 72 : return true;
4414 : }
4415 :
4416 : /*
4417 : * qual_is_pushdown_safe - is a particular rinfo safe to push down?
4418 : *
4419 : * rinfo is a restriction clause applying to the given subquery (whose RTE
4420 : * has index rti in the parent query).
4421 : *
4422 : * Conditions checked here:
4423 : *
4424 : * 1. rinfo's clause must not contain any SubPlans (mainly because it's
4425 : * unclear that it will work correctly: SubLinks will already have been
4426 : * transformed into SubPlans in the qual, but not in the subquery). Note that
4427 : * SubLinks that transform to initplans are safe, and will be accepted here
4428 : * because what we'll see in the qual is just a Param referencing the initplan
4429 : * output.
4430 : *
4431 : * 2. If unsafeVolatile is set, rinfo's clause must not contain any volatile
4432 : * functions.
4433 : *
4434 : * 3. If unsafeLeaky is set, rinfo's clause must not contain any leaky
4435 : * functions that are passed Var nodes, and therefore might reveal values from
4436 : * the subquery as side effects.
4437 : *
4438 : * 4. rinfo's clause must not refer to the whole-row output of the subquery
4439 : * (since there is no easy way to name that within the subquery itself).
4440 : *
4441 : * 5. rinfo's clause must not refer to any subquery output columns that were
4442 : * found to be unsafe to reference by subquery_is_pushdown_safe().
4443 : */
4444 : static pushdown_safe_type
4445 3514 : qual_is_pushdown_safe(Query *subquery, Index rti, RestrictInfo *rinfo,
4446 : pushdown_safety_info *safetyInfo)
4447 : {
4448 3514 : pushdown_safe_type safe = PUSHDOWN_SAFE;
4449 3514 : Node *qual = (Node *) rinfo->clause;
4450 : List *vars;
4451 : ListCell *vl;
4452 :
4453 : /* Refuse subselects (point 1) */
4454 3514 : if (contain_subplans(qual))
4455 55 : return PUSHDOWN_UNSAFE;
4456 :
4457 : /* Refuse volatile quals if we found they'd be unsafe (point 2) */
4458 4272 : if (safetyInfo->unsafeVolatile &&
4459 813 : contain_volatile_functions((Node *) rinfo))
4460 15 : return PUSHDOWN_UNSAFE;
4461 :
4462 : /* Refuse leaky quals if told to (point 3) */
4463 5361 : if (safetyInfo->unsafeLeaky &&
4464 1917 : contain_leaked_vars(qual))
4465 135 : return PUSHDOWN_UNSAFE;
4466 :
4467 : /*
4468 : * Examine all Vars used in clause. Since it's a restriction clause, all
4469 : * such Vars must refer to subselect output columns ... unless this is
4470 : * part of a LATERAL subquery, in which case there could be lateral
4471 : * references.
4472 : *
4473 : * By omitting the relevant flags, this also gives us a cheap sanity check
4474 : * that no aggregates or window functions appear in the qual. Those would
4475 : * be unsafe to push down, but at least for the moment we could never see
4476 : * any in a qual anyhow.
4477 : */
4478 3309 : vars = pull_var_clause(qual, PVC_INCLUDE_PLACEHOLDERS);
4479 6273 : foreach(vl, vars)
4480 : {
4481 3399 : Var *var = (Var *) lfirst(vl);
4482 :
4483 : /*
4484 : * XXX Punt if we find any PlaceHolderVars in the restriction clause.
4485 : * It's not clear whether a PHV could safely be pushed down, and even
4486 : * less clear whether such a situation could arise in any cases of
4487 : * practical interest anyway. So for the moment, just refuse to push
4488 : * down.
4489 : */
4490 3399 : if (!IsA(var, Var))
4491 : {
4492 0 : safe = PUSHDOWN_UNSAFE;
4493 0 : break;
4494 : }
4495 :
4496 : /*
4497 : * Punt if we find any lateral references. It would be safe to push
4498 : * these down, but we'd have to convert them into outer references,
4499 : * which subquery_push_qual lacks the infrastructure to do. The case
4500 : * arises so seldom that it doesn't seem worth working hard on.
4501 : */
4502 3399 : if (var->varno != rti)
4503 : {
4504 10 : safe = PUSHDOWN_UNSAFE;
4505 10 : break;
4506 : }
4507 :
4508 : /* Subqueries have no system columns */
4509 : Assert(var->varattno >= 0);
4510 :
4511 : /* Check point 4 */
4512 3389 : if (var->varattno == 0)
4513 : {
4514 0 : safe = PUSHDOWN_UNSAFE;
4515 0 : break;
4516 : }
4517 :
4518 : /* Check point 5 */
4519 3389 : if (safetyInfo->unsafeFlags[var->varattno] != 0)
4520 : {
4521 700 : if (safetyInfo->unsafeFlags[var->varattno] &
4522 : (UNSAFE_HAS_VOLATILE_FUNC | UNSAFE_HAS_SET_FUNC |
4523 : UNSAFE_NOTIN_DISTINCTON_CLAUSE | UNSAFE_TYPE_MISMATCH))
4524 : {
4525 425 : safe = PUSHDOWN_UNSAFE;
4526 425 : break;
4527 : }
4528 : else
4529 : {
4530 : /* UNSAFE_NOTIN_PARTITIONBY_CLAUSE is ok for run conditions */
4531 275 : safe = PUSHDOWN_WINDOWCLAUSE_RUNCOND;
4532 : /* don't break, we might find another Var that's unsafe */
4533 : }
4534 : }
4535 : }
4536 :
4537 3309 : list_free(vars);
4538 :
4539 3309 : return safe;
4540 : }
4541 :
4542 : /*
4543 : * subquery_push_qual - push down a qual that we have determined is safe
4544 : */
4545 : static void
4546 2836 : subquery_push_qual(Query *subquery, RangeTblEntry *rte, Index rti, Node *qual)
4547 : {
4548 2836 : if (subquery->setOperations != NULL)
4549 : {
4550 : /* Recurse to push it separately to each component query */
4551 86 : recurse_push_qual(subquery->setOperations, subquery,
4552 : rte, rti, qual);
4553 : }
4554 : else
4555 : {
4556 : /*
4557 : * We need to replace Vars in the qual (which must refer to outputs of
4558 : * the subquery) with copies of the subquery's targetlist expressions.
4559 : * Note that at this point, any uplevel Vars in the qual should have
4560 : * been replaced with Params, so they need no work.
4561 : *
4562 : * This step also ensures that when we are pushing into a setop tree,
4563 : * each component query gets its own copy of the qual.
4564 : */
4565 2750 : qual = ReplaceVarsFromTargetList(qual, rti, 0, rte,
4566 : subquery->targetList,
4567 : subquery->resultRelation,
4568 : REPLACEVARS_REPORT_ERROR, 0,
4569 : &subquery->hasSubLinks);
4570 :
4571 : /*
4572 : * Now attach the qual to the proper place: normally WHERE, but if the
4573 : * subquery uses grouping or aggregation, put it in HAVING (since the
4574 : * qual really refers to the group-result rows).
4575 : */
4576 2750 : if (subquery->hasAggs || subquery->groupClause || subquery->groupingSets || subquery->havingQual)
4577 333 : subquery->havingQual = make_and_qual(subquery->havingQual, qual);
4578 : else
4579 2417 : subquery->jointree->quals =
4580 2417 : make_and_qual(subquery->jointree->quals, qual);
4581 :
4582 : /*
4583 : * We need not change the subquery's hasAggs or hasSubLinks flags,
4584 : * since we can't be pushing down any aggregates that weren't there
4585 : * before, and we don't push down subselects at all.
4586 : */
4587 : }
4588 2836 : }
4589 :
4590 : /*
4591 : * Helper routine to recurse through setOperations tree
4592 : */
4593 : static void
4594 258 : recurse_push_qual(Node *setOp, Query *topquery,
4595 : RangeTblEntry *rte, Index rti, Node *qual)
4596 : {
4597 258 : if (IsA(setOp, RangeTblRef))
4598 : {
4599 172 : RangeTblRef *rtr = (RangeTblRef *) setOp;
4600 172 : RangeTblEntry *subrte = rt_fetch(rtr->rtindex, topquery->rtable);
4601 172 : Query *subquery = subrte->subquery;
4602 :
4603 : Assert(subquery != NULL);
4604 172 : subquery_push_qual(subquery, rte, rti, qual);
4605 : }
4606 86 : else if (IsA(setOp, SetOperationStmt))
4607 : {
4608 86 : SetOperationStmt *op = (SetOperationStmt *) setOp;
4609 :
4610 86 : recurse_push_qual(op->larg, topquery, rte, rti, qual);
4611 86 : recurse_push_qual(op->rarg, topquery, rte, rti, qual);
4612 : }
4613 : else
4614 : {
4615 0 : elog(ERROR, "unrecognized node type: %d",
4616 : (int) nodeTag(setOp));
4617 : }
4618 258 : }
4619 :
4620 : /*****************************************************************************
4621 : * SIMPLIFYING SUBQUERY TARGETLISTS
4622 : *****************************************************************************/
4623 :
4624 : /*
4625 : * remove_unused_subquery_outputs
4626 : * Remove subquery targetlist items we don't need
4627 : *
4628 : * It's possible, even likely, that the upper query does not read all the
4629 : * output columns of the subquery. We can remove any such outputs that are
4630 : * not needed by the subquery itself (e.g., as sort/group columns) and do not
4631 : * affect semantics otherwise (e.g., volatile functions can't be removed).
4632 : * This is useful not only because we might be able to remove expensive-to-
4633 : * compute expressions, but because deletion of output columns might allow
4634 : * optimizations such as join removal to occur within the subquery.
4635 : *
4636 : * extra_used_attrs can be passed as non-NULL to mark any columns (offset by
4637 : * FirstLowInvalidHeapAttributeNumber) that we should not remove. This
4638 : * parameter is modified by the function, so callers must make a copy if they
4639 : * need to use the passed in Bitmapset after calling this function.
4640 : *
4641 : * To avoid affecting column numbering in the targetlist, we don't physically
4642 : * remove unused tlist entries, but rather replace their expressions with NULL
4643 : * constants. This is implemented by modifying subquery->targetList.
4644 : */
4645 : static void
4646 17357 : remove_unused_subquery_outputs(Query *subquery, RelOptInfo *rel,
4647 : Bitmapset *extra_used_attrs)
4648 : {
4649 : Bitmapset *attrs_used;
4650 : ListCell *lc;
4651 :
4652 : /*
4653 : * Just point directly to extra_used_attrs. No need to bms_copy as none of
4654 : * the current callers use the Bitmapset after calling this function.
4655 : */
4656 17357 : attrs_used = extra_used_attrs;
4657 :
4658 : /*
4659 : * Do nothing if subquery has UNION/INTERSECT/EXCEPT: in principle we
4660 : * could update all the child SELECTs' tlists, but it seems not worth the
4661 : * trouble presently.
4662 : */
4663 17357 : if (subquery->setOperations)
4664 1365 : return;
4665 :
4666 : /*
4667 : * If subquery has regular DISTINCT (not DISTINCT ON), we're wasting our
4668 : * time: all its output columns must be used in the distinctClause.
4669 : */
4670 16765 : if (subquery->distinctClause && !subquery->hasDistinctOn)
4671 527 : return;
4672 :
4673 : /*
4674 : * Collect a bitmap of all the output column numbers used by the upper
4675 : * query.
4676 : *
4677 : * Add all the attributes needed for joins or final output. Note: we must
4678 : * look at rel's targetlist, not the attr_needed data, because attr_needed
4679 : * isn't computed for inheritance child rels, cf set_append_rel_size().
4680 : * (XXX might be worth changing that sometime.)
4681 : */
4682 16238 : pull_varattnos((Node *) rel->reltarget->exprs, rel->relid, &attrs_used);
4683 :
4684 : /* Add all the attributes used by un-pushed-down restriction clauses. */
4685 17111 : foreach(lc, rel->baserestrictinfo)
4686 : {
4687 873 : RestrictInfo *rinfo = (RestrictInfo *) lfirst(lc);
4688 :
4689 873 : pull_varattnos((Node *) rinfo->clause, rel->relid, &attrs_used);
4690 : }
4691 :
4692 : /*
4693 : * If there's a whole-row reference to the subquery, we can't remove
4694 : * anything.
4695 : */
4696 16238 : if (bms_is_member(0 - FirstLowInvalidHeapAttributeNumber, attrs_used))
4697 246 : return;
4698 :
4699 : /*
4700 : * Run through the tlist and zap entries we don't need. It's okay to
4701 : * modify the tlist items in-place because set_subquery_pathlist made a
4702 : * copy of the subquery.
4703 : */
4704 89565 : foreach(lc, subquery->targetList)
4705 : {
4706 73573 : TargetEntry *tle = (TargetEntry *) lfirst(lc);
4707 73573 : Node *texpr = (Node *) tle->expr;
4708 :
4709 : /*
4710 : * If it has a sortgroupref number, it's used in some sort/group
4711 : * clause so we'd better not remove it. Also, don't remove any
4712 : * resjunk columns, since their reason for being has nothing to do
4713 : * with anybody reading the subquery's output. (It's likely that
4714 : * resjunk columns in a sub-SELECT would always have ressortgroupref
4715 : * set, but even if they don't, it seems imprudent to remove them.)
4716 : */
4717 73573 : if (tle->ressortgroupref || tle->resjunk)
4718 2481 : continue;
4719 :
4720 : /*
4721 : * If it's used by the upper query, we can't remove it.
4722 : */
4723 71092 : if (bms_is_member(tle->resno - FirstLowInvalidHeapAttributeNumber,
4724 : attrs_used))
4725 40991 : continue;
4726 :
4727 : /*
4728 : * If it contains a set-returning function, we can't remove it since
4729 : * that could change the number of rows returned by the subquery.
4730 : */
4731 30805 : if (subquery->hasTargetSRFs &&
4732 704 : expression_returns_set(texpr))
4733 474 : continue;
4734 :
4735 : /*
4736 : * If it contains volatile functions, we daren't remove it for fear
4737 : * that the user is expecting their side-effects to happen.
4738 : */
4739 29627 : if (contain_volatile_functions(texpr))
4740 26 : continue;
4741 :
4742 : /*
4743 : * OK, we don't need it. Replace the expression with a NULL constant.
4744 : * Preserve the exposed type of the expression, in case something
4745 : * looks at the rowtype of the subquery's result.
4746 : */
4747 29601 : tle->expr = (Expr *) makeNullConst(exprType(texpr),
4748 : exprTypmod(texpr),
4749 : exprCollation(texpr));
4750 : }
4751 : }
4752 :
4753 : /*
4754 : * create_partial_bitmap_paths
4755 : * Build partial bitmap heap path for the relation
4756 : */
4757 : void
4758 111174 : create_partial_bitmap_paths(PlannerInfo *root, RelOptInfo *rel,
4759 : Path *bitmapqual)
4760 : {
4761 : int parallel_workers;
4762 : double pages_fetched;
4763 :
4764 : /* Compute heap pages for bitmap heap scan */
4765 111174 : pages_fetched = compute_bitmap_pages(root, rel, bitmapqual, 1.0,
4766 : NULL, NULL);
4767 :
4768 111174 : parallel_workers = compute_parallel_worker(rel, pages_fetched, -1,
4769 : max_parallel_workers_per_gather);
4770 :
4771 111174 : if (parallel_workers <= 0)
4772 107933 : return;
4773 :
4774 3241 : add_partial_path(rel, (Path *) create_bitmap_heap_path(root, rel,
4775 : bitmapqual, rel->lateral_relids, 1.0, parallel_workers));
4776 : }
4777 :
4778 : /*
4779 : * Compute the number of parallel workers that should be used to scan a
4780 : * relation. We compute the parallel workers based on the size of the heap to
4781 : * be scanned and the size of the index to be scanned, then choose a minimum
4782 : * of those.
4783 : *
4784 : * "heap_pages" is the number of pages from the table that we expect to scan, or
4785 : * -1 if we don't expect to scan any.
4786 : *
4787 : * "index_pages" is the number of pages from the index that we expect to scan, or
4788 : * -1 if we don't expect to scan any.
4789 : *
4790 : * "max_workers" is caller's limit on the number of workers. This typically
4791 : * comes from a GUC.
4792 : */
4793 : int
4794 602921 : compute_parallel_worker(RelOptInfo *rel, double heap_pages, double index_pages,
4795 : int max_workers)
4796 : {
4797 602921 : int parallel_workers = 0;
4798 :
4799 : /*
4800 : * If the user has set the parallel_workers reloption, use that; otherwise
4801 : * select a default number of workers.
4802 : */
4803 602921 : if (rel->rel_parallel_workers != -1)
4804 2740 : parallel_workers = rel->rel_parallel_workers;
4805 : else
4806 : {
4807 : /*
4808 : * If the number of pages being scanned is insufficient to justify a
4809 : * parallel scan, just return zero ... unless it's an inheritance
4810 : * child. In that case, we want to generate a parallel path here
4811 : * anyway. It might not be worthwhile just for this relation, but
4812 : * when combined with all of its inheritance siblings it may well pay
4813 : * off.
4814 : */
4815 600181 : if (rel->reloptkind == RELOPT_BASEREL &&
4816 568162 : ((heap_pages >= 0 && heap_pages < min_parallel_table_scan_size) ||
4817 18588 : (index_pages >= 0 && index_pages < min_parallel_index_scan_size)))
4818 567407 : return 0;
4819 :
4820 32774 : if (heap_pages >= 0)
4821 : {
4822 : int heap_parallel_threshold;
4823 31216 : int heap_parallel_workers = 1;
4824 :
4825 : /*
4826 : * Select the number of workers based on the log of the size of
4827 : * the relation. This probably needs to be a good deal more
4828 : * sophisticated, but we need something here for now. Note that
4829 : * the upper limit of the min_parallel_table_scan_size GUC is
4830 : * chosen to prevent overflow here.
4831 : */
4832 31216 : heap_parallel_threshold = Max(min_parallel_table_scan_size, 1);
4833 35624 : while (heap_pages >= (BlockNumber) (heap_parallel_threshold * 3))
4834 : {
4835 4408 : heap_parallel_workers++;
4836 4408 : heap_parallel_threshold *= 3;
4837 4408 : if (heap_parallel_threshold > INT_MAX / 3)
4838 0 : break; /* avoid overflow */
4839 : }
4840 :
4841 31216 : parallel_workers = heap_parallel_workers;
4842 : }
4843 :
4844 32774 : if (index_pages >= 0)
4845 : {
4846 7410 : int index_parallel_workers = 1;
4847 : int index_parallel_threshold;
4848 :
4849 : /* same calculation as for heap_pages above */
4850 7410 : index_parallel_threshold = Max(min_parallel_index_scan_size, 1);
4851 7640 : while (index_pages >= (BlockNumber) (index_parallel_threshold * 3))
4852 : {
4853 230 : index_parallel_workers++;
4854 230 : index_parallel_threshold *= 3;
4855 230 : if (index_parallel_threshold > INT_MAX / 3)
4856 0 : break; /* avoid overflow */
4857 : }
4858 :
4859 7410 : if (parallel_workers > 0)
4860 5852 : parallel_workers = Min(parallel_workers, index_parallel_workers);
4861 : else
4862 1558 : parallel_workers = index_parallel_workers;
4863 : }
4864 : }
4865 :
4866 : /* In no case use more than caller supplied maximum number of workers */
4867 35514 : parallel_workers = Min(parallel_workers, max_workers);
4868 :
4869 35514 : return parallel_workers;
4870 : }
4871 :
4872 : /*
4873 : * generate_partitionwise_join_paths
4874 : * Create paths representing partitionwise join for given partitioned
4875 : * join relation.
4876 : *
4877 : * This must not be called until after we are done adding paths for all
4878 : * child-joins. Otherwise, add_path might delete a path to which some path
4879 : * generated here has a reference.
4880 : */
4881 : void
4882 194692 : generate_partitionwise_join_paths(PlannerInfo *root, RelOptInfo *rel)
4883 : {
4884 194692 : List *live_children = NIL;
4885 : int cnt_parts;
4886 : int num_parts;
4887 : RelOptInfo **part_rels;
4888 :
4889 : /* Handle only join relations here. */
4890 194692 : if (!IS_JOIN_REL(rel))
4891 0 : return;
4892 :
4893 : /* We've nothing to do if the relation is not partitioned. */
4894 194692 : if (!IS_PARTITIONED_REL(rel))
4895 188725 : return;
4896 :
4897 : /* The relation should have consider_partitionwise_join set. */
4898 : Assert(rel->consider_partitionwise_join);
4899 :
4900 : /* Guard against stack overflow due to overly deep partition hierarchy. */
4901 5967 : check_stack_depth();
4902 :
4903 5967 : num_parts = rel->nparts;
4904 5967 : part_rels = rel->part_rels;
4905 :
4906 : /* Collect non-dummy child-joins. */
4907 21264 : for (cnt_parts = 0; cnt_parts < num_parts; cnt_parts++)
4908 : {
4909 15297 : RelOptInfo *child_rel = part_rels[cnt_parts];
4910 :
4911 : /* If it's been pruned entirely, it's certainly dummy. */
4912 15297 : if (child_rel == NULL)
4913 52 : continue;
4914 :
4915 : /* Make partitionwise join paths for this partitioned child-join. */
4916 15245 : generate_partitionwise_join_paths(root, child_rel);
4917 :
4918 : /* If we failed to make any path for this child, we must give up. */
4919 15245 : if (child_rel->pathlist == NIL)
4920 : {
4921 : /*
4922 : * Mark the parent joinrel as unpartitioned so that later
4923 : * functions treat it correctly.
4924 : */
4925 0 : rel->nparts = 0;
4926 0 : return;
4927 : }
4928 :
4929 : /* Else, identify the cheapest path for it. */
4930 15245 : set_cheapest(child_rel);
4931 :
4932 : /* Dummy children need not be scanned, so ignore those. */
4933 15245 : if (IS_DUMMY_REL(child_rel))
4934 0 : continue;
4935 :
4936 : /*
4937 : * Except for the topmost scan/join rel, consider generating partial
4938 : * aggregation paths for the grouped relation on top of the paths of
4939 : * this partitioned child-join. After that, we're done creating paths
4940 : * for the grouped relation, so run set_cheapest().
4941 : */
4942 15245 : if (child_rel->grouped_rel != NULL &&
4943 10730 : !bms_equal(IS_OTHER_REL(rel) ?
4944 : rel->top_parent_relids : rel->relids,
4945 10730 : root->all_query_rels))
4946 : {
4947 200 : RelOptInfo *grouped_rel = child_rel->grouped_rel;
4948 :
4949 : Assert(IS_GROUPED_REL(grouped_rel));
4950 :
4951 200 : generate_grouped_paths(root, grouped_rel, child_rel);
4952 200 : set_cheapest(grouped_rel);
4953 : }
4954 :
4955 : #ifdef OPTIMIZER_DEBUG
4956 : pprint(child_rel);
4957 : #endif
4958 :
4959 15245 : live_children = lappend(live_children, child_rel);
4960 : }
4961 :
4962 : /* If all child-joins are dummy, parent join is also dummy. */
4963 5967 : if (!live_children)
4964 : {
4965 0 : mark_dummy_rel(rel);
4966 0 : return;
4967 : }
4968 :
4969 : /* Build additional paths for this rel from child-join paths. */
4970 5967 : add_paths_to_append_rel(root, rel, live_children);
4971 5967 : list_free(live_children);
4972 : }
|