/*------------------------------------------------------------------------- * * allpaths.c * Routines to find possible search paths for processing a query * * Copyright (c) 1994, Regents of the University of California * * * IDENTIFICATION * $Header: /cvsroot/pgsql/src/backend/optimizer/path/allpaths.c,v 1.45 1999/05/25 16:09:22 momjian Exp $ * *------------------------------------------------------------------------- */ #include #include #include "postgres.h" #include "nodes/pg_list.h" #include "nodes/relation.h" #include "nodes/primnodes.h" #include "optimizer/internal.h" #include "optimizer/paths.h" #include "optimizer/pathnode.h" #include "optimizer/clauses.h" #include "optimizer/xfunc.h" #include "optimizer/cost.h" #include "commands/creatinh.h" #include "optimizer/geqo_gene.h" #include "optimizer/geqo.h" #ifdef GEQO bool _use_geqo_ = true; #else bool _use_geqo_ = false; #endif int32 _use_geqo_rels_ = GEQO_RELS; static void set_base_rel_pathlist(Query *root, List *rels); static RelOptInfo *make_one_rel_by_joins(Query *root, List *rels, int levels_needed); #ifdef OPTIMIZER_DEBUG static void debug_print_rel(Query *root, RelOptInfo * rel); #endif /* * make_one_rel * Finds all possible access paths for executing a query, returning a * single rel. * * 'rels' is the list of single relation entries appearing in the query */ RelOptInfo * make_one_rel(Query *root, List *rels) { int levels_needed; /* * Set the number of join (not nesting) levels yet to be processed. */ levels_needed = length(rels); if (levels_needed <= 0) return NULL; set_base_rel_pathlist(root, rels); if (levels_needed <= 1) { /* * Unsorted single relation, no more processing is required. */ return lfirst(rels); } else { /* * This means that joins or sorts are required. set selectivities * of clauses that have not been set by an index. */ set_rest_relselec(root, rels); return make_one_rel_by_joins(root, rels, levels_needed); } } /* * set_base_rel_pathlist * Finds all paths available for scanning each relation entry in * 'rels'. Sequential scan and any available indices are considered * if possible(indices are not considered for lower nesting levels). * All unique paths are attached to the relation's 'pathlist' field. * * MODIFIES: rels */ static void set_base_rel_pathlist(Query *root, List *rels) { List *temp; foreach(temp, rels) { List *sequential_scan_list; List *rel_index_scan_list; List *or_index_scan_list; RelOptInfo *rel = (RelOptInfo *) lfirst(temp); sequential_scan_list = lcons(create_seqscan_path(rel), NIL); rel_index_scan_list = create_index_paths(root, rel, find_relation_indices(root, rel), rel->restrictinfo, rel->joininfo); or_index_scan_list = create_or_index_paths(root, rel, rel->restrictinfo); rel->pathlist = add_pathlist(rel, sequential_scan_list, nconc(rel_index_scan_list, or_index_scan_list)); set_cheapest(rel, rel->pathlist); /* * if there is a qualification of sequential scan the selec. value * is not set -- so set it explicitly -- Sunita */ set_rest_selec(root, rel->restrictinfo); rel->size = compute_rel_size(rel); rel->width = compute_rel_width(rel); } return; } /* * make_one_rel_by_joins * Find all possible joinpaths for a query by successively finding ways * to join single relations into join relations. * * Find all possible joinpaths(bushy trees) for a query by systematically * finding ways to join relations(both original and derived) together. * * 'rels' is the current list of relations for which join paths * are to be found, i.e., the current list of relations that * have already been derived. * 'levels_needed' is the number of iterations needed * * Returns the final level of join relations, i.e., the relation that is * the result of joining all the original relations together. */ static RelOptInfo * make_one_rel_by_joins(Query *root, List *rels, int levels_needed) { List *x; List *joined_rels = NIL; RelOptInfo *rel; /******************************************* * genetic query optimizer entry point * * * *******************************************/ if ((_use_geqo_) && length(root->base_rel_list) >= _use_geqo_rels_) return geqo(root); /******************************************* * rest will be deprecated in case of GEQO * *******************************************/ while (--levels_needed) { /* * Determine all possible pairs of relations to be joined at this * level. Determine paths for joining these relation pairs and * modify 'joined_rels' accordingly, then eliminate redundant join * relations. */ joined_rels = make_rels_by_joins(root, rels); update_rels_pathlist_for_joins(root, joined_rels); merge_rels_with_same_relids(joined_rels); root->join_rel_list = rels = joined_rels; #ifdef NOT_USED /* * * for each expensive predicate in each path in each distinct * rel, * consider doing pullup -- JMH */ if (XfuncMode != XFUNC_NOPULL && XfuncMode != XFUNC_OFF) foreach(x, joined_rels) xfunc_trypullup((RelOptInfo *) lfirst(x)); #endif rels_set_cheapest(joined_rels); foreach(x, joined_rels) { rel = (RelOptInfo *) lfirst(x); if (rel->size <= 0) rel->size = compute_rel_size(rel); rel->width = compute_rel_width(rel); #ifdef OPTIMIZER_DEBUG printf("levels left: %d\n", levels_needed); debug_print_rel(root, rel); #endif } } return get_cheapest_complete_rel(rels); } /***************************************************************************** * *****************************************************************************/ #ifdef OPTIMIZER_DEBUG static void print_joinclauses(Query *root, List *clauses) { List *l; extern void print_expr(Node *expr, List *rtable); /* in print.c */ foreach(l, clauses) { RestrictInfo *c = lfirst(l); print_expr((Node *) c->clause, root->rtable); if (lnext(l)) printf(" "); } } static void print_path(Query *root, Path *path, int indent) { char *ptype = NULL; JoinPath *jp; bool join = false; int i; for (i = 0; i < indent; i++) printf("\t"); switch (nodeTag(path)) { case T_Path: ptype = "SeqScan"; join = false; break; case T_IndexPath: ptype = "IdxScan"; join = false; break; case T_NestPath: ptype = "Nestloop"; join = true; break; case T_MergePath: ptype = "MergeJoin"; join = true; break; case T_HashPath: ptype = "HashJoin"; join = true; break; default: break; } if (join) { int size = path->parent->size; jp = (JoinPath *) path; printf("%s size=%d cost=%f\n", ptype, size, path->path_cost); switch (nodeTag(path)) { case T_MergePath: case T_HashPath: for (i = 0; i < indent + 1; i++) printf("\t"); printf(" clauses=("); print_joinclauses(root, ((JoinPath *) path)->pathinfo); printf(")\n"); if (nodeTag(path) == T_MergePath) { MergePath *mp = (MergePath *) path; if (mp->outersortkeys || mp->innersortkeys) { for (i = 0; i < indent + 1; i++) printf("\t"); printf(" sortouter=%d sortinner=%d\n", ((mp->outersortkeys) ? 1 : 0), ((mp->innersortkeys) ? 1 : 0)); } } break; default: break; } print_path(root, jp->outerjoinpath, indent + 1); print_path(root, jp->innerjoinpath, indent + 1); } else { int size = path->parent->size; int relid = lfirsti(path->parent->relids); printf("%s(%d) size=%d cost=%f", ptype, relid, size, path->path_cost); if (nodeTag(path) == T_IndexPath) { List *k, *l; printf(" pathkeys="); foreach(k, path->pathkeys) { printf("("); foreach(l, lfirst(k)) { Var *var = lfirst(l); printf("%d.%d", var->varnoold, var->varoattno); if (lnext(l)) printf(", "); } printf(")"); if (lnext(k)) printf(", "); } } printf("\n"); } } static void debug_print_rel(Query *root, RelOptInfo * rel) { List *l; printf("("); foreach(l, rel->relids) printf("%d ", lfirsti(l)); printf("): size=%d width=%d\n", rel->size, rel->width); printf("\tpath list:\n"); foreach(l, rel->pathlist) print_path(root, lfirst(l), 1); printf("\tcheapest path:\n"); print_path(root, rel->cheapestpath, 1); } #endif /* OPTIMIZER_DEBUG */