postgresql/src/backend/optimizer/path/allpaths.c

375 lines
8.4 KiB
C
Raw Normal View History

/*-------------------------------------------------------------------------
*
* allpaths.c
* Routines to find possible search paths for processing a query
*
* Copyright (c) 1994, Regents of the University of California
*
*
* IDENTIFICATION
1999-05-25 18:15:34 +02:00
* $Header: /cvsroot/pgsql/src/backend/optimizer/path/allpaths.c,v 1.45 1999/05/25 16:09:22 momjian Exp $
*
*-------------------------------------------------------------------------
*/
#include <string.h>
1996-11-06 10:29:26 +01:00
#include <stdio.h>
#include "postgres.h"
#include "nodes/pg_list.h"
#include "nodes/relation.h"
#include "nodes/primnodes.h"
#include "optimizer/internal.h"
#include "optimizer/paths.h"
#include "optimizer/pathnode.h"
#include "optimizer/clauses.h"
#include "optimizer/xfunc.h"
#include "optimizer/cost.h"
#include "commands/creatinh.h"
#include "optimizer/geqo_gene.h"
#include "optimizer/geqo.h"
#ifdef GEQO
bool _use_geqo_ = true;
#else
bool _use_geqo_ = false;
#endif
int32 _use_geqo_rels_ = GEQO_RELS;
1999-02-15 06:21:12 +01:00
static void set_base_rel_pathlist(Query *root, List *rels);
static RelOptInfo *make_one_rel_by_joins(Query *root, List *rels,
1999-05-25 18:15:34 +02:00
int levels_needed);
#ifdef OPTIMIZER_DEBUG
1999-05-25 18:15:34 +02:00
static void debug_print_rel(Query *root, RelOptInfo * rel);
#endif
/*
* make_one_rel
* Finds all possible access paths for executing a query, returning a
* single rel.
*
* 'rels' is the list of single relation entries appearing in the query
*/
RelOptInfo *
make_one_rel(Query *root, List *rels)
{
int levels_needed;
/*
* Set the number of join (not nesting) levels yet to be processed.
*/
levels_needed = length(rels);
if (levels_needed <= 0)
return NULL;
1999-02-15 06:21:12 +01:00
set_base_rel_pathlist(root, rels);
if (levels_needed <= 1)
{
1999-05-25 18:15:34 +02:00
/*
* Unsorted single relation, no more processing is required.
*/
return lfirst(rels);
}
else
{
1999-05-25 18:15:34 +02:00
/*
1999-02-15 06:21:12 +01:00
* This means that joins or sorts are required. set selectivities
* of clauses that have not been set by an index.
*/
set_rest_relselec(root, rels);
return make_one_rel_by_joins(root, rels, levels_needed);
}
}
/*
1999-02-15 06:21:12 +01:00
* set_base_rel_pathlist
* Finds all paths available for scanning each relation entry in
* 'rels'. Sequential scan and any available indices are considered
* if possible(indices are not considered for lower nesting levels).
* All unique paths are attached to the relation's 'pathlist' field.
*
* MODIFIES: rels
*/
static void
1999-02-15 06:21:12 +01:00
set_base_rel_pathlist(Query *root, List *rels)
{
List *temp;
foreach(temp, rels)
{
List *sequential_scan_list;
List *rel_index_scan_list;
List *or_index_scan_list;
1998-08-04 02:42:14 +02:00
RelOptInfo *rel = (RelOptInfo *) lfirst(temp);
sequential_scan_list = lcons(create_seqscan_path(rel), NIL);
1999-02-15 06:28:10 +01:00
rel_index_scan_list = create_index_paths(root,
1999-05-25 18:15:34 +02:00
rel,
find_relation_indices(root, rel),
rel->restrictinfo,
rel->joininfo);
or_index_scan_list = create_or_index_paths(root, rel, rel->restrictinfo);
rel->pathlist = add_pathlist(rel,
sequential_scan_list,
1999-02-22 06:26:58 +01:00
nconc(rel_index_scan_list,
1999-05-25 18:15:34 +02:00
or_index_scan_list));
1999-02-12 06:57:08 +01:00
set_cheapest(rel, rel->pathlist);
/*
* if there is a qualification of sequential scan the selec. value
* is not set -- so set it explicitly -- Sunita
*/
set_rest_selec(root, rel->restrictinfo);
rel->size = compute_rel_size(rel);
rel->width = compute_rel_width(rel);
}
return;
}
/*
* make_one_rel_by_joins
* Find all possible joinpaths for a query by successively finding ways
* to join single relations into join relations.
*
* Find all possible joinpaths(bushy trees) for a query by systematically
* finding ways to join relations(both original and derived) together.
*
1999-02-15 06:21:12 +01:00
* 'rels' is the current list of relations for which join paths
1999-02-14 05:57:02 +01:00
* are to be found, i.e., the current list of relations that
* have already been derived.
* 'levels_needed' is the number of iterations needed
*
* Returns the final level of join relations, i.e., the relation that is
* the result of joining all the original relations together.
*/
static RelOptInfo *
1999-02-15 06:21:12 +01:00
make_one_rel_by_joins(Query *root, List *rels, int levels_needed)
{
List *x;
1999-02-14 06:27:12 +01:00
List *joined_rels = NIL;
1998-08-07 07:02:32 +02:00
RelOptInfo *rel;
/*******************************************
* genetic query optimizer entry point *
* <utesch@aut.tu-freiberg.de> *
*******************************************/
1999-02-14 06:14:15 +01:00
if ((_use_geqo_) && length(root->base_rel_list) >= _use_geqo_rels_)
return geqo(root);
1999-05-25 18:15:34 +02:00
/*******************************************
* rest will be deprecated in case of GEQO *
*******************************************/
while (--levels_needed)
{
1999-05-25 18:15:34 +02:00
/*
* Determine all possible pairs of relations to be joined at this
1999-02-15 06:21:12 +01:00
* level. Determine paths for joining these relation pairs and
1999-02-14 06:27:12 +01:00
* modify 'joined_rels' accordingly, then eliminate redundant join
* relations.
*/
1999-02-15 06:21:12 +01:00
joined_rels = make_rels_by_joins(root, rels);
1999-02-14 06:27:12 +01:00
update_rels_pathlist_for_joins(root, joined_rels);
1999-02-14 06:27:12 +01:00
merge_rels_with_same_relids(joined_rels);
1999-02-18 01:49:48 +01:00
root->join_rel_list = rels = joined_rels;
#ifdef NOT_USED
1999-05-25 18:15:34 +02:00
/*
* * for each expensive predicate in each path in each distinct
* rel, * consider doing pullup -- JMH
*/
if (XfuncMode != XFUNC_NOPULL && XfuncMode != XFUNC_OFF)
1999-02-14 06:27:12 +01:00
foreach(x, joined_rels)
1998-07-18 06:22:52 +02:00
xfunc_trypullup((RelOptInfo *) lfirst(x));
#endif
1999-02-14 06:27:12 +01:00
rels_set_cheapest(joined_rels);
1999-02-14 06:27:12 +01:00
foreach(x, joined_rels)
{
1998-07-18 06:22:52 +02:00
rel = (RelOptInfo *) lfirst(x);
1999-02-14 05:57:02 +01:00
if (rel->size <= 0)
rel->size = compute_rel_size(rel);
rel->width = compute_rel_width(rel);
#ifdef OPTIMIZER_DEBUG
1998-08-07 07:02:32 +02:00
printf("levels left: %d\n", levels_needed);
debug_print_rel(root, rel);
#endif
}
}
1999-02-18 06:26:34 +01:00
return get_cheapest_complete_rel(rels);
}
/*****************************************************************************
*
*****************************************************************************/
#ifdef OPTIMIZER_DEBUG
static void
print_joinclauses(Query *root, List *clauses)
{
List *l;
extern void print_expr(Node *expr, List *rtable); /* in print.c */
foreach(l, clauses)
{
RestrictInfo *c = lfirst(l);
print_expr((Node *) c->clause, root->rtable);
if (lnext(l))
printf(" ");
}
}
static void
print_path(Query *root, Path *path, int indent)
{
char *ptype = NULL;
1999-02-12 18:25:05 +01:00
JoinPath *jp;
bool join = false;
int i;
for (i = 0; i < indent; i++)
printf("\t");
switch (nodeTag(path))
{
case T_Path:
ptype = "SeqScan";
join = false;
break;
case T_IndexPath:
ptype = "IdxScan";
join = false;
break;
1999-02-12 07:43:53 +01:00
case T_NestPath:
ptype = "Nestloop";
join = true;
break;
case T_MergePath:
ptype = "MergeJoin";
join = true;
break;
case T_HashPath:
ptype = "HashJoin";
join = true;
break;
default:
break;
}
if (join)
{
int size = path->parent->size;
1999-02-12 18:25:05 +01:00
jp = (JoinPath *) path;
printf("%s size=%d cost=%f\n", ptype, size, path->path_cost);
switch (nodeTag(path))
{
case T_MergePath:
case T_HashPath:
for (i = 0; i < indent + 1; i++)
printf("\t");
printf(" clauses=(");
1999-02-12 18:25:05 +01:00
print_joinclauses(root, ((JoinPath *) path)->pathinfo);
printf(")\n");
if (nodeTag(path) == T_MergePath)
{
MergePath *mp = (MergePath *) path;
if (mp->outersortkeys || mp->innersortkeys)
{
for (i = 0; i < indent + 1; i++)
printf("\t");
printf(" sortouter=%d sortinner=%d\n",
((mp->outersortkeys) ? 1 : 0),
((mp->innersortkeys) ? 1 : 0));
}
}
break;
default:
break;
}
print_path(root, jp->outerjoinpath, indent + 1);
print_path(root, jp->innerjoinpath, indent + 1);
}
else
{
int size = path->parent->size;
int relid = lfirsti(path->parent->relids);
printf("%s(%d) size=%d cost=%f",
ptype, relid, size, path->path_cost);
if (nodeTag(path) == T_IndexPath)
{
List *k,
*l;
printf(" pathkeys=");
foreach(k, path->pathkeys)
{
printf("(");
foreach(l, lfirst(k))
{
Var *var = lfirst(l);
printf("%d.%d", var->varnoold, var->varoattno);
if (lnext(l))
printf(", ");
}
printf(")");
if (lnext(k))
printf(", ");
}
}
printf("\n");
}
}
static void
1999-05-25 18:15:34 +02:00
debug_print_rel(Query *root, RelOptInfo * rel)
{
List *l;
printf("(");
foreach(l, rel->relids)
printf("%d ", lfirsti(l));
printf("): size=%d width=%d\n", rel->size, rel->width);
printf("\tpath list:\n");
foreach(l, rel->pathlist)
print_path(root, lfirst(l), 1);
printf("\tcheapest path:\n");
print_path(root, rel->cheapestpath, 1);
}
#endif /* OPTIMIZER_DEBUG */