
identified by Hiroshi (incorrect cost attributed to OR clauses after multiple passes through set_rest_selec()). I think the code was trying to allow selectivities of OR subclauses to be passed in from outside, but noplace was actually passing any useful data, and set_rest_selec() was passing wrong data. Restructure representation of "indexqual" in IndexPath nodes so that it is the same as for indxqual in completed IndexScan nodes: namely, a toplevel list with an entry for each pass of the index scan, having sublists that are implicitly-ANDed index qual conditions for that pass. You don't want to know what the old representation was :-( Improve documentation of OR-clause indexscan functions. Remove useless 'notclause' field from RestrictInfo nodes. (This might force an initdb for anyone who has stored rules containing RestrictInfos, but I do not think that RestrictInfo ever appears in completed plans.)
286 lines
7.2 KiB
C
286 lines
7.2 KiB
C
/*-------------------------------------------------------------------------
|
|
*
|
|
* clausesel.c
|
|
* Routines to compute and set clause selectivities
|
|
*
|
|
* Copyright (c) 1994, Regents of the University of California
|
|
*
|
|
*
|
|
* IDENTIFICATION
|
|
* $Header: /cvsroot/pgsql/src/backend/optimizer/path/clausesel.c,v 1.24 1999/07/24 23:21:09 tgl Exp $
|
|
*
|
|
*-------------------------------------------------------------------------
|
|
*/
|
|
#include "postgres.h"
|
|
|
|
#include "catalog/pg_operator.h"
|
|
#include "optimizer/clauses.h"
|
|
#include "optimizer/cost.h"
|
|
#include "optimizer/internal.h"
|
|
#include "optimizer/plancat.h"
|
|
#include "optimizer/restrictinfo.h"
|
|
#include "parser/parsetree.h"
|
|
#include "utils/lsyscache.h"
|
|
|
|
|
|
/****************************************************************************
|
|
* ROUTINES TO SET CLAUSE SELECTIVITIES
|
|
****************************************************************************/
|
|
|
|
/*
|
|
* set_clause_selectivities -
|
|
* Sets the selectivity field for each clause in 'restrictinfo-list'
|
|
* to 'new-selectivity'. If the selectivity has already been set,
|
|
* change it only if the new one is better.
|
|
*/
|
|
void
|
|
set_clause_selectivities(List *restrictinfo_list, Cost new_selectivity)
|
|
{
|
|
List *rlist;
|
|
|
|
foreach(rlist, restrictinfo_list)
|
|
{
|
|
RestrictInfo *clausenode = (RestrictInfo *) lfirst(rlist);
|
|
Cost cost_clause = clausenode->selectivity;
|
|
|
|
if (cost_clause <= 0 || new_selectivity < cost_clause)
|
|
clausenode->selectivity = new_selectivity;
|
|
}
|
|
}
|
|
|
|
/*
|
|
* product_selec -
|
|
* Multiplies the selectivities of each clause in 'restrictinfo-list'.
|
|
*
|
|
* Returns a flonum corresponding to the selectivity of 'restrictinfo-list'.
|
|
*/
|
|
Cost
|
|
product_selec(List *restrictinfo_list)
|
|
{
|
|
Cost result = (Cost) 1.0;
|
|
List *rlist;
|
|
|
|
foreach(rlist, restrictinfo_list)
|
|
{
|
|
result *= ((RestrictInfo *) lfirst(rlist))->selectivity;
|
|
}
|
|
return result;
|
|
}
|
|
|
|
/*
|
|
* set_rest_relselec -
|
|
* Scans through clauses on each relation and assigns a selectivity to
|
|
* those clauses that haven't been assigned a selectivity by an index.
|
|
*
|
|
* MODIFIES: selectivities of the various rel's restrictinfo slots.
|
|
*/
|
|
void
|
|
set_rest_relselec(Query *root, List *rel_list)
|
|
{
|
|
List *x;
|
|
|
|
foreach(x, rel_list)
|
|
{
|
|
RelOptInfo *rel = (RelOptInfo *) lfirst(x);
|
|
set_rest_selec(root, rel->restrictinfo);
|
|
}
|
|
}
|
|
|
|
/*
|
|
* set_rest_selec -
|
|
* Sets the selectivity fields for those clauses within a single
|
|
* relation's 'restrictinfo-list' that haven't already been set.
|
|
*/
|
|
void
|
|
set_rest_selec(Query *root, List *restrictinfo_list)
|
|
{
|
|
List *rlist;
|
|
|
|
foreach(rlist, restrictinfo_list)
|
|
{
|
|
RestrictInfo *clause = (RestrictInfo *) lfirst(rlist);
|
|
|
|
if (clause->selectivity <= 0)
|
|
{
|
|
clause->selectivity =
|
|
compute_clause_selec(root, (Node *) clause->clause);
|
|
}
|
|
}
|
|
}
|
|
|
|
/****************************************************************************
|
|
* ROUTINES TO COMPUTE SELECTIVITIES
|
|
****************************************************************************/
|
|
|
|
/*
|
|
* compute_clause_selec -
|
|
* Computes the selectivity of a clause.
|
|
*/
|
|
Cost
|
|
compute_clause_selec(Query *root, Node *clause)
|
|
{
|
|
Cost s1 = 1.0; /* default for any unhandled clause type */
|
|
|
|
if (clause == NULL)
|
|
return s1;
|
|
if (IsA(clause, Var))
|
|
{
|
|
/*
|
|
* we have a bool Var. This is exactly equivalent to the clause:
|
|
* reln.attribute = 't' so we compute the selectivity as if that
|
|
* is what we have. The magic #define constants are a hack. I
|
|
* didn't want to have to do system cache look ups to find out all
|
|
* of that info.
|
|
*
|
|
* XXX why are we using varno and varoattno? Seems like it should
|
|
* be varno/varattno or varnoold/varoattno, not mix & match...
|
|
*/
|
|
Oid relid = getrelid(((Var *) clause)->varno,
|
|
root->rtable);
|
|
|
|
s1 = restriction_selectivity(F_EQSEL,
|
|
BooleanEqualOperator,
|
|
relid,
|
|
((Var *) clause)->varoattno,
|
|
"t",
|
|
_SELEC_CONSTANT_RIGHT_);
|
|
}
|
|
else if (IsA(clause, Param))
|
|
{
|
|
/* XXX any way to do better? */
|
|
s1 = 1.0;
|
|
}
|
|
else if (IsA(clause, Const))
|
|
{
|
|
/* bool constant is pretty easy... */
|
|
s1 = ((bool) ((Const *) clause)->constvalue) ? 1.0 : 0.0;
|
|
}
|
|
else if (not_clause(clause))
|
|
{
|
|
/* inverse of the selectivity of the underlying clause */
|
|
s1 = 1.0 - compute_clause_selec(root,
|
|
(Node *) get_notclausearg((Expr *) clause));
|
|
}
|
|
else if (and_clause(clause))
|
|
{
|
|
/* Use the product of the selectivities of the subclauses.
|
|
* XXX this is probably too optimistic, since the subclauses
|
|
* are very likely not independent...
|
|
*/
|
|
List *arg;
|
|
s1 = 1.0;
|
|
foreach(arg, ((Expr *) clause)->args)
|
|
{
|
|
Cost s2 = compute_clause_selec(root, (Node *) lfirst(arg));
|
|
s1 = s1 * s2;
|
|
}
|
|
}
|
|
else if (or_clause(clause))
|
|
{
|
|
/* Selectivities for an 'or' clause are computed as s1+s2 - s1*s2
|
|
* to account for the probable overlap of selected tuple sets.
|
|
* XXX is this too conservative?
|
|
*/
|
|
List *arg;
|
|
s1 = 0.0;
|
|
foreach(arg, ((Expr *) clause)->args)
|
|
{
|
|
Cost s2 = compute_clause_selec(root, (Node *) lfirst(arg));
|
|
s1 = s1 + s2 - s1 * s2;
|
|
}
|
|
}
|
|
else if (is_funcclause(clause))
|
|
{
|
|
/*
|
|
* This is not an operator, so we guess at the selectivity. THIS
|
|
* IS A HACK TO GET V4 OUT THE DOOR. FUNCS SHOULD BE ABLE TO HAVE
|
|
* SELECTIVITIES THEMSELVES. -- JMH 7/9/92
|
|
*/
|
|
s1 = (Cost) 0.3333333;
|
|
}
|
|
else if (is_subplan(clause))
|
|
{
|
|
/*
|
|
* Just for the moment! FIX ME! - vadim 02/04/98
|
|
*/
|
|
s1 = 1.0;
|
|
}
|
|
else if (is_opclause(clause))
|
|
{
|
|
if (NumRelids(clause) == 1)
|
|
{
|
|
/* The clause is not a join clause, since there is only one
|
|
* relid in the clause. The clause selectivity will be based on
|
|
* the operator selectivity and operand values.
|
|
*/
|
|
Oid opno = ((Oper *) ((Expr *) clause)->oper)->opno;
|
|
RegProcedure oprrest = get_oprrest(opno);
|
|
Oid relid;
|
|
int relidx;
|
|
AttrNumber attno;
|
|
Datum constval;
|
|
int flag;
|
|
|
|
get_relattval(clause, &relidx, &attno, &constval, &flag);
|
|
relid = getrelid(relidx, root->rtable);
|
|
|
|
/*
|
|
* if the oprrest procedure is missing for whatever reason, use a
|
|
* selectivity of 0.5
|
|
*/
|
|
if (!oprrest)
|
|
s1 = (Cost) 0.5;
|
|
else if (attno == InvalidAttrNumber)
|
|
{
|
|
/*
|
|
* attno can be Invalid if the clause had a function in it,
|
|
* i.e. WHERE myFunc(f) = 10
|
|
*/
|
|
/* this should be FIXED somehow to use function selectivity */
|
|
s1 = (Cost) (0.5);
|
|
}
|
|
else
|
|
s1 = (Cost) restriction_selectivity(oprrest,
|
|
opno,
|
|
relid,
|
|
attno,
|
|
(char *) constval,
|
|
flag);
|
|
}
|
|
else
|
|
{
|
|
/*
|
|
* The clause must be a join clause. The clause selectivity will
|
|
* be based on the relations to be scanned and the attributes they
|
|
* are to be joined on.
|
|
*/
|
|
Oid opno = ((Oper *) ((Expr *) clause)->oper)->opno;
|
|
RegProcedure oprjoin = get_oprjoin(opno);
|
|
int relid1,
|
|
relid2;
|
|
AttrNumber attno1,
|
|
attno2;
|
|
|
|
get_rels_atts(clause, &relid1, &attno1, &relid2, &attno2);
|
|
relid1 = getrelid(relid1, root->rtable);
|
|
relid2 = getrelid(relid2, root->rtable);
|
|
|
|
/*
|
|
* if the oprjoin procedure is missing for whatever reason, use a
|
|
* selectivity of 0.5
|
|
*/
|
|
if (!oprjoin)
|
|
s1 = (Cost) (0.5);
|
|
else
|
|
s1 = (Cost) join_selectivity(oprjoin,
|
|
opno,
|
|
relid1,
|
|
attno1,
|
|
relid2,
|
|
attno2);
|
|
}
|
|
}
|
|
|
|
return s1;
|
|
}
|