1 /*-------------------------------------------------------------------------
2  *
3  * selfuncs.h
4  *	  Selectivity functions for standard operators, and assorted
5  *	  infrastructure for selectivity and cost estimation.
6  *
7  *
8  * Portions Copyright (c) 1996-2016, PostgreSQL Global Development Group
9  * Portions Copyright (c) 1994, Regents of the University of California
10  *
11  * src/include/utils/selfuncs.h
12  *
13  *-------------------------------------------------------------------------
14  */
15 #ifndef SELFUNCS_H
16 #define SELFUNCS_H
17 
18 #include "fmgr.h"
19 #include "access/htup.h"
20 #include "nodes/relation.h"
21 
22 
23 /*
24  * Note: the default selectivity estimates are not chosen entirely at random.
25  * We want them to be small enough to ensure that indexscans will be used if
26  * available, for typical table densities of ~100 tuples/page.  Thus, for
27  * example, 0.01 is not quite small enough, since that makes it appear that
28  * nearly all pages will be hit anyway.  Also, since we sometimes estimate
29  * eqsel as 1/num_distinct, we probably want DEFAULT_NUM_DISTINCT to equal
30  * 1/DEFAULT_EQ_SEL.
31  */
32 
33 /* default selectivity estimate for equalities such as "A = b" */
34 #define DEFAULT_EQ_SEL	0.005
35 
36 /* default selectivity estimate for inequalities such as "A < b" */
37 #define DEFAULT_INEQ_SEL  0.3333333333333333
38 
39 /* default selectivity estimate for range inequalities "A > b AND A < c" */
40 #define DEFAULT_RANGE_INEQ_SEL	0.005
41 
42 /* default selectivity estimate for pattern-match operators such as LIKE */
43 #define DEFAULT_MATCH_SEL	0.005
44 
45 /* default number of distinct values in a table */
46 #define DEFAULT_NUM_DISTINCT  200
47 
48 /* default selectivity estimate for boolean and null test nodes */
49 #define DEFAULT_UNK_SEL			0.005
50 #define DEFAULT_NOT_UNK_SEL		(1.0 - DEFAULT_UNK_SEL)
51 
52 
53 /*
54  * Clamp a computed probability estimate (which may suffer from roundoff or
55  * estimation errors) to valid range.  Argument must be a float variable.
56  */
57 #define CLAMP_PROBABILITY(p) \
58 	do { \
59 		if (p < 0.0) \
60 			p = 0.0; \
61 		else if (p > 1.0) \
62 			p = 1.0; \
63 	} while (0)
64 
65 
66 /* Return data from examine_variable and friends */
67 typedef struct VariableStatData
68 {
69 	Node	   *var;			/* the Var or expression tree */
70 	RelOptInfo *rel;			/* Relation, or NULL if not identifiable */
71 	HeapTuple	statsTuple;		/* pg_statistic tuple, or NULL if none */
72 	/* NB: if statsTuple!=NULL, it must be freed when caller is done */
73 	void		(*freefunc) (HeapTuple tuple);	/* how to free statsTuple */
74 	Oid			vartype;		/* exposed type of expression */
75 	Oid			atttype;		/* type to pass to get_attstatsslot */
76 	int32		atttypmod;		/* typmod to pass to get_attstatsslot */
77 	bool		isunique;		/* matches unique index or DISTINCT clause */
78 	bool		acl_ok;			/* result of ACL check on table or column */
79 } VariableStatData;
80 
81 #define ReleaseVariableStats(vardata)  \
82 	do { \
83 		if (HeapTupleIsValid((vardata).statsTuple)) \
84 			(* (vardata).freefunc) ((vardata).statsTuple); \
85 	} while(0)
86 
87 
88 typedef enum
89 {
90 	Pattern_Type_Like, Pattern_Type_Like_IC,
91 	Pattern_Type_Regex, Pattern_Type_Regex_IC
92 } Pattern_Type;
93 
94 typedef enum
95 {
96 	Pattern_Prefix_None, Pattern_Prefix_Partial, Pattern_Prefix_Exact
97 } Pattern_Prefix_Status;
98 
99 /*
100  * deconstruct_indexquals is a simple function to examine the indexquals
101  * attached to a proposed IndexPath.  It returns a list of IndexQualInfo
102  * structs, one per qual expression.
103  */
104 typedef struct
105 {
106 	RestrictInfo *rinfo;		/* the indexqual itself */
107 	int			indexcol;		/* zero-based index column number */
108 	bool		varonleft;		/* true if index column is on left of qual */
109 	Oid			clause_op;		/* qual's operator OID, if relevant */
110 	Node	   *other_operand;	/* non-index operand of qual's operator */
111 } IndexQualInfo;
112 
113 /*
114  * genericcostestimate is a general-purpose estimator that can be used for
115  * most index types.  In some cases we use genericcostestimate as the base
116  * code and then incorporate additional index-type-specific knowledge in
117  * the type-specific calling function.  To avoid code duplication, we make
118  * genericcostestimate return a number of intermediate values as well as
119  * its preliminary estimates of the output cost values.  The GenericCosts
120  * struct includes all these values.
121  *
122  * Callers should initialize all fields of GenericCosts to zero.  In addition,
123  * they can set numIndexTuples to some positive value if they have a better
124  * than default way of estimating the number of leaf index tuples visited.
125  */
126 typedef struct
127 {
128 	/* These are the values the cost estimator must return to the planner */
129 	Cost		indexStartupCost;		/* index-related startup cost */
130 	Cost		indexTotalCost; /* total index-related scan cost */
131 	Selectivity indexSelectivity;		/* selectivity of index */
132 	double		indexCorrelation;		/* order correlation of index */
133 
134 	/* Intermediate values we obtain along the way */
135 	double		numIndexPages;	/* number of leaf pages visited */
136 	double		numIndexTuples; /* number of leaf tuples visited */
137 	double		spc_random_page_cost;	/* relevant random_page_cost value */
138 	double		num_sa_scans;	/* # indexscans from ScalarArrayOps */
139 } GenericCosts;
140 
141 /* Hooks for plugins to get control when we ask for stats */
142 typedef bool (*get_relation_stats_hook_type) (PlannerInfo *root,
143 														  RangeTblEntry *rte,
144 														  AttrNumber attnum,
145 												  VariableStatData *vardata);
146 extern PGDLLIMPORT get_relation_stats_hook_type get_relation_stats_hook;
147 typedef bool (*get_index_stats_hook_type) (PlannerInfo *root,
148 													   Oid indexOid,
149 													   AttrNumber indexattnum,
150 												  VariableStatData *vardata);
151 extern PGDLLIMPORT get_index_stats_hook_type get_index_stats_hook;
152 
153 /* Functions in selfuncs.c */
154 
155 extern void examine_variable(PlannerInfo *root, Node *node, int varRelid,
156 				 VariableStatData *vardata);
157 extern bool statistic_proc_security_check(VariableStatData *vardata, Oid func_oid);
158 extern bool get_restriction_variable(PlannerInfo *root, List *args,
159 						 int varRelid,
160 						 VariableStatData *vardata, Node **other,
161 						 bool *varonleft);
162 extern void get_join_variables(PlannerInfo *root, List *args,
163 				   SpecialJoinInfo *sjinfo,
164 				   VariableStatData *vardata1,
165 				   VariableStatData *vardata2,
166 				   bool *join_is_reversed);
167 extern double get_variable_numdistinct(VariableStatData *vardata,
168 						 bool *isdefault);
169 extern double mcv_selectivity(VariableStatData *vardata, FmgrInfo *opproc,
170 				Datum constval, bool varonleft,
171 				double *sumcommonp);
172 extern double histogram_selectivity(VariableStatData *vardata, FmgrInfo *opproc,
173 					  Datum constval, bool varonleft,
174 					  int min_hist_size, int n_skip,
175 					  int *hist_size);
176 
177 extern Pattern_Prefix_Status pattern_fixed_prefix(Const *patt,
178 					 Pattern_Type ptype,
179 					 Oid collation,
180 					 Const **prefix,
181 					 Selectivity *rest_selec);
182 extern Const *make_greater_string(const Const *str_const, FmgrInfo *ltproc,
183 					Oid collation);
184 
185 extern Datum eqsel(PG_FUNCTION_ARGS);
186 extern Datum neqsel(PG_FUNCTION_ARGS);
187 extern Datum scalarltsel(PG_FUNCTION_ARGS);
188 extern Datum scalargtsel(PG_FUNCTION_ARGS);
189 extern Datum regexeqsel(PG_FUNCTION_ARGS);
190 extern Datum icregexeqsel(PG_FUNCTION_ARGS);
191 extern Datum likesel(PG_FUNCTION_ARGS);
192 extern Datum iclikesel(PG_FUNCTION_ARGS);
193 extern Datum regexnesel(PG_FUNCTION_ARGS);
194 extern Datum icregexnesel(PG_FUNCTION_ARGS);
195 extern Datum nlikesel(PG_FUNCTION_ARGS);
196 extern Datum icnlikesel(PG_FUNCTION_ARGS);
197 
198 extern Datum eqjoinsel(PG_FUNCTION_ARGS);
199 extern Datum neqjoinsel(PG_FUNCTION_ARGS);
200 extern Datum scalarltjoinsel(PG_FUNCTION_ARGS);
201 extern Datum scalargtjoinsel(PG_FUNCTION_ARGS);
202 extern Datum regexeqjoinsel(PG_FUNCTION_ARGS);
203 extern Datum icregexeqjoinsel(PG_FUNCTION_ARGS);
204 extern Datum likejoinsel(PG_FUNCTION_ARGS);
205 extern Datum iclikejoinsel(PG_FUNCTION_ARGS);
206 extern Datum regexnejoinsel(PG_FUNCTION_ARGS);
207 extern Datum icregexnejoinsel(PG_FUNCTION_ARGS);
208 extern Datum nlikejoinsel(PG_FUNCTION_ARGS);
209 extern Datum icnlikejoinsel(PG_FUNCTION_ARGS);
210 
211 extern Selectivity boolvarsel(PlannerInfo *root, Node *arg, int varRelid);
212 extern Selectivity booltestsel(PlannerInfo *root, BoolTestType booltesttype,
213 			Node *arg, int varRelid,
214 			JoinType jointype, SpecialJoinInfo *sjinfo);
215 extern Selectivity nulltestsel(PlannerInfo *root, NullTestType nulltesttype,
216 			Node *arg, int varRelid,
217 			JoinType jointype, SpecialJoinInfo *sjinfo);
218 extern Selectivity scalararraysel(PlannerInfo *root,
219 			   ScalarArrayOpExpr *clause,
220 			   bool is_join_clause,
221 			   int varRelid, JoinType jointype, SpecialJoinInfo *sjinfo);
222 extern int	estimate_array_length(Node *arrayexpr);
223 extern Selectivity rowcomparesel(PlannerInfo *root,
224 			  RowCompareExpr *clause,
225 			  int varRelid, JoinType jointype, SpecialJoinInfo *sjinfo);
226 
227 extern void mergejoinscansel(PlannerInfo *root, Node *clause,
228 				 Oid opfamily, int strategy, bool nulls_first,
229 				 Selectivity *leftstart, Selectivity *leftend,
230 				 Selectivity *rightstart, Selectivity *rightend);
231 
232 extern double estimate_num_groups(PlannerInfo *root, List *groupExprs,
233 					double input_rows, List **pgset);
234 
235 extern Selectivity estimate_hash_bucketsize(PlannerInfo *root, Node *hashkey,
236 						 double nbuckets);
237 
238 extern List *deconstruct_indexquals(IndexPath *path);
239 extern void genericcostestimate(PlannerInfo *root, IndexPath *path,
240 					double loop_count,
241 					List *qinfos,
242 					GenericCosts *costs);
243 
244 /* Functions in array_selfuncs.c */
245 
246 extern Selectivity scalararraysel_containment(PlannerInfo *root,
247 						   Node *leftop, Node *rightop,
248 						   Oid elemtype, bool isEquality, bool useOr,
249 						   int varRelid);
250 extern Datum arraycontsel(PG_FUNCTION_ARGS);
251 extern Datum arraycontjoinsel(PG_FUNCTION_ARGS);
252 
253 #endif   /* SELFUNCS_H */
254