NotificationsYou must be signed in to change notification settings
Fork6
Star31

Commitc23bc6f

committed

First cut at making indexscan cost estimates depend on correlation

between index order and table order.

1 parente020335 commitc23bc6fCopy full SHA for c23bc6f

File tree

8 files changed

+315

-86

lines changed

doc/src/sgml
- indexcost.sgml
src
- backend
  - optimizer
    - path
      - costsize.c
    - util
      - var.c
  - utils
    - adt
      - selfuncs.c
    - cache
      - lsyscache.c
- include
  - catalog
    - pg_proc.h
  - optimizer
    - var.h
  - utils
    - lsyscache.h

8 files changed

+315

-86

lines changed

`‎doc/src/sgml/indexcost.sgml`

Lines changed: 31 additions & 5 deletions

Original file line number	Diff line number	Diff line change
`@@ -1,5 +1,5 @@`
`1`	`1`	`<!--`
`2`		`-$Header: /cvsroot/pgsql/doc/src/sgml/Attic/indexcost.sgml,v 2.6 2000/12/22 21:51:57 petere Exp $`
	`2`	`+$Header: /cvsroot/pgsql/doc/src/sgml/Attic/indexcost.sgml,v 2.7 2001/05/09 23:13:34 tgl Exp $`
`3`	`3`	`-->`
`4`	`4`
`5`	`5`	`<chapter id="indexcost">`
`@@ -57,7 +57,8 @@ amcostestimate (Query *root,`
`57`	`57`	`List *indexQuals,`
`58`	`58`	`Cost *indexStartupCost,`
`59`	`59`	`Cost *indexTotalCost,`
`60`		`- Selectivity *indexSelectivity);`
	`60`	`+ Selectivity *indexSelectivity,`
	`61`	`+ double *indexCorrelation);`
`61`	`62`	`</programlisting>`
`62`	`63`
`63`	`64`	`The first four parameters are inputs:`
`@@ -103,7 +104,7 @@ amcostestimate (Query *root,`
`103`	`104`	`</para>`
`104`	`105`
`105`	`106`	`<para>`
`106`		`- The lastthree parameters are pass-by-reference outputs:`
	`107`	`+ The lastfour parameters are pass-by-reference outputs:`
`107`	`108`
`108`	`109`	`<variablelist>`
`109`	`110`	`<varlistentry>`
`@@ -132,6 +133,16 @@ amcostestimate (Query *root,`
`132`	`133`	`</para>`
`133`	`134`	`</listitem>`
`134`	`135`	`</varlistentry>`
	`136`	`+`
	`137`	`+ <varlistentry>`
	`138`	`+ <term>*indexCorrelation</term>`
	`139`	`+ <listitem>`
	`140`	`+ <para>`
	`141`	`+ Set to correlation coefficient between index scan order and`
	`142`	`+ underlying table's order`
	`143`	`+ </para>`
	`144`	`+ </listitem>`
	`145`	`+ </varlistentry>`
`135`	`146`	`</variablelist>`
`136`	`147`	`</para>`
`137`	`148`
`@@ -172,6 +183,13 @@ amcostestimate (Query *root,`
`172`	`183`	`tuples that actually pass the given qual conditions.`
`173`	`184`	`</para>`
`174`	`185`
	`186`	`+ <para>`
	`187`	`+ The indexCorrelation should be set to the correlation (ranging between`
	`188`	`+ -1.0 and 1.0) between the index order and the table order. This is used`
	`189`	`+ to adjust the estimate for the cost of fetching tuples from the main`
	`190`	`+ table.`
	`191`	`+ </para>`
	`192`	`+`
`175`	`193`	`<procedure>`
`176`	`194`	`<title>Cost Estimation</title>`
`177`	`195`	`<para>`
`@@ -224,6 +242,14 @@ amcostestimate (Query *root,`
`224`	`242`	`</programlisting>`
`225`	`243`	`</para>`
`226`	`244`	`</step>`
	`245`	`+`
	`246`	`+ <step>`
	`247`	`+ <para>`
	`248`	`+ Estimate the index correlation. For a simple ordered index on a single`
	`249`	`+ field, this can be retrieved from pg_statistic. If the correlation`
	`250`	`+ is not known, the conservative estimate is zero (no correlation).`
	`251`	`+ </para>`
	`252`	`+ </step>`
`227`	`253`	`</procedure>`
`228`	`254`
`229`	`255`	`<para>`
`@@ -237,8 +263,8 @@ amcostestimate (Query *root,`
`237`	`263`
`238`	`264`	`<programlisting>`
`239`	`265`	`prorettype = 0`
`240`		`-pronargs =7`
`241`		`-proargtypes = 0 0 0 0 0 0 0`
	`266`	`+pronargs =8`
	`267`	`+proargtypes = 0 0 0 0 0 0 0 0`
`242`	`268`	`</programlisting>`
`243`	`269`
`244`	`270`	`We use zero ("opaque") for all the arguments since none of them have types`

`‎src/backend/optimizer/path/costsize.c`

Lines changed: 88 additions & 33 deletions

Original file line number	Diff line number	Diff line change
`@@ -31,17 +31,18 @@`
`31`	`31`	`* result by interpolating between startup_cost and total_cost. In detail:`
`32`	`32`	`*actual_cost = startup_cost +`
`33`	`33`	`(total_cost - startup_cost) tuples_to_fetch / path->parent->rows;`
`34`		`- * Note that a relation's rows count (and, by extension, a Plan's plan_rows)`
`35`		`- * are set without regard to any LIMIT, so that this equation works properly.`
`36`		`- * (Also, these routines guarantee not to set the rows count to zero, so there`
`37`		`- * will be no zero divide.) The LIMIT is applied as a separate Plan node.`
	`34`	`+ * Note that a base relation's rows count (and, by extension, plan_rows for`
	`35`	`+ * plan nodes below the LIMIT node) are set without regard to any LIMIT, so`
	`36`	`+ * that this equation works properly. (Also, these routines guarantee not to`
	`37`	`+ * set the rows count to zero, so there will be no zero divide.) The LIMIT is`
	`38`	`+ * applied as a top-level plan node.`
`38`	`39`	`*`
`39`	`40`	`*`
`40`	`41`	`* Portions Copyright (c) 1996-2001, PostgreSQL Global Development Group`
`41`	`42`	`* Portions Copyright (c) 1994, Regents of the University of California`
`42`	`43`	`*`
`43`	`44`	`* IDENTIFICATION`
`44`		`- * $Header: /cvsroot/pgsql/src/backend/optimizer/path/costsize.c,v 1.72 2001/05/0900:35:09 tgl Exp $`
	`45`	`+ * $Header: /cvsroot/pgsql/src/backend/optimizer/path/costsize.c,v 1.73 2001/05/0923:13:34 tgl Exp $`
`45`	`46`	`*`
`46`	`47`	`*-------------------------------------------------------------------------`
`47`	`48`	`*/`
`@@ -205,12 +206,18 @@ cost_index(Path path, Query root,`
`205`	`206`	`{`
`206`	`207`	`Coststartup_cost=0;`
`207`	`208`	`Costrun_cost=0;`
`208`		`-Costcpu_per_tuple;`
`209`	`209`	`CostindexStartupCost;`
`210`	`210`	`CostindexTotalCost;`
`211`	`211`	`SelectivityindexSelectivity;`
	`212`	`+doubleindexCorrelation,`
	`213`	`+csquared;`
	`214`	`+Costmin_IO_cost,`
	`215`	`+max_IO_cost;`
	`216`	`+Costcpu_per_tuple;`
`212`	`217`	`doubletuples_fetched;`
`213`	`218`	`doublepages_fetched;`
	`219`	`+doubleT,`
	`220`	`+b;`
`214`	`221`
`215`	`222`	`/* Should only be applied to base relations */`
`216`	`223`	`Assert(IsA(baserel,RelOptInfo)&&IsA(index,IndexOptInfo));`
`@@ -224,63 +231,109 @@ cost_index(Path path, Query root,`
`224`	`231`	`* Call index-access-method-specific code to estimate the processing`
`225`	`232`	`* cost for scanning the index, as well as the selectivity of the`
`226`	`233`	`* index (ie, the fraction of main-table tuples we will have to`
`227`		`- * retrieve).`
	`234`	`+ * retrieve) and its correlation to the main-table tuple order.`
`228`	`235`	`*/`
`229`		`-OidFunctionCall7(index->amcostestimate,`
	`236`	`+OidFunctionCall8(index->amcostestimate,`
`230`	`237`	`PointerGetDatum(root),`
`231`	`238`	`PointerGetDatum(baserel),`
`232`	`239`	`PointerGetDatum(index),`
`233`	`240`	`PointerGetDatum(indexQuals),`
`234`	`241`	`PointerGetDatum(&indexStartupCost),`
`235`	`242`	`PointerGetDatum(&indexTotalCost),`
`236`		`-PointerGetDatum(&indexSelectivity));`
	`243`	`+PointerGetDatum(&indexSelectivity),`
	`244`	`+PointerGetDatum(&indexCorrelation));`
`237`	`245`
`238`	`246`	`/* all costs for touching index itself included here */`
`239`	`247`	`startup_cost+=indexStartupCost;`
`240`	`248`	`run_cost+=indexTotalCost-indexStartupCost;`
`241`	`249`
`242`		`-/*`
	`250`	`+/*----------`
`243`	`251`	`* Estimate number of main-table tuples and pages fetched.`
`244`	`252`	`*`
`245`		`- * If the number of tuples is much smaller than the number of pages in`
`246`		`- * the relation, each tuple will cost a separate nonsequential fetch.`
`247`		`- * If it is comparable or larger, then probably we will be able to`
`248`		`- * avoid some fetches.We use a growth rate of log(#tuples/#pages +`
`249`		`- * 1) --- probably totally bogus, but intuitively it gives the right`
`250`		`- * shape of curve at least.`
	`253`	`+ * When the index ordering is uncorrelated with the table ordering,`
	`254`	`+ * we use an approximation proposed by Mackert and Lohman, "Index Scans`
	`255`	`+ * Using a Finite LRU Buffer: A Validated I/O Model", ACM Transactions`
	`256`	`+ * on Database Systems, Vol. 14, No. 3, September 1989, Pages 401-424.`
	`257`	`+ * The Mackert and Lohman approximation is that the number of pages`
	`258`	`+ * fetched is`
	`259`	`+ *PF =`
	`260`	`+ *min(2TNs/(2T+Ns), T)when T <= b`
	`261`	`+ *2TNs/(2T+Ns)when T > b and Ns <= 2Tb/(2T-b)`
	`262`	`+ b + (Ns - 2Tb/(2T-b))(T-b)/Twhen T > b and Ns > 2Tb/(2T-b)`
	`263`	`+ * where`
	`264`	`+ *T = # pages in table`
	`265`	`+ *N = # tuples in table`
	`266`	`+ *s = selectivity = fraction of table to be scanned`
	`267`	`+ *b = # buffer pages available (we include kernel space here)`
`251`	`268`	`*`
`252`		`- * XXX if the relation has recently been "clustered" using this index,`
`253`		`- * then in fact the target tuples will be highly nonuniformly`
`254`		`- * distributed, and we will be seriously overestimating the scan cost!`
`255`		`- * Currently we have no way to know whether the relation has been`
`256`		`- * clustered, nor how much it's been modified since the last`
`257`		`- * clustering, so we ignore this effect. Would be nice to do better`
`258`		`- * someday.`
	`269`	`+ * When the index ordering is exactly correlated with the table ordering`
	`270`	`+ * (just after a CLUSTER, for example), the number of pages fetched should`
	`271`	`+ * be just sT. What's more, these will be sequential fetches, not the`
	`272`	`+ * random fetches that occur in the uncorrelated case. So, depending on`
	`273`	`+ * the extent of correlation, we should estimate the actual I/O cost`
	`274`	`+ * somewhere between s * T * 1.0 and PF * random_cost. We currently`
	`275`	`+ * interpolate linearly between these two endpoints based on the`
	`276`	`+ * correlation squared (XXX is that appropriate?).`
	`277`	`+ *`
	`278`	`+ * In any case the number of tuples fetched is Ns.`
	`279`	`+ *----------`
`259`	`280`	`*/`
`260`	`281`
`261`	`282`	`tuples_fetched=indexSelectivity*baserel->tuples;`
`262`	`283`	`/* Don't believe estimates less than 1... */`
`263`	`284`	`if (tuples_fetched<1.0)`
`264`	`285`	`tuples_fetched=1.0;`
`265`	`286`
`266`		`-if (baserel->pages>0)`
`267`		`-pages_fetched=ceil(baserel->pages*`
`268`		`-log(tuples_fetched /baserel->pages+1.0));`
	`287`	`+/* This part is the Mackert and Lohman formula */`
	`288`	`+`
	`289`	`+T= (baserel->pages>1) ? (double)baserel->pages :1.0;`
	`290`	`+b= (effective_cache_size>1) ?effective_cache_size :1.0;`
	`291`	`+`
	`292`	`+if (T <=b)`
	`293`	`+{`
	`294`	`+pages_fetched=`
	`295`	`+(2.0Ttuples_fetched) / (2.0*T+tuples_fetched);`
	`296`	`+if (pages_fetched>T)`
	`297`	`+pages_fetched=T;`
	`298`	`+}`
`269`	`299`	`else`
`270`		`-pages_fetched=tuples_fetched;`
	`300`	`+{`
	`301`	`+doublelim;`
	`302`	`+`
	`303`	`+lim= (2.0Tb) / (2.0*T-b);`
	`304`	`+if (tuples_fetched <=lim)`
	`305`	`+{`
	`306`	`+pages_fetched=`
	`307`	`+(2.0Ttuples_fetched) / (2.0*T+tuples_fetched);`
	`308`	`+}`
	`309`	`+else`
	`310`	`+{`
	`311`	`+pages_fetched=`
	`312`	`+b+ (tuples_fetched-lim)* (T-b) /T;`
	`313`	`+}`
	`314`	`+}`
`271`	`315`
`272`	`316`	`/*`
`273`		`- * Now estimate one nonsequential access per page fetched, plus`
`274`		`- * appropriate CPU costs per tuple.`
	`317`	`+ * min_IO_cost corresponds to the perfectly correlated case (csquared=1),`
	`318`	`+ * max_IO_cost to the perfectly uncorrelated case (csquared=0). Note`
	`319`	`+ * that we just charge random_page_cost per page in the uncorrelated`
	`320`	`+ * case, rather than using cost_nonsequential_access, since we've already`
	`321`	`+ * accounted for caching effects by using the Mackert model.`
`275`	`322`	`*/`
	`323`	`+min_IO_cost=ceil(indexSelectivity*T);`
	`324`	`+max_IO_cost=pages_fetched*random_page_cost;`
`276`	`325`
`277`		`-/* disk costs for main table */`
`278`		`-run_cost+=pages_fetched*cost_nonsequential_access(baserel->pages);`
	`326`	`+/*`
	`327`	`+ * Now interpolate based on estimated index order correlation`
	`328`	`+ * to get total disk I/O cost for main table accesses.`
	`329`	`+ */`
	`330`	`+csquared=indexCorrelation*indexCorrelation;`
`279`	`331`
`280`		`-/* CPU costs */`
`281`		`-cpu_per_tuple=cpu_tuple_cost+baserel->baserestrictcost;`
	`332`	`+run_cost+=max_IO_cost+csquared* (min_IO_cost-max_IO_cost);`
`282`	`333`
`283`	`334`	`/*`
	`335`	`+ * Estimate CPU costs per tuple.`
	`336`	`+ *`
`284`	`337`	`* Normally the indexquals will be removed from the list of`
`285`	`338`	`* restriction clauses that we have to evaluate as qpquals, so we`
`286`	`339`	`* should subtract their costs from baserestrictcost. For a lossy`
`@@ -290,6 +343,8 @@ cost_index(Path path, Query root,`
`290`	`343`	`* Rather than work out exactly how much to subtract, we don't`
`291`	`344`	`* subtract anything in that case either.`
`292`	`345`	`*/`
	`346`	`+cpu_per_tuple=cpu_tuple_cost+baserel->baserestrictcost;`
	`347`	`+`
`293`	`348`	`if (!index->lossy&& !is_injoin)`
`294`	`349`	`cpu_per_tuple-=cost_qual_eval(indexQuals);`
`295`	`350`

0 commit comments

Comments

(0)

Movatterモバイル変換

Navigation Menu

Search code, repositories, users, issues, pull requests...

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Uh oh!

Commitc23bc6f

File tree

8 files changed

8 files changed

`‎doc/src/sgml/indexcost.sgml`

`‎src/backend/optimizer/path/costsize.c`

0 commit comments