Movatterモバイル変換

Skip to content

postgrespro/postgres Public

forked from postgres/postgres

NotificationsYou must be signed in to change notification settings
Fork6
Star31

Commit 87bd07d

bmomjian

committed

Make EXPLAIN sampling smarter, to avoid excessive sampling delay.

Martijn van Oosterhout

1 parent 53d669e, commit 87bd07d. Copy full SHA for 87bd07d

File tree

8 files changed

+150

-55

lines changed

src
- backend
  - commands
    - trigger.c
  - executor
- include/executor
  - instrument.h

8 files changed

+150

-55

lines changed

`‎src/backend/commands/trigger.c‎`

Lines changed: 3 additions & 3 deletions

Original file line number	Diff line number	Diff line change
`@@ -7,7 +7,7 @@`
`7`	`7`	`* Portions Copyright (c) 1994, Regents of the University of California`
`8`	`8`	`*`
`9`	`9`	`* IDENTIFICATION`
`10`		`- * $PostgreSQL: pgsql/src/backend/commands/trigger.c,v 1.201 2006/04/27 00:33:41 momjian Exp $`
	`10`	`+ * $PostgreSQL: pgsql/src/backend/commands/trigger.c,v 1.202 2006/05/30 14:01:57 momjian Exp $`
`11`	`11`	`*`
`12`	`12`	`*-------------------------------------------------------------------------`
`13`	`13`	`*/`
`@@ -1306,7 +1306,7 @@ ExecCallTriggerFunc(TriggerData *trigdata,`
`1306`	`1306`	`* one "tuple returned" (really the number of firings).`
`1307`	`1307`	`*/`
`1308`	`1308`	`if (instr)`
`1309`		`-InstrStopNode(instr+tgindx,true);`
	`1309`	`+InstrStopNode(instr+tgindx,1);`
`1310`	`1310`
`1311`	`1311`	`return (HeapTuple)DatumGetPointer(result);`
`1312`	`1312`	`}`
`@@ -2154,7 +2154,7 @@ AfterTriggerExecute(AfterTriggerEvent event,`
`2154`	`2154`	`* one "tuple returned" (really the number of firings).`
`2155`	`2155`	`*/`
`2156`	`2156`	`if (instr)`
`2157`		`-InstrStopNode(instr+tgindx,true);`
	`2157`	`+InstrStopNode(instr+tgindx,1);`
`2158`	`2158`	`}`
`2159`	`2159`
`2160`	`2160`

`‎src/backend/executor/execProcnode.c‎`

Lines changed: 2 additions & 2 deletions

Original file line number	Diff line number	Diff line change
`@@ -12,7 +12,7 @@`
`12`	`12`	`*`
`13`	`13`	`*`
`14`	`14`	`* IDENTIFICATION`
`15`		`- * $PostgreSQL: pgsql/src/backend/executor/execProcnode.c,v 1.54 2006/03/05 15:58:26 momjian Exp $`
	`15`	`+ * $PostgreSQL: pgsql/src/backend/executor/execProcnode.c,v 1.55 2006/05/30 14:01:57 momjian Exp $`
`16`	`16`	`*`
`17`	`17`	`*-------------------------------------------------------------------------`
`18`	`18`	`*/`
`@@ -423,7 +423,7 @@ ExecProcNode(PlanState *node)`
`423`	`423`	`}`
`424`	`424`
`425`	`425`	`if (node->instrument)`
`426`		`-InstrStopNode(node->instrument,!TupIsNull(result));`
	`426`	`+InstrStopNode(node->instrument,TupIsNull(result) ?0 :1);`
`427`	`427`
`428`	`428`	`returnresult;`
`429`	`429`	`}`

`‎src/backend/executor/instrument.c‎`

Lines changed: 130 additions & 39 deletions

Original file line number	Diff line number	Diff line change
`@@ -7,16 +7,78 @@`
`7`	`7`	`* Copyright (c) 2001-2006, PostgreSQL Global Development Group`
`8`	`8`	`*`
`9`	`9`	`* IDENTIFICATION`
`10`		`- * $PostgreSQL: pgsql/src/backend/executor/instrument.c,v 1.14 2006/03/05 15:58:26 momjian Exp $`
	`10`	`+ * $PostgreSQL: pgsql/src/backend/executor/instrument.c,v 1.15 2006/05/30 14:01:58 momjian Exp $`
`11`	`11`	`*`
`12`	`12`	`*-------------------------------------------------------------------------`
`13`	`13`	`*/`
`14`	`14`	`#include"postgres.h"`
`15`	`15`
`16`	`16`	`#include<unistd.h>`
	`17`	`+#include<math.h>`
`17`	`18`
`18`	`19`	`#include"executor/instrument.h"`
`19`	`20`
	`21`	`+/* This is the function that is used to determine the sampling intervals. In`
	`22`	`+ * general, if the function is f(x), then for N tuples we will take on the`
	`23`	`+ * order of integral(1/f(x), x=0..N) samples. Some examples follow, with the`
	`24`	`+ * number of samples that would be collected over 1,000,000 tuples.`
	`25`	`+`
	`26`	`+ f(x) = x => log2(N) 20`
	`27`	`+ f(x) = x^(1/2) => 2 * N^(1/2) 2000`
	`28`	`+ f(x) = x^(1/3) => 1.5 * N^(2/3) 15000`
	`29`	`+`
	`30`	`+ * I've chosen the last one as it seems to provide a good compromise between`
	`31`	`+ * low overhead but still getting a meaningful number of samples. However,`
	`32`	`+ * not all machines have the cbrt() function so on those we substitute`
	`33`	`+ * sqrt(). The difference is not very significant in the tests I made.`
	`34`	`+*/`
	`35`	`+#ifdef HAVE_CBRT`
	`36`	`+#define SampleFunc cbrt`
	`37`	`+#else`
	`38`	`+#define SampleFunc sqrt`
	`39`	`+#endif`
	`40`	`+`
	`41`	`+#define SAMPLE_THRESHOLD 50`
	`42`	`+`
	`43`	`+staticdoubleSampleOverhead;`
	`44`	`+staticboolSampleOverheadCalculated;`
	`45`	`+`
	`46`	`+staticvoid`
	`47`	`+CalculateSampleOverhead()`
	`48`	`+{`
	`49`	`+Instrumentationinstr;`
	`50`	`+inti;`
	`51`	`+`
	`52`	`+/* We want to determine the sampling overhead, to correct`
	`53`	`+ * calculations later. This only needs to be done once per backend.`
	`54`	`+ * Is this the place? A wrong value here (due to a mistimed`
	`55`	`+ * task-switch) will cause bad calculations later.`
	`56`	`+ *`
	`57`	`+ * To minimize the risk we do it a few times and take the lowest.`
	`58`	`+ */`
	`59`	`+`
	`60`	`+SampleOverhead=1.0e6;`
	`61`	`+`
	`62`	`+for(i=0;i<5;i++ )`
	`63`	`+{`
	`64`	`+intj;`
	`65`	`+doubleoverhead;`
	`66`	`+`
	`67`	`+memset(&instr,0,sizeof(instr) );`
	`68`	`+`
	`69`	`+/* Loop SAMPLE_THRESHOLD times or 100 microseconds, whichever is faster */`
	`70`	`+for(j=0;j<SAMPLE_THRESHOLD&&INSTR_TIME_GET_DOUBLE(instr.counter)<100e-6;i++ )`
	`71`	`+{`
	`72`	`+InstrStartNode(&instr );`
	`73`	`+InstrStopNode(&instr,1 );`
	`74`	`+}`
	`75`	`+overhead=INSTR_TIME_GET_DOUBLE(instr.counter) /instr.samplecount;`
	`76`	`+if(overhead<SampleOverhead )`
	`77`	`+SampleOverhead=overhead;`
	`78`	`+}`
	`79`	`+`
	`80`	`+SampleOverheadCalculated= true;`
	`81`	`+}`
`20`	`82`
`21`	`83`	`/* Allocate new instrumentation structure(s) */`
`22`	`84`	`Instrumentation*`
`@@ -25,7 +87,10 @@ InstrAlloc(int n)`
`25`	`87`	`Instrumentation *instr = palloc0(n * sizeof(Instrumentation));`
`26`	`88`
`27`	`89`	`/* we don't need to do any initialization except zero 'em */`
`28`		`-`
	`90`	`+`
	`91`	`+/* Calculate overhead, if not done yet */`
	`92`	`+if( !SampleOverheadCalculated )`
	`93`	`+CalculateSampleOverhead();`
`29`	`94`	`returninstr;`
`30`	`95`	`}`
`31`	`96`
`@@ -34,49 +99,69 @@ void`
`34`	`99`	`InstrStartNode(Instrumentation*instr)`
`35`	`100`	`{`
`36`	`101`	`if (INSTR_TIME_IS_ZERO(instr->starttime))`
`37`		`-INSTR_TIME_SET_CURRENT(instr->starttime);`
	`102`	`+{`
	`103`	`+/* We always sample the first SAMPLE_THRESHOLD tuples, so small nodes are always accurate */`
	`104`	`+if (instr->tuplecount<SAMPLE_THRESHOLD)`
	`105`	`+instr->sampling= true;`
	`106`	`+else`
	`107`	`+{`
	`108`	`+/* Otherwise we go to sampling, see the comments on SampleFunc at the top of the file */`
	`109`	`+if(instr->tuplecount>instr->nextsample )`
	`110`	`+{`
	`111`	`+instr->sampling= true;`
	`112`	`+/* The doubling is so the random will average 1 over time */`
	`113`	`+instr->nextsample += 2.0 * SampleFunc(instr->tuplecount) * (double)rand() / (double)RAND_MAX;`
	`114`	`+}`
	`115`	`+}`
	`116`	`+if (instr->sampling)`
	`117`	`+INSTR_TIME_SET_CURRENT(instr->starttime);`
	`118`	`+}`
`38`	`119`	`else`
`39`	`120`	`elog(DEBUG2,"InstrStartNode called twice in a row");`
`40`	`121`	`}`
`41`	`122`
`42`	`123`	`/* Exit from a plan node */`
`43`	`124`	`void`
`44`		`-InstrStopNode(Instrumentation*instr,boolreturnedTuple)`
	`125`	`+InstrStopNode(Instrumentation*instr,doublenTuples)`
`45`	`126`	`{`
`46`	`127`	`instr_timeendtime;`
`47`	`128`
`48`	`129`	`/* count the returned tuples */`
`49`		`-if (returnedTuple)`
`50`		`-instr->tuplecount+=1;`
	`130`	`+instr->tuplecount+=nTuples;`
`51`	`131`
`52`		`-if (INSTR_TIME_IS_ZERO(instr->starttime))`
	`132`	`+if (instr->sampling)`
`53`	`133`	`{`
`54`		`-elog(DEBUG2,"InstrStopNode called without start");`
`55`		`-return;`
`56`		`-}`
	`134`	`+if (INSTR_TIME_IS_ZERO(instr->starttime))`
	`135`	`+{`
	`136`	`+elog(DEBUG2,"InstrStopNode called without start");`
	`137`	`+return;`
	`138`	`+}`
`57`	`139`
`58`		`-INSTR_TIME_SET_CURRENT(endtime);`
	`140`	`+INSTR_TIME_SET_CURRENT(endtime);`
`59`	`141`
`60`	`142`	`#ifndefWIN32`
`61`		`-instr->counter.tv_sec+=endtime.tv_sec-instr->starttime.tv_sec;`
`62`		`-instr->counter.tv_usec+=endtime.tv_usec-instr->starttime.tv_usec;`
`63`		`-`
`64`		`-/* Normalize after each add to avoid overflow/underflow of tv_usec */`
`65`		`-while (instr->counter.tv_usec<0)`
`66`		`-{`
`67`		`-instr->counter.tv_usec+=1000000;`
`68`		`-instr->counter.tv_sec--;`
`69`		`-}`
`70`		`-while (instr->counter.tv_usec >=1000000)`
`71`		`-{`
`72`		`-instr->counter.tv_usec-=1000000;`
`73`		`-instr->counter.tv_sec++;`
`74`		`-}`
	`143`	`+instr->counter.tv_sec+=endtime.tv_sec-instr->starttime.tv_sec;`
	`144`	`+instr->counter.tv_usec+=endtime.tv_usec-instr->starttime.tv_usec;`
	`145`	`+`
	`146`	`+/* Normalize after each add to avoid overflow/underflow of tv_usec */`
	`147`	`+while (instr->counter.tv_usec<0)`
	`148`	`+{`
	`149`	`+instr->counter.tv_usec+=1000000;`
	`150`	`+instr->counter.tv_sec--;`
	`151`	`+}`
	`152`	`+while (instr->counter.tv_usec >=1000000)`
	`153`	`+{`
	`154`	`+instr->counter.tv_usec-=1000000;`
	`155`	`+instr->counter.tv_sec++;`
	`156`	`+}`
`75`	`157`	`#else/* WIN32 */`
`76`		`-instr->counter.QuadPart+= (endtime.QuadPart-instr->starttime.QuadPart);`
	`158`	`+instr->counter.QuadPart+= (endtime.QuadPart-instr->starttime.QuadPart);`
`77`	`159`	`#endif`
`78`	`160`
`79`		`-INSTR_TIME_SET_ZERO(instr->starttime);`
	`161`	`+INSTR_TIME_SET_ZERO(instr->starttime);`
	`162`	`+instr->samplecount+=nTuples;`
	`163`	`+instr->sampling= false;`
	`164`	`+}`
`80`	`165`
`81`	`166`	`/* Is this the first tuple of this cycle? */`
`82`	`167`	`if (!instr->running)`
`@@ -86,17 +171,6 @@ InstrStopNode(Instrumentation *instr, bool returnedTuple)`
`86`	`171`	`}`
`87`	`172`	`}`
`88`	`173`
`89`		`-/* As above, but count multiple tuples returned at once */`
`90`		`-void`
`91`		`-InstrStopNodeMulti(Instrumentation*instr,doublenTuples)`
`92`		`-{`
`93`		`-/* count the returned tuples */`
`94`		`-instr->tuplecount+=nTuples;`
`95`		`-`
`96`		`-/* delegate the rest */`
`97`		`-InstrStopNode(instr, false);`
`98`		`-}`
`99`		`-`
`100`	`174`	`/* Finish a run cycle for a plan node */`
`101`	`175`	`void`
`102`	`176`	`InstrEndLoop(Instrumentation*instr)`
`@@ -114,14 +188,31 @@ InstrEndLoop(Instrumentation *instr)`
`114`	`188`	`totaltime=INSTR_TIME_GET_DOUBLE(instr->counter);`
`115`	`189`
`116`	`190`	`instr->startup+=instr->firsttuple;`
`117`		`-instr->total+=totaltime;`
	`191`	`+`
	`192`	`+/* Here we take into account sampling effects. Doing it naively ends`
	`193`	`+ * up assuming the sampling overhead applies to all tuples, even the`
	`194`	`+ * ones we didn't measure. We've calculated an overhead, so we`
	`195`	`+ * subtract that for all samples we didn't measure. The first tuple`
	`196`	`+ * is also special cased, because it usually takes longer. */`
	`197`	`+`
	`198`	`+if(instr->samplecount<instr->tuplecount )`
	`199`	`+{`
	`200`	`+doublepertuple= (totaltime-instr->firsttuple) / (instr->samplecount-1);`
	`201`	`+instr->total+=instr->firsttuple+ (pertuple* (instr->samplecount-1))`
	`202`	`++ ((pertuple-SampleOverhead)* (instr->tuplecount-instr->samplecount));`
	`203`	`+}`
	`204`	`+else`
	`205`	`+instr->total+=totaltime;`
	`206`	`+`
`118`	`207`	`instr->ntuples+=instr->tuplecount;`
	`208`	`+instr->nsamples+=instr->samplecount;`
`119`	`209`	`instr->nloops+=1;`
`120`	`210`
`121`	`211`	`/* Reset for next cycle (if any) */`
`122`	`212`	`instr->running= false;`
`123`	`213`	`INSTR_TIME_SET_ZERO(instr->starttime);`
`124`	`214`	`INSTR_TIME_SET_ZERO(instr->counter);`
`125`	`215`	`instr->firsttuple=0;`
	`216`	`+instr->samplecount=0;`
`126`	`217`	`instr->tuplecount=0;`
`127`	`218`	`}`

`‎src/backend/executor/nodeBitmapAnd.c‎`

Lines changed: 2 additions & 2 deletions

Original file line number	Diff line number	Diff line change
`@@ -8,7 +8,7 @@`
`8`	`8`	`*`
`9`	`9`	`*`
`10`	`10`	`* IDENTIFICATION`
`11`		`- * $PostgreSQL: pgsql/src/backend/executor/nodeBitmapAnd.c,v 1.7 2006/05/23 15:21:52 tgl Exp $`
	`11`	`+ * $PostgreSQL: pgsql/src/backend/executor/nodeBitmapAnd.c,v 1.8 2006/05/30 14:01:58 momjian Exp $`
`12`	`12`	`*`
`13`	`13`	`*-------------------------------------------------------------------------`
`14`	`14`	`*/`
`@@ -161,7 +161,7 @@ MultiExecBitmapAnd(BitmapAndState *node)`
`161`	`161`
`162`	`162`	`/* must provide our own instrumentation support */`
`163`	`163`	`if (node->ps.instrument)`
`164`		`-InstrStopNodeMulti(node->ps.instrument,0/* XXX */ );`
	`164`	`+InstrStopNode(node->ps.instrument,0/* XXX */ );`
`165`	`165`
`166`	`166`	`return (Node*)result;`
`167`	`167`	`}`

`‎src/backend/executor/nodeBitmapIndexscan.c‎`

Lines changed: 2 additions & 2 deletions

Original file line number	Diff line number	Diff line change
`@@ -8,7 +8,7 @@`
`8`	`8`	`*`
`9`	`9`	`*`
`10`	`10`	`* IDENTIFICATION`
`11`		`- * $PostgreSQL: pgsql/src/backend/executor/nodeBitmapIndexscan.c,v 1.18 2006/05/23 15:21:52 tgl Exp $`
	`11`	`+ * $PostgreSQL: pgsql/src/backend/executor/nodeBitmapIndexscan.c,v 1.19 2006/05/30 14:01:58 momjian Exp $`
`12`	`12`	`*`
`13`	`13`	`*-------------------------------------------------------------------------`
`14`	`14`	`*/`
`@@ -112,7 +112,7 @@ MultiExecBitmapIndexScan(BitmapIndexScanState *node)`
`112`	`112`
`113`	`113`	`/* must provide our own instrumentation support */`
`114`	`114`	`if (node->ss.ps.instrument)`
`115`		`-InstrStopNodeMulti(node->ss.ps.instrument,nTuples);`
	`115`	`+InstrStopNode(node->ss.ps.instrument,nTuples);`
`116`	`116`
`117`	`117`	`return (Node*)tbm;`
`118`	`118`	`}`

`‎src/backend/executor/nodeBitmapOr.c‎`

Lines changed: 2 additions & 2 deletions

Original file line number	Diff line number	Diff line change
`@@ -8,7 +8,7 @@`
`8`	`8`	`*`
`9`	`9`	`*`
`10`	`10`	`* IDENTIFICATION`
`11`		`- * $PostgreSQL: pgsql/src/backend/executor/nodeBitmapOr.c,v 1.6 2006/05/23 15:21:52 tgl Exp $`
	`11`	`+ * $PostgreSQL: pgsql/src/backend/executor/nodeBitmapOr.c,v 1.7 2006/05/30 14:01:58 momjian Exp $`
`12`	`12`	`*`
`13`	`13`	`*-------------------------------------------------------------------------`
`14`	`14`	`*/`
`@@ -177,7 +177,7 @@ MultiExecBitmapOr(BitmapOrState *node)`
`177`	`177`
`178`	`178`	`/* must provide our own instrumentation support */`
`179`	`179`	`if (node->ps.instrument)`
`180`		`-InstrStopNodeMulti(node->ps.instrument,0/* XXX */ );`
	`180`	`+InstrStopNode(node->ps.instrument,0/* XXX */ );`
`181`	`181`
`182`	`182`	`return (Node*)result;`
`183`	`183`	`}`

`‎src/backend/executor/nodeHash.c‎`

Lines changed: 2 additions & 2 deletions

Original file line number	Diff line number	Diff line change
`@@ -8,7 +8,7 @@`
`8`	`8`	`*`
`9`	`9`	`*`
`10`	`10`	`* IDENTIFICATION`
`11`		`- * $PostgreSQL: pgsql/src/backend/executor/nodeHash.c,v 1.102 2006/05/23 15:21:52 tgl Exp $`
	`11`	`+ * $PostgreSQL: pgsql/src/backend/executor/nodeHash.c,v 1.103 2006/05/30 14:01:58 momjian Exp $`
`12`	`12`	`*`
`13`	`13`	`*-------------------------------------------------------------------------`
`14`	`14`	`*/`
`@@ -97,7 +97,7 @@ MultiExecHash(HashState *node)`
`97`	`97`
`98`	`98`	`/* must provide our own instrumentation support */`
`99`	`99`	`if (node->ps.instrument)`
`100`		`-InstrStopNodeMulti(node->ps.instrument,hashtable->totalTuples);`
	`100`	`+InstrStopNode(node->ps.instrument,hashtable->totalTuples);`
`101`	`101`
`102`	`102`	`/*`
`103`	`103`	`* We do not return the hash table directly because it's not a subtype of`

`‎src/include/executor/instrument.h‎`

Lines changed: 7 additions & 3 deletions

Original file line number	Diff line number	Diff line change
`@@ -6,7 +6,7 @@`
`6`	`6`	`*`
`7`	`7`	`* Copyright (c) 2001-2006, PostgreSQL Global Development Group`
`8`	`8`	`*`
`9`		`- * $PostgreSQL: pgsql/src/include/executor/instrument.h,v 1.13 2006/03/05 15:58:56 momjian Exp $`
	`9`	`+ * $PostgreSQL: pgsql/src/include/executor/instrument.h,v 1.14 2006/05/30 14:01:58 momjian Exp $`
`10`	`10`	`*`
`11`	`11`	`*-------------------------------------------------------------------------`
`12`	`12`	`*/`
`@@ -61,17 +61,21 @@ typedef struct Instrumentation`
`61`	`61`	`instr_timecounter;/* Accumulated runtime for this node */`
`62`	`62`	`doublefirsttuple;/* Time for first tuple of this cycle */`
`63`	`63`	`doubletuplecount;/* Tuples emitted so far this cycle */`
	`64`	`+doublesamplecount;/* Samples collected this cycle */`
`64`	`65`	`/* Accumulated statistics across all completed cycles: */`
`65`	`66`	`doublestartup;/* Total startup time (in seconds) */`
`66`	`67`	`doubletotal;/* Total total time (in seconds) */`
`67`	`68`	`doublentuples;/* Total tuples produced */`
`68`	`69`	`doublenloops;/* # of run cycles for this node */`
	`70`	`+doublensamples;/* # of samples taken */`
	`71`	`+/* Tracking for sampling */`
	`72`	`+boolsampling;/* Are we sampling this iteration */`
	`73`	`+doublenextsample;/* The next tuplecount we're going to sample */`
`69`	`74`	`}Instrumentation;`
`70`	`75`
`71`	`76`	`externInstrumentation*InstrAlloc(intn);`
`72`	`77`	`externvoidInstrStartNode(Instrumentation*instr);`
`73`		`-externvoidInstrStopNode(Instrumentation*instr,boolreturnedTuple);`
`74`		`-externvoidInstrStopNodeMulti(Instrumentation*instr,doublenTuples);`
	`78`	`+externvoidInstrStopNode(Instrumentation*instr,doublenTuples);`
`75`	`79`	`externvoidInstrEndLoop(Instrumentation*instr);`
`76`	`80`
`77`	`81`	`#endif/* INSTRUMENT_H */`

0 commit comments

Comments

(0)

[8]ページ先頭

©2009-2025 Movatter.jp