  *
  *
  * IDENTIFICATION
- *    $PostgreSQL: pgsql/src/backend/storage/lmgr/s_lock.c,v 1.38 2005/08/26 14:47:35 tgl Exp $
+ *    $PostgreSQL: pgsql/src/backend/storage/lmgr/s_lock.c,v 1.39 2005/10/11 20:41:32 tgl Exp $
  *
  *-------------------------------------------------------------------------
  */
 #include "storage/s_lock.h"
 #include "miscadmin.h"

+
+static int spins_per_delay = DEFAULT_SPINS_PER_DELAY;
+
+
 /*
  * s_lock_stuck() - complain about a stuck spinlock
  */
@@ -49,54 +53,67 @@ s_lock(volatile slock_t *lock, const char *file, int line)
  * We loop tightly for awhile, then delay using pg_usleep() and try
  * again. Preferably, "awhile" should be a small multiple of the
  * maximum time we expect a spinlock to be held. 100 iterations seems
- * about right. In most multi-CPU scenarios, the spinlock is probably
- * held by a process on another CPU and will be released before we
- * finish 100 iterations. However, on a uniprocessor, the tight loop
- * is just a waste of cycles, so don't iterate thousands of times.
+ * about right as an initial guess. However, on a uniprocessor the
+ * loop is a waste of cycles, while in a multi-CPU scenario it's usually
+ * better to spin a bit longer than to call the kernel, so we try to
+ * adapt the spin loop count depending on whether we seem to be in
+ * a uniprocessor or multiprocessor.
+ *
+ * Note: you might think MIN_SPINS_PER_DELAY should be just 1, but you'd
+ * be wrong; there are platforms where that can result in a "stuck
+ * spinlock" failure. This has been seen particularly on Alphas; it
+ * seems that the first TAS after returning from kernel space will always
+ * fail on that hardware.
  *
  * Once we do decide to block, we use randomly increasing pg_usleep()
- * delays. The first delay is 10 msec, then the delay randomly
- * increases to about one second, after which we reset to 10 msec and
+ * delays. The first delay is 1 msec, then the delay randomly
+ * increases to about one second, after which we reset to 1 msec and
  * start again. The idea here is that in the presence of heavy
  * contention we need to increase the delay, else the spinlock holder
  * may never get to run and release the lock. (Consider situation
  * where spinlock holder has been nice'd down in priority by the
  * scheduler --- it will not get scheduled until all would-be
- * acquirers are sleeping, so if we always use a 10-msec sleep, there
+ * acquirers are sleeping, so if we always use a 1-msec sleep, there
  * is a real possibility of starvation.) But we can't just clamp the
  * delay to an upper bound, else it would take a long time to make a
  * reasonable number of tries.
  *
  * We time out and declare error after NUM_DELAYS delays (thus, exactly
  * that many tries). With the given settings, this will usually take
- * 3 or so minutes. It seems better to fix the total number of tries
+ * 2 or so minutes. It seems better to fix the total number of tries
  * (and thus the probability of unintended failure) than to fix the
  * total time spent.
  *
- * The pg_usleep() delays are measured in centiseconds (0.01 sec) because
- * 10 msec is a common resolution limit at the OS level.
+ * The pg_usleep() delays are measured in milliseconds because 1 msec
+ * is a common resolution limit at the OS level for newer platforms.
+ * On older platforms the resolution limit is usually 10 msec, in
+ * which case the total delay before timeout will be a bit more.
  */
-#define SPINS_PER_DELAY     100
+#define MIN_SPINS_PER_DELAY 10
+#define MAX_SPINS_PER_DELAY 1000
 #define NUM_DELAYS          1000
-#define MIN_DELAY_CSEC      1
-#define MAX_DELAY_CSEC      100
+#define MIN_DELAY_MSEC      1
+#define MAX_DELAY_MSEC      1000

     int spins = 0;
     int delays = 0;
-    int cur_delay = MIN_DELAY_CSEC;
+    int cur_delay = 0;

     while (TAS(lock))
     {
         /* CPU-specific delay each time through the loop */
         SPIN_DELAY();

-        /* Block the process every SPINS_PER_DELAY tries */
-        if (++spins > SPINS_PER_DELAY)
+        /* Block the process every spins_per_delay tries */
+        if (++spins >= spins_per_delay)
         {
             if (++delays > NUM_DELAYS)
                 s_lock_stuck(lock, file, line);

-            pg_usleep(cur_delay * 10000L);
+            if (cur_delay == 0)     /* first time to delay? */
+                cur_delay = MIN_DELAY_MSEC;
+
+            pg_usleep(cur_delay * 1000L);

 #if defined(S_LOCK_TEST)
             fprintf(stdout, "*");
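
As a rough check on the "2 or so minutes" figure in the comment above, the following standalone sketch (not part of this patch) simulates the delay schedule it describes: start at MIN_DELAY_MSEC, grow each delay by a random fraction between 1x and 2x, wrap back to the minimum once MAX_DELAY_MSEC is exceeded, and sum the requested sleeps over NUM_DELAYS delays. MAX_RANDOM_VALUE is assumed here to be 2^31 - 1; in PostgreSQL it comes from c.h.

/*
 * Standalone sketch: total sleep time implied by the randomized backoff
 * schedule described in the s_lock() comment.  Not part of s_lock.c.
 */
#include <stdio.h>
#include <stdlib.h>

#define MIN_DELAY_MSEC      1
#define MAX_DELAY_MSEC      1000
#define NUM_DELAYS          1000
#define MAX_RANDOM_VALUE    0x7FFFFFFF  /* assumption: 2^31 - 1, as in c.h */

int
main(void)
{
    long    total_msec = 0;
    int     cur_delay = 0;
    int     i;

    for (i = 0; i < NUM_DELAYS; i++)
    {
        if (cur_delay == 0)             /* first delay is the minimum */
            cur_delay = MIN_DELAY_MSEC;

        total_msec += cur_delay;        /* what pg_usleep() would be asked for */

        /* grow the delay by a random fraction between 1x and 2x */
        cur_delay += (int) (cur_delay *
                            ((double) random() / (double) MAX_RANDOM_VALUE) + 0.5);
        if (cur_delay > MAX_DELAY_MSEC)
            cur_delay = MIN_DELAY_MSEC; /* wrap back to the minimum */
    }

    /* typically prints a figure in the neighborhood of two minutes */
    printf("total sleep over %d delays: ~%ld seconds\n",
           NUM_DELAYS, total_msec / 1000);
    return 0;
}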
@@ -107,14 +124,76 @@ s_lock(volatile slock_t *lock, const char *file, int line)
             cur_delay += (int) (cur_delay *
                     (((double) random()) / ((double) MAX_RANDOM_VALUE)) + 0.5);
             /* wrap back to minimum delay when max is exceeded */
-            if (cur_delay > MAX_DELAY_CSEC)
-                cur_delay = MIN_DELAY_CSEC;
+            if (cur_delay > MAX_DELAY_MSEC)
+                cur_delay = MIN_DELAY_MSEC;

             spins = 0;
         }
     }
+
+    /*
+     * If we were able to acquire the lock without delaying, it's a good
+     * indication we are in a multiprocessor. If we had to delay, it's
+     * a sign (but not a sure thing) that we are in a uniprocessor.
+     * Hence, we decrement spins_per_delay slowly when we had to delay,
+     * and increase it rapidly when we didn't. It's expected that
+     * spins_per_delay will converge to the minimum value on a uniprocessor
+     * and to the maximum value on a multiprocessor.
+     *
+     * Note: spins_per_delay is local within our current process.
+     * We want to average these observations across multiple backends,
+     * since it's relatively rare for this function to even get entered,
+     * and so a single backend might not live long enough to converge on
+     * a good value. That is handled by the two routines below.
+     */
+    if (cur_delay == 0)
+    {
+        /* we never had to delay */
+        if (spins_per_delay < MAX_SPINS_PER_DELAY)
+            spins_per_delay = Min(spins_per_delay + 100, MAX_SPINS_PER_DELAY);
+    }
+    else
+    {
+        if (spins_per_delay > MIN_SPINS_PER_DELAY)
+            spins_per_delay = Max(spins_per_delay - 1, MIN_SPINS_PER_DELAY);
+    }
+}
+
+
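To see why the rules above count as "increase rapidly, decrement slowly", here is a small standalone sketch of the same +100 / -1 adjustments (the starting value of 100 is an illustrative assumption, not taken from this patch): a handful of no-delay acquisitions saturates the estimate at MAX_SPINS_PER_DELAY, while decaying back to MIN_SPINS_PER_DELAY takes nearly a thousand delayed acquisitions.

/*
 * Standalone sketch of the asymmetric spins_per_delay adjustment.
 * Min()/Max() normally come from PostgreSQL's c.h; defined locally here.
 */
#include <stdio.h>

#define MIN_SPINS_PER_DELAY 10
#define MAX_SPINS_PER_DELAY 1000
#define Min(x, y) ((x) < (y) ? (x) : (y))
#define Max(x, y) ((x) > (y) ? (x) : (y))

int
main(void)
{
    int     spd = 100;              /* assumed starting estimate */
    int     steps;

    /* every acquisition succeeds without delaying: +100 per call */
    for (steps = 0; spd < MAX_SPINS_PER_DELAY; steps++)
        spd = Min(spd + 100, MAX_SPINS_PER_DELAY);
    printf("no-delay acquisitions to reach max: %d\n", steps);   /* 9 */

    /* every acquisition has to delay: -1 per call */
    for (steps = 0; spd > MIN_SPINS_PER_DELAY; steps++)
        spd = Max(spd - 1, MIN_SPINS_PER_DELAY);
    printf("delayed acquisitions to reach min:  %d\n", steps);   /* 990 */

    return 0;
}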
+/*
+ * Set local copy of spins_per_delay during backend startup.
+ *
+ * NB: this has to be pretty fast as it is called while holding a spinlock
+ */
+void
+set_spins_per_delay(int shared_spins_per_delay)
+{
+    spins_per_delay = shared_spins_per_delay;
+}
+
+/*
+ * Update shared estimate of spins_per_delay during backend exit.
+ *
+ * NB: this has to be pretty fast as it is called while holding a spinlock
+ */
+int
+update_spins_per_delay(int shared_spins_per_delay)
+{
+    /*
+     * We use an exponential moving average with a relatively slow
+     * adaption rate, so that noise in any one backend's result won't
+     * affect the shared value too much. As long as both inputs are
+     * within the allowed range, the result must be too, so we need not
+     * worry about clamping the result.
+     *
+     * We deliberately truncate rather than rounding; this is so that
+     * single adjustments inside a backend can affect the shared estimate
+     * (see the asymmetric adjustment rules above).
+     */
+    return (shared_spins_per_delay * 15 + spins_per_delay) / 16;
 }
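
A short standalone sketch of how the shared estimate behaves under this update rule (the numbers are illustrative only): because the average truncates, a backend whose local estimate dropped by just 1 still pulls the shared value down by 1, while a backend reporting a very different value moves the shared estimate only gradually, by roughly 1/16th of the gap per exit.

/*
 * Standalone sketch of the (shared * 15 + local) / 16 moving average.
 * Not part of s_lock.c; values chosen only for illustration.
 */
#include <stdio.h>

static int
update(int shared, int local)
{
    return (shared * 15 + local) / 16;      /* same formula as above */
}

int
main(void)
{
    int     shared = 100;
    int     i;

    /* truncation lets a single -1 local adjustment reach the shared value */
    printf("shared=100, local=99  -> %d\n", update(100, 99));    /* 99 */

    /* a very different local value moves the shared estimate only slowly */
    for (i = 0; i < 20; i++)
        shared = update(shared, 1000);
    printf("after 20 exits reporting 1000: %d\n", shared);  /* still well below 1000 */

    return 0;
}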

+
 /*
  * Various TAS implementations that cannot live in s_lock.h as no inline
  * definition exists (yet).