NotificationsYou must be signed in to change notification settings
Fork6
Star31

Commit eddbf39

committed

Extend yesterday's patch so that the bgwriter is also told to forget pending fsyncs during DROP DATABASE. Obviously necessary in hindsight :-(

1 parent 530b10c, commit eddbf39 (Copy full SHA for eddbf39)

File tree

4 files changed

+124

-55

lines changed

src
- backend
  - commands
    - dbcommands.c
  - postmaster
    - bgwriter.c
  - storage/smgr
    - md.c
- include/storage
  - smgr.h

4 files changed

+124

-55

lines changed

`‎src/backend/commands/dbcommands.c‎`

Lines changed: 8 additions & 1 deletion

Original file line number	Diff line number	Diff line change
`@@ -13,7 +13,7 @@`
`13`	`13`	`*`
`14`	`14`	`*`
`15`	`15`	`* IDENTIFICATION`
`16`		`- * $PostgreSQL: pgsql/src/backend/commands/dbcommands.c,v 1.189 2007/01/16 13:28:56 alvherre Exp $`
	`16`	`+ * $PostgreSQL: pgsql/src/backend/commands/dbcommands.c,v 1.190 2007/01/17 16:25:01 tgl Exp $`
`17`	`17`	`*`
`18`	`18`	`*-------------------------------------------------------------------------`
`19`	`19`	`*/`
`@@ -40,6 +40,7 @@`
`40`	`40`	`#include"postmaster/bgwriter.h"`
`41`	`41`	`#include"storage/freespace.h"`
`42`	`42`	`#include"storage/procarray.h"`
	`43`	`+#include"storage/smgr.h"`
`43`	`44`	`#include"utils/acl.h"`
`44`	`45`	`#include"utils/builtins.h"`
`45`	`46`	`#include"utils/flatfiles.h"`
`@@ -643,6 +644,12 @@ dropdb(const char *dbname, bool missing_ok)`
`643`	`644`	`*/`
`644`	`645`	`FreeSpaceMapForgetDatabase(db_id);`
`645`	`646`
	`647`	`+/*`
	`648`	`+ * Tell bgwriter to forget any pending fsync requests for files in the`
	`649`	`+ * database; else it'll fail at next checkpoint.`
	`650`	`+ */`
	`651`	`+ForgetDatabaseFsyncRequests(db_id);`
	`652`	`+`
`646`	`653`	`/*`
`647`	`654`	`* On Windows, force a checkpoint so that the bgwriter doesn't hold any`
`648`	`655`	`* open files, which would cause rmdir() to fail.`

`‎src/backend/postmaster/bgwriter.c‎`

Lines changed: 7 additions & 7 deletions

Original file line number	Diff line number	Diff line change
`@@ -37,7 +37,7 @@`
`37`	`37`	`*`
`38`	`38`	`*`
`39`	`39`	`* IDENTIFICATION`
`40`		`- * $PostgreSQL: pgsql/src/backend/postmaster/bgwriter.c,v 1.35 2007/01/17 00:17:20 tgl Exp $`
	`40`	`+ * $PostgreSQL: pgsql/src/backend/postmaster/bgwriter.c,v 1.36 2007/01/17 16:25:01 tgl Exp $`
`41`	`41`	`*`
`42`	`42`	`*-------------------------------------------------------------------------`
`43`	`43`	`*/`
`@@ -103,7 +103,7 @@`
`103`	`103`	`typedefstruct`
`104`	`104`	`{`
`105`	`105`	`RelFileNodernode;`
`106`		`-BlockNumbersegno;/* InvalidBlockNumber means "revoke" */`
	`106`	`+BlockNumbersegno;/* see md.c for special values */`
`107`	`107`	`/* might add a real request-type field later; not needed yet */`
`108`	`108`	`}BgWriterRequest;`
`109`	`109`
`@@ -695,16 +695,16 @@ RequestCheckpoint(bool waitforit, bool warnontime)`
`695`	`695`	`* ForwardFsyncRequest`
`696`	`696`	`*Forward a file-fsync request from a backend to the bgwriter`
`697`	`697`	`*`
`698`		`- * segno specifies which segment (not block!) of the relation needs to be`
`699`		`- * fsync'd. If segno == InvalidBlockNumber, the meaning is to revoke any`
`700`		`- * pending fsync requests for the entire relation (this message is sent`
`701`		`- * when the relation is about to be deleted).`
`702`		`- *`
`703`	`698`	`* Whenever a backend is compelled to write directly to a relation`
`704`	`699`	`* (which should be seldom, if the bgwriter is getting its job done),`
`705`	`700`	`* the backend calls this routine to pass over knowledge that the relation`
`706`	`701`	`* is dirty and must be fsync'd before next checkpoint.`
`707`	`702`	`*`
	`703`	`+ * segno specifies which segment (not block!) of the relation needs to be`
	`704`	`+ * fsync'd. (Since the valid range is much less than BlockNumber, we can`
	`705`	`+ * use high values for special flags; that's all internal to md.c, which`
	`706`	`+ * see for details.)`
	`707`	`+ *`
`708`	`708`	`* If we are unable to pass over the request (at present, this can happen`
`709`	`709`	`* if the shared memory queue is full), we return false. That forces`
`710`	`710`	`* the backend to do its own fsync. We hope that will be even more seldom.`

`‎src/backend/storage/smgr/md.c‎`

Lines changed: 106 additions & 46 deletions

Original file line number	Diff line number	Diff line change
`@@ -8,7 +8,7 @@`
`8`	`8`	`*`
`9`	`9`	`*`
`10`	`10`	`* IDENTIFICATION`
`11`		`- * $PostgreSQL: pgsql/src/backend/storage/smgr/md.c,v 1.126 2007/01/17 00:17:21 tgl Exp $`
	`11`	`+ * $PostgreSQL: pgsql/src/backend/storage/smgr/md.c,v 1.127 2007/01/17 16:25:01 tgl Exp $`
`12`	`12`	`*`
`13`	`13`	`*-------------------------------------------------------------------------`
`14`	`14`	`*/`
`@@ -31,6 +31,10 @@`
`31`	`31`	`/* interval for calling AbsorbFsyncRequests in mdsync */`
`32`	`32`	`#defineFSYNCS_PER_ABSORB10`
`33`	`33`
	`34`	`+/* special values for the segno arg to RememberFsyncRequest */`
	`35`	`+#defineFORGET_RELATION_FSYNC(InvalidBlockNumber)`
	`36`	`+#defineFORGET_DATABASE_FSYNC(InvalidBlockNumber-1)`
	`37`	`+`
`34`	`38`	`/*`
`35`	`39`	`* On Windows, we have to interpret EACCES as possibly meaning the same as`
`36`	`40`	`* ENOENT, because if a file is unlinked-but-not-yet-gone on that platform,`
`@@ -258,30 +262,7 @@ mdunlink(RelFileNode rnode, bool isRedo)`
`258`	`262`	`* We have to clean out any pending fsync requests for the doomed relation,`
`259`	`263`	`* else the next mdsync() will fail.`
`260`	`264`	`*/`
`261`		`-if (pendingOpsTable)`
`262`		`-{`
`263`		`-/* standalone backend or startup process: fsync state is local */`
`264`		`-RememberFsyncRequest(rnode,InvalidBlockNumber);`
`265`		`-}`
`266`		`-elseif (IsUnderPostmaster)`
`267`		`-{`
`268`		`-/*`
`269`		`- * Notify the bgwriter about it. If we fail to queue the revoke`
`270`		`- * message, we have to sleep and try again ... ugly, but hopefully`
`271`		`- * won't happen often.`
`272`		`- *`
`273`		`- * XXX should we CHECK_FOR_INTERRUPTS in this loop? Escaping with`
`274`		`- * an error would leave the no-longer-used file still present on`
`275`		`- * disk, which would be bad, so I'm inclined to assume that the`
`276`		`- * bgwriter will always empty the queue soon.`
`277`		`- */`
`278`		`-while (!ForwardFsyncRequest(rnode,InvalidBlockNumber))`
`279`		`-pg_usleep(10000L);/* 10 msec seems a good number */`
`280`		`-/*`
`281`		`- * Note we don't wait for the bgwriter to actually absorb the`
`282`		`- * revoke message; see mdsync() for the implications.`
`283`		`- */`
`284`		`-}`
	`265`	`+ForgetRelationFsyncRequests(rnode);`
`285`	`266`
`286`	`267`	`path=relpath(rnode);`
`287`	`268`
`@@ -894,7 +875,8 @@ mdsync(void)`
`894`	`875`	`* what we will do is retry the whole process after absorbing fsync`
`895`	`876`	`* request messages again. Since mdunlink() queues a "revoke" message`
`896`	`877`	`* before actually unlinking, the fsync request is guaranteed to be gone`
`897`		`- * the second time if it really was this case.`
	`878`	`+ * the second time if it really was this case. DROP DATABASE likewise`
	`879`	`+ * has to tell us to forget fsync requests before it starts deletions.`
`898`	`880`	`*/`
`899`	`881`	`do {`
`900`	`882`	`HASH_SEQ_STATUShstat;`
`@@ -1043,17 +1025,58 @@ register_dirty_segment(SMgrRelation reln, MdfdVec *seg)`
`1043`	`1025`	`* We stuff the fsync request into the local hash table for execution`
`1044`	`1026`	`* during the bgwriter's next checkpoint.`
`1045`	`1027`	`*`
`1046`		`- * segno == InvalidBlockNumber is a "revoke" request: remove any pending`
`1047`		`- * fsync requests for the whole relation.`
	`1028`	`+ * The range of possible segment numbers is way less than the range of`
	`1029`	`+ * BlockNumber, so we can reserve high values of segno for special purposes.`
	`1030`	`+ * We define two: FORGET_RELATION_FSYNC means to drop pending fsyncs for`
	`1031`	`+ * a relation, and FORGET_DATABASE_FSYNC means to drop pending fsyncs for`
	`1032`	`+ * a whole database. (These are a tad slow because the hash table has to be`
	`1033`	`+ * searched linearly, but it doesn't seem worth rethinking the table structure`
	`1034`	`+ * for them.)`
`1048`	`1035`	`*/`
`1049`	`1036`	`void`
`1050`	`1037`	`RememberFsyncRequest(RelFileNodernode,BlockNumbersegno)`
`1051`	`1038`	`{`
`1052`	`1039`	`Assert(pendingOpsTable);`
`1053`	`1040`
`1054`		`-if (segno!=InvalidBlockNumber)`
	`1041`	`+if (segno==FORGET_RELATION_FSYNC)`
	`1042`	`+{`
	`1043`	`+/* Remove any pending requests for the entire relation */`
	`1044`	`+HASH_SEQ_STATUShstat;`
	`1045`	`+PendingOperationEntry*entry;`
	`1046`	`+`
	`1047`	`+hash_seq_init(&hstat,pendingOpsTable);`
	`1048`	`+while ((entry= (PendingOperationEntry*)hash_seq_search(&hstat))!=NULL)`
	`1049`	`+{`
	`1050`	`+if (RelFileNodeEquals(entry->tag.rnode,rnode))`
	`1051`	`+{`
	`1052`	`+/* Okay, delete this entry */`
	`1053`	`+if (hash_search(pendingOpsTable,&entry->tag,`
	`1054`	`+HASH_REMOVE,NULL)==NULL)`
	`1055`	`+elog(ERROR,"pendingOpsTable corrupted");`
	`1056`	`+}`
	`1057`	`+}`
	`1058`	`+}`
	`1059`	`+elseif (segno==FORGET_DATABASE_FSYNC)`
	`1060`	`+{`
	`1061`	`+/* Remove any pending requests for the entire database */`
	`1062`	`+HASH_SEQ_STATUShstat;`
	`1063`	`+PendingOperationEntry*entry;`
	`1064`	`+`
	`1065`	`+hash_seq_init(&hstat,pendingOpsTable);`
	`1066`	`+while ((entry= (PendingOperationEntry*)hash_seq_search(&hstat))!=NULL)`
	`1067`	`+{`
	`1068`	`+if (entry->tag.rnode.dbNode==rnode.dbNode)`
	`1069`	`+{`
	`1070`	`+/* Okay, delete this entry */`
	`1071`	`+if (hash_search(pendingOpsTable,&entry->tag,`
	`1072`	`+HASH_REMOVE,NULL)==NULL)`
	`1073`	`+elog(ERROR,"pendingOpsTable corrupted");`
	`1074`	`+}`
	`1075`	`+}`
	`1076`	`+}`
	`1077`	`+else`
`1055`	`1078`	`{`
`1056`		`-/* Enter a request to fsync this segment */`
	`1079`	`+/* Normal case: enter a request to fsync this segment */`
`1057`	`1080`	`PendingOperationTagkey;`
`1058`	`1081`	`PendingOperationEntry*entry;`
`1059`	`1082`	`boolfound;`
`@@ -1070,29 +1093,66 @@ RememberFsyncRequest(RelFileNode rnode, BlockNumber segno)`
`1070`	`1093`	`if (!found)/* new entry, so initialize it */`
`1071`	`1094`	`entry->failures=0;`
`1072`	`1095`	`}`
`1073`		`-else`
	`1096`	`+}`
	`1097`	`+`
	`1098`	`+/*`
	`1099`	`+ * ForgetRelationFsyncRequests -- ensure any fsyncs for a rel are forgotten`
	`1100`	`+ */`
	`1101`	`+void`
	`1102`	`+ForgetRelationFsyncRequests(RelFileNodernode)`
	`1103`	`+{`
	`1104`	`+if (pendingOpsTable)`
	`1105`	`+{`
	`1106`	`+/* standalone backend or startup process: fsync state is local */`
	`1107`	`+RememberFsyncRequest(rnode,FORGET_RELATION_FSYNC);`
	`1108`	`+}`
	`1109`	`+elseif (IsUnderPostmaster)`
`1074`	`1110`	`{`
`1075`	`1111`	`/*`
`1076`		`- * Remove any pending requests for the entire relation. (This is a`
`1077`		`- * tad slow but it doesn't seem worth rethinking the table structure.)`
	`1112`	`+ * Notify the bgwriter about it. If we fail to queue the revoke`
	`1113`	`+ * message, we have to sleep and try again ... ugly, but hopefully`
	`1114`	`+ * won't happen often.`
	`1115`	`+ *`
	`1116`	`+ * XXX should we CHECK_FOR_INTERRUPTS in this loop? Escaping with`
	`1117`	`+ * an error would leave the no-longer-used file still present on`
	`1118`	`+ * disk, which would be bad, so I'm inclined to assume that the`
	`1119`	`+ * bgwriter will always empty the queue soon.`
`1078`	`1120`	`*/`
`1079`		`-HASH_SEQ_STATUShstat;`
`1080`		`-PendingOperationEntry*entry;`
	`1121`	`+while (!ForwardFsyncRequest(rnode,FORGET_RELATION_FSYNC))`
	`1122`	`+pg_usleep(10000L);/* 10 msec seems a good number */`
	`1123`	`+/*`
	`1124`	`+ * Note we don't wait for the bgwriter to actually absorb the`
	`1125`	`+ * revoke message; see mdsync() for the implications.`
	`1126`	`+ */`
	`1127`	`+}`
	`1128`	`+}`
`1081`	`1129`
`1082`		`-hash_seq_init(&hstat,pendingOpsTable);`
`1083`		`-while ((entry= (PendingOperationEntry*)hash_seq_search(&hstat))!=NULL)`
`1084`		`-{`
`1085`		`-if (RelFileNodeEquals(entry->tag.rnode,rnode))`
`1086`		`-{`
`1087`		`-/* Okay, delete this entry */`
`1088`		`-if (hash_search(pendingOpsTable,&entry->tag,`
`1089`		`-HASH_REMOVE,NULL)==NULL)`
`1090`		`-elog(ERROR,"pendingOpsTable corrupted");`
`1091`		`-}`
`1092`		`-}`
	`1130`	`+/*`
	`1131`	`+ * ForgetDatabaseFsyncRequests -- ensure any fsyncs for a DB are forgotten`
	`1132`	`+ */`
	`1133`	`+void`
	`1134`	`+ForgetDatabaseFsyncRequests(Oiddbid)`
	`1135`	`+{`
	`1136`	`+RelFileNodernode;`
	`1137`	`+`
	`1138`	`+rnode.dbNode=dbid;`
	`1139`	`+rnode.spcNode=0;`
	`1140`	`+rnode.relNode=0;`
	`1141`	`+`
	`1142`	`+if (pendingOpsTable)`
	`1143`	`+{`
	`1144`	`+/* standalone backend or startup process: fsync state is local */`
	`1145`	`+RememberFsyncRequest(rnode,FORGET_DATABASE_FSYNC);`
	`1146`	`+}`
	`1147`	`+elseif (IsUnderPostmaster)`
	`1148`	`+{`
	`1149`	`+/* see notes in ForgetRelationFsyncRequests */`
	`1150`	`+while (!ForwardFsyncRequest(rnode,FORGET_DATABASE_FSYNC))`
	`1151`	`+pg_usleep(10000L);/* 10 msec seems a good number */`
`1093`	`1152`	`}`
`1094`	`1153`	`}`
`1095`	`1154`
	`1155`	`+`
`1096`	`1156`	`/*`
`1097`	`1157`	`*_fdvec_alloc() -- Make a MdfdVec object.`
`1098`	`1158`	`*/`

`‎src/include/storage/smgr.h‎`

Lines changed: 3 additions & 1 deletion

Original file line number	Diff line number	Diff line change
`@@ -7,7 +7,7 @@`
`7`	`7`	`* Portions Copyright (c) 1996-2007, PostgreSQL Global Development Group`
`8`	`8`	`* Portions Copyright (c) 1994, Regents of the University of California`
`9`	`9`	`*`
`10`		`- * $PostgreSQL: pgsql/src/include/storage/smgr.h,v 1.57 2007/01/05 22:19:58 momjian Exp $`
	`10`	`+ * $PostgreSQL: pgsql/src/include/storage/smgr.h,v 1.58 2007/01/17 16:25:01 tgl Exp $`
`11`	`11`	`*`
`12`	`12`	`*-------------------------------------------------------------------------`
`13`	`13`	`*/`
`@@ -106,6 +106,8 @@ extern void mdimmedsync(SMgrRelation reln);`
`106`	`106`	`externvoidmdsync(void);`
`107`	`107`
`108`	`108`	`externvoidRememberFsyncRequest(RelFileNodernode,BlockNumbersegno);`
	`109`	`+externvoidForgetRelationFsyncRequests(RelFileNodernode);`
	`110`	`+externvoidForgetDatabaseFsyncRequests(Oiddbid);`
`109`	`111`
`110`	`112`	`/* smgrtype.c */`
`111`	`113`	`externDatumsmgrout(PG_FUNCTION_ARGS);`

0 commit comments

Comments

(0)

Movatterモバイル変換

Navigation Menu

Search code, repositories, users, issues, pull requests...

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Uh oh!

Commit eddbf39

File tree

4 files changed

4 files changed

`‎src/backend/commands/dbcommands.c‎`

`‎src/backend/postmaster/bgwriter.c‎`

`‎src/backend/storage/smgr/md.c‎`

`‎src/include/storage/smgr.h‎`

0 commit comments