diff options
author | Tom Lane <tgl@sss.pgh.pa.us> | 2000-11-28 23:27:57 +0000 |
---|---|---|
committer | Tom Lane <tgl@sss.pgh.pa.us> | 2000-11-28 23:27:57 +0000 |
commit | c715fdea267843fd7fae4253aee0ae91e941393c (patch) | |
tree | b19e41edd57afe461ebc3dae271c8a5d17eba710 /src/backend/storage/ipc | |
parent | 914822713c9a8ce452860fb895ef79ecfd583746 (diff) | |
download | postgresql-c715fdea267843fd7fae4253aee0ae91e941393c.tar.gz postgresql-c715fdea267843fd7fae4253aee0ae91e941393c.zip |
Significant cleanups in SysV IPC handling (shared mem and semaphores).
IPC key assignment will now work correctly even when multiple postmasters
are using the same logical port number (which is possible given the -k switch).
There is only one shared-mem segment per postmaster now, not 3.
Rip out the broken code for the non-TAS case in bufmgr and xlog, and substitute a
complete S_LOCK emulation using semaphores in spin.c. The TAS and non-TAS
logic is now exactly the same.
When deadlock is detected, "Deadlock detected" is now the elog(ERROR)
message, rather than a NOTICE that comes out before an unhelpful ERROR.
Diffstat (limited to 'src/backend/storage/ipc')
-rw-r--r-- | src/backend/storage/ipc/ipc.c | 830 | ||||
-rw-r--r-- | src/backend/storage/ipc/ipci.c | 147 | ||||
-rw-r--r-- | src/backend/storage/ipc/shmem.c | 266 | ||||
-rw-r--r-- | src/backend/storage/ipc/sinval.c | 43 | ||||
-rw-r--r-- | src/backend/storage/ipc/sinvaladt.c | 95 | ||||
-rw-r--r-- | src/backend/storage/ipc/spin.c | 403 |
6 files changed, 838 insertions, 946 deletions
diff --git a/src/backend/storage/ipc/ipc.c b/src/backend/storage/ipc/ipc.c index 98d90bc62e0..920f7f9bfeb 100644 --- a/src/backend/storage/ipc/ipc.c +++ b/src/backend/storage/ipc/ipc.c @@ -8,7 +8,7 @@ * * * IDENTIFICATION - * $Header: /cvsroot/pgsql/src/backend/storage/ipc/ipc.c,v 1.53 2000/11/21 21:16:01 petere Exp $ + * $Header: /cvsroot/pgsql/src/backend/storage/ipc/ipc.c,v 1.54 2000/11/28 23:27:56 tgl Exp $ * * NOTES * @@ -30,6 +30,7 @@ #include <sys/types.h> #include <sys/file.h> #include <errno.h> +#include <unistd.h> #include "storage/ipc.h" #include "storage/s_lock.h" @@ -51,6 +52,7 @@ #include <sys/ipc.h> #endif + /* * This flag is set during proc_exit() to change elog()'s behavior, * so that an elog() from an on_proc_exit routine cannot get us out @@ -58,12 +60,31 @@ */ bool proc_exit_inprogress = false; -static int UsePrivateMemory = 0; +static IpcSemaphoreId InternalIpcSemaphoreCreate(IpcSemaphoreKey semKey, + int numSems, int permission, + int semStartValue, bool removeOnExit); +static void CallbackSemaphoreKill(int status, Datum semId); +static void *InternalIpcMemoryCreate(IpcMemoryKey memKey, uint32 size, + int permission); +static void IpcMemoryDetach(int status, Datum shmaddr); +static void IpcMemoryDelete(int status, Datum shmId); +static void *PrivateMemoryCreate(uint32 size); +static void PrivateMemoryDelete(int status, Datum memaddr); -static void IpcMemoryDetach(int status, char *shmaddr); /* ---------------------------------------------------------------- * exit() handling stuff + * + * These functions are in generally the same spirit as atexit(2), + * but provide some additional features we need --- in particular, + * we want to register callbacks to invoke when we are disconnecting + * from a broken shared-memory context but not exiting the postmaster. + * + * Callback functions can take zero, one, or two args: the first passed + * arg is the integer exitcode, the second is the Datum supplied when + * the callback was registered. 
+ * + * XXX these functions probably ought to live in some other module. * ---------------------------------------------------------------- */ @@ -73,43 +94,12 @@ static struct ONEXIT { void (*function) (); Datum arg; -} on_proc_exit_list[MAX_ON_EXITS], on_shmem_exit_list[MAX_ON_EXITS]; +} on_proc_exit_list[MAX_ON_EXITS], + on_shmem_exit_list[MAX_ON_EXITS]; static int on_proc_exit_index, on_shmem_exit_index; -typedef struct _PrivateMemStruct -{ - int id; - char *memptr; -} PrivateMem; - -static PrivateMem IpcPrivateMem[16]; - - -static int -PrivateMemoryCreate(IpcMemoryKey memKey, - uint32 size) -{ - static int memid = 0; - - UsePrivateMemory = 1; - - IpcPrivateMem[memid].id = memid; - IpcPrivateMem[memid].memptr = malloc(size); - if (IpcPrivateMem[memid].memptr == NULL) - elog(ERROR, "PrivateMemoryCreate: not enough memory to malloc"); - MemSet(IpcPrivateMem[memid].memptr, 0, size); /* XXX PURIFY */ - - return memid++; -} - -static char * -PrivateMemoryAttach(IpcMemoryId memid) -{ - return IpcPrivateMem[memid].memptr; -} - /* ---------------------------------------------------------------- * proc_exit @@ -156,9 +146,9 @@ proc_exit(int code) } /* ------------------ - * Run all of the on_shmem_exit routines but don't exit in the end. + * Run all of the on_shmem_exit routines --- but don't actually exit. * This is used by the postmaster to re-initialize shared memory and - * semaphores after a backend dies horribly + * semaphores after a backend dies horribly. * ------------------ */ void @@ -188,18 +178,16 @@ shmem_exit(int code) * functions invoked by proc_exit(). 
-cim 2/6/90 * ---------------------------------------------------------------- */ -int +void on_proc_exit(void (*function) (), Datum arg) { if (on_proc_exit_index >= MAX_ON_EXITS) - return -1; + elog(FATAL, "Out of on_proc_exit slots"); on_proc_exit_list[on_proc_exit_index].function = function; on_proc_exit_list[on_proc_exit_index].arg = arg; ++on_proc_exit_index; - - return 0; } /* ---------------------------------------------------------------- @@ -209,24 +197,25 @@ on_proc_exit(void (*function) (), Datum arg) * functions invoked by shmem_exit(). -cim 2/6/90 * ---------------------------------------------------------------- */ -int +void on_shmem_exit(void (*function) (), Datum arg) { if (on_shmem_exit_index >= MAX_ON_EXITS) - return -1; + elog(FATAL, "Out of on_shmem_exit slots"); on_shmem_exit_list[on_shmem_exit_index].function = function; on_shmem_exit_list[on_shmem_exit_index].arg = arg; ++on_shmem_exit_index; - - return 0; } /* ---------------------------------------------------------------- * on_exit_reset * - * this function clears all proc_exit() registered functions. + * this function clears all on_proc_exit() and on_shmem_exit() + * registered functions. This is used just after forking a backend, + * so that the backend doesn't believe it should call the postmaster's + * on-exit routines when it exits... * ---------------------------------------------------------------- */ void @@ -236,190 +225,135 @@ on_exit_reset(void) on_proc_exit_index = 0; } -/****************************************************************************/ -/* IPCPrivateSemaphoreKill(status, semId) */ -/* */ -/****************************************************************************/ -static void -IPCPrivateSemaphoreKill(int status, int semId) -{ - union semun semun; - semun.val = 0; /* unused */ - - if (semctl(semId, 0, IPC_RMID, semun) == -1) - elog(NOTICE, "IPCPrivateSemaphoreKill: semctl(%d, 0, IPC_RMID, ...) 
failed: %s", - semId, strerror(errno)); -} - - -/****************************************************************************/ -/* IPCPrivateMemoryKill(status, shmId) */ -/* */ -/****************************************************************************/ -static void -IPCPrivateMemoryKill(int status, int shmId) -{ - if (UsePrivateMemory) - { - /* free ( IpcPrivateMem[shmId].memptr ); */ - } - else - { - if (shmctl(shmId, IPC_RMID, (struct shmid_ds *) NULL) < 0) - { - elog(NOTICE, "IPCPrivateMemoryKill: shmctl(%d, %d, 0) failed: %m", - shmId, IPC_RMID); - } - } -} -/* - * Note: - * XXX This should be split into two different calls. One should - * XXX be used to create a semaphore set. The other to "attach" a - * XXX existing set. It should be an error for the semaphore set - * XXX to to already exist or for it not to, respectively. +/* ---------------------------------------------------------------- + * Semaphore support * - * Currently, the semaphore sets are "attached" and an error - * is detected only when a later shared memory attach fails. + * These routines represent a fairly thin layer on top of SysV semaphore + * functionality. + * ---------------------------------------------------------------- */ -IpcSemaphoreId -IpcSemaphoreCreate(IpcSemaphoreKey semKey, - int semNum, - int permission, - int semStartValue, - int removeOnExit) +/* ---------------------------------------------------------------- + * InternalIpcSemaphoreCreate(semKey, numSems, permission, + * semStartValue, removeOnExit) + * + * Attempt to create a new semaphore set with the specified key. + * Will fail (return -1) if such a set already exists. + * On success, a callback is optionally registered with on_shmem_exit + * to delete the semaphore set when on_shmem_exit is called. + * + * If we fail with a failure code other than collision-with-existing-set, + * print out an error and abort. Other types of errors are not recoverable. 
+ * ---------------------------------------------------------------- + */ +static IpcSemaphoreId +InternalIpcSemaphoreCreate(IpcSemaphoreKey semKey, + int numSems, int permission, + int semStartValue, bool removeOnExit) { int semId; int i; - int errStatus; u_short array[IPC_NMAXSEM]; union semun semun; - /* check arguments */ - if (semNum > IPC_NMAXSEM || semNum <= 0) - return (-1); + Assert(numSems > 0 && numSems <= IPC_NMAXSEM); - semId = semget(semKey, 0, 0); + semId = semget(semKey, numSems, IPC_CREAT | IPC_EXCL | permission); - if (semId == -1) + if (semId < 0) { -#ifdef DEBUG_IPC - fprintf(stderr, "calling semget(%d, %d, 0%o)\n", - semKey, semNum, (unsigned)(IPC_CREAT|permission)); -#endif + /* + * Fail quietly if error indicates a collision with existing set. + * One would expect EEXIST, given that we said IPC_EXCL, but perhaps + * we could get a permission violation instead? + */ + if (errno == EEXIST || errno == EACCES) + return -1; + /* + * Else complain and abort + */ + fprintf(stderr, "IpcSemaphoreCreate: semget(key=%d, num=%d, 0%o) failed: %s\n", + (int) semKey, numSems, (IPC_CREAT|IPC_EXCL|permission), + strerror(errno)); - semId = semget(semKey, semNum, IPC_CREAT | permission); + if (errno == ENOSPC) + fprintf(stderr, + "\nThis error does *not* mean that you have run out of disk space.\n\n" + "It occurs either because system limit for the maximum number of\n" + "semaphore sets (SEMMNI), or the system wide maximum number of\n" + "semaphores (SEMMNS), would be exceeded. You need to raise the\n" + "respective kernel parameter. 
Look into the PostgreSQL documentation\n" + "for details.\n\n"); - if (semId < 0) - { - fprintf(stderr, "IpcSemaphoreCreate: semget(key=%d, num=%d, 0%o) failed: %s\n", - semKey, semNum, (unsigned)(permission|IPC_CREAT), - strerror(errno)); - - if (errno == ENOSPC) - fprintf(stderr, - "\nThis error does *not* mean that you have run out of disk space.\n\n" - "It occurs either because system limit for the maximum number of\n" - "semaphore sets (SEMMNI), or the system wide maximum number of\n" - "semaphores (SEMMNS), would be exceeded. You need to raise the\n" - "respective kernel parameter. Look into the PostgreSQL documentation\n" - "for details.\n\n"); - - return (-1); - } - for (i = 0; i < semNum; i++) - array[i] = semStartValue; - semun.array = array; - errStatus = semctl(semId, 0, SETALL, semun); - if (errStatus == -1) - { - fprintf(stderr, "IpcSemaphoreCreate: semctl(id=%d, 0, SETALL, ...) failed: %s\n", - semId, strerror(errno)); + proc_exit(1); + } - if (errno == ERANGE) - fprintf(stderr, - "You possibly need to raise your kernel's SEMVMX value to be at least\n" - "%d. Look into the PostgreSQL documentation for details.\n", - semStartValue); + /* Initialize new semas to specified start value */ + for (i = 0; i < numSems; i++) + array[i] = semStartValue; + semun.array = array; + if (semctl(semId, 0, SETALL, semun) < 0) + { + fprintf(stderr, "IpcSemaphoreCreate: semctl(id=%d, 0, SETALL, ...) failed: %s\n", + semId, strerror(errno)); - semctl(semId, 0, IPC_RMID, semun); - return (-1); - } + if (errno == ERANGE) + fprintf(stderr, + "You possibly need to raise your kernel's SEMVMX value to be at least\n" + "%d. 
Look into the PostgreSQL documentation for details.\n", + semStartValue); - if (removeOnExit) - on_shmem_exit(IPCPrivateSemaphoreKill, (Datum) semId); + IpcSemaphoreKill(semId); + proc_exit(1); } - -#ifdef DEBUG_IPC - fprintf(stderr, "IpcSemaphoreCreate returns %d\n", semId); - fflush(stdout); - fflush(stderr); -#endif + /* Register on-exit routine to delete the new set */ + if (removeOnExit) + on_shmem_exit(CallbackSemaphoreKill, Int32GetDatum(semId)); return semId; } - /****************************************************************************/ -/* IpcSemaphoreSet() - sets the initial value of the semaphore */ +/* IpcSemaphoreKill(semId) - removes a semaphore set */ /* */ -/* note: the xxx_return variables are only used for debugging. */ /****************************************************************************/ -#ifdef NOT_USED -static int IpcSemaphoreSet_return; - void -IpcSemaphoreSet(int semId, int semno, int value) +IpcSemaphoreKill(IpcSemaphoreId semId) { - int errStatus; union semun semun; - semun.val = value; - errStatus = semctl(semId, semno, SETVAL, semun); - IpcSemaphoreSet_return = errStatus; + semun.val = 0; /* unused, but keep compiler quiet */ - if (errStatus == -1) - fprintf(stderr, "IpcSemaphoreSet: semctl(id=%d) failed: %s\n", + if (semctl(semId, 0, IPC_RMID, semun) < 0) + fprintf(stderr, "IpcSemaphoreKill: semctl(%d, 0, IPC_RMID, ...) failed: %s\n", semId, strerror(errno)); + /* We used to report a failure via elog(NOTICE), but that's pretty + * pointless considering any client has long since disconnected ... 
+ */ } -#endif /* NOT_USED */ - /****************************************************************************/ -/* IpcSemaphoreKill(key) - removes a semaphore */ -/* */ +/* CallbackSemaphoreKill(status, semId) */ +/* (called as an on_shmem_exit callback, hence funny argument list) */ /****************************************************************************/ -void -IpcSemaphoreKill(IpcSemaphoreKey key) +static void +CallbackSemaphoreKill(int status, Datum semId) { - int semId; - union semun semun; - semun.val = 0; /* unused */ - - /* kill semaphore if existent */ - - semId = semget(key, 0, 0); - if (semId != -1) - semctl(semId, 0, IPC_RMID, semun); + IpcSemaphoreKill(DatumGetInt32(semId)); } /****************************************************************************/ -/* IpcSemaphoreLock(semId, sem, lock) - locks a semaphore */ -/* */ -/* note: the xxx_return variables are only used for debugging. */ +/* IpcSemaphoreLock(semId, sem) - locks a semaphore */ /****************************************************************************/ -static int IpcSemaphoreLock_return; - void -IpcSemaphoreLock(IpcSemaphoreId semId, int sem, int lock) +IpcSemaphoreLock(IpcSemaphoreId semId, int sem) { int errStatus; struct sembuf sops; - sops.sem_op = lock; + sops.sem_op = -1; /* decrement */ sops.sem_flg = 0; sops.sem_num = sem; @@ -427,11 +361,6 @@ IpcSemaphoreLock(IpcSemaphoreId semId, int sem, int lock) * Note: if errStatus is -1 and errno == EINTR then it means we * returned from the operation prematurely because we were * sent a signal. So we try and lock the semaphore again. - * I am not certain this is correct, but the semantics aren't - * clear it fixes problems with parallel abort synchronization, - * namely that after processing an abort signal, the semaphore - * call returns with -1 (and errno == EINTR) before it should. 
- * -cim 3/28/90 * ---------------- */ do @@ -439,8 +368,6 @@ IpcSemaphoreLock(IpcSemaphoreId semId, int sem, int lock) errStatus = semop(semId, &sops, 1); } while (errStatus == -1 && errno == EINTR); - IpcSemaphoreLock_return = errStatus; - if (errStatus == -1) { fprintf(stderr, "IpcSemaphoreLock: semop(id=%d) failed: %s\n", @@ -450,19 +377,15 @@ IpcSemaphoreLock(IpcSemaphoreId semId, int sem, int lock) } /****************************************************************************/ -/* IpcSemaphoreUnlock(semId, sem, lock) - unlocks a semaphore */ -/* */ -/* note: the xxx_return variables are only used for debugging. */ +/* IpcSemaphoreUnlock(semId, sem) - unlocks a semaphore */ /****************************************************************************/ -static int IpcSemaphoreUnlock_return; - void -IpcSemaphoreUnlock(IpcSemaphoreId semId, int sem, int lock) +IpcSemaphoreUnlock(IpcSemaphoreId semId, int sem) { int errStatus; struct sembuf sops; - sops.sem_op = -lock; + sops.sem_op = 1; /* increment */ sops.sem_flg = 0; sops.sem_num = sem; @@ -470,12 +393,8 @@ IpcSemaphoreUnlock(IpcSemaphoreId semId, int sem, int lock) /* ---------------- * Note: if errStatus is -1 and errno == EINTR then it means we * returned from the operation prematurely because we were - * sent a signal. So we try and lock the semaphore again. - * I am not certain this is correct, but the semantics aren't - * clear it fixes problems with parallel abort synchronization, - * namely that after processing an abort signal, the semaphore - * call returns with -1 (and errno == EINTR) before it should. - * -cim 3/28/90 + * sent a signal. So we try and unlock the semaphore again. + * Not clear this can really happen, but might as well cope. 
* ---------------- */ do @@ -483,8 +402,6 @@ IpcSemaphoreUnlock(IpcSemaphoreId semId, int sem, int lock) errStatus = semop(semId, &sops, 1); } while (errStatus == -1 && errno == EINTR); - IpcSemaphoreUnlock_return = errStatus; - if (errStatus == -1) { fprintf(stderr, "IpcSemaphoreUnlock: semop(id=%d) failed: %s\n", @@ -493,53 +410,115 @@ IpcSemaphoreUnlock(IpcSemaphoreId semId, int sem, int lock) } } +/****************************************************************************/ +/* IpcSemaphoreTryLock(semId, sem) - conditionally locks a semaphore */ +/* Lock the semaphore if it's free, but don't block. */ +/****************************************************************************/ +bool +IpcSemaphoreTryLock(IpcSemaphoreId semId, int sem) +{ + int errStatus; + struct sembuf sops; + + sops.sem_op = -1; /* decrement */ + sops.sem_flg = IPC_NOWAIT; /* but don't block */ + sops.sem_num = sem; + + /* ---------------- + * Note: if errStatus is -1 and errno == EINTR then it means we + * returned from the operation prematurely because we were + * sent a signal. So we try and lock the semaphore again. 
+ * ---------------- + */ + do + { + errStatus = semop(semId, &sops, 1); + } while (errStatus == -1 && errno == EINTR); + + if (errStatus == -1) + { + /* Expect EAGAIN or EWOULDBLOCK (platform-dependent) */ +#ifdef EAGAIN + if (errno == EAGAIN) + return false; /* failed to lock it */ +#endif +#if defined(EWOULDBLOCK) && (!defined(EAGAIN) || (EWOULDBLOCK != EAGAIN)) + if (errno == EWOULDBLOCK) + return false; /* failed to lock it */ +#endif + /* Otherwise we got trouble */ + fprintf(stderr, "IpcSemaphoreTryLock: semop(id=%d) failed: %s\n", + semId, strerror(errno)); + proc_exit(255); + } + + return true; +} + +/* Get the current value (semval) of the semaphore */ int -IpcSemaphoreGetCount(IpcSemaphoreId semId, int sem) +IpcSemaphoreGetValue(IpcSemaphoreId semId, int sem) { - int semncnt; union semun dummy; /* for Solaris */ dummy.val = 0; /* unused */ - semncnt = semctl(semId, sem, GETNCNT, dummy); - return semncnt; + return semctl(semId, sem, GETVAL, dummy); } -int -IpcSemaphoreGetValue(IpcSemaphoreId semId, int sem) +/* Get the PID of the last process to do semop() on the semaphore */ +static pid_t +IpcSemaphoreGetLastPID(IpcSemaphoreId semId, int sem) { - int semval; union semun dummy; /* for Solaris */ dummy.val = 0; /* unused */ - semval = semctl(semId, sem, GETVAL, dummy); - return semval; + return semctl(semId, sem, GETPID, dummy); } -/****************************************************************************/ -/* IpcMemoryCreate(memKey) */ -/* */ -/* - returns the memory identifier, if creation succeeds */ -/* returns IpcMemCreationFailed, if failure */ -/****************************************************************************/ -IpcMemoryId -IpcMemoryCreate(IpcMemoryKey memKey, uint32 size, int permission) +/* ---------------------------------------------------------------- + * Shared memory support + * + * These routines represent a fairly thin layer on top of SysV shared + * memory functionality. 
+ * ---------------------------------------------------------------- + */ + +/* ---------------------------------------------------------------- + * InternalIpcMemoryCreate(memKey, size, permission) + * + * Attempt to create a new shared memory segment with the specified key. + * Will fail (return NULL) if such a segment already exists. If successful, + * attach the segment to the current process and return its attached address. + * On success, callbacks are registered with on_shmem_exit to detach and + * delete the segment when on_shmem_exit is called. + * + * If we fail with a failure code other than collision-with-existing-segment, + * print out an error and abort. Other types of errors are not recoverable. + * ---------------------------------------------------------------- + */ +static void * +InternalIpcMemoryCreate(IpcMemoryKey memKey, uint32 size, int permission) { IpcMemoryId shmid; + void *memAddress; - if (memKey == PrivateIPCKey) - { - /* private */ - shmid = PrivateMemoryCreate(memKey, size); - } - else - - shmid = shmget(memKey, size, IPC_CREAT | permission); + shmid = shmget(memKey, size, IPC_CREAT | IPC_EXCL | permission); if (shmid < 0) { - fprintf(stderr, "IpcMemoryCreate: shmget(key=%d, size=%d, 0%o) failed: %s\n", - (int)memKey, size, (unsigned)(IPC_CREAT|permission), + /* + * Fail quietly if error indicates a collision with existing segment. + * One would expect EEXIST, given that we said IPC_EXCL, but perhaps + * we could get a permission violation instead? + */ + if (errno == EEXIST || errno == EACCES) + return NULL; + /* + * Else complain and abort + */ + fprintf(stderr, "IpcMemoryCreate: shmget(key=%d, size=%u, 0%o) failed: %s\n", + (int) memKey, size, (IPC_CREAT | IPC_EXCL | permission), strerror(errno)); if (errno == EINVAL) @@ -547,7 +526,7 @@ IpcMemoryCreate(IpcMemoryKey memKey, uint32 size, int permission) "\nThis error can be caused by one of three things:\n\n" "1. 
The maximum size for shared memory segments on your system was\n" " exceeded. You need to raise the SHMMAX parameter in your kernel\n" - " to be at least %d bytes.\n\n" + " to be at least %u bytes.\n\n" "2. The requested shared memory segment was too small for your system.\n" " You need to lower the SHMMIN parameter in your kernel.\n\n" "3. The requested shared memory segment already exists but is of the\n" @@ -567,179 +546,302 @@ IpcMemoryCreate(IpcMemoryKey memKey, uint32 size, int permission) "reached. The PostgreSQL Administrator's Guide contains more\n" "information about shared memory configuration.\n\n"); - return IpcMemCreationFailed; + proc_exit(1); } + /* Register on-exit routine to delete the new segment */ + on_shmem_exit(IpcMemoryDelete, Int32GetDatum(shmid)); - /* if (memKey == PrivateIPCKey) */ - on_shmem_exit(IPCPrivateMemoryKill, (Datum) shmid); + /* OK, should be able to attach to the segment */ + memAddress = shmat(shmid, 0, 0); - return shmid; -} - -/****************************************************************************/ -/* IpcMemoryIdGet(memKey, size) returns the shared memory Id */ -/* or IpcMemIdGetFailed */ -/****************************************************************************/ -IpcMemoryId -IpcMemoryIdGet(IpcMemoryKey memKey, uint32 size) -{ - IpcMemoryId shmid; - - shmid = shmget(memKey, size, 0); - - if (shmid < 0) + if (memAddress == (void *) -1) { - fprintf(stderr, "IpcMemoryIdGet: shmget(key=%d, size=%d, 0) failed: %s\n", - memKey, size, strerror(errno)); - return IpcMemIdGetFailed; + fprintf(stderr, "IpcMemoryCreate: shmat(id=%d) failed: %s\n", + shmid, strerror(errno)); + proc_exit(1); } - return shmid; + /* Register on-exit routine to detach new segment before deleting */ + on_shmem_exit(IpcMemoryDetach, PointerGetDatum(memAddress)); + + return memAddress; } /****************************************************************************/ /* IpcMemoryDetach(status, shmaddr) removes a shared memory segment */ -/* from a 
backend address space */ -/* (only called by backends running under the postmaster) */ +/* from process' address spaceq */ +/* (called as an on_shmem_exit callback, hence funny argument list) */ /****************************************************************************/ static void -IpcMemoryDetach(int status, char *shmaddr) +IpcMemoryDetach(int status, Datum shmaddr) { - if (shmdt(shmaddr) < 0) - elog(NOTICE, "IpcMemoryDetach: shmdt(0x%p) failed: %m", shmaddr); + if (shmdt(DatumGetPointer(shmaddr)) < 0) + fprintf(stderr, "IpcMemoryDetach: shmdt(%p) failed: %s\n", + DatumGetPointer(shmaddr), strerror(errno)); + /* We used to report a failure via elog(NOTICE), but that's pretty + * pointless considering any client has long since disconnected ... + */ } /****************************************************************************/ -/* IpcMemoryAttach(memId) returns the adress of shared memory */ -/* or IpcMemAttachFailed */ -/* */ -/* CALL IT: addr = (struct <MemoryStructure> *) IpcMemoryAttach(memId); */ -/* */ +/* IpcMemoryDelete(status, shmId) deletes a shared memory segment */ +/* (called as an on_shmem_exit callback, hence funny argument list) */ /****************************************************************************/ -char * -IpcMemoryAttach(IpcMemoryId memId) +static void +IpcMemoryDelete(int status, Datum shmId) { - char *memAddress; + if (shmctl(DatumGetInt32(shmId), IPC_RMID, (struct shmid_ds *) NULL) < 0) + fprintf(stderr, "IpcMemoryDelete: shmctl(%d, %d, 0) failed: %s\n", + DatumGetInt32(shmId), IPC_RMID, strerror(errno)); + /* We used to report a failure via elog(NOTICE), but that's pretty + * pointless considering any client has long since disconnected ... 
+ */ +} - if (UsePrivateMemory) - memAddress = (char *) PrivateMemoryAttach(memId); - else - memAddress = (char *) shmat(memId, 0, 0); +/* ---------------------------------------------------------------- + * private memory support + * + * Rather than allocating shmem segments with IPC_PRIVATE key, we + * just malloc() the requested amount of space. This code emulates + * the needed shmem functions. + * ---------------------------------------------------------------- + */ - /* if ( *memAddress == -1) { XXX ??? */ - if (memAddress == (char *) -1) +static void * +PrivateMemoryCreate(uint32 size) +{ + void *memAddress; + + memAddress = malloc(size); + if (!memAddress) { - fprintf(stderr, "IpcMemoryAttach: shmat(id=%d) failed: %s\n", - memId, strerror(errno)); - return IpcMemAttachFailed; + fprintf(stderr, "PrivateMemoryCreate: malloc(%u) failed\n", size); + proc_exit(1); } + MemSet(memAddress, 0, size); /* keep Purify quiet */ - if (!UsePrivateMemory) - on_shmem_exit(IpcMemoryDetach, PointerGetDatum(memAddress)); + /* Register on-exit routine to release storage */ + on_shmem_exit(PrivateMemoryDelete, PointerGetDatum(memAddress)); - return (char *) memAddress; + return memAddress; } - -/****************************************************************************/ -/* IpcMemoryKill(memKey) removes a shared memory segment */ -/* (only called by the postmaster and standalone backends) */ -/****************************************************************************/ -void -IpcMemoryKill(IpcMemoryKey memKey) +static void +PrivateMemoryDelete(int status, Datum memaddr) { - IpcMemoryId shmid; - - if (!UsePrivateMemory && (shmid = shmget(memKey, 0, 0)) >= 0) - { - if (shmctl(shmid, IPC_RMID, (struct shmid_ds *) NULL) < 0) - { - elog(NOTICE, "IpcMemoryKill: shmctl(%d, %d, 0) failed: %m", - shmid, IPC_RMID); - } - } + free(DatumGetPointer(memaddr)); } -#ifdef HAS_TEST_AND_SET + /* ------------------ - * use hardware locks to replace semaphores for sequent machines - * to avoid 
costs of swapping processes and to provide unlimited - * supply of locks. + * Routines to assign keys for new IPC objects + * + * The idea here is to detect and re-use keys that may have been assigned + * by a crashed postmaster or backend. * ------------------ */ -/* used in spin.c */ -SLock *SLockArray = NULL; +static IpcMemoryKey NextShmemSegID = 0; +static IpcSemaphoreKey NextSemaID = 0; -static SLock **FreeSLockPP; -static int *UnusedSLockIP; -static slock_t *SLockMemoryLock; -static IpcMemoryId SLockMemoryId = -1; +/* + * (Re) initialize key assignment at startup of postmaster or standalone + * backend, also at postmaster reset. + */ +void +IpcInitKeyAssignment(int port) +{ + NextShmemSegID = port * 1000; + NextSemaID = port * 1000; +} -struct ipcdummy -{ /* to get alignment/size right */ - SLock *free; - int unused; - slock_t memlock; - SLock slocks[MAX_SPINS + 1]; -}; +/* + * Create a shared memory segment of the given size and initialize its + * standard header. Dead Postgres segments are recycled if found, + * but we do not fail upon collision with non-Postgres shmem segments. + */ +PGShmemHeader * +IpcMemoryCreate(uint32 size, bool private, int permission) +{ + void *memAddress; + PGShmemHeader *hdr; -#define SLOCKMEMORYSIZE sizeof(struct ipcdummy) + /* Room for a header? 
*/ + Assert(size > MAXALIGN(sizeof(PGShmemHeader))); -void -CreateAndInitSLockMemory(IPCKey key) -{ - int id; - SLock *slckP; - - SLockMemoryId = IpcMemoryCreate(key, - SLOCKMEMORYSIZE, - 0700); - AttachSLockMemory(key); - *FreeSLockPP = NULL; - *UnusedSLockIP = (int) FIRSTFREELOCKID; - for (id = 0; id < (int) FIRSTFREELOCKID; id++) + /* Loop till we find a free IPC key */ + for (NextShmemSegID++ ; ; NextShmemSegID++) { - slckP = &(SLockArray[id]); - S_INIT_LOCK(&(slckP->locklock)); - slckP->flag = NOLOCK; - slckP->nshlocks = 0; - S_INIT_LOCK(&(slckP->shlock)); - S_INIT_LOCK(&(slckP->exlock)); - S_INIT_LOCK(&(slckP->comlock)); - slckP->next = NULL; + IpcMemoryId shmid; + + /* Special case if creating a private segment --- just malloc() it */ + if (private) + { + memAddress = PrivateMemoryCreate(size); + break; + } + + /* Try to create new segment */ + memAddress = InternalIpcMemoryCreate(NextShmemSegID, size, permission); + if (memAddress) + break; /* successful create and attach */ + + /* See if it looks to be leftover from a dead Postgres process */ + shmid = shmget(NextShmemSegID, sizeof(PGShmemHeader), 0); + if (shmid < 0) + continue; /* failed: must be some other app's */ + memAddress = shmat(shmid, 0, 0); + if (memAddress == (void *) -1) + continue; /* failed: must be some other app's */ + hdr = (PGShmemHeader *) memAddress; + if (hdr->magic != PGShmemMagic) + { + shmdt(memAddress); + continue; /* segment belongs to a non-Postgres app */ + } + /* + * If the creator PID is my own PID or does not belong to any + * extant process, it's safe to zap it. + */ + if (hdr->creatorPID != getpid()) + { + if (kill(hdr->creatorPID, 0) == 0 || + errno != ESRCH) + { + shmdt(memAddress); + continue; /* segment belongs to a live process */ + } + } + /* + * The segment appears to be from a dead Postgres process, or + * from a previous cycle of life in this same process. Zap it, + * if possible. 
This probably shouldn't fail, but if it does, + * assume the segment belongs to someone else after all, + * and continue quietly. + */ + shmdt(memAddress); + if (shmctl(shmid, IPC_RMID, (struct shmid_ds *) NULL) < 0) + continue; + /* + * Now try again to create the segment. + */ + memAddress = InternalIpcMemoryCreate(NextShmemSegID, size, permission); + if (memAddress) + break; /* successful create and attach */ + /* + * Can only get here if some other process managed to create the + * same shmem key before we did. Let him have that one, + * loop around to try next key. + */ } - return; -} + /* + * OK, we created a new segment. Mark it as created by this process. + * The order of assignments here is critical so that another Postgres + * process can't see the header as valid but belonging to an invalid + * PID! + */ + hdr = (PGShmemHeader *) memAddress; + hdr->creatorPID = getpid(); + hdr->magic = PGShmemMagic; + /* + * Initialize space allocation status for segment. + */ + hdr->totalsize = size; + hdr->freeoffset = MAXALIGN(sizeof(PGShmemHeader)); -void -AttachSLockMemory(IPCKey key) -{ - struct ipcdummy *slockM; - - if (SLockMemoryId == -1) - SLockMemoryId = IpcMemoryIdGet(key, SLOCKMEMORYSIZE); - if (SLockMemoryId == -1) - elog(FATAL, "SLockMemory not in shared memory"); - slockM = (struct ipcdummy *) IpcMemoryAttach(SLockMemoryId); - if (slockM == IpcMemAttachFailed) - elog(FATAL, "AttachSLockMemory: could not attach segment"); - FreeSLockPP = (SLock **) &(slockM->free); - UnusedSLockIP = (int *) &(slockM->unused); - SLockMemoryLock = (slock_t *) &(slockM->memlock); - S_INIT_LOCK(SLockMemoryLock); - SLockArray = (SLock *) &(slockM->slocks[0]); - return; + return hdr; } -#ifdef NOT_USED -bool -LockIsFree(int lockid) +/* + * Create a semaphore set with the given number of useful semaphores + * (an additional sema is actually allocated to serve as identifier). 
+ * Dead Postgres sema sets are recycled if found, but we do not fail + * upon collision with non-Postgres sema sets. + */ +IpcSemaphoreId +IpcSemaphoreCreate(int numSems, int permission, + int semStartValue, bool removeOnExit) { - return SLockArray[lockid].flag == NOLOCK; -} + IpcSemaphoreId semId; + union semun semun; -#endif + /* Loop till we find a free IPC key */ + for (NextSemaID++ ; ; NextSemaID++) + { + pid_t creatorPID; + + /* Try to create new semaphore set */ + semId = InternalIpcSemaphoreCreate(NextSemaID, numSems+1, + permission, semStartValue, + removeOnExit); + if (semId >= 0) + break; /* successful create */ -#endif /* HAS_TEST_AND_SET */ + /* See if it looks to be leftover from a dead Postgres process */ + semId = semget(NextSemaID, numSems+1, 0); + if (semId < 0) + continue; /* failed: must be some other app's */ + if (IpcSemaphoreGetValue(semId, numSems) != PGSemaMagic) + continue; /* sema belongs to a non-Postgres app */ + /* + * If the creator PID is my own PID or does not belong to any + * extant process, it's safe to zap it. + */ + creatorPID = IpcSemaphoreGetLastPID(semId, numSems); + if (creatorPID <= 0) + continue; /* oops, GETPID failed */ + if (creatorPID != getpid()) + { + if (kill(creatorPID, 0) == 0 || + errno != ESRCH) + continue; /* sema belongs to a live process */ + } + /* + * The sema set appears to be from a dead Postgres process, or + * from a previous cycle of life in this same process. Zap it, + * if possible. This probably shouldn't fail, but if it does, + * assume the sema set belongs to someone else after all, + * and continue quietly. + */ + semun.val = 0; /* unused, but keep compiler quiet */ + if (semctl(semId, 0, IPC_RMID, semun) < 0) + continue; + /* + * Now try again to create the sema set. 
+ */ + semId = InternalIpcSemaphoreCreate(NextSemaID, numSems+1, + permission, semStartValue, + removeOnExit); + if (semId >= 0) + break; /* successful create */ + /* + * Can only get here if some other process managed to create the + * same sema key before we did. Let him have that one, + * loop around to try next key. + */ + } + /* + * OK, we created a new sema set. Mark it as created by this process. + * We do this by setting the spare semaphore to PGSemaMagic-1 and then + * incrementing it with semop(). That leaves it with value PGSemaMagic + * and sempid referencing this process. + */ + semun.val = PGSemaMagic-1; + if (semctl(semId, numSems, SETVAL, semun) < 0) + { + fprintf(stderr, "IpcSemaphoreCreate: semctl(id=%d, %d, SETVAL, %d) failed: %s\n", + semId, numSems, PGSemaMagic-1, strerror(errno)); + + if (errno == ERANGE) + fprintf(stderr, + "You possibly need to raise your kernel's SEMVMX value to be at least\n" + "%d. Look into the PostgreSQL documentation for details.\n", + PGSemaMagic); + + proc_exit(1); + } + IpcSemaphoreUnlock(semId, numSems); + + return semId; +} diff --git a/src/backend/storage/ipc/ipci.c b/src/backend/storage/ipc/ipci.c index 5c7e88af73e..7a5813df57d 100644 --- a/src/backend/storage/ipc/ipci.c +++ b/src/backend/storage/ipc/ipci.c @@ -8,148 +8,91 @@ * * * IDENTIFICATION - * $Header: /cvsroot/pgsql/src/backend/storage/ipc/ipci.c,v 1.34 2000/11/21 21:16:01 petere Exp $ + * $Header: /cvsroot/pgsql/src/backend/storage/ipc/ipci.c,v 1.35 2000/11/28 23:27:56 tgl Exp $ * *------------------------------------------------------------------------- */ -#include <sys/types.h> - #include "postgres.h" +#include <sys/types.h> + #include "miscadmin.h" #include "access/xlog.h" #include "storage/bufmgr.h" +#include "storage/proc.h" #include "storage/sinval.h" +#include "storage/spin.h" -/* - * SystemPortAddressCreateMemoryKey - * Returns a memory key given a port address. 
- */ -IPCKey -SystemPortAddressCreateIPCKey(SystemPortAddress address) -{ - Assert(address < 32768); /* XXX */ - - return SystemPortAddressGetIPCKey(address); -} /* * CreateSharedMemoryAndSemaphores * Creates and initializes shared memory and semaphores. + * + * This is called by the postmaster or by a standalone backend. + * It is NEVER called by a backend forked from the postmaster; + * for such a backend, the shared memory is already ready-to-go. + * + * If "private" is true then we only need private memory, not shared + * memory. This is true for a standalone backend, false for a postmaster. */ -/************************************************** - - CreateSharedMemoryAndSemaphores - is called exactly *ONCE* by the postmaster. - It is *NEVER* called by the postgres backend, - except in the case of a standalone backend. - - 0) destroy any existing semaphores for both buffer - and lock managers. - 1) create the appropriate *SHARED* memory segments - for the two resource managers. - 2) create shared semaphores as needed. - - **************************************************/ - void -CreateSharedMemoryAndSemaphores(IPCKey key, int maxBackends) +CreateSharedMemoryAndSemaphores(bool private, int maxBackends) { int size; - -#ifdef HAS_TEST_AND_SET - - /* - * Create shared memory for slocks - */ - CreateAndInitSLockMemory(IPCKeyGetSLockSharedMemoryKey(key)); -#endif - - /* - * Kill and create the buffer manager buffer pool (and semaphore) - */ - CreateSpinlocks(IPCKeyGetSpinLockSemaphoreKey(key)); + PGShmemHeader *seghdr; /* - * Size of the primary shared-memory block is estimated via + * Size of the Postgres shared-memory block is estimated via * moderately-accurate estimates for the big hogs, plus 100K for the * stuff that's too small to bother with estimating. 
*/ - size = BufferShmemSize() + LockShmemSize(maxBackends) + XLOGShmemSize(); + size = BufferShmemSize() + LockShmemSize(maxBackends) + + XLOGShmemSize() + SLockShmemSize() + SInvalShmemSize(maxBackends); #ifdef STABLE_MEMORY_STORAGE size += MMShmemSize(); #endif size += 100000; - /* might as well round it off to a multiple of a K or so... */ - size += 1024 - (size % 1024); + /* might as well round it off to a multiple of a typical page size */ + size += 8192 - (size % 8192); if (DebugLvl > 1) - { - fprintf(stderr, "binding ShmemCreate(key=%x, size=%d)\n", - IPCKeyGetBufferMemoryKey(key), size); - } - ShmemCreate(IPCKeyGetBufferMemoryKey(key), size); - ShmemIndexReset(); - InitShmem(key, size); - XLOGShmemInit(); - InitBufferPool(key); + fprintf(stderr, "invoking IpcMemoryCreate(size=%d)\n", size); - /* ---------------- - * do the lock table stuff - * ---------------- + /* + * Create the shmem segment */ - InitLocks(); - if (InitLockTable() == INVALID_TABLEID) - elog(FATAL, "Couldn't create the lock table"); + seghdr = IpcMemoryCreate(size, private, IPCProtection); - /* ---------------- - * do process table stuff - * ---------------- + /* + * First initialize spinlocks --- needed by InitShmemAllocation() */ - InitProcGlobal(key, maxBackends); - - CreateSharedInvalidationState(key, maxBackends); -} - + CreateSpinlocks(seghdr); -/* - * AttachSharedMemoryAndSemaphores - * Attachs existant shared memory and semaphores. 
- */ -void -AttachSharedMemoryAndSemaphores(IPCKey key) -{ - /* ---------------- - * create rather than attach if using private key - * ---------------- + /* + * Set up shmem.c hashtable */ - if (key == PrivateIPCKey) - { - CreateSharedMemoryAndSemaphores(key, 16); - return; - } + InitShmemAllocation(seghdr); -#ifdef HAS_TEST_AND_SET - /* ---------------- - * attach the slock shared memory - * ---------------- - */ - AttachSLockMemory(IPCKeyGetSLockSharedMemoryKey(key)); -#endif - /* ---------------- - * attach the buffer manager buffer pool (and semaphore) - * ---------------- + /* + * Set up xlog and buffers */ - InitShmem(key, 0); - InitBufferPool(key); + XLOGShmemInit(); + InitBufferPool(); - /* ---------------- - * initialize lock table stuff - * ---------------- + /* + * Set up lock manager */ InitLocks(); if (InitLockTable() == INVALID_TABLEID) - elog(FATAL, "Couldn't attach to the lock table"); + elog(FATAL, "Couldn't create the lock table"); + + /* + * Set up process table + */ + InitProcGlobal(maxBackends); - AttachSharedInvalidationState(key); + /* + * Set up shared-inval messaging + */ + CreateSharedInvalidationState(maxBackends); } diff --git a/src/backend/storage/ipc/shmem.c b/src/backend/storage/ipc/shmem.c index c5048a389b1..15922947087 100644 --- a/src/backend/storage/ipc/shmem.c +++ b/src/backend/storage/ipc/shmem.c @@ -8,14 +8,14 @@ * * * IDENTIFICATION - * $Header: /cvsroot/pgsql/src/backend/storage/ipc/shmem.c,v 1.54 2000/11/21 21:16:01 petere Exp $ + * $Header: /cvsroot/pgsql/src/backend/storage/ipc/shmem.c,v 1.55 2000/11/28 23:27:56 tgl Exp $ * *------------------------------------------------------------------------- */ /* * POSTGRES processes share one or more regions of shared memory. * The shared memory is created by a postmaster and is inherited - * by each backends via fork(). The routines in this file are used for + * by each backend via fork(). 
The routines in this file are used for * allocating and binding to shared memory data structures. * * NOTES: @@ -56,153 +56,57 @@ * * See InitSem() in sem.c for an example of how to use the * shmem index. - * */ #include "postgres.h" + #include "access/transam.h" #include "utils/tqual.h" /* shared memory global variables */ -unsigned long ShmemBase = 0; /* start and end address of shared memory */ -static unsigned long ShmemEnd = 0; -static unsigned long ShmemSize = 0; /* current size (and default) */ +static PGShmemHeader *ShmemSegHdr; /* shared mem segment header */ + +SHMEM_OFFSET ShmemBase; /* start address of shared memory */ + +static SHMEM_OFFSET ShmemEnd; /* end+1 address of shared memory */ SPINLOCK ShmemLock; /* lock for shared memory allocation */ SPINLOCK ShmemIndexLock; /* lock for shmem index access */ -static unsigned long *ShmemFreeStart = NULL; /* pointer to the OFFSET - * of first free shared - * memory */ -static unsigned long *ShmemIndexOffset = NULL; /* start of the shmem - * index table (for - * bootstrap) */ -static int ShmemBootstrap = FALSE; /* flag becomes true when shared - * mem is created by POSTMASTER */ - -static HTAB *ShmemIndex = NULL; - -/* --------------------- - * ShmemIndexReset() - Resets the shmem index to NULL.... - * useful when the postmaster destroys existing shared memory - * and creates all new segments after a backend crash. - * ---------------------- - */ -void -ShmemIndexReset(void) -{ - ShmemIndex = (HTAB *) NULL; -} +static HTAB *ShmemIndex = NULL; /* primary index hashtable for shmem */ -/* - * CreateSharedRegion() - * - * This routine is called once by the postmaster to - * initialize the shared buffer pool. Assume there is - * only one postmaster so no synchronization is necessary - * until after this routine completes successfully. - * - * key is a unique identifier for the shmem region. - * size is the size of the region. 
- */ -static IpcMemoryId ShmemId; +static bool ShmemBootstrap = false; /* bootstrapping shmem index? */ -void -ShmemCreate(unsigned int key, unsigned int size) -{ - if (size) - ShmemSize = size; - /* create shared mem region */ - if ((ShmemId = IpcMemoryCreate(key, ShmemSize, IPCProtection)) - == IpcMemCreationFailed) - { - elog(FATAL, "ShmemCreate: cannot create region"); - exit(1); - } - - /* - * ShmemBootstrap is true if shared memory has been created, but not - * yet initialized. Only the postmaster/creator-of-all-things should - * have this flag set. - */ - ShmemBootstrap = TRUE; -} /* - * InitShmem() -- map region into process address space - * and initialize shared data structures. - * + * InitShmemAllocation() --- set up shared-memory allocation and index table. */ -int -InitShmem(unsigned int key, unsigned int size) +void +InitShmemAllocation(PGShmemHeader *seghdr) { - Pointer sharedRegion; - unsigned long currFreeSpace; - HASHCTL info; int hash_flags; ShmemIndexEnt *result, item; bool found; - IpcMemoryId shmid; - - /* if zero key, use default memory size */ - if (size) - ShmemSize = size; - - /* default key is 0 */ - - /* attach to shared memory region (SysV or BSD OS specific) */ - if (ShmemBootstrap && key == PrivateIPCKey) - /* if we are running backend alone */ - shmid = ShmemId; - else - shmid = IpcMemoryIdGet(IPCKeyGetBufferMemoryKey(key), ShmemSize); - sharedRegion = IpcMemoryAttach(shmid); - if (sharedRegion == NULL) - { - elog(FATAL, "AttachSharedRegion: couldn't attach to shmem\n"); - return FALSE; - } - - /* get pointers to the dimensions of shared memory */ - ShmemBase = (unsigned long) sharedRegion; - ShmemEnd = (unsigned long) sharedRegion + ShmemSize; - - /* First long in shared memory is the available-space pointer */ - ShmemFreeStart = (unsigned long *) ShmemBase; - /* next is a shmem pointer to the shmem index */ - ShmemIndexOffset = ShmemFreeStart + 1; - /* next is ShmemVariableCache */ - ShmemVariableCache = (VariableCache) 
(ShmemIndexOffset + 1); - - /* here is where to start dynamic allocation */ - currFreeSpace = MAXALIGN(sizeof(*ShmemFreeStart) + - sizeof(*ShmemIndexOffset) + - sizeof(*ShmemVariableCache)); - /* - * bootstrap initialize spin locks so we can start to use the - * allocator and shmem index. - */ - InitSpinLocks(); + /* Set up basic pointers to shared memory */ + ShmemSegHdr = seghdr; + ShmemBase = (SHMEM_OFFSET) seghdr; + ShmemEnd = ShmemBase + seghdr->totalsize; /* - * We have just allocated additional space for two spinlocks. Now - * setup the global free space count + * Since ShmemInitHash calls ShmemInitStruct, which expects the + * ShmemIndex hashtable to exist already, we have a bit of a circularity + * problem in initializing the ShmemIndex itself. We set ShmemBootstrap + * to tell ShmemInitStruct to fake it. */ - if (ShmemBootstrap) - { - *ShmemFreeStart = currFreeSpace; - memset(ShmemVariableCache, 0, sizeof(*ShmemVariableCache)); - } - - /* if ShmemFreeStart is NULL, then the allocator won't work */ - Assert(*ShmemFreeStart); + ShmemIndex = (HTAB *) NULL; + ShmemBootstrap = true; - /* create OR attach to the shared memory shmem index */ + /* create the shared memory shmem index */ info.keysize = SHMEM_INDEX_KEYSIZE; info.datasize = SHMEM_INDEX_DATASIZE; hash_flags = HASH_ELEM; @@ -211,60 +115,43 @@ InitShmem(unsigned int key, unsigned int size) ShmemIndex = ShmemInitHash("ShmemIndex", SHMEM_INDEX_SIZE, SHMEM_INDEX_SIZE, &info, hash_flags); - if (!ShmemIndex) - { - elog(FATAL, "InitShmem: couldn't initialize Shmem Index"); - return FALSE; - } + elog(FATAL, "InitShmemAllocation: couldn't initialize Shmem Index"); /* - * Now, check the shmem index for an entry to the shmem index. If - * there is an entry there, someone else created the table. Otherwise, - * we did and we have to initialize it. + * Now, create an entry in the hashtable for the index itself. 
*/ MemSet(item.key, 0, SHMEM_INDEX_KEYSIZE); strncpy(item.key, "ShmemIndex", SHMEM_INDEX_KEYSIZE); result = (ShmemIndexEnt *) hash_search(ShmemIndex, (char *) &item, HASH_ENTER, &found); - - if (!result) - { - elog(FATAL, "InitShmem: corrupted shmem index"); - return FALSE; - } - - if (!found) - { + elog(FATAL, "InitShmemAllocation: corrupted shmem index"); - /* - * bootstrapping shmem: we have to initialize the shmem index now. - */ + Assert(ShmemBootstrap && !found); - Assert(ShmemBootstrap); - result->location = MAKE_OFFSET(ShmemIndex->hctl); - *ShmemIndexOffset = result->location; - result->size = SHMEM_INDEX_SIZE; + result->location = MAKE_OFFSET(ShmemIndex->hctl); + result->size = SHMEM_INDEX_SIZE; - ShmemBootstrap = FALSE; + ShmemBootstrap = false; - } - else - Assert(!ShmemBootstrap); - /* now release the lock acquired in ShmemHashInit */ + /* now release the lock acquired in ShmemInitStruct */ SpinRelease(ShmemIndexLock); - Assert(result->location == MAKE_OFFSET(ShmemIndex->hctl)); - - return TRUE; + /* + * Initialize ShmemVariableCache for transaction manager. + */ + ShmemVariableCache = (VariableCache) + ShmemAlloc(sizeof(*ShmemVariableCache)); + memset(ShmemVariableCache, 0, sizeof(*ShmemVariableCache)); } /* - * ShmemAlloc -- allocate max-aligned byte string from shared memory + * ShmemAlloc -- allocate max-aligned chunk from shared memory + * + * Assumes ShmemLock and ShmemSegHdr are initialized. * - * Assumes ShmemLock and ShmemFreeStart are initialized. * Returns: real pointer to memory or NULL if we are out * of space. Has to return a real pointer in order * to be compatible with malloc(). 
@@ -272,7 +159,7 @@ InitShmem(unsigned int key, unsigned int size) void * ShmemAlloc(Size size) { - unsigned long tmpFree; + uint32 newFree; void *newSpace; /* @@ -280,15 +167,15 @@ ShmemAlloc(Size size) */ size = MAXALIGN(size); - Assert(*ShmemFreeStart); + Assert(ShmemSegHdr); SpinAcquire(ShmemLock); - tmpFree = *ShmemFreeStart + size; - if (tmpFree <= ShmemSize) + newFree = ShmemSegHdr->freeoffset + size; + if (newFree <= ShmemSegHdr->totalsize) { - newSpace = (void *) MAKE_PTR(*ShmemFreeStart); - *ShmemFreeStart += size; + newSpace = (void *) MAKE_PTR(ShmemSegHdr->freeoffset); + ShmemSegHdr->freeoffset = newFree; } else newSpace = NULL; @@ -306,7 +193,7 @@ ShmemAlloc(Size size) * * Returns TRUE if the pointer is valid. */ -int +bool ShmemIsValid(unsigned long addr) { return (addr < ShmemEnd) && (addr >= ShmemBase); @@ -394,16 +281,15 @@ ShmemPIDLookup(int pid, SHMEM_OFFSET *locationPtr) sprintf(item.key, "PID %d", pid); SpinAcquire(ShmemIndexLock); + result = (ShmemIndexEnt *) hash_search(ShmemIndex, (char *) &item, HASH_ENTER, &found); if (!result) { - SpinRelease(ShmemIndexLock); elog(ERROR, "ShmemInitPID: ShmemIndex corrupted"); return FALSE; - } if (found) @@ -438,19 +324,19 @@ ShmemPIDDestroy(int pid) sprintf(item.key, "PID %d", pid); SpinAcquire(ShmemIndexLock); + result = (ShmemIndexEnt *) hash_search(ShmemIndex, (char *) &item, HASH_REMOVE, &found); if (found) location = result->location; + SpinRelease(ShmemIndexLock); if (!result) { - elog(ERROR, "ShmemPIDDestroy: PID table corrupted"); return INVALID_OFFSET; - } if (found) @@ -487,53 +373,31 @@ ShmemInitStruct(char *name, Size size, bool *foundPtr) if (!ShmemIndex) { -#ifdef USE_ASSERT_CHECKING - char *strname = "ShmemIndex"; - -#endif - /* - * If the shmem index doesn't exist, we fake it. + * If the shmem index doesn't exist, we are bootstrapping: we must + * be trying to init the shmem index itself. 
* - * If we are creating the first shmem index, then let shmemalloc() - * allocate the space for a new HTAB. Otherwise, find the old one - * and return that. Notice that the ShmemIndexLock is held until - * the shmem index has been completely initialized. + * Notice that the ShmemIndexLock is held until the shmem index has + * been completely initialized. */ - Assert(strcmp(name, strname) == 0); - if (ShmemBootstrap) - { - /* in POSTMASTER/Single process */ - - *foundPtr = FALSE; - return ShmemAlloc(size); - } - else - { - Assert(*ShmemIndexOffset); - - *foundPtr = TRUE; - return (void *) MAKE_PTR(*ShmemIndexOffset); - } - - - } - else - { - /* look it up in the shmem index */ - result = (ShmemIndexEnt *) - hash_search(ShmemIndex, (char *) &item, HASH_ENTER, foundPtr); + Assert(strcmp(name, "ShmemIndex") == 0); + Assert(ShmemBootstrap); + *foundPtr = FALSE; + return ShmemAlloc(size); } + /* look it up in the shmem index */ + result = (ShmemIndexEnt *) + hash_search(ShmemIndex, (char *) &item, HASH_ENTER, foundPtr); + if (!result) { SpinRelease(ShmemIndexLock); - elog(ERROR, "ShmemInitStruct: Shmem Index corrupted"); return NULL; - } - else if (*foundPtr) + + if (*foundPtr) { /* diff --git a/src/backend/storage/ipc/sinval.c b/src/backend/storage/ipc/sinval.c index fb2e4804dd3..c87fcd36602 100644 --- a/src/backend/storage/ipc/sinval.c +++ b/src/backend/storage/ipc/sinval.c @@ -8,7 +8,7 @@ * * * IDENTIFICATION - * $Header: /cvsroot/pgsql/src/backend/storage/ipc/sinval.c,v 1.23 2000/11/12 20:51:51 tgl Exp $ + * $Header: /cvsroot/pgsql/src/backend/storage/ipc/sinval.c,v 1.24 2000/11/28 23:27:56 tgl Exp $ * *------------------------------------------------------------------------- */ @@ -27,52 +27,23 @@ SPINLOCK SInvalLock = (SPINLOCK) NULL; /****************************************************************************/ -/* CreateSharedInvalidationState() Create a buffer segment */ +/* CreateSharedInvalidationState() Initialize SI buffer */ /* */ /* should be called only 
by the POSTMASTER */ /****************************************************************************/ void -CreateSharedInvalidationState(IPCKey key, int maxBackends) +CreateSharedInvalidationState(int maxBackends) { - int status; - - /* SInvalLock gets set in spin.c, during spinlock init */ - status = SISegmentInit(true, IPCKeyGetSIBufferMemoryBlock(key), - maxBackends); - - if (status == -1) - elog(FATAL, "CreateSharedInvalidationState: failed segment init"); -} - -/****************************************************************************/ -/* AttachSharedInvalidationState(key) Attach to existing buffer segment */ -/* */ -/* should be called by each backend during startup */ -/****************************************************************************/ -void -AttachSharedInvalidationState(IPCKey key) -{ - int status; - - if (key == PrivateIPCKey) - { - CreateSharedInvalidationState(key, 16); - return; - } - /* SInvalLock gets set in spin.c, during spinlock init */ - status = SISegmentInit(false, IPCKeyGetSIBufferMemoryBlock(key), 0); - - if (status == -1) - elog(FATAL, "AttachSharedInvalidationState: failed segment init"); + /* SInvalLock must be initialized already, during spinlock init */ + SIBufferInit(maxBackends); } /* - * InitSharedInvalidationState + * InitBackendSharedInvalidationState * Initialize new backend's state info in buffer segment. - * Must be called after AttachSharedInvalidationState(). 
*/ void -InitSharedInvalidationState(void) +InitBackendSharedInvalidationState(void) { SpinAcquire(SInvalLock); if (!SIBackendInit(shmInvalBuffer)) diff --git a/src/backend/storage/ipc/sinvaladt.c b/src/backend/storage/ipc/sinvaladt.c index f4b29983433..c7612759793 100644 --- a/src/backend/storage/ipc/sinvaladt.c +++ b/src/backend/storage/ipc/sinvaladt.c @@ -8,7 +8,7 @@ * * * IDENTIFICATION - * $Header: /cvsroot/pgsql/src/backend/storage/ipc/sinvaladt.c,v 1.35 2000/11/12 20:51:51 tgl Exp $ + * $Header: /cvsroot/pgsql/src/backend/storage/ipc/sinvaladt.c,v 1.36 2000/11/28 23:27:56 tgl Exp $ * *------------------------------------------------------------------------- */ @@ -25,95 +25,38 @@ SISeg *shmInvalBuffer; -static void SISegmentAttach(IpcMemoryId shmid); -static void SISegInit(SISeg *segP, int maxBackends); static void CleanupInvalidationState(int status, Datum arg); static void SISetProcStateInvalid(SISeg *segP); -/* - * SISegmentInit - * Create a new SI memory segment, or attach to an existing one - * - * This is called with createNewSegment = true by the postmaster (or by - * a standalone backend), and subsequently with createNewSegment = false - * by backends started by the postmaster. - * - * Note: maxBackends param is only valid when createNewSegment is true - */ -int -SISegmentInit(bool createNewSegment, IPCKey key, int maxBackends) -{ - int segSize; - IpcMemoryId shmId; - - if (createNewSegment) - { - /* Kill existing segment, if any */ - IpcMemoryKill(key); - - /* - * Figure space needed. Note sizeof(SISeg) includes the first - * ProcState entry. 
- */ - segSize = sizeof(SISeg) + sizeof(ProcState) * (maxBackends - 1); - - /* Get a shared segment */ - shmId = IpcMemoryCreate(key, segSize, IPCProtection); - if (shmId < 0) - { - perror("SISegmentInit: segment create failed"); - return -1; /* an error */ - } - - /* Attach to the shared cache invalidation segment */ - /* sets the global variable shmInvalBuffer */ - SISegmentAttach(shmId); - - /* Init shared memory contents */ - SISegInit(shmInvalBuffer, maxBackends); - } - else - { - /* find existing segment */ - shmId = IpcMemoryIdGet(key, 0); - if (shmId < 0) - { - perror("SISegmentInit: segment get failed"); - return -1; /* an error */ - } - - /* Attach to the shared cache invalidation segment */ - /* sets the global variable shmInvalBuffer */ - SISegmentAttach(shmId); - } - return 1; -} /* - * SISegmentAttach - * Attach to specified shared memory segment + * SInvalShmemSize --- return shared-memory space needed */ -static void -SISegmentAttach(IpcMemoryId shmid) +int +SInvalShmemSize(int maxBackends) { - shmInvalBuffer = (SISeg *) IpcMemoryAttach(shmid); - - if (shmInvalBuffer == IpcMemAttachFailed) - { - /* XXX use validity function */ - elog(FATAL, "SISegmentAttach: Could not attach segment: %m"); - } + /* + * Figure space needed. Note sizeof(SISeg) includes the first + * ProcState entry. 
+ */ + return sizeof(SISeg) + sizeof(ProcState) * (maxBackends - 1); } /* - * SISegInit - * Initialize contents of a new shared memory sinval segment + * SIBufferInit + * Create and initialize a new SI message buffer */ -static void -SISegInit(SISeg *segP, int maxBackends) +void +SIBufferInit(int maxBackends) { + int segSize; + SISeg *segP; int i; + /* Allocate space in shared memory */ + segSize = SInvalShmemSize(maxBackends); + shmInvalBuffer = segP = (SISeg *) ShmemAlloc(segSize); + /* Clear message counters, save size of procState array */ segP->minMsgNum = 0; segP->maxMsgNum = 0; diff --git a/src/backend/storage/ipc/spin.c b/src/backend/storage/ipc/spin.c index 674ee06a9a3..a93ae69e032 100644 --- a/src/backend/storage/ipc/spin.c +++ b/src/backend/storage/ipc/spin.c @@ -3,31 +3,24 @@ * spin.c * routines for managing spin locks * + * POSTGRES has two kinds of locks: semaphores (which put the + * process to sleep) and spinlocks (which are supposed to be + * short term locks). Spinlocks are implemented via test-and-set (TAS) + * instructions if possible, else via semaphores. The semaphore method + * is too slow to be useful :-( + * * Portions Copyright (c) 1996-2000, PostgreSQL, Inc * Portions Copyright (c) 1994, Regents of the University of California * * * IDENTIFICATION - * $Header: /cvsroot/pgsql/src/backend/storage/ipc/Attic/spin.c,v 1.25 2000/05/31 00:28:29 petere Exp $ + * $Header: /cvsroot/pgsql/src/backend/storage/ipc/Attic/spin.c,v 1.26 2000/11/28 23:27:56 tgl Exp $ * *------------------------------------------------------------------------- */ -/* - * POSTGRES has two kinds of locks: semaphores (which put the - * process to sleep) and spinlocks (which are supposed to be - * short term locks). Currently both are implemented as SysV - * semaphores, but presumably this can change if we move to - * a machine with a test-and-set (TAS) instruction. 
Its probably - * a good idea to think about (and allocate) short term and long - * term semaphores separately anyway. - * - * NOTE: These routines are not supposed to be widely used in Postgres. - * They are preserved solely for the purpose of porting Mark Sullivan's - * buffer manager to Postgres. - */ -#include <errno.h> #include "postgres.h" +#include <errno.h> #ifndef HAS_TEST_AND_SET #include <sys/sem.h> #endif @@ -35,39 +28,33 @@ #include "storage/proc.h" #include "storage/s_lock.h" - -/* globals used in this file */ -IpcSemaphoreId SpinLockId; - -#ifdef HAS_TEST_AND_SET -/* real spin lock implementations */ - -void -CreateSpinlocks(IPCKey key) -{ - /* the spin lock shared memory must have been created by now */ - return; -} - -void -InitSpinLocks(void) -{ - extern SPINLOCK ShmemLock; - extern SPINLOCK ShmemIndexLock; - extern SPINLOCK BufMgrLock; - extern SPINLOCK LockMgrLock; - extern SPINLOCK ProcStructLock; - extern SPINLOCK SInvalLock; - extern SPINLOCK OidGenLockId; - extern SPINLOCK XidGenLockId; - extern SPINLOCK ControlFileLockId; +/* Probably should move these to an appropriate header file */ +extern SPINLOCK ShmemLock; +extern SPINLOCK ShmemIndexLock; +extern SPINLOCK BufMgrLock; +extern SPINLOCK LockMgrLock; +extern SPINLOCK ProcStructLock; +extern SPINLOCK SInvalLock; +extern SPINLOCK OidGenLockId; +extern SPINLOCK XidGenLockId; +extern SPINLOCK ControlFileLockId; #ifdef STABLE_MEMORY_STORAGE - extern SPINLOCK MMCacheLock; +extern SPINLOCK MMCacheLock; #endif - /* These six spinlocks have fixed location is shmem */ + +/* + * Initialize identifiers for permanent spinlocks during startup + * + * The same identifiers are used for both TAS and semaphore implementations, + * although in one case they are indexes into a shmem array and in the other + * they are semaphore numbers. 
+ */ +static void +InitSpinLockIDs(void) +{ ShmemLock = (SPINLOCK) SHMEMLOCKID; ShmemIndexLock = (SPINLOCK) SHMEMINDEXLOCKID; BufMgrLock = (SPINLOCK) BUFMGRLOCKID; @@ -81,11 +68,18 @@ InitSpinLocks(void) #ifdef STABLE_MEMORY_STORAGE MMCacheLock = (SPINLOCK) MMCACHELOCKID; #endif - - return; } +#ifdef HAS_TEST_AND_SET + +/* real spin lock implementation */ + +typedef struct slock +{ + slock_t shlock; +} SLock; + #ifdef LOCK_DEBUG bool Trace_spinlocks = false; @@ -93,193 +87,268 @@ inline static void PRINT_SLDEBUG(const char * where, SPINLOCK lockid, const SLock * lock) { if (Trace_spinlocks) - elog(DEBUG, - "%s: id=%d (locklock=%d, flag=%d, nshlocks=%d, shlock=%d, exlock=%d)", - where, lockid, - lock->locklock, lock->flag, lock->nshlocks, lock->shlock, lock->exlock); + elog(DEBUG, "%s: id=%d", where, lockid); } #else /* not LOCK_DEBUG */ #define PRINT_SLDEBUG(a,b,c) #endif /* not LOCK_DEBUG */ -/* from ipc.c */ -extern SLock *SLockArray; +static SLock *SLockArray = NULL; + +#define SLOCKMEMORYSIZE ((int) MAX_SPINS * sizeof(SLock)) + +/* + * SLockShmemSize --- return shared-memory space needed + */ +int +SLockShmemSize(void) +{ + return MAXALIGN(SLOCKMEMORYSIZE); +} + +/* + * CreateSpinlocks --- create and initialize spinlocks during startup + */ +void +CreateSpinlocks(PGShmemHeader *seghdr) +{ + int id; + + /* + * We must allocate the space "by hand" because shmem.c isn't up yet + */ + SLockArray = (SLock *) (((char *) seghdr) + seghdr->freeoffset); + seghdr->freeoffset += MAXALIGN(SLOCKMEMORYSIZE); + Assert(seghdr->freeoffset <= seghdr->totalsize); + + /* + * Initialize all spinlocks to "unlocked" state + */ + for (id = 0; id < (int) MAX_SPINS; id++) + { + SLock *slckP = &(SLockArray[id]); + + S_INIT_LOCK(&(slckP->shlock)); + } + + /* + * Assign indexes for fixed spinlocks + */ + InitSpinLockIDs(); +} void SpinAcquire(SPINLOCK lockid) { - SLock *slckP; + SLock *slckP = &(SLockArray[lockid]); - /* This used to be in ipc.c, but move here to reduce function calls */ - 
slckP = &(SLockArray[lockid]); PRINT_SLDEBUG("SpinAcquire", lockid, slckP); -ex_try_again: - S_LOCK(&(slckP->locklock)); - switch (slckP->flag) - { - case NOLOCK: - slckP->flag = EXCLUSIVELOCK; - S_LOCK(&(slckP->exlock)); - S_LOCK(&(slckP->shlock)); - S_UNLOCK(&(slckP->locklock)); - PRINT_SLDEBUG("OUT", lockid, slckP); - break; - case SHAREDLOCK: - case EXCLUSIVELOCK: - S_UNLOCK(&(slckP->locklock)); - S_LOCK(&(slckP->exlock)); - S_UNLOCK(&(slckP->exlock)); - goto ex_try_again; - } + S_LOCK(&(slckP->shlock)); PROC_INCR_SLOCK(lockid); - PRINT_SLDEBUG("SpinAcquire/success", lockid, slckP); + PRINT_SLDEBUG("SpinAcquire/done", lockid, slckP); } void SpinRelease(SPINLOCK lockid) { - SLock *slckP; - - /* This used to be in ipc.c, but move here to reduce function calls */ - slckP = &(SLockArray[lockid]); + SLock *slckP = &(SLockArray[lockid]); /* * Check that we are actually holding the lock we are releasing. This * can be done only after MyProc has been initialized. */ Assert(!MyProc || MyProc->sLocks[lockid] > 0); - Assert(slckP->flag != NOLOCK); - PROC_DECR_SLOCK(lockid); PRINT_SLDEBUG("SpinRelease", lockid, slckP); - S_LOCK(&(slckP->locklock)); - /* ------------- - * give favor to read processes - * ------------- + S_UNLOCK(&(slckP->shlock)); + PRINT_SLDEBUG("SpinRelease/done", lockid, slckP); +} + +#else /* !HAS_TEST_AND_SET */ + +/* + * No TAS, so spinlocks are implemented using SysV semaphores. + * + * We support two slightly different APIs here: SpinAcquire/SpinRelease + * work with SPINLOCK integer indexes for the permanent spinlocks, which + * are all assumed to live in the first spinlock semaphore set. There + * is also an emulation of the s_lock.h TAS-spinlock macros; for that case, + * typedef slock_t stores the semId and sem number of the sema to use. + * The semas needed are created by CreateSpinlocks and doled out by + * s_init_lock_sema. 
+ * + * Since many systems have a rather small SEMMSL limit on semas per set, + * we allocate the semaphores required in sets of SPINLOCKS_PER_SET semas. + * This value is deliberately made equal to PROC_NSEMS_PER_SET so that all + * sema sets allocated by Postgres will be the same size; that eases the + * semaphore-recycling logic in IpcSemaphoreCreate(). + * + * Note that the SpinLockIds array is not in shared memory; it is filled + * by the postmaster and then inherited through fork() by backends. This + * is OK because its contents do not change after system startup. + */ + +#define SPINLOCKS_PER_SET PROC_NSEMS_PER_SET + +static IpcSemaphoreId *SpinLockIds = NULL; + +static int numSpinSets = 0; /* number of sema sets used */ +static int numSpinLocks = 0; /* total number of semas allocated */ +static int nextSpinLock = 0; /* next free spinlock index */ + +static void SpinFreeAllSemaphores(void); + +/* + * SLockShmemSize --- return shared-memory space needed + */ +int +SLockShmemSize(void) +{ + return 0; +} + +/* + * CreateSpinlocks --- create and initialize spinlocks during startup + */ +void +CreateSpinlocks(PGShmemHeader *seghdr) +{ + int i; + + if (SpinLockIds == NULL) + { + /* + * Compute number of spinlocks needed. If this logic gets any more + * complicated, it should be distributed into the affected modules, + * similar to the way shmem space estimation is handled. + * + * For now, though, we just need the fixed spinlocks (MAX_SPINS), + * two spinlocks per shared disk buffer, and four spinlocks for XLOG. 
+ */ + numSpinLocks = (int) MAX_SPINS + 2 * NBuffers + 4; + + /* might as well round up to a multiple of SPINLOCKS_PER_SET */ + numSpinSets = (numSpinLocks - 1) / SPINLOCKS_PER_SET + 1; + numSpinLocks = numSpinSets * SPINLOCKS_PER_SET; + + SpinLockIds = (IpcSemaphoreId *) + malloc(numSpinSets * sizeof(IpcSemaphoreId)); + Assert(SpinLockIds != NULL); + } + + for (i = 0; i < numSpinSets; i++) + SpinLockIds[i] = -1; + + /* + * Arrange to delete semas on exit --- set this up now so that we + * will clean up if allocation fails. We use our own freeproc, + * rather than IpcSemaphoreCreate's removeOnExit option, because + * we don't want to fill up the on_shmem_exit list with a separate + * entry for each semaphore set. */ - slckP->flag = NOLOCK; - if (slckP->nshlocks > 0) + on_shmem_exit(SpinFreeAllSemaphores, 0); + + /* Create sema sets and set all semas to count 1 */ + for (i = 0; i < numSpinSets; i++) { - while (slckP->nshlocks > 0) - { - S_UNLOCK(&(slckP->shlock)); - S_LOCK(&(slckP->comlock)); - } - S_UNLOCK(&(slckP->shlock)); + SpinLockIds[i] = IpcSemaphoreCreate(SPINLOCKS_PER_SET, + IPCProtection, + 1, + false); } - else - S_UNLOCK(&(slckP->shlock)); - S_UNLOCK(&(slckP->exlock)); - S_UNLOCK(&(slckP->locklock)); - PRINT_SLDEBUG("SpinRelease/released", lockid, slckP); + + /* + * Assign indexes for fixed spinlocks + */ + Assert(MAX_SPINS <= SPINLOCKS_PER_SET); + InitSpinLockIDs(); + + /* Init counter for allocating dynamic spinlocks */ + nextSpinLock = MAX_SPINS; } -#else /* !HAS_TEST_AND_SET */ -/* Spinlocks are implemented using SysV semaphores */ +/* + * SpinFreeAllSemaphores - + * called at shmem_exit time, ie when exiting the postmaster or + * destroying shared state for a failed set of backends. + * Free up all the semaphores allocated for spinlocks. 
+ */ +static void +SpinFreeAllSemaphores(void) +{ + int i; -static bool AttachSpinLocks(IPCKey key); -static bool SpinIsLocked(SPINLOCK lock); + for (i = 0; i < numSpinSets; i++) + { + if (SpinLockIds[i] >= 0) + IpcSemaphoreKill(SpinLockIds[i]); + } +} /* - * SpinAcquire -- try to grab a spinlock + * SpinAcquire -- grab a fixed spinlock * * FAILS if the semaphore is corrupted. */ void SpinAcquire(SPINLOCK lock) { - IpcSemaphoreLock(SpinLockId, lock, IpcExclusiveLock); + IpcSemaphoreLock(SpinLockIds[0], lock); PROC_INCR_SLOCK(lock); } /* - * SpinRelease -- release a spin lock + * SpinRelease -- release a fixed spin lock * * FAILS if the semaphore is corrupted */ void SpinRelease(SPINLOCK lock) { - Assert(SpinIsLocked(lock)); - PROC_DECR_SLOCK(lock); - IpcSemaphoreUnlock(SpinLockId, lock, IpcExclusiveLock); -} - -static bool -SpinIsLocked(SPINLOCK lock) -{ +#ifdef USE_ASSERT_CHECKING + /* Check it's locked */ int semval; - semval = IpcSemaphoreGetValue(SpinLockId, lock); - return semval < IpcSemaphoreDefaultStartValue; + semval = IpcSemaphoreGetValue(SpinLockIds[0], lock); + Assert(semval < 1); +#endif + PROC_DECR_SLOCK(lock); + IpcSemaphoreUnlock(SpinLockIds[0], lock); } /* - * CreateSpinlocks -- Create a sysV semaphore array for - * the spinlocks - * + * s_lock.h hardware-spinlock emulation */ + void -CreateSpinlocks(IPCKey key) +s_init_lock_sema(volatile slock_t *lock) { - - SpinLockId = IpcSemaphoreCreate(key, MAX_SPINS, IPCProtection, - IpcSemaphoreDefaultStartValue, 1); - - if (SpinLockId <= 0) - elog(STOP, "CreateSpinlocks: cannot create spin locks"); - - return; + if (nextSpinLock >= numSpinLocks) + elog(FATAL, "s_init_lock_sema: not enough semaphores"); + lock->semId = SpinLockIds[nextSpinLock / SPINLOCKS_PER_SET]; + lock->sem = nextSpinLock % SPINLOCKS_PER_SET; + nextSpinLock++; } -/* - * InitSpinLocks -- Spinlock bootstrapping - * - * We need several spinlocks for bootstrapping: - * ShmemIndexLock (for the shmem index table) and - * ShmemLock (for the 
shmem allocator), BufMgrLock (for buffer - * pool exclusive access), LockMgrLock (for the lock table), and - * ProcStructLock (a spin lock for the shared process structure). - * If there's a Sony WORM drive attached, we also have a spinlock - * (SJCacheLock) for it. Same story for the main memory storage mgr. - * - */ void -InitSpinLocks(void) +s_unlock_sema(volatile slock_t *lock) { - extern SPINLOCK ShmemLock; - extern SPINLOCK ShmemIndexLock; - extern SPINLOCK BufMgrLock; - extern SPINLOCK LockMgrLock; - extern SPINLOCK ProcStructLock; - extern SPINLOCK SInvalLock; - extern SPINLOCK OidGenLockId; - extern SPINLOCK XidGenLockId; - extern SPINLOCK ControlFileLockId; - -#ifdef STABLE_MEMORY_STORAGE - extern SPINLOCK MMCacheLock; - -#endif - - /* These five (or six) spinlocks have fixed location is shmem */ - ShmemLock = (SPINLOCK) SHMEMLOCKID; - ShmemIndexLock = (SPINLOCK) SHMEMINDEXLOCKID; - BufMgrLock = (SPINLOCK) BUFMGRLOCKID; - LockMgrLock = (SPINLOCK) LOCKMGRLOCKID; - ProcStructLock = (SPINLOCK) PROCSTRUCTLOCKID; - SInvalLock = (SPINLOCK) SINVALLOCKID; - OidGenLockId = (SPINLOCK) OIDGENLOCKID; - XidGenLockId = (SPINLOCK) XIDGENLOCKID; - ControlFileLockId = (SPINLOCK) CNTLFILELOCKID; + IpcSemaphoreUnlock(lock->semId, lock->sem); +} -#ifdef STABLE_MEMORY_STORAGE - MMCacheLock = (SPINLOCK) MMCACHELOCKID; -#endif +bool +s_lock_free_sema(volatile slock_t *lock) +{ + return IpcSemaphoreGetValue(lock->semId, lock->sem) > 0; +} - return; +int +tas_sema(volatile slock_t *lock) +{ + /* Note that TAS macros return 0 if *success* */ + return ! IpcSemaphoreTryLock(lock->semId, lock->sem); } #endif /* !HAS_TEST_AND_SET */ |