]> granicus.if.org Git - postgresql/commitdiff
Avoid "could not reattach" by providing space for concurrent allocation.
authorNoah Misch <noah@leadboat.com>
Tue, 9 Apr 2019 04:39:00 +0000 (21:39 -0700)
committerNoah Misch <noah@leadboat.com>
Tue, 9 Apr 2019 04:39:04 +0000 (21:39 -0700)
We've long had reports of intermittent "could not reattach to shared
memory" errors on Windows.  Buildfarm member dory fails that way when
PGSharedMemoryReAttach() execution overlaps with creation of a thread
for the process's "default thread pool".  Fix that by providing a second
region to receive asynchronous allocations that would otherwise intrude
into UsedShmemSegAddr.  In pgwin32_ReserveSharedMemoryRegion(), stop
trying to free reservations landing at incorrect addresses; the caller's
next step has been to terminate the affected process.  Back-patch to 9.4
(all supported versions).

Reviewed by Tom Lane.  He also did much of the prerequisite research;
see commit bcbf2346d69f6006f126044864dd9383d50d87b4.

Discussion: https://postgr.es/m/20190402135442.GA1173872@rfd.leadboat.com

src/backend/port/win32_shmem.c
src/backend/postmaster/postmaster.c
src/include/storage/pg_shmem.h

index 110bdcc703dce07b8a29b051051b8b2f1ce16a89..64ba2296d4f3871b3a92aa54ef9f0742509422f8 100644 (file)
 #include "storage/ipc.h"
 #include "storage/pg_shmem.h"
 
+/*
+ * Early in a process's life, Windows asynchronously creates threads for the
+ * process's "default thread pool"
+ * (https://docs.microsoft.com/en-us/windows/desktop/ProcThread/thread-pools).
+ * Occasionally, thread creation allocates a stack after
+ * PGSharedMemoryReAttach() has released UsedShmemSegAddr and before it has
+ * mapped shared memory at UsedShmemSegAddr.  This would cause mapping to fail
+ * if the allocator preferred the just-released region for allocating the new
+ * thread stack.  We observed such failures in some Windows Server 2016
+ * configurations.  To give the system another region to prefer, reserve and
+ * release an additional, protective region immediately before reserving or
+ * releasing shared memory.  The idea is that, if the allocator handed out
+ * REGION1 pages before REGION2 pages at one occasion, it will do so whenever
+ * both regions are free.  Windows Server 2016 exhibits that behavior, and a
+ * system behaving differently would have less need to protect
+ * UsedShmemSegAddr.  The protective region must be at least large enough for
+ * one thread stack.  However, ten times as much is less than 2% of the 32-bit
+ * address space and is negligible relative to the 64-bit address space.
+ */
+#define PROTECTIVE_REGION_SIZE (10 * WIN32_STACK_RLIMIT)
+void      *ShmemProtectiveRegion = NULL;
+
 HANDLE         UsedShmemSegID = INVALID_HANDLE_VALUE;
 void      *UsedShmemSegAddr = NULL;
 static Size UsedShmemSegSize = 0;
@@ -133,6 +155,12 @@ PGSharedMemoryCreate(Size size, bool makePrivate, int port,
                                (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
                                 errmsg("huge pages not supported on this platform")));
 
+       ShmemProtectiveRegion = VirtualAlloc(NULL, PROTECTIVE_REGION_SIZE,
+                                                                                MEM_RESERVE, PAGE_NOACCESS);
+       if (ShmemProtectiveRegion == NULL)
+               elog(FATAL, "could not reserve memory region: error code %lu",
+                        GetLastError());
+
        /* Room for a header? */
        Assert(size > MAXALIGN(sizeof(PGShmemHeader)));
 
@@ -263,9 +291,9 @@ PGSharedMemoryCreate(Size size, bool makePrivate, int port,
  * an already existing shared memory segment, using the handle inherited from
  * the postmaster.
  *
- * UsedShmemSegID and UsedShmemSegAddr are implicit parameters to this
- * routine.  The caller must have already restored them to the postmaster's
- * values.
+ * ShmemProtectiveRegion, UsedShmemSegID and UsedShmemSegAddr are implicit
+ * parameters to this routine.  The caller must have already restored them to
+ * the postmaster's values.
  */
 void
 PGSharedMemoryReAttach(void)
@@ -273,12 +301,16 @@ PGSharedMemoryReAttach(void)
        PGShmemHeader *hdr;
        void       *origUsedShmemSegAddr = UsedShmemSegAddr;
 
+       Assert(ShmemProtectiveRegion != NULL);
        Assert(UsedShmemSegAddr != NULL);
        Assert(IsUnderPostmaster);
 
        /*
-        * Release memory region reservation that was made by the postmaster
+        * Release memory region reservations made by the postmaster
         */
+       if (VirtualFree(ShmemProtectiveRegion, 0, MEM_RELEASE) == 0)
+               elog(FATAL, "failed to release reserved memory region (addr=%p): error code %lu",
+                        ShmemProtectiveRegion, GetLastError());
        if (VirtualFree(UsedShmemSegAddr, 0, MEM_RELEASE) == 0)
                elog(FATAL, "failed to release reserved memory region (addr=%p): error code %lu",
                         UsedShmemSegAddr, GetLastError());
@@ -307,13 +339,14 @@ PGSharedMemoryReAttach(void)
  * The child process startup logic might or might not call PGSharedMemoryDetach
  * after this; make sure that it will be a no-op if called.
  *
- * UsedShmemSegID and UsedShmemSegAddr are implicit parameters to this
- * routine.  The caller must have already restored them to the postmaster's
- * values.
+ * ShmemProtectiveRegion, UsedShmemSegID and UsedShmemSegAddr are implicit
+ * parameters to this routine.  The caller must have already restored them to
+ * the postmaster's values.
  */
 void
 PGSharedMemoryNoReAttach(void)
 {
+       Assert(ShmemProtectiveRegion != NULL);
        Assert(UsedShmemSegAddr != NULL);
        Assert(IsUnderPostmaster);
 
@@ -340,12 +373,25 @@ PGSharedMemoryNoReAttach(void)
  * Rather, this is for subprocesses that have inherited an attachment and want
  * to get rid of it.
  *
- * UsedShmemSegID and UsedShmemSegAddr are implicit parameters to this
- * routine.
+ * ShmemProtectiveRegion, UsedShmemSegID and UsedShmemSegAddr are implicit
+ * parameters to this routine.
  */
 void
 PGSharedMemoryDetach(void)
 {
+       /*
+        * Releasing the protective region liberates an unimportant quantity of
+        * address space, but be tidy.
+        */
+       if (ShmemProtectiveRegion != NULL)
+       {
+               if (VirtualFree(ShmemProtectiveRegion, 0, MEM_RELEASE) == 0)
+                       elog(LOG, "failed to release reserved memory region (addr=%p): error code %lu",
+                                ShmemProtectiveRegion, GetLastError());
+
+               ShmemProtectiveRegion = NULL;
+       }
+
        /* Unmap the view, if it's mapped */
        if (UsedShmemSegAddr != NULL)
        {
@@ -403,19 +449,22 @@ pgwin32_ReserveSharedMemoryRegion(HANDLE hChild)
 {
        void       *address;
 
+       Assert(ShmemProtectiveRegion != NULL);
        Assert(UsedShmemSegAddr != NULL);
        Assert(UsedShmemSegSize != 0);
 
-       address = VirtualAllocEx(hChild, UsedShmemSegAddr, UsedShmemSegSize,
-                                                        MEM_RESERVE, PAGE_READWRITE);
+       /* ShmemProtectiveRegion */
+       address = VirtualAllocEx(hChild, ShmemProtectiveRegion,
+                                                        PROTECTIVE_REGION_SIZE,
+                                                        MEM_RESERVE, PAGE_NOACCESS);
        if (address == NULL)
        {
                /* Don't use FATAL since we're running in the postmaster */
                elog(LOG, "could not reserve shared memory region (addr=%p) for child %p: error code %lu",
-                        UsedShmemSegAddr, hChild, GetLastError());
+                        ShmemProtectiveRegion, hChild, GetLastError());
                return false;
        }
-       if (address != UsedShmemSegAddr)
+       if (address != ShmemProtectiveRegion)
        {
                /*
                 * Should never happen - in theory if allocation granularity causes
@@ -423,9 +472,24 @@ pgwin32_ReserveSharedMemoryRegion(HANDLE hChild)
                 *
                 * Don't use FATAL since we're running in the postmaster.
                 */
+               elog(LOG, "reserved shared memory region got incorrect address %p, expected %p",
+                        address, ShmemProtectiveRegion);
+               return false;
+       }
+
+       /* UsedShmemSegAddr */
+       address = VirtualAllocEx(hChild, UsedShmemSegAddr, UsedShmemSegSize,
+                                                        MEM_RESERVE, PAGE_READWRITE);
+       if (address == NULL)
+       {
+               elog(LOG, "could not reserve shared memory region (addr=%p) for child %p: error code %lu",
+                        UsedShmemSegAddr, hChild, GetLastError());
+               return false;
+       }
+       if (address != UsedShmemSegAddr)
+       {
                elog(LOG, "reserved shared memory region got incorrect address %p, expected %p",
                         address, UsedShmemSegAddr);
-               VirtualFreeEx(hChild, address, 0, MEM_RELEASE);
                return false;
        }
 
index 644b4c6b2c89fac22dbc1c62c07dde06ebfa54f4..abbd18f0730740613c906bc99d5be30968837f83 100644 (file)
@@ -479,6 +479,7 @@ typedef struct
 #ifndef WIN32
        unsigned long UsedShmemSegID;
 #else
+       void       *ShmemProtectiveRegion;
        HANDLE          UsedShmemSegID;
 #endif
        void       *UsedShmemSegAddr;
@@ -5898,6 +5899,9 @@ save_backend_variables(BackendParameters *param, Port *port,
        param->MyCancelKey = MyCancelKey;
        param->MyPMChildSlot = MyPMChildSlot;
 
+#ifdef WIN32
+       param->ShmemProtectiveRegion = ShmemProtectiveRegion;
+#endif
        param->UsedShmemSegID = UsedShmemSegID;
        param->UsedShmemSegAddr = UsedShmemSegAddr;
 
@@ -6129,6 +6133,9 @@ restore_backend_variables(BackendParameters *param, Port *port)
        MyCancelKey = param->MyCancelKey;
        MyPMChildSlot = param->MyPMChildSlot;
 
+#ifdef WIN32
+       ShmemProtectiveRegion = param->ShmemProtectiveRegion;
+#endif
        UsedShmemSegID = param->UsedShmemSegID;
        UsedShmemSegAddr = param->UsedShmemSegAddr;
 
index 9dbcbce0692f8ee794c22ff3098a45cfe4640dc5..f36ecd51369311e18af0190a2f9a3177a4181e30 100644 (file)
@@ -56,6 +56,7 @@ typedef enum
 extern unsigned long UsedShmemSegID;
 #else
 extern HANDLE UsedShmemSegID;
+extern void *ShmemProtectiveRegion;
 #endif
 extern void *UsedShmemSegAddr;