In immediate shutdown, postmaster should not exit till children are gone.

author Tom Lane

Fri, 19 Jun 2015 18:23:39 +0000 (14:23 -0400)

committer Tom Lane

Fri, 19 Jun 2015 18:23:39 +0000 (14:23 -0400)
author Tom Lane
Fri, 19 Jun 2015 18:23:39 +0000 (14:23 -0400)
committer Tom Lane
Fri, 19 Jun 2015 18:23:39 +0000 (14:23 -0400)
diff --git a/doc/src/sgml/runtime.sgml b/doc/src/sgml/runtime.sgml

index 39bb74784916dd76b70a38f758cd6287a61c101c..5771757c5fd6dfd36a25e31e2bc07a5c0723f814 100644 (file)
--- a/doc/src/sgml/runtime.sgml
+++ b/doc/src/sgml/runtime.sgml
@@ -1426,10 +1426,11 @@ $ sysctl -w vm.nr_hugepages=3170
        
        This is the Immediate Shutdown mode.
        The server will send SIGQUIT to all child
-      processes and wait for them to terminate.  Those that don't terminate
-      within 5 seconds, will be sent SIGKILL by the
-      master postgres process, which will then terminate
-      without further waiting.  This will lead to recovery (by
+      processes and wait for them to terminate.  If any do not terminate
+      within 5 seconds, they will be sent SIGKILL.
+      The master server process exits as soon as all child processes have
+      exited, without doing normal database shutdown processing.
+      This will lead to recovery (by
        replaying the WAL log) upon next start-up. This is recommended
        only in emergencies.
        
diff --git a/src/backend/postmaster/postmaster.c b/src/backend/postmaster/postmaster.c

index d6721d7971c7f2a3afd6f882b49f2331c0ad148f..002e6f29a011e9ad1409ab64586cbdf474b67c92 100644 (file)
--- a/src/backend/postmaster/postmaster.c
+++ b/src/backend/postmaster/postmaster.c
@@ -324,8 +324,10 @@ typedef enum
  
  static PMState pmState = PM_INIT;
  
-/* Start time of abort processing at immediate shutdown or child crash */
-static time_t AbortStartTime;
+/* Start time of SIGKILL timeout during immediate shutdown or child crash */
+/* Zero means timeout is not running */
+static time_t AbortStartTime = 0;
+/* Length of said timeout */
  #define SIGKILL_CHILDREN_AFTER_SECS        5
  
  static bool ReachedNormalRunning = false;      /* T if we've reached PM_RUN */
@@ -1411,7 +1413,8 @@ checkDataDir(void)
   * In normal conditions we wait at most one minute, to ensure that the other
   * background tasks handled by ServerLoop get done even when no requests are
   * arriving.  However, if there are background workers waiting to be started,
- * we don't actually sleep so that they are quickly serviced.
+ * we don't actually sleep so that they are quickly serviced.  Other exception
+ * cases are as shown in the code.
   */
  static void
  DetermineSleepTime(struct timeval * timeout)
@@ -1425,11 +1428,12 @@ DetermineSleepTime(struct timeval * timeout)
     if (Shutdown > NoShutdown ||
         (!StartWorkerNeeded && !HaveCrashedWorker))
     {
-       if (AbortStartTime > 0)
+       if (AbortStartTime != 0)
         {
             /* time left to abort; clamp to 0 in case it already expired */
-           timeout->tv_sec = Max(SIGKILL_CHILDREN_AFTER_SECS -
-                                 (time(NULL) - AbortStartTime), 0);
+           timeout->tv_sec = SIGKILL_CHILDREN_AFTER_SECS -
+               (time(NULL) - AbortStartTime);
+           timeout->tv_sec = Max(timeout->tv_sec, 0);
             timeout->tv_usec = 0;
         }
         else
@@ -1699,20 +1703,13 @@ ServerLoop(void)
          * Note we also do this during recovery from a process crash.
          */
         if ((Shutdown >= ImmediateShutdown || (FatalError && !SendStop)) &&
-           AbortStartTime > 0 &&
-           now - AbortStartTime >= SIGKILL_CHILDREN_AFTER_SECS)
+           AbortStartTime != 0 &&
+           (now - AbortStartTime) >= SIGKILL_CHILDREN_AFTER_SECS)
         {
             /* We were gentle with them before. Not anymore */
             TerminateChildren(SIGKILL);
             /* reset flag so we don't SIGKILL again */
             AbortStartTime = 0;
-
-           /*
-            * Additionally, unless we're recovering from a process crash,
-            * it's now the time for postmaster to abandon ship.
-            */
-           if (!FatalError)
-               ExitPostmaster(1);
         }
     }
  }
author	Tom Lane
	Fri, 19 Jun 2015 18:23:39 +0000 (14:23 -0400)
committer	Tom Lane
	Fri, 19 Jun 2015 18:23:39 +0000 (14:23 -0400)
doc/src/sgml/runtime.sgml		patch \| blob \| blame \| history
src/backend/postmaster/postmaster.c		patch \| blob \| blame \| history