Be more careful to not lose sync in the FE/BE protocol.

author Heikki Linnakangas <heikki.linnakangas@iki.fi>

Mon, 2 Feb 2015 15:08:56 +0000 (17:08 +0200)

committer Heikki Linnakangas <heikki.linnakangas@iki.fi>

Mon, 2 Feb 2015 15:09:46 +0000 (17:09 +0200)
author Heikki Linnakangas <heikki.linnakangas@iki.fi>
Mon, 2 Feb 2015 15:08:56 +0000 (17:08 +0200)
committer Heikki Linnakangas <heikki.linnakangas@iki.fi>
Mon, 2 Feb 2015 15:09:46 +0000 (17:09 +0200)
diff --git a/src/backend/commands/copy.c b/src/backend/commands/copy.c

index be829a6eadc657080515e58534991051168f955c..3eba9efcc6322445b917c16fb9745f66d7f3ece4 100644 (file)
--- a/src/backend/commands/copy.c
+++ b/src/backend/commands/copy.c
@@ -406,6 +406,8 @@ ReceiveCopyBegin(CopyState cstate)
                                         (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
                         errmsg("COPY BINARY is not supported to stdout or from stdin")));
                 pq_putemptymessage('G');
+               /* any error in old protocol will make us lose sync */
+               pq_startmsgread();
                 cstate->copy_dest = COPY_OLD_FE;
         }
         else
@@ -416,6 +418,8 @@ ReceiveCopyBegin(CopyState cstate)
                                         (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
                         errmsg("COPY BINARY is not supported to stdout or from stdin")));
                 pq_putemptymessage('D');
+               /* any error in old protocol will make us lose sync */
+               pq_startmsgread();
                 cstate->copy_dest = COPY_OLD_FE;
         }
         /* We *must* flush here to ensure FE knows it can send. */
@@ -602,6 +606,8 @@ CopyGetData(CopyState cstate, void *databuf, int minread, int maxread)
                                         int                     mtype;
  
                         readmessage:
+                                       HOLD_CANCEL_INTERRUPTS();
+                                       pq_startmsgread();
                                         mtype = pq_getbyte();
                                         if (mtype == EOF)
                                                 ereport(ERROR,
@@ -611,6 +617,7 @@ CopyGetData(CopyState cstate, void *databuf, int minread, int maxread)
                                                 ereport(ERROR,
                                                                 (errcode(ERRCODE_CONNECTION_FAILURE),
                                                                  errmsg("unexpected EOF on client connection with an open transaction")));
+                                       RESUME_CANCEL_INTERRUPTS();
                                         switch (mtype)
                                         {
                                                 case 'd':               /* CopyData */
@@ -2370,6 +2377,13 @@ CopyFrom(CopyState cstate)
  
         MemoryContextSwitchTo(oldcontext);
  
+       /*
+        * In the old protocol, tell pqcomm that we can process normal protocol
+        * messages again.
+        */
+       if (cstate->copy_dest == COPY_OLD_FE)
+               pq_endmsgread();
+
         /* Execute AFTER STATEMENT insertion triggers */
         ExecASInsertTriggers(estate, resultRelInfo);
  
diff --git a/src/backend/libpq/auth.c b/src/backend/libpq/auth.c

index 09491fd5089d06295dcbe39264afd5870d88b324..2a67bcd9926832ca0b856998306d9d0aab5811c1 100644 (file)
--- a/src/backend/libpq/auth.c
+++ b/src/backend/libpq/auth.c
@@ -625,6 +625,7 @@ recv_password_packet(Port *port)
  {
         StringInfoData buf;
  
+       pq_startmsgread();
         if (PG_PROTOCOL_MAJOR(port->proto) >= 3)
         {
                 /* Expect 'p' message type */
@@ -849,6 +850,7 @@ pg_GSS_recvauth(Port *port)
          */
         do
         {
+               pq_startmsgread();
                 mtype = pq_getbyte();
                 if (mtype != 'p')
                 {
@@ -1083,6 +1085,7 @@ pg_SSPI_recvauth(Port *port)
          */
         do
         {
+               pq_startmsgread();
                 mtype = pq_getbyte();
                 if (mtype != 'p')
                 {
diff --git a/src/backend/libpq/pqcomm.c b/src/backend/libpq/pqcomm.c

index 605d8913b16d2487c0f4f6c4a9d4baf6cc2635b8..c08c5d73ba403ac8a7bad33bdbaf1e8343c5c820 100644 (file)
--- a/src/backend/libpq/pqcomm.c
+++ b/src/backend/libpq/pqcomm.c
@@ -129,8 +129,9 @@ static int  PqRecvLength;           /* End of data available in PqRecvBuffer */
  /*
   * Message status
   */
-static bool PqCommBusy;
-static bool DoingCopyOut;
+static bool PqCommBusy;                        /* busy sending data to the client */
+static bool PqCommReadingMsg;  /* in the middle of reading a message */
+static bool DoingCopyOut;              /* in old-protocol COPY OUT processing */
  
  
  /* Internal functions */
@@ -156,6 +157,7 @@ pq_init(void)
         PqSendBuffer = MemoryContextAlloc(TopMemoryContext, PqSendBufferSize);
         PqSendPointer = PqSendStart = PqRecvPointer = PqRecvLength = 0;
         PqCommBusy = false;
+       PqCommReadingMsg = false;
         DoingCopyOut = false;
         on_proc_exit(pq_close, 0);
  }
@@ -890,6 +892,8 @@ pq_recvbuf(void)
  int
  pq_getbyte(void)
  {
+       Assert(PqCommReadingMsg);
+
         while (PqRecvPointer >= PqRecvLength)
         {
                 if (pq_recvbuf())               /* If nothing in buffer, then recv some */
@@ -928,6 +932,8 @@ pq_getbyte_if_available(unsigned char *c)
  {
         int                     r;
  
+       Assert(PqCommReadingMsg);
+
         if (PqRecvPointer < PqRecvLength)
         {
                 *c = PqRecvBuffer[PqRecvPointer++];
@@ -980,6 +986,8 @@ pq_getbytes(char *s, size_t len)
  {
         size_t          amount;
  
+       Assert(PqCommReadingMsg);
+
         while (len > 0)
         {
                 while (PqRecvPointer >= PqRecvLength)
@@ -1012,6 +1020,8 @@ pq_discardbytes(size_t len)
  {
         size_t          amount;
  
+       Assert(PqCommReadingMsg);
+
         while (len > 0)
         {
                 while (PqRecvPointer >= PqRecvLength)
@@ -1048,6 +1058,8 @@ pq_getstring(StringInfo s)
  {
         int                     i;
  
+       Assert(PqCommReadingMsg);
+
         resetStringInfo(s);
  
         /* Read until we get the terminating '\0' */
@@ -1079,6 +1091,58 @@ pq_getstring(StringInfo s)
  }
  
  
+/* --------------------------------
+ *             pq_startmsgread - begin reading a message from the client.
+ *
+ *             This must be called before any of the pq_get* functions.
+ * --------------------------------
+ */
+void
+pq_startmsgread(void)
+{
+       /*
+        * There shouldn't be a read active already, but let's check just to be
+        * sure.
+        */
+       if (PqCommReadingMsg)
+               ereport(FATAL,
+                               (errcode(ERRCODE_PROTOCOL_VIOLATION),
+                                errmsg("terminating connection because protocol sync was lost")));
+
+       PqCommReadingMsg = true;
+}
+
+
+/* --------------------------------
+ *             pq_endmsgread   - finish reading message.
+ *
+ *             This must be called after reading a V2 protocol message with
+ *             pq_getstring() and friends, to indicate that we have read the whole
+ *             message. In V3 protocol, pq_getmessage() does this implicitly.
+ * --------------------------------
+ */
+void
+pq_endmsgread(void)
+{
+       Assert(PqCommReadingMsg);
+
+       PqCommReadingMsg = false;
+}
+
+/* --------------------------------
+ *             pq_is_reading_msg - are we currently reading a message?
+ *
+ * This is used in error recovery at the outer idle loop to detect if we have
+ * lost protocol sync, and need to terminate the connection. pq_startmsgread()
+ * will check for that too, but it's nicer to detect it earlier.
+ * --------------------------------
+ */
+bool
+pq_is_reading_msg(void)
+{
+       return PqCommReadingMsg;
+}
+
  /* --------------------------------
   *             pq_getmessage   - get a message with length word from connection
   *
@@ -1100,6 +1164,8 @@ pq_getmessage(StringInfo s, int maxlen)
  {
         int32           len;
  
+       Assert(PqCommReadingMsg);
+
         resetStringInfo(s);
  
         /* Read message length word */
@@ -1141,6 +1207,9 @@ pq_getmessage(StringInfo s, int maxlen)
                                 ereport(COMMERROR,
                                                 (errcode(ERRCODE_PROTOCOL_VIOLATION),
                                                  errmsg("incomplete message from client")));
+
+                       /* we discarded the rest of the message so we're back in sync. */
+                       PqCommReadingMsg = false;
                         PG_RE_THROW();
                 }
                 PG_END_TRY();
@@ -1158,6 +1227,9 @@ pq_getmessage(StringInfo s, int maxlen)
                 s->data[len] = '\0';
         }
  
+       /* finished reading the message. */
+       PqCommReadingMsg = false;
+
         return 0;
  }
  
diff --git a/src/backend/postmaster/postmaster.c b/src/backend/postmaster/postmaster.c

index 4ef9f921aeb725f2e7ebb2e542c0c5804b94ed06..f05114d129b9a808ac07a90278b682c27b7e85fe 100644 (file)
--- a/src/backend/postmaster/postmaster.c
+++ b/src/backend/postmaster/postmaster.c
@@ -1764,6 +1764,7 @@ ProcessStartupPacket(Port *port, bool SSLdone)
         ProtocolVersion proto;
         MemoryContext oldcontext;
  
+       pq_startmsgread();
         if (pq_getbytes((char *) &len, 4) == EOF)
         {
                 /*
@@ -1808,6 +1809,7 @@ ProcessStartupPacket(Port *port, bool SSLdone)
                                  errmsg("incomplete startup packet")));
                 return STATUS_ERROR;
         }
+       pq_endmsgread();
  
         /*
          * The first field is either a protocol version number or a special
diff --git a/src/backend/replication/walsender.c b/src/backend/replication/walsender.c

index 5633922786d4052e3c9b941acb80b30c5e06c188..f593c529842d8ee42f47419548a3bf82d0592c9a 100644 (file)
--- a/src/backend/replication/walsender.c
+++ b/src/backend/replication/walsender.c
@@ -1352,6 +1352,7 @@ ProcessRepliesIfAny(void)
  
         for (;;)
         {
+               pq_startmsgread();
                 r = pq_getbyte_if_available(&firstchar);
                 if (r < 0)
                 {
@@ -1364,9 +1365,20 @@ ProcessRepliesIfAny(void)
                 if (r == 0)
                 {
                         /* no data available without blocking */
+                       pq_endmsgread();
                         break;
                 }
  
+               /* Read the message contents */
+               resetStringInfo(&reply_message);
+               if (pq_getmessage(&reply_message, 0))
+               {
+                       ereport(COMMERROR,
+                                       (errcode(ERRCODE_PROTOCOL_VIOLATION),
+                                        errmsg("unexpected EOF on standby connection")));
+                       proc_exit(0);
+               }
+
                 /*
                  * If we already received a CopyDone from the frontend, the frontend
                  * should not send us anything until we've closed our end of the COPY.
@@ -1402,16 +1414,6 @@ ProcessRepliesIfAny(void)
                                         streamingDoneSending = true;
                                 }
  
-                               /* consume the CopyData message */
-                               resetStringInfo(&reply_message);
-                               if (pq_getmessage(&reply_message, 0))
-                               {
-                                       ereport(COMMERROR,
-                                                       (errcode(ERRCODE_PROTOCOL_VIOLATION),
-                                                        errmsg("unexpected EOF on standby connection")));
-                                       proc_exit(0);
-                               }
-
                                 streamingDoneReceiving = true;
                                 received = true;
                                 break;
@@ -1448,19 +1450,6 @@ ProcessStandbyMessage(void)
  {
         char            msgtype;
  
-       resetStringInfo(&reply_message);
-
-       /*
-        * Read the message contents.
-        */
-       if (pq_getmessage(&reply_message, 0))
-       {
-               ereport(COMMERROR,
-                               (errcode(ERRCODE_PROTOCOL_VIOLATION),
-                                errmsg("unexpected EOF on standby connection")));
-               proc_exit(0);
-       }
-
         /*
          * Check message type from the first byte.
          */
diff --git a/src/backend/storage/lmgr/proc.c b/src/backend/storage/lmgr/proc.c

index 266b0daa94f48f5c3937d77f5537282067ce7664..0ca7911caee083c00631c7c45cfbb2611bf55840 100644 (file)
--- a/src/backend/storage/lmgr/proc.c
+++ b/src/backend/storage/lmgr/proc.c
@@ -668,11 +668,16 @@ LockErrorCleanup(void)
         LWLock     *partitionLock;
         DisableTimeoutParams timeouts[2];
  
+       HOLD_INTERRUPTS();
+
         AbortStrongLockAcquire();
  
         /* Nothing to do if we weren't waiting for a lock */
         if (lockAwaited == NULL)
+       {
+               RESUME_INTERRUPTS();
                 return;
+       }
  
         /*
          * Turn off the deadlock and lock timeout timers, if they are still
@@ -722,6 +727,8 @@ LockErrorCleanup(void)
          * wakeup signal isn't harmful, and it seems not worth expending cycles to
          * get rid of a signal that most likely isn't there.
          */
+
+       RESUME_INTERRUPTS();
  }
  
  
diff --git a/src/backend/tcop/fastpath.c b/src/backend/tcop/fastpath.c

index 9f50c5add583966ab4b9eef3e8e16aefb5a7703c..6614a12f1dd3a9d8182b4b54943c35aa58587b32 100644 (file)
--- a/src/backend/tcop/fastpath.c
+++ b/src/backend/tcop/fastpath.c
@@ -75,7 +75,7 @@ static int16 parse_fcall_arguments_20(StringInfo msgBuf, struct fp_info * fip,
   * The caller should already have initialized buf to empty.
   * ----------------
   */
-static int
+int
  GetOldFunctionMessage(StringInfo buf)
  {
         int32           ibuf;
@@ -280,33 +280,6 @@ HandleFunctionRequest(StringInfo msgBuf)
         bool            was_logged = false;
         char            msec_str[32];
  
-       /*
-        * Read message contents if not already done.
-        */
-       if (PG_PROTOCOL_MAJOR(FrontendProtocol) < 3)
-       {
-               if (GetOldFunctionMessage(msgBuf))
-               {
-                       if (IsTransactionState())
-                               ereport(COMMERROR,
-                                               (errcode(ERRCODE_CONNECTION_FAILURE),
-                                                errmsg("unexpected EOF on client connection with an open transaction")));
-                       else
-                       {
-                               /*
-                                * Can't send DEBUG log messages to client at this point.
-                                * Since we're disconnecting right away, we don't need to
-                                * restore whereToSendOutput.
-                                */
-                               whereToSendOutput = DestNone;
-                               ereport(DEBUG1,
-                                               (errcode(ERRCODE_CONNECTION_DOES_NOT_EXIST),
-                                                errmsg("unexpected EOF on client connection")));
-                       }
-                       return EOF;
-               }
-       }
-
         /*
          * Now that we've eaten the input message, check to see if we actually
          * want to do the function call or not.  It's now safe to ereport(); we
diff --git a/src/backend/tcop/postgres.c b/src/backend/tcop/postgres.c

index abd2f9200fe9793cc1703ed580d621f3f2dddfbb..bc4eb33deef6709f9417376a58619c51cea6f231 100644 (file)
--- a/src/backend/tcop/postgres.c
+++ b/src/backend/tcop/postgres.c
@@ -332,6 +332,8 @@ SocketBackend(StringInfo inBuf)
         /*
          * Get message type code from the frontend.
          */
+       HOLD_CANCEL_INTERRUPTS();
+       pq_startmsgread();
         qtype = pq_getbyte();
  
         if (qtype == EOF)                       /* frontend disconnected */
@@ -380,7 +382,7 @@ SocketBackend(StringInfo inBuf)
                                         {
                                                 /*
                                                  * Can't send DEBUG log messages to client at this
-                                                * point.Since we're disconnecting right away, we
+                                                * point. Since we're disconnecting right away, we
                                                  * don't need to restore whereToSendOutput.
                                                  */
                                                 whereToSendOutput = DestNone;
@@ -394,8 +396,30 @@ SocketBackend(StringInfo inBuf)
                         break;
  
                 case 'F':                               /* fastpath function call */
-                       /* we let fastpath.c cope with old-style input of this */
                         doing_extended_query_message = false;
+                       if (PG_PROTOCOL_MAJOR(FrontendProtocol) < 3)
+                       {
+                               if (GetOldFunctionMessage(inBuf))
+                               {
+                                       if (IsTransactionState())
+                                               ereport(COMMERROR,
+                                                               (errcode(ERRCODE_CONNECTION_FAILURE),
+                                                                errmsg("unexpected EOF on client connection with an open transaction")));
+                                       else
+                                       {
+                                               /*
+                                                * Can't send DEBUG log messages to client at this
+                                                * point. Since we're disconnecting right away, we
+                                                * don't need to restore whereToSendOutput.
+                                                */
+                                               whereToSendOutput = DestNone;
+                                               ereport(DEBUG1,
+                                                               (errcode(ERRCODE_CONNECTION_DOES_NOT_EXIST),
+                                                        errmsg("unexpected EOF on client connection")));
+                                       }
+                                       return EOF;
+                               }
+                       }
                         break;
  
                 case 'X':                               /* terminate */
@@ -463,6 +487,9 @@ SocketBackend(StringInfo inBuf)
                 if (pq_getmessage(inBuf, 0))
                         return EOF;                     /* suitable message already logged */
         }
+       else
+               pq_endmsgread();
+       RESUME_CANCEL_INTERRUPTS();
  
         return qtype;
  }
@@ -507,7 +534,7 @@ prepare_for_client_read(void)
                 EnableNotifyInterrupt();
                 EnableCatchupInterrupt();
  
-               /* Allow cancel/die interrupts to be processed while waiting */
+               /* Allow die interrupts to be processed while waiting */
                 ImmediateInterruptOK = true;
  
                 /* And don't forget to detect one that already arrived */
@@ -2590,21 +2617,11 @@ die(SIGNAL_ARGS)
                 ProcDiePending = true;
  
                 /*
-                * If it's safe to interrupt, and we're waiting for input or a lock,
-                * service the interrupt immediately
+                * If we're waiting for input or a lock so that it's safe to
+                * interrupt, service the interrupt immediately
                  */
-               if (ImmediateInterruptOK && InterruptHoldoffCount == 0 &&
-                       CritSectionCount == 0)
-               {
-                       /* bump holdoff count to make ProcessInterrupts() a no-op */
-                       /* until we are done getting ready for it */
-                       InterruptHoldoffCount++;
-                       LockErrorCleanup(); /* prevent CheckDeadLock from running */
-                       DisableNotifyInterrupt();
-                       DisableCatchupInterrupt();
-                       InterruptHoldoffCount--;
+               if (ImmediateInterruptOK)
                         ProcessInterrupts();
-               }
         }
  
         /* If we're still here, waken anything waiting on the process latch */
@@ -2632,21 +2649,11 @@ StatementCancelHandler(SIGNAL_ARGS)
                 QueryCancelPending = true;
  
                 /*
-                * If it's safe to interrupt, and we're waiting for input or a lock,
-                * service the interrupt immediately
+                * If we're waiting for input or a lock so that it's safe to
+                * interrupt, service the interrupt immediately
                  */
-               if (ImmediateInterruptOK && InterruptHoldoffCount == 0 &&
-                       CritSectionCount == 0)
-               {
-                       /* bump holdoff count to make ProcessInterrupts() a no-op */
-                       /* until we are done getting ready for it */
-                       InterruptHoldoffCount++;
-                       LockErrorCleanup(); /* prevent CheckDeadLock from running */
-                       DisableNotifyInterrupt();
-                       DisableCatchupInterrupt();
-                       InterruptHoldoffCount--;
+               if (ImmediateInterruptOK)
                         ProcessInterrupts();
-               }
         }
  
         /* If we're still here, waken anything waiting on the process latch */
@@ -2791,21 +2798,11 @@ RecoveryConflictInterrupt(ProcSignalReason reason)
                         RecoveryConflictRetryable = false;
  
                 /*
-                * If it's safe to interrupt, and we're waiting for input or a lock,
-                * service the interrupt immediately
+                * If we're waiting for input or a lock so that it's safe to
+                * interrupt, service the interrupt immediately.
                  */
-               if (ImmediateInterruptOK && InterruptHoldoffCount == 0 &&
-                       CritSectionCount == 0)
-               {
-                       /* bump holdoff count to make ProcessInterrupts() a no-op */
-                       /* until we are done getting ready for it */
-                       InterruptHoldoffCount++;
-                       LockErrorCleanup(); /* prevent CheckDeadLock from running */
-                       DisableNotifyInterrupt();
-                       DisableCatchupInterrupt();
-                       InterruptHoldoffCount--;
+               if (ImmediateInterruptOK)
                         ProcessInterrupts();
-               }
         }
  
         /*
@@ -2831,15 +2828,17 @@ RecoveryConflictInterrupt(ProcSignalReason reason)
  void
  ProcessInterrupts(void)
  {
-       /* OK to accept interrupt now? */
+       /* OK to accept any interrupts now? */
         if (InterruptHoldoffCount != 0 || CritSectionCount != 0)
                 return;
         InterruptPending = false;
+
         if (ProcDiePending)
         {
                 ProcDiePending = false;
                 QueryCancelPending = false;             /* ProcDie trumps QueryCancel */
                 ImmediateInterruptOK = false;   /* not idle anymore */
+               LockErrorCleanup();
                 DisableNotifyInterrupt();
                 DisableCatchupInterrupt();
                 /* As in quickdie, don't risk sending to client during auth */
@@ -2876,6 +2875,7 @@ ProcessInterrupts(void)
         {
                 QueryCancelPending = false;             /* lost connection trumps QueryCancel */
                 ImmediateInterruptOK = false;   /* not idle anymore */
+               LockErrorCleanup();
                 DisableNotifyInterrupt();
                 DisableCatchupInterrupt();
                 /* don't send to client, we already know the connection to be dead. */
@@ -2884,12 +2884,53 @@ ProcessInterrupts(void)
                                 (errcode(ERRCODE_CONNECTION_FAILURE),
                                  errmsg("connection to client lost")));
         }
+
+       /*
+        * If a recovery conflict happens while we are waiting for input from the
+        * client, the client is presumably just sitting idle in a transaction,
+        * preventing recovery from making progress.  Terminate the connection to
+        * dislodge it.
+        */
+       if (RecoveryConflictPending && DoingCommandRead)
+       {
+               QueryCancelPending = false;                     /* this trumps QueryCancel */
+               ImmediateInterruptOK = false;           /* not idle anymore */
+               RecoveryConflictPending = false;
+               LockErrorCleanup();
+               DisableNotifyInterrupt();
+               DisableCatchupInterrupt();
+               pgstat_report_recovery_conflict(RecoveryConflictReason);
+               ereport(FATAL,
+                               (errcode(ERRCODE_T_R_SERIALIZATION_FAILURE),
+                                errmsg("terminating connection due to conflict with recovery"),
+                                errdetail_recovery_conflict(),
+                                errhint("In a moment you should be able to reconnect to the"
+                                                " database and repeat your command.")));
+       }
+
         if (QueryCancelPending)
         {
+               /*
+                * Don't allow query cancel interrupts while reading input from the
+                * client, because we might lose sync in the FE/BE protocol.  (Die
+                * interrupts are OK, because we won't read any further messages from
+                * the client in that case.)
+                */
+               if (QueryCancelHoldoffCount != 0)
+               {
+                       /*
+                        * Re-arm InterruptPending so that we process the cancel request
+                        * as soon as we're done reading the message.
+                        */
+                       InterruptPending = true;
+                       return;
+               }
+
                 QueryCancelPending = false;
                 if (ClientAuthInProgress)
                 {
                         ImmediateInterruptOK = false;           /* not idle anymore */
+                       LockErrorCleanup();
                         DisableNotifyInterrupt();
                         DisableCatchupInterrupt();
                         /* As in quickdie, don't risk sending to client during auth */
@@ -2908,6 +2949,7 @@ ProcessInterrupts(void)
                 {
                         ImmediateInterruptOK = false;           /* not idle anymore */
                         (void) get_timeout_indicator(STATEMENT_TIMEOUT, true);
+                       LockErrorCleanup();
                         DisableNotifyInterrupt();
                         DisableCatchupInterrupt();
                         ereport(ERROR,
@@ -2917,6 +2959,7 @@ ProcessInterrupts(void)
                 if (get_timeout_indicator(STATEMENT_TIMEOUT, true))
                 {
                         ImmediateInterruptOK = false;           /* not idle anymore */
+                       LockErrorCleanup();
                         DisableNotifyInterrupt();
                         DisableCatchupInterrupt();
                         ereport(ERROR,
@@ -2926,6 +2969,7 @@ ProcessInterrupts(void)
                 if (IsAutoVacuumWorkerProcess())
                 {
                         ImmediateInterruptOK = false;           /* not idle anymore */
+                       LockErrorCleanup();
                         DisableNotifyInterrupt();
                         DisableCatchupInterrupt();
                         ereport(ERROR,
@@ -2936,21 +2980,14 @@ ProcessInterrupts(void)
                 {
                         ImmediateInterruptOK = false;           /* not idle anymore */
                         RecoveryConflictPending = false;
+                       LockErrorCleanup();
                         DisableNotifyInterrupt();
                         DisableCatchupInterrupt();
                         pgstat_report_recovery_conflict(RecoveryConflictReason);
-                       if (DoingCommandRead)
-                               ereport(FATAL,
-                                               (errcode(ERRCODE_T_R_SERIALIZATION_FAILURE),
-                                                errmsg("terminating connection due to conflict with recovery"),
-                                                errdetail_recovery_conflict(),
-                                errhint("In a moment you should be able to reconnect to the"
-                                                " database and repeat your command.")));
-                       else
-                               ereport(ERROR,
-                                               (errcode(ERRCODE_T_R_SERIALIZATION_FAILURE),
+                       ereport(ERROR,
+                                       (errcode(ERRCODE_T_R_SERIALIZATION_FAILURE),
                                  errmsg("canceling statement due to conflict with recovery"),
-                                                errdetail_recovery_conflict()));
+                                        errdetail_recovery_conflict()));
                 }
  
                 /*
@@ -2961,6 +2998,7 @@ ProcessInterrupts(void)
                 if (!DoingCommandRead)
                 {
                         ImmediateInterruptOK = false;           /* not idle anymore */
+                       LockErrorCleanup();
                         DisableNotifyInterrupt();
                         DisableCatchupInterrupt();
                         ereport(ERROR,
@@ -3894,6 +3932,19 @@ PostgresMain(int argc, char *argv[],
                 /* We don't have a transaction command open anymore */
                 xact_started = false;
  
+               /*
+                * If an error occurred while we were reading a message from the
+                * client, we have potentially lost track of where the previous
+                * message ends and the next one begins.  Even though we have
+                * otherwise recovered from the error, we cannot safely read any more
+                * messages from the client, so there isn't much we can do with the
+                * connection anymore.
+                */
+               if (pq_is_reading_msg())
+                       ereport(FATAL,
+                                       (errcode(ERRCODE_PROTOCOL_VIOLATION),
+                                        errmsg("terminating connection because protocol sync was lost")));
+
                 /* Now we can allow interrupts again */
                 RESUME_INTERRUPTS();
         }
@@ -3978,7 +4029,14 @@ PostgresMain(int argc, char *argv[],
  
                 /*
                  * (4) disable async signal conditions again.
+                *
+                * Query cancel is supposed to be a no-op when there is no query in
+                * progress, so if a query cancel arrived while we were idle, just
+                * reset QueryCancelPending. ProcessInterrupts() has that effect when
+                * it's called when DoingCommandRead is set, so check for interrupts
+                * before resetting DoingCommandRead.
                  */
+               CHECK_FOR_INTERRUPTS();
                 DoingCommandRead = false;
  
                 /*
diff --git a/src/backend/utils/error/elog.c b/src/backend/utils/error/elog.c

index 7e82ea34f2ad7c8017321c7bbaa2c052576fc6bc..de46945e6854773c8918bbb1084cc50b52d9e5e5 100644 (file)
--- a/src/backend/utils/error/elog.c
+++ b/src/backend/utils/error/elog.c
@@ -469,6 +469,7 @@ errfinish(int dummy,...)
                  * while doing error cleanup.
                  */
                 InterruptHoldoffCount = 0;
+               QueryCancelHoldoffCount = 0;
  
                 CritSectionCount = 0;   /* should be unnecessary, but... */
  
diff --git a/src/backend/utils/init/globals.c b/src/backend/utils/init/globals.c

index be748357720c7ee9479e9cbda99b2692b835811b..342105f0174b233913fec161cfa1014c18fcc88a 100644 (file)
--- a/src/backend/utils/init/globals.c
+++ b/src/backend/utils/init/globals.c
@@ -32,6 +32,7 @@ volatile bool ProcDiePending = false;
  volatile bool ClientConnectionLost = false;
  volatile bool ImmediateInterruptOK = false;
  volatile uint32 InterruptHoldoffCount = 0;
+volatile uint32 QueryCancelHoldoffCount = 0;
  volatile uint32 CritSectionCount = 0;
  
  int                    MyProcPid;
diff --git a/src/include/libpq/libpq.h b/src/include/libpq/libpq.h

index e4e354dafa05a6ddf50e81eff26a91ddd1bf577c..9d216facaee7394b981641bd287a35667531bb15 100644 (file)
--- a/src/include/libpq/libpq.h
+++ b/src/include/libpq/libpq.h
@@ -54,6 +54,9 @@ extern void pq_init(void);
  extern void pq_comm_reset(void);
  extern int     pq_getbytes(char *s, size_t len);
  extern int     pq_getstring(StringInfo s);
+extern void pq_startmsgread(void);
+extern void pq_endmsgread(void);
+extern bool pq_is_reading_msg(void);
  extern int     pq_getmessage(StringInfo s, int maxlen);
  extern int     pq_getbyte(void);
  extern int     pq_peekbyte(void);
diff --git a/src/include/miscadmin.h b/src/include/miscadmin.h

index c2b786e666eb22afa25b423ba83bb80e0d12e453..d3b5022a841116ce0a0ba11e6c8d776f328719ae 100644 (file)
--- a/src/include/miscadmin.h
+++ b/src/include/miscadmin.h
@@ -52,6 +52,10 @@
   * will be held off until CHECK_FOR_INTERRUPTS() is done outside any
   * HOLD_INTERRUPTS() ... RESUME_INTERRUPTS() section.
   *
+ * There is also a mechanism to prevent query cancel interrupts, while still
+ * allowing die interrupts: HOLD_CANCEL_INTERRUPTS() and
+ * RESUME_CANCEL_INTERRUPTS().
+ *
   * Special mechanisms are used to let an interrupt be accepted when we are
   * waiting for a lock or when we are waiting for command input (but, of
   * course, only if the interrupt holdoff counter is zero).  See the
@@ -82,6 +86,7 @@ extern volatile bool ClientConnectionLost;
  /* these are marked volatile because they are examined by signal handlers: */
  extern PGDLLIMPORT volatile bool ImmediateInterruptOK;
  extern PGDLLIMPORT volatile uint32 InterruptHoldoffCount;
+extern PGDLLIMPORT volatile uint32 QueryCancelHoldoffCount;
  extern PGDLLIMPORT volatile uint32 CritSectionCount;
  
  /* in tcop/postgres.c */
@@ -114,6 +119,14 @@ do { \
         InterruptHoldoffCount--; \
  } while(0)
  
+#define HOLD_CANCEL_INTERRUPTS()  (QueryCancelHoldoffCount++)
+
+#define RESUME_CANCEL_INTERRUPTS() \
+do { \
+       Assert(QueryCancelHoldoffCount > 0); \
+       QueryCancelHoldoffCount--; \
+} while(0)
+
  #define START_CRIT_SECTION()  (CritSectionCount++)
  
  #define END_CRIT_SECTION() \
diff --git a/src/include/tcop/fastpath.h b/src/include/tcop/fastpath.h

index fdbc937e2fdb5c94c471253f9c9b339bd7cef2ef..c03a35fc0aea02e1855dd6fb91fdf2a9cc9d773d 100644 (file)
--- a/src/include/tcop/fastpath.h
+++ b/src/include/tcop/fastpath.h
@@ -15,6 +15,7 @@
  
  #include "lib/stringinfo.h"
  
+extern int GetOldFunctionMessage(StringInfo buf);
  extern int     HandleFunctionRequest(StringInfo msgBuf);
  
  #endif   /* FASTPATH_H */
author	Heikki Linnakangas <heikki.linnakangas@iki.fi>
	Mon, 2 Feb 2015 15:08:56 +0000 (17:08 +0200)
committer	Heikki Linnakangas <heikki.linnakangas@iki.fi>
	Mon, 2 Feb 2015 15:09:46 +0000 (17:09 +0200)
src/backend/commands/copy.c		patch \| blob \| history
src/backend/libpq/auth.c		patch \| blob \| history
src/backend/libpq/pqcomm.c		patch \| blob \| history
src/backend/postmaster/postmaster.c		patch \| blob \| history
src/backend/replication/walsender.c		patch \| blob \| history
src/backend/storage/lmgr/proc.c		patch \| blob \| history
src/backend/tcop/fastpath.c		patch \| blob \| history
src/backend/tcop/postgres.c		patch \| blob \| history
src/backend/utils/error/elog.c		patch \| blob \| history
src/backend/utils/init/globals.c		patch \| blob \| history
src/include/libpq/libpq.h		patch \| blob \| history
src/include/miscadmin.h		patch \| blob \| history
src/include/tcop/fastpath.h		patch \| blob \| history