]> granicus.if.org Git - postgresql/commitdiff
Reduce spurious Hot Standby conflicts from never-visible records.
authorSimon Riggs <simon@2ndQuadrant.com>
Thu, 9 Dec 2010 09:41:47 +0000 (09:41 +0000)
committerSimon Riggs <simon@2ndQuadrant.com>
Thu, 9 Dec 2010 09:41:47 +0000 (09:41 +0000)
Hot Standby conflicts only with tuples that were visible at
some point. So ignore tuples from aborted transactions or for
tuples updated/deleted during the inserting transaction when
generating the conflict transaction ids.

Following detailed analysis and test case by Noah Misch.
Original report covered btree delete records, correctly observed
by Heikki Linnakangas that this applies to other cases also.
Fix covers all sources of cleanup records via common code.

src/backend/access/heap/heapam.c
src/backend/access/heap/pruneheap.c
src/backend/access/nbtree/nbtxlog.c

index 8b064bcff2428d2d7ae0b2544a1f1c04e2ac03de..cfbbc6301e3daba23bd885373c7f7af214369d6e 100644 (file)
@@ -3776,8 +3776,11 @@ heap_restrpos(HeapScanDesc scan)
 }
 
 /*
- * If 'tuple' contains any XID greater than latestRemovedXid, update
- * latestRemovedXid to the greatest one found.
+ * If 'tuple' contains any visible XID greater than latestRemovedXid,
+ * ratchet forwards latestRemovedXid to the greatest one found.
+ * This is used as the basis for generating Hot Standby conflicts, so
+ * if a tuple was never visible then removing it should not conflict
+ * with queries.
  */
 void
 HeapTupleHeaderAdvanceLatestRemovedXid(HeapTupleHeader tuple,
@@ -3793,13 +3796,27 @@ HeapTupleHeaderAdvanceLatestRemovedXid(HeapTupleHeader tuple,
                        *latestRemovedXid = xvac;
        }
 
-       if (TransactionIdPrecedes(*latestRemovedXid, xmax))
-               *latestRemovedXid = xmax;
-
-       if (TransactionIdPrecedes(*latestRemovedXid, xmin))
-               *latestRemovedXid = xmin;
+       /*
+        * Ignore tuples inserted by an aborted transaction or
+        * if the tuple was updated/deleted by the inserting transaction.
+        *
+        * Look for a committed hint bit, or if no xmin bit is set, check clog.
+        * This needs to work on both master and standby, where it is used
+        * to assess btree delete records.
+        */
+       if ((tuple->t_infomask & HEAP_XMIN_COMMITTED) ||
+               (!(tuple->t_infomask & HEAP_XMIN_COMMITTED) &&
+                !(tuple->t_infomask & HEAP_XMIN_INVALID) &&
+                TransactionIdDidCommit(xmin)))
+       {
+               if (TransactionIdFollows(xmax, xmin))
+               {
+                       if (TransactionIdFollows(xmax, *latestRemovedXid))
+                               *latestRemovedXid = xmax;
+               }
+       }
 
-       Assert(TransactionIdIsValid(*latestRemovedXid));
+       /* *latestRemovedXid may still be invalid at end */
 }
 
 /*
index b8c4027a9e7d3d5e11a6c17850596603ffeffd9c..ee5f38fccd65abb68e192f605201f145e77cb537 100644 (file)
@@ -237,7 +237,6 @@ heap_page_prune(Relation relation, Buffer buffer, TransactionId OldestXmin,
                {
                        XLogRecPtr      recptr;
 
-                       Assert(TransactionIdIsValid(prstate.latestRemovedXid));
                        recptr = log_heap_clean(relation, buffer,
                                                                        prstate.redirected, prstate.nredirected,
                                                                        prstate.nowdead, prstate.ndead,
index 0822f5cb11026f4c68418993f82224a9fd270b2e..e1221709b1484143af16110bcc0e318d2b197c13 100644 (file)
@@ -580,7 +580,6 @@ btree_xlog_delete_get_latestRemovedXid(XLogRecord *record)
        BlockNumber hblkno;
        OffsetNumber hoffnum;
        TransactionId latestRemovedXid = InvalidTransactionId;
-       TransactionId htupxid = InvalidTransactionId;
        int                     i;
 
        /*
@@ -646,24 +645,16 @@ btree_xlog_delete_get_latestRemovedXid(XLogRecord *record)
                }
 
                /*
-                * If the heap item has storage, then read the header. Some LP_DEAD
-                * items may not be accessible, so we ignore them.
+                * If the heap item has storage, then read the header and use that to
+                * set latestRemovedXid.
+                *
+                * Some LP_DEAD items may not be accessible, so we ignore them.
                 */
                if (ItemIdHasStorage(hitemid))
                {
                        htuphdr = (HeapTupleHeader) PageGetItem(hpage, hitemid);
 
-                       /*
-                        * Get the heap tuple's xmin/xmax and ratchet up the
-                        * latestRemovedXid. No need to consider xvac values here.
-                        */
-                       htupxid = HeapTupleHeaderGetXmin(htuphdr);
-                       if (TransactionIdFollows(htupxid, latestRemovedXid))
-                               latestRemovedXid = htupxid;
-
-                       htupxid = HeapTupleHeaderGetXmax(htuphdr);
-                       if (TransactionIdFollows(htupxid, latestRemovedXid))
-                               latestRemovedXid = htupxid;
+                       HeapTupleHeaderAdvanceLatestRemovedXid(htuphdr, &latestRemovedXid);
                }
                else if (ItemIdIsDead(hitemid))
                {