int nmsgs = 0;
SharedInvalidationMessage *invalMessages = NULL;
bool RelcacheInitFileInval = false;
+ bool wrote_xlog = XactLastRecEnd.xrecoff != 0;
/* Get data needed for commit record */
nrels = smgrGetPendingDeletes(true, &rels, &haveNonTemp);
/*
* If we didn't create XLOG entries, we're done here; otherwise we
- * should flush those entries the same as a commit record. (An
- * example of a possible record that wouldn't cause an XID to be
- * assigned is a sequence advance record due to nextval() --- we want
- * to flush that to disk before reporting commit.)
+ * should trigger flushing those entries the same as a commit record
+ * would. This will primarily happen for HOT pruning and the like; we
+ * want these to be flushed to disk in due time.
*/
- if (XactLastRecEnd.xrecoff == 0)
+ if (!wrote_xlog)
goto cleanup;
}
else
}
/*
- * Check if we want to commit asynchronously. If the user has set
- * synchronous_commit = off, and we're not doing cleanup of any non-temp
- * rels nor committing any command that wanted to force sync commit, then
- * we can defer flushing XLOG. (We must not allow asynchronous commit if
- * there are any non-temp tables to be deleted, because we might delete
- * the files before the COMMIT record is flushed to disk. We do allow
- * asynchronous commit if all to-be-deleted tables are temporary though,
- * since they are lost anyway if we crash.)
+ * Check if we want to commit asynchronously. We can allow the XLOG flush
+ * to happen asynchronously if synchronous_commit=off, or if the current
+ * transaction has not performed any WAL-logged operation or didn't assign
+ * a xid. The transaction can end up not writing any WAL, even if it has
+ * a xid, if it only wrote to temporary tables. It can end up having
+ * written WAL without an xid if it did HOT pruning. In case of a crash,
+ * the loss of such a transaction will be irrelevant; temp tables will be
+ * lost anyway and HOT pruning will be done again later. (Given the
+ * foregoing, you might think that it would be unnecessary to emit the
+ * XLOG record at all in this case, but we don't currently try to do that.
+ * It would certainly cause problems at least in Hot Standby mode, where
+ * the KnownAssignedXids machinery requires tracking every XID assignment.
+ * It might be OK to skip it only when wal_level < hot_standby, but for
+ * now we don't.)
+ *
+ * However, if we're doing cleanup of any non-temp rels or committing any
+ * command that wanted to force sync commit, then we must flush XLOG
+ * immediately. (We must not allow asynchronous commit if there are any
+ * non-temp tables to be deleted, because we might delete the files before
+ * the COMMIT record is flushed to disk. We do allow asynchronous commit
+ * if all to-be-deleted tables are temporary though, since they are lost
+ * anyway if we crash.)
*/
- if (XactSyncCommit || forceSyncCommit || haveNonTemp)
+ if ((wrote_xlog && markXidCommitted && XactSyncCommit)
+ || forceSyncCommit || haveNonTemp)
{
/*
* Synchronous commit case:
*/
LockBuffer(buf, BUFFER_LOCK_EXCLUSIVE);
+ /* check the comment above nextval_internal()'s equivalent call. */
+ if (!rel->rd_istemp)
+ GetTopTransactionId();
+
START_CRIT_SECTION();
{
/* Note that we do not change the currval() state */
elm->cached = elm->last;
+ /* check the comment above nextval_internal()'s equivalent call. */
+ if (!seqrel->rd_istemp)
+ GetTopTransactionId();
+
/* Now okay to update the on-disk tuple */
START_CRIT_SECTION();
last_used_seq = elm;
+ /*
+ * If something needs to be WAL logged, acquire an xid, so this
+ * transaction's commit will trigger a WAL flush and wait for
+ * syncrep. It's sufficient to ensure the toplevel transaction has a xid,
+ * no need to assign xids subxacts, that'll already trigger a appropriate
+ * wait. (Have to do that here, so we're outside the critical section)
+ */
+ if (logit && !seqrel->rd_istemp)
+ GetTopTransactionId();
+
/* ready to change the on-disk (or really, in-buffer) tuple */
START_CRIT_SECTION();
/* In any case, forget any future cached numbers */
elm->cached = elm->last;
+ /* check the comment above nextval_internal()'s equivalent call. */
+ if (!seqrel->rd_istemp)
+ GetTopTransactionId();
+
/* ready to change the on-disk (or really, in-buffer) tuple */
START_CRIT_SECTION();