summary | refs | log | tree | commit | diff
path: root/jstests
diff options
context:
space:
mode:
author Samy Lanka <samy.lanka@mongodb.com> 2019-06-11 15:51:38 -0400
committer Samy Lanka <samy.lanka@mongodb.com> 2019-06-21 15:23:50 -0400
commit ee746fb1672655b1cf6a1efff2b3f48ed8551e20 (patch)
tree 60ab2058b759c2e3d8ea74c8ae80c847ae36051f /jstests
parent 451d98685a3275b4cfd53164cf323155cbb3260a (diff)
download mongo-ee746fb1672655b1cf6a1efff2b3f48ed8551e20.tar.gz
SERVER-41250 Reset the oldest timestamp if initial sync fails and starts another attempt
Diffstat (limited to 'jstests')
-rw-r--r-- jstests/replsets/initial_sync_reset_oldest_timestamp_after_failed_attempt.js 100
1 files changed, 100 insertions, 0 deletions
diff --git a/jstests/replsets/initial_sync_reset_oldest_timestamp_after_failed_attempt.js b/jstests/replsets/initial_sync_reset_oldest_timestamp_after_failed_attempt.js
new file mode 100644
index 00000000000..d589c6320bc
--- /dev/null
+++ b/jstests/replsets/initial_sync_reset_oldest_timestamp_after_failed_attempt.js
@@ -0,0 +1,100 @@
+/**
+ * Tests that initial sync resets the oldest timestamp after a failed attempt. The test will turn on
+ * a failpoint that causes initial sync to fail partway through its first attempt and makes sure it
+ * does not hit a WiredTiger assertion on the second attempt.
+ *
+ * @tags: [uses_transactions, uses_prepare_transaction]
+ */
+
+(function() {
+ "use strict";
+
+ load("jstests/libs/check_log.js");
+ load("jstests/core/txns/libs/prepare_helpers.js");
+
+ // Cap initial sync at 2 attempts (planned failure + retry) so that unplanned failures fail the test.
+ const replTest =
+ new ReplSetTest({nodes: 2, nodeOptions: {setParameter: "numInitialSyncAttempts=2"}});
+ replTest.startSet();
+
+ // Increase the election timeout to 24 hours so that we do not accidentally trigger an election
+ // while the secondary is restarting.
+ replTest.initiateWithHighElectionTimeout();
+
+ const primary = replTest.getPrimary();
+ let secondary = replTest.getSecondary();
+
+ const dbName = "test";
+ const collName = "initial_sync_reset_oldest_timestamp_after_failed_attempt";
+ const testDB = primary.getDB(dbName);
+ const testColl = testDB.getCollection(collName);
+
+ assert.commandWorked(testColl.insert({_id: 1}));
+
+ const session = primary.startSession();
+ const sessionDB = session.getDatabase(dbName);
+ const sessionColl = sessionDB.getCollection(collName);
+ session.startTransaction();
+ assert.commandWorked(sessionColl.insert({_id: 2}));
+
+ // This will be the begin fetching point for both initial sync attempts. After the first initial
+ // sync attempt fails, if the oldest timestamp isn't reset before the next attempt, the update
+ // to the transaction table for this prepare will fail a WiredTiger assertion that the commit
+ // timestamp for a storage transaction cannot be older than the oldest timestamp.
+ const prepareTimestamp = PrepareHelpers.prepareTransaction(session);
+
+ jsTestLog("Prepared a transaction at timestamp: " + prepareTimestamp);
+
+ replTest.stop(secondary, undefined, {skipValidation: true});
+ secondary = replTest.start(
+ secondary,
+ {
+ startClean: true,
+ setParameter: {
+ // Set the number of operations per batch to be 1 so that we can know exactly how
+ // many batches there will be.
+ "replBatchLimitOperations": 1,
+ "failpoint.initialSyncHangAfterDataCloning": tojson({mode: "alwaysOn"}),
+ // Skip the failpoint for the first two batches so that the syncing node writes the
+ // prepare oplog entry and applies the first update before initial sync fails.
+ "failpoint.failInitialSyncBeforeApplyingBatch": tojson({mode: {skip: 2}}),
+ }
+ },
+ true /* wait */);
+
+ // Wait for the log line showing that initial sync is paused at initialSyncHangAfterDataCloning.
+ checkLog.contains(secondary, "initialSyncHangAfterDataCloning fail point enabled");
+
+ jsTestLog("Running operations while collection cloning is paused");
+
+ // This command will be in the last batch applied before the first initial sync attempt fails.
+ // If the oldest timestamp isn't reset on the next attempt, then the timestamp for this update
+ // will be the oldest timestamp.
+ assert.commandWorked(testColl.update({_id: 1}, {_id: 1, a: 1}));
+
+ // This entry will be applied in its own batch, so the failInitialSyncBeforeApplyingBatch
+ // failpoint will cause the first initial sync attempt to fail before applying this.
+ assert.commandWorked(testColl.update({_id: 1}, {_id: 1, b: 2}));
+
+ jsTestLog("Resuming initial sync");
+
+ assert.commandWorked(secondary.adminCommand(
+ {configureFailPoint: "initialSyncHangAfterDataCloning", mode: "off"}));
+
+ // Wait for failInitialSyncBeforeApplyingBatch to be hit before turning it off to fail initial sync.
+ checkLog.contains(secondary, "failInitialSyncBeforeApplyingBatch fail point enabled");
+
+ jsTestLog("Failing first initial sync attempt");
+
+ // Turning the failpoint off is what causes the first initial sync attempt to fail.
+ assert.commandWorked(secondary.adminCommand(
+ {configureFailPoint: "failInitialSyncBeforeApplyingBatch", mode: "off"}));
+
+ replTest.waitForState(secondary, ReplSetTest.State.SECONDARY);  // the retry attempt must succeed
+
+ jsTestLog("Initial sync completed");
+
+ assert.commandWorked(session.abortTransaction_forTesting());
+
+ replTest.stopSet();
+})(); \ No newline at end of file