summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorEric Milkie <milkie@10gen.com>2016-04-07 09:51:28 -0400
committerEric Milkie <milkie@10gen.com>2016-04-14 13:20:34 -0400
commitc558a396d221ee5c13278ca76667cca5adf8bdf5 (patch)
tree62afab0b42ed7751e8fb24ae037f31c1d1ab30de
parent7ee4e4e493c3785fea489ee3508ca18526709c16 (diff)
downloadmongo-c558a396d221ee5c13278ca76667cca5adf8bdf5.tar.gz
SERVER-23351 test read committed snapshots after a rollback occurs
(cherry picked from commit 0c3430437bc84b1d1f02ab78f1303732e84fe0c4)
-rw-r--r--jstests/replsets/read_committed_after_rollback.js156
1 files changed, 156 insertions, 0 deletions
diff --git a/jstests/replsets/read_committed_after_rollback.js b/jstests/replsets/read_committed_after_rollback.js
new file mode 100644
index 00000000000..68ba334ac9c
--- /dev/null
+++ b/jstests/replsets/read_committed_after_rollback.js
@@ -0,0 +1,156 @@
+/**
+ *
+ * Test read committed functionality following a following a rollback. Currently we require that all
+ * snapshots be dropped during rollback, therefore committed reads will block until a new committed
+ * snapshot is available.
+ */
+
+load("jstests/replsets/rslib.js"); // For startSetIfSupportsReadMajority.
+
+(function() {
+ "use strict";
+
+ function assertCommittedReadsBlock(coll) {
+ var res =
+ coll.runCommand('find', {"readConcern": {"level": "majority"}, "maxTimeMS": 3000});
+ assert.commandFailedWithCode(
+ res,
+ ErrorCodes.ExceededTimeLimit,
+ "Expected read of " + coll.getFullName() + ' on ' + coll.getMongo().host + " to block");
+ }
+
+ function doCommittedRead(coll) {
+ var res =
+ coll.runCommand('find', {"readConcern": {"level": "majority"}, "maxTimeMS": 10000});
+ assert.commandWorked(res,
+ 'reading from ' + coll.getFullName() + ' on ' + coll.getMongo().host);
+ return new DBCommandCursor(coll.getMongo(), res).toArray()[0].state;
+ }
+
+ function doDirtyRead(coll) {
+ var res = coll.runCommand('find', {"readConcern": {"level": "local"}});
+ assert.commandWorked(res,
+ 'reading from ' + coll.getFullName() + ' on ' + coll.getMongo().host);
+ return new DBCommandCursor(coll.getMongo(), res).toArray()[0].state;
+ }
+
+ // Set up a set and grab things for later.
+ var name = "read_committed_after_rollback";
+ var replTest = new ReplSetTest(
+ {name: name, nodes: 5, useBridge: true, nodeOptions: {enableMajorityReadConcern: ''}});
+
+ try {
+ replTest.startSet();
+ } catch (e) {
+ var conn = MongoRunner.runMongod();
+ if (!conn.getDB('admin').serverStatus().storageEngine.supportsCommittedReads) {
+ jsTest.log("skipping test since storage engine doesn't support committed reads");
+ MongoRunner.stopMongod(conn);
+ return;
+ }
+ throw e;
+ }
+
+ var nodes = replTest.nodeList();
+ var config = {
+ "_id": name,
+ "members": [
+ {"_id": 0, "host": nodes[0]},
+ {"_id": 1, "host": nodes[1]},
+ {"_id": 2, "host": nodes[2], priority: 0},
+ // Note: using two arbiters to ensure that a host that can't talk to any other
+ // data-bearing node can still be elected. This also means that a write isn't considered
+ // committed until it is on all 3 data-bearing nodes, not just 2.
+ {"_id": 3, "host": nodes[3], arbiterOnly: true},
+ {"_id": 4, "host": nodes[4], arbiterOnly: true},
+ ]
+ };
+ replTest.initiate(config);
+
+ // Get connections.
+ var oldPrimary = replTest.getPrimary();
+ var newPrimary = replTest.liveNodes.slaves[0];
+ var pureSecondary = replTest.liveNodes.slaves[1];
+ var arbiters = [replTest.nodes[3], replTest.nodes[4]];
+
+ // This is the collection that all of the tests will use.
+ var collName = name + '.collection';
+ var oldPrimaryColl = oldPrimary.getCollection(collName);
+ var newPrimaryColl = newPrimary.getCollection(collName);
+
+ // Set up initial state.
+ assert.writeOK(oldPrimaryColl.insert({_id: 1, state: 'old'},
+ {writeConcern: {w: 'majority', wtimeout: 30000}}));
+ assert.eq(doDirtyRead(oldPrimaryColl), 'old');
+ assert.eq(doCommittedRead(oldPrimaryColl), 'old');
+ assert.eq(doDirtyRead(newPrimaryColl), 'old');
+ // Note that we can't necessarily do a committed read from newPrimaryColl and get 'old', since
+ // delivery of the commit level to secondaries isn't synchronized with anything
+ // (we would have to hammer to reliably prove that it eventually would work).
+
+ // Partition the world such that oldPrimary is still primary but can't replicate to anyone.
+ // newPrimary is disconnected from the arbiters first to ensure that it can't be elected.
+ newPrimary.disconnect(arbiters);
+ oldPrimary.disconnect([newPrimary, pureSecondary]);
+ assert.eq(doDirtyRead(newPrimaryColl), 'old');
+
+ // This write will only make it to oldPrimary and will never become committed.
+ assert.writeOK(oldPrimaryColl.save({_id: 1, state: 'INVALID'}));
+ assert.eq(doDirtyRead(oldPrimaryColl), 'INVALID');
+ assert.eq(doCommittedRead(oldPrimaryColl), 'old');
+
+ // Change the partitioning so that oldPrimary is isolated, and newPrimary can be elected.
+ oldPrimary.setSlaveOk();
+ oldPrimary.disconnect(arbiters);
+ newPrimary.reconnect(arbiters);
+ assert.soon(() => newPrimary.adminCommand('isMaster').ismaster, '', 60 * 1000);
+ assert.soon(function() {
+ try {
+ return !oldPrimary.adminCommand('isMaster').ismaster;
+ } catch (e) {
+ return false; // ignore disconnect errors.
+ }
+ });
+
+ // Stop applier on pureSecondary to ensure that writes to newPrimary won't become committed yet.
+ assert.commandWorked(
+ pureSecondary.adminCommand({configureFailPoint: "rsSyncApplyStop", mode: "alwaysOn"}));
+ assert.writeOK(newPrimaryColl.save({_id: 1, state: 'new'}));
+ assert.eq(doDirtyRead(newPrimaryColl), 'new');
+ // Note that we still can't do a committed read from the new primary and reliably get anything,
+ // since we never proved that it learned about the commit level from the old primary before
+ // the new primary got elected. The new primary cannot advance the commit level until it
+ // commits a write in its own term. This includes learning that a majority of nodes have
+ // received such a write.
+ assert.eq(doCommittedRead(oldPrimaryColl), 'old');
+
+ // Reconnect oldPrimary to newPrimary, inducing rollback of the 'INVALID' write. This causes
+ // oldPrimary to drop all snapshots. oldPrimary still won't be connected to enough hosts to
+ // allow it to be elected, so newPrimary should stay primary for the rest of this test.
+ oldPrimary.reconnect(newPrimary);
+ assert.soon(function() {
+ try {
+ return oldPrimary.adminCommand('isMaster').secondary &&
+ doDirtyRead(oldPrimaryColl) == 'new';
+ } catch (e) {
+ return false; // ignore disconnect errors.
+ }
+ }, '', 60 * 1000);
+ assert.eq(doDirtyRead(oldPrimaryColl), 'new');
+ assertCommittedReadsBlock(oldPrimaryColl);
+
+ // Try asserts again after sleeping to make sure state doesn't change while pureSecondary isn't
+ // replicating.
+ sleep(1000);
+ assert.eq(doDirtyRead(oldPrimaryColl), 'new');
+ assertCommittedReadsBlock(oldPrimaryColl);
+
+ // Resume oplog application on pureSecondary to allow the 'new' write to be committed. It should
+ // now be visible as a committed read to both oldPrimary and newPrimary.
+ assert.commandWorked(
+ pureSecondary.adminCommand({configureFailPoint: "rsSyncApplyStop", mode: "off"}));
+ assert.commandWorked(
+ newPrimaryColl.runCommand({getLastError: 1, w: 'majority', wtimeout: 30000}));
+ assert.eq(doCommittedRead(newPrimaryColl), 'new');
+ assert.eq(doCommittedRead(oldPrimaryColl), 'new');
+}());