diff options
author | Eric Milkie <milkie@10gen.com> | 2016-04-07 09:51:28 -0400 |
---|---|---|
committer | Eric Milkie <milkie@10gen.com> | 2016-04-14 13:20:34 -0400 |
commit | c558a396d221ee5c13278ca76667cca5adf8bdf5 (patch) | |
tree | 62afab0b42ed7751e8fb24ae037f31c1d1ab30de | |
parent | 7ee4e4e493c3785fea489ee3508ca18526709c16 (diff) | |
download | mongo-c558a396d221ee5c13278ca76667cca5adf8bdf5.tar.gz |
SERVER-23351 test read committed snapshots after a rollback occurs
(cherry picked from commit 0c3430437bc84b1d1f02ab78f1303732e84fe0c4)
-rw-r--r-- | jstests/replsets/read_committed_after_rollback.js | 156 |
1 files changed, 156 insertions, 0 deletions
diff --git a/jstests/replsets/read_committed_after_rollback.js b/jstests/replsets/read_committed_after_rollback.js new file mode 100644 index 00000000000..68ba334ac9c --- /dev/null +++ b/jstests/replsets/read_committed_after_rollback.js @@ -0,0 +1,156 @@ +/** + * + * Test read committed functionality following a following a rollback. Currently we require that all + * snapshots be dropped during rollback, therefore committed reads will block until a new committed + * snapshot is available. + */ + +load("jstests/replsets/rslib.js"); // For startSetIfSupportsReadMajority. + +(function() { + "use strict"; + + function assertCommittedReadsBlock(coll) { + var res = + coll.runCommand('find', {"readConcern": {"level": "majority"}, "maxTimeMS": 3000}); + assert.commandFailedWithCode( + res, + ErrorCodes.ExceededTimeLimit, + "Expected read of " + coll.getFullName() + ' on ' + coll.getMongo().host + " to block"); + } + + function doCommittedRead(coll) { + var res = + coll.runCommand('find', {"readConcern": {"level": "majority"}, "maxTimeMS": 10000}); + assert.commandWorked(res, + 'reading from ' + coll.getFullName() + ' on ' + coll.getMongo().host); + return new DBCommandCursor(coll.getMongo(), res).toArray()[0].state; + } + + function doDirtyRead(coll) { + var res = coll.runCommand('find', {"readConcern": {"level": "local"}}); + assert.commandWorked(res, + 'reading from ' + coll.getFullName() + ' on ' + coll.getMongo().host); + return new DBCommandCursor(coll.getMongo(), res).toArray()[0].state; + } + + // Set up a set and grab things for later. + var name = "read_committed_after_rollback"; + var replTest = new ReplSetTest( + {name: name, nodes: 5, useBridge: true, nodeOptions: {enableMajorityReadConcern: ''}}); + + try { + replTest.startSet(); + } catch (e) { + var conn = MongoRunner.runMongod(); + if (!conn.getDB('admin').serverStatus().storageEngine.supportsCommittedReads) { + jsTest.log("skipping test since storage engine doesn't support committed reads"); + MongoRunner.stopMongod(conn); + return; + } + throw e; + } + + var nodes = replTest.nodeList(); + var config = { + "_id": name, + "members": [ + {"_id": 0, "host": nodes[0]}, + {"_id": 1, "host": nodes[1]}, + {"_id": 2, "host": nodes[2], priority: 0}, + // Note: using two arbiters to ensure that a host that can't talk to any other + // data-bearing node can still be elected. This also means that a write isn't considered + // committed until it is on all 3 data-bearing nodes, not just 2. + {"_id": 3, "host": nodes[3], arbiterOnly: true}, + {"_id": 4, "host": nodes[4], arbiterOnly: true}, + ] + }; + replTest.initiate(config); + + // Get connections. + var oldPrimary = replTest.getPrimary(); + var newPrimary = replTest.liveNodes.slaves[0]; + var pureSecondary = replTest.liveNodes.slaves[1]; + var arbiters = [replTest.nodes[3], replTest.nodes[4]]; + + // This is the collection that all of the tests will use. + var collName = name + '.collection'; + var oldPrimaryColl = oldPrimary.getCollection(collName); + var newPrimaryColl = newPrimary.getCollection(collName); + + // Set up initial state. + assert.writeOK(oldPrimaryColl.insert({_id: 1, state: 'old'}, + {writeConcern: {w: 'majority', wtimeout: 30000}})); + assert.eq(doDirtyRead(oldPrimaryColl), 'old'); + assert.eq(doCommittedRead(oldPrimaryColl), 'old'); + assert.eq(doDirtyRead(newPrimaryColl), 'old'); + // Note that we can't necessarily do a committed read from newPrimaryColl and get 'old', since + // delivery of the commit level to secondaries isn't synchronized with anything + // (we would have to hammer to reliably prove that it eventually would work). + + // Partition the world such that oldPrimary is still primary but can't replicate to anyone. + // newPrimary is disconnected from the arbiters first to ensure that it can't be elected. + newPrimary.disconnect(arbiters); + oldPrimary.disconnect([newPrimary, pureSecondary]); + assert.eq(doDirtyRead(newPrimaryColl), 'old'); + + // This write will only make it to oldPrimary and will never become committed. + assert.writeOK(oldPrimaryColl.save({_id: 1, state: 'INVALID'})); + assert.eq(doDirtyRead(oldPrimaryColl), 'INVALID'); + assert.eq(doCommittedRead(oldPrimaryColl), 'old'); + + // Change the partitioning so that oldPrimary is isolated, and newPrimary can be elected. + oldPrimary.setSlaveOk(); + oldPrimary.disconnect(arbiters); + newPrimary.reconnect(arbiters); + assert.soon(() => newPrimary.adminCommand('isMaster').ismaster, '', 60 * 1000); + assert.soon(function() { + try { + return !oldPrimary.adminCommand('isMaster').ismaster; + } catch (e) { + return false; // ignore disconnect errors. + } + }); + + // Stop applier on pureSecondary to ensure that writes to newPrimary won't become committed yet. + assert.commandWorked( + pureSecondary.adminCommand({configureFailPoint: "rsSyncApplyStop", mode: "alwaysOn"})); + assert.writeOK(newPrimaryColl.save({_id: 1, state: 'new'})); + assert.eq(doDirtyRead(newPrimaryColl), 'new'); + // Note that we still can't do a committed read from the new primary and reliably get anything, + // since we never proved that it learned about the commit level from the old primary before + // the new primary got elected. The new primary cannot advance the commit level until it + // commits a write in its own term. This includes learning that a majority of nodes have + // received such a write. + assert.eq(doCommittedRead(oldPrimaryColl), 'old'); + + // Reconnect oldPrimary to newPrimary, inducing rollback of the 'INVALID' write. This causes + // oldPrimary to drop all snapshots. oldPrimary still won't be connected to enough hosts to + // allow it to be elected, so newPrimary should stay primary for the rest of this test. + oldPrimary.reconnect(newPrimary); + assert.soon(function() { + try { + return oldPrimary.adminCommand('isMaster').secondary && + doDirtyRead(oldPrimaryColl) == 'new'; + } catch (e) { + return false; // ignore disconnect errors. + } + }, '', 60 * 1000); + assert.eq(doDirtyRead(oldPrimaryColl), 'new'); + assertCommittedReadsBlock(oldPrimaryColl); + + // Try asserts again after sleeping to make sure state doesn't change while pureSecondary isn't + // replicating. + sleep(1000); + assert.eq(doDirtyRead(oldPrimaryColl), 'new'); + assertCommittedReadsBlock(oldPrimaryColl); + + // Resume oplog application on pureSecondary to allow the 'new' write to be committed. It should + // now be visible as a committed read to both oldPrimary and newPrimary. + assert.commandWorked( + pureSecondary.adminCommand({configureFailPoint: "rsSyncApplyStop", mode: "off"})); + assert.commandWorked( + newPrimaryColl.runCommand({getLastError: 1, w: 'majority', wtimeout: 30000})); + assert.eq(doCommittedRead(newPrimaryColl), 'new'); + assert.eq(doCommittedRead(oldPrimaryColl), 'new'); +}()); |