// Source path: jstests/sharding/migration_ignore_interrupts_4.js
// (blob bc692a9897c8e73a1335ae91baa875c9c66da23d)
// If a donor aborts a migration to a recipient, the recipient does not realize the migration has
// been aborted, and the donor moves on to a new migration, the original recipient will then fail to
// retrieve transferMods from the donor's xfermods log.
//
// Note: don't use coll1 in this test after a coll1 migration is interrupted -- the distlock isn't
// released promptly when interrupted.

load('./jstests/libs/chunk_manipulation_util.js');

(function() {
"use strict";

// Standalone mongod passed to moveChunkParallel below (for startParallelOps).
const staticMongod = MongoRunner.runMongod({});

const st = new ShardingTest({shards: 3});

// Handles through mongos (routed access) ...
const mongos = st.s0;
const admin = mongos.getDB('admin');
const dbName = "testDB";
const ns1 = dbName + ".foo";
const ns2 = dbName + ".bar";
const coll1 = mongos.getCollection(ns1);
const coll2 = mongos.getCollection(ns2);

// ... and handles obtained directly from each shard, used to check where documents live.
const shard0 = st.shard0;
const shard1 = st.shard1;
const shard2 = st.shard2;
const shard0Coll1 = shard0.getCollection(ns1);
const shard1Coll1 = shard1.getCollection(ns1);
const shard2Coll1 = shard2.getCollection(ns1);
const shard0Coll2 = shard0.getCollection(ns2);
const shard1Coll2 = shard1.getCollection(ns2);
const shard2Coll2 = shard2.getCollection(ns2);

assert.commandWorked(admin.runCommand({enableSharding: dbName}));
st.ensurePrimaryShard(dbName, st.shard0.shardName);

// coll1: shard on {a: 1} and insert one document, which must be visible only on shard0.
assert.commandWorked(admin.runCommand({shardCollection: ns1, key: {a: 1}}));
assert.writeOK(coll1.insert({a: 0}));
assert.eq(1, shard0Coll1.find().itcount());
assert.eq(0, shard1Coll1.find().itcount());
assert.eq(0, shard2Coll1.find().itcount());
assert.eq(1, coll1.find().itcount());

// coll2: same setup as coll1.
assert.commandWorked(admin.runCommand({shardCollection: ns2, key: {a: 1}}));
assert.writeOK(coll2.insert({a: 0}));
assert.eq(1, shard0Coll2.find().itcount());
assert.eq(0, shard1Coll2.find().itcount());
assert.eq(0, shard2Coll2.find().itcount());
assert.eq(1, coll2.find().itcount());

// Shard0:
//      coll1:     [-inf, +inf)
//      coll2:     [-inf, +inf)
// Shard1:
// Shard2:

jsTest.log("Set up complete, now proceeding to test that migration interruption fails.");

// Start coll1 migration to shard1: pause recipient after cloning, donor before interrupt check
pauseMigrateAtStep(shard1, migrateStepNames.cloned);
pauseMoveChunkAtStep(shard0, moveChunkStepNames.startedMoveChunk);
let joinMoveChunk = moveChunkParallel(
    staticMongod, st.s0.host, {a: 0}, null, coll1.getFullName(), st.shard1.shardName);
waitForMigrateStep(shard1, migrateStepNames.cloned);

// Abort migration on donor side, recipient is unaware
const inProgressOps = admin.aggregate([{$currentOp: {'allUsers': true}}]);
let abortedMigration = false;
// Every op seen is accumulated so the assertion below can report them on failure.
let inProgressStr = '';
while (inProgressOps.hasNext()) {
    const op = inProgressOps.next();
    inProgressStr += tojson(op);
    // Skip entries that carry no 'command' document instead of throwing a TypeError, which
    // would hide the diagnostic message of the assertion below.
    if (op.command && op.command.moveChunk) {
        admin.killOp(op.opid);
        abortedMigration = true;
    }
}
assert.eq(
    true, abortedMigration, "Failed to abort migration, current running ops: " + inProgressStr);
unpauseMoveChunkAtStep(shard0, moveChunkStepNames.startedMoveChunk);
// The killed moveChunk is expected to surface as an exception when joined.
assert.throws(function() {
    joinMoveChunk();
});

// Start coll2 migration to shard2, pause recipient after cloning step.
pauseMigrateAtStep(shard2, migrateStepNames.cloned);
joinMoveChunk = moveChunkParallel(
    staticMongod, st.s0.host, {a: 0}, null, coll2.getFullName(), st.shard2.shardName);
waitForMigrateStep(shard2, migrateStepNames.cloned);

// Populate donor (shard0) xfermods log.
assert.writeOK(coll2.insert({a: 1}));
assert.writeOK(coll2.insert({a: 2}));
assert.eq(3, coll2.find().itcount(), "Failed to insert documents into coll2.");
assert.eq(3, shard0Coll2.find().itcount());

jsTest.log('Releasing coll1 migration recipient, whose transferMods command should fail....');
unpauseMigrateAtStep(shard1, migrateStepNames.cloned);
assert.soon(function() {
    // Wait for the destination shard to report that it is not in an active migration.
    const res = shard1.adminCommand({'_recvChunkStatus': 1});
    return res.active === false;
}, "coll1 migration recipient didn't abort migration in catchup phase.", 2 * 60 * 1000);
// The coll1 document must still be on the donor: the aborted migration moved nothing.
assert.eq(1, shard0Coll1.find().itcount(), "donor shard0 completed a migration that it aborted.");

jsTest.log('Finishing coll2 migration, which should succeed....');
unpauseMigrateAtStep(shard2, migrateStepNames.cloned);
assert.doesNotThrow(function() {
    joinMoveChunk();
});
// All three coll2 documents (the original plus the two inserted mid-migration) must have
// moved from shard0 to shard2.
assert.eq(0,
          shard0Coll2.find().itcount(),
          "donor shard0 failed to complete a migration after aborting a prior migration.");
assert.eq(3, shard2Coll2.find().itcount(), "shard2 failed to complete migration.");

st.stop();
MongoRunner.stopMongod(staticMongod);
})();