// Source path: jstests/sharding/migration_ignore_interrupts_4.js
// (blob d28d809178d817342d7884082acec1bae153050d)
// Tests that when a donor aborts a migration without the recipient realizing it, and the donor
// then moves on to a new migration, the original recipient fails to retrieve transferMods from
// the donor's xfermods log.
//
// Note: don't use coll1 in this test after a coll1 migration is interrupted -- the distlock isn't
// released promptly when interrupted.

load('./jstests/libs/chunk_manipulation_util.js');

/**
 * Test body, wrapped in an IIFE so that its bindings do not leak into the shell's global scope.
 *
 * Scenario exercised, in order:
 *   1. Shard two collections (coll1, coll2) on {a: 1}, each holding one document on shard0.
 *   2. Start a coll1 migration shard0 -> shard1 with the recipient paused at the "cloned" step
 *      and the donor paused at the "startedMoveChunk" step, then kill the donor's moveChunk.
 *      The donor-side moveChunk is expected to throw.
 *   3. Start a coll2 migration shard0 -> shard2, paused at the recipient's "cloned" step, and
 *      insert two more coll2 documents while it is paused.
 *   4. Release the coll1 recipient (shard1) and wait until it reports no active migration;
 *      coll1's document must still be on shard0.
 *   5. Release the coll2 recipient (shard2); that migration must succeed and move all three
 *      coll2 documents to shard2.
 *
 * The pause/unpause/wait helpers and the step-name tables used below are not defined in this
 * file; presumably they come from the chunk_manipulation_util.js library loaded above.
 *
 * The order of the statements is significant: do not reorder the pause, start, wait, and
 * unpause calls.
 */
(function() {
"use strict";

// Standalone mongod that is handed to moveChunkParallel below.
const staticMongod = MongoRunner.runMongod({});  // For startParallelOps.

// This test only makes sense if resumable range deletion is off, because when it is on, it is not
// possible for the donor to begin a new migration before having completed the previous one.
const st = new ShardingTest(
    {shards: 3, shardOptions: {setParameter: {"disableResumableRangeDeleter": true}}});

// Router-level handles: commands and reads/writes routed through mongos.
const mongos = st.s0;
const admin = mongos.getDB('admin');
const dbName = "testDB";
const ns1 = dbName + ".foo";
const ns2 = dbName + ".bar";
const coll1 = mongos.getCollection(ns1);
const coll2 = mongos.getCollection(ns2);

// Direct per-shard handles, used to check which shard holds each collection's documents.
const shard0 = st.shard0;
const shard1 = st.shard1;
const shard2 = st.shard2;
const shard0Coll1 = shard0.getCollection(ns1);
const shard1Coll1 = shard1.getCollection(ns1);
const shard2Coll1 = shard2.getCollection(ns1);
const shard0Coll2 = shard0.getCollection(ns2);
const shard1Coll2 = shard1.getCollection(ns2);
const shard2Coll2 = shard2.getCollection(ns2);

assert.commandWorked(admin.runCommand({enableSharding: dbName}));
st.ensurePrimaryShard(dbName, st.shard0.shardName);

// coll1: one document, which must live on shard0 only.
assert.commandWorked(admin.runCommand({shardCollection: ns1, key: {a: 1}}));
assert.commandWorked(coll1.insert({a: 0}));
assert.eq(1, shard0Coll1.find().itcount());
assert.eq(0, shard1Coll1.find().itcount());
assert.eq(0, shard2Coll1.find().itcount());
assert.eq(1, coll1.find().itcount());

// coll2: same layout as coll1.
assert.commandWorked(admin.runCommand({shardCollection: ns2, key: {a: 1}}));
assert.commandWorked(coll2.insert({a: 0}));
assert.eq(1, shard0Coll2.find().itcount());
assert.eq(0, shard1Coll2.find().itcount());
assert.eq(0, shard2Coll2.find().itcount());
assert.eq(1, coll2.find().itcount());

// Shard0:
//      coll1:     [-inf, +inf)
//      coll2:     [-inf, +inf)
// Shard1:
// Shard2:

jsTest.log("Set up complete, now proceeding to test that migration interruption fails.");

// Start coll1 migration to shard1: pause recipient after cloning, donor before interrupt check
pauseMigrateAtStep(shard1, migrateStepNames.cloned);
pauseMoveChunkAtStep(shard0, moveChunkStepNames.startedMoveChunk);
const joinMoveChunk = moveChunkParallel(
    staticMongod, st.s0.host, {a: 0}, null, coll1.getFullName(), st.shard1.shardName);
waitForMigrateStep(shard1, migrateStepNames.cloned);

// Abort migration on donor side, recipient is unaware
killRunningMoveChunk(admin);

// Let the donor proceed past its pause point so that it can observe the kill.
unpauseMoveChunkAtStep(shard0, moveChunkStepNames.startedMoveChunk);

// The killed coll1 moveChunk must surface as a failure when joined.
assert.throws(function() {
    joinMoveChunk();
});

// Start coll2 migration to shard2, pause recipient after cloning step.
pauseMigrateAtStep(shard2, migrateStepNames.cloned);
const joinMoveChunk2 = moveChunkParallel(
    staticMongod, st.s0.host, {a: 0}, null, coll2.getFullName(), st.shard2.shardName);
waitForMigrateStep(shard2, migrateStepNames.cloned);

// Populate donor (shard0) xfermods log.
assert.commandWorked(coll2.insert({a: 1}));
assert.commandWorked(coll2.insert({a: 2}));
assert.eq(3, coll2.find().itcount(), "Failed to insert documents into coll2.");
assert.eq(3, shard0Coll2.find().itcount());

jsTest.log('Releasing coll1 migration recipient, whose transferMods command should fail....');
unpauseMigrateAtStep(shard1, migrateStepNames.cloned);
assert.soon(function() {
    // Wait for the destination shard to report that it is not in an active migration.
    const res = shard1.adminCommand({'_recvChunkStatus': 1});
    // Strict comparison: only an explicit `active: false` counts. A reply without an `active`
    // field keeps the wait going, exactly as it did with the previous loose comparison.
    return res.active === false;
}, "coll1 migration recipient didn't abort migration in catchup phase.", 2 * 60 * 1000);
// The aborted migration must not have moved coll1's document off the donor.
assert.eq(1, shard0Coll1.find().itcount(), "donor shard0 completed a migration that it aborted.");

jsTest.log('Finishing coll2 migration, which should succeed....');
unpauseMigrateAtStep(shard2, migrateStepNames.cloned);
assert.doesNotThrow(function() {
    joinMoveChunk2();
});
// All three coll2 documents (the original plus the two inserted mid-migration) must now be on
// shard2, and none may remain on the donor.
assert.eq(0,
          shard0Coll2.find().itcount(),
          "donor shard0 failed to complete a migration after aborting a prior migration.");
assert.eq(3, shard2Coll2.find().itcount(), "shard2 failed to complete migration.");

// Tear down the cluster first, then the standalone helper mongod.
st.stop();
MongoRunner.stopMongod(staticMongod);
})();