/**
 *    Copyright (C) 2018-present MongoDB, Inc.
 *
 *    This program is free software: you can redistribute it and/or modify
 *    it under the terms of the Server Side Public License, version 1,
 *    as published by MongoDB, Inc.
 *
 *    This program is distributed in the hope that it will be useful,
 *    but WITHOUT ANY WARRANTY; without even the implied warranty of
 *    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 *    Server Side Public License for more details.
 *
 *    You should have received a copy of the Server Side Public License
 *    along with this program. If not, see
 *    <http://www.mongodb.com/licensing/server-side-public-license>.
 *
 *    As a special exception, the copyright holders give permission to link the
 *    code of portions of this program with the OpenSSL library under certain
 *    conditions as described in each individual source file and distribute
 *    linked combinations including the program with the OpenSSL library. You
 *    must comply with the Server Side Public License in all respects for
 *    all of the code used other than as permitted herein. If you modify file(s)
 *    with this exception, you may extend this exception to your version of the
 *    file(s), but you are not obligated to do so. If you do not wish to do so,
 *    delete this exception statement from your version. If you delete this
 *    exception statement from all source files in the program, then also delete
 *    it in the license file.
*/ #include "mongo/platform/basic.h" #include "mongo/s/query/async_results_merger.h" #include #include "mongo/db/json.h" #include "mongo/db/pipeline/change_stream_constants.h" #include "mongo/db/pipeline/resume_token.h" #include "mongo/db/query/cursor_response.h" #include "mongo/db/query/getmore_command_gen.h" #include "mongo/executor/task_executor.h" #include "mongo/s/catalog/type_shard.h" #include "mongo/s/client/shard_registry.h" #include "mongo/s/query/results_merger_test_fixture.h" #include "mongo/unittest/death_test.h" #include "mongo/unittest/unittest.h" namespace mongo { namespace { LogicalSessionId parseSessionIdFromCmd(BSONObj cmdObj) { return LogicalSessionId::parse(IDLParserErrorContext("lsid"), cmdObj["lsid"].Obj()); } BSONObj makePostBatchResumeToken(Timestamp clusterTime) { auto pbrt = ResumeToken::makeHighWaterMarkToken(clusterTime).toDocument().toBson(); invariant(pbrt.firstElement().type() == BSONType::String); return pbrt; } BSONObj makeResumeToken(Timestamp clusterTime, UUID uuid, BSONObj docKey) { ResumeTokenData data; data.clusterTime = clusterTime; data.uuid = uuid; data.documentKey = Value(Document{docKey}); return ResumeToken(data).toDocument().toBson(); } using AsyncResultsMergerTest = ResultsMergerTestFixture; TEST_F(AsyncResultsMergerTest, SingleShardUnsorted) { std::vector cursors; cursors.push_back( makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 5, {}))); auto arm = makeARMFromExistingCursors(std::move(cursors)); // Before any requests are scheduled, ARM is not ready to return results. ASSERT_FALSE(arm->ready()); ASSERT_FALSE(arm->remotesExhausted()); // Schedule requests. auto readyEvent = unittest::assertGet(arm->nextEvent()); // Before any responses are delivered, ARM is not ready to return results. ASSERT_FALSE(arm->ready()); ASSERT_FALSE(arm->remotesExhausted()); // Shard responds; the handleBatchResponse callbacks are run and ARM's remotes get updated. 
std::vector responses; std::vector batch = {fromjson("{_id: 1}"), fromjson("{_id: 2}"), fromjson("{_id: 3}")}; responses.emplace_back(kTestNss, CursorId(0), batch); scheduleNetworkResponses(std::move(responses)); // Now that the responses have been delivered, ARM is ready to return results. ASSERT_TRUE(arm->ready()); // Because the response contained a cursorId of 0, ARM marked the remote as exhausted. ASSERT_TRUE(arm->remotesExhausted()); // ARM returns the correct results. executor()->waitForEvent(readyEvent); ASSERT_BSONOBJ_EQ(fromjson("{_id: 1}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 2}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 3}"), *unittest::assertGet(arm->nextReady()).getResult()); // After returning all the buffered results, ARM returns EOF immediately because the cursor was // exhausted. ASSERT_TRUE(arm->ready()); ASSERT_TRUE(unittest::assertGet(arm->nextReady()).isEOF()); } TEST_F(AsyncResultsMergerTest, SingleShardSorted) { BSONObj findCmd = fromjson("{find: 'testcoll', sort: {_id: 1}}"); std::vector cursors; cursors.push_back( makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 5, {}))); auto arm = makeARMFromExistingCursors(std::move(cursors), findCmd); // Before any requests are scheduled, ARM is not ready to return results. ASSERT_FALSE(arm->ready()); ASSERT_FALSE(arm->remotesExhausted()); // Schedule requests. auto readyEvent = unittest::assertGet(arm->nextEvent()); // Before any responses are delivered, ARM is not ready to return results. ASSERT_FALSE(arm->ready()); ASSERT_FALSE(arm->remotesExhausted()); // Shard responds; the handleBatchResponse callbacks are run and ARM's remotes get updated. 
std::vector responses; std::vector batch = {fromjson("{$sortKey: [5]}"), fromjson("{$sortKey: [6]}")}; responses.emplace_back(kTestNss, CursorId(0), batch); scheduleNetworkResponses(std::move(responses)); // Now that the responses have been delivered, ARM is ready to return results. ASSERT_TRUE(arm->ready()); // Because the response contained a cursorId of 0, ARM marked the remote as exhausted. ASSERT_TRUE(arm->remotesExhausted()); // ARM returns all results in order. executor()->waitForEvent(readyEvent); ASSERT_BSONOBJ_EQ(fromjson("{$sortKey: [5]}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{$sortKey: [6]}"), *unittest::assertGet(arm->nextReady()).getResult()); // After returning all the buffered results, ARM returns EOF immediately because the cursor was // exhausted. ASSERT_TRUE(arm->ready()); ASSERT_TRUE(unittest::assertGet(arm->nextReady()).isEOF()); } TEST_F(AsyncResultsMergerTest, MultiShardUnsorted) { std::vector cursors; cursors.push_back( makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 5, {}))); cursors.push_back( makeRemoteCursor(kTestShardIds[1], kTestShardHosts[1], CursorResponse(kTestNss, 6, {}))); auto arm = makeARMFromExistingCursors(std::move(cursors)); // Before any requests are scheduled, ARM is not ready to return results. ASSERT_FALSE(arm->ready()); ASSERT_FALSE(arm->remotesExhausted()); // Schedule requests. auto readyEvent = unittest::assertGet(arm->nextEvent()); // Before any responses are delivered, ARM is not ready to return results. ASSERT_FALSE(arm->ready()); ASSERT_FALSE(arm->remotesExhausted()); // First shard responds; the handleBatchResponse callback is run and ARM's remote gets updated. 
std::vector responses; std::vector batch1 = { fromjson("{_id: 1}"), fromjson("{_id: 2}"), fromjson("{_id: 3}")}; responses.emplace_back(kTestNss, CursorId(0), batch1); scheduleNetworkResponses(std::move(responses)); // ARM is ready to return first result. ASSERT_TRUE(arm->ready()); // ARM is not exhausted, because second shard has yet to respond. ASSERT_FALSE(arm->remotesExhausted()); // ARM returns results from first shard immediately. executor()->waitForEvent(readyEvent); ASSERT_BSONOBJ_EQ(fromjson("{_id: 1}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 2}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 3}"), *unittest::assertGet(arm->nextReady()).getResult()); // There are no further buffered results, so ARM is not ready. ASSERT_FALSE(arm->ready()); // Make next event to be signaled. readyEvent = unittest::assertGet(arm->nextEvent()); // Second shard responds; the handleBatchResponse callback is run and ARM's remote gets updated. responses.clear(); std::vector batch2 = { fromjson("{_id: 4}"), fromjson("{_id: 5}"), fromjson("{_id: 6}")}; responses.emplace_back(kTestNss, CursorId(0), batch2); scheduleNetworkResponses(std::move(responses)); // ARM is ready to return remaining results. ASSERT_TRUE(arm->ready()); ASSERT_TRUE(arm->remotesExhausted()); // ARM returns results from second shard immediately. executor()->waitForEvent(readyEvent); ASSERT_BSONOBJ_EQ(fromjson("{_id: 4}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 5}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 6}"), *unittest::assertGet(arm->nextReady()).getResult()); // After returning all the buffered results, the ARM returns EOF immediately because both shards // cursors were exhausted. 
ASSERT_TRUE(arm->ready()); ASSERT_TRUE(unittest::assertGet(arm->nextReady()).isEOF()); } TEST_F(AsyncResultsMergerTest, MultiShardSorted) { BSONObj findCmd = fromjson("{find: 'testcoll', sort: {_id: 1}}"); std::vector cursors; cursors.push_back( makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 5, {}))); cursors.push_back( makeRemoteCursor(kTestShardIds[1], kTestShardHosts[1], CursorResponse(kTestNss, 6, {}))); auto arm = makeARMFromExistingCursors(std::move(cursors), findCmd); // Before any requests are scheduled, ARM is not ready to return results. ASSERT_FALSE(arm->ready()); ASSERT_FALSE(arm->remotesExhausted()); // Schedule requests. auto readyEvent = unittest::assertGet(arm->nextEvent()); // Before any responses are delivered, ARM is not ready to return results. ASSERT_FALSE(arm->ready()); ASSERT_FALSE(arm->remotesExhausted()); // First shard responds; the handleBatchResponse callback is run and ARM's remote gets updated. std::vector responses; std::vector batch1 = {fromjson("{$sortKey: [5]}"), fromjson("{$sortKey: [6]}")}; responses.emplace_back(kTestNss, CursorId(0), batch1); scheduleNetworkResponses(std::move(responses)); // ARM is not ready to return results until receiving responses from all remotes. ASSERT_FALSE(arm->ready()); // ARM is not exhausted, because second shard has yet to respond. ASSERT_FALSE(arm->remotesExhausted()); // Second shard responds; the handleBatchResponse callback is run and ARM's remote gets updated. responses.clear(); std::vector batch2 = {fromjson("{$sortKey: [3]}"), fromjson("{$sortKey: [9]}")}; responses.emplace_back(kTestNss, CursorId(0), batch2); scheduleNetworkResponses(std::move(responses)); // Now that all remotes have responded, ARM is ready to return results. ASSERT_TRUE(arm->ready()); ASSERT_TRUE(arm->remotesExhausted()); // ARM returns all results in sorted order. 
executor()->waitForEvent(readyEvent); ASSERT_BSONOBJ_EQ(fromjson("{$sortKey: [3]}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{$sortKey: [5]}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{$sortKey: [6]}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{$sortKey: [9]}"), *unittest::assertGet(arm->nextReady()).getResult()); // After returning all the buffered results, the ARM returns EOF immediately because both shards // cursors were exhausted. ASSERT_TRUE(arm->ready()); ASSERT_TRUE(unittest::assertGet(arm->nextReady()).isEOF()); } TEST_F(AsyncResultsMergerTest, MultiShardMultipleGets) { std::vector cursors; cursors.push_back( makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 5, {}))); cursors.push_back( makeRemoteCursor(kTestShardIds[1], kTestShardHosts[1], CursorResponse(kTestNss, 6, {}))); auto arm = makeARMFromExistingCursors(std::move(cursors)); // Before any requests are scheduled, ARM is not ready to return results. ASSERT_FALSE(arm->ready()); ASSERT_FALSE(arm->remotesExhausted()); // Schedule requests. auto readyEvent = unittest::assertGet(arm->nextEvent()); // First shard responds; the handleBatchResponse callback is run and ARM's remote gets updated. std::vector responses; std::vector batch1 = { fromjson("{_id: 1}"), fromjson("{_id: 2}"), fromjson("{_id: 3}")}; responses.emplace_back(kTestNss, CursorId(5), batch1); scheduleNetworkResponses(std::move(responses)); // ARM is ready to return first result. ASSERT_TRUE(arm->ready()); // ARM is not exhausted, because second shard has yet to respond and first shard's response did // not contain cursorId=0. ASSERT_FALSE(arm->remotesExhausted()); // ARM returns results from first shard immediately. 
executor()->waitForEvent(readyEvent); ASSERT_BSONOBJ_EQ(fromjson("{_id: 1}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 2}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 3}"), *unittest::assertGet(arm->nextReady()).getResult()); // There are no further buffered results, so ARM is not ready. ASSERT_FALSE(arm->ready()); // Make next event to be signaled. readyEvent = unittest::assertGet(arm->nextEvent()); // Second shard responds; the handleBatchResponse callback is run and ARM's remote gets updated. responses.clear(); std::vector batch2 = { fromjson("{_id: 4}"), fromjson("{_id: 5}"), fromjson("{_id: 6}")}; responses.emplace_back(kTestNss, CursorId(0), batch2); scheduleNetworkResponses(std::move(responses)); // ARM is ready to return second shard's results. ASSERT_TRUE(arm->ready()); // ARM is not exhausted, because first shard's response did not contain cursorId=0. ASSERT_FALSE(arm->remotesExhausted()); // ARM returns results from second shard immediately. executor()->waitForEvent(readyEvent); ASSERT_BSONOBJ_EQ(fromjson("{_id: 4}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 5}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 6}"), *unittest::assertGet(arm->nextReady()).getResult()); // ARM is not ready to return results until further results are obtained from first shard. ASSERT_FALSE(arm->ready()); // Make next event to be signaled. readyEvent = unittest::assertGet(arm->nextEvent()); // First shard returns remainder of results. responses.clear(); std::vector batch3 = { fromjson("{_id: 7}"), fromjson("{_id: 8}"), fromjson("{_id: 9}")}; responses.emplace_back(kTestNss, CursorId(0), batch3); scheduleNetworkResponses(std::move(responses)); // ARM is ready to return remaining results. 
ASSERT_TRUE(arm->ready()); ASSERT_TRUE(arm->remotesExhausted()); // ARM returns remaining results immediately. executor()->waitForEvent(readyEvent); ASSERT_BSONOBJ_EQ(fromjson("{_id: 7}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 8}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 9}"), *unittest::assertGet(arm->nextReady()).getResult()); // After returning all the buffered results, the ARM returns EOF immediately because both shards // cursors were exhausted. ASSERT_TRUE(arm->ready()); ASSERT_TRUE(unittest::assertGet(arm->nextReady()).isEOF()); } TEST_F(AsyncResultsMergerTest, CompoundSortKey) { BSONObj findCmd = fromjson("{find: 'testcoll', sort: {a: -1, b: 1}}"); std::vector cursors; cursors.push_back( makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 5, {}))); cursors.push_back( makeRemoteCursor(kTestShardIds[1], kTestShardHosts[1], CursorResponse(kTestNss, 6, {}))); cursors.push_back( makeRemoteCursor(kTestShardIds[2], kTestShardHosts[2], CursorResponse(kTestNss, 7, {}))); auto arm = makeARMFromExistingCursors(std::move(cursors), findCmd); // Schedule requests. ASSERT_FALSE(arm->ready()); auto readyEvent = unittest::assertGet(arm->nextEvent()); ASSERT_FALSE(arm->ready()); // Deliver responses. std::vector responses; std::vector batch1 = {fromjson("{$sortKey: [5, 9]}"), fromjson("{$sortKey: [4, 20]}")}; responses.emplace_back(kTestNss, CursorId(0), batch1); std::vector batch2 = {fromjson("{$sortKey: [10, 11]}"), fromjson("{$sortKey: [4, 4]}")}; responses.emplace_back(kTestNss, CursorId(0), batch2); std::vector batch3 = {fromjson("{$sortKey: [10, 12]}"), fromjson("{$sortKey: [5, 9]}")}; responses.emplace_back(kTestNss, CursorId(0), batch3); scheduleNetworkResponses(std::move(responses)); executor()->waitForEvent(readyEvent); // ARM returns all results in sorted order. 
ASSERT_TRUE(arm->ready()); ASSERT_TRUE(arm->remotesExhausted()); ASSERT_BSONOBJ_EQ(fromjson("{$sortKey: [10, 11]}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{$sortKey: [10, 12]}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{$sortKey: [5, 9]}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{$sortKey: [5, 9]}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{$sortKey: [4, 4]}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{$sortKey: [4, 20]}"), *unittest::assertGet(arm->nextReady()).getResult()); // After returning all the buffered results, the ARM returns EOF immediately because both shards // cursors were exhausted. ASSERT_TRUE(arm->ready()); ASSERT_TRUE(unittest::assertGet(arm->nextReady()).isEOF()); } TEST_F(AsyncResultsMergerTest, SortedButNoSortKey) { BSONObj findCmd = fromjson("{find: 'testcoll', sort: {a: -1, b: 1}}"); std::vector cursors; cursors.push_back( makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 1, {}))); auto arm = makeARMFromExistingCursors(std::move(cursors), findCmd); ASSERT_FALSE(arm->ready()); auto readyEvent = unittest::assertGet(arm->nextEvent()); ASSERT_FALSE(arm->ready()); // Parsing the batch results in an error because the sort key is missing. 
std::vector responses; std::vector batch1 = {fromjson("{a: 2, b: 1}"), fromjson("{a: 1, b: 2}")}; responses.emplace_back(kTestNss, CursorId(1), batch1); scheduleNetworkResponses(std::move(responses)); executor()->waitForEvent(readyEvent); ASSERT_TRUE(arm->ready()); auto statusWithNext = arm->nextReady(); ASSERT(!statusWithNext.isOK()); ASSERT_EQ(statusWithNext.getStatus().code(), ErrorCodes::InternalError); // Required to kill the 'arm' on error before destruction. auto killFuture = arm->kill(operationContext()); killFuture.wait(); } TEST_F(AsyncResultsMergerTest, HasFirstBatch) { std::vector firstBatch = { fromjson("{_id: 1}"), fromjson("{_id: 2}"), fromjson("{_id: 3}")}; std::vector cursors; cursors.push_back(makeRemoteCursor( kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 5, std::move(firstBatch)))); auto arm = makeARMFromExistingCursors(std::move(cursors)); // Because there was firstBatch, ARM is immediately ready to return results. ASSERT_TRUE(arm->ready()); // Because the cursorId was not zero, ARM is not exhausted. ASSERT_FALSE(arm->remotesExhausted()); // ARM returns the correct results. ASSERT_BSONOBJ_EQ(fromjson("{_id: 1}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 2}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 3}"), *unittest::assertGet(arm->nextReady()).getResult()); // Now that the firstBatch results have been returned, ARM must wait for further results. ASSERT_FALSE(arm->ready()); // Schedule requests. auto readyEvent = unittest::assertGet(arm->nextEvent()); // Before any responses are delivered, ARM is not ready to return results. ASSERT_FALSE(arm->ready()); ASSERT_FALSE(arm->remotesExhausted()); // Shard responds; the handleBatchResponse callbacks are run and ARM's remotes get updated. 
std::vector responses; std::vector batch = {fromjson("{_id: 4}"), fromjson("{_id: 5}"), fromjson("{_id: 6}")}; responses.emplace_back(kTestNss, CursorId(0), batch); scheduleNetworkResponses(std::move(responses)); // Now that the responses have been delivered, ARM is ready to return results. ASSERT_TRUE(arm->ready()); // Because the response contained a cursorId of 0, ARM marked the remote as exhausted. ASSERT_TRUE(arm->remotesExhausted()); // ARM returns the correct results. executor()->waitForEvent(readyEvent); ASSERT_BSONOBJ_EQ(fromjson("{_id: 4}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 5}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 6}"), *unittest::assertGet(arm->nextReady()).getResult()); // After returning all the buffered results, ARM returns EOF immediately because the cursor was // exhausted. ASSERT_TRUE(arm->ready()); ASSERT_TRUE(unittest::assertGet(arm->nextReady()).isEOF()); } TEST_F(AsyncResultsMergerTest, OneShardHasInitialBatchOtherShardExhausted) { std::vector firstBatch = { fromjson("{_id: 1}"), fromjson("{_id: 2}"), fromjson("{_id: 3}")}; std::vector cursors; cursors.push_back(makeRemoteCursor( kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 5, std::move(firstBatch)))); cursors.push_back( makeRemoteCursor(kTestShardIds[1], kTestShardHosts[1], CursorResponse(kTestNss, 0, {}))); auto arm = makeARMFromExistingCursors(std::move(cursors)); // Because there was firstBatch, ARM is immediately ready to return results. ASSERT_TRUE(arm->ready()); // Because one of the remotes' cursorId was not zero, ARM is not exhausted. ASSERT_FALSE(arm->remotesExhausted()); // ARM returns the correct results. 
ASSERT_BSONOBJ_EQ(fromjson("{_id: 1}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 2}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 3}"), *unittest::assertGet(arm->nextReady()).getResult()); // Now that the firstBatch results have been returned, ARM must wait for further results. ASSERT_FALSE(arm->ready()); // Schedule requests. auto readyEvent = unittest::assertGet(arm->nextEvent()); // Before any responses are delivered, ARM is not ready to return results. ASSERT_FALSE(arm->ready()); ASSERT_FALSE(arm->remotesExhausted()); // Shard responds; the handleBatchResponse callbacks are run and ARM's remotes get updated. std::vector responses; std::vector batch = {fromjson("{_id: 4}"), fromjson("{_id: 5}"), fromjson("{_id: 6}")}; responses.emplace_back(kTestNss, CursorId(0), batch); scheduleNetworkResponses(std::move(responses)); // Now that the responses have been delivered, ARM is ready to return results. ASSERT_TRUE(arm->ready()); // Because the response contained a cursorId of 0, ARM marked the remote as exhausted. ASSERT_TRUE(arm->remotesExhausted()); // ARM returns the correct results. executor()->waitForEvent(readyEvent); ASSERT_BSONOBJ_EQ(fromjson("{_id: 4}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 5}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 6}"), *unittest::assertGet(arm->nextReady()).getResult()); // After returning all the buffered results, ARM returns EOF immediately because the cursor was // exhausted. 
ASSERT_TRUE(arm->ready()); ASSERT_TRUE(unittest::assertGet(arm->nextReady()).isEOF()); } TEST_F(AsyncResultsMergerTest, StreamResultsFromOneShardIfOtherDoesntRespond) { std::vector cursors; cursors.push_back( makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 1, {}))); cursors.push_back( makeRemoteCursor(kTestShardIds[1], kTestShardHosts[1], CursorResponse(kTestNss, 2, {}))); auto arm = makeARMFromExistingCursors(std::move(cursors)); ASSERT_FALSE(arm->ready()); auto readyEvent = unittest::assertGet(arm->nextEvent()); ASSERT_FALSE(arm->ready()); // Both shards respond with the first batch. std::vector responses; std::vector batch1 = {fromjson("{_id: 1}"), fromjson("{_id: 2}")}; responses.emplace_back(kTestNss, CursorId(1), batch1); std::vector batch2 = {fromjson("{_id: 3}"), fromjson("{_id: 4}")}; responses.emplace_back(kTestNss, CursorId(2), batch2); scheduleNetworkResponses(std::move(responses)); executor()->waitForEvent(readyEvent); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 1}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 2}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 3}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 4}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_FALSE(arm->ready()); readyEvent = unittest::assertGet(arm->nextEvent()); ASSERT_FALSE(arm->ready()); // When we ask the shards for their next batch, the first shard responds and the second shard // never responds. 
responses.clear(); std::vector batch3 = {fromjson("{_id: 5}"), fromjson("{_id: 6}")}; responses.emplace_back(kTestNss, CursorId(1), batch3); scheduleNetworkResponses(std::move(responses)); blackHoleNextRequest(); executor()->waitForEvent(readyEvent); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 5}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 6}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_FALSE(arm->ready()); readyEvent = unittest::assertGet(arm->nextEvent()); ASSERT_FALSE(arm->ready()); // We can continue to return results from first shard, while second shard remains unresponsive. responses.clear(); std::vector batch4 = {fromjson("{_id: 7}"), fromjson("{_id: 8}")}; responses.emplace_back(kTestNss, CursorId(0), batch4); scheduleNetworkResponses(std::move(responses)); executor()->waitForEvent(readyEvent); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 7}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 8}"), *unittest::assertGet(arm->nextReady()).getResult()); auto killFuture = arm->kill(operationContext()); executor()->shutdown(); killFuture.wait(); } TEST_F(AsyncResultsMergerTest, ErrorOnMismatchedCursorIds) { std::vector cursors; cursors.push_back( makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 123, {}))); auto arm = makeARMFromExistingCursors(std::move(cursors)); ASSERT_FALSE(arm->ready()); auto readyEvent = unittest::assertGet(arm->nextEvent()); ASSERT_FALSE(arm->ready()); std::vector responses; std::vector batch = {fromjson("{_id: 4}"), fromjson("{_id: 5}"), fromjson("{_id: 6}")}; responses.emplace_back(kTestNss, CursorId(456), batch); scheduleNetworkResponses(std::move(responses)); executor()->waitForEvent(readyEvent); ASSERT_TRUE(arm->ready()); ASSERT(!arm->nextReady().isOK()); // Required to kill the 'arm' on error before destruction. 
auto killFuture = arm->kill(operationContext()); killFuture.wait(); } TEST_F(AsyncResultsMergerTest, BadResponseReceivedFromShard) { std::vector cursors; cursors.push_back( makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 123, {}))); cursors.push_back( makeRemoteCursor(kTestShardIds[1], kTestShardHosts[1], CursorResponse(kTestNss, 456, {}))); cursors.push_back( makeRemoteCursor(kTestShardIds[2], kTestShardHosts[2], CursorResponse(kTestNss, 789, {}))); auto arm = makeARMFromExistingCursors(std::move(cursors)); ASSERT_FALSE(arm->ready()); auto readyEvent = unittest::assertGet(arm->nextEvent()); ASSERT_FALSE(arm->ready()); std::vector batch1 = {fromjson("{_id: 1}"), fromjson("{_id: 2}")}; BSONObj response1 = CursorResponse(kTestNss, CursorId(123), batch1) .toBSON(CursorResponse::ResponseType::SubsequentResponse); BSONObj response2 = fromjson("{foo: 'bar'}"); std::vector batch3 = {fromjson("{_id: 4}"), fromjson("{_id: 5}")}; BSONObj response3 = CursorResponse(kTestNss, CursorId(789), batch3) .toBSON(CursorResponse::ResponseType::SubsequentResponse); scheduleNetworkResponseObjs({response1, response2, response3}); runReadyCallbacks(); executor()->waitForEvent(readyEvent); ASSERT_TRUE(arm->ready()); auto statusWithNext = arm->nextReady(); ASSERT(!statusWithNext.isOK()); // Required to kill the 'arm' on error before destruction. 
auto killFuture = arm->kill(operationContext()); killFuture.wait(); } TEST_F(AsyncResultsMergerTest, ErrorReceivedFromShard) { std::vector cursors; cursors.push_back( makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 1, {}))); cursors.push_back( makeRemoteCursor(kTestShardIds[1], kTestShardHosts[1], CursorResponse(kTestNss, 2, {}))); cursors.push_back( makeRemoteCursor(kTestShardIds[2], kTestShardHosts[2], CursorResponse(kTestNss, 3, {}))); auto arm = makeARMFromExistingCursors(std::move(cursors)); ASSERT_FALSE(arm->ready()); auto readyEvent = unittest::assertGet(arm->nextEvent()); ASSERT_FALSE(arm->ready()); std::vector responses; std::vector batch1 = {fromjson("{_id: 1}"), fromjson("{_id: 2}")}; responses.emplace_back(kTestNss, CursorId(1), batch1); std::vector batch2 = {fromjson("{_id: 3}"), fromjson("{_id: 4}")}; responses.emplace_back(kTestNss, CursorId(2), batch2); scheduleNetworkResponses(std::move(responses)); scheduleErrorResponse({ErrorCodes::BadValue, "bad thing happened"}); executor()->waitForEvent(readyEvent); ASSERT_TRUE(arm->ready()); auto statusWithNext = arm->nextReady(); ASSERT(!statusWithNext.isOK()); ASSERT_EQ(statusWithNext.getStatus().code(), ErrorCodes::BadValue); ASSERT_EQ(statusWithNext.getStatus().reason(), "bad thing happened"); // Required to kill the 'arm' on error before destruction. auto killFuture = arm->kill(operationContext()); killFuture.wait(); } TEST_F(AsyncResultsMergerTest, ErrorCantScheduleEventBeforeLastSignaled) { std::vector cursors; cursors.push_back( makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 1, {}))); auto arm = makeARMFromExistingCursors(std::move(cursors)); ASSERT_FALSE(arm->ready()); auto readyEvent = unittest::assertGet(arm->nextEvent()); // Error to call nextEvent()() before the previous event is signaled. 
ASSERT_NOT_OK(arm->nextEvent().getStatus()); std::vector responses; std::vector batch = {fromjson("{_id: 1}"), fromjson("{_id: 2}")}; responses.emplace_back(kTestNss, CursorId(0), batch); scheduleNetworkResponses(std::move(responses)); executor()->waitForEvent(readyEvent); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 1}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 2}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_TRUE(unittest::assertGet(arm->nextReady()).isEOF()); // Required to kill the 'arm' on error before destruction. auto killFuture = arm->kill(operationContext()); killFuture.wait(); } TEST_F(AsyncResultsMergerTest, NextEventAfterTaskExecutorShutdown) { std::vector cursors; cursors.push_back( makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 1, {}))); auto arm = makeARMFromExistingCursors(std::move(cursors)); executor()->shutdown(); ASSERT_EQ(ErrorCodes::ShutdownInProgress, arm->nextEvent().getStatus()); auto killFuture = arm->kill(operationContext()); killFuture.wait(); } TEST_F(AsyncResultsMergerTest, KillAfterTaskExecutorShutdownWithOutstandingBatches) { std::vector cursors; cursors.push_back( makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 1, {}))); auto arm = makeARMFromExistingCursors(std::move(cursors)); // Make a request to the shard that will never get answered. ASSERT_FALSE(arm->ready()); auto readyEvent = unittest::assertGet(arm->nextEvent()); ASSERT_FALSE(arm->ready()); blackHoleNextRequest(); // Executor shuts down before a response is received. executor()->shutdown(); auto killFuture = arm->kill(operationContext()); killFuture.wait(); // Ensure that the executor finishes all of the outstanding callbacks before the ARM is freed. 
executor()->join();
}

// Killing before any batch was requested must issue killCursors for cursor id 1; the ARM is then
// ready but nextReady() returns an error.
TEST_F(AsyncResultsMergerTest, KillNoBatchesRequested) {
    std::vector<RemoteCursor> cursors;
    cursors.push_back(
        makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 1, {})));
    auto arm = makeARMFromExistingCursors(std::move(cursors));

    ASSERT_FALSE(arm->ready());
    auto killFuture = arm->kill(operationContext());
    assertKillCusorsCmdHasCursorId(getNthPendingRequest(0u).cmdObj, 1);

    // Killed cursors are considered ready, but return an error when you try to receive the next
    // doc.
    ASSERT_TRUE(arm->ready());
    ASSERT_NOT_OK(arm->nextReady().getStatus());

    killFuture.wait();
}

// All three remotes answer with cursor id 0 before kill(); afterwards no network request should
// be ready.
TEST_F(AsyncResultsMergerTest, KillAllRemotesExhausted) {
    std::vector<RemoteCursor> cursors;
    cursors.push_back(
        makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 1, {})));
    cursors.push_back(
        makeRemoteCursor(kTestShardIds[1], kTestShardHosts[1], CursorResponse(kTestNss, 2, {})));
    cursors.push_back(
        makeRemoteCursor(kTestShardIds[2], kTestShardHosts[2], CursorResponse(kTestNss, 3, {})));
    auto arm = makeARMFromExistingCursors(std::move(cursors));

    ASSERT_FALSE(arm->ready());
    auto readyEvent = unittest::assertGet(arm->nextEvent());
    ASSERT_FALSE(arm->ready());

    std::vector<CursorResponse> responses;
    std::vector<BSONObj> batch1 = {fromjson("{_id: 1}"), fromjson("{_id: 2}")};
    responses.emplace_back(kTestNss, CursorId(0), batch1);
    std::vector<BSONObj> batch2 = {fromjson("{_id: 3}"), fromjson("{_id: 4}")};
    responses.emplace_back(kTestNss, CursorId(0), batch2);
    std::vector<BSONObj> batch3 = {fromjson("{_id: 3}"), fromjson("{_id: 4}")};
    responses.emplace_back(kTestNss, CursorId(0), batch3);
    scheduleNetworkResponses(std::move(responses));

    auto killFuture = arm->kill(operationContext());

    // ARM shouldn't schedule killCursors on anything since all of the remotes are exhausted.
ASSERT_FALSE(networkHasReadyRequests());

    ASSERT_TRUE(arm->ready());
    ASSERT_NOT_OK(arm->nextReady().getStatus());
    killFuture.wait();
}

// Two remotes answer with cursor id 0 while the third keeps id 123; kill() must send killCursors
// for cursor 123.
TEST_F(AsyncResultsMergerTest, KillNonExhaustedCursorWithoutPendingRequest) {
    std::vector<RemoteCursor> cursors;
    cursors.push_back(
        makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 1, {})));
    cursors.push_back(
        makeRemoteCursor(kTestShardIds[1], kTestShardHosts[1], CursorResponse(kTestNss, 2, {})));
    cursors.push_back(
        makeRemoteCursor(kTestShardIds[2], kTestShardHosts[2], CursorResponse(kTestNss, 123, {})));
    auto arm = makeARMFromExistingCursors(std::move(cursors));

    ASSERT_FALSE(arm->ready());
    auto readyEvent = unittest::assertGet(arm->nextEvent());
    ASSERT_FALSE(arm->ready());

    std::vector<CursorResponse> responses;
    std::vector<BSONObj> batch1 = {fromjson("{_id: 1}"), fromjson("{_id: 2}")};
    responses.emplace_back(kTestNss, CursorId(0), batch1);
    std::vector<BSONObj> batch2 = {fromjson("{_id: 3}"), fromjson("{_id: 4}")};
    responses.emplace_back(kTestNss, CursorId(0), batch2);

    // Cursor 3 is not exhausted.
std::vector batch3 = {fromjson("{_id: 3}"), fromjson("{_id: 4}")}; responses.emplace_back(kTestNss, CursorId(123), batch3); scheduleNetworkResponses(std::move(responses)); auto killFuture = arm->kill(operationContext()); // ARM should schedule killCursors on cursor 123 assertKillCusorsCmdHasCursorId(getNthPendingRequest(0u).cmdObj, 123); ASSERT_TRUE(arm->ready()); ASSERT_NOT_OK(arm->nextReady().getStatus()); killFuture.wait(); } TEST_F(AsyncResultsMergerTest, KillTwoOutstandingBatches) { std::vector cursors; cursors.push_back( makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 1, {}))); cursors.push_back( makeRemoteCursor(kTestShardIds[1], kTestShardHosts[1], CursorResponse(kTestNss, 2, {}))); cursors.push_back( makeRemoteCursor(kTestShardIds[2], kTestShardHosts[2], CursorResponse(kTestNss, 3, {}))); auto arm = makeARMFromExistingCursors(std::move(cursors)); ASSERT_FALSE(arm->ready()); auto readyEvent = unittest::assertGet(arm->nextEvent()); ASSERT_FALSE(arm->ready()); std::vector responses; std::vector batch1 = {fromjson("{_id: 1}"), fromjson("{_id: 2}")}; responses.emplace_back(kTestNss, CursorId(0), batch1); scheduleNetworkResponses(std::move(responses)); // Kill event will only be signalled once the callbacks for the pending batches have run. auto killFuture = arm->kill(operationContext()); // Check that the ARM kills both batches. assertKillCusorsCmdHasCursorId(getNthPendingRequest(0u).cmdObj, 2); assertKillCusorsCmdHasCursorId(getNthPendingRequest(1u).cmdObj, 3); // Run the callbacks which were canceled. runReadyCallbacks(); // Ensure that we properly signal those waiting for more results to be ready. 
executor()->waitForEvent(readyEvent);
    killFuture.wait();
}

// nextEvent() on an ARM that has already been killed must return a non-OK status.
TEST_F(AsyncResultsMergerTest, NextEventErrorsAfterKill) {
    std::vector<RemoteCursor> cursors;
    cursors.push_back(
        makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 1, {})));
    auto arm = makeARMFromExistingCursors(std::move(cursors));

    ASSERT_FALSE(arm->ready());
    auto readyEvent = unittest::assertGet(arm->nextEvent());
    ASSERT_FALSE(arm->ready());

    std::vector<CursorResponse> responses;
    std::vector<BSONObj> batch1 = {fromjson("{_id: 1}"), fromjson("{_id: 2}")};
    responses.emplace_back(kTestNss, CursorId(1), batch1);
    scheduleNetworkResponses(std::move(responses));

    auto killFuture = arm->kill(operationContext());

    // Attempting to schedule more network operations on a killed arm is an error.
    ASSERT_NOT_OK(arm->nextEvent().getStatus());

    killFuture.wait();
}

// kill() is invoked twice on the same ARM and both returned futures are waited on.
TEST_F(AsyncResultsMergerTest, KillCalledTwice) {
    std::vector<RemoteCursor> cursors;
    cursors.push_back(
        makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 1, {})));
    auto arm = makeARMFromExistingCursors(std::move(cursors));

    auto killFuture1 = arm->kill(operationContext());
    auto killFuture2 = arm->kill(operationContext());
    killFuture1.wait();
    killFuture2.wait();
}

// With a tailable find, EOF is expected after every batch while remotesExhausted() stays false.
TEST_F(AsyncResultsMergerTest, TailableBasic) {
    BSONObj findCmd = fromjson("{find: 'testcoll', tailable: true}");
    std::vector<RemoteCursor> cursors;
    cursors.push_back(
        makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 123, {})));
    auto arm = makeARMFromExistingCursors(std::move(cursors), findCmd);

    ASSERT_FALSE(arm->ready());
    auto readyEvent = unittest::assertGet(arm->nextEvent());
    ASSERT_FALSE(arm->ready());

    std::vector<CursorResponse> responses;
    std::vector<BSONObj> batch1 = {fromjson("{_id: 1}"), fromjson("{_id: 2}")};
    responses.emplace_back(kTestNss, CursorId(123), batch1);
    scheduleNetworkResponses(std::move(responses));
    executor()->waitForEvent(readyEvent);

    ASSERT_TRUE(arm->ready());
    ASSERT_BSONOBJ_EQ(fromjson("{_id: 1}"), *unittest::assertGet(arm->nextReady()).getResult());
    ASSERT_TRUE(arm->ready());
ASSERT_BSONOBJ_EQ(fromjson("{_id: 2}"), *unittest::assertGet(arm->nextReady()).getResult()); // In the tailable case, we expect EOF after every batch. ASSERT_TRUE(arm->ready()); ASSERT_TRUE(unittest::assertGet(arm->nextReady()).isEOF()); ASSERT_FALSE(arm->remotesExhausted()); ASSERT_FALSE(arm->ready()); readyEvent = unittest::assertGet(arm->nextEvent()); ASSERT_FALSE(arm->ready()); responses.clear(); std::vector batch2 = {fromjson("{_id: 3}")}; responses.emplace_back(kTestNss, CursorId(123), batch2); scheduleNetworkResponses(std::move(responses)); executor()->waitForEvent(readyEvent); ASSERT_TRUE(arm->ready()); ASSERT_FALSE(arm->remotesExhausted()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 3}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_TRUE(unittest::assertGet(arm->nextReady()).isEOF()); ASSERT_FALSE(arm->remotesExhausted()); auto killFuture = arm->kill(operationContext()); killFuture.wait(); } TEST_F(AsyncResultsMergerTest, TailableEmptyBatch) { BSONObj findCmd = fromjson("{find: 'testcoll', tailable: true}"); std::vector cursors; cursors.push_back( makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 123, {}))); auto arm = makeARMFromExistingCursors(std::move(cursors), findCmd); ASSERT_FALSE(arm->ready()); auto readyEvent = unittest::assertGet(arm->nextEvent()); ASSERT_FALSE(arm->ready()); // Remote responds with an empty batch and a non-zero cursor id. std::vector responses; std::vector batch; responses.emplace_back(kTestNss, CursorId(123), batch); scheduleNetworkResponses(std::move(responses)); executor()->waitForEvent(readyEvent); // After receiving an empty batch, the ARM should return boost::none, but remotes should not be // marked as exhausted. 
ASSERT_TRUE(arm->ready()); ASSERT_TRUE(unittest::assertGet(arm->nextReady()).isEOF()); ASSERT_FALSE(arm->remotesExhausted()); auto killFuture = arm->kill(operationContext()); killFuture.wait(); } TEST_F(AsyncResultsMergerTest, TailableExhaustedCursor) { BSONObj findCmd = fromjson("{find: 'testcoll', tailable: true}"); std::vector cursors; cursors.push_back( makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 123, {}))); auto arm = makeARMFromExistingCursors(std::move(cursors), findCmd); ASSERT_FALSE(arm->ready()); auto readyEvent = unittest::assertGet(arm->nextEvent()); ASSERT_FALSE(arm->ready()); // Remote responds with an empty batch and a zero cursor id. std::vector responses; std::vector batch; responses.emplace_back(kTestNss, CursorId(0), batch); scheduleNetworkResponses(std::move(responses)); executor()->waitForEvent(readyEvent); // Afterwards, the ARM should return boost::none and remote cursors should be marked as // exhausted. ASSERT_TRUE(arm->ready()); ASSERT_TRUE(unittest::assertGet(arm->nextReady()).isEOF()); ASSERT_TRUE(arm->remotesExhausted()); } TEST_F(AsyncResultsMergerTest, GetMoreBatchSizes) { BSONObj findCmd = fromjson("{find: 'testcoll', batchSize: 3}"); std::vector cursors; cursors.push_back( makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 1, {}))); auto arm = makeARMFromExistingCursors(std::move(cursors), findCmd); ASSERT_FALSE(arm->ready()); auto readyEvent = unittest::assertGet(arm->nextEvent()); ASSERT_FALSE(arm->ready()); std::vector responses; std::vector batch1 = {fromjson("{_id: 1}"), fromjson("{_id: 2}")}; responses.emplace_back(kTestNss, CursorId(1), batch1); scheduleNetworkResponses(std::move(responses)); executor()->waitForEvent(readyEvent); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 1}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 2}"), 
*unittest::assertGet(arm->nextReady()).getResult()); ASSERT_FALSE(arm->ready()); responses.clear(); std::vector batch2 = {fromjson("{_id: 3}")}; responses.emplace_back(kTestNss, CursorId(0), batch2); readyEvent = unittest::assertGet(arm->nextEvent()); BSONObj scheduledCmd = getNthPendingRequest(0).cmdObj; auto cmd = GetMoreCommandRequest::parse({"getMore"}, scheduledCmd.addField(BSON("$db" << "anydbname") .firstElement())); ASSERT_EQ(*cmd.getBatchSize(), 1LL); ASSERT_EQ(cmd.getCommandParameter(), 1LL); scheduleNetworkResponses(std::move(responses)); executor()->waitForEvent(readyEvent); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 3}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_TRUE(unittest::assertGet(arm->nextReady()).isEOF()); } TEST_F(AsyncResultsMergerTest, AllowPartialResults) { BSONObj findCmd = fromjson("{find: 'testcoll', allowPartialResults: true}"); std::vector cursors; cursors.push_back( makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 97, {}))); cursors.push_back( makeRemoteCursor(kTestShardIds[1], kTestShardHosts[1], CursorResponse(kTestNss, 98, {}))); cursors.push_back( makeRemoteCursor(kTestShardIds[2], kTestShardHosts[2], CursorResponse(kTestNss, 99, {}))); auto arm = makeARMFromExistingCursors(std::move(cursors), findCmd); ASSERT_FALSE(arm->ready()); auto readyEvent = unittest::assertGet(arm->nextEvent()); ASSERT_FALSE(arm->ready()); // An error occurs with the first host. scheduleErrorResponse({ErrorCodes::AuthenticationFailed, "authentication failed"}); ASSERT_FALSE(arm->ready()); // Instead of propagating the error, we should be willing to return results from the two // remaining shards. 
std::vector responses; std::vector batch1 = {fromjson("{_id: 1}")}; responses.emplace_back(kTestNss, CursorId(98), batch1); std::vector batch2 = {fromjson("{_id: 2}")}; responses.emplace_back(kTestNss, CursorId(99), batch2); scheduleNetworkResponses(std::move(responses)); executor()->waitForEvent(readyEvent); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 1}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 2}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_FALSE(arm->ready()); readyEvent = unittest::assertGet(arm->nextEvent()); ASSERT_FALSE(arm->ready()); // Now the second host becomes unreachable. We should still be willing to return results from // the third shard. scheduleErrorResponse({ErrorCodes::AuthenticationFailed, "authentication failed"}); ASSERT_FALSE(arm->ready()); responses.clear(); std::vector batch3 = {fromjson("{_id: 3}")}; responses.emplace_back(kTestNss, CursorId(99), batch3); scheduleNetworkResponses(std::move(responses)); executor()->waitForEvent(readyEvent); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 3}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_FALSE(arm->ready()); readyEvent = unittest::assertGet(arm->nextEvent()); ASSERT_FALSE(arm->ready()); // Once the last reachable shard indicates that its cursor is closed, we're done. 
responses.clear(); std::vector batch4 = {}; responses.emplace_back(kTestNss, CursorId(0), batch4); scheduleNetworkResponses(std::move(responses)); executor()->waitForEvent(readyEvent); ASSERT_TRUE(arm->ready()); ASSERT_TRUE(unittest::assertGet(arm->nextReady()).isEOF()); } TEST_F(AsyncResultsMergerTest, AllowPartialResultsSingleNode) { BSONObj findCmd = fromjson("{find: 'testcoll', allowPartialResults: true}"); std::vector cursors; cursors.push_back( makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 98, {}))); auto arm = makeARMFromExistingCursors(std::move(cursors), findCmd); ASSERT_FALSE(arm->ready()); auto readyEvent = unittest::assertGet(arm->nextEvent()); ASSERT_FALSE(arm->ready()); std::vector responses; std::vector batch = {fromjson("{_id: 1}"), fromjson("{_id: 2}")}; responses.emplace_back(kTestNss, CursorId(98), batch); scheduleNetworkResponses(std::move(responses)); executor()->waitForEvent(readyEvent); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 1}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 2}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_FALSE(arm->ready()); readyEvent = unittest::assertGet(arm->nextEvent()); ASSERT_FALSE(arm->ready()); // The lone host involved in this query returns an error. This should simply cause us to return // EOF. 
scheduleErrorResponse({ErrorCodes::AuthenticationFailed, "authentication failed"}); ASSERT_TRUE(arm->ready()); ASSERT_TRUE(unittest::assertGet(arm->nextReady()).isEOF()); } TEST_F(AsyncResultsMergerTest, AllowPartialResultsOnRetriableErrorNoRetries) { BSONObj findCmd = fromjson("{find: 'testcoll', allowPartialResults: true}"); std::vector cursors; cursors.push_back( makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 1, {}))); cursors.push_back( makeRemoteCursor(kTestShardIds[2], kTestShardHosts[2], CursorResponse(kTestNss, 2, {}))); auto arm = makeARMFromExistingCursors(std::move(cursors), findCmd); ASSERT_FALSE(arm->ready()); auto readyEvent = unittest::assertGet(arm->nextEvent()); ASSERT_FALSE(arm->ready()); // First host returns single result std::vector responses; std::vector batch = {fromjson("{_id: 1}")}; responses.emplace_back(kTestNss, CursorId(0), batch); scheduleNetworkResponses(std::move(responses)); // From the second host we get a network (retriable) error. scheduleErrorResponse({ErrorCodes::HostUnreachable, "host unreachable"}); executor()->waitForEvent(readyEvent); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 1}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->remotesExhausted()); ASSERT_TRUE(arm->ready()); } TEST_F(AsyncResultsMergerTest, ReturnsErrorOnRetriableError) { BSONObj findCmd = fromjson("{find: 'testcoll', sort: {_id: 1}}"); std::vector cursors; cursors.push_back( makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 1, {}))); cursors.push_back( makeRemoteCursor(kTestShardIds[2], kTestShardHosts[2], CursorResponse(kTestNss, 2, {}))); auto arm = makeARMFromExistingCursors(std::move(cursors), findCmd); ASSERT_FALSE(arm->ready()); auto readyEvent = unittest::assertGet(arm->nextEvent()); ASSERT_FALSE(arm->ready()); // Both hosts return network (retriable) errors. 
scheduleErrorResponse({ErrorCodes::HostUnreachable, "host unreachable"}); scheduleErrorResponse({ErrorCodes::HostUnreachable, "host unreachable"}); executor()->waitForEvent(readyEvent); ASSERT_TRUE(arm->ready()); auto statusWithNext = arm->nextReady(); ASSERT(!statusWithNext.isOK()); ASSERT_EQ(statusWithNext.getStatus().code(), ErrorCodes::HostUnreachable); ASSERT_EQ(statusWithNext.getStatus().reason(), "host unreachable"); // Required to kill the 'arm' on error before destruction. auto killFuture = arm->kill(operationContext()); killFuture.wait(); } TEST_F(AsyncResultsMergerTest, GetMoreRequestIncludesMaxTimeMS) { BSONObj findCmd = fromjson("{find: 'testcoll', tailable: true, awaitData: true}"); std::vector cursors; cursors.push_back( makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 123, {}))); auto arm = makeARMFromExistingCursors(std::move(cursors), findCmd); ASSERT_FALSE(arm->ready()); auto readyEvent = unittest::assertGet(arm->nextEvent()); ASSERT_FALSE(arm->ready()); std::vector responses; std::vector batch1 = {fromjson("{_id: 1}")}; responses.emplace_back(kTestNss, CursorId(123), batch1); scheduleNetworkResponses(std::move(responses)); executor()->waitForEvent(readyEvent); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 1}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_FALSE(arm->ready()); readyEvent = unittest::assertGet(arm->nextEvent()); ASSERT_OK(arm->setAwaitDataTimeout(Milliseconds(789))); // Pending getMore request should already have been scheduled without the maxTimeMS. 
BSONObj expectedCmdObj = BSON("getMore" << CursorId(123) << "collection" << "testcoll"); ASSERT_BSONOBJ_EQ(getNthPendingRequest(0).cmdObj, expectedCmdObj); ASSERT_FALSE(arm->ready()); responses.clear(); std::vector batch2 = {fromjson("{_id: 2}")}; responses.emplace_back(kTestNss, CursorId(123), batch2); scheduleNetworkResponses(std::move(responses)); executor()->waitForEvent(readyEvent); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(fromjson("{_id: 2}"), *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_FALSE(arm->ready()); readyEvent = unittest::assertGet(arm->nextEvent()); // The next getMore request should include the maxTimeMS. expectedCmdObj = BSON("getMore" << CursorId(123) << "collection" << "testcoll" << "maxTimeMS" << 789); ASSERT_BSONOBJ_EQ(getNthPendingRequest(0).cmdObj, expectedCmdObj); // Clean up. responses.clear(); std::vector batch3 = {fromjson("{_id: 3}")}; responses.emplace_back(kTestNss, CursorId(0), batch3); scheduleNetworkResponses(std::move(responses)); } DEATH_TEST_REGEX_F( AsyncResultsMergerTest, SortedTailableInvariantsIfInitialBatchHasNoPostBatchResumeToken, R"#(Invariant failure.*_promisedMinSortKeys.empty || _promisedMinSortKeys.size == _remotes.size)#") { AsyncResultsMergerParams params; params.setNss(kTestNss); UUID uuid = UUID::gen(); std::vector cursors; // Create one cursor whose initial response has a postBatchResumeToken. 
auto pbrtFirstCursor = makePostBatchResumeToken(Timestamp(1, 5)); auto firstDocSortKey = makeResumeToken(Timestamp(1, 4), uuid, BSON("_id" << 1)); auto firstCursorResponse = fromjson( str::stream() << "{_id: {clusterTime: {ts: Timestamp(1, 4)}, uuid: '" << uuid.toString() << "', documentKey: {_id: 1}}, $sortKey: [{_data: '" << firstDocSortKey.firstElement().String() << "'}]}"); cursors.push_back(makeRemoteCursor( kTestShardIds[0], kTestShardHosts[0], CursorResponse( kTestNss, 123, {firstCursorResponse}, boost::none, boost::none, pbrtFirstCursor))); // Create a second cursor whose initial batch has no PBRT. cursors.push_back( makeRemoteCursor(kTestShardIds[1], kTestShardHosts[1], CursorResponse(kTestNss, 456, {}))); params.setRemotes(std::move(cursors)); params.setTailableMode(TailableModeEnum::kTailableAndAwaitData); params.setSort(change_stream_constants::kSortSpec); auto arm = std::make_unique(operationContext(), executor(), std::move(params)); auto readyEvent = unittest::assertGet(arm->nextEvent()); ASSERT_FALSE(arm->ready()); // We should be dead by now. 
MONGO_UNREACHABLE;
}

// Death test: a sorted tailable ARM whose only remote carries an empty (default-constructed)
// postBatchResumeToken is expected to trip the invariant named in the regex below.
DEATH_TEST_REGEX_F(AsyncResultsMergerTest,
                   SortedTailableCursorInvariantsIfOneOrMoreRemotesHasEmptyPostBatchResumeToken,
                   R"#(Invariant failure.*!response.getPostBatchResumeToken->isEmpty)#") {
    AsyncResultsMergerParams params;
    params.setNss(kTestNss);
    UUID uuid = UUID::gen();
    std::vector<RemoteCursor> cursors;

    BSONObj pbrtFirstCursor;
    auto firstDocSortKey = makeResumeToken(Timestamp(1, 4), uuid, BSON("_id" << 1));
    auto firstCursorResponse = fromjson(
        str::stream() << "{_id: {clusterTime: {ts: Timestamp(1, 4)}, uuid: '" << uuid.toString()
                      << "', documentKey: {_id: 1}}, $sortKey: [{_data: '"
                      << firstDocSortKey.firstElement().String() << "'}]}");
    cursors.push_back(makeRemoteCursor(
        kTestShardIds[0],
        kTestShardHosts[0],
        CursorResponse(
            kTestNss, 123, {firstCursorResponse}, boost::none, boost::none, pbrtFirstCursor)));

    params.setRemotes(std::move(cursors));
    params.setTailableMode(TailableModeEnum::kTailableAndAwaitData);
    params.setSort(change_stream_constants::kSortSpec);
    auto arm =
        std::make_unique<AsyncResultsMerger>(operationContext(), executor(), std::move(params));

    auto readyEvent = unittest::assertGet(arm->nextEvent());
    ASSERT_TRUE(arm->ready());

    // We should be dead by now.
MONGO_UNREACHABLE;
}

// The first remote holds a document at Timestamp(1, 4) while the second remote's PBRT is only
// Timestamp(1, 2); the ARM must not report ready.
TEST_F(AsyncResultsMergerTest, SortedTailableCursorNotReadyIfRemoteHasLowerPostBatchResumeToken) {
    AsyncResultsMergerParams params;
    params.setNss(kTestNss);
    UUID uuid = UUID::gen();
    std::vector<RemoteCursor> cursors;

    auto pbrtFirstCursor = makePostBatchResumeToken(Timestamp(1, 5));
    auto firstDocSortKey = makeResumeToken(Timestamp(1, 4), uuid, BSON("_id" << 1));
    // The sort key entry uses the '_data' field name, like every other test in this file, so the
    // not-ready result depends only on the second remote's low PBRT.
    auto firstCursorResponse = fromjson(
        str::stream() << "{_id: {clusterTime: {ts: Timestamp(1, 4)}, uuid: '" << uuid.toString()
                      << "', documentKey: {_id: 1}}, $sortKey: [{_data: '"
                      << firstDocSortKey.firstElement().String() << "'}]}");
    cursors.push_back(makeRemoteCursor(
        kTestShardIds[0],
        kTestShardHosts[0],
        CursorResponse(
            kTestNss, 123, {firstCursorResponse}, boost::none, boost::none, pbrtFirstCursor)));

    auto tooLowPBRT = makePostBatchResumeToken(Timestamp(1, 2));
    cursors.push_back(
        makeRemoteCursor(kTestShardIds[1],
                         kTestShardHosts[1],
                         CursorResponse(kTestNss, 456, {}, boost::none, boost::none, tooLowPBRT)));

    params.setRemotes(std::move(cursors));
    params.setTailableMode(TailableModeEnum::kTailableAndAwaitData);
    params.setSort(change_stream_constants::kSortSpec);
    auto arm =
        std::make_unique<AsyncResultsMerger>(operationContext(), executor(), std::move(params));

    auto readyEvent = unittest::assertGet(arm->nextEvent());
    ASSERT_FALSE(arm->ready());

    // Clean up the cursors.
std::vector responses; responses.emplace_back(kTestNss, CursorId(0), std::vector{}); scheduleNetworkResponses(std::move(responses)); auto killFuture = arm->kill(operationContext()); killFuture.wait(); } TEST_F(AsyncResultsMergerTest, SortedTailableCursorNewShardOrderedAfterExisting) { AsyncResultsMergerParams params; params.setNss(kTestNss); UUID uuid = UUID::gen(); std::vector cursors; cursors.push_back( makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 123, {}))); params.setRemotes(std::move(cursors)); params.setTailableMode(TailableModeEnum::kTailableAndAwaitData); params.setSort(change_stream_constants::kSortSpec); auto arm = std::make_unique(operationContext(), executor(), std::move(params)); auto readyEvent = unittest::assertGet(arm->nextEvent()); ASSERT_FALSE(arm->ready()); // Schedule one response with an oplog timestamp in it. std::vector responses; auto firstDocSortKey = makeResumeToken(Timestamp(1, 4), uuid, BSON("_id" << 1)); auto pbrtFirstCursor = makePostBatchResumeToken(Timestamp(1, 6)); auto firstCursorResponse = fromjson( str::stream() << "{_id: {clusterTime: {ts: Timestamp(1, 4)}, uuid: '" << uuid.toString() << "', documentKey: {_id: 1}}, $sortKey: [{_data: '" << firstDocSortKey.firstElement().String() << "'}]}"); std::vector batch1 = {firstCursorResponse}; auto firstDoc = batch1.front(); responses.emplace_back( kTestNss, CursorId(123), batch1, boost::none, boost::none, pbrtFirstCursor); scheduleNetworkResponses(std::move(responses)); // Should be ready now. ASSERT_TRUE(arm->ready()); // Add the new shard. auto tooLowPBRT = makePostBatchResumeToken(Timestamp(1, 3)); std::vector newCursors; newCursors.push_back( makeRemoteCursor(kTestShardIds[1], kTestShardHosts[1], CursorResponse(kTestNss, 456, {}, boost::none, boost::none, tooLowPBRT))); arm->addNewShardCursors(std::move(newCursors)); // Now shouldn't be ready, our guarantee from the new shard isn't sufficiently advanced. 
ASSERT_FALSE(arm->ready()); readyEvent = unittest::assertGet(arm->nextEvent()); // Schedule another response from the other shard. responses.clear(); auto secondDocSortKey = makeResumeToken(Timestamp(1, 5), uuid, BSON("_id" << 2)); auto pbrtSecondCursor = makePostBatchResumeToken(Timestamp(1, 6)); auto secondCursorResponse = fromjson( str::stream() << "{_id: {clusterTime: {ts: Timestamp(1, 5)}, uuid: '" << uuid.toString() << "', documentKey: {_id: 2}}, $sortKey: [{_data: '" << secondDocSortKey.firstElement().String() << "'}]}"); std::vector batch2 = {secondCursorResponse}; auto secondDoc = batch2.front(); responses.emplace_back( kTestNss, CursorId(456), batch2, boost::none, boost::none, pbrtSecondCursor); scheduleNetworkResponses(std::move(responses)); executor()->waitForEvent(readyEvent); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(firstCursorResponse, *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_TRUE(arm->ready()); ASSERT_BSONOBJ_EQ(secondCursorResponse, *unittest::assertGet(arm->nextReady()).getResult()); ASSERT_FALSE(arm->ready()); readyEvent = unittest::assertGet(arm->nextEvent()); // Clean up the cursors. 
responses.clear();
    std::vector batch3 = {};
    responses.emplace_back(kTestNss, CursorId(0), batch3);
    scheduleNetworkResponses(std::move(responses));
    responses.clear();
    std::vector batch4 = {};
    responses.emplace_back(kTestNss, CursorId(0), batch4);
    scheduleNetworkResponses(std::move(responses));
}

// A shard cursor added after the first shard has already buffered a result returns a document with
// an earlier sort key. The ARM must hand back the new shard's document before the buffered one.
TEST_F(AsyncResultsMergerTest, SortedTailableCursorNewShardOrderedBeforeExisting) {
    AsyncResultsMergerParams params;
    params.setNss(kTestNss);
    UUID uuid = UUID::gen();
    std::vector<RemoteCursor> cursors;
    cursors.push_back(
        makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 123, {})));
    params.setRemotes(std::move(cursors));
    params.setTailableMode(TailableModeEnum::kTailableAndAwaitData);
    params.setSort(change_stream_constants::kSortSpec);
    auto arm =
        std::make_unique<AsyncResultsMerger>(operationContext(), executor(), std::move(params));

    auto readyEvent = unittest::assertGet(arm->nextEvent());

    ASSERT_FALSE(arm->ready());

    // Schedule one response with an oplog timestamp in it.
    std::vector<CursorResponse> responses;
    auto firstDocSortKey = makeResumeToken(Timestamp(1, 4), uuid, BSON("_id" << 1));
    auto pbrtFirstCursor = makePostBatchResumeToken(Timestamp(1, 5));
    auto firstCursorResponse = fromjson(
        str::stream() << "{_id: {clusterTime: {ts: Timestamp(1, 4)}, uuid: '" << uuid.toString()
                      << "', documentKey: {_id: 1}}, $sortKey: [{_data: '"
                      << firstDocSortKey.firstElement().String() << "'}]}");
    std::vector<BSONObj> batch1 = {firstCursorResponse};
    responses.emplace_back(
        kTestNss, CursorId(123), batch1, boost::none, boost::none, pbrtFirstCursor);
    scheduleNetworkResponses(std::move(responses));

    // Should be ready now.
    ASSERT_TRUE(arm->ready());

    // Add the new shard.
    auto tooLowPBRT = makePostBatchResumeToken(Timestamp(1, 3));
    std::vector<RemoteCursor> newCursors;
    newCursors.push_back(
        makeRemoteCursor(kTestShardIds[1],
                         kTestShardHosts[1],
                         CursorResponse(kTestNss, 456, {}, boost::none, boost::none, tooLowPBRT)));
    arm->addNewShardCursors(std::move(newCursors));

    // Now shouldn't be ready, our guarantee from the new shard isn't sufficiently advanced.
    ASSERT_FALSE(arm->ready());
    readyEvent = unittest::assertGet(arm->nextEvent());

    // Schedule another response from the other shard.
    responses.clear();
    auto secondDocSortKey = makeResumeToken(Timestamp(1, 3), uuid, BSON("_id" << 2));
    auto pbrtSecondCursor = makePostBatchResumeToken(Timestamp(1, 5));
    auto secondCursorResponse = fromjson(
        str::stream() << "{_id: {clusterTime: {ts: Timestamp(1, 3)}, uuid: '" << uuid.toString()
                      << "', documentKey: {_id: 2}}, $sortKey: [{_data: '"
                      << secondDocSortKey.firstElement().String() << "'}]}");
    std::vector<BSONObj> batch2 = {secondCursorResponse};
    // The last observed time should still be later than the first shard, so we can get the data
    // from it.
    responses.emplace_back(
        kTestNss, CursorId(456), batch2, boost::none, boost::none, pbrtSecondCursor);
    scheduleNetworkResponses(std::move(responses));
    executor()->waitForEvent(readyEvent);

    // The new shard's document (ts 1,3) sorts before the first shard's document (ts 1,4).
    ASSERT_TRUE(arm->ready());
    ASSERT_BSONOBJ_EQ(secondCursorResponse, *unittest::assertGet(arm->nextReady()).getResult());
    ASSERT_TRUE(arm->ready());
    ASSERT_BSONOBJ_EQ(firstCursorResponse, *unittest::assertGet(arm->nextReady()).getResult());
    ASSERT_FALSE(arm->ready());

    readyEvent = unittest::assertGet(arm->nextEvent());

    // Clean up the cursors.
    responses.clear();
    std::vector<BSONObj> batch3 = {};
    responses.emplace_back(kTestNss, CursorId(0), batch3);
    scheduleNetworkResponses(std::move(responses));
    responses.clear();
    std::vector<BSONObj> batch4 = {};
    responses.emplace_back(kTestNss, CursorId(0), batch4);
    scheduleNetworkResponses(std::move(responses));
}

// With three remotes that only ever return empty batches, getHighWaterMark() must always equal the
// lowest post-batch resume token (PBRT) currently reported by any of the cursors.
TEST_F(AsyncResultsMergerTest, SortedTailableCursorReturnsHighWaterMarkSortKey) {
    AsyncResultsMergerParams params;
    params.setNss(kTestNss);
    std::vector<RemoteCursor> cursors;
    // Create three cursors with empty initial batches. Each batch has a PBRT.
    auto pbrtFirstCursor = makePostBatchResumeToken(Timestamp(1, 5));
    cursors.push_back(makeRemoteCursor(
        kTestShardIds[0],
        kTestShardHosts[0],
        CursorResponse(kTestNss, 123, {}, boost::none, boost::none, pbrtFirstCursor)));
    auto pbrtSecondCursor = makePostBatchResumeToken(Timestamp(1, 1));
    cursors.push_back(makeRemoteCursor(
        kTestShardIds[1],
        kTestShardHosts[1],
        CursorResponse(kTestNss, 456, {}, boost::none, boost::none, pbrtSecondCursor)));
    auto pbrtThirdCursor = makePostBatchResumeToken(Timestamp(1, 4));
    cursors.push_back(makeRemoteCursor(
        kTestShardIds[2],
        kTestShardHosts[2],
        CursorResponse(kTestNss, 789, {}, boost::none, boost::none, pbrtThirdCursor)));
    params.setRemotes(std::move(cursors));
    params.setTailableMode(TailableModeEnum::kTailableAndAwaitData);
    params.setSort(change_stream_constants::kSortSpec);
    auto arm =
        std::make_unique<AsyncResultsMerger>(operationContext(), executor(), std::move(params));

    // We have no results to return, so the ARM is not ready.
    auto readyEvent = unittest::assertGet(arm->nextEvent());
    ASSERT_FALSE(arm->ready());

    // The high water mark should be the second cursor's PBRT, since it is the lowest of the three.
    ASSERT_BSONOBJ_EQ(arm->getHighWaterMark(), pbrtSecondCursor);

    // Advance the PBRT of the second cursor. It should still be the lowest. The fixture expects
    // each cursor to be updated in-order, so we keep the first and third PBRTs constant.
    pbrtSecondCursor = makePostBatchResumeToken(Timestamp(1, 3));
    std::vector<BSONObj> emptyBatch = {};
    scheduleNetworkResponse(
        {kTestNss, CursorId(123), emptyBatch, boost::none, boost::none, pbrtFirstCursor});
    scheduleNetworkResponse(
        {kTestNss, CursorId(456), emptyBatch, boost::none, boost::none, pbrtSecondCursor});
    scheduleNetworkResponse(
        {kTestNss, CursorId(789), emptyBatch, boost::none, boost::none, pbrtThirdCursor});
    ASSERT_BSONOBJ_EQ(arm->getHighWaterMark(), pbrtSecondCursor);
    ASSERT_FALSE(arm->ready());

    // Advance the second cursor again, so that it surpasses the other two. The third cursor becomes
    // the new high water mark.
    pbrtSecondCursor = makePostBatchResumeToken(Timestamp(1, 6));
    scheduleNetworkResponse(
        {kTestNss, CursorId(123), emptyBatch, boost::none, boost::none, pbrtFirstCursor});
    scheduleNetworkResponse(
        {kTestNss, CursorId(456), emptyBatch, boost::none, boost::none, pbrtSecondCursor});
    scheduleNetworkResponse(
        {kTestNss, CursorId(789), emptyBatch, boost::none, boost::none, pbrtThirdCursor});
    ASSERT_BSONOBJ_EQ(arm->getHighWaterMark(), pbrtThirdCursor);
    ASSERT_FALSE(arm->ready());

    // Advance the third cursor such that the first cursor becomes the high water mark.
    pbrtThirdCursor = makePostBatchResumeToken(Timestamp(1, 7));
    scheduleNetworkResponse(
        {kTestNss, CursorId(123), emptyBatch, boost::none, boost::none, pbrtFirstCursor});
    scheduleNetworkResponse(
        {kTestNss, CursorId(456), emptyBatch, boost::none, boost::none, pbrtSecondCursor});
    scheduleNetworkResponse(
        {kTestNss, CursorId(789), emptyBatch, boost::none, boost::none, pbrtThirdCursor});
    ASSERT_BSONOBJ_EQ(arm->getHighWaterMark(), pbrtFirstCursor);
    ASSERT_FALSE(arm->ready());

    // Clean up the cursors.
    std::vector<BSONObj> cleanupBatch = {};
    scheduleNetworkResponse({kTestNss, CursorId(0), cleanupBatch});
    scheduleNetworkResponse({kTestNss, CursorId(0), cleanupBatch});
    scheduleNetworkResponse({kTestNss, CursorId(0), cleanupBatch});
}

// Walks the "config.shards" cursor through each state in which it must NOT provide the high water
// mark (initial batch, PBRT below the already-returned mark, event resume token as PBRT), and then
// through the one state in which it may.
TEST_F(AsyncResultsMergerTest,
       SortedTailableCursorDoesNotAdvanceHighWaterMarkForIneligibleCursor) {
    AsyncResultsMergerParams params;
    params.setNss(kTestNss);
    std::vector<RemoteCursor> cursors;
    // Create three cursors with empty initial batches. Each batch has a PBRT. The third cursor is
    // the $changeStream opened on "config.shards" to monitor for the addition of new shards.
    auto pbrtFirstCursor = makePostBatchResumeToken(Timestamp(1, 5));
    cursors.push_back(makeRemoteCursor(
        kTestShardIds[0],
        kTestShardHosts[0],
        CursorResponse(kTestNss, 123, {}, boost::none, boost::none, pbrtFirstCursor)));
    auto pbrtSecondCursor = makePostBatchResumeToken(Timestamp(1, 3));
    cursors.push_back(makeRemoteCursor(
        kTestShardIds[1],
        kTestShardHosts[1],
        CursorResponse(kTestNss, 456, {}, boost::none, boost::none, pbrtSecondCursor)));
    auto pbrtConfigCursor = makePostBatchResumeToken(Timestamp(1, 1));
    cursors.push_back(makeRemoteCursor(
        kTestShardIds[2],
        kTestShardHosts[2],
        CursorResponse(
            ShardType::ConfigNS, 789, {}, boost::none, boost::none, pbrtConfigCursor)));
    params.setRemotes(std::move(cursors));
    params.setTailableMode(TailableModeEnum::kTailableAndAwaitData);
    params.setSort(change_stream_constants::kSortSpec);
    auto arm =
        std::make_unique<AsyncResultsMerger>(operationContext(), executor(), std::move(params));

    // We have no results to return, so the ARM is not ready.
    auto readyEvent = unittest::assertGet(arm->nextEvent());
    ASSERT_FALSE(arm->ready());

    // For a change stream cursor on "config.shards", the first batch is not eligible to provide the
    // HWM. Despite the fact that 'pbrtConfigCursor' has the lowest PBRT, the ARM returns the PBRT
    // of 'pbrtSecondCursor' as the current high water mark. This guards against the possibility
    // that the user requests a start time in the future. The "config.shards" cursor must start
    // monitoring for shards at the current point in time, and so its initial PBRT will be lower
    // than that of the shards. We do not wish to return a high water mark to the client that is
    // earlier than the start time they specified in their request.
    auto initialHighWaterMark = arm->getHighWaterMark();
    ASSERT_BSONOBJ_EQ(initialHighWaterMark, pbrtSecondCursor);

    // Advance the PBRT of the 'pbrtConfigCursor'. It is still the lowest, but is ineligible to
    // provide the high water mark because it is still lower than the high water mark that was
    // already returned. As above, this guards against the possibility that the user requested a
    // stream with a start point at an arbitrary point in the future.
    pbrtConfigCursor = makePostBatchResumeToken(Timestamp(1, 2));
    scheduleNetworkResponse(
        {kTestNss, CursorId(123), {}, boost::none, boost::none, pbrtFirstCursor});
    scheduleNetworkResponse(
        {kTestNss, CursorId(456), {}, boost::none, boost::none, pbrtSecondCursor});
    scheduleNetworkResponse(
        {ShardType::ConfigNS, CursorId(789), {}, boost::none, boost::none, pbrtConfigCursor});

    // The high water mark has not advanced from its previous value.
    ASSERT_BSONOBJ_EQ(arm->getHighWaterMark(), initialHighWaterMark);
    ASSERT_FALSE(arm->ready());

    // If the "config.shards" cursor returns a result, this document does not advance the HWM. We
    // consume this event internally but do not return it to the client, and its resume token is not
    // actually resumable. We therefore do not want to expose it to the client via the PBRT.
    const auto configUUID = UUID::gen();
    auto configEvent = fromjson("{_id: 'shard_add_event'}");
    pbrtFirstCursor = makePostBatchResumeToken(Timestamp(1, 15));
    pbrtSecondCursor = makePostBatchResumeToken(Timestamp(1, 13));
    pbrtConfigCursor = makeResumeToken(Timestamp(1, 11), configUUID, configEvent);
    configEvent =
        configEvent.addField(BSON("$sortKey" << BSON_ARRAY(pbrtConfigCursor)).firstElement());
    scheduleNetworkResponse(
        {kTestNss, CursorId(123), {}, boost::none, boost::none, pbrtFirstCursor});
    scheduleNetworkResponse(
        {kTestNss, CursorId(456), {}, boost::none, boost::none, pbrtSecondCursor});
    scheduleNetworkResponse({ShardType::ConfigNS,
                             CursorId(789),
                             {configEvent},
                             boost::none,
                             boost::none,
                             pbrtConfigCursor});

    // The config cursor has a lower sort key than the other shards, so we can retrieve the event.
    ASSERT_TRUE(arm->ready());
    ASSERT_BSONOBJ_EQ(configEvent, *unittest::assertGet(arm->nextReady()).getResult());
    readyEvent = unittest::assertGet(arm->nextEvent());

    // Reading the config cursor event document does not advance the high water mark.
    ASSERT_BSONOBJ_EQ(arm->getHighWaterMark(), initialHighWaterMark);
    ASSERT_FALSE(arm->ready());

    // If the next config batch is empty but the PBRT is still the resume token of the addShard
    // event, it does not advance the ARM's high water mark sort key.
    scheduleNetworkResponse(
        {kTestNss, CursorId(123), {}, boost::none, boost::none, pbrtFirstCursor});
    scheduleNetworkResponse(
        {kTestNss, CursorId(456), {}, boost::none, boost::none, pbrtSecondCursor});
    scheduleNetworkResponse(
        {ShardType::ConfigNS, CursorId(789), {}, boost::none, boost::none, pbrtConfigCursor});
    ASSERT_BSONOBJ_EQ(arm->getHighWaterMark(), initialHighWaterMark);
    ASSERT_FALSE(arm->ready());

    // If none of the above criteria obtain, then the "config.shards" cursor is eligible to advance
    // the ARM's high water mark. The only reason we allow the config.shards cursor to participate
    // in advancing of the high water mark at all is so that we cannot end up in a situation where
    // the config cursor is always the lowest and the high water mark can therefore never advance.
    pbrtConfigCursor = makePostBatchResumeToken(Timestamp(1, 12));
    scheduleNetworkResponse(
        {kTestNss, CursorId(123), {}, boost::none, boost::none, pbrtFirstCursor});
    scheduleNetworkResponse(
        {kTestNss, CursorId(456), {}, boost::none, boost::none, pbrtSecondCursor});
    scheduleNetworkResponse(
        {ShardType::ConfigNS, CursorId(789), {}, boost::none, boost::none, pbrtConfigCursor});
    ASSERT_BSONOBJ_GT(arm->getHighWaterMark(), initialHighWaterMark);
    ASSERT_BSONOBJ_EQ(arm->getHighWaterMark(), pbrtConfigCursor);
    ASSERT_FALSE(arm->ready());

    // Clean up the cursors.
    std::vector<BSONObj> cleanupBatch = {};
    scheduleNetworkResponse({kTestNss, CursorId(0), cleanupBatch});
    scheduleNetworkResponse({kTestNss, CursorId(0), cleanupBatch});
    scheduleNetworkResponse({kTestNss, CursorId(0), cleanupBatch});
}

// setAwaitDataTimeout() must be rejected when the find command is not tailable.
TEST_F(AsyncResultsMergerTest, GetMoreRequestWithoutTailableCantHaveMaxTime) {
    BSONObj findCmd = fromjson("{find: 'testcoll'}");
    std::vector<RemoteCursor> cursors;
    cursors.push_back(
        makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 123, {})));
    auto arm = makeARMFromExistingCursors(std::move(cursors), findCmd);
    ASSERT_NOT_OK(arm->setAwaitDataTimeout(Milliseconds(789)));
    auto killFuture = arm->kill(operationContext());
    killFuture.wait();
}

// setAwaitDataTimeout() must be rejected when the find command is tailable but not awaitData.
TEST_F(AsyncResultsMergerTest, GetMoreRequestWithoutAwaitDataCantHaveMaxTime) {
    BSONObj findCmd = fromjson("{find: 'testcoll', tailable: true}");
    std::vector<RemoteCursor> cursors;
    cursors.push_back(
        makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 123, {})));
    auto arm = makeARMFromExistingCursors(std::move(cursors), findCmd);
    ASSERT_NOT_OK(arm->setAwaitDataTimeout(Milliseconds(789)));
    auto killFuture = arm->kill(operationContext());
    killFuture.wait();
}

// An error delivered by the shard after ready() returned false must surface from the following
// nextEvent() call.
TEST_F(AsyncResultsMergerTest, ShardCanErrorInBetweenReadyAndNextEvent) {
    BSONObj findCmd = fromjson("{find: 'testcoll', tailable: true}");
    std::vector<RemoteCursor> cursors;
    cursors.push_back(
        makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 123, {})));
    auto arm = makeARMFromExistingCursors(std::move(cursors), findCmd);

    ASSERT_FALSE(arm->ready());
    auto readyEvent = unittest::assertGet(arm->nextEvent());
    scheduleErrorResponse({ErrorCodes::BadValue, "bad thing happened"});

    ASSERT_EQ(ErrorCodes::BadValue, arm->nextEvent().getStatus());

    // Required to kill the 'arm' on error before destruction.
    auto killFuture = arm->kill(operationContext());
    killFuture.wait();
}

// Killing the ARM while a getMore is outstanding must schedule killCursors right away rather than
// waiting for the outstanding request to complete.
TEST_F(AsyncResultsMergerTest, KillShouldNotWaitForRemoteCommandsBeforeSchedulingKillCursors) {
    std::vector<RemoteCursor> cursors;
    cursors.push_back(
        makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 1, {})));
    auto arm = makeARMFromExistingCursors(std::move(cursors));

    // Before any requests are scheduled, ARM is not ready to return results.
    ASSERT_FALSE(arm->ready());
    ASSERT_FALSE(arm->remotesExhausted());

    // Schedule requests.
    auto readyEvent = unittest::assertGet(arm->nextEvent());

    // Before any responses are delivered, ARM is not ready to return results.
    ASSERT_FALSE(arm->ready());
    ASSERT_FALSE(arm->remotesExhausted());

    // Kill the ARM while a batch is still outstanding. The callback for the outstanding batch
    // should be canceled.
    auto killFuture = arm->kill(operationContext());

    // Check that the ARM will run killCursors.
    assertKillCusorsCmdHasCursorId(getNthPendingRequest(0u).cmdObj, 1);

    // Let the callback run now that it's been canceled.
    runReadyCallbacks();

    executor()->waitForEvent(readyEvent);
    killFuture.wait();
}

// With no session information on the OperationContext, the getMore carries neither field.
TEST_F(AsyncResultsMergerTest, GetMoresShouldNotIncludeLSIDOrTxnNumberIfNoneSpecified) {
    std::vector<RemoteCursor> cursors;
    cursors.emplace_back(
        makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 1, {})));
    auto arm = makeARMFromExistingCursors(std::move(cursors));

    // There should be no lsid or txnNumber in the scheduled getMore.
    ASSERT_OK(arm->nextEvent().getStatus());
    onCommand([&](const auto& request) {
        ASSERT(request.cmdObj["getMore"]);

        ASSERT(request.cmdObj["lsid"].eoo());
        ASSERT(request.cmdObj["txnNumber"].eoo());

        return CursorResponse(kTestNss, 0LL, {BSON("x" << 1)})
            .toBSON(CursorResponse::ResponseType::SubsequentResponse);
    });
}

// With only an lsid set on the OperationContext, every getMore carries the lsid and no txnNumber.
TEST_F(AsyncResultsMergerTest, GetMoresShouldIncludeLSIDIfSpecified) {
    auto lsid = makeLogicalSessionIdForTest();
    operationContext()->setLogicalSessionId(lsid);

    std::vector<RemoteCursor> cursors;
    cursors.emplace_back(
        makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 1, {})));
    auto arm = makeARMFromExistingCursors(std::move(cursors));

    // There should be an lsid and no txnNumber in the scheduled getMore.
    ASSERT_OK(arm->nextEvent().getStatus());
    onCommand([&](const auto& request) {
        ASSERT(request.cmdObj["getMore"]);

        ASSERT_EQ(parseSessionIdFromCmd(request.cmdObj), lsid);
        ASSERT(request.cmdObj["txnNumber"].eoo());

        return CursorResponse(kTestNss, 1LL, {BSON("x" << 1)})
            .toBSON(CursorResponse::ResponseType::SubsequentResponse);
    });

    // Subsequent requests still pass the lsid.
    ASSERT(arm->ready());
    ASSERT_OK(arm->nextReady().getStatus());
    ASSERT_FALSE(arm->ready());

    ASSERT_OK(arm->nextEvent().getStatus());
    onCommand([&](const auto& request) {
        ASSERT(request.cmdObj["getMore"]);

        ASSERT_EQ(parseSessionIdFromCmd(request.cmdObj), lsid);
        ASSERT(request.cmdObj["txnNumber"].eoo());

        return CursorResponse(kTestNss, 0LL, {BSON("x" << 1)})
            .toBSON(CursorResponse::ResponseType::SubsequentResponse);
    });
}

// With both an lsid and a txnNumber set on the OperationContext, every getMore carries both.
TEST_F(AsyncResultsMergerTest, GetMoresShouldIncludeLSIDAndTxnNumIfSpecified) {
    auto lsid = makeLogicalSessionIdForTest();
    operationContext()->setLogicalSessionId(lsid);

    const TxnNumber txnNumber = 5;
    operationContext()->setTxnNumber(txnNumber);

    std::vector<RemoteCursor> cursors;
    cursors.emplace_back(
        makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 1, {})));
    auto arm = makeARMFromExistingCursors(std::move(cursors));

    // The first scheduled getMore should pass the txnNumber the ARM was constructed with.
    ASSERT_OK(arm->nextEvent().getStatus());
    onCommand([&](const auto& request) {
        ASSERT(request.cmdObj["getMore"]);

        ASSERT_EQ(parseSessionIdFromCmd(request.cmdObj), lsid);
        ASSERT_EQ(request.cmdObj["txnNumber"].numberLong(), txnNumber);

        return CursorResponse(kTestNss, 1LL, {BSON("x" << 1)})
            .toBSON(CursorResponse::ResponseType::SubsequentResponse);
    });

    // Consume the buffered result; afterwards the ARM is no longer ready.
    ASSERT(arm->ready());
    ASSERT_OK(arm->nextReady().getStatus());
    ASSERT_FALSE(arm->ready());

    // Subsequent getMore requests should include txnNumber.
    ASSERT_OK(arm->nextEvent().getStatus());
    onCommand([&](const auto& request) {
        ASSERT(request.cmdObj["getMore"]);

        ASSERT_EQ(parseSessionIdFromCmd(request.cmdObj), lsid);
        ASSERT_EQ(request.cmdObj["txnNumber"].numberLong(), txnNumber);

        return CursorResponse(kTestNss, 0LL, {BSON("x" << 1)})
            .toBSON(CursorResponse::ResponseType::SubsequentResponse);
    });
}

// Supplying a txnNumber without a session id in the params is expected to trip an invariant in the
// ARM constructor.
DEATH_TEST_REGEX_F(AsyncResultsMergerTest,
                   ConstructingARMWithTxnNumAndNoLSIDShouldCrash,
                   R"#(Invariant failure.*params.getSessionId)#") {
    AsyncResultsMergerParams params;

    OperationSessionInfoFromClient sessionInfo;
    sessionInfo.setTxnNumber(5);
    params.setOperationSessionInfo(sessionInfo);

    // This should trigger an invariant.
    ASSERT_FALSE(
        std::make_unique<AsyncResultsMerger>(operationContext(), executor(), std::move(params)));
}

// Explicitly calling scheduleGetMores() while detached from the OperationContext must abort.
DEATH_TEST_F(AsyncResultsMergerTest,
             ShouldFailIfAskedToPerformGetMoresWithoutAnOpCtx,
             "Cannot schedule a getMore without an OperationContext") {
    BSONObj findCmd = fromjson("{find: 'testcoll', tailable: true, awaitData: true}");
    std::vector<RemoteCursor> cursors;
    cursors.push_back(
        makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 123, {})));
    auto arm = makeARMFromExistingCursors(std::move(cursors), findCmd);

    ASSERT_FALSE(arm->ready());
    arm->detachFromOperationContext();
    arm->scheduleGetMores().ignore();  // Should crash.
}

// A response that arrives while the ARM is detached must not cause a follow-up getMore to be
// scheduled automatically; the getMore goes out only after reattaching and asking for it.
TEST_F(AsyncResultsMergerTest, ShouldNotScheduleGetMoresWithoutAnOperationContext) {
    BSONObj findCmd = fromjson("{find: 'testcoll', tailable: true, awaitData: true}");
    std::vector<RemoteCursor> cursors;
    cursors.push_back(
        makeRemoteCursor(kTestShardIds[0], kTestShardHosts[0], CursorResponse(kTestNss, 123, {})));
    auto arm = makeARMFromExistingCursors(std::move(cursors), findCmd);

    ASSERT_FALSE(arm->ready());
    auto readyEvent = unittest::assertGet(arm->nextEvent());
    ASSERT_FALSE(arm->ready());

    // While detached from the OperationContext, schedule an empty batch response. Because the
    // response is empty and this is a tailable cursor, the ARM will need to run another getMore on
    // that host, but it should not schedule this without a non-null OperationContext.
    arm->detachFromOperationContext();
    {
        std::vector<CursorResponse> responses;
        std::vector<BSONObj> emptyBatch;
        responses.emplace_back(kTestNss, CursorId(123), emptyBatch);
        scheduleNetworkResponses(std::move(responses));
    }

    ASSERT_FALSE(arm->ready());
    ASSERT_FALSE(networkHasReadyRequests());  // Tests that we haven't asked for the next batch yet.

    // After manually requesting the next getMore, the ARM should be ready.
    arm->reattachToOperationContext(operationContext());
    ASSERT_OK(arm->scheduleGetMores());

    // Schedule the next getMore response.
    {
        std::vector<CursorResponse> responses;
        std::vector<BSONObj> nonEmptyBatch = {fromjson("{_id: 1}")};
        responses.emplace_back(kTestNss, CursorId(123), nonEmptyBatch);
        scheduleNetworkResponses(std::move(responses));
    }

    ASSERT_TRUE(arm->ready());
    ASSERT_FALSE(arm->remotesExhausted());
    ASSERT_BSONOBJ_EQ(fromjson("{_id: 1}"), *unittest::assertGet(arm->nextReady()).getResult());
    ASSERT_FALSE(arm->ready());
    ASSERT_FALSE(arm->remotesExhausted());

    auto killFuture = arm->kill(operationContext());
    killFuture.wait();
}

}  // namespace
}  // namespace mongo