author    | Charlie Swanson <charlie.swanson@mongodb.com> | 2018-08-01 08:33:20 -0400
committer | Charlie Swanson <charlie.swanson@mongodb.com> | 2018-08-24 09:42:50 -0400
commit    | 7987c50c9702bf2280ca4f902499f58f98448241 (patch)
tree      | 6fda98cf2e2fcbb45fde0f4c2f693902c14f0335 /src/mongo
parent    | c8f5485a7c5455b5487990113597f935d1df1ddf (diff)
download  | mongo-7987c50c9702bf2280ca4f902499f58f98448241.tar.gz
SERVER-35905 Add logic to detect when $out is eligible for an exchange
Diffstat (limited to 'src/mongo')
26 files changed, 1725 insertions, 106 deletions
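The heart of the patch is a backwards walk over the pipeline: each stage is asked whether a set of paths survives it and, if so, what each path was called when it entered the stage. The following self-contained sketch illustrates that walk. None of it is code from the commit: std::function and std::map stand in for the DocumentSource hierarchy and StringMap, and the free function mirrors the new Pipeline::renamedPaths() in the diff below.

    #include <functional>
    #include <iostream>
    #include <map>
    #include <optional>
    #include <set>
    #include <string>
    #include <vector>

    // One "stage": given paths named as they appear *after* the stage, report
    // what each path was called *before* the stage, or nullopt if the stage
    // modifies any of them. This mirrors DocumentSource::renamedPaths() below.
    using Stage = std::function<std::optional<std::map<std::string, std::string>>(
        const std::set<std::string>&)>;

    // Mirrors Pipeline::renamedPaths(): walk the stages from last to first,
    // threading each path's current spelling backwards through the renames.
    std::optional<std::map<std::string, std::string>> renamedPaths(
        const std::vector<Stage>& stages, std::set<std::string> pathsOfInterest) {
        // Maps end-of-pipeline name to the name at the current point of the walk.
        std::map<std::string, std::string> result;
        for (const auto& path : pathsOfInterest) {
            result[path] = path;
        }
        for (auto it = stages.rbegin(); it != stages.rend(); ++it) {
            auto renamed = (*it)(pathsOfInterest);
            if (!renamed) {
                return std::nullopt;  // Some path of interest was modified.
            }
            pathsOfInterest.clear();
            for (auto& [endName, current] : result) {
                current = (*renamed)[current];
                pathsOfInterest.insert(current);
            }
        }
        return result;
    }

    int main() {
        // Behaves like {$addFields: {b: "$a"}}: after this stage, "b" holds what
        // "a" held before it; all other paths are untouched. Compare the
        // RenamesAToB test helpers in the diff below.
        Stage renamesAToB = [](const std::set<std::string>& paths)
            -> std::optional<std::map<std::string, std::string>> {
            std::map<std::string, std::string> out;
            for (const auto& path : paths) {
                out[path] = (path == "b") ? "a" : path;
            }
            return out;
        };
        // Prints "b -> a" and "c.d -> c.d", matching the unit tests below.
        if (auto renames = renamedPaths({renamesAToB}, {"b", "c.d"})) {
            for (const auto& [endName, startName] : *renames) {
                std::cout << endName << " -> " << startName << "\n";
            }
        }
    }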
diff --git a/src/mongo/db/pipeline/document_source.cpp b/src/mongo/db/pipeline/document_source.cpp index d51ad84ab67..32edc1704d5 100644 --- a/src/mongo/db/pipeline/document_source.cpp +++ b/src/mongo/db/pipeline/document_source.cpp @@ -1,30 +1,30 @@ /** -* Copyright (C) 2011 10gen Inc. -* -* This program is free software: you can redistribute it and/or modify -* it under the terms of the GNU Affero General Public License, version 3, -* as published by the Free Software Foundation. -* -* This program is distributed in the hope that it will be useful, -* but WITHOUT ANY WARRANTY; without even the implied warranty of -* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the -* GNU Affero General Public License for more details. -* -* You should have received a copy of the GNU Affero General Public License -* along with this program. If not, see <http://www.gnu.org/licenses/>. -* -* As a special exception, the copyright holders give permission to link the -* code of portions of this program with the OpenSSL library under certain -* conditions as described in each individual source file and distribute -* linked combinations including the program with the OpenSSL library. You -* must comply with the GNU Affero General Public License in all respects for -* all of the code used other than as permitted herein. If you modify file(s) -* with this exception, you may extend this exception to your version of the -* file(s), but you are not obligated to do so. If you do not wish to do so, -* delete this exception statement from your version. If you delete this -* exception statement from all source files in the program, then also delete -* it in the license file. -*/ + * Copyright (C) 2011 10gen Inc. + * + * This program is free software: you can redistribute it and/or modify + * it under the terms of the GNU Affero General Public License, version 3, + * as published by the Free Software Foundation. + * + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU Affero General Public License for more details. + * + * You should have received a copy of the GNU Affero General Public License + * along with this program. If not, see <http://www.gnu.org/licenses/>. + * + * As a special exception, the copyright holders give permission to link the + * code of portions of this program with the OpenSSL library under certain + * conditions as described in each individual source file and distribute + * linked combinations including the program with the OpenSSL library. You + * must comply with the GNU Affero General Public License in all respects for + * all of the code used other than as permitted herein. If you modify file(s) + * with this exception, you may extend this exception to your version of the + * file(s), but you are not obligated to do so. If you do not wish to do so, + * delete this exception statement from your version. If you delete this + * exception statement from all source files in the program, then also delete + * it in the license file. + */ #include "mongo/platform/basic.h" @@ -160,6 +160,52 @@ splitMatchByModifiedFields(const boost::intrusive_ptr<DocumentSourceMatch>& matc return match->splitSourceBy(modifiedPaths, modifiedPathsRet.renames); } +/** + * If 'pathOfInterest' or some path prefix of 'pathOfInterest' is renamed, returns the new name for + * 'pathOfInterest', otherwise returns boost::none. 
+ * For example, if 'renamedPaths' is {"c.d", "c"}, and 'pathOfInterest' is "c.d.f", returns "c.f". + */ +boost::optional<std::string> findNewName(const StringMap<std::string>& renamedPaths, + std::string pathOfInterest) { + FieldPath fullPathOfInterest(pathOfInterest); + StringBuilder toLookup; + std::size_t pathIndex = 0; + while (pathIndex < fullPathOfInterest.getPathLength()) { + if (pathIndex != 0) { + toLookup << "."; + } + toLookup << fullPathOfInterest.getFieldName(pathIndex++); + + auto it = renamedPaths.find(toLookup.stringData()); + if (it != renamedPaths.end()) { + const auto& newPathOfPrefix = it->second; + // We found a rename! Note this might be a rename of the prefix of the path, so we have + // to add back on the suffix that was unchanged. + StringBuilder renamedPath; + renamedPath << newPathOfPrefix; + while (pathIndex < fullPathOfInterest.getPathLength()) { + renamedPath << "." << fullPathOfInterest.getFieldName(pathIndex++); + } + return {renamedPath.str()}; + } + } + return boost::none; +} + +StringMap<std::string> computeNewNamesAssumingAnyPathsNotRenamedAreUnmodified( + const StringMap<std::string>& renamedPaths, const std::set<std::string>& pathsOfInterest) { + StringMap<std::string> renameOut; + for (auto&& ofInterest : pathsOfInterest) { + if (auto newName = findNewName(renamedPaths, ofInterest)) { + renameOut[ofInterest] = *newName; + } else { + // This path was not renamed, assume it was unchanged and map it to itself. + renameOut[ofInterest] = ofInterest; + } + } + return renameOut; +} + } // namespace Pipeline::SourceContainer::iterator DocumentSource::optimizeAt( @@ -202,6 +248,53 @@ Pipeline::SourceContainer::iterator DocumentSource::optimizeAt( return doOptimizeAt(itr, container); } +boost::optional<StringMap<std::string>> DocumentSource::renamedPaths( + const std::set<std::string>& pathsOfInterest) const { + auto modifiedPathsRet = this->getModifiedPaths(); + switch (modifiedPathsRet.type) { + case DocumentSource::GetModPathsReturn::Type::kNotSupported: + case DocumentSource::GetModPathsReturn::Type::kAllPaths: + return boost::none; + case DocumentSource::GetModPathsReturn::Type::kFiniteSet: { + for (auto&& modified : modifiedPathsRet.paths) { + for (auto&& ofInterest : pathsOfInterest) { + // Any overlap of the path means the path of interest is not preserved. For + // example, if the path of interest is "a.b", then a modified path of "a", + // "a.b", or "a.b.c" would all signal that "a.b" is not preserved. + if (ofInterest == modified || + expression::isPathPrefixOf(ofInterest, modified) || + expression::isPathPrefixOf(modified, ofInterest)) { + // This stage modifies at least one of the fields which the caller is + // interested in, bail out. + return boost::none; + } + } + } + + // None of the paths of interest were modified, construct the result map, mapping + // the names after this stage to the names before this stage. + return computeNewNamesAssumingAnyPathsNotRenamedAreUnmodified(modifiedPathsRet.renames, + pathsOfInterest); + } + case DocumentSource::GetModPathsReturn::Type::kAllExcept: { + auto preservedPaths = modifiedPathsRet.paths; + for (auto&& rename : modifiedPathsRet.renames) { + // For the purposes of checking which paths are modified, consider renames to + // preserve the path. We'll circle back later to figure out the new name if + // appropriate. 
+ preservedPaths.insert(rename.first); + } + auto modifiedPaths = extractModifiedDependencies(pathsOfInterest, preservedPaths); + if (modifiedPaths.empty()) { + return computeNewNamesAssumingAnyPathsNotRenamedAreUnmodified( + modifiedPathsRet.renames, pathsOfInterest); + } + return boost::none; + } + } + MONGO_UNREACHABLE; +} + void DocumentSource::serializeToArray(vector<Value>& array, boost::optional<ExplainOptions::Verbosity> explain) const { Value entry = serialize(explain); @@ -258,4 +351,4 @@ BSONObjSet DocumentSource::truncateSortSet(const BSONObjSet& sorts, return out; } -} +} // namespace mongo diff --git a/src/mongo/db/pipeline/document_source.h b/src/mongo/db/pipeline/document_source.h index 682b03b76e1..e9bf60dba55 100644 --- a/src/mongo/db/pipeline/document_source.h +++ b/src/mongo/db/pipeline/document_source.h @@ -628,6 +628,14 @@ public: } /** + * Given 'currentNames' which describes a set of paths which the caller is interested in, + * returns boost::none if any of those paths are modified by this stage, or a mapping from + * their old name to their new name if they are preserved but possibly renamed by this stage. + */ + boost::optional<StringMap<std::string>> renamedPaths( + const std::set<std::string>& currentNames) const; + + /** * Get the dependencies this operation needs to do its job. If overridden, subclasses must add * all paths needed to apply their transformation to 'deps->fields', and call * 'deps->setNeedsMetadata()' to indicate what metadata (e.g. text score), if any, is required. @@ -731,6 +739,16 @@ public: */ virtual MergingLogic mergingLogic() = 0; + /** + * Returns true if it would be correct to execute this stage in parallel across the shards in + * cases where the final stage is an $out. For example, a $group stage which is just merging the + * groups from the shards can be run in parallel since it will preserve the shard key. + */ + virtual bool canRunInParallelBeforeOut( + const std::set<std::string>& nameOfShardKeyFieldsUponEntryToStage) const { + return false; + } + protected: // It is invalid to delete through a NeedsMergerDocumentSource-typed pointer. virtual ~NeedsMergerDocumentSource() {} diff --git a/src/mongo/db/pipeline/document_source_group.cpp b/src/mongo/db/pipeline/document_source_group.cpp index 1563c6ba14b..de3dcd084ec 100644 --- a/src/mongo/db/pipeline/document_source_group.cpp +++ b/src/mongo/db/pipeline/document_source_group.cpp @@ -1,30 +1,30 @@ /** -* Copyright (C) 2011 10gen Inc. -* -* This program is free software: you can redistribute it and/or modify -* it under the terms of the GNU Affero General Public License, version 3, -* as published by the Free Software Foundation. -* -* This program is distributed in the hope that it will be useful, -* but WITHOUT ANY WARRANTY; without even the implied warranty of -* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the -* GNU Affero General Public License for more details. -* -* You should have received a copy of the GNU Affero General Public License -* along with this program. If not, see <http://www.gnu.org/licenses/>. -* -* As a special exception, the copyright holders give permission to link the -* code of portions of this program with the OpenSSL library under certain -* conditions as described in each individual source file and distribute -* linked combinations including the program with the OpenSSL library. You -* must comply with the GNU Affero General Public License in all respects for -* all of the code used other than as permitted herein. 
If you modify file(s) -* with this exception, you may extend this exception to your version of the -* file(s), but you are not obligated to do so. If you do not wish to do so, -* delete this exception statement from your version. If you delete this -* exception statement from all source files in the program, then also delete -* it in the license file. -*/ + * Copyright (C) 2011 10gen Inc. + * + * This program is free software: you can redistribute it and/or modify + * it under the terms of the GNU Affero General Public License, version 3, + * as published by the Free Software Foundation. + * + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU Affero General Public License for more details. + * + * You should have received a copy of the GNU Affero General Public License + * along with this program. If not, see <http://www.gnu.org/licenses/>. + * + * As a special exception, the copyright holders give permission to link the + * code of portions of this program with the OpenSSL library under certain + * conditions as described in each individual source file and distribute + * linked combinations including the program with the OpenSSL library. You + * must comply with the GNU Affero General Public License in all respects for + * all of the code used other than as permitted herein. If you modify file(s) + * with this exception, you may extend this exception to your version of the + * file(s), but you are not obligated to do so. If you do not wish to do so, + * delete this exception statement from your version. If you delete this + * exception statement from all source files in the program, then also delete + * it in the license file. + */ #include "mongo/platform/basic.h" @@ -43,8 +43,8 @@ namespace mongo { using boost::intrusive_ptr; -using std::shared_ptr; using std::pair; +using std::shared_ptr; using std::vector; REGISTER_DOCUMENT_SOURCE(group, @@ -241,6 +241,25 @@ DepsTracker::State DocumentSourceGroup::getDependencies(DepsTracker* deps) const return DepsTracker::State::EXHAUSTIVE_ALL; } +DocumentSource::GetModPathsReturn DocumentSourceGroup::getModifiedPaths() const { + // We preserve none of the fields, but any fields referenced as part of the group key are + // logically just renamed. + StringMap<std::string> renames; + for (std::size_t i = 0; i < _idExpressions.size(); ++i) { + auto idExp = _idExpressions[i]; + auto pathToPutResultOfExpression = + _idFieldNames.empty() ? "_id" : "_id." + _idFieldNames[i]; + auto computedPaths = idExp->getComputedPaths(pathToPutResultOfExpression); + for (auto&& rename : computedPaths.renames) { + renames[rename.first] = rename.second; + } + } + + return {DocumentSource::GetModPathsReturn::Type::kAllExcept, + std::set<std::string>{}, // No fields are preserved. 
+ std::move(renames)}; +} + intrusive_ptr<DocumentSourceGroup> DocumentSourceGroup::create( const intrusive_ptr<ExpressionContext>& pExpCtx, const boost::intrusive_ptr<Expression>& groupByExpression, @@ -860,6 +879,42 @@ NeedsMergerDocumentSource::MergingLogic DocumentSourceGroup::mergingLogic() { return {mergingGroup}; } + +bool DocumentSourceGroup::pathIncludedInGroupKeys(const std::string& dottedPath) const { + return std::any_of( + _idExpressions.begin(), _idExpressions.end(), [&dottedPath](const auto& exp) { + if (auto fieldExp = dynamic_cast<ExpressionFieldPath*>(exp.get())) { + if (fieldExp->representsPath(dottedPath)) { + return true; + } + } + return false; + }); +} + +bool DocumentSourceGroup::canRunInParallelBeforeOut( + const std::set<std::string>& nameOfShardKeyFieldsUponEntryToStage) const { + if (_doingMerge) { + return true; // This is fine. + } + + // Certain $group stages are allowed to execute on each exchange consumer. In order to + // guarantee each consumer will only group together data from its own shard, the $group must + // group on a superset of the shard key. + for (auto&& currentPathOfShardKey : nameOfShardKeyFieldsUponEntryToStage) { + if (!pathIncludedInGroupKeys(currentPathOfShardKey)) { + // This requires an exact path match, but as a future optimization certain path + // prefixes should be okay. For example, if the shard key path is "a.b", and we're + // grouping by "a", then each group of "a" is strictly more specific than "a.b", so + // we can deduce that grouping by "a" will not need to group together documents + // across different values of the shard key field "a.b", and thus as long as any + // other shard key fields are similarly preserved will not need to consume a merged + // stream to perform the group. + return false; + } + } + return true; +} } // namespace mongo #include "mongo/db/sorter/sorter.cpp" diff --git a/src/mongo/db/pipeline/document_source_group.h b/src/mongo/db/pipeline/document_source_group.h index 421c244641e..7a79db09a56 100644 --- a/src/mongo/db/pipeline/document_source_group.h +++ b/src/mongo/db/pipeline/document_source_group.h @@ -43,13 +43,13 @@ public: using Accumulators = std::vector<boost::intrusive_ptr<Accumulator>>; using GroupsMap = ValueUnorderedMap<Accumulators>; - // Virtuals from DocumentSource. boost::intrusive_ptr<DocumentSource> optimize() final; DepsTracker::State getDependencies(DepsTracker* deps) const final; Value serialize(boost::optional<ExplainOptions::Verbosity> explain = boost::none) const final; GetNextResult getNext() final; const char* getSourceName() const final; BSONObjSet getOutputSorts() final; + GetModPathsReturn getModifiedPaths() const final; /** * Convenience method for creating a new $group stage. If maxMemoryUsageBytes is boost::none, @@ -88,6 +88,14 @@ public: void setIdExpression(const boost::intrusive_ptr<Expression> idExpression); /** + * Returns true if this $group stage represents a 'global' $group which is merging together + * results from earlier partial groups. + */ + bool doingMerge() const { + return _doingMerge; + } + + /** * Tell this source if it is doing a merge from shards. Defaults to false. */ void setDoingMerge(bool doingMerge) { @@ -98,15 +106,17 @@ public: return _streaming; } - // Virtuals for NeedsMergerDocumentSource. - boost::intrusive_ptr<DocumentSource> getShardSource() final; - MergingLogic mergingLogic() final; - /** * Returns true if this $group stage used disk during execution and false otherwise. 
*/ bool usedDisk() final; + // Virtuals for NeedsMergerDocumentSource. + boost::intrusive_ptr<DocumentSource> getShardSource() final; + MergingLogic mergingLogic() final; + bool canRunInParallelBeforeOut( + const std::set<std::string>& nameOfShardKeyFieldsUponEntryToStage) const final; + protected: void doDispose() final; @@ -161,9 +171,14 @@ private: */ Value expandId(const Value& val); - bool _usedDisk; // Keeps track of whether this $group spilled to disk. + /** + * Returns true if 'dottedPath' is one of the group keys present in '_idExpressions'. + */ + bool pathIncludedInGroupKeys(const std::string& dottedPath) const; + std::vector<AccumulationStatement> _accumulatedFields; + bool _usedDisk; // Keeps track of whether this $group spilled to disk. bool _doingMerge; size_t _memoryUsageBytes = 0; size_t _maxMemoryUsageBytes; diff --git a/src/mongo/db/pipeline/document_source_group_test.cpp b/src/mongo/db/pipeline/document_source_group_test.cpp index 3a8cecedf54..b612b9c7512 100644 --- a/src/mongo/db/pipeline/document_source_group_test.cpp +++ b/src/mongo/db/pipeline/document_source_group_test.cpp @@ -189,6 +189,44 @@ TEST_F(DocumentSourceGroupTest, ShouldCorrectlyTrackMemoryUsageBetweenPauses) { ASSERT_THROWS_CODE(group->getNext(), AssertionException, 16945); } +TEST_F(DocumentSourceGroupTest, ShouldReportSingleFieldGroupKeyAsARename) { + auto expCtx = getExpCtx(); + VariablesParseState vps = expCtx->variablesParseState; + auto groupByExpression = ExpressionFieldPath::parse(expCtx, "$x", vps); + auto group = DocumentSourceGroup::create(expCtx, groupByExpression, {}); + auto modifiedPathsRet = group->getModifiedPaths(); + ASSERT(modifiedPathsRet.type == DocumentSource::GetModPathsReturn::Type::kAllExcept); + ASSERT_EQ(modifiedPathsRet.paths.size(), 0UL); + ASSERT_EQ(modifiedPathsRet.renames.size(), 1UL); + ASSERT_EQ(modifiedPathsRet.renames["_id"], "x"); +} + +TEST_F(DocumentSourceGroupTest, ShouldReportMultipleFieldGroupKeysAsARename) { + auto expCtx = getExpCtx(); + VariablesParseState vps = expCtx->variablesParseState; + auto x = ExpressionFieldPath::parse(expCtx, "$x", vps); + auto y = ExpressionFieldPath::parse(expCtx, "$y", vps); + auto groupByExpression = ExpressionObject::create(expCtx, {{"x", x}, {"y", y}}); + auto group = DocumentSourceGroup::create(expCtx, groupByExpression, {}); + auto modifiedPathsRet = group->getModifiedPaths(); + ASSERT(modifiedPathsRet.type == DocumentSource::GetModPathsReturn::Type::kAllExcept); + ASSERT_EQ(modifiedPathsRet.paths.size(), 0UL); + ASSERT_EQ(modifiedPathsRet.renames.size(), 2UL); + ASSERT_EQ(modifiedPathsRet.renames["_id.x"], "x"); + ASSERT_EQ(modifiedPathsRet.renames["_id.y"], "y"); +} + +TEST_F(DocumentSourceGroupTest, ShouldNotReportDottedGroupKeyAsARename) { + auto expCtx = getExpCtx(); + VariablesParseState vps = expCtx->variablesParseState; + auto xDotY = ExpressionFieldPath::parse(expCtx, "$x.y", vps); + auto group = DocumentSourceGroup::create(expCtx, xDotY, {}); + auto modifiedPathsRet = group->getModifiedPaths(); + ASSERT(modifiedPathsRet.type == DocumentSource::GetModPathsReturn::Type::kAllExcept); + ASSERT_EQ(modifiedPathsRet.paths.size(), 0UL); + ASSERT_EQ(modifiedPathsRet.renames.size(), 0UL); +} + BSONObj toBson(const intrusive_ptr<DocumentSource>& source) { vector<Value> arr; source->serializeToArray(arr); diff --git a/src/mongo/db/pipeline/document_source_mock.h b/src/mongo/db/pipeline/document_source_mock.h index cc81d533fb2..0a0ad30ca41 100644 --- a/src/mongo/db/pipeline/document_source_mock.h +++ 
b/src/mongo/db/pipeline/document_source_mock.h @@ -89,6 +89,13 @@ public: return this; } + /** + * This stage does not modify anything. + */ + GetModPathsReturn getModifiedPaths() const override { + return {GetModPathsReturn::Type::kFiniteSet, std::set<std::string>{}, {}}; + } + // Return documents from front of queue. std::deque<GetNextResult> queue; diff --git a/src/mongo/db/pipeline/document_source_out.cpp b/src/mongo/db/pipeline/document_source_out.cpp index e5ccdc038bc..9f59cc099b0 100644 --- a/src/mongo/db/pipeline/document_source_out.cpp +++ b/src/mongo/db/pipeline/document_source_out.cpp @@ -165,18 +165,11 @@ DocumentSource::GetNextResult DocumentSourceOut::getNext() { MONGO_UNREACHABLE; } -DocumentSourceOut::DocumentSourceOut(const NamespaceString& outputNs, - const boost::intrusive_ptr<ExpressionContext>& expCtx, - WriteModeEnum mode, - std::set<FieldPath> uniqueKey) - : DocumentSource(expCtx), - _done(false), - _outputNs(outputNs), - _mode(mode), - _uniqueKeyFields(std::move(uniqueKey)) {} - -intrusive_ptr<DocumentSource> DocumentSourceOut::createFromBson( - BSONElement elem, const intrusive_ptr<ExpressionContext>& expCtx) { +intrusive_ptr<DocumentSourceOut> DocumentSourceOut::create( + NamespaceString outputNs, + const intrusive_ptr<ExpressionContext>& expCtx, + WriteModeEnum mode, + std::set<FieldPath> uniqueKey) { uassert(ErrorCodes::OperationNotSupportedInTransaction, "$out cannot be used in a transaction", @@ -187,6 +180,45 @@ intrusive_ptr<DocumentSource> DocumentSourceOut::createFromBson( "$out cannot be used with a 'majority' read concern level", readConcernLevel != repl::ReadConcernLevel::kMajorityReadConcern); + // Although we perform a check for "replaceCollection" mode with a sharded output collection + // during lite parsing, we need to do it here as well in case mongos is stale or the command is + // sent directly to the shard. 
+ uassert(17017, + str::stream() << "$out with mode " << WriteMode_serializer(mode) + << " is not supported to an existing *sharded* output collection.", + !(mode == WriteModeEnum::kModeReplaceCollection && + expCtx->mongoProcessInterface->isSharded(expCtx->opCtx, outputNs))); + + uassert(17385, "Can't $out to special collection: " + outputNs.coll(), !outputNs.isSpecial()); + + switch (mode) { + case WriteModeEnum::kModeReplaceCollection: + return new DocumentSourceOutReplaceColl( + std::move(outputNs), expCtx, mode, std::move(uniqueKey)); + case WriteModeEnum::kModeInsertDocuments: + return new DocumentSourceOutInPlace( + std::move(outputNs), expCtx, mode, std::move(uniqueKey)); + case WriteModeEnum::kModeReplaceDocuments: + return new DocumentSourceOutInPlaceReplace( + std::move(outputNs), expCtx, mode, std::move(uniqueKey)); + default: + MONGO_UNREACHABLE; + } +} + +DocumentSourceOut::DocumentSourceOut(NamespaceString outputNs, + const intrusive_ptr<ExpressionContext>& expCtx, + WriteModeEnum mode, + std::set<FieldPath> uniqueKey) + : DocumentSource(expCtx), + _done(false), + _outputNs(std::move(outputNs)), + _mode(mode), + _uniqueKeyFields(std::move(uniqueKey)) {} + +intrusive_ptr<DocumentSource> DocumentSourceOut::createFromBson( + BSONElement elem, const intrusive_ptr<ExpressionContext>& expCtx) { + auto mode = WriteModeEnum::kModeReplaceCollection; std::set<FieldPath> uniqueKey; NamespaceString outputNs; @@ -221,27 +253,7 @@ intrusive_ptr<DocumentSource> DocumentSourceOut::createFromBson( << typeName(elem.type())); } - // Although we perform a check for "replaceCollection" mode with a sharded output collection - // during lite parsing, we need to do it here as well in case mongos is stale or the command is - // sent directly to the shard. - uassert(17017, - str::stream() << "$out with mode " << WriteMode_serializer(mode) - << " is not supported to an existing *sharded* output collection.", - !(mode == WriteModeEnum::kModeReplaceCollection && - expCtx->mongoProcessInterface->isSharded(expCtx->opCtx, outputNs))); - - uassert(17385, "Can't $out to special collection: " + outputNs.coll(), !outputNs.isSpecial()); - - switch (mode) { - case WriteModeEnum::kModeReplaceCollection: - return new DocumentSourceOutReplaceColl(outputNs, expCtx, mode, uniqueKey); - case WriteModeEnum::kModeInsertDocuments: - return new DocumentSourceOutInPlace(outputNs, expCtx, mode, uniqueKey); - case WriteModeEnum::kModeReplaceDocuments: - return new DocumentSourceOutInPlaceReplace(outputNs, expCtx, mode, uniqueKey); - default: - MONGO_UNREACHABLE; - } + return create(std::move(outputNs), expCtx, mode, std::move(uniqueKey)); } Value DocumentSourceOut::serialize(boost::optional<ExplainOptions::Verbosity> explain) const { diff --git a/src/mongo/db/pipeline/document_source_out.h b/src/mongo/db/pipeline/document_source_out.h index 4ae2c9af5e8..45a631cabd4 100644 --- a/src/mongo/db/pipeline/document_source_out.h +++ b/src/mongo/db/pipeline/document_source_out.h @@ -59,7 +59,7 @@ public: bool _allowShardedOutNss; }; - DocumentSourceOut(const NamespaceString& outputNs, + DocumentSourceOut(NamespaceString outputNs, const boost::intrusive_ptr<ExpressionContext>& expCtx, WriteModeEnum mode, std::set<FieldPath> uniqueKey); @@ -70,28 +70,46 @@ public: const char* getSourceName() const final; Value serialize(boost::optional<ExplainOptions::Verbosity> explain = boost::none) const final; DepsTracker::State getDependencies(DepsTracker* deps) const final; + /** + * For purposes of tracking which fields come from where, this 
stage does not modify any fields. + */ + GetModPathsReturn getModifiedPaths() const final { + return {GetModPathsReturn::Type::kFiniteSet, std::set<std::string>{}, {}}; + } StageConstraints constraints(Pipeline::SplitState pipeState) const final { return {StreamType::kStreaming, PositionRequirement::kLast, + // A $out to an unsharded collection should merge on the primary shard to perform + // local writes. A $out to a sharded collection has no requirement, since each shard + // can perform its own portion of the write. HostTypeRequirement::kPrimaryShard, DiskUseRequirement::kWritesPersistentData, FacetRequirement::kNotAllowed, TransactionRequirement::kNotAllowed}; } - // Virtuals for NeedsMergerDocumentSource + const NamespaceString& getOutputNs() const { + return _outputNs; + } + + WriteModeEnum getMode() const { + return _mode; + } + boost::intrusive_ptr<DocumentSource> getShardSource() final { - return NULL; + return nullptr; } MergingLogic mergingLogic() final { return {this}; } - - const NamespaceString& getOutputNs() const { - return _outputNs; + virtual bool canRunInParallelBeforeOut( + const std::set<std::string>& nameOfShardKeyFieldsUponEntryToStage) const final { + // If someone is asking the question, this must be the $out stage in question, so yes! + return true; } + /** * Retrieves the namespace to direct each batch to, which may be a temporary namespace or the * final output namespace. @@ -146,6 +164,18 @@ public: */ virtual void finalize() = 0; + /** + * Creates a new $out stage from the given arguments. + */ + static boost::intrusive_ptr<DocumentSourceOut> create( + NamespaceString outputNs, + const boost::intrusive_ptr<ExpressionContext>& expCtx, + WriteModeEnum, + std::set<FieldPath> uniqueKey = std::set<FieldPath>{"_id"}); + + /** + * Parses a $out stage from the user-supplied BSON. + */ static boost::intrusive_ptr<DocumentSource> createFromBson( BSONElement elem, const boost::intrusive_ptr<ExpressionContext>& pExpCtx); diff --git a/src/mongo/db/pipeline/document_source_sort.cpp b/src/mongo/db/pipeline/document_source_sort.cpp index cb753b400f9..ca092927f56 100644 --- a/src/mongo/db/pipeline/document_source_sort.cpp +++ b/src/mongo/db/pipeline/document_source_sort.cpp @@ -513,6 +513,17 @@ NeedsMergerDocumentSource::MergingLogic DocumentSourceSort::mergingLogic() { return {_limitSrc ? DocumentSourceLimit::create(pExpCtx, _limitSrc->getLimit()) : nullptr, sortKeyPattern(SortKeySerialization::kForSortKeyMerging).toBson()}; } + +bool DocumentSourceSort::canRunInParallelBeforeOut( + const std::set<std::string>& nameOfShardKeyFieldsUponEntryToStage) const { + // This is an interesting special case. If there are no further stages which require merging the + // streams into one, a $sort should not require it. This is only the case because the sort order + // doesn't matter for a pipeline ending with a $out stage. We may encounter it here as an + // intermediate stage before a final $group with a $sort, which would make sense. Should we + // extend our analysis to detect if an exchange is appropriate in a general pipeline, a $sort + // would generally require merging the streams before producing output. 
+ return false; +} } // namespace mongo #include "mongo/db/sorter/sorter.cpp" diff --git a/src/mongo/db/pipeline/document_source_sort.h b/src/mongo/db/pipeline/document_source_sort.h index ac860c5b7a5..a104c3f5713 100644 --- a/src/mongo/db/pipeline/document_source_sort.h +++ b/src/mongo/db/pipeline/document_source_sort.h @@ -83,6 +83,8 @@ public: boost::intrusive_ptr<DocumentSource> getShardSource() final; MergingLogic mergingLogic() final; + bool canRunInParallelBeforeOut( + const std::set<std::string>& nameOfShardKeyFieldsUponEntryToStage) const final; /** * Write out a Document whose contents are the sort key pattern. diff --git a/src/mongo/db/pipeline/document_source_test.cpp b/src/mongo/db/pipeline/document_source_test.cpp index 2979179c255..9372e683071 100644 --- a/src/mongo/db/pipeline/document_source_test.cpp +++ b/src/mongo/db/pipeline/document_source_test.cpp @@ -32,6 +32,7 @@ #include "mongo/bson/bsonobj.h" #include "mongo/bson/bsonobjbuilder.h" #include "mongo/db/pipeline/document_source.h" +#include "mongo/db/pipeline/document_source_test_optimizations.h" #include "mongo/db/service_context_test_fixture.h" #include "mongo/unittest/unittest.h" @@ -78,5 +79,244 @@ TEST_F(DocumentSourceTruncateSort, TruncateSortDedupsSortCorrectly) { ASSERT_EQUALS(truncated.count(BSON("a" << 1)), 1U); } +class RenamesAToB : public DocumentSourceTestOptimizations { +public: + RenamesAToB() : DocumentSourceTestOptimizations() {} + GetModPathsReturn getModifiedPaths() const final { + // Pretend this stage simply renames the "a" field to be "b", leaving the value of "a" the + // same. This would be the equivalent of an {$addFields: {b: "$a"}}. + return {GetModPathsReturn::Type::kFiniteSet, std::set<std::string>{}, {{"b", "a"}}}; + } +}; + +TEST(DocumentSourceRenamedPaths, DoesReturnSimpleRenameFromFiniteSetRename) { + RenamesAToB renamesAToB; + auto renames = renamesAToB.renamedPaths({"b"}); + ASSERT(static_cast<bool>(renames)); + auto map = *renames; + ASSERT_EQ(map.size(), 1UL); + ASSERT_EQ(map["b"], "a"); +} + +TEST(DocumentSourceRenamedPaths, ReturnsSimpleMapForUnaffectedFieldsFromFiniteSetRename) { + RenamesAToB renamesAToB; + { + auto renames = renamesAToB.renamedPaths({"c"}); + ASSERT(static_cast<bool>(renames)); + auto map = *renames; + ASSERT_EQ(map.size(), 1UL); + ASSERT_EQ(map["c"], "c"); + } + + { + auto renames = renamesAToB.renamedPaths({"a"}); + ASSERT(static_cast<bool>(renames)); + auto map = *renames; + ASSERT_EQ(map.size(), 1UL); + ASSERT_EQ(map["a"], "a"); + } + + { + auto renames = renamesAToB.renamedPaths({"e", "f", "g"}); + ASSERT(static_cast<bool>(renames)); + auto map = *renames; + ASSERT_EQ(map.size(), 3UL); + ASSERT_EQ(map["e"], "e"); + ASSERT_EQ(map["f"], "f"); + ASSERT_EQ(map["g"], "g"); + } +} + +class RenameCToDPreserveEFG : public DocumentSourceTestOptimizations { +public: + RenameCToDPreserveEFG() : DocumentSourceTestOptimizations() {} + + GetModPathsReturn getModifiedPaths() const final { + return {GetModPathsReturn::Type::kAllExcept, + std::set<std::string>{"e", "f", "g"}, + {{"d", "c"}}}; + } +}; + +TEST(DocumentSourceRenamedPaths, DoesReturnSimpleRenameFromAllExceptRename) { + RenameCToDPreserveEFG renameCToDPreserveEFG; + auto renames = renameCToDPreserveEFG.renamedPaths({"d"}); + ASSERT(static_cast<bool>(renames)); + auto map = *renames; + ASSERT_EQ(map.size(), 1UL); + ASSERT_EQ(map["d"], "c"); +} + +TEST(DocumentSourceRenamedPaths, ReturnsSimpleMapForUnaffectedFieldsFromAllExceptRename) { + RenameCToDPreserveEFG renameCToDPreserveEFG; + { + auto renames = 
renameCToDPreserveEFG.renamedPaths({"e"}); + ASSERT(static_cast<bool>(renames)); + auto map = *renames; + ASSERT_EQ(map.size(), 1UL); + ASSERT_EQ(map["e"], "e"); + } + + { + auto renames = renameCToDPreserveEFG.renamedPaths({"f", "g"}); + ASSERT(static_cast<bool>(renames)); + auto map = *renames; + ASSERT_EQ(map.size(), 2UL); + ASSERT_EQ(map["f"], "f"); + ASSERT_EQ(map["g"], "g"); + } +} + +class RenameCDotDToEPreserveFDotG : public DocumentSourceTestOptimizations { +public: + RenameCDotDToEPreserveFDotG() : DocumentSourceTestOptimizations() {} + + GetModPathsReturn getModifiedPaths() const final { + return {GetModPathsReturn::Type::kAllExcept, std::set<std::string>{"f.g"}, {{"e", "c.d"}}}; + } +}; + +TEST(DocumentSourceRenamedPaths, DoesReturnRenameToDottedFieldFromAllExceptRename) { + RenameCDotDToEPreserveFDotG renameCDotDToEPreserveFDotG; + { + auto renames = renameCDotDToEPreserveFDotG.renamedPaths({"e"}); + ASSERT(static_cast<bool>(renames)); + auto map = *renames; + ASSERT_EQ(map.size(), 1UL); + ASSERT_EQ(map["e"], "c.d"); + } + { + auto renames = renameCDotDToEPreserveFDotG.renamedPaths({"e.x", "e.y"}); + ASSERT(static_cast<bool>(renames)); + auto map = *renames; + ASSERT_EQ(map.size(), 2UL); + ASSERT_EQ(map["e.x"], "c.d.x"); + ASSERT_EQ(map["e.y"], "c.d.y"); + } +} + +TEST(DocumentSourceRenamedPaths, DoesNotTreatPrefixAsUnmodifiedWhenSuffixIsModifiedFromAllExcept) { + RenameCDotDToEPreserveFDotG renameCDotDToEPreserveFDotG; + { + auto renames = renameCDotDToEPreserveFDotG.renamedPaths({"f"}); + ASSERT_FALSE(static_cast<bool>(renames)); + } + { + // This is the exception, the only path that is not modified. + auto renames = renameCDotDToEPreserveFDotG.renamedPaths({"f.g"}); + ASSERT(static_cast<bool>(renames)); + auto map = *renames; + ASSERT_EQ(map.size(), 1UL); + ASSERT_EQ(map["f.g"], "f.g"); + } + { + // We know "f.g" is preserved, so it follows that a subpath of that path is also preserved. + auto renames = renameCDotDToEPreserveFDotG.renamedPaths({"f.g.x", "f.g.xyz.foobarbaz"}); + ASSERT(static_cast<bool>(renames)); + auto map = *renames; + ASSERT_EQ(map.size(), 2UL); + ASSERT_EQ(map["f.g.x"], "f.g.x"); + ASSERT_EQ(map["f.g.xyz.foobarbaz"], "f.g.xyz.foobarbaz"); + } + + { + // This shares a prefix with the unmodified path, but should not be reported as unmodified. 
+ auto renames = renameCDotDToEPreserveFDotG.renamedPaths({"f.x"}); + ASSERT_FALSE(static_cast<bool>(renames)); + } +} + +class RenameAToXDotYModifyCDotD : public DocumentSourceTestOptimizations { +public: + RenameAToXDotYModifyCDotD() : DocumentSourceTestOptimizations() {} + + GetModPathsReturn getModifiedPaths() const final { + return {GetModPathsReturn::Type::kFiniteSet, std::set<std::string>{"c.d"}, {{"x.y", "a"}}}; + } +}; + +TEST(DocumentSourceRenamedPaths, DoesReturnRenameToDottedFieldFromFiniteSetRename) { + RenameAToXDotYModifyCDotD renameAToXDotYModifyCDotD; + { + auto renames = renameAToXDotYModifyCDotD.renamedPaths({"x.y"}); + ASSERT(static_cast<bool>(renames)); + auto map = *renames; + ASSERT_EQ(map.size(), 1UL); + ASSERT_EQ(map["x.y"], "a"); + } + { + auto renames = renameAToXDotYModifyCDotD.renamedPaths({"x.y.z", "x.y.a.b.c"}); + ASSERT(static_cast<bool>(renames)); + auto map = *renames; + ASSERT_EQ(map.size(), 2UL); + ASSERT_EQ(map["x.y.z"], "a.z"); + ASSERT_EQ(map["x.y.a.b.c"], "a.a.b.c"); + } +} + +TEST(DocumentSourceRenamedPaths, DoesNotTreatPrefixAsUnmodifiedWhenSuffixIsPartOfModifiedSet) { + RenameAToXDotYModifyCDotD renameAToXDotYModifyCDotD; + { + auto renames = renameAToXDotYModifyCDotD.renamedPaths({"c"}); + ASSERT_FALSE(static_cast<bool>(renames)); + } + { + auto renames = renameAToXDotYModifyCDotD.renamedPaths({"c.d"}); + ASSERT_FALSE(static_cast<bool>(renames)); + } + { + auto renames = renameAToXDotYModifyCDotD.renamedPaths({"c.d.e"}); + ASSERT_FALSE(static_cast<bool>(renames)); + } + { + auto renames = renameAToXDotYModifyCDotD.renamedPaths({"c.not_d", "c.decoy"}); + ASSERT(static_cast<bool>(renames)); + auto map = *renames; + ASSERT_EQ(map.size(), 2UL); + ASSERT_EQ(map["c.not_d"], "c.not_d"); + ASSERT_EQ(map["c.decoy"], "c.decoy"); + } +} + +class ModifiesAllPaths : public DocumentSourceTestOptimizations { +public: + ModifiesAllPaths() : DocumentSourceTestOptimizations() {} + GetModPathsReturn getModifiedPaths() const final { + return {GetModPathsReturn::Type::kAllPaths, std::set<std::string>{}, {}}; + } +}; + +TEST(DocumentSourceRenamedPaths, ReturnsNoneWhenAllPathsAreModified) { + ModifiesAllPaths modifiesAllPaths; + { + auto renames = modifiesAllPaths.renamedPaths({"a"}); + ASSERT_FALSE(static_cast<bool>(renames)); + } + { + auto renames = modifiesAllPaths.renamedPaths({"a", "b", "c.d"}); + ASSERT_FALSE(static_cast<bool>(renames)); + } +} + +class ModificationsUnknown : public DocumentSourceTestOptimizations { +public: + ModificationsUnknown() : DocumentSourceTestOptimizations() {} + GetModPathsReturn getModifiedPaths() const final { + return {GetModPathsReturn::Type::kNotSupported, std::set<std::string>{}, {}}; + } +}; + +TEST(DocumentSourceRenamedPaths, ReturnsNoneWhenModificationsAreNotKnown) { + ModificationsUnknown modificationsUnknown; + { + auto renames = modificationsUnknown.renamedPaths({"a"}); + ASSERT_FALSE(static_cast<bool>(renames)); + } + { + auto renames = modificationsUnknown.renamedPaths({"a", "b", "c.d"}); + ASSERT_FALSE(static_cast<bool>(renames)); + } +} + } // namespace } // namespace mongo diff --git a/src/mongo/db/pipeline/document_source_test_optimizations.h b/src/mongo/db/pipeline/document_source_test_optimizations.h new file mode 100644 index 00000000000..e7141835457 --- /dev/null +++ b/src/mongo/db/pipeline/document_source_test_optimizations.h @@ -0,0 +1,67 @@ +/** + * Copyright (C) 2018 MongoDB Inc. 
+ * + * This program is free software: you can redistribute it and/or modify + * it under the terms of the GNU Affero General Public License, version 3, + * as published by the Free Software Foundation. + * + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU Affero General Public License for more details. + * + * You should have received a copy of the GNU Affero General Public License + * along with this program. If not, see <http://www.gnu.org/licenses/>. + * + * As a special exception, the copyright holders give permission to link the + * code of portions of this program with the OpenSSL library under certain + * conditions as described in each individual source file and distribute + * linked combinations including the program with the OpenSSL library. You + * must comply with the GNU Affero General Public License in all respects + * for all of the code used other than as permitted herein. If you modify + * file(s) with this exception, you may extend this exception to your + * version of the file(s), but you are not obligated to do so. If you do not + * wish to do so, delete this exception statement from your version. If you + * delete this exception statement from all source files in the program, + * then also delete it in the license file. + */ + +#pragma once + +#include "mongo/db/pipeline/document_source.h" +#include "mongo/db/pipeline/expression_context_for_test.h" + +namespace mongo { +/** + * A dummy class for other tests to inherit from to customize the behavior of any of the virtual + * methods from DocumentSource without having to implement all of them. + */ +class DocumentSourceTestOptimizations : public DocumentSource { +public: + DocumentSourceTestOptimizations() : DocumentSource(new ExpressionContextForTest()) {} + virtual ~DocumentSourceTestOptimizations() = default; + virtual GetNextResult getNext() override { + MONGO_UNREACHABLE; + } + virtual StageConstraints constraints(Pipeline::SplitState) const override { + // Return the default constraints so that this can be used in test pipelines. Constructing a + // pipeline needs to do some validation that depends on this. + return StageConstraints{StreamType::kStreaming, + PositionRequirement::kNone, + HostTypeRequirement::kNone, + DiskUseRequirement::kNoDiskUse, + FacetRequirement::kAllowed, + TransactionRequirement::kNotAllowed}; + } + + virtual GetModPathsReturn getModifiedPaths() const override { + MONGO_UNREACHABLE; + } + +private: + virtual Value serialize(boost::optional<ExplainOptions::Verbosity>) const override { + MONGO_UNREACHABLE; + } +}; + +} // namespace mongo diff --git a/src/mongo/db/pipeline/expression.cpp b/src/mongo/db/pipeline/expression.cpp index 200792ac734..4e8f911087c 100644 --- a/src/mongo/db/pipeline/expression.cpp +++ b/src/mongo/db/pipeline/expression.cpp @@ -1970,6 +1970,16 @@ intrusive_ptr<Expression> ExpressionFieldPath::optimize() { return intrusive_ptr<Expression>(this); } +bool ExpressionFieldPath::representsPath(const std::string& dottedPath) const { + if (_variable != Variables::kRootId || _fieldPath.getPathLength() == 1) { + // This variable refers to the entire document, or refers to a sub-field of something + // besides the root document. Either way we can't prove that it represents the path given by + // 'dottedPath'. 
+ return false; + } + return _fieldPath.tail().fullPath() == dottedPath; +} + void ExpressionFieldPath::_doAddDependencies(DepsTracker* deps) const { if (_variable == Variables::kRootId) { // includes CURRENT when it is equivalent to ROOT. if (_fieldPath.getPathLength() == 1) { diff --git a/src/mongo/db/pipeline/expression.h b/src/mongo/db/pipeline/expression.h index 6cfd4603bac..bc39e271575 100644 --- a/src/mongo/db/pipeline/expression.h +++ b/src/mongo/db/pipeline/expression.h @@ -1108,6 +1108,12 @@ public: const std::string& raw, const VariablesParseState& vps); + /** + * Returns true if this expression logically represents the path 'dottedPath'. For example, if + * 'dottedPath' is 'a.b' and this FieldPath is '$$CURRENT.a.b', returns true. + */ + bool representsPath(const std::string& dottedPath) const; + const FieldPath& getFieldPath() const { return _fieldPath; } diff --git a/src/mongo/db/pipeline/pipeline.cpp b/src/mongo/db/pipeline/pipeline.cpp index 1a82bf1569a..3c84881323f 100644 --- a/src/mongo/db/pipeline/pipeline.cpp +++ b/src/mongo/db/pipeline/pipeline.cpp @@ -478,6 +478,48 @@ void Pipeline::addFinalSource(intrusive_ptr<DocumentSource> source) { _sources.push_back(source); } +boost::optional<StringMap<std::string>> Pipeline::renamedPaths( + SourceContainer::const_reverse_iterator rstart, + SourceContainer::const_reverse_iterator rend, + std::set<std::string> pathsOfInterest) { + // Use a vector to give a path id to each input path. A path's id is its index in the vector. + const std::vector<string> inputPaths(pathsOfInterest.begin(), pathsOfInterest.end()); + std::vector<string> currentPaths(pathsOfInterest.begin(), pathsOfInterest.end()); + + // Loop backwards over the stages. We will re-use 'pathsOfInterest', modifying that set each + // time to be the current set of fields we're interested in. At the same time, we will maintain + // 'currentPaths'. 'pathsOfInterest' is used to compute the renames, while 'currentPaths' is + // used to tie a path back to its id. + // + // Interestingly, 'currentPaths' may contain duplicates. For example, if a stage like + // {$addFields: {b: "$a"}} duplicates the value of "a" and both paths are of interest, then + // 'currentPaths' may begin as ["a", "b"] representing the paths after the $addFields stage, but + // becomes ["a", "a"] via the rename. + for (auto it = rstart; it != rend; ++it) { + boost::optional<StringMap<string>> renamed = (*it)->renamedPaths(pathsOfInterest); + if (!renamed) { + return boost::none; + } + pathsOfInterest.clear(); + for (std::size_t pathId = 0; pathId < inputPaths.size(); ++pathId) { + currentPaths[pathId] = (*renamed)[currentPaths[pathId]]; + pathsOfInterest.insert(currentPaths[pathId]); + } + } + + // We got all the way through the pipeline via renames! Construct the mapping from path at the + // end of the pipeline to path at the beginning.
+ StringMap<string> renameMap; + for (std::size_t pathId = 0; pathId < currentPaths.size(); ++pathId) { + renameMap[inputPaths[pathId]] = currentPaths[pathId]; + } + return renameMap; +} + +boost::optional<StringMap<string>> Pipeline::renamedPaths(std::set<string> pathsOfInterest) const { + return renamedPaths(_sources.rbegin(), _sources.rend(), std::move(pathsOfInterest)); +} + DepsTracker Pipeline::getDependencies(DepsTracker::MetadataAvailable metadataAvailable) const { DepsTracker deps(metadataAvailable); const bool scopeHasVariables = pCtx->variablesParseState.hasDefinedVariables(); diff --git a/src/mongo/db/pipeline/pipeline.h b/src/mongo/db/pipeline/pipeline.h index d3e99daae31..4874126b398 100644 --- a/src/mongo/db/pipeline/pipeline.h +++ b/src/mongo/db/pipeline/pipeline.h @@ -132,6 +132,19 @@ public: */ static bool aggSupportsWriteConcern(const BSONObj& cmd); + /** + * Given 'pathsOfInterest' which describes a set of paths which the caller is interested in, + * returns boost::none if any of those paths are modified by the section of a pipeline + * described by 'rstart' and 'rend', or a mapping from their name at the end of the pipeline to + * their name at the beginning of the pipeline if they are preserved but possibly renamed by + * this pipeline. Note that the analysis proceeds backwards, so the iterators must be reverse + * iterators. + */ + static boost::optional<StringMap<std::string>> renamedPaths( + SourceContainer::const_reverse_iterator rstart, + SourceContainer::const_reverse_iterator rend, + std::set<std::string> pathsOfInterest); + const boost::intrusive_ptr<ExpressionContext>& getContext() const { return pCtx; } @@ -250,6 +263,15 @@ public: */ DepsTracker getDependencies(DepsTracker::MetadataAvailable metadataAvailable) const; + /** + * Given 'pathsOfInterest' which describes a set of paths which the caller is interested in, + * returns boost::none if any of those paths are modified by this pipeline, or a mapping from + * their name at the end of the pipeline to their name at the beginning of the pipeline if they + * are preserved but possibly renamed by this pipeline. + */ + boost::optional<StringMap<std::string>> renamedPaths( + std::set<std::string> pathsOfInterest) const; + const SourceContainer& getSources() const { return _sources; } diff --git a/src/mongo/db/pipeline/pipeline_test.cpp b/src/mongo/db/pipeline/pipeline_test.cpp index 65d3c4fecc0..280473848cc 100644 --- a/src/mongo/db/pipeline/pipeline_test.cpp +++ b/src/mongo/db/pipeline/pipeline_test.cpp @@ -45,10 +45,12 @@ #include "mongo/db/pipeline/document_source_out.h" #include "mongo/db/pipeline/document_source_project.h" #include "mongo/db/pipeline/document_source_sort.h" +#include "mongo/db/pipeline/document_source_test_optimizations.h" #include "mongo/db/pipeline/document_value_test_util.h" #include "mongo/db/pipeline/expression_context_for_test.h" #include "mongo/db/pipeline/field_path.h" #include "mongo/db/pipeline/pipeline.h" +#include "mongo/db/pipeline/stub_mongo_process_interface.h" #include "mongo/db/query/collation/collator_interface_mock.h" #include "mongo/db/query/query_test_service_context.h" #include "mongo/db/repl/replication_coordinator_mock.h" @@ -2246,11 +2248,24 @@ DEATH_TEST_F(PipelineMustRunOnMongoSTest, splitPipeline.shardsPipeline->requiredToRunOnMongos(); } +/** + * For the purposes of this test, assume every collection is unsharded. Stages may ask this during + * setup. For example, to compute its constraints, the $out stage needs to know if the output + * collection is sharded.
+ */ +class FakeMongoProcessInterface : public StubMongoProcessInterface { +public: + bool isSharded(OperationContext* opCtx, const NamespaceString& ns) override { + return false; + } +}; + TEST_F(PipelineMustRunOnMongoSTest, SplitMongoSMergePipelineAssertsIfShardStagePresent) { auto expCtx = getExpCtx(); expCtx->allowDiskUse = true; expCtx->inMongos = true; + expCtx->mongoProcessInterface = std::make_shared<FakeMongoProcessInterface>(); auto match = DocumentSourceMatch::create(fromjson("{x: 5}"), expCtx); auto split = DocumentSourceInternalSplitPipeline::create(expCtx, HostTypeRequirement::kNone); @@ -2678,6 +2693,201 @@ TEST_F(PipelineDependenciesTest, ShouldNotRequireTextScoreIfAvailableButDefinite } // namespace Dependencies +namespace { +TEST(PipelineRenameTracking, ReportsIdentityMapWhenEmpty) { + boost::intrusive_ptr<ExpressionContext> expCtx(new ExpressionContextForTest()); + auto pipeline = unittest::assertGet(Pipeline::create({DocumentSourceMock::create()}, expCtx)); + auto renames = pipeline->renamedPaths({"a", "b", "c.d"}); + ASSERT(static_cast<bool>(renames)); + auto nameMap = *renames; + ASSERT_EQ(nameMap.size(), 3UL); + ASSERT_EQ(nameMap["a"], "a"); + ASSERT_EQ(nameMap["b"], "b"); + ASSERT_EQ(nameMap["c.d"], "c.d"); +} + +class NoModifications : public DocumentSourceTestOptimizations { +public: + NoModifications() : DocumentSourceTestOptimizations() {} + static boost::intrusive_ptr<NoModifications> create() { + return new NoModifications(); + } + + /** + * Returns a description which communicates that this stage modifies nothing. + */ + GetModPathsReturn getModifiedPaths() const final { + return {GetModPathsReturn::Type::kFiniteSet, std::set<std::string>(), {}}; + } +}; + +TEST(PipelineRenameTracking, ReportsIdentityWhenNoStageModifiesAnything) { + boost::intrusive_ptr<ExpressionContext> expCtx(new ExpressionContextForTest()); + { + auto pipeline = unittest::assertGet( + Pipeline::create({DocumentSourceMock::create(), NoModifications::create()}, expCtx)); + auto renames = pipeline->renamedPaths({"a", "b", "c.d"}); + ASSERT(static_cast<bool>(renames)); + auto nameMap = *renames; + ASSERT_EQ(nameMap.size(), 3UL); + ASSERT_EQ(nameMap["a"], "a"); + ASSERT_EQ(nameMap["b"], "b"); + ASSERT_EQ(nameMap["c.d"], "c.d"); + } + { + auto pipeline = unittest::assertGet(Pipeline::create({DocumentSourceMock::create(), + NoModifications::create(), + NoModifications::create(), + NoModifications::create()}, + expCtx)); + auto renames = pipeline->renamedPaths({"a", "b", "c.d"}); + ASSERT(static_cast<bool>(renames)); + auto nameMap = *renames; + ASSERT_EQ(nameMap.size(), 3UL); + ASSERT_EQ(nameMap["a"], "a"); + ASSERT_EQ(nameMap["b"], "b"); + ASSERT_EQ(nameMap["c.d"], "c.d"); + } +} + +class NotSupported : public DocumentSourceTestOptimizations { +public: + NotSupported() : DocumentSourceTestOptimizations() {} + static boost::intrusive_ptr<NotSupported> create() { + return new NotSupported(); + } + + /** + * Returns a description which communicates that this stage does not support reporting its modified paths.
+ */ + GetModPathsReturn getModifiedPaths() const final { + return {GetModPathsReturn::Type::kNotSupported, std::set<std::string>(), {}}; + } +}; + +TEST(PipelineRenameTracking, DoesNotReportRenamesIfAStageDoesNotSupportTrackingThem) { + boost::intrusive_ptr<ExpressionContext> expCtx(new ExpressionContextForTest()); + auto pipeline = unittest::assertGet(Pipeline::create({DocumentSourceMock::create(), + NoModifications::create(), + NotSupported::create(), + NoModifications::create()}, + expCtx)); + ASSERT_FALSE(static_cast<bool>(pipeline->renamedPaths({"a"}))); + ASSERT_FALSE(static_cast<bool>(pipeline->renamedPaths({"a", "b"}))); + ASSERT_FALSE(static_cast<bool>(pipeline->renamedPaths({"x", "yahoo", "c.d"}))); +} + +class RenamesAToB : public DocumentSourceTestOptimizations { +public: + RenamesAToB() : DocumentSourceTestOptimizations() {} + static boost::intrusive_ptr<RenamesAToB> create() { + return new RenamesAToB(); + } + GetModPathsReturn getModifiedPaths() const final { + return {GetModPathsReturn::Type::kFiniteSet, std::set<std::string>{}, {{"b", "a"}}}; + } +}; + +TEST(PipelineRenameTracking, ReportsNewNamesWhenSingleStageRenames) { + boost::intrusive_ptr<ExpressionContext> expCtx(new ExpressionContextForTest()); + auto pipeline = unittest::assertGet( + Pipeline::create({DocumentSourceMock::create(), RenamesAToB::create()}, expCtx)); + { + auto renames = pipeline->renamedPaths({"b"}); + ASSERT(static_cast<bool>(renames)); + auto nameMap = *renames; + ASSERT_EQ(nameMap.size(), 1UL); + ASSERT_EQ(nameMap["b"], "a"); + } + { + auto renames = pipeline->renamedPaths({"b", "c.d"}); + ASSERT(static_cast<bool>(renames)); + auto nameMap = *renames; + ASSERT_EQ(nameMap.size(), 2UL); + ASSERT_EQ(nameMap["b"], "a"); + ASSERT_EQ(nameMap["c.d"], "c.d"); + } + { + // This is strange; the mock stage reports that it essentially duplicates the "a" field + // into "b". Because of this, both "b" and "a" should map to "a".
+ auto renames = pipeline->renamedPaths({"b", "a"}); + ASSERT(static_cast<bool>(renames)); + auto nameMap = *renames; + ASSERT_EQ(nameMap.size(), 2UL); + ASSERT_EQ(nameMap["b"], "a"); + ASSERT_EQ(nameMap["a"], "a"); + } +} + +TEST(PipelineRenameTracking, ReportsIdentityMapWhenGivenEmptyIteratorRange) { + boost::intrusive_ptr<ExpressionContext> expCtx(new ExpressionContextForTest()); + auto pipeline = unittest::assertGet( + Pipeline::create({DocumentSourceMock::create(), RenamesAToB::create()}, expCtx)); + { + auto renames = Pipeline::renamedPaths( + pipeline->getSources().rbegin(), pipeline->getSources().rbegin(), {"b"}); + ASSERT(static_cast<bool>(renames)); + auto nameMap = *renames; + ASSERT_EQ(nameMap.size(), 1UL); + ASSERT_EQ(nameMap["b"], "b"); + } + { + auto renames = Pipeline::renamedPaths( + pipeline->getSources().rbegin(), pipeline->getSources().rbegin(), {"b", "c.d"}); + ASSERT(static_cast<bool>(renames)); + auto nameMap = *renames; + ASSERT_EQ(nameMap.size(), 2UL); + ASSERT_EQ(nameMap["b"], "b"); + ASSERT_EQ(nameMap["c.d"], "c.d"); + } +} + +class RenamesBToC : public DocumentSourceTestOptimizations { +public: + RenamesBToC() : DocumentSourceTestOptimizations() {} + static boost::intrusive_ptr<RenamesBToC> create() { + return new RenamesBToC(); + } + GetModPathsReturn getModifiedPaths() const final { + return {GetModPathsReturn::Type::kFiniteSet, std::set<std::string>{}, {{"c", "b"}}}; + } +}; + +TEST(PipelineRenameTracking, ReportsNewNameAcrossMultipleRenames) { + boost::intrusive_ptr<ExpressionContext> expCtx(new ExpressionContextForTest()); + auto pipeline = unittest::assertGet(Pipeline::create( + {DocumentSourceMock::create(), RenamesAToB::create(), RenamesBToC::create()}, expCtx)); + auto renames = pipeline->renamedPaths({"c"}); + ASSERT(static_cast<bool>(renames)); + auto nameMap = *renames; + ASSERT_EQ(nameMap.size(), 1UL); + ASSERT_EQ(nameMap["c"], "a"); +} + +class RenamesBToA : public DocumentSourceTestOptimizations { +public: + RenamesBToA() : DocumentSourceTestOptimizations() {} + static boost::intrusive_ptr<RenamesBToA> create() { + return new RenamesBToA(); + } + GetModPathsReturn getModifiedPaths() const final { + return {GetModPathsReturn::Type::kFiniteSet, std::set<std::string>{}, {{"b", "a"}}}; + } +}; + +TEST(PipelineRenameTracking, CanHandleBackAndForthRename) { + boost::intrusive_ptr<ExpressionContext> expCtx(new ExpressionContextForTest()); + auto pipeline = unittest::assertGet(Pipeline::create( + {DocumentSourceMock::create(), RenamesAToB::create(), RenamesBToA::create()}, expCtx)); + auto renames = pipeline->renamedPaths({"a"}); + ASSERT(static_cast<bool>(renames)); + auto nameMap = *renames; + ASSERT_EQ(nameMap.size(), 1UL); + ASSERT_EQ(nameMap["a"], "a"); +} + +} // namespace + class All : public Suite { public: All() : Suite("PipelineOptimizations") {} diff --git a/src/mongo/s/SConscript b/src/mongo/s/SConscript index 2796119cc9e..522419420c8 100644 --- a/src/mongo/s/SConscript +++ b/src/mongo/s/SConscript @@ -360,7 +360,6 @@ env.CppUnitTest( 'shard_key_pattern_test.cpp', ], LIBDEPS=[ - "$BUILD_DIR/mongo/db/auth/authmocks", '$BUILD_DIR/mongo/db/serveronly', 'catalog_cache_test_fixture', ] @@ -392,6 +391,7 @@ env.Library( 'catalog_cache_test_fixture.cpp', ], LIBDEPS=[ + "$BUILD_DIR/mongo/db/auth/authmocks", '$BUILD_DIR/mongo/db/query/query_test_service_context', 'coreshard', 'sharding_router_test_fixture', diff --git a/src/mongo/s/catalog_cache_test_fixture.cpp b/src/mongo/s/catalog_cache_test_fixture.cpp index 835aedebf2f..c7df14e96b1 100644 --- 
--- a/src/mongo/s/catalog_cache_test_fixture.cpp
+++ b/src/mongo/s/catalog_cache_test_fixture.cpp
@@ -160,9 +160,9 @@ std::shared_ptr<ChunkManager> CatalogCacheTestFixture::makeChunkManager(
     return routingInfo->cm();
 }
 
-void CatalogCacheTestFixture::expectGetDatabase(NamespaceString nss) {
+void CatalogCacheTestFixture::expectGetDatabase(NamespaceString nss, std::string shardId) {
     expectFindSendBSONObjVector(kConfigHostAndPort, [&]() {
-        DatabaseType db(nss.db().toString(), {"0"}, true, databaseVersion::makeNew());
+        DatabaseType db(nss.db().toString(), {shardId}, true, databaseVersion::makeNew());
         return std::vector<BSONObj>{db.toBSON()};
     }());
 }
diff --git a/src/mongo/s/catalog_cache_test_fixture.h b/src/mongo/s/catalog_cache_test_fixture.h
index ef155fa1c8a..c7cacad7eec 100644
--- a/src/mongo/s/catalog_cache_test_fixture.h
+++ b/src/mongo/s/catalog_cache_test_fixture.h
@@ -84,7 +84,7 @@ protected:
     /**
     * Mocks network responses for loading a sharded database and collection from the config server.
     */
-    void expectGetDatabase(NamespaceString nss);
+    void expectGetDatabase(NamespaceString nss, std::string primaryShard = "0");
     void expectGetCollection(NamespaceString nss, OID epoch, const ShardKeyPattern& shardKeyPattern);
diff --git a/src/mongo/s/commands/SConscript b/src/mongo/s/commands/SConscript
index 10d8ad623fb..3c6fe218bfd 100644
--- a/src/mongo/s/commands/SConscript
+++ b/src/mongo/s/commands/SConscript
@@ -153,7 +153,6 @@ env.CppUnitTest(
     LIBDEPS=[
         'cluster_commands',
         'cluster_command_test_fixture',
-        '$BUILD_DIR/mongo/db/auth/authmocks',
         '$BUILD_DIR/mongo/db/auth/saslauth',
     ],
 )
diff --git a/src/mongo/s/grid.h b/src/mongo/s/grid.h
index 02da388532b..ab61f840282 100644
--- a/src/mongo/s/grid.h
+++ b/src/mongo/s/grid.h
@@ -119,6 +119,10 @@ public:
         return _catalogClient.get();
     }
 
+    /**
+     * Can return nullptr; for example, on a mongod that is not acting as a shard server. This is
+     * always present on a mongos after startup.
+     */
     CatalogCache* catalogCache() const {
         return _catalogCache.get();
     }
diff --git a/src/mongo/s/query/SConscript b/src/mongo/s/query/SConscript
index 9882356dd90..6dd7d6605c6 100644
--- a/src/mongo/s/query/SConscript
+++ b/src/mongo/s/query/SConscript
@@ -41,6 +41,7 @@ env.CppUnitTest(
     target="cluster_aggregate_test",
     source=[
         "cluster_aggregate_test.cpp",
+        "cluster_aggregation_planner_test.cpp",
     ],
     LIBDEPS=[
         '$BUILD_DIR/mongo/db/auth/authmocks',
@@ -57,10 +58,9 @@ env.CppUnitTest(
     ],
     LIBDEPS=[
         'cluster_query',
-        '$BUILD_DIR/mongo/db/auth/authmocks',
         '$BUILD_DIR/mongo/db/keys_collection_client_sharded',
-        '$BUILD_DIR/mongo/s/commands/cluster_commands',
         '$BUILD_DIR/mongo/s/catalog_cache_test_fixture',
+        '$BUILD_DIR/mongo/s/commands/cluster_commands',
     ],
 )
diff --git a/src/mongo/s/query/cluster_aggregation_planner.cpp b/src/mongo/s/query/cluster_aggregation_planner.cpp
index cd110ca31ff..288dcd48448 100644
--- a/src/mongo/s/query/cluster_aggregation_planner.cpp
+++ b/src/mongo/s/query/cluster_aggregation_planner.cpp
@@ -30,21 +30,25 @@
 
 #include "mongo/s/query/cluster_aggregation_planner.h"
 
+#include "mongo/db/pipeline/document_source_group.h"
 #include "mongo/db/pipeline/document_source_limit.h"
 #include "mongo/db/pipeline/document_source_match.h"
 #include "mongo/db/pipeline/document_source_merge_cursors.h"
+#include "mongo/db/pipeline/document_source_out.h"
 #include "mongo/db/pipeline/document_source_project.h"
 #include "mongo/db/pipeline/document_source_skip.h"
 #include "mongo/db/pipeline/document_source_sort.h"
 #include "mongo/db/pipeline/document_source_unwind.h"
 #include "mongo/db/pipeline/document_source_update_on_add_shard.h"
 #include "mongo/executor/task_executor_pool.h"
+#include "mongo/s/catalog_cache.h"
 #include "mongo/s/grid.h"
 #include "mongo/s/query/router_stage_limit.h"
 #include "mongo/s/query/router_stage_pipeline.h"
 #include "mongo/s/query/router_stage_remove_metadata_fields.h"
 #include "mongo/s/query/router_stage_skip.h"
 #include "mongo/s/shard_id.h"
+#include "mongo/s/shard_key_pattern.h"
 
 namespace mongo {
 namespace cluster_aggregation_planner {
@@ -186,6 +190,136 @@ ClusterClientCursorGuard convertPipelineToRouterStages(
         opCtx, std::move(root), Document::allMetadataFieldNames), std::move(cursorParams));
 }
 
+bool stageCanRunInParallel(const boost::intrusive_ptr<DocumentSource>& stage,
+                           const std::set<std::string>& nameOfShardKeyFieldsUponEntryToStage) {
+    if (auto needsMerger = dynamic_cast<NeedsMergerDocumentSource*>(stage.get())) {
+        return needsMerger->canRunInParallelBeforeOut(nameOfShardKeyFieldsUponEntryToStage);
+    } else {
+        // This stage is fine to execute in parallel on each stream. For example, a $match can be
+        // applied to each stream in parallel.
+        return true;
+    }
+}
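The dynamic_cast dispatch above decides, per stage, whether parallel output streams are acceptable: a stage that needs a merger gets a veto, and everything else is assumed to be stream-parallel. A rough self-contained sketch of the same shape, with hypothetical class names rather than the server's actual hierarchy:

// Sketch only: the "needs-merger stages get a veto" dispatch, standalone.
// Hypothetical names; not MongoDB internals.
#include <iostream>
#include <set>
#include <string>

struct Stage {
    virtual ~Stage() = default;
};

struct NeedsMergerStage : Stage {
    // For example, a merging $group could plausibly return true when the fields
    // of its group key cover the shard key fields it is handed here.
    virtual bool canRunInParallelBeforeOut(const std::set<std::string>& shardKeyFields) const = 0;
};

struct LimitLikeStage : NeedsMergerStage {
    bool canRunInParallelBeforeOut(const std::set<std::string>&) const override {
        return false;  // a $limit must see one unified stream
    }
};

bool stageCanRunInParallel(const Stage& stage, const std::set<std::string>& shardKeyFields) {
    if (auto needsMerger = dynamic_cast<const NeedsMergerStage*>(&stage)) {
        return needsMerger->canRunInParallelBeforeOut(shardKeyFields);
    }
    return true;  // e.g. a $match applies independently to each stream
}

int main() {
    LimitLikeStage limit;
    std::cout << std::boolalpha << stageCanRunInParallel(limit, {"_id"}) << "\n";  // false
}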
+
+std::string mapToString(const StringMap<std::string>& map) {
+    StringBuilder sb;
+    sb << "{";
+    for (auto&& entry : map) {
+        if (sb.len() != 1) {
+            sb << ", ";
+        }
+        sb << entry.first << ": " << entry.second;
+    }
+    sb << "}";
+    return sb.str();
+}
+
+BSONObj buildNewKeyPattern(const ShardKeyPattern& shardKey, StringMap<std::string> renames) {
+    BSONObjBuilder newPattern;
+    for (auto&& elem : shardKey.getKeyPattern().toBSON()) {
+        auto it = renames.find(elem.fieldNameStringData());
+        invariant(it != renames.end(),
+                  str::stream() << "Could not find new name of shard key field \""
+                                << elem.fieldName()
+                                << "\": rename map was "
+                                << mapToString(renames));
+        newPattern.appendAs(elem, it->second);
+    }
+    return newPattern.obj();
+}
+
+StringMap<std::string> computeShardKeyRenameMap(const Pipeline* mergePipeline,
+                                                std::set<std::string>&& pathsOfShardKey) {
+    auto traversalStart = mergePipeline->getSources().crbegin();
+    auto traversalEnd = mergePipeline->getSources().crend();
+    const auto leadingGroup =
+        dynamic_cast<DocumentSourceGroup*>(mergePipeline->getSources().front().get());
+    if (leadingGroup && leadingGroup->doingMerge()) {
+        // A leading $group stage will not report that it preserves any fields, since it blows
+        // away the _id and replaces it with something new. It possibly renames some fields, but
+        // when computing the new shard key we are interested in the name of the shard key *in the
+        // middle of the $group*. The $exchange will be inserted between the shard-local groups
+        // and the global groups. Thus we want to exclude this stage from our rename tracking.
+        traversalEnd = std::prev(traversalEnd);
+    }
+    auto renameMap = Pipeline::renamedPaths(traversalStart, traversalEnd, pathsOfShardKey);
+    invariant(renameMap,
+              str::stream()
+                  << "Analyzed pipeline was thought to preserve the shard key fields, but did not: "
+                  << Value(mergePipeline->serialize()).toString());
+    return *renameMap;
+}
+
+/**
+ * Returns true if any stage in the pipeline would modify any of the fields in 'shardKeyPaths', or
+ * if any stage in the pipeline requires a unified stream to do its computation, as a $limit
+ * would.
+ *
+ * Purposefully takes 'shardKeyPaths' by value so that it can be modified throughout.
+ */
+bool anyStageModifiesShardKeyOrNeedsMerge(std::set<std::string> shardKeyPaths,
+                                          const Pipeline* mergePipeline) {
+    const auto& stages = mergePipeline->getSources();
+    for (auto it = stages.crbegin(); it != stages.crend(); ++it) {
+        const auto& stage = *it;
+        auto renames = stage->renamedPaths(std::move(shardKeyPaths));
+        if (!renames) {
+            return true;
+        }
+        shardKeyPaths.clear();
+        for (auto&& rename : *renames) {
+            shardKeyPaths.insert(rename.second);
+        }
+        if (!stageCanRunInParallel(stage, shardKeyPaths)) {
+            // In order for this stage to work, it needs a single input stream, which it wouldn't
+            // get if we inserted an exchange before it.
+            return true;
+        }
+    }
+    return false;
+}
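To make the mechanics of buildNewKeyPattern() concrete: the rename map it consumes is keyed by a shard key field's name in the output collection and valued by its name at the split point, and the key pattern is rebuilt field by field under those split-point names. A rough standalone sketch with std::map standing in for BSON (hypothetical names, not the server's types):

// Sketch only: rebuilding a key pattern under split-point field names.
// Self-contained, hypothetical code; not MongoDB internals.
#include <iostream>
#include <map>
#include <string>
#include <utility>
#include <vector>

using KeyPattern = std::vector<std::pair<std::string, int>>;  // ordered field -> direction

KeyPattern buildNewKeyPattern(const KeyPattern& shardKey,
                              const std::map<std::string, std::string>& renames) {
    KeyPattern newPattern;
    for (const auto& field : shardKey) {
        // Every shard key field must have a (possibly identity) entry in the
        // rename map; at() throws if the analysis failed to produce one.
        newPattern.emplace_back(renames.at(field.first), field.second);
    }
    return newPattern;
}

int main() {
    // The output collection is sharded by {out_shard_key: 1}, but at the split
    // point that field is still called "x", so the exchange partitions on {x: 1}.
    KeyPattern shardKey = {{"out_shard_key", 1}};
    std::map<std::string, std::string> renames = {{"out_shard_key", "x"}};
    std::cout << buildNewKeyPattern(shardKey, renames).front().first << "\n";  // prints "x"
}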
+
+boost::optional<ShardedExchangePolicy> walkPipelineBackwardsTrackingShardKey(
+    OperationContext* opCtx,
+    const boost::intrusive_ptr<const DocumentSourceOut>& outStage,
+    const Pipeline* mergePipeline,
+    const ChunkManager& chunkManager) {
+
+    const ShardKeyPattern& shardKey = chunkManager.getShardKeyPattern();
+    std::set<std::string> shardKeyPaths;
+    for (auto&& path : shardKey.getKeyPatternFields()) {
+        shardKeyPaths.emplace(path->dottedField().toString());
+    }
+    if (anyStageModifiesShardKeyOrNeedsMerge(shardKeyPaths, mergePipeline)) {
+        return boost::none;
+    }
+
+    // All the fields of the shard key are preserved by the pipeline, but they might be renamed.
+    // To set up the $exchange, we need to build a fake shard key pattern which uses the names of
+    // the shard key fields as they are at the split point of the pipeline.
+    auto renames = computeShardKeyRenameMap(mergePipeline, std::move(shardKeyPaths));
+    ShardKeyPattern newShardKey(buildNewKeyPattern(shardKey, renames));
+
+    // Given the new shard key fields, build the distribution map.
+    StringMap<std::vector<ChunkRange>> distribution;
+    for (auto&& chunk : chunkManager.chunks()) {
+        // Append the boundaries with the new names from the new shard key.
+        auto translateBoundary = [&renames](const BSONObj& oldBoundary) {
+            BSONObjBuilder bob;
+            for (auto&& elem : oldBoundary) {
+                bob.appendAs(elem, renames[elem.fieldNameStringData()]);
+            }
+            return bob.obj();
+        };
+        distribution[chunk.getShardId().toString()].emplace_back(translateBoundary(chunk.getMin()),
+                                                                 translateBoundary(chunk.getMax()));
+    }
+    return ShardedExchangePolicy{
+        ExchangePolicyEnum::kRange,
+        ShardDistributionInfo{ShardKeyPattern{std::move(newShardKey)}, std::move(distribution)}};
+}
+
 }  // namespace
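The distribution map built above pairs each shard id with the chunk ranges it owns, after rewriting every boundary with the shard key's name at the split point. A self-contained approximation of that loop and its translateBoundary lambda, with plain containers in place of BSONObj and ChunkRange (hypothetical names, not the server's types):

// Sketch only: shard id -> translated chunk ranges, standalone.
#include <iostream>
#include <map>
#include <string>
#include <utility>
#include <vector>

using Boundary = std::map<std::string, std::string>;  // field name -> value
using Range = std::pair<Boundary, Boundary>;          // [min, max)

struct Chunk {
    std::string shardId;
    Boundary min;
    Boundary max;
};

std::map<std::string, std::vector<Range>> buildDistribution(
    const std::vector<Chunk>& chunks, const std::map<std::string, std::string>& renames) {
    // Rewrites each boundary using the shard key's name at the split point.
    auto translate = [&renames](const Boundary& oldBoundary) {
        Boundary translated;
        for (const auto& elem : oldBoundary) {
            translated[renames.at(elem.first)] = elem.second;
        }
        return translated;
    };
    std::map<std::string, std::vector<Range>> distribution;
    for (const auto& chunk : chunks) {
        distribution[chunk.shardId].emplace_back(translate(chunk.min), translate(chunk.max));
    }
    return distribution;
}

int main() {
    // Two chunks of a collection sharded by {word: 1}, where "word" was still
    // called "_id" at the split point of the merging pipeline.
    std::vector<Chunk> chunks = {{"0", {{"word", "MinKey"}}, {{"word", "hello"}}},
                                 {"1", {{"word", "hello"}}, {{"word", "MaxKey"}}}};
    auto distribution = buildDistribution(chunks, {{"word", "_id"}});
    std::cout << distribution["1"].size() << "\n";  // one range routed to shard "1"
}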
 
 SplitPipeline splitPipeline(std::unique_ptr<Pipeline, PipelineDeleter> pipeline) {
@@ -254,5 +388,36 @@ ClusterClientCursorGuard buildClusterCursor(OperationContext* opCtx,
         opCtx, std::make_unique<RouterStagePipeline>(std::move(pipeline)), std::move(cursorParams));
 }
 
+boost::optional<ShardedExchangePolicy> checkIfEligibleForExchange(OperationContext* opCtx,
+                                                                  const Pipeline* mergePipeline) {
+    const auto grid = Grid::get(opCtx);
+    invariant(grid);
+
+    const auto outStage =
+        dynamic_cast<DocumentSourceOut*>(mergePipeline->getSources().back().get());
+    if (!outStage || outStage->getMode() == WriteModeEnum::kModeReplaceCollection) {
+        // If there's no $out stage we won't try to do an $exchange. If the $out stage is using
+        // mode "replaceCollection", then there's no point doing an $exchange because all the
+        // writes will go to a single node, so we should just perform the merge on that host.
+        return boost::none;
+    }
+
+    const auto routingInfo = uassertStatusOK(
+        grid->catalogCache()->getCollectionRoutingInfo(opCtx, outStage->getOutputNs()));
+    if (!routingInfo.cm()) {
+        return boost::none;
+    }
+
+    // The collection is sharded and we have an $out stage! Here we assume the $out stage has
+    // already verified that the shard key pattern is compatible with the unique key being used.
+    // Assuming this, we just have to make sure the shard key is preserved (though possibly
+    // renamed) all the way to the front of the merge pipeline. If this is the case then for any
+    // document entering the merging pipeline we can predict which shard it will need to end up
+    // being inserted on. With this ability we can insert an exchange on the shards to partition
+    // the documents based on which shard will end up owning them. Then each shard can perform a
+    // merge of only those documents which belong to it (optimistically, barring chunk migrations).
+    return walkPipelineBackwardsTrackingShardKey(opCtx, outStage, mergePipeline, *routingInfo.cm());
+}
+
 }  // namespace cluster_aggregation_planner
 }  // namespace mongo
diff --git a/src/mongo/s/query/cluster_aggregation_planner.h b/src/mongo/s/query/cluster_aggregation_planner.h
index 3b3aaa63df4..8a5f494cff2 100644
--- a/src/mongo/s/query/cluster_aggregation_planner.h
+++ b/src/mongo/s/query/cluster_aggregation_planner.h
@@ -28,9 +28,12 @@
 
 #pragma once
 
+#include "mongo/db/pipeline/document_source_exchange_gen.h"
 #include "mongo/db/pipeline/lite_parsed_pipeline.h"
 #include "mongo/db/pipeline/pipeline.h"
+#include "mongo/s/catalog/type_chunk.h"
 #include "mongo/s/query/cluster_client_cursor_impl.h"
+#include "mongo/s/shard_id.h"
 
 namespace mongo {
 namespace cluster_aggregation_planner {
@@ -89,5 +93,29 @@ ClusterClientCursorGuard buildClusterCursor(OperationContext* opCtx,
                                             std::unique_ptr<Pipeline, PipelineDeleter> pipeline,
                                             ClusterClientCursorParams&&);
 
+struct ShardDistributionInfo {
+    // If we want to send data to the shards which would own it, 'logicalShardKeyAtSplitPoint'
+    // describes which fields to use to determine what the final shard key will be. For example,
+    // if the merging pipeline renames "x" to "out_shard_key" and then uses $out to output to a
+    // collection sharded by {out_shard_key: 1}, 'logicalShardKeyAtSplitPoint' will be {x: 1}.
+    ShardKeyPattern logicalShardKeyAtSplitPoint;
+
+    // This map describes which shard is going to receive which range. The keys are the shard ids.
+    StringMap<std::vector<ChunkRange>> partitions;
+};
+
+struct ShardedExchangePolicy {
+    ExchangePolicyEnum policy;
+
+    // Only set if the policy is ranged.
+    boost::optional<ShardDistributionInfo> shardDistributionInfo;
+};
+
+/**
+ * If the merging pipeline is eligible for an $exchange merge optimization, returns the information
+ * required to set that up.
+ */
+boost::optional<ShardedExchangePolicy> checkIfEligibleForExchange(OperationContext* opCtx,
+                                                                  const Pipeline* mergePipeline);
 }  // namespace cluster_aggregation_planner
 }  // namespace mongo
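A consumer of these structs would branch on the policy and, for a ranged policy, read the partitions map. A standalone sketch of that shape, using simplified analogs of the structs above (std::optional stands in for boost::optional, and all names are hypothetical, not the server's consumer code):

// Sketch only: inspecting a returned exchange policy, standalone.
#include <iostream>
#include <map>
#include <optional>
#include <string>
#include <vector>

enum class ExchangePolicy { kRoundRobin, kRange };

struct DistributionInfo {
    std::string logicalShardKeyAtSplitPoint;                      // e.g. "{x: 1}"
    std::map<std::string, std::vector<std::string>> partitions;   // shard id -> ranges
};

struct ExchangeSpec {
    ExchangePolicy policy;
    std::optional<DistributionInfo> shardDistributionInfo;  // only set for kRange
};

void describe(const std::optional<ExchangeSpec>& spec) {
    if (!spec) {
        std::cout << "not eligible for $exchange; merge on one node\n";
        return;
    }
    if (spec->policy == ExchangePolicy::kRange && spec->shardDistributionInfo) {
        std::cout << "range exchange on " << spec->shardDistributionInfo->logicalShardKeyAtSplitPoint
                  << " across " << spec->shardDistributionInfo->partitions.size() << " shard(s)\n";
    }
}

int main() {
    ExchangeSpec spec{ExchangePolicy::kRange,
                      DistributionInfo{"{x: 1}", {{"0", {"[MinKey, 0)"}}, {"1", {"[0, MaxKey)"}}}}};
    describe(spec);  // range exchange on {x: 1} across 2 shard(s)
}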
diff --git a/src/mongo/s/query/cluster_aggregation_planner_test.cpp b/src/mongo/s/query/cluster_aggregation_planner_test.cpp
new file mode 100644
index 00000000000..10782443e35
--- /dev/null
+++ b/src/mongo/s/query/cluster_aggregation_planner_test.cpp
@@ -0,0 +1,545 @@
+/**
+ * Copyright (C) 2018 MongoDB Inc.
+ *
+ * This program is free software: you can redistribute it and/or modify
+ * it under the terms of the GNU Affero General Public License, version 3,
+ * as published by the Free Software Foundation.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ * GNU Affero General Public License for more details.
+ *
+ * You should have received a copy of the GNU Affero General Public License
+ * along with this program. If not, see <http://www.gnu.org/licenses/>.
+ *
+ * As a special exception, the copyright holders give permission to link the
+ * code of portions of this program with the OpenSSL library under certain
+ * conditions as described in each individual source file and distribute
+ * linked combinations including the program with the OpenSSL library. You
+ * must comply with the GNU Affero General Public License in all respects
+ * for all of the code used other than as permitted herein. If you modify
+ * file(s) with this exception, you may extend this exception to your
+ * version of the file(s), but you are not obligated to do so. If you do not
+ * wish to do so, delete this exception statement from your version. If you
+ * delete this exception statement from all source files in the program,
+ * then also delete it in the license file.
+ */
+
+#include "mongo/platform/basic.h"
+
+
+#include "mongo/client/remote_command_targeter_factory_mock.h"
+#include "mongo/client/remote_command_targeter_mock.h"
+#include "mongo/db/pipeline/document_source_group.h"
+#include "mongo/db/pipeline/document_source_match.h"
+#include "mongo/db/pipeline/document_source_out.h"
+#include "mongo/db/pipeline/document_source_out_gen.h"
+#include "mongo/db/pipeline/document_source_project.h"
+#include "mongo/db/pipeline/document_source_sort.h"
+#include "mongo/db/pipeline/expression_context_for_test.h"
+#include "mongo/db/pipeline/stub_mongo_process_interface.h"
+#include "mongo/s/catalog/type_shard.h"
+#include "mongo/s/catalog_cache_test_fixture.h"
+#include "mongo/s/query/cluster_aggregation_planner.h"
+#include "mongo/unittest/unittest.h"
+#include "mongo/util/scopeguard.h"
+
+namespace mongo {
+
+namespace {
+
+const NamespaceString kTestAggregateNss = NamespaceString{"unittests", "cluster_exchange"};
+const NamespaceString kTestOutNss = NamespaceString{"unittests", "out_ns"};
+
+/**
+ * For the purposes of this test, assume every collection is sharded. Stages may ask this during
+ * setup. For example, to compute its constraints, the $out stage needs to know if the output
+ * collection is sharded.
+ */
+class FakeMongoProcessInterface : public StubMongoProcessInterface {
+public:
+    bool isSharded(OperationContext* opCtx, const NamespaceString& ns) override {
+        return true;
+    }
+};
+
+class ClusterExchangeTest : public CatalogCacheTestFixture {
+public:
+    void setUp() {
+        CatalogCacheTestFixture::setUp();
+        _expCtx = new ExpressionContextForTest(operationContext(),
+                                               AggregationRequest{kTestAggregateNss, {}});
+        _expCtx->mongoProcessInterface = std::make_shared<FakeMongoProcessInterface>();
+    }
+
+    boost::intrusive_ptr<ExpressionContext> expCtx() {
+        return _expCtx;
+    }
+
+    boost::intrusive_ptr<DocumentSource> parse(const std::string& json) {
+        auto stages = DocumentSource::parse(_expCtx, fromjson(json));
+        ASSERT_EQ(stages.size(), 1UL);
+        return stages.front();
+    }
+
+    std::vector<ChunkType> makeChunks(const NamespaceString& nss,
+                                      const OID epoch,
+                                      std::vector<std::pair<ChunkRange, ShardId>> chunkInfos) {
+        ChunkVersion version(1, 0, epoch);
+        std::vector<ChunkType> chunks;
+        for (auto&& pair : chunkInfos) {
+            chunks.emplace_back(nss, pair.first, version, pair.second);
+            version.incMinor();
+        }
+        return chunks;
+    }
+
+    void loadRoutingTable(NamespaceString nss,
+                          const OID epoch,
+                          const ShardKeyPattern& shardKey,
+                          const std::vector<ChunkType>& chunkDistribution) {
+        auto future = scheduleRoutingInfoRefresh(nss);
+
+        // Mock the expected config server queries.
+        expectGetDatabase(nss);
+        expectGetCollection(nss, epoch, shardKey);
+        expectGetCollection(nss, epoch, shardKey);
+        expectFindSendBSONObjVector(kConfigHostAndPort, [&]() {
+            std::vector<BSONObj> response;
+            for (auto&& chunk : chunkDistribution) {
+                response.push_back(chunk.toConfigBSON());
+            }
+            return response;
+        }());
+
+        future.timed_get(kFutureTimeout).get();
+    }
+
+private:
+    boost::intrusive_ptr<ExpressionContext> _expCtx;
+};
+
+TEST_F(ClusterExchangeTest, ShouldNotExchangeIfPipelineDoesNotEndWithOut) {
+    setupNShards(2);
+    auto mergePipe =
+        unittest::assertGet(Pipeline::create({DocumentSourceLimit::create(expCtx(), 1)}, expCtx()));
+    ASSERT_FALSE(cluster_aggregation_planner::checkIfEligibleForExchange(operationContext(),
+                                                                         mergePipe.get()));
+    mergePipe = unittest::assertGet(
+        Pipeline::create({DocumentSourceMatch::create(BSONObj(), expCtx())}, expCtx()));
+    ASSERT_FALSE(cluster_aggregation_planner::checkIfEligibleForExchange(operationContext(),
+                                                                         mergePipe.get()));
+}
+
+TEST_F(ClusterExchangeTest, ShouldNotExchangeIfPipelineEndsWithReplaceCollectionOut) {
+    setupNShards(2);
+
+    // For this test pretend 'kTestOutNss' is not sharded so that we can use a "replaceCollection"
+    // $out.
+    const auto originalMongoProcessInterface = expCtx()->mongoProcessInterface;
+    expCtx()->mongoProcessInterface = std::make_shared<StubMongoProcessInterface>();
+    ON_BLOCK_EXIT([&]() { expCtx()->mongoProcessInterface = originalMongoProcessInterface; });
+
+    auto mergePipe = unittest::assertGet(Pipeline::create(
+        {DocumentSourceOut::create(kTestOutNss, expCtx(), WriteModeEnum::kModeReplaceCollection)},
+        expCtx()));
+    ASSERT_FALSE(cluster_aggregation_planner::checkIfEligibleForExchange(operationContext(),
+                                                                         mergePipe.get()));
+}
+
+TEST_F(ClusterExchangeTest, SingleOutStageNotEligibleForExchangeIfOutputDatabaseDoesNotExist) {
+    setupNShards(2);
+    auto mergePipe = unittest::assertGet(Pipeline::create(
+        {DocumentSourceOut::create(kTestOutNss, expCtx(), WriteModeEnum::kModeInsertDocuments)},
+        expCtx()));
+
+    auto future = launchAsync([&] {
+        ASSERT_THROWS_CODE(cluster_aggregation_planner::checkIfEligibleForExchange(
+                               operationContext(), mergePipe.get()),
+                           AssertionException,
+                           ErrorCodes::NamespaceNotFound);
+    });
+
+    // Mock out a response as if the database doesn't exist.
+    expectFindSendBSONObjVector(kConfigHostAndPort, []() { return std::vector<BSONObj>{}; }());
+    expectFindSendBSONObjVector(kConfigHostAndPort, []() { return std::vector<BSONObj>{}; }());
+
+    future.timed_get(kFutureTimeout);
+}
+
+// If the output collection doesn't exist, we don't know how to distribute the output documents so
+// cannot insert an $exchange. The $out stage should later create a new, unsharded collection.
+TEST_F(ClusterExchangeTest, SingleOutStageNotEligibleForExchangeIfOutputCollectionDoesNotExist) {
+    setupNShards(2);
+    auto mergePipe = unittest::assertGet(Pipeline::create(
+        {DocumentSourceOut::create(kTestOutNss, expCtx(), WriteModeEnum::kModeInsertDocuments)},
+        expCtx()));
+
+    auto future = launchAsync([&] {
+        ASSERT_FALSE(cluster_aggregation_planner::checkIfEligibleForExchange(operationContext(),
+                                                                             mergePipe.get()));
+    });
+
+    expectGetDatabase(kTestOutNss);
+    // Pretend there are no collections in this database.
+    expectFindSendBSONObjVector(kConfigHostAndPort, std::vector<BSONObj>());
+
+    future.timed_get(kFutureTimeout);
+}
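The tests so far exercise the early-outs of checkIfEligibleForExchange(): no trailing $out, a "replaceCollection" $out, a missing output database, and a missing (therefore unsharded) output collection. Condensed into a standalone decision function, with hypothetical types; this only loosely mirrors the real control flow, which surfaces the missing database through uassertStatusOK:

// Sketch only: the eligibility early-outs as one standalone function.
#include <iostream>
#include <optional>
#include <stdexcept>
#include <string>

struct MergePipelineInfo {
    bool endsWithOut;               // last stage is $out
    bool outModeReplaceCollection;  // $out mode == "replaceCollection"
    bool outputDatabaseExists;
    bool outputCollectionSharded;
};

std::optional<std::string> checkEligibility(const MergePipelineInfo& info) {
    if (!info.endsWithOut || info.outModeReplaceCollection) {
        return std::nullopt;  // nothing to distribute, or all writes hit one node anyway
    }
    if (!info.outputDatabaseExists) {
        throw std::runtime_error("NamespaceNotFound");  // the real code throws here too
    }
    if (!info.outputCollectionSharded) {
        return std::nullopt;  // $out will create a new, unsharded collection
    }
    return std::string{"candidate for range exchange"};
}

int main() {
    MergePipelineInfo info{true, false, true, true};
    std::cout << *checkEligibility(info) << "\n";
}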
+
+// A $limit stage requires a single merger.
+TEST_F(ClusterExchangeTest, LimitFollowedByOutStageIsNotEligibleForExchange) {
+    // Sharded by {_id: 1}, [MinKey, 0) on shard "0", [0, MaxKey) on shard "1".
+    setupNShards(2);
+    loadRoutingTableWithTwoChunksAndTwoShards(kTestOutNss);
+
+    auto mergePipe = unittest::assertGet(Pipeline::create(
+        {DocumentSourceLimit::create(expCtx(), 6),
+         DocumentSourceOut::create(kTestOutNss, expCtx(), WriteModeEnum::kModeInsertDocuments)},
+        expCtx()));
+
+    auto future = launchAsync([&] {
+        ASSERT_FALSE(cluster_aggregation_planner::checkIfEligibleForExchange(operationContext(),
+                                                                             mergePipe.get()));
+    });
+
+    future.timed_get(kFutureTimeout);
+}
+
+TEST_F(ClusterExchangeTest, GroupFollowedByOutIsEligibleForExchange) {
+    // Sharded by {_id: 1}, [MinKey, 0) on shard "0", [0, MaxKey) on shard "1".
+    setupNShards(2);
+    loadRoutingTableWithTwoChunksAndTwoShards(kTestOutNss);
+
+    auto mergePipe = unittest::assertGet(Pipeline::create(
+        {parse("{$group: {_id: '$x', $doingMerge: true}}"),
+         DocumentSourceOut::create(kTestOutNss, expCtx(), WriteModeEnum::kModeInsertDocuments)},
+        expCtx()));
+
+    auto future = launchAsync([&] {
+        auto exchangeSpec = cluster_aggregation_planner::checkIfEligibleForExchange(
+            operationContext(), mergePipe.get());
+        ASSERT_TRUE(exchangeSpec);
+        ASSERT(exchangeSpec->policy == ExchangePolicyEnum::kRange);
+        ASSERT_TRUE(exchangeSpec->shardDistributionInfo);
+        const auto& partitions = exchangeSpec->shardDistributionInfo->partitions;
+        ASSERT_EQ(partitions.size(), 2UL);  // One for each shard.
+
+        auto shard0Ranges = partitions.find("0");
+        ASSERT(shard0Ranges != partitions.end());
+        ASSERT_EQ(shard0Ranges->second.size(), 1UL);
+        auto shard0Range = shard0Ranges->second[0];
+        ASSERT(shard0Range == ChunkRange(BSON("_id" << MINKEY), BSON("_id" << 0)));
+    });
+
+    future.timed_get(kFutureTimeout);
+}
+
+TEST_F(ClusterExchangeTest, RenamesAreEligibleForExchange) {
+    // Sharded by {_id: 1}, [MinKey, 0) on shard "0", [0, MaxKey) on shard "1".
+    setupNShards(2);
+    loadRoutingTableWithTwoChunksAndTwoShards(kTestOutNss);
+
+    auto mergePipe = unittest::assertGet(Pipeline::create(
+        {parse("{$group: {_id: '$x', $doingMerge: true}}"),
+         parse("{$project: {temporarily_renamed: '$_id'}}"),
+         parse("{$project: {_id: '$temporarily_renamed'}}"),
+         DocumentSourceOut::create(kTestOutNss, expCtx(), WriteModeEnum::kModeInsertDocuments)},
+        expCtx()));
+
+    auto future = launchAsync([&] {
+        auto exchangeSpec = cluster_aggregation_planner::checkIfEligibleForExchange(
+            operationContext(), mergePipe.get());
+        ASSERT_TRUE(exchangeSpec);
+        ASSERT(exchangeSpec->policy == ExchangePolicyEnum::kRange);
+        ASSERT_TRUE(exchangeSpec->shardDistributionInfo);
+        const auto& partitions = exchangeSpec->shardDistributionInfo->partitions;
+        ASSERT_EQ(partitions.size(), 2UL);  // One for each shard.
+
+        auto shard0Ranges = partitions.find("0");
+        ASSERT(shard0Ranges != partitions.end());
+        ASSERT_EQ(shard0Ranges->second.size(), 1UL);
+        auto shard0Range = shard0Ranges->second[0];
+        ASSERT(shard0Range == ChunkRange(BSON("_id" << MINKEY), BSON("_id" << 0)));
+
+        auto shard1Ranges = partitions.find("1");
+        ASSERT(shard1Ranges != partitions.end());
+        ASSERT_EQ(shard1Ranges->second.size(), 1UL);
+        auto shard1Range = shard1Ranges->second[0];
+        ASSERT(shard1Range == ChunkRange(BSON("_id" << 0), BSON("_id" << MAXKEY)));
+    });
+
+    future.timed_get(kFutureTimeout);
+}
+
+TEST_F(ClusterExchangeTest, SortThenGroupIsEligibleForExchange) {
+    // Sharded by {_id: 1}, [MinKey, 0) on shard "0", [0, MaxKey) on shard "1".
+    setupNShards(2);
+    loadRoutingTableWithTwoChunksAndTwoShards(kTestOutNss);
+
+    // This would be the merging half of the pipeline if the original pipeline was
+    // [{$sort: {x: 1}},
+    //  {$group: {_id: "$x"}},
+    //  {$out: {to: "sharded_by_id", mode: "replaceDocuments"}}].
+    // No $sort stage appears in the merging half since we'd expect that to be absorbed by the
+    // $mergeCursors and AsyncResultsMerger.
+    auto mergePipe = unittest::assertGet(Pipeline::create(
+        {parse("{$group: {_id: '$x'}}"),
+         DocumentSourceOut::create(kTestOutNss, expCtx(), WriteModeEnum::kModeInsertDocuments)},
+        expCtx()));
+
+    auto future = launchAsync([&] {
+        auto exchangeSpec = cluster_aggregation_planner::checkIfEligibleForExchange(
+            operationContext(), mergePipe.get());
+        ASSERT_TRUE(exchangeSpec);
+        ASSERT(exchangeSpec->policy == ExchangePolicyEnum::kRange);
+        ASSERT_TRUE(exchangeSpec->shardDistributionInfo);
+        ASSERT_BSONOBJ_EQ(exchangeSpec->shardDistributionInfo->logicalShardKeyAtSplitPoint.toBSON(),
+                          BSON("x" << 1));
+        const auto& partitions = exchangeSpec->shardDistributionInfo->partitions;
+        ASSERT_EQ(partitions.size(), 2UL);  // One for each shard.
+
+        auto shard0Ranges = partitions.find("0");
+        ASSERT(shard0Ranges != partitions.end());
+        ASSERT_EQ(shard0Ranges->second.size(), 1UL);
+        auto shard0Range = shard0Ranges->second[0];
+        ASSERT(shard0Range == ChunkRange(BSON("x" << MINKEY), BSON("x" << 0)));
+
+        auto shard1Ranges = partitions.find("1");
+        ASSERT(shard1Ranges != partitions.end());
+        ASSERT_EQ(shard1Ranges->second.size(), 1UL);
+        auto shard1Range = shard1Ranges->second[0];
+        ASSERT(shard1Range == ChunkRange(BSON("x" << 0), BSON("x" << MAXKEY)));
+    });
+
+    future.timed_get(kFutureTimeout);
+}
+
+TEST_F(ClusterExchangeTest, ProjectThroughDottedFieldDoesNotPreserveShardKey) {
+    // Sharded by {_id: 1}, [MinKey, 0) on shard "0", [0, MaxKey) on shard "1".
+    setupNShards(2);
+    loadRoutingTableWithTwoChunksAndTwoShards(kTestOutNss);
+
+    auto mergePipe = unittest::assertGet(Pipeline::create(
+        {parse("{$group: {"
+               " _id: {region: '$region', country: '$country'},"
+               " population: {$sum: '$population'},"
+               " cities: {$push: {name: '$city', population: '$population'}}"
+               "}}"),
+         parse(
+             "{$project: {_id: '$_id.country', region: '$_id.region', population: 1, cities: 1}}"),
+         DocumentSourceOut::create(kTestOutNss, expCtx(), WriteModeEnum::kModeInsertDocuments)},
+        expCtx()));
+
+    auto future = launchAsync([&] {
+        auto exchangeSpec = cluster_aggregation_planner::checkIfEligibleForExchange(
+            operationContext(), mergePipe.get());
+        // Because '_id' is populated from '$_id.country', we cannot prove that '_id' is a simple
+        // rename. We cannot prove that '_id' is not an array, and thus the $project could do more
+        // than a rename.
+        ASSERT_FALSE(exchangeSpec);
+    });
+
+    future.timed_get(kFutureTimeout);
+}
+
+TEST_F(ClusterExchangeTest, WordCountUseCaseExample) {
+    // Sharded by {_id: 1}, [MinKey, 0) on shard "0", [0, MaxKey) on shard "1".
+    setupNShards(2);
+    loadRoutingTableWithTwoChunksAndTwoShards(kTestOutNss);
+
+    // As an example of a pipeline that might replace a map reduce, imagine that we are performing
+    // a word count, and the shards part of the pipeline tokenized some text field of each
+    // document into {word: <token>, count: 1}. Then this is the merging half of the pipeline:
+    auto mergePipe = unittest::assertGet(Pipeline::create(
+        {parse("{$group: {"
+               " _id: '$word',"
+               " count: {$sum: 1},"
+               " $doingMerge: true"
+               "}}"),
+         DocumentSourceOut::create(kTestOutNss, expCtx(), WriteModeEnum::kModeInsertDocuments)},
+        expCtx()));
+
+    auto future = launchAsync([&] {
+        auto exchangeSpec = cluster_aggregation_planner::checkIfEligibleForExchange(
+            operationContext(), mergePipe.get());
+        ASSERT_TRUE(exchangeSpec);
+        ASSERT(exchangeSpec->policy == ExchangePolicyEnum::kRange);
+        ASSERT_TRUE(exchangeSpec->shardDistributionInfo);
+        const auto& partitions = exchangeSpec->shardDistributionInfo->partitions;
+        ASSERT_EQ(partitions.size(), 2UL);  // One for each shard.
+
+        auto shard0Ranges = partitions.find("0");
+        ASSERT(shard0Ranges != partitions.end());
+        ASSERT_EQ(shard0Ranges->second.size(), 1UL);
+        auto shard0Range = shard0Ranges->second[0];
+        ASSERT(shard0Range == ChunkRange(BSON("_id" << MINKEY), BSON("_id" << 0)));
+
+        auto shard1Ranges = partitions.find("1");
+        ASSERT(shard1Ranges != partitions.end());
+        ASSERT_EQ(shard1Ranges->second.size(), 1UL);
+        auto shard1Range = shard1Ranges->second[0];
+        ASSERT(shard1Range == ChunkRange(BSON("_id" << 0), BSON("_id" << MAXKEY)));
+    });
+
+    future.timed_get(kFutureTimeout);
+}
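Once a range policy like the one asserted above is in place, routing a merged document is just a lookup of its key in the shard-to-ranges map. A standalone sketch using string comparison in place of BSON ordering (hypothetical names; empty strings stand in for the MinKey/MaxKey sentinels):

// Sketch only: routing one merged word-count document to its owning shard.
#include <iostream>
#include <map>
#include <string>
#include <vector>

struct Range {
    std::string min, max;  // [min, max); "" means MinKey/MaxKey
};

std::string findOwningShard(const std::map<std::string, std::vector<Range>>& partitions,
                            const std::string& key) {
    for (const auto& shard : partitions) {
        for (const auto& range : shard.second) {
            const bool aboveMin = range.min.empty() || key >= range.min;
            const bool belowMax = range.max.empty() || key < range.max;
            if (aboveMin && belowMax) {
                return shard.first;
            }
        }
    }
    return "";  // no owner found (should not happen for a complete partition set)
}

int main() {
    // Mirrors the sharded-by-word test below: [MinKey, "hello") on shard "0",
    // ["hello", "world") and ["world", MaxKey) on shard "1".
    std::map<std::string, std::vector<Range>> partitions = {
        {"0", {{"", "hello"}}}, {"1", {{"hello", "world"}, {"world", ""}}}};
    std::cout << findOwningShard(partitions, "mongodb") << "\n";  // prints "1"
}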
+
+TEST_F(ClusterExchangeTest, WordCountUseCaseExampleShardedByWord) {
+    setupNShards(2);
+    const OID epoch = OID::gen();
+    ShardKeyPattern shardKey(BSON("word" << 1));
+    loadRoutingTable(kTestOutNss,
+                     epoch,
+                     shardKey,
+                     makeChunks(kTestOutNss,
+                                epoch,
+                                {{ChunkRange{BSON("word" << MINKEY),
+                                             BSON("word"
+                                                  << "hello")},
+                                  ShardId("0")},
+                                 {ChunkRange{BSON("word"
+                                                  << "hello"),
+                                             BSON("word"
+                                                  << "world")},
+                                  ShardId("1")},
+                                 {ChunkRange{BSON("word"
+                                                  << "world"),
+                                             BSON("word" << MAXKEY)},
+                                  ShardId("1")}}));
+
+    // As an example of a pipeline that might replace a map reduce, imagine that we are performing
+    // a word count, and the shards part of the pipeline tokenized some text field of each
+    // document into {word: <token>, count: 1}. Then this is the merging half of the pipeline:
+    auto mergePipe = unittest::assertGet(Pipeline::create(
+        {parse("{$group: {"
+               " _id: '$word',"
+               " count: {$sum: 1},"
+               " $doingMerge: true"
+               "}}"),
+         parse("{$project: {word: '$_id', count: 1}}"),
+         DocumentSourceOut::create(kTestOutNss, expCtx(), WriteModeEnum::kModeInsertDocuments)},
+        expCtx()));
+
+    auto future = launchAsync([&] {
+        auto exchangeSpec = cluster_aggregation_planner::checkIfEligibleForExchange(
+            operationContext(), mergePipe.get());
+        ASSERT_TRUE(exchangeSpec);
+        ASSERT(exchangeSpec->policy == ExchangePolicyEnum::kRange);
+        ASSERT_TRUE(exchangeSpec->shardDistributionInfo);
+        ASSERT_BSONOBJ_EQ(exchangeSpec->shardDistributionInfo->logicalShardKeyAtSplitPoint.toBSON(),
+                          BSON("_id" << 1));
+        const auto& partitions = exchangeSpec->shardDistributionInfo->partitions;
+        ASSERT_EQ(partitions.size(), 2UL);  // One for each shard.
+
+        auto shard0Ranges = partitions.find("0");
+        ASSERT(shard0Ranges != partitions.end());
+        ASSERT_EQ(shard0Ranges->second.size(), 1UL);
+        auto firstRangeOnShard0 = shard0Ranges->second[0];
+        ASSERT(firstRangeOnShard0 == ChunkRange(BSON("_id" << MINKEY),
+                                                BSON("_id"
+                                                     << "hello")));
+
+        auto shard1Ranges = partitions.find("1");
+        ASSERT(shard1Ranges != partitions.end());
+        ASSERT_EQ(shard1Ranges->second.size(), 2UL);
+        auto firstRangeOnShard1 = shard1Ranges->second[0];
+        ASSERT(firstRangeOnShard1 == ChunkRange(BSON("_id"
+                                                     << "hello"),
+                                                BSON("_id"
+                                                     << "world")));
+        auto secondRangeOnShard1 = shard1Ranges->second[1];
+        ASSERT(secondRangeOnShard1 == ChunkRange(BSON("_id"
+                                                      << "world"),
+                                                 BSON("_id" << MAXKEY)));
+    });
+
+    future.timed_get(kFutureTimeout);
+}
+
+// We'd like to test that a compound shard key pattern can be used. Oddly, the only case in which
+// we can actually perform an exchange on a compound shard key today is when all of the shard
+// key's fields are duplicates of one another. This is due to the limitations of tracking renames
+// through dotted paths; see SERVER-36787 for an example.
+TEST_F(ClusterExchangeTest, CompoundShardKeyThreeShards) {
+    const OID epoch = OID::gen();
+    ShardKeyPattern shardKey(BSON("x" << 1 << "y" << 1));
+
+    setupNShards(3);
+    const std::vector<std::string> xBoundaries = {"a", "g", "m", "r", "u"};
+    auto chunks = [&]() {
+        std::vector<ChunkType> chunks;
+        ChunkVersion version(1, 0, epoch);
+        chunks.emplace_back(kTestOutNss,
+                            ChunkRange{BSON("x" << MINKEY << "y" << MINKEY),
+                                       BSON("x" << xBoundaries[0] << "y" << MINKEY)},
+                            version,
+                            ShardId("0"));
+        for (std::size_t i = 0; i < xBoundaries.size() - 1; ++i) {
+            chunks.emplace_back(kTestOutNss,
+                                ChunkRange{BSON("x" << xBoundaries[i] << "y" << MINKEY),
+                                           BSON("x" << xBoundaries[i + 1] << "y" << MINKEY)},
+                                version,
+                                ShardId(str::stream() << i % 3));
+        }
+        chunks.emplace_back(kTestOutNss,
+                            ChunkRange{BSON("x" << xBoundaries.back() << "y" << MINKEY),
+                                       BSON("x" << MAXKEY << "y" << MAXKEY)},
+                            version,
+                            ShardId(str::stream() << "1"));
+        return chunks;
+    }();
+
+    loadRoutingTable(kTestOutNss, epoch, shardKey, chunks);
+
+    auto mergePipe = unittest::assertGet(Pipeline::create(
+        {parse("{$group: {"
+               " _id: '$x',"
+               " $doingMerge: true"
+               "}}"),
+         parse("{$project: {x: '$_id', y: '$_id'}}"),
+         DocumentSourceOut::create(kTestOutNss, expCtx(), WriteModeEnum::kModeInsertDocuments)},
+        expCtx()));
+
+    auto future = launchAsync([&] {
+        auto exchangeSpec = cluster_aggregation_planner::checkIfEligibleForExchange(
+            operationContext(), mergePipe.get());
+        ASSERT_TRUE(exchangeSpec);
+        ASSERT(exchangeSpec->policy == ExchangePolicyEnum::kRange);
+        ASSERT_TRUE(exchangeSpec->shardDistributionInfo);
+        ASSERT_BSONOBJ_EQ(exchangeSpec->shardDistributionInfo->logicalShardKeyAtSplitPoint.toBSON(),
+                          BSON("_id" << 1 << "_id" << 1));
+        const auto& partitions = exchangeSpec->shardDistributionInfo->partitions;
+        ASSERT_EQ(partitions.size(), 3UL);  // One for each shard.
+
+        // Make sure each shard has the same chunks that it started with, just with the names of
+        // the boundary fields translated. For each chunk that we created to begin with, make sure
+        // its corresponding/translated chunk is present on the same shard in the same order.
+        StringMap<std::size_t> numChunksExaminedOnShard = {{"0", 0}, {"1", 0}, {"2", 0}};
+        for (auto&& chunk : chunks) {
+            auto shardId = chunk.getShard().toString();
+            auto shardRanges = partitions.find(shardId);
+            ASSERT(shardRanges != partitions.end());
+            auto nextChunkOnShard = numChunksExaminedOnShard[shardId]++;
+            ASSERT_LT(nextChunkOnShard, shardRanges->second.size());
+            auto outputChunk = shardRanges->second[nextChunkOnShard];
+
+            auto expectedChunkMin = [&]() {
+                ASSERT_EQ(chunk.getMin().nFields(), 2);
+                return BSON("_id" << chunk.getMin()["x"] << "_id" << chunk.getMin()["y"]);
+            }();
+            ASSERT_BSONOBJ_EQ(outputChunk.getMin(), expectedChunkMin);
+
+            auto expectedChunkMax = [&]() {
+                ASSERT_EQ(chunk.getMax().nFields(), 2);
+                return BSON("_id" << chunk.getMax()["x"] << "_id" << chunk.getMax()["y"]);
+            }();
+            ASSERT_BSONOBJ_EQ(outputChunk.getMax(), expectedChunkMax);
+        }
+    });
+
+    future.timed_get(kFutureTimeout);
+}
+}  // namespace
+}  // namespace mongo