// distinct.cpp /** * Copyright (C) 2012-2014 MongoDB Inc. * * This program is free software: you can redistribute it and/or modify * it under the terms of the GNU Affero General Public License, version 3, * as published by the Free Software Foundation. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU Affero General Public License for more details. * * You should have received a copy of the GNU Affero General Public License * along with this program. If not, see . * * As a special exception, the copyright holders give permission to link the * code of portions of this program with the OpenSSL library under certain * conditions as described in each individual source file and distribute * linked combinations including the program with the OpenSSL library. You * must comply with the GNU Affero General Public License in all respects for * all of the code used other than as permitted herein. If you modify file(s) * with this exception, you may extend this exception to your version of the * file(s), but you are not obligated to do so. If you do not wish to do so, * delete this exception statement from your version. If you delete this * exception statement from all source files in the program, then also delete * it in the license file. */ #define MONGO_LOG_DEFAULT_COMPONENT ::mongo::logger::LogComponent::kQuery #include #include #include "mongo/bson/util/bson_extract.h" #include "mongo/db/auth/action_set.h" #include "mongo/db/auth/action_type.h" #include "mongo/db/auth/privilege.h" #include "mongo/db/catalog/collection.h" #include "mongo/db/catalog/database.h" #include "mongo/db/clientcursor.h" #include "mongo/db/commands.h" #include "mongo/db/db_raii.h" #include "mongo/db/exec/working_set_common.h" #include "mongo/db/instance.h" #include "mongo/db/jsobj.h" #include "mongo/db/query/explain.h" #include "mongo/db/query/find_common.h" #include "mongo/db/query/get_executor.h" #include "mongo/db/query/query_planner_common.h" #include "mongo/util/log.h" #include "mongo/util/timer.h" namespace mongo { using std::unique_ptr; using std::string; using std::stringstream; namespace { const char kKeyField[] = "key"; const char kQueryField[] = "query"; } // namespace class DistinctCommand : public Command { public: DistinctCommand() : Command("distinct") {} virtual bool slaveOk() const { return false; } virtual bool slaveOverrideOk() const { return true; } virtual bool supportsWriteConcern(const BSONObj& cmd) const override { return false; } bool supportsReadConcern() const final { return true; } std::size_t reserveBytesForReply() const override { return FindCommon::kInitReplyBufferSize; } virtual void addRequiredPrivileges(const std::string& dbname, const BSONObj& cmdObj, std::vector* out) { ActionSet actions; actions.addAction(ActionType::find); out->push_back(Privilege(parseResourcePattern(dbname, cmdObj), actions)); } virtual void help(stringstream& help) const { help << "{ distinct : 'collection name' , key : 'a.b' , query : {} }"; } /** * Used by explain() and run() to get the PlanExecutor for the query. */ StatusWith> getPlanExecutor(OperationContext* txn, Collection* collection, const string& ns, const BSONObj& cmdObj, bool isExplain) const { // Extract the key field. BSONElement keyElt; auto statusKey = bsonExtractTypedField(cmdObj, kKeyField, BSONType::String, &keyElt); if (!statusKey.isOK()) { return {statusKey}; } string key = keyElt.valuestrsafe(); // Extract the query field. If the query field is nonexistent, an empty query is used. BSONObj query; if (BSONElement queryElt = cmdObj[kQueryField]) { if (queryElt.type() == BSONType::Object) { query = queryElt.embeddedObject(); } else if (queryElt.type() != BSONType::jstNULL) { return Status(ErrorCodes::TypeMismatch, str::stream() << "\"" << kQueryField << "\" had the wrong type. Expected " << typeName(BSONType::Object) << " or " << typeName(BSONType::jstNULL) << ", found " << typeName(queryElt.type())); } } auto executor = getExecutorDistinct( txn, collection, ns, query, key, isExplain, PlanExecutor::YIELD_AUTO); if (!executor.isOK()) { return executor.getStatus(); } return std::move(executor.getValue()); } virtual Status explain(OperationContext* txn, const std::string& dbname, const BSONObj& cmdObj, ExplainCommon::Verbosity verbosity, const rpc::ServerSelectionMetadata&, BSONObjBuilder* out) const { const string ns = parseNs(dbname, cmdObj); AutoGetCollectionForRead ctx(txn, ns); Collection* collection = ctx.getCollection(); StatusWith> executor = getPlanExecutor(txn, collection, ns, cmdObj, true); if (!executor.isOK()) { return executor.getStatus(); } Explain::explainStages(executor.getValue().get(), verbosity, out); return Status::OK(); } bool run(OperationContext* txn, const string& dbname, BSONObj& cmdObj, int, string& errmsg, BSONObjBuilder& result) { Timer t; const string ns = parseNs(dbname, cmdObj); AutoGetCollectionForRead ctx(txn, ns); Collection* collection = ctx.getCollection(); auto executor = getPlanExecutor(txn, collection, ns, cmdObj, false); if (!executor.isOK()) { return appendCommandStatus(result, executor.getStatus()); } string key = cmdObj[kKeyField].valuestrsafe(); int bufSize = BSONObjMaxUserSize - 4096; BufBuilder bb(bufSize); char* start = bb.buf(); BSONArrayBuilder arr(bb); BSONElementSet values; BSONObj obj; PlanExecutor::ExecState state; while (PlanExecutor::ADVANCED == (state = executor.getValue()->getNext(&obj, NULL))) { // Distinct expands arrays. // // If our query is covered, each value of the key should be in the index key and // available to us without this. If a collection scan is providing the data, we may // have to expand an array. BSONElementSet elts; obj.getFieldsDotted(key, elts); for (BSONElementSet::iterator it = elts.begin(); it != elts.end(); ++it) { BSONElement elt = *it; if (values.count(elt)) { continue; } int currentBufPos = bb.len(); uassert(17217, "distinct too big, 16mb cap", (currentBufPos + elt.size() + 1024) < bufSize); arr.append(elt); BSONElement x(start + currentBufPos); values.insert(x); } } // Return an error if execution fails for any reason. if (PlanExecutor::FAILURE == state || PlanExecutor::DEAD == state) { log() << "Plan executor error during distinct command: " << PlanExecutor::statestr(state) << ", stats: " << Explain::getWinningPlanStats(executor.getValue().get()); return appendCommandStatus(result, Status(ErrorCodes::OperationFailed, str::stream() << "Executor error during distinct command: " << WorkingSetCommon::toStatusString(obj))); } // Get summary information about the plan. PlanSummaryStats stats; Explain::getSummaryStats(*executor.getValue(), &stats); if (collection) { collection->infoCache()->notifyOfQuery(txn, stats.indexesUsed); } CurOp::get(txn)->debug().fromMultiPlanner = stats.fromMultiPlanner; CurOp::get(txn)->debug().replanned = stats.replanned; verify(start == bb.buf()); result.appendArray("values", arr.done()); { BSONObjBuilder b; b.appendNumber("n", stats.nReturned); b.appendNumber("nscanned", stats.totalKeysExamined); b.appendNumber("nscannedObjects", stats.totalDocsExamined); b.appendNumber("timems", t.millis()); b.append("planSummary", Explain::getPlanSummary(executor.getValue().get())); result.append("stats", b.obj()); } return true; } } distinctCmd; } // namespace mongo