/** * Copyright (C) 2018-present MongoDB, Inc. * * This program is free software: you can redistribute it and/or modify * it under the terms of the Server Side Public License, version 1, * as published by MongoDB, Inc. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * Server Side Public License for more details. * * You should have received a copy of the Server Side Public License * along with this program. If not, see * . * * As a special exception, the copyright holders give permission to link the * code of portions of this program with the OpenSSL library under certain * conditions as described in each individual source file and distribute * linked combinations including the program with the OpenSSL library. You * must comply with the Server Side Public License in all respects for * all of the code used other than as permitted herein. If you modify file(s) * with this exception, you may extend this exception to your version of the * file(s), but you are not obligated to do so. If you do not wish to do so, * delete this exception statement from your version. If you delete this * exception statement from all source files in the program, then also delete * it in the license file. */ #pragma once #include "mongo/db/pipeline/document_source_out_gen.h" #include "mongo/db/pipeline/document_source_writer.h" namespace mongo { /** * Implementation for the $out aggregation stage. */ class DocumentSourceOut final : public DocumentSourceWriter { public: static constexpr StringData kStageName = "$out"_sd; /** * A "lite parsed" $out stage is similar to other stages involving foreign collections except in * some cases the foreign collection is allowed to be sharded. */ class LiteParsed final : public LiteParsedDocumentSourceForeignCollection { public: using LiteParsedDocumentSourceForeignCollection::LiteParsedDocumentSourceForeignCollection; static std::unique_ptr parse(const NamespaceString& nss, const BSONElement& spec); bool allowShardedForeignCollection(NamespaceString nss, bool inMultiDocumentTransaction) const final { return _foreignNss != nss; } bool allowedToPassthroughFromMongos() const final { return false; } PrivilegeVector requiredPrivileges(bool isMongos, bool bypassDocumentValidation) const { ActionSet actions{ActionType::insert, ActionType::remove}; if (bypassDocumentValidation) { actions.addAction(ActionType::bypassDocumentValidation); } return {Privilege(ResourcePattern::forExactNamespace(_foreignNss), actions)}; } ReadConcernSupportResult supportsReadConcern(repl::ReadConcernLevel level, bool isImplicitDefault) const final { return { {level == repl::ReadConcernLevel::kLinearizableReadConcern, {ErrorCodes::InvalidOptions, "{} cannot be used with a 'linearizable' read concern level"_format(kStageName)}}, Status::OK()}; } }; ~DocumentSourceOut() override; StageConstraints constraints(Pipeline::SplitState pipeState) const final override { return {StreamType::kStreaming, PositionRequirement::kLast, HostTypeRequirement::kPrimaryShard, DiskUseRequirement::kWritesPersistentData, FacetRequirement::kNotAllowed, TransactionRequirement::kNotAllowed, LookupRequirement::kNotAllowed, UnionRequirement::kNotAllowed}; } Value serialize(SerializationOptions opts = SerializationOptions()) const final override; /** * Creates a new $out stage from the given arguments. */ static boost::intrusive_ptr create( NamespaceString outputNs, const boost::intrusive_ptr& expCtx, boost::optional timeseries = boost::none); /** * Parses a $out stage from the user-supplied BSON. */ static boost::intrusive_ptr createFromBson( BSONElement elem, const boost::intrusive_ptr& pExpCtx); const char* getSourceName() const final override { return kStageName.rawData(); } void addVariableRefs(std::set* refs) const final {} private: DocumentSourceOut(NamespaceString outputNs, boost::optional timeseries, const boost::intrusive_ptr& expCtx) : DocumentSourceWriter(kStageName.rawData(), std::move(outputNs), expCtx), _timeseries(std::move(timeseries)) {} static DocumentSourceOutSpec parseOutSpecAndResolveTargetNamespace( const BSONElement& spec, const DatabaseName& defaultDB); void initialize() override; void finalize() override; void spill(BatchedCommandRequest&& bcr, BatchedObjects&& batch) override { DocumentSourceWriteBlock writeBlock(pExpCtx->opCtx); auto insertCommand = bcr.extractInsertRequest(); insertCommand->setDocuments(std::move(batch)); auto targetEpoch = boost::none; if (_timeseries) { uassertStatusOK(pExpCtx->mongoProcessInterface->insertTimeseries( pExpCtx, _tempNs.getTimeseriesViewNamespace(), std::move(insertCommand), _writeConcern, targetEpoch)); } else { uassertStatusOK(pExpCtx->mongoProcessInterface->insert( pExpCtx, _tempNs, std::move(insertCommand), _writeConcern, targetEpoch)); } } std::pair makeBatchObject(Document&& doc) const override { auto obj = doc.toBson(); tassert(6628900, "_writeSizeEstimator should be initialized", _writeSizeEstimator); return {obj, _writeSizeEstimator->estimateInsertSizeBytes(obj)}; } BatchedCommandRequest initializeBatchedWriteRequest() const override; void waitWhileFailPointEnabled() override; /** * Determines if an error exists with the user input and existing collections. * The function will error if: * 1. The user provides the 'timeseries' field, but a non time-series collection or view exists * in that namespace. * 2. The user provides the 'timeseries' field with a specification that does not match an * existing time-series collection. The function will replace the value of '_timeseries' if the * user does not provide the 'timeseries' field, but a time-series collection exists. */ boost::optional validateTimeseries(); NamespaceString makeBucketNsIfTimeseries(const NamespaceString& ns); // Holds on to the original collection options and index specs so we can check they didn't // change during computation. BSONObj _originalOutOptions; std::list _originalIndexes; // The temporary namespace for the $out writes. NamespaceString _tempNs; // Set if $out is writing to a time-series collection. This is how $out determines if it is // writing to a time-series collection or not. boost::optional _timeseries; // Set to true if the stage has not initialized or the view was successfully created. // Used by the destructor to determine if the "real" buckets collection should be destroyed. bool _timeseriesStateConsistent = true; }; } // namespace mongo