diff options
Diffstat (limited to 'src/mongo/db/query/query_stats.h')
-rw-r--r-- | src/mongo/db/query/query_stats.h | 224 |
1 files changed, 224 insertions, 0 deletions
diff --git a/src/mongo/db/query/query_stats.h b/src/mongo/db/query/query_stats.h new file mode 100644 index 00000000000..59d79d6c114 --- /dev/null +++ b/src/mongo/db/query/query_stats.h @@ -0,0 +1,224 @@ +/** + * Copyright (C) 2022-present MongoDB, Inc. + * + * This program is free software: you can redistribute it and/or modify + * it under the terms of the Server Side Public License, version 1, + * as published by MongoDB, Inc. + * + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * Server Side Public License for more details. + * + * You should have received a copy of the Server Side Public License + * along with this program. If not, see + * <http://www.mongodb.com/licensing/server-side-public-license>. + * + * As a special exception, the copyright holders give permission to link the + * code of portions of this program with the OpenSSL library under certain + * conditions as described in each individual source file and distribute + * linked combinations including the program with the OpenSSL library. You + * must comply with the Server Side Public License in all respects for + * all of the code used other than as permitted herein. If you modify file(s) + * with this exception, you may extend this exception to your version of the + * file(s), but you are not obligated to do so. If you do not wish to do so, + * delete this exception statement from your version. If you delete this + * exception statement from all source files in the program, then also delete + * it in the license file. + */ + +#pragma once + +#include "mongo/base/status.h" +#include "mongo/bson/bsonobj.h" +#include "mongo/db/concurrency/d_concurrency.h" +#include "mongo/db/curop.h" +#include "mongo/db/namespace_string.h" +#include "mongo/db/query/partitioned_cache.h" +#include "mongo/db/query/plan_explainer.h" +#include "mongo/db/query/request_shapifier.h" +#include "mongo/db/query/util/memory_util.h" +#include "mongo/db/service_context.h" +#include <cstdint> +#include <memory> + +namespace mongo { + +class OpDebug; +class AggregateCommandRequest; +class FindCommandRequest; + +namespace { +/** + * Type we use to render values to BSON. + */ +using BSONNumeric = long long; +} // namespace + +namespace query_stats { + +/** + * An aggregated metric stores a compressed view of data. It balances the loss of information + * with the reduction in required storage. + */ +struct AggregatedMetric { + + /** + * Aggregate an observed value into the metric. + */ + void aggregate(uint64_t val) { + sum += val; + max = std::max(val, max); + min = std::min(val, min); + sumOfSquares += val * val; + } + + void appendTo(BSONObjBuilder& builder, const StringData& fieldName) const { + BSONObjBuilder metricsBuilder = builder.subobjStart(fieldName); + metricsBuilder.append("sum", (BSONNumeric)sum); + metricsBuilder.append("max", (BSONNumeric)max); + metricsBuilder.append("min", (BSONNumeric)min); + metricsBuilder.append("sumOfSquares", (BSONNumeric)sumOfSquares); + metricsBuilder.done(); + } + + uint64_t sum = 0; + // Default to the _signed_ maximum (which fits in unsigned range) because we cast to + // BSONNumeric when serializing. + uint64_t min = (uint64_t)std::numeric_limits<int64_t>::max; + uint64_t max = 0; + + /** + * The sum of squares along with (an externally stored) count will allow us to compute the + * variance/stddev. + */ + uint64_t sumOfSquares = 0; +}; + +extern CounterMetric queryStatsStoreSizeEstimateBytesMetric; +// Used to aggregate the metrics for one telemetry key over all its executions. +class QueryStatsEntry { +public: + QueryStatsEntry(std::unique_ptr<RequestShapifier> requestShapifier, + NamespaceStringOrUUID nss, + const BSONObj& cmdObj) + : firstSeenTimestamp(Date_t::now().toMillisSinceEpoch() / 1000, 0), + requestShapifier(std::move(requestShapifier)), + nss(nss), + oldQueryStatsKey(cmdObj.copy()) { + queryStatsStoreSizeEstimateBytesMetric.increment(sizeof(QueryStatsEntry) + sizeof(BSONObj)); + } + + ~QueryStatsEntry() { + queryStatsStoreSizeEstimateBytesMetric.decrement(sizeof(QueryStatsEntry) + sizeof(BSONObj)); + } + + BSONObj toBSON() const { + BSONObjBuilder builder{sizeof(QueryStatsEntry) + 100}; + builder.append("lastExecutionMicros", (BSONNumeric)lastExecutionMicros); + builder.append("execCount", (BSONNumeric)execCount); + queryExecMicros.appendTo(builder, "queryExecMicros"); + docsReturned.appendTo(builder, "docsReturned"); + builder.append("firstSeenTimestamp", firstSeenTimestamp); + return builder.obj(); + } + + /** + * Redact a given queryStats key and set _keySize. + */ + BSONObj computeQueryStatsKey(OperationContext* opCtx, + bool applyHmacToIdentifiers, + std::string hmacKey) const; + + /** + * Timestamp for when this query shape was added to the store. Set on construction. + */ + const Timestamp firstSeenTimestamp; + + /** + * Last execution time in microseconds. + */ + uint64_t lastExecutionMicros = 0; + + /** + * Number of query executions. + */ + uint64_t execCount = 0; + + AggregatedMetric queryExecMicros; + + AggregatedMetric docsReturned; + + std::unique_ptr<RequestShapifier> requestShapifier; + + NamespaceStringOrUUID nss; + + // TODO: SERVER-73152 remove oldQueryStatsKey when RequestShapifier is used for agg. + BSONObj oldQueryStatsKey; +}; + +struct TelemetryPartitioner { + // The partitioning function for use with the 'Partitioned' utility. + std::size_t operator()(const std::size_t k, const std::size_t nPartitions) const { + return k % nPartitions; + } +}; + +struct QueryStatsStoreEntryBudgetor { + size_t operator()(const std::size_t key, const std::shared_ptr<QueryStatsEntry>& value) { + // The buget estimator for <key,value> pair in LRU cache accounts for the size of the key + // and the size of the metrics, including the bson object used for generating the telemetry + // key at read time. + + return sizeof(QueryStatsEntry) + sizeof(std::size_t) + value->oldQueryStatsKey.objsize(); + } +}; + +using QueryStatsStore = PartitionedCache<std::size_t, + std::shared_ptr<QueryStatsEntry>, + QueryStatsStoreEntryBudgetor, + TelemetryPartitioner>; + +/** + * Acquire a reference to the global queryStats store. + */ +QueryStatsStore& getQueryStatsStore(OperationContext* opCtx); + +/** + * Register a request for queryStats collection. The queryStats machinery may decide not to + * collect anything but this should be called for all requests. The decision is made based on + * the feature flag and queryStats parameters such as rate limiting. + * + * The caller is still responsible for subsequently calling writeQueryStats() once the request is + * completed. + * + * Note that calling this affects internal state. It should be called once for each request for + * which telemetry may be collected. + * TODO SERVER-73152 remove request-specific registers, leave only registerRequest + */ +void registerAggRequest(const AggregateCommandRequest& request, OperationContext* opCtx); +void registerRequest(std::unique_ptr<RequestShapifier> requestShapifier, + const NamespaceString& collection, + OperationContext* opCtx, + const boost::intrusive_ptr<ExpressionContext>& expCtx); + +/** + * Writes queryStats to the queryStats store for the operation identified by `queryStatsKey`. + */ +void writeQueryStats(OperationContext* opCtx, + boost::optional<size_t> queryStatsKeyHash, + boost::optional<BSONObj> queryStatsKey, + std::unique_ptr<RequestShapifier> requestShapifier, + uint64_t queryExecMicros, + uint64_t docsReturned); + +/** + * Serialize the FindCommandRequest according to the Options passed in. Returns the serialized BSON + * with hmac applied to all field names and literals. + */ +BSONObj makeQueryStatsKey(const FindCommandRequest& findCommand, + const SerializationOptions& opts, + const boost::intrusive_ptr<ExpressionContext>& expCtx, + boost::optional<const QueryStatsEntry&> existingMetrics = boost::none); +} // namespace query_stats +} // namespace mongo |