summaryrefslogtreecommitdiff
path: root/src/mongo/db/query/query_stats.h
diff options
context:
space:
mode:
Diffstat (limited to 'src/mongo/db/query/query_stats.h')
-rw-r--r--src/mongo/db/query/query_stats.h224
1 files changed, 224 insertions, 0 deletions
diff --git a/src/mongo/db/query/query_stats.h b/src/mongo/db/query/query_stats.h
new file mode 100644
index 00000000000..59d79d6c114
--- /dev/null
+++ b/src/mongo/db/query/query_stats.h
@@ -0,0 +1,224 @@
+/**
+ * Copyright (C) 2022-present MongoDB, Inc.
+ *
+ * This program is free software: you can redistribute it and/or modify
+ * it under the terms of the Server Side Public License, version 1,
+ * as published by MongoDB, Inc.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ * Server Side Public License for more details.
+ *
+ * You should have received a copy of the Server Side Public License
+ * along with this program. If not, see
+ * <http://www.mongodb.com/licensing/server-side-public-license>.
+ *
+ * As a special exception, the copyright holders give permission to link the
+ * code of portions of this program with the OpenSSL library under certain
+ * conditions as described in each individual source file and distribute
+ * linked combinations including the program with the OpenSSL library. You
+ * must comply with the Server Side Public License in all respects for
+ * all of the code used other than as permitted herein. If you modify file(s)
+ * with this exception, you may extend this exception to your version of the
+ * file(s), but you are not obligated to do so. If you do not wish to do so,
+ * delete this exception statement from your version. If you delete this
+ * exception statement from all source files in the program, then also delete
+ * it in the license file.
+ */
+
+#pragma once
+
+#include "mongo/base/status.h"
+#include "mongo/bson/bsonobj.h"
+#include "mongo/db/concurrency/d_concurrency.h"
+#include "mongo/db/curop.h"
+#include "mongo/db/namespace_string.h"
+#include "mongo/db/query/partitioned_cache.h"
+#include "mongo/db/query/plan_explainer.h"
+#include "mongo/db/query/request_shapifier.h"
+#include "mongo/db/query/util/memory_util.h"
+#include "mongo/db/service_context.h"
+#include <cstdint>
+#include <memory>
+
+namespace mongo {
+
+class OpDebug;
+class AggregateCommandRequest;
+class FindCommandRequest;
+
+namespace {
+/**
+ * Type we use to render values to BSON.
+ */
+using BSONNumeric = long long;
+} // namespace
+
+namespace query_stats {
+
+/**
+ * An aggregated metric stores a compressed view of data. It balances the loss of information
+ * with the reduction in required storage.
+ */
+struct AggregatedMetric {
+
+ /**
+ * Aggregate an observed value into the metric.
+ */
+ void aggregate(uint64_t val) {
+ sum += val;
+ max = std::max(val, max);
+ min = std::min(val, min);
+ sumOfSquares += val * val;
+ }
+
+ void appendTo(BSONObjBuilder& builder, const StringData& fieldName) const {
+ BSONObjBuilder metricsBuilder = builder.subobjStart(fieldName);
+ metricsBuilder.append("sum", (BSONNumeric)sum);
+ metricsBuilder.append("max", (BSONNumeric)max);
+ metricsBuilder.append("min", (BSONNumeric)min);
+ metricsBuilder.append("sumOfSquares", (BSONNumeric)sumOfSquares);
+ metricsBuilder.done();
+ }
+
+ uint64_t sum = 0;
+ // Default to the _signed_ maximum (which fits in unsigned range) because we cast to
+ // BSONNumeric when serializing.
+ uint64_t min = (uint64_t)std::numeric_limits<int64_t>::max;
+ uint64_t max = 0;
+
+ /**
+ * The sum of squares along with (an externally stored) count will allow us to compute the
+ * variance/stddev.
+ */
+ uint64_t sumOfSquares = 0;
+};
+
+extern CounterMetric queryStatsStoreSizeEstimateBytesMetric;
+// Used to aggregate the metrics for one telemetry key over all its executions.
+class QueryStatsEntry {
+public:
+ QueryStatsEntry(std::unique_ptr<RequestShapifier> requestShapifier,
+ NamespaceStringOrUUID nss,
+ const BSONObj& cmdObj)
+ : firstSeenTimestamp(Date_t::now().toMillisSinceEpoch() / 1000, 0),
+ requestShapifier(std::move(requestShapifier)),
+ nss(nss),
+ oldQueryStatsKey(cmdObj.copy()) {
+ queryStatsStoreSizeEstimateBytesMetric.increment(sizeof(QueryStatsEntry) + sizeof(BSONObj));
+ }
+
+ ~QueryStatsEntry() {
+ queryStatsStoreSizeEstimateBytesMetric.decrement(sizeof(QueryStatsEntry) + sizeof(BSONObj));
+ }
+
+ BSONObj toBSON() const {
+ BSONObjBuilder builder{sizeof(QueryStatsEntry) + 100};
+ builder.append("lastExecutionMicros", (BSONNumeric)lastExecutionMicros);
+ builder.append("execCount", (BSONNumeric)execCount);
+ queryExecMicros.appendTo(builder, "queryExecMicros");
+ docsReturned.appendTo(builder, "docsReturned");
+ builder.append("firstSeenTimestamp", firstSeenTimestamp);
+ return builder.obj();
+ }
+
+ /**
+ * Redact a given queryStats key and set _keySize.
+ */
+ BSONObj computeQueryStatsKey(OperationContext* opCtx,
+ bool applyHmacToIdentifiers,
+ std::string hmacKey) const;
+
+ /**
+ * Timestamp for when this query shape was added to the store. Set on construction.
+ */
+ const Timestamp firstSeenTimestamp;
+
+ /**
+ * Last execution time in microseconds.
+ */
+ uint64_t lastExecutionMicros = 0;
+
+ /**
+ * Number of query executions.
+ */
+ uint64_t execCount = 0;
+
+ AggregatedMetric queryExecMicros;
+
+ AggregatedMetric docsReturned;
+
+ std::unique_ptr<RequestShapifier> requestShapifier;
+
+ NamespaceStringOrUUID nss;
+
+ // TODO: SERVER-73152 remove oldQueryStatsKey when RequestShapifier is used for agg.
+ BSONObj oldQueryStatsKey;
+};
+
+struct TelemetryPartitioner {
+ // The partitioning function for use with the 'Partitioned' utility.
+ std::size_t operator()(const std::size_t k, const std::size_t nPartitions) const {
+ return k % nPartitions;
+ }
+};
+
+struct QueryStatsStoreEntryBudgetor {
+ size_t operator()(const std::size_t key, const std::shared_ptr<QueryStatsEntry>& value) {
+ // The buget estimator for <key,value> pair in LRU cache accounts for the size of the key
+ // and the size of the metrics, including the bson object used for generating the telemetry
+ // key at read time.
+
+ return sizeof(QueryStatsEntry) + sizeof(std::size_t) + value->oldQueryStatsKey.objsize();
+ }
+};
+
+using QueryStatsStore = PartitionedCache<std::size_t,
+ std::shared_ptr<QueryStatsEntry>,
+ QueryStatsStoreEntryBudgetor,
+ TelemetryPartitioner>;
+
+/**
+ * Acquire a reference to the global queryStats store.
+ */
+QueryStatsStore& getQueryStatsStore(OperationContext* opCtx);
+
+/**
+ * Register a request for queryStats collection. The queryStats machinery may decide not to
+ * collect anything but this should be called for all requests. The decision is made based on
+ * the feature flag and queryStats parameters such as rate limiting.
+ *
+ * The caller is still responsible for subsequently calling writeQueryStats() once the request is
+ * completed.
+ *
+ * Note that calling this affects internal state. It should be called once for each request for
+ * which telemetry may be collected.
+ * TODO SERVER-73152 remove request-specific registers, leave only registerRequest
+ */
+void registerAggRequest(const AggregateCommandRequest& request, OperationContext* opCtx);
+void registerRequest(std::unique_ptr<RequestShapifier> requestShapifier,
+ const NamespaceString& collection,
+ OperationContext* opCtx,
+ const boost::intrusive_ptr<ExpressionContext>& expCtx);
+
+/**
+ * Writes queryStats to the queryStats store for the operation identified by `queryStatsKey`.
+ */
+void writeQueryStats(OperationContext* opCtx,
+ boost::optional<size_t> queryStatsKeyHash,
+ boost::optional<BSONObj> queryStatsKey,
+ std::unique_ptr<RequestShapifier> requestShapifier,
+ uint64_t queryExecMicros,
+ uint64_t docsReturned);
+
+/**
+ * Serialize the FindCommandRequest according to the Options passed in. Returns the serialized BSON
+ * with hmac applied to all field names and literals.
+ */
+BSONObj makeQueryStatsKey(const FindCommandRequest& findCommand,
+ const SerializationOptions& opts,
+ const boost::intrusive_ptr<ExpressionContext>& expCtx,
+ boost::optional<const QueryStatsEntry&> existingMetrics = boost::none);
+} // namespace query_stats
+} // namespace mongo