summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author: Pierlauro Sciarelli <pierlauro.sciarelli@mongodb.com> 2022-07-27 12:08:08 +0000
committer: Evergreen Agent <no-reply@evergreen.mongodb.com> 2022-07-27 13:24:06 +0000
commit: daa784ee5f0deb97b15c78fd1adb6b9186fed414 (patch)
tree: ccdd17a98f40e0daba8f9628ff17efed8c076aa7
parent: 5bc09fbae89fd9db54e259e30f7189a117dd46a9 (diff)
download: mongo-daa784ee5f0deb97b15c78fd1adb6b9186fed414.tar.gz
SERVER-68130 adjust autoSplitVector's estimatedAdditionalBytesPerItemInBSONArray
-rw-r--r-- src/mongo/db/s/auto_split_vector.cpp 11
1 files changed, 10 insertions, 1 deletions
diff --git a/src/mongo/db/s/auto_split_vector.cpp b/src/mongo/db/s/auto_split_vector.cpp
index 7569142fde0..9f4335f9f2b 100644
--- a/src/mongo/db/s/auto_split_vector.cpp
+++ b/src/mongo/db/s/auto_split_vector.cpp
@@ -49,7 +49,16 @@
namespace mongo {
namespace {
-constexpr int estimatedAdditionalBytesPerItemInBSONArray{2};
+/*
+ * BSON arrays are serialized as BSON objects with the index of each element as a string key: for
+ * example, the array ["a","b","c"] is going to be serialized as {"0":"a","1":"b","2":"c"}. The
+ * minimum size for a BSON object is `BSONObj::kMinBSONLength`.
+ *
+ * Given that the `vector<BSONObj>` returned by `autoSplitVector` can't be greater than 16MB when
+ * serialized, pessimistically assume that each key occupies the highest possible number of bytes.
+ */
+const int estimatedAdditionalBytesPerItemInBSONArray{
+ (int)std::to_string(BSONObjMaxUserSize / BSONObj::kMinBSONLength).length()};
constexpr int kMaxSplitPointsToReposition{3};