1 files changed, 260 insertions, 230 deletions
diff --git a/src/mongo/s/chunk_manager.h b/src/mongo/s/chunk_manager.h
index e3b61a30b62..c2c7a48286d 100644
--- a/src/mongo/s/chunk_manager.h
+++ b/src/mongo/s/chunk_manager.h
@@ -38,240 +38,270 @@
 
 namespace mongo {
 
-    class CanonicalQuery;
-    class ChunkManager;
-    class CollectionType;
-    struct QuerySolutionNode;
-
-    typedef std::shared_ptr<ChunkManager> ChunkManagerPtr;
-
-    // The key for the map is max for each Chunk or ChunkRange
-    typedef std::map<BSONObj, std::shared_ptr<Chunk>, BSONObjCmp> ChunkMap;
-
-    class ChunkRange {
-    public:
-        ChunkRange(ChunkMap::const_iterator begin, const ChunkMap::const_iterator end);
-
-        // Merge min and max (must be adjacent ranges)
-        ChunkRange(const ChunkRange& min, const ChunkRange& max);
-
-        const ChunkManager* getManager() const { return _manager; }
-        ShardId getShardId() const { return _shardId; }
-
-        const BSONObj& getMin() const { return _min; }
-        const BSONObj& getMax() const { return _max; }
-
-        // clones of Chunk methods
-        // Returns true if this ChunkRange contains the given shard key, and false otherwise
-        //
-        // Note: this function takes an extracted *key*, not an original document
-        // (the point may be computed by, say, hashing a given field or projecting
-        //  to a subset of fields).
-        bool containsKey( const BSONObj& shardKey ) const;
-
-        std::string toString() const;
-
-    private:
-        const ChunkManager* _manager;
-        const ShardId _shardId;
-        const BSONObj _min;
-        const BSONObj _max;
-    };
-
-    typedef std::map<BSONObj, std::shared_ptr<ChunkRange>, BSONObjCmp> ChunkRangeMap;
-
-
-    class ChunkRangeManager {
+class CanonicalQuery;
+class ChunkManager;
+class CollectionType;
+struct QuerySolutionNode;
+
+typedef std::shared_ptr<ChunkManager> ChunkManagerPtr;
+
+// The map is keyed by the max of each Chunk or ChunkRange
+typedef std::map<BSONObj, std::shared_ptr<Chunk>, BSONObjCmp> ChunkMap;
+
+class ChunkRange {
+public:
+    ChunkRange(ChunkMap::const_iterator begin, const ChunkMap::const_iterator end);
+
+    // Merge min and max (must be adjacent ranges)
+    ChunkRange(const ChunkRange& min, const ChunkRange& max);
+
+    const ChunkManager* getManager() const {
+        return _manager;
+    }
+    ShardId getShardId() const {
+        return _shardId;
+    }
+
+    const BSONObj& getMin() const {
+        return _min;
+    }
+    const BSONObj& getMax() const {
+        return _max;
+    }
+
+    // clones of Chunk methods
+    // Returns true if this ChunkRange contains the given shard key, and false otherwise
+    //
+    // Note: this function takes an extracted *key*, not an original document
+    // (the point may be computed by, say, hashing a given field or projecting
+    //  to a subset of fields).
+    bool containsKey(const BSONObj& shardKey) const;
+
+    std::string toString() const;
+
+private:
+    const ChunkManager* _manager;
+    const ShardId _shardId;
+    const BSONObj _min;
+    const BSONObj _max;
+};
+
+typedef std::map<BSONObj, std::shared_ptr<ChunkRange>, BSONObjCmp> ChunkRangeMap;
+
+
+class ChunkRangeManager {
+public:
+    const ChunkRangeMap& ranges() const {
+        return _ranges;
+    }
+
+    void clear() {
+        _ranges.clear();
+    }
+
+    void reloadAll(const ChunkMap& chunks);
+
+    // Slow operation -- wrap with DEV
+    void assertValid() const;
+
+    ChunkRangeMap::const_iterator upper_bound(const BSONObj& o) const {
+        return _ranges.upper_bound(o);
+    }
+    ChunkRangeMap::const_iterator lower_bound(const BSONObj& o) const {
+        return _ranges.lower_bound(o);
+    }
+
+private:
+    // assumes nothing in this range exists in _ranges
+    void _insertRange(ChunkMap::const_iterator begin, const ChunkMap::const_iterator end);
+
+    ChunkRangeMap _ranges;
+};
+
+
+/* config.sharding
+     { ns: 'alleyinsider.fs.chunks' ,
+       key: { ts : 1 } ,
+       shards: [ { min: 1, max: 100, server: a } , { min: 101, max: 200 , server : b } ]
+     }
+*/
+class ChunkManager {
+public:
+    typedef std::map<std::string, ChunkVersion> ShardVersionMap;
+
+    // Loads a new chunk manager from a collection document
+    explicit ChunkManager(const CollectionType& coll);
+
+    // Creates an empty chunk manager for the namespace
+    ChunkManager(const std::string& ns, const ShardKeyPattern& pattern, bool unique);
+
+    const std::string& getns() const {
+        return _ns;
+    }
+    const ShardKeyPattern& getShardKeyPattern() const {
+        return _keyPattern;
+    }
+    bool isUnique() const {
+        return _unique;
+    }
+
+    /**
+     * An increasing count of how many ChunkManagers we have, used to detect updates.
+     */
+    unsigned long long getSequenceNumber() const {
+        return _sequenceNumber;
+    }
+
+    //
+    // After the constructor is invoked, we need to call loadExistingRanges.  If this is a new
+    // sharded collection, we can call createFirstChunks first.
+    //
+
+    // Creates new chunks based on info in chunk manager
+    void createFirstChunks(const ShardId& primaryShardId,
+                           const std::vector<BSONObj>* initPoints,
+                           const std::set<ShardId>* initShardIds);
+
+    // Loads existing ranges based on info in chunk manager
+    void loadExistingRanges(const ChunkManager* oldManager);
+
+
+    // Helpers for load
+    void calcInitSplitsAndShards(const ShardId& primaryShardId,
+                                 const std::vector<BSONObj>* initPoints,
+                                 const std::set<ShardId>* initShardIds,
+                                 std::vector<BSONObj>* splitPoints,
+                                 std::vector<ShardId>* shardIds) const;
+
+    //
+    // Methods to use once loaded / created
+    //
+
+    int numChunks() const {
+        return _chunkMap.size();
+    }
+
+    /**
+     * Given a key that has been extracted from a document, returns the
+     * chunk that contains that key.
+     *
+     * For instance, to locate the chunk for document {a : "foo" , b : "bar"}
+     * when the shard key is {a : "hashed"}, you can call
+     *  findIntersectingChunk() on {a : hash("foo") }
+     */
+    ChunkPtr findIntersectingChunk(const BSONObj& shardKey) const;
+
+    void getShardIdsForQuery(std::set<ShardId>& shardIds, const BSONObj& query) const;
+    void getAllShardIds(std::set<ShardId>* all) const;
+    /** @param shardIds set to the shard ids for shards
+     *         covered by the interval [min, max], see SERVER-4791
+     */
+    void getShardIdsForRange(std::set<ShardId>& shardIds,
+                             const BSONObj& min,
+                             const BSONObj& max) const;
+
+    // Transforms query into bounds for each field in the shard key
+    // for example :
+    //   Key { a: 1, b: 1 },
+    //   Query { a : { $gte : 1, $lt : 2 },
+    //            b : { $gte : 3, $lt : 4 } }
+    //   => Bounds { a : [1, 2), b : [3, 4) }
+    static IndexBounds getIndexBoundsForQuery(const BSONObj& key,
+                                              const CanonicalQuery* canonicalQuery);
+
+    // Collapse query solution tree.
+    //
+    // If it has an OR node, the result could be a superset of the index bounds generated.
+    // To produce a single IndexBounds, this returns the union of the bounds on each field.
+    // for example:
+    //   OR: { a: (0, 1), b: (0, 1) },
+    //       { a: (2, 3), b: (2, 3) }
+    //   =>  { a: (0, 1), (2, 3), b: (0, 1), (2, 3) }
+    static IndexBounds collapseQuerySolution(const QuerySolutionNode* node);
+
+    const ChunkMap& getChunkMap() const {
+        return _chunkMap;
+    }
+
+    /**
+     * Returns true if, for this shard, the chunks are identical in both chunk managers
+     */
+    bool compatibleWith(const ChunkManager& other, const std::string& shard) const;
+
+    std::string toString() const;
+
+    ChunkVersion getVersion(const std::string& shardName) const;
+    ChunkVersion getVersion() const;
+
+    void _printChunks() const;
+
+    int getCurrentDesiredChunkSize() const;
+
+    std::shared_ptr<ChunkManager> reload(bool force = true) const;  // doesn't modify self!
+
+private:
+    // returns true if load was consistent
+    bool _load(ChunkMap& chunks,
+               std::set<ShardId>& shardIds,
+               ShardVersionMap* shardVersions,
+               const ChunkManager* oldManager);
+
+
+    // All members should be const for thread-safety
+    const std::string _ns;
+    const ShardKeyPattern _keyPattern;
+    const bool _unique;
+
+    // The shard versioning mechanism hinges on keeping track of the number of times we reload
+    // ChunkManagers. Increasing this number here will prompt checkShardVersion to refresh the
+    // connection-level versions to the most up to date value.
+    const unsigned long long _sequenceNumber;
+
+    ChunkMap _chunkMap;
+    ChunkRangeManager _chunkRanges;
+
+    std::set<ShardId> _shardIds;
+
+    // Max known version per shard
+    ShardVersionMap _shardVersions;
+
+    // Max version across all chunks
+    ChunkVersion _version;
+
+    //
+    // Split Heuristic info
+    //
+    class SplitHeuristics {
     public:
-        const ChunkRangeMap& ranges() const { return _ranges; }
-
-        void clear() { _ranges.clear(); }
-
-        void reloadAll(const ChunkMap& chunks);
-
-        // Slow operation -- wrap with DEV
-        void assertValid() const;
-
-        ChunkRangeMap::const_iterator upper_bound(const BSONObj& o) const { return _ranges.upper_bound(o); }
-        ChunkRangeMap::const_iterator lower_bound(const BSONObj& o) const { return _ranges.lower_bound(o); }
-
-    private:
-        // assumes nothing in this range exists in _ranges
-        void _insertRange(ChunkMap::const_iterator begin, const ChunkMap::const_iterator end);
-
-        ChunkRangeMap _ranges;
+        SplitHeuristics() : _splitTickets(maxParallelSplits) {}
+
+        TicketHolder _splitTickets;
+
+        // Test whether we should split once data * splitTestFactor > chunkSize (approximately)
+        static const int splitTestFactor = 5;
+        // Maximum number of parallel threads requesting a split
+        static const int maxParallelSplits = 5;
+
+        // The idea here is that we're over-aggressive on split testing by a factor of
+        // splitTestFactor, so we can safely wait until we get to splitTestFactor invalid splits
+        // before changing.  Unfortunately, we also potentially over-request the splits by a
+        // factor of maxParallelSplits, but since the factors are identical it works out
+        // (for now) for parallel or sequential oversplitting.
+        // TODO: Make splitting a separate thread with notifications?
+        static const int staleMinorReloadThreshold = maxParallelSplits;
     };
 
+    mutable SplitHeuristics _splitHeuristics;
 
-    /* config.sharding
-         { ns: 'alleyinsider.fs.chunks' ,
-           key: { ts : 1 } ,
-           shards: [ { min: 1, max: 100, server: a } , { min: 101, max: 200 , server : b } ]
-         }
-    */
-    class ChunkManager {
-    public:
-        typedef std::map<std::string, ChunkVersion> ShardVersionMap;
-
-        // Loads a new chunk manager from a collection document
-        explicit ChunkManager(const CollectionType& coll);
-
-        // Creates an empty chunk manager for the namespace
-        ChunkManager( const std::string& ns, const ShardKeyPattern& pattern, bool unique );
-
-        const std::string& getns() const { return _ns; }
-        const ShardKeyPattern& getShardKeyPattern() const { return _keyPattern; }
-        bool isUnique() const { return _unique; }
-
-        /**
-         * this is just an increasing number of how many ChunkManagers we have so we know if something has been updated
-         */
-        unsigned long long getSequenceNumber() const { return _sequenceNumber; }
-
-        //
-        // After constructor is invoked, we need to call loadExistingRanges.  If this is a new
-        // sharded collection, we can call createFirstChunks first.
-        //
-
-        // Creates new chunks based on info in chunk manager
-        void createFirstChunks(const ShardId& primaryShardId,
-                               const std::vector<BSONObj>* initPoints,
-                               const std::set<ShardId>* initShardIds);
+    //
+    // End split heuristics
+    //
 
-        // Loads existing ranges based on info in chunk manager
-        void loadExistingRanges(const ChunkManager* oldManager);
-
-
-        // Helpers for load
-        void calcInitSplitsAndShards(const ShardId& primaryShardId,
-                                     const std::vector<BSONObj>* initPoints,
-                                     const std::set<ShardId>* initShardIds,
-                                     std::vector<BSONObj>* splitPoints,
-                                     std::vector<ShardId>* shardIds) const;
-
-        //
-        // Methods to use once loaded / created
-        //
-
-        int numChunks() const { return _chunkMap.size(); }
-
-        /**
-         * Given a key that has been extracted from a document, returns the
-         * chunk that contains that key.
-         *
-         * For instance, to locate the chunk for document {a : "foo" , b : "bar"}
-         * when the shard key is {a : "hashed"}, you can call
-         *  findIntersectingChunk() on {a : hash("foo") }
-         */
-        ChunkPtr findIntersectingChunk( const BSONObj& shardKey ) const;
-
-        void getShardIdsForQuery(std::set<ShardId>& shardIds, const BSONObj& query) const;
-        void getAllShardIds(std::set<ShardId>* all) const;
-        /** @param shardIds set to the shard ids for shards
-         *         covered by the interval [min, max], see SERVER-4791
-         */
-        void getShardIdsForRange(std::set<ShardId>& shardIds, const BSONObj& min, const BSONObj& max) const;
-
-        // Transforms query into bounds for each field in the shard key
-        // for example :
-        //   Key { a: 1, b: 1 },
-        //   Query { a : { $gte : 1, $lt : 2 },
-        //            b : { $gte : 3, $lt : 4 } }
-        //   => Bounds { a : [1, 2), b : [3, 4) }
-        static IndexBounds getIndexBoundsForQuery(const BSONObj& key, const CanonicalQuery* canonicalQuery);
-
-        // Collapse query solution tree.
-        //
-        // If it has OR node, the result could be a superset of the index bounds generated.
-        // Since to give a single IndexBounds, this gives the union of bounds on each field.
-        // for example:
-        //   OR: { a: (0, 1), b: (0, 1) },
-        //       { a: (2, 3), b: (2, 3) }
-        //   =>  { a: (0, 1), (2, 3), b: (0, 1), (2, 3) }
-        static IndexBounds collapseQuerySolution( const QuerySolutionNode* node );
-
-        const ChunkMap& getChunkMap() const { return _chunkMap; }
-
-        /**
-         * Returns true if, for this shard, the chunks are identical in both chunk managers
-         */
-        bool compatibleWith(const ChunkManager& other, const std::string& shard) const;
-
-        std::string toString() const;
-
-        ChunkVersion getVersion(const std::string& shardName) const;
-        ChunkVersion getVersion() const;
-
-        void _printChunks() const;
-
-        int getCurrentDesiredChunkSize() const;
-
-        std::shared_ptr<ChunkManager> reload(bool force = true) const; // doesn't modify self!
-
-    private:
-        // returns true if load was consistent
-        bool _load(ChunkMap& chunks,
-                   std::set<ShardId>& shardIds,
-                   ShardVersionMap* shardVersions,
-                   const ChunkManager* oldManager);
-
-
-        // All members should be const for thread-safety
-        const std::string _ns;
-        const ShardKeyPattern _keyPattern;
-        const bool _unique;
-
-        // The shard versioning mechanism hinges on keeping track of the number of times we reload
-        // ChunkManagers. Increasing this number here will prompt checkShardVersion to refresh the
-        // connection-level versions to the most up to date value.
-        const unsigned long long _sequenceNumber;
-
-        ChunkMap _chunkMap;
-        ChunkRangeManager _chunkRanges;
-
-        std::set<ShardId> _shardIds;
-
-        // Max known version per shard
-        ShardVersionMap _shardVersions;
-
-        // Max version across all chunks
-        ChunkVersion _version;
-
-        //
-        // Split Heuristic info
-        //
-        class SplitHeuristics {
-        public:
-            SplitHeuristics() : _splitTickets(maxParallelSplits) {
-            }
-
-            TicketHolder _splitTickets;
-
-            // Test whether we should split once data * splitTestFactor > chunkSize (approximately)
-            static const int splitTestFactor = 5;
-            // Maximum number of parallel threads requesting a split
-            static const int maxParallelSplits = 5;
-
-            // The idea here is that we're over-aggressive on split testing by a factor of
-            // splitTestFactor, so we can safely wait until we get to splitTestFactor invalid splits
-            // before changing.  Unfortunately, we also potentially over-request the splits by a
-            // factor of maxParallelSplits, but since the factors are identical it works out
-            // (for now) for parallel or sequential oversplitting.
-            // TODO: Make splitting a separate thread with notifications?
-            static const int staleMinorReloadThreshold = maxParallelSplits;
-        };
-
-        mutable SplitHeuristics _splitHeuristics;
-
-        //
-        // End split heuristics
-        //
-
-        friend class Chunk;
-        friend class ChunkRangeManager; // only needed for CRM::assertValid()
-        static AtomicUInt32 NextSequenceNumber;
+    friend class Chunk;
+    friend class ChunkRangeManager;  // only needed for CRM::assertValid()
+    static AtomicUInt32 NextSequenceNumber;
 
-        friend class TestableChunkManager;
-    };
+    friend class TestableChunkManager;
+};
 
-} // namespace mongo
+}  // namespace mongo