summaryrefslogtreecommitdiff
path: root/src/mongo/db/repair_database.cpp
diff options
context:
space:
mode:
authorMathias Stearn <mathias@10gen.com>2014-12-04 18:24:21 -0500
committerMathias Stearn <mathias@10gen.com>2014-12-08 11:35:38 -0500
commit4bc54acaa78773dcf2fea55d4690e37b6e84aa0a (patch)
tree1eb70f491678049ef3350e1a800994ca20d657f7 /src/mongo/db/repair_database.cpp
parentd8dc1d99e730ae829f978f471c8da5f88ffc7f17 (diff)
downloadmongo-4bc54acaa78773dcf2fea55d4690e37b6e84aa0a.tar.gz
SERVER-16173 Rewrite repair for KVEngines
Diffstat (limited to 'src/mongo/db/repair_database.cpp')
-rw-r--r--src/mongo/db/repair_database.cpp223
1 files changed, 223 insertions, 0 deletions
diff --git a/src/mongo/db/repair_database.cpp b/src/mongo/db/repair_database.cpp
new file mode 100644
index 00000000000..7a133591a01
--- /dev/null
+++ b/src/mongo/db/repair_database.cpp
@@ -0,0 +1,223 @@
+/**
+* Copyright (C) 2014 MongoDB Inc.
+*
+* This program is free software: you can redistribute it and/or modify
+* it under the terms of the GNU Affero General Public License, version 3,
+* as published by the Free Software Foundation.
+*
+* This program is distributed in the hope that it will be useful,
+* but WITHOUT ANY WARRANTY; without even the implied warranty of
+* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+* GNU Affero General Public License for more details.
+*
+* You should have received a copy of the GNU Affero General Public License
+* along with this program. If not, see <http://www.gnu.org/licenses/>.
+*
+* As a special exception, the copyright holders give permission to link the
+* code of portions of this program with the OpenSSL library under certain
+* conditions as described in each individual source file and distribute
+* linked combinations including the program with the OpenSSL library. You
+* must comply with the GNU Affero General Public License in all respects for
+* all of the code used other than as permitted herein. If you modify file(s)
+* with this exception, you may extend this exception to your version of the
+* file(s), but you are not obligated to do so. If you do not wish to do so,
+* delete this exception statement from your version. If you delete this
+* exception statement from all source files in the program, then also delete
+* it in the license file.
+*/
+
+#define MONGO_LOG_DEFAULT_COMPONENT ::mongo::logger::LogComponent::kStorage
+
+#include "mongo/platform/basic.h"
+
+#include "mongo/db/repair_database.h"
+
+#include <boost/scoped_ptr.hpp>
+
+#include "mongo/db/background.h"
+#include "mongo/base/status.h"
+#include "mongo/base/string_data.h"
+#include "mongo/bson/bson_validate.h"
+#include "mongo/db/catalog/collection.h"
+#include "mongo/db/catalog/collection_catalog_entry.h"
+#include "mongo/db/catalog/database.h"
+#include "mongo/db/catalog/database_catalog_entry.h"
+#include "mongo/db/catalog/database_holder.h"
+#include "mongo/db/catalog/index_create.h"
+#include "mongo/db/catalog/index_key_validate.h"
+#include "mongo/db/storage/mmap_v1/mmap_v1_engine.h"
+#include "mongo/db/storage/storage_engine.h"
+#include "mongo/util/log.h"
+
+namespace mongo {
+namespace {
+ Status rebuildIndexesOnCollection(OperationContext* txn,
+ DatabaseCatalogEntry* dbce,
+ const std::string& collectionName) {
+
+ Database db(dbce->name(), dbce);
+ CollectionCatalogEntry* cce = dbce->getCollectionCatalogEntry(txn, collectionName);
+
+ std::vector<string> indexNames;
+ std::vector<BSONObj> indexSpecs;
+ {
+ // Fetch all indexes
+ cce->getAllIndexes( txn, &indexNames );
+ for ( size_t i = 0; i < indexNames.size(); i++ ) {
+ const string& name = indexNames[i];
+ BSONObj spec = cce->getIndexSpec( txn, name );
+ indexSpecs.push_back(spec.removeField("v").getOwned());
+
+ const BSONObj key = spec.getObjectField("key");
+ const Status keyStatus = validateKeyPattern(key);
+ if (!keyStatus.isOK()) {
+ return Status(ErrorCodes::CannotCreateIndex, str::stream()
+ << "Cannot rebuild index " << spec << ": " << keyStatus.reason()
+ << " For more info see http://dochub.mongodb.org/core/index-validation");
+ }
+ }
+ }
+
+ // Skip the rest if there are no indexes to rebuild.
+ if (indexSpecs.empty()) return Status::OK();
+
+ Collection* collection;
+ boost::scoped_ptr<MultiIndexBlock> indexer;
+ {
+ // These steps are combined into a single WUOW to ensure there are no commits without
+ // the indexes.
+ // 1) Drop all indexes.
+ // 2) Open the Collection
+ // 3) Start the index build process.
+
+ WriteUnitOfWork wuow(txn);
+
+ { // 1
+ for ( size_t i = 0; i < indexNames.size(); i++ ) {
+ Status s = cce->removeIndex(txn, indexNames[i]);
+ if (!s.isOK()) return s;
+ }
+ }
+
+ // Indexes must be dropped before we open the Collection otherwise we could attempt to
+ // open a bad index and fail.
+ // TODO see if MultiIndexBlock can be made to work without a Collection.
+ collection = db.getCollection(txn, collectionName);
+ invariant(collection);
+
+ indexer.reset(new MultiIndexBlock(txn, collection));
+ Status status = indexer->init(indexSpecs);
+ if (!status.isOK()) {
+ // The WUOW will handle cleanup, so the indexer shouldn't do its own.
+ indexer->abortWithoutCleanup();
+ return status;
+ }
+
+ wuow.commit();
+ }
+
+ // Iterate all records in the collection. Delete them if they aren't valid BSON. Index them
+ // if they are.
+
+ RecordStore* rs = collection->getRecordStore();
+ boost::scoped_ptr<RecordIterator> it(rs->getIterator(txn));
+ while (!it->isEOF()) {
+ RecordId id = it->curr();
+ RecordData data = it->dataFor(id);
+ invariant(id == it->getNext());
+
+ Status status = validateBSON(data.data(), data.size());
+ if (!status.isOK()) {
+ log() << "Invalid BSON detected at " << id << ": " << status << ". Deleting.";
+ it->saveState();
+ {
+ WriteUnitOfWork wunit(txn);
+ rs->deleteRecord(txn, id);
+ wunit.commit();
+ }
+ it->restoreState(txn);
+ continue;
+ }
+
+ // Now index the record.
+ // TODO SERVER-14812 add a mode that drops duplicates rather than failing
+ WriteUnitOfWork wunit(txn);
+ status = indexer->insert(data.releaseToBson(), id);
+ if (!status.isOK()) return status;
+ wunit.commit();
+ }
+
+ Status status = indexer->doneInserting();
+ if (!status.isOK()) return status;
+
+ {
+ WriteUnitOfWork wunit(txn);
+ indexer->commit();
+ wunit.commit();
+ }
+
+ return Status::OK();
+ }
+} // namespace
+
+ Status repairDatabase(OperationContext* txn,
+ StorageEngine* engine,
+ const std::string& dbName,
+ bool preserveClonedFilesOnFailure,
+ bool backupOriginalFiles) {
+
+ // We must hold some form of lock here
+ invariant(txn->lockState()->isLocked());
+ invariant( dbName.find( '.' ) == string::npos );
+
+ log() << "repairDatabase " << dbName << endl;
+
+ BackgroundOperation::assertNoBgOpInProgForDb(dbName);
+
+ txn->checkForInterrupt();
+
+ if (engine->isMmapV1()) {
+ // MMAPv1 is a layering violation so it implements its own repairDatabase.
+ return static_cast<MMAPV1Engine*>(engine)->repairDatabase(txn,
+ dbName,
+ preserveClonedFilesOnFailure,
+ backupOriginalFiles);
+ }
+
+ // These are MMAPv1 specific
+ if ( preserveClonedFilesOnFailure ) {
+ return Status( ErrorCodes::BadValue, "preserveClonedFilesOnFailure not supported" );
+ }
+ if ( backupOriginalFiles ) {
+ return Status( ErrorCodes::BadValue, "backupOriginalFiles not supported" );
+ }
+
+ // Close and reopen the db to invalidate all current users and caches.
+ // WARNING: it is important that the opened Database object isn't used for anything as its
+ // cache must remain empty until we return.
+ dbHolder().close(txn, dbName);
+ dbHolder().openDb(txn, dbName);
+
+ DatabaseCatalogEntry* dbce = engine->getDatabaseCatalogEntry(txn, dbName);
+
+ std::list<std::string> colls;
+ dbce->getCollectionNamespaces(&colls);
+
+ for (std::list<std::string>::const_iterator it = colls.begin(); it != colls.end(); ++it) {
+ // Don't check for interrupt after starting to repair a collection otherwise we can
+ // leave data in an inconsistent state. Interrupting between collections is ok, however.
+ txn->checkForInterrupt();
+
+ log() << "Repairing collection " << *it;
+
+ Status status = engine->repairRecordStore(txn, *it);
+ if (!status.isOK()) return status;
+
+ status = rebuildIndexesOnCollection(txn, dbce, *it);
+ if (!status.isOK()) return status;
+ }
+
+ return Status::OK();
+ }
+}
+