author     Andy Schwerin <schwerin@10gen.com>    2012-03-07 12:09:42 -0500
committer  Andy Schwerin <schwerin@10gen.com>    2012-03-23 10:35:31 -0400
commit     d67ce1cd31f6ea2e766d5c201ab5430735cbb3b8 (patch)
tree       809d2a20ce0489d9f3fb5d390ea3a0f9686c9708
parent     f9c8560b866b3b286dc67548cbb82975fd4add46 (diff)
SCons refactoring, cleans up building and testing the C++ client.
This patch does the following:

1. Removes pcre.h dependencies from the C++ client, along with some other
   unnecessary dependencies.
2. Cleans up how the client is built from the client source tarball, so that
   it works more like the build from the git repo / full source tarball.
3. Fixes up SCons so that "scons ." is enough to build all of the binaries,
   the binary archive (zip or tgz), and the client source archive (zip or tgz).
4. Fixes up the SCons aliases "core", "tools", and "all".
5. Lets the user specify the name of the client source archive via a SCons
   command-line switch.

Resolves SERVER-4231, SERVER-5255.
-rw-r--r--   SConscript.buildinfo                            45
-rw-r--r--   SConstruct                                     180
-rwxr-xr-x   buildscripts/build_and_test_client.py           59
-rwxr-xr-x   buildscripts/make_archive.py                   116
-rwxr-xr-x   distsrc/client/SConstruct                      133
-rw-r--r--   src/SConscript.client                          133
-rw-r--r--   src/mongo/SConscript                           160
-rw-r--r--   src/mongo/client/dbclient.cpp                   38
-rw-r--r--   src/mongo/client/dbclient.h                   1047
-rw-r--r--   src/mongo/client/dbclient_rs.cpp                24
-rw-r--r--   src/mongo/client/dbclient_rs.h                  11
-rw-r--r--   src/mongo/client/dbclientcursor.cpp             17
-rw-r--r--   src/mongo/client/dbclientcursor.h               12
-rw-r--r--   src/mongo/client/dbclientinterface.h          1056
-rw-r--r--   src/mongo/client/distlock.cpp                   10
-rw-r--r--   src/mongo/client/examples/first.cpp              2
-rw-r--r--   src/mongo/client/examples/second.cpp            20
-rw-r--r--   src/mongo/client/gridfs.cpp                     10
-rw-r--r--   src/mongo/client/parallel.h                     20
-rw-r--r--   src/mongo/client/syncclusterconnection.cpp       9
-rw-r--r--   src/mongo/db/authlevel.h                        43
-rw-r--r--   src/mongo/db/client.h                            1
-rw-r--r--   src/mongo/db/d_concurrency.cpp                   1
-rw-r--r--   src/mongo/db/database.h                          4
-rw-r--r--   src/mongo/db/dbmessage.h                         1
-rw-r--r--   src/mongo/db/dur_journal.cpp                     1
-rw-r--r--   src/mongo/db/extsort.h                          13
-rw-r--r--   src/mongo/db/index.h                             1
-rw-r--r--   src/mongo/db/instance.h                          2
-rw-r--r--   src/mongo/db/namespace-inl.h                    63
-rw-r--r--   src/mongo/db/namespace.cpp                     790
-rw-r--r--   src/mongo/db/namespace.h                       604
-rw-r--r--   src/mongo/db/namespace_details-inl.h            84
-rw-r--r--   src/mongo/db/namespace_details.cpp             801
-rw-r--r--   src/mongo/db/namespace_details.h               610
-rw-r--r--   src/mongo/db/pdfile.h                           18
-rwxr-xr-x   src/mongo/db/security.h                         25
-rw-r--r--   src/mongo/s/shard.h                              6
-rw-r--r--   src/mongo/s/strategy_shard.cpp                  21
-rw-r--r--   src/mongo/tools/restore.cpp                     19
-rw-r--r--   src/mongo/tools/tool.cpp                         9
-rwxr-xr-x   src/mongo/util/mmap.cpp                         21
-rw-r--r--   src/mongo/util/version.h                         8
43 files changed, 3328 insertions(+), 2920 deletions(-)
diff --git a/SConscript.buildinfo b/SConscript.buildinfo
new file mode 100644
index 00000000000..3853adf2ba5
--- /dev/null
+++ b/SConscript.buildinfo
@@ -0,0 +1,45 @@
+# -*- mode: python; -*-
+
+# This SConscript describes construction of buildinfo.cpp, which is independent of the
+# build variant's target.
+
+import os
+import sys
+
+import buildscripts.utils
+
+Import('env windows')
+
+def getSysInfo():
+    if windows:
+        return "windows " + str( sys.getwindowsversion() )
+    else:
+        return " ".join( os.uname() )
+
+buildinfo_filename = '#build/buildinfo.cpp'
+
+buildinfo_template = '''
+#include <string>
+#include <boost/version.hpp>
+
+#include "mongo/util/version.h"
+
+namespace mongo {
+    const char * gitVersion() { return "%(git_version)s"; }
+    std::string sysInfo() { return "%(sys_info)s BOOST_LIB_VERSION=" BOOST_LIB_VERSION ; }
+}  // namespace mongo
+'''
+
+def generate_buildinfo(env, target, source, **kw):
+    contents = str(source[0]) % dict(git_version=buildscripts.utils.getGitVersion(),
+                                     sys_info=getSysInfo())
+    out = open(str(target[0]), 'wb')
+    try:
+        out.write(contents)
+    finally:
+        out.close()
+
+env.Command(buildinfo_filename, Value(buildinfo_template), generate_buildinfo)
+env.AlwaysBuild(buildinfo_filename)
+env.Install('$BUILD_DIR/mongo', buildinfo_filename)
+env.Install('$BUILD_DIR/client_build/mongo', buildinfo_filename)
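
The Value()-as-source pattern above is what makes the generated file rebuild correctly: the template text itself is a node in the dependency graph, and AlwaysBuild keeps the embedded git hash from going stale. A minimal self-contained sketch of the same technique (hypothetical SConstruct; the template, helper name, and version string here are illustrative, not part of this patch):

    # Generate a C++ source file from a template carried in a Value() node.
    # SCons invokes action functions with target/source/env as keyword
    # arguments, so this parameter order works.
    template = '// generated file\nconst char *kVersion = "%(version)s";\n'

    def emit_version(env, target, source, **kw):
        contents = str(source[0]) % dict(version='1.2.3')  # stand-in for getGitVersion()
        out = open(str(target[0]), 'w')
        try:
            out.write(contents)
        finally:
            out.close()

    env = Environment()
    env.Command('version.cpp', Value(template), emit_version)
    env.AlwaysBuild('version.cpp')  # regenerate even when the template is unchanged

Because the template is a Value() source, editing the template alone is enough to trigger a rebuild; AlwaysBuild covers the case where only the git state changed.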
diff --git a/SConstruct b/SConstruct
index 58dacd1c897..aa874789f8a 100644
--- a/SConstruct
+++ b/SConstruct
@@ -15,21 +15,23 @@
EnsureSConsVersion( 1, 1, 0 )
-import os
-import sys
+import buildscripts
+import buildscripts.bb
+import datetime
import imp
-import types
+import os
import re
import shutil
+import stat
+import sys
+import types
import urllib
import urllib2
-import buildscripts
-import buildscripts.bb
-import stat
from buildscripts import utils
import libdeps
+DEFAULT_INSTALL_DIR = "/usr/local"
def _rpartition(string, sep):
"""A replacement for str.rpartition which is missing in Python < 2.5
@@ -64,8 +66,8 @@ options = {}
options_topass = {}
-def add_option( name, help , nargs , contributesToVariantDir , dest=None,
-                type="string", choices=None ):
+def add_option( name, help, nargs, contributesToVariantDir,
+                dest=None, default = None, type="string", choices=None ):
 
     if dest is None:
         dest = name
@@ -76,6 +78,7 @@ def add_option( name, help , nargs , contributesToVariantDir , dest=None,
         nargs=nargs,
         action="store",
         choices=choices,
+        default=default,
         help=help )
options[name] = { "help" : help ,
@@ -137,7 +140,7 @@ def get_variant_dir():
return s
# installation/packaging
-add_option( "prefix" , "installation prefix" , 1 , False )
+add_option( "prefix" , "installation prefix" , 1 , False, default=DEFAULT_INSTALL_DIR )
add_option( "distname" , "dist name (0.8.0)" , 1 , False )
add_option( "distmod", "additional piece for full dist name" , 1 , False )
add_option( "nostrip", "do not strip installed binaries" , 0 , False )
@@ -220,6 +223,9 @@ add_option( "use-cpu-profiler",
add_option("mongod-concurrency-level", "Concurrency level, \"global\" or \"db\"", 1, True,
type="choice", choices=["global", "db"])
+add_option('client-dist-basename', "Name of the client source archive.", 1, False,
+ default='mongo-cxx-driver')
+
# don't run configure if user calls --help
if GetOption('help'):
Return()
@@ -278,9 +284,16 @@ usePCH = has_option( "usePCH" )
justClientLib = (COMMAND_LINE_TARGETS == ['mongoclient'])
 env = Environment( BUILD_DIR=variantDir,
+                   CLIENT_ARCHIVE='${CLIENT_DIST_BASENAME}${DIST_ARCHIVE_SUFFIX}',
+                   CLIENT_DIST_BASENAME=get_option('client-dist-basename'),
+                   CLIENT_LICENSE='#distsrc/client/LICENSE.txt',
+                   CLIENT_SCONSTRUCT='#distsrc/client/SConstruct',
+                   DIST_ARCHIVE_SUFFIX='.tgz',
                    MSVS_ARCH=msarch ,
+                   PYTHON=utils.find_python(),
+                   SERVER_ARCHIVE='${SERVER_DIST_BASENAME}${DIST_ARCHIVE_SUFFIX}',
                    TARGET_ARCH=msarch ,
-                   tools=["default", "gch", "jsheader", "mergelib" ],
+                   tools=["default", "gch", "jsheader", "mergelib"],
                    PYSYSPLATFORM=os.sys.platform,
 
                    PCRE_VERSION='8.30',
@@ -367,8 +380,6 @@ if ( not ( usesm or usev8 or justClientLib) ):
usesm = True
options_topass["usesm"] = True
-distBuild = len( COMMAND_LINE_TARGETS ) == 1 and ( str( COMMAND_LINE_TARGETS[0] ) == "s3dist" or str( COMMAND_LINE_TARGETS[0] ) == "dist" )
-
extraLibPlaces = []
env['EXTRACPPPATH'] = []
@@ -394,38 +405,18 @@ if has_option( "extralib" ):
 class InstallSetup:
     binaries = False
-    clientSrc = False
+    libraries = False
     headers = False
-    bannerFiles = tuple()
-    headerRoot = "include"
 
     def __init__(self):
         self.default()
-
+
     def default(self):
         self.binaries = True
         self.libraries = False
-        self.clientSrc = False
         self.headers = False
-        self.bannerFiles = tuple()
-        self.headerRoot = "include"
-        self.clientTestsDir = None
-
-    def justClient(self):
-        self.binaries = False
-        self.libraries = False
-        self.clientSrc = True
-        self.headers = True
-        self.bannerFiles = [ "#distsrc/client/LICENSE.txt",
-                             "#distsrc/client/SConstruct" ]
-        self.headerRoot = "mongo/"
-        self.clientTestsDir = "#src/mongo/client/examples/"
 
 installSetup = InstallSetup()
 
-if distBuild:
-    installSetup.bannerFiles = [ "#distsrc/GNU-AGPL-3.0",
-                                 "#distsrc/README",
-                                 "#distsrc/THIRD-PARTY-NOTICES", ]
 
 if has_option( "full" ):
     installSetup.headers = True
@@ -446,24 +437,14 @@ if force64:
env['PROCESSOR_ARCHITECTURE'] = processor
-DEFAULT_INSTALL_DIR = "/usr/local"
installDir = DEFAULT_INSTALL_DIR
nixLibPrefix = "lib"
-distName = GetOption( "distname" )
 dontReplacePackage = False
-
-if distBuild:
-    release = True
-
-def isDriverBuild():
-    return GetOption( "prefix" ) and GetOption( "prefix" ).find( "mongo-cxx-driver" ) >= 0
+isBuildingLatest = False
 
 if has_option( "prefix" ):
     installDir = GetOption( "prefix" )
-    if isDriverBuild():
-        installDir = '#' + installDir
-        installSetup.justClient()
def findVersion( root , choices ):
if not isinstance(root, list):
@@ -474,12 +455,6 @@ def findVersion( root , choices ):
return r + c
raise RuntimeError("can't find a version of [" + repr(root) + "] choices: " + repr(choices))
-def choosePathExist( choices , default=None):
-    for c in choices:
-        if c != None and os.path.exists( c ):
-            return c
-    return default
-
def filterExists(paths):
return filter(os.path.exists, paths)
@@ -497,7 +472,7 @@ if "darwin" == os.sys.platform:
if force64:
env.Append( EXTRACPPPATH=["/usr/64/include"] )
env.Append( EXTRALIBPATH=["/usr/64/lib"] )
- if installDir == DEFAULT_INSTALL_DIR and not distBuild:
+ if installDir == DEFAULT_INSTALL_DIR:
installDir = "/usr/64/"
else:
env.Append( EXTRACPPPATH=filterExists(["/sw/include" , "/opt/local/include"]) )
@@ -547,8 +522,8 @@ elif os.sys.platform.startswith( "openbsd" ):
elif "win32" == os.sys.platform:
windows = True
- #if force64:
- # release = True
+
+ env['DIST_ARCHIVE_SUFFIX'] = '.zip'
if has_option( "win2008plus" ):
env.Append( CPPDEFINES=[ "MONGO_USE_SRW_ON_WINDOWS" ] )
@@ -690,9 +665,9 @@ if nix:
     if not has_option('clang'):
         env.Append( CPPFLAGS=" -fno-builtin-memcmp " ) # glibc's memcmp is faster than gcc's
 
-    env.Append( CPPDEFINES="_FILE_OFFSET_BITS=64" )
-    env.Append( CXXFLAGS=" -Wnon-virtual-dtor -Woverloaded-virtual" )
-    env.Append( LINKFLAGS=" -fPIC -pthread -rdynamic" )
+    env.Append( CPPDEFINES=["_FILE_OFFSET_BITS=64"] )
+    env.Append( CXXFLAGS=["-Wnon-virtual-dtor", "-Woverloaded-virtual"] )
+    env.Append( LINKFLAGS=["-fPIC", "-pthread", "-rdynamic"] )
     env.Append( LIBS=[] )
#make scons colorgcc friendly
@@ -811,12 +786,6 @@ env['MONGO_MODULE_FILES'] = moduleFiles
# --- check system ---
-def getSysInfo():
-    if windows:
-        return "windows " + str( sys.getwindowsversion() )
-    else:
-        return " ".join( os.uname() )
-
def doConfigure( myenv , shell=False ):
conf = Configure(myenv)
myenv["LINKFLAGS_CLEAN"] = list( myenv["LINKFLAGS"] )
@@ -1067,37 +1036,23 @@ def getCodeVersion():
return None
return allMatches[0]
-if getCodeVersion() == None:
+mongoCodeVersion = getCodeVersion()
+if mongoCodeVersion is None:
Exit(-1)
-def getDistName( sofar ):
-    global distName
-    global dontReplacePackage
-
-    if distName is not None:
-        return distName
-
-    if str( COMMAND_LINE_TARGETS[0] ) == "s3dist":
-        version = getCodeVersion()
-        if not version.endswith( "+" ) and not version.endswith("-"):
-            print( "got real code version, doing release build for: " + version )
-            dontReplacePackage = True
-            distName = version
-            return version
-
+if has_option('distname'):
+    distName = GetOption( "distname" )
+elif mongoCodeVersion[-1] not in ("+", "-"):
+    dontReplacePackage = True
+    distName = mongoCodeVersion
+else:
+    isBuildingLatest = True
+    distName = utils.getGitBranchString("" , "-") + datetime.date.today().strftime("%Y-%m-%d")
 
-    return utils.getGitBranchString( "" , "-" ) + today.strftime( "%Y-%m-%d" )
+env['SERVER_DIST_BASENAME'] = 'mongodb-%s-%s' % (getSystemInstallName(), distName)
-if distBuild:
-    if isDriverBuild():
-        installDir = GetOption( "prefix" )
-    else:
-        from datetime import date
-        today = date.today()
-        installDir = "#mongodb-" + getSystemInstallName() + "-"
-        installDir += getDistName( installDir )
-        print "going to make dist: " + installDir[1:]
+distFile = "${SERVER_ARCHIVE}"
 
 env['NIX_LIB_DIR'] = nixLibPrefix
 env['INSTALL_DIR'] = installDir
@@ -1132,12 +1087,12 @@ env.AlwaysBuild( "push" )
# ---- deploying ---
-def s3push( localName , remoteName=None , remotePrefix=None , fixName=True , platformDir=True ):
-
+def s3push( localName , remoteName=None , remotePrefix=None , fixName=True , platformDir=True,
+            isDriverBuild=False ):
     localName = str( localName )
 
     if remotePrefix is None:
-        if distName is None:
+        if isBuildingLatest:
             remotePrefix = utils.getGitBranchString( "-" ) + "-latest"
         else:
             remotePrefix = "-" + distName
@@ -1161,8 +1116,8 @@ def s3push( localName , remoteName=None , remotePrefix=None , fixName=True , pla
         name = name.lower()
     else:
         name = remoteName
-
-    if isDriverBuild():
+
+    if isDriverBuild:
         name = "cxx-driver/" + name
     elif platformDir:
         name = platform + "/" + name
@@ -1182,19 +1137,15 @@ env.Alias( "s3shell" , [ "mongo" ] , [ s3shellpush ] )
env.AlwaysBuild( "s3shell" )
 def s3dist( env , target , source ):
-    s3push( distFile , "mongodb" )
+    s3push( str(source[0]) , "mongodb" )
 
-env.Append( TARFLAGS=" -z " )
-
-if installDir[-1] != "/":
-    if windows:
-        distFile = env.Zip( installDir + ".zip", installDir )[0]
-    else:
-        distFile = env.Tar( installDir + '.tgz', installDir )[0]
+def s3distclient(env, target, source):
+    s3push(str(source[0]), "cxx-driver/mongodb")
 
-    env.Alias( "dist" , distFile )
-    env.Alias( "s3dist" , [ distFile ] , [ s3dist ] )
-    env.AlwaysBuild( "s3dist" )
+env.Alias( "dist" , '$SERVER_ARCHIVE' )
+env.Alias( "distclient", "$CLIENT_ARCHIVE")
+env.AlwaysBuild(env.Alias( "s3dist" , [ '$SERVER_ARCHIVE' ] , [ s3dist ] ))
+env.AlwaysBuild(env.Alias( "s3distclient" , [ '$CLIENT_ARCHIVE' ] , [ s3distclient ] ))
# --- an uninstall target ---
if len(COMMAND_LINE_TARGETS) > 0 and 'uninstall' in COMMAND_LINE_TARGETS:
@@ -1204,6 +1155,15 @@ if len(COMMAND_LINE_TARGETS) > 0 and 'uninstall' in COMMAND_LINE_TARGETS:
BUILD_TARGETS.remove("uninstall")
BUILD_TARGETS.append("install")
+clientEnv = env.Clone()
+clientEnv['CPPDEFINES'].remove('MONGO_EXPOSE_MACROS')
+
+if not has_option('use-system-all') and not has_option('use-system-boost'):
+    clientEnv.Append(LIBS=['boost_thread', 'boost_filesystem', 'boost_system'])
+    clientEnv.Prepend(LIBPATH=['$BUILD_DIR/third_party/boost/'])
+
+clientEnv.Prepend(LIBS=['mongoclient'], LIBPATH=['.'])
+
# The following symbols are exported for use in subordinate SConscript files.
# Ideally, the SConscript files would be purely declarative. They would only
# import build environment objects, and would contain few or no conditional
@@ -1213,15 +1173,17 @@ if len(COMMAND_LINE_TARGETS) > 0 and 'uninstall' in COMMAND_LINE_TARGETS:
# conditional decision making that hasn't been moved up to this SConstruct file,
# and they are exported here, as well.
Export("env")
+Export("clientEnv")
Export("shellEnv")
Export("testEnv")
Export("has_option")
-Export("installSetup getSysInfo")
+Export("installSetup")
Export("usesm usev8")
Export("darwin windows solaris linux nix")
-env.SConscript( 'src/SConscript', variant_dir=variantDir, duplicate=False )
-env.SConscript( 'SConscript.smoke' )
+env.SConscript( 'src/SConscript', variant_dir='$BUILD_DIR', duplicate=False )
+env.SConscript( 'src/SConscript.client', variant_dir='$BUILD_DIR/client_build', duplicate=False )
+env.SConscript( ['SConscript.buildinfo', 'SConscript.smoke'] )
def clean_old_dist_builds(env, target, source):
prefix = "mongodb-%s-%s" % (platform, processor)
@@ -1237,3 +1199,5 @@ def clean_old_dist_builds(env, target, source):
env.Alias("dist_clean", [], [clean_old_dist_builds])
env.AlwaysBuild("dist_clean")
+
+env.Alias('all', ['core', 'tools', 'clientTests'])
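
The archive names above are composed entirely through SCons variable substitution, so one assignment (DIST_ARCHIVE_SUFFIX on win32) switches every archive from .tgz to .zip. A small sketch of how the expansion behaves, assuming a bare environment with the same defaults as this SConstruct (Python 2 era, matching this tree):

    # Hedged illustration of recursive variable substitution; the values
    # mirror the defaults set above but are otherwise standalone.
    env = Environment(CLIENT_DIST_BASENAME='mongo-cxx-driver',
                      DIST_ARCHIVE_SUFFIX='.tgz',
                      CLIENT_ARCHIVE='${CLIENT_DIST_BASENAME}${DIST_ARCHIVE_SUFFIX}')
    print env.subst('$CLIENT_ARCHIVE')   # mongo-cxx-driver.tgz
    env['DIST_ARCHIVE_SUFFIX'] = '.zip'  # as done in the win32 branch above
    print env.subst('$CLIENT_ARCHIVE')   # mongo-cxx-driver.zip

This is also why --client-dist-basename works: it only has to change CLIENT_DIST_BASENAME, and the "distclient" and "s3distclient" aliases pick up the new name through '$CLIENT_ARCHIVE'.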
diff --git a/buildscripts/build_and_test_client.py b/buildscripts/build_and_test_client.py
new file mode 100755
index 00000000000..e95dbb42917
--- /dev/null
+++ b/buildscripts/build_and_test_client.py
@@ -0,0 +1,59 @@
+#!/usr/bin/python
+
+'''Script to attempt an isolated build of the C++ driver and its examples.
+
+Working directory must be the repository root.
+
+Usage:
+
+./buildscripts/build_and_test_client.py <mongo client archive file> [optional scons arguments]
+
+The client is built in a temporary directory, and the sample programs are run against a mongod
+instance found in the current working directory. The temporary directory and its contents are
+destroyed at the end of execution.
+'''
+
+import os
+import shutil
+import subprocess
+import sys
+import tempfile
+import tarfile
+
+import utils
+
+def main(args):
+    archive_file = args[1]
+    scons_args = args[2:]
+    build_and_test(archive_file, scons_args)
+
+def build_and_test(archive, scons_args):
+    work_dir = tempfile.mkdtemp()
+    try:
+        extracted_root = extract_archive(work_dir, archive)
+        run_scons(extracted_root, scons_args)
+        smoke_client(extracted_root)
+    finally:
+        shutil.rmtree(work_dir)
+
+def extract_archive(work_dir, archive):
+    tf = tarfile.open(archive, 'r')
+    tf.extractall(path=work_dir)
+    return os.path.join(
+        work_dir,
+        os.path.dirname([n for n in tf.getnames() if n.endswith('SConstruct')][0]))
+
+def run_scons(extracted_root, scons_args):
+    rc = subprocess.call(['scons', '-C', extracted_root] + scons_args + ['clientTests'])
+    if rc != 0:
+        sys.exit(rc)
+
+def smoke_client(extracted_root):
+    rc = subprocess.call(utils.smoke_command("--test-path", extracted_root, "client"))
+    if rc != 0:
+        sys.exit(rc)
+
+if __name__ == '__main__':
+    main(sys.argv)
+    sys.exit(0)
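
extract_archive() assumes the layout that make_archive.py produces: a single top-level directory that contains SConstruct. A quick illustration of that root-detection logic, using made-up member names rather than a real tarball:

    # Illustration only; 'names' stands in for tf.getnames().
    import os

    names = ['mongo-cxx-driver/SConstruct',
             'mongo-cxx-driver/src/SConscript.client',
             'mongo-cxx-driver/src/mongo/client/dbclient.cpp']
    sconstruct = [n for n in names if n.endswith('SConstruct')][0]
    print os.path.dirname(sconstruct)   # mongo-cxx-driver; joined under work_dir

If the archive ever contained more than one member ending in 'SConstruct', the first match would win, so the archive layout is effectively part of the contract between this script and make_archive.py.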
diff --git a/buildscripts/make_archive.py b/buildscripts/make_archive.py
new file mode 100755
index 00000000000..c4bd0100491
--- /dev/null
+++ b/buildscripts/make_archive.py
@@ -0,0 +1,116 @@
+#!/usr/bin/python
+
+'''Helper script for constructing an archive (zip or tar) from a list of files.
+
+The output format (tar, tgz, zip) is determined from the file name, unless the user specifies
+--format on the command line.
+
+This script simplifies the specification of filename transformations, so that, e.g.,
+src/mongo/foo.cpp and build/linux2/normal/buildinfo.cpp can get put into the same
+directory in the archive, perhaps mongodb-2.0.2/src/mongo.
+
+Usage:
+
+make_archive.py -o <output-file> [--format (tar|tgz|zip)] \
+ [--transform match1=replacement1 [--transform match2=replacement2 [...]]] \
+ <input file 1> [...]
+
+If the input file names start with "@", the file is expected to contain a list of
+whitespace-separated file names to include in the archive. This helps get around the Windows
+command line length limit.
+
+Transformations are processed in command-line order and are short-circuiting. So, if a file matches
+match1, it is never compared against match2 or later. Matches are just python startswith()
+comparisons.
+
+For a detailed usage example, see src/SConscript.client or src/mongo/SConscript.
+'''
+
+import optparse
+import os
+import sys
+
+def main(argv):
+    opts = parse_options(argv[1:])
+    archive = open_archive_for_write(opts.output_filename, opts.archive_format)
+    try:
+        for input_filename in opts.input_filenames:
+            archive.add(input_filename, arcname=get_preferred_filename(input_filename,
+                                                                       opts.transformations))
+    finally:
+        archive.close()
+
+def parse_options(args):
+    parser = optparse.OptionParser()
+    parser.add_option('-o', dest='output_filename', default=None,
+                      help='Name of the archive to output.', metavar='FILE')
+    parser.add_option('--format', dest='archive_format', default=None,
+                      choices=('zip', 'tar', 'tgz'),
+                      help='Format of archive to create.  '
+                      'If omitted, use the suffix of the output filename to decide.')
+    parser.add_option('--transform', action='append', dest='transformations', default=[])
+
+    (opts, input_filenames) = parser.parse_args(args)
+    opts.input_filenames = []
+
+    for input_filename in input_filenames:
+        if input_filename.startswith('@'):
+            # Read a whitespace-separated list of file names from the response file.
+            opts.input_filenames.extend(open(input_filename[1:], 'r').read().split())
+        else:
+            opts.input_filenames.append(input_filename)
+
+    if opts.output_filename is None:
+        parser.error('-o switch is required')
+
+    if opts.archive_format is None:
+        if opts.output_filename.endswith('.zip'):
+            opts.archive_format = 'zip'
+        elif opts.output_filename.endswith('tar.gz') or opts.output_filename.endswith('.tgz'):
+            opts.archive_format = 'tgz'
+        elif opts.output_filename.endswith('.tar'):
+            opts.archive_format = 'tar'
+        else:
+            parser.error('Could not deduce archive format from output filename "%s"' %
+                         opts.output_filename)
+
+    try:
+        opts.transformations = [
+            xform.replace(os.path.altsep or os.path.sep, os.path.sep).split('=', 1)
+            for xform in opts.transformations]
+    except Exception, e:
+        parser.error(e)
+
+    return opts
+
+def open_archive_for_write(filename, archive_format):
+    '''Open a tar or zip archive for write, with the given format, and return it.
+
+    The type of archive is determined by the "archive_format" parameter, which should be
+    "tar", "tgz" (for gzipped tar) or "zip".
+    '''
+
+    if archive_format in ('tar', 'tgz'):
+        import tarfile
+        mode = 'w'
+        if archive_format == 'tgz':
+            mode += '|gz'
+        return tarfile.open(filename, mode)
+    if archive_format == 'zip':
+        import zipfile
+        # Infuriatingly, ZipFile calls the "add" method "write", but they're otherwise
+        # identical, for our purposes.  WrappedZipFile is a minimal adapter class.
+        class WrappedZipFile(zipfile.ZipFile):
+            def add(self, filename, arcname):
+                return self.write(filename, arcname)
+        return WrappedZipFile(filename, 'w', zipfile.ZIP_DEFLATED)
+    raise ValueError('Unsupported archive format "%s"' % archive_format)
+
+def get_preferred_filename(input_filename, transformations):
+    for match, replace in transformations:
+        if input_filename.startswith(match):
+            return replace + input_filename[len(match):]
+    return input_filename
+
+if __name__ == '__main__':
+    main(sys.argv)
+    sys.exit(0)
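
The short-circuiting of --transform rules matters: rules are tried in command-line order, the first startswith() match wins, and an empty match acts as a catch-all. A worked example of get_preferred_filename() with made-up paths:

    # Pure illustration of the --transform semantics documented above.
    transformations = [('build/linux2/normal/client_build', 'mongo-cxx-driver/src'),
                       ('build/linux2/normal', 'mongo-cxx-driver/src'),
                       ('', 'mongo-cxx-driver/')]

    def get_preferred_filename(input_filename, transformations):
        for match, replace in transformations:
            if input_filename.startswith(match):
                return replace + input_filename[len(match):]
        return input_filename

    print get_preferred_filename('build/linux2/normal/buildinfo.cpp', transformations)
    # mongo-cxx-driver/src/buildinfo.cpp  (second rule; the first did not match)
    print get_preferred_filename('src/mongo/foo.cpp', transformations)
    # mongo-cxx-driver/src/mongo/foo.cpp  (empty match prefixes everything else)

This mirrors the transform lists used by the archive commands in src/SConscript.client and src/mongo/SConscript.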
diff --git a/distsrc/client/SConstruct b/distsrc/client/SConstruct
index 503b71ccbc7..5b40f1a00aa 100755
--- a/distsrc/client/SConstruct
+++ b/distsrc/client/SConstruct
@@ -1,102 +1,85 @@
+# -*- mode: python -*-
+
# scons file for MongoDB c++ client library and examples
import os
-
-# options
-AddOption( "--extrapath",
-           dest="extrapath",
-           type="string",
-           nargs=1,
-           action="store",
-           help="comma separated list of add'l paths  (--extrapath /opt/foo/,/foo) static linking" )
-
-AddOption( "--prefix",
-           dest="prefix",
-           type="string",
-           nargs=1,
-           action="store",
-           default="/usr/local",
-           help="installation root" )
-
-
-env = Environment( MSVS_ARCH=None )
-
-def addExtraLibs( s ):
+import sys
+
+# options
+AddOption("--extrapath",
+          dest="extrapath",
+          type="string",
+          nargs=1,
+          action="store",
+          help="comma separated list of add'l paths (--extrapath /opt/foo/,/foo) static linking")
+
+AddOption("--prefix",
+          dest="prefix",
+          type="string",
+          nargs=1,
+          action="store",
+          default="/usr/local",
+          help="installation root")
+
+
+env = Environment(BUILD_DIR='#build',
+                  CLIENT_ARCHIVE='${CLIENT_DIST_BASENAME}${DIST_ARCHIVE_SUFFIX}',
+                  CLIENT_DIST_BASENAME='mongo-cxx-driver',
+                  CLIENT_LICENSE='#LICENSE.txt',
+                  CLIENT_SCONSTRUCT='#SConstruct',
+                  MSVS_ARCH=None,
+                  PYTHON=sys.executable)
+
+def addExtraLibs(s):
     for x in s.split(","):
-        if os.path.exists( x ):
-            env.Append( CPPPATH=[ x + "/include" ] )
-            env.Append( LIBPATH=[ x + "/lib" ] )
-            env.Append( LIBPATH=[ x + "/lib64" ] )
+        if os.path.exists(x):
+            env.Append(CPPPATH=[x + "/include", x],
+                       LIBPATH=[x + "/lib", x + "/lib64"])
 
 if GetOption( "extrapath" ) is not None:
     addExtraLibs( GetOption( "extrapath" ) )
-env.Append( CPPPATH=[ "mongo/" ] )
-
-env.Append( CPPDEFINES=[ "_SCONS" , "MONGO_EXPOSE_MACROS" ] )
+env.Prepend(CPPPATH=["$BUILD_DIR", "$BUILD_DIR/mongo"])
+env.Append(CPPDEFINES=[ "_SCONS", "MONGO_EXPOSE_MACROS" ])
 nix = False
 linux = False
-if "darwin" == os.sys.platform:
+
+if "darwin" == sys.platform:
     addExtraLibs( "/opt/local/" )
     nix = True
-elif "linux2" == os.sys.platform or "linux3" == os.sys.platform:
+elif sys.platform in ("linux2", "linux3"):
     nix = True
     linux = True
 
+if sys.platform == 'win32':
+    env['DIST_ARCHIVE_SUFFIX'] = '.zip'
+else:
+    env['DIST_ARCHIVE_SUFFIX'] = '.tgz'
+
 if nix:
-    env.Append( CPPFLAGS=" -O3" )
-    env.Append( LIBS=["pthread"] )
+    env.Append(CCFLAGS=["-O3", "-pthread"])
     if linux:
-        env.Append( LINKFLAGS=" -Wl,--as-needed -Wl,-zdefs " )
+        env.Append(LINKFLAGS=["-Wl,--as-needed", "-Wl,-zdefs"])
-boostLibs = [ "thread" , "filesystem" , "system", "thread" ]
+boostLibs = ["thread", "filesystem", "system"]
 conf = Configure(env)
 for lib in boostLibs:
-    if not conf.CheckLib("boost_%s-mt" % lib):
-        conf.CheckLib("boost_%s" % lib)
+    if not conf.CheckLib(["boost_%s-mt" % lib, "boost_%s" % lib],
+                         language="C++"):
+        Exit(1)
+conf.Finish()
-dirs = [ "" , "bson/" , "bson/util/" ,
- "client/" , "s/" , "shell/" ,
- "db/" ,
- "scripting/" ,
- "util/" , "util/concurrency/" , "util/mongoutils/" , "util/net/" ]
+clientEnv = env.Clone()
+clientEnv['CPPDEFINES'].remove('MONGO_EXPOSE_MACROS')
+clientEnv.Prepend(LIBS=['mongoclient'], LIBPATH=['.'])
-allClientFiles = []
-for x in dirs:
- allClientFiles += Glob( "mongo/" + x + "*.cpp" )
-allClientFiles += Glob( "mongo/util/*.c" )
+Export("env clientEnv")
+env.SConscript('src/SConscript.client', variant_dir='$BUILD_DIR', duplicate=False)
-libs = env.Library( "mongoclient" , allClientFiles )
+env.Default('${LIBPREFIX}mongoclient${LIBSUFFIX}')
-# install
-
-prefix = GetOption( "prefix" )
-
-for x in libs:
-    env.Install( prefix + "/lib/" , str(x) )
-
-for x in dirs:
-    x = "mongo/" + x
-    env.Install( prefix + "/include/" + x , Glob( x + "*.h" ) )
-
-env.Alias( "install" , prefix )
-
-# example setup
-
-clientTests = []
-clientEnv = env.Clone();
-clientEnv.Prepend( LIBS=["mongoclient"] )
-clientEnv.Prepend( LIBPATH=["."] )
-
-# examples
-
-clientTests += [ clientEnv.Program( "firstExample" , [ "client/examples/first.cpp" ] ) ]
-clientTests += [ clientEnv.Program( "secondExample" , [ "client/examples/second.cpp" ] ) ]
-clientTests += [ clientEnv.Program( "whereExample" , [ "client/examples/whereExample.cpp" ] ) ]
-clientTests += [ clientEnv.Program( "authTest" , [ "client/examples/authTest.cpp" ] ) ]
-clientTests += [ clientEnv.Program( "httpClientTest" , [ "client/examples/httpClientTest.cpp" ] ) ]
-clientTests += [ clientEnv.Program( "clientTest" , [ "client/examples/clientTest.cpp" ] ) ]
-clientEnv.Alias("clientTests", clientTests, [])
+# install
+env.Alias("install", GetOption('prefix'))
diff --git a/src/SConscript.client b/src/SConscript.client
new file mode 100644
index 00000000000..cb62622808a
--- /dev/null
+++ b/src/SConscript.client
@@ -0,0 +1,133 @@
+# -*- mode: python -*-
+
+# This SConscript describes build and install rules for the Mongo C++ driver and associated
+# example programs.
+
+Import('env clientEnv')
+
+clientSource = [
+ 'mongo/bson/oid.cpp',
+ 'mongo/buildinfo.cpp',
+ 'mongo/client/clientAndShell.cpp',
+ 'mongo/client/clientOnly.cpp',
+ 'mongo/client/connpool.cpp',
+ 'mongo/client/dbclient.cpp',
+ 'mongo/client/dbclient_rs.cpp',
+ 'mongo/client/dbclientcursor.cpp',
+ 'mongo/client/distlock.cpp',
+ 'mongo/client/gridfs.cpp',
+ 'mongo/client/model.cpp',
+ 'mongo/client/syncclusterconnection.cpp',
+ 'mongo/db/jsobj.cpp',
+ 'mongo/db/json.cpp',
+ 'mongo/db/lasterror.cpp',
+ 'mongo/db/namespace.cpp',
+ 'mongo/db/nonce.cpp',
+ 'mongo/pch.cpp',
+ 'mongo/util/assert_util.cpp',
+ 'mongo/util/background.cpp',
+ 'mongo/util/base64.cpp',
+ 'mongo/util/concurrency/rwlockimpl.cpp',
+ 'mongo/util/concurrency/spin_lock.cpp',
+ 'mongo/util/concurrency/synchronization.cpp',
+ 'mongo/util/concurrency/task.cpp',
+ 'mongo/util/concurrency/thread_pool.cpp',
+ 'mongo/util/concurrency/vars.cpp',
+ 'mongo/util/debug_util.cpp',
+ 'mongo/util/file_allocator.cpp',
+ 'mongo/util/histogram.cpp',
+ 'mongo/util/intrusive_counter.cpp',
+ 'mongo/util/log.cpp',
+ 'mongo/util/md5.cpp',
+ 'mongo/util/md5main.cpp',
+ 'mongo/util/net/httpclient.cpp',
+ 'mongo/util/net/listen.cpp',
+ 'mongo/util/net/message.cpp',
+ 'mongo/util/net/message_port.cpp',
+ 'mongo/util/net/sock.cpp',
+ 'mongo/util/password.cpp',
+ 'mongo/util/ramlog.cpp',
+ 'mongo/util/signal_handlers.cpp',
+ 'mongo/util/stringutils.cpp',
+ 'mongo/util/text.cpp',
+ 'mongo/util/trace.cpp',
+ 'mongo/util/util.cpp',
+ ]
+
+exampleSourceMap = [
+ ('firstExample', 'mongo/client/examples/first.cpp'),
+ ('rsExample', 'mongo/client/examples/rs.cpp'),
+ ('secondExample', 'mongo/client/examples/second.cpp'),
+ ('whereExample', 'mongo/client/examples/whereExample.cpp'),
+ ('authTest', 'mongo/client/examples/authTest.cpp'),
+ ('httpClientTest', 'mongo/client/examples/httpClientTest.cpp'),
+ ('bsondemo', 'mongo/bson/bsondemo/bsondemo.cpp'),
+ ('clientTest', 'mongo/client/examples/clientTest.cpp'),
+ ]
+
+clientHeaders = []
+for id in ["",
+           "util/",
+           "util/net/",
+           "util/mongoutils/",
+           "util/concurrency/",
+           "db/",
+           "db/stats/",
+           "db/repl/",
+           "db/ops/",
+           "client/",
+           "bson/",
+           "bson/util/",
+           "s/",
+           "scripting/"]:
+    clientHeaders.extend(Glob('mongo/%s*.h' % id))
+    clientHeaders.extend(Glob('mongo/%s*.hpp' % id))
+
+env.Install('#/', [
+ env.Library('mongoclient', clientSource),
+ #env.SharedLibrary('mongoclient', clientSource),
+ ])
+
+clientTests = clientEnv.Install('#/', [
+ clientEnv.Program(target, [source]) for (target, source) in exampleSourceMap])
+
+clientEnv.Alias('clientTests', clientTests, [])
+
+env.Install(
+    '#/',
+    env.Command('$CLIENT_ARCHIVE',
+                ['#buildscripts/make_archive.py',
+                 '$CLIENT_SCONSTRUCT',
+                 '$CLIENT_LICENSE',
+                 'SConscript.client',
+                 '#buildscripts/make_archive.py',
+                 clientSource,
+                 clientHeaders,
+                 [source for (target, source) in exampleSourceMap]],
+                '${PYTHON} ${SOURCES[0]} -o $TARGET '
+                '--transform ${str(Dir(BUILD_DIR))}/client_build=$CLIENT_DIST_BASENAME/src '
+                '--transform ${str(Dir(BUILD_DIR))}=$CLIENT_DIST_BASENAME/src '
+                '--transform distsrc/client=$CLIENT_DIST_BASENAME '
+                '--transform =$CLIENT_DIST_BASENAME/ '
+                '${TEMPFILE(SOURCES[1:])}'))
+
+# install
+prefix = GetOption("prefix")
+
+env.Install(prefix + "/lib", '${LIBPREFIX}mongoclient${LIBSUFFIX}')
+
+for x in ["",
+ "bson/",
+ "bson/util/",
+ "client/",
+ "s/",
+ "shell/",
+ "db/",
+ "scripting/",
+ "util/",
+ "util/concurrency/",
+ "util/mongoutils/",
+ "util/net/" ]:
+ env.Install(prefix + "/include/mongo/" + x,
+ [Glob('mongo/%s*.h' % x), Glob('mongo/%s*.hpp' % x)])
+
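
The '${TEMPFILE(SOURCES[1:])}' in the archive command pairs with make_archive.py's '@' support: when the argument list would exceed the platform's command-line limit, SCons writes the arguments to a temporary file and substitutes '@<file>' (the default TEMPFILEPREFIX) in their place. A sketch of the consuming side, with a hypothetical list file standing in for the one TEMPFILE generates:

    # Expand '@' response-file arguments into plain file names.
    def expand_inputs(args):
        inputs = []
        for arg in args:
            if arg.startswith('@'):
                inputs.extend(open(arg[1:], 'r').read().split())
            else:
                inputs.append(arg)
        return inputs

    open('filelist.txt', 'w').write('src/mongo/a.cpp src/mongo/b.cpp')
    print expand_inputs(['SConstruct', '@filelist.txt'])
    # ['SConstruct', 'src/mongo/a.cpp', 'src/mongo/b.cpp']

Note also that make_archive.py appears twice in the Command's source list above: once as SOURCES[0], the script to run, and once among SOURCES[1:], so that the script itself ships inside the client source archive.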
diff --git a/src/mongo/SConscript b/src/mongo/SConscript
index 6fc891d48b8..ae484fbf077 100644
--- a/src/mongo/SConscript
+++ b/src/mongo/SConscript
@@ -10,42 +10,21 @@ Import("shellEnv")
Import("testEnv")
Import("has_option")
Import("usesm usev8")
-Import("installSetup getSysInfo")
+Import("installSetup")
Import("darwin windows solaris linux nix")
def add_exe( v ):
return "${PROGPREFIX}%s${PROGSUFFIX}" % v
-def setupBuildInfoFile( env, target, source, **kw ):
-    version = utils.getGitVersion()
-    sysInfo = getSysInfo()
-    contents = '\n'.join([
-        '#include "pch.h"',
-        '#include <iostream>',
-        '#include <boost/version.hpp>',
-        'namespace mongo { const char * gitVersion(){ return "' + version + '"; } }',
-        'namespace mongo { string sysInfo(){ return "' + sysInfo + ' BOOST_LIB_VERSION=" BOOST_LIB_VERSION ; } }',
-        ])
-
-    contents += '\n\n';
-
-    out = open( str( target[0] ) , 'wb' )
-    try:
-        out.write( contents )
-    finally:
-        out.close()
-
-env.AlwaysBuild( env.Command( 'buildinfo.cpp', [], setupBuildInfoFile ) )
-
# ------ SOURCE FILE SETUP -----------
commonFiles = [ "pch.cpp",
"buildinfo.cpp",
- "db/indexkey.cpp",
"db/jsobj.cpp",
"bson/oid.cpp",
"db/json.cpp",
"db/lasterror.cpp",
+ "db/namespace.cpp",
"db/nonce.cpp",
"db/queryutil.cpp",
"db/querypattern.cpp",
@@ -111,6 +90,7 @@ coreServerFiles = [ "util/version.cpp",
"db/commands/cloud.cpp",
"db/dbmessage.cpp",
"db/commands/pipeline.cpp",
+ "db/indexkey.cpp",
"db/pipeline/accumulator.cpp",
"db/pipeline/accumulator_add_to_set.cpp",
"db/pipeline/accumulator_avg.cpp",
@@ -156,14 +136,6 @@ coreServerFiles = [ "util/version.cpp",
if "win32" == os.sys.platform:
coreServerFiles.append( "util/ntservice.cpp" )
-clientFiles = commonFiles + [
- 'client/clientAndShell.cpp',
- 'client/clientOnly.cpp',
- 'client/gridfs.cpp',
- 'db/commands.cpp',
-]
-
-
if usesm:
coreServerFiles.append( "scripting/engine_spidermonkey.cpp" )
elif usev8:
@@ -243,7 +215,7 @@ serverOnlyFiles = [ "db/curop.cpp",
"db/repl_block.cpp",
"db/btreecursor.cpp",
"db/cloner.cpp",
- "db/namespace.cpp",
+ "db/namespace_details.cpp",
"db/cap.cpp",
"db/matcher_covered.cpp",
"db/dbeval.cpp",
@@ -375,31 +347,10 @@ env.Install( '#/', mongos )
env.Library("clientandshell", "client/clientAndShell.cpp", LIBDEPS=["mongocommon", "coredb", "defaultversion", "gridfs"])
env.Library("allclient", "client/clientOnly.cpp", LIBDEPS=["clientandshell"])
-# c++ library
-clientLib = env.MergeLibrary( "mongoclient", ["allclient"] )
-env.Install( '#/', clientLib )
-clientLibName = str( clientLib[0] )
+
if has_option( "sharedclient" ):
sharedClientLibName = str( env.SharedLibrary( "mongoclient", [], LIBDEPS=["allclient"], _LIBDEPS='$_LIBDEPS_OBJS' )[0] )
-clientEnv = env.Clone();
-clientEnv.Append( CPPPATH=["../"] )
-clientEnv.Prepend( LIBS=[ clientLib ] )
-clientEnv.Prepend( LIBPATH=["."] )
-clientEnv["CPPDEFINES"].remove( "MONGO_EXPOSE_MACROS" )
-l = clientEnv[ "LIBS" ]
-
-# examples
-clientTests = [
- clientEnv.Program( "firstExample", [ "client/examples/first.cpp" ] ),
- clientEnv.Program( "rsExample", [ "client/examples/rs.cpp" ] ),
- clientEnv.Program( "secondExample", [ "client/examples/second.cpp" ] ),
- clientEnv.Program( "whereExample", [ "client/examples/whereExample.cpp" ] ),
- clientEnv.Program( "authTest", [ "client/examples/authTest.cpp" ] ),
- clientEnv.Program( "httpClientTest", [ "client/examples/httpClientTest.cpp" ] ),
- clientEnv.Program( "bsondemo", [ "bson/bsondemo/bsondemo.cpp" ] ),
- ]
-
# dbtests test binary
env.StaticLibrary('testframework', ['dbtests/framework.cpp'])
@@ -412,13 +363,10 @@ if len(testEnv.subst('$PROGSUFFIX')):
testEnv.Alias( "test", "#/${PROGPREFIX}test${PROGSUFFIX}" )
env.Install( '#/', testEnv.Program( "perftest", [ "dbtests/perf/perftest.cpp" ], LIBDEPS=["serveronly", "coreserver", "coredb", "testframework" ] ) )
-clientTests += [ clientEnv.Program( "clientTest", [ "client/examples/clientTest.cpp" ] ) ]
-
-env.Install( '#/', clientTests )
# --- sniffer ---
mongosniff_built = False
-if darwin or clientEnv["_HAVEPCAP"]:
+if darwin or env["_HAVEPCAP"]:
mongosniff_built = True
sniffEnv = env.Clone()
sniffEnv.Append( CPPDEFINES="MONGO_EXPOSE_MACROS" )
@@ -474,36 +422,36 @@ def checkGlibc(target,source,env):
print( "************* " + str( target[0] ) + " has GLIBC_2.4 dependencies!" )
Exit(-3)
-allBinaries = []
+distBinaries = []
 def installBinary( e, name ):
-    if not installSetup.binaries:
-        return
-
-    global allBinaries
+    global distBinaries
 
     name = add_exe( name )
 
-    inst = e.Install( "$INSTALL_DIR/bin", name )
+    if (not has_option( "no-glibc-check" ) and linux and "s3dist" in COMMAND_LINE_TARGETS):
+        e.AddPostAction( name, checkGlibc )
 
-    allBinaries += [ name ]
     if (solaris or linux) and (not has_option("nostrip")):
-        e.AddPostAction( inst, 'strip $TARGET' )
+        name = e.Command('stripped/%s' % name, name, 'strip -o $TARGET $SOURCE')[0]
 
-    if not has_option( "no-glibc-check" ) and linux and len( COMMAND_LINE_TARGETS ) == 1 and str( COMMAND_LINE_TARGETS[0] ) == "s3dist":
-        e.AddPostAction( inst, checkGlibc )
+    distBinaries.append(name)
+
+    if not installSetup.binaries:
+        return
+
+    inst = e.Install( "$INSTALL_DIR/bin", name )
 
     if nix:
         e.AddPostAction( inst, 'chmod 755 $TARGET' )
-for x in normalTools:
-    installBinary( env, "mongo" + x )
-installBinary( env, "mongofiles" )
-installBinary( env, "bsondump" )
-installBinary( env, "mongoperf" )
+for t in ["mongo" + x for x in normalTools] + ["mongofiles", "bsondump", "mongoperf"]:
+    installBinary( env, t )
+    env.Alias("tools", '#/' + add_exe(t))
 
 if mongosniff_built:
     installBinary(env, "mongosniff")
+    env.Alias("tools", '#/' + add_exe("mongosniff"))
installBinary( env, "mongod" )
installBinary( env, "mongos" )
@@ -511,61 +459,39 @@ installBinary( env, "mongos" )
if shellEnv is not None:
installBinary( env, "mongo" )
-env.Alias( "all", ['#/%s' % b for b in allBinaries ] )
env.Alias( "core", [ '#/%s' % b for b in [ add_exe( "mongo" ), add_exe( "mongod" ), add_exe( "mongos" ) ] ] )
#headers
if installSetup.headers:
for id in [ "", "util/", "util/net/", "util/mongoutils/", "util/concurrency/", "db/", "db/stats/", "db/repl/", "db/ops/", "client/", "bson/", "bson/util/", "s/", "scripting/" ]:
- env.Install( "$INSTALL_DIR/" + installSetup.headerRoot + "/" + id, Glob( id + "*.h" ) )
- env.Install( "$INSTALL_DIR/" + installSetup.headerRoot + "/" + id, Glob( id + "*.hpp" ) )
-
-if installSetup.clientSrc:
- for x in clientFiles:
- if isinstance(x, basestring):
- x = [x]
- for path in x:
- path = str(path)
- dirname, filename = os.path.split(path)
- env.Install( "$INSTALL_DIR/mongo/" + dirname , path )
+ env.Install( "$INSTALL_DIR/include/" + id, Glob( id + "*.h" ) )
+ env.Install( "$INSTALL_DIR/include/" + id, Glob( id + "*.hpp" ) )
#lib
if installSetup.libraries:
- env.Install( "$INSTALL_DIR/$NIX_LIB_DIR", clientLibName )
+ env.Install('$INSTALL_DIR/$NIX_LIB_DIR', '#${LIBPREFIX}mongoclient${LIBSUFFIX}')
if has_option( "sharedclient" ):
- env.Install( "$INSTALL_DIR/$NIX_LIB_DIR", sharedClientLibName )
-
-#textfiles
-env.Install( "$INSTALL_DIR", installSetup.bannerFiles )
-
-if installSetup.clientTestsDir:
- env.Install( '$INSTALL_DIR/client/', installSetup.clientTestsDir )
+ env.Install( "$INSTALL_DIR/$NIX_LIB_DIR", '#${SHLIBPREFIX}mongoclient${SHLIBSUFFIX}')
+
+env.Command(
+    '#/${SERVER_ARCHIVE}',
+    ['#buildscripts/make_archive.py',
+     '#distsrc/GNU-AGPL-3.0',
+     '#distsrc/README',
+     '#distsrc/THIRD-PARTY-NOTICES',
+     distBinaries],
+    '$PYTHON ${SOURCES[0]} -o $TARGET '
+    '--transform distsrc=$SERVER_DIST_BASENAME '
+    '--transform ${str(Dir(BUILD_DIR))}/mongo/stripped=$SERVER_DIST_BASENAME/bin '
+    '--transform ${str(Dir(BUILD_DIR))}/mongo=$SERVER_DIST_BASENAME/bin '
+    '${TEMPFILE(SOURCES[1:])}')
#final alias
env.Alias( "install", "$INSTALL_DIR" )
-# aliases
-env.Alias( "mongoclient", '#/%s' % ( has_option( "sharedclient" ) and sharedClientLibName or clientLibName ) )
-
-# client dist
-def build_and_test_client(env, target, source):
-    import subprocess
-
-    installDir = env.subst('$INSTALL_DIR', target=target, source=source)
-    installDir = env.GetBuildPath(installDir)
-    if GetOption("extrapath") is not None:
-        scons_command = ["scons", "--extrapath=" + GetOption("extrapath")]
-    else:
-        scons_command = ["scons"]
-
-    exit_code = subprocess.call(scons_command + ["clientTests"], cwd=installDir)
-    if exit_code:
-        return exit_code
-
-    smoke_cmd = utils.smoke_command("--test-path", installDir, "client")
-    exit_code = subprocess.call(smoke_cmd)
-    if exit_code:
-        return exit_code
-
-env.Alias("clientBuild", [mongod, '$INSTALL_DIR'], [build_and_test_client])
+env.Alias("clientBuild", ['#buildscripts/build_and_test_client.py',
+                          '#/${PROGPREFIX}mongod${PROGSUFFIX}',
+                          '#$CLIENT_ARCHIVE'],
+          '$PYTHON ${SOURCES[0]} ${SOURCES[2]}')
env.AlwaysBuild("clientBuild")
diff --git a/src/mongo/client/dbclient.cpp b/src/mongo/client/dbclient.cpp
index 14fc7aaddd9..48e0edbcd0a 100644
--- a/src/mongo/client/dbclient.cpp
+++ b/src/mongo/client/dbclient.cpp
@@ -15,18 +15,26 @@
* limitations under the License.
*/
-#include "pch.h"
-#include "dbclient.h"
-#include "../bson/util/builder.h"
-#include "../db/jsobj.h"
-#include "../db/json.h"
-#include "../db/instance.h"
-#include "../util/md5.hpp"
-#include "../db/dbmessage.h"
-#include "../db/cmdline.h"
-#include "connpool.h"
-#include "../s/util.h"
-#include "syncclusterconnection.h"
+#include "mongo/pch.h"
+
+#include "mongo/client/dbclient.h"
+
+#include "mongo/bson/util/builder.h"
+#include "mongo/client/constants.h"
+#include "mongo/client/dbclient_rs.h"
+#include "mongo/client/dbclientcursor.h"
+#include "mongo/client/syncclusterconnection.h"
+#include "mongo/db/jsobj.h"
+#include "mongo/db/json.h"
+#include "mongo/db/namespace-inl.h"
+#include "mongo/db/namespacestring.h"
+#include "mongo/s/util.h"
+#include "mongo/util/md5.hpp"
+
+#ifdef MONGO_SSL
+// TODO: Remove references to cmdline from the client.
+#include "mongo/db/cmdline.h"
+#endif // defined MONGO_SSL
namespace mongo {
@@ -148,6 +156,12 @@ namespace mongo {
}
+ Query::Query( const string &json ) : obj( fromjson( json ) ) {}
+
+ Query::Query( const char *json ) : obj( fromjson( json ) ) {}
+
+ Query& Query::hint(const string &jsonKeyPatt) { return hint( fromjson( jsonKeyPatt ) ); }
+
Query& Query::where(const string &jscode, BSONObj scope) {
/* use where() before sort() and hint() and explain(), else this will assert. */
assert( ! isComplex() );
diff --git a/src/mongo/client/dbclient.h b/src/mongo/client/dbclient.h
index d2ad1ad0580..698f091874b 100644
--- a/src/mongo/client/dbclient.h
+++ b/src/mongo/client/dbclient.h
@@ -1,6 +1,7 @@
/** @file dbclient.h
- Core MongoDB C++ driver interfaces are defined here.
+   Include this file when writing client C++ applications, to get access to the
+   MongoDB C++ driver.
*/
/* Copyright 2009 10gen Inc.
@@ -20,1044 +21,10 @@
#pragma once
-#include "../pch.h"
-#include "../util/net/message.h"
-#include "../util/net/message_port.h"
-#include "../db/jsobj.h"
-#include "../db/json.h"
-#include "../db/security.h"
-#include <stack>
+#include "mongo/client/redef_macros.h"
-namespace mongo {
+#include "mongo/client/dbclient_rs.h"
+#include "mongo/client/dbclientcursor.h"
+#include "mongo/client/dbclientinterface.h"
- /** the query field 'options' can have these bits set: */
- enum QueryOptions {
- /** Tailable means cursor is not closed when the last data is retrieved. rather, the cursor marks
- the final object's position. you can resume using the cursor later, from where it was located,
- if more data were received. Set on dbQuery and dbGetMore.
-
- like any "latent cursor", the cursor may become invalid at some point -- for example if that
- final object it references were deleted. Thus, you should be prepared to requery if you get back
- ResultFlag_CursorNotFound.
- */
- QueryOption_CursorTailable = 1 << 1,
-
- /** allow query of replica slave. normally these return an error except for namespace "local".
- */
- QueryOption_SlaveOk = 1 << 2,
-
- // findingStart mode is used to find the first operation of interest when
- // we are scanning through a repl log. For efficiency in the common case,
- // where the first operation of interest is closer to the tail than the head,
- // we start from the tail of the log and work backwards until we find the
- // first operation of interest. Then we scan forward from that first operation,
- // actually returning results to the client. During the findingStart phase,
- // we release the db mutex occasionally to avoid blocking the db process for
- // an extended period of time.
- QueryOption_OplogReplay = 1 << 3,
-
-        /** The server normally times out idle cursors after an inactivity period to prevent excess memory use.
-            Set this option to prevent that.
-        */
- QueryOption_NoCursorTimeout = 1 << 4,
-
- /** Use with QueryOption_CursorTailable. If we are at the end of the data, block for a while rather
- than returning no data. After a timeout period, we do return as normal.
- */
- QueryOption_AwaitData = 1 << 5,
-
- /** Stream the data down full blast in multiple "more" packages, on the assumption that the client
- will fully read all data queried. Faster when you are pulling a lot of data and know you want to
- pull it all down. Note: it is not allowed to not read all the data unless you close the connection.
-
- Use the query( boost::function<void(const BSONObj&)> f, ... ) version of the connection's query()
- method, and it will take care of all the details for you.
- */
- QueryOption_Exhaust = 1 << 6,
-
- /** When sharded, this means its ok to return partial results
- Usually we will fail a query if all required shards aren't up
- If this is set, it'll be a partial result set
- */
- QueryOption_PartialResults = 1 << 7 ,
-
- QueryOption_AllSupported = QueryOption_CursorTailable | QueryOption_SlaveOk | QueryOption_OplogReplay | QueryOption_NoCursorTimeout | QueryOption_AwaitData | QueryOption_Exhaust | QueryOption_PartialResults
-
- };
-
- enum UpdateOptions {
- /** Upsert - that is, insert the item if no matching item is found. */
- UpdateOption_Upsert = 1 << 0,
-
- /** Update multiple documents (if multiple documents match query expression).
- (Default is update a single document and stop.) */
- UpdateOption_Multi = 1 << 1,
-
- /** flag from mongo saying this update went everywhere */
- UpdateOption_Broadcast = 1 << 2
- };
-
- enum RemoveOptions {
- /** only delete one option */
- RemoveOption_JustOne = 1 << 0,
-
- /** flag from mongo saying this update went everywhere */
- RemoveOption_Broadcast = 1 << 1
- };
-
-
- /**
-     * need to put in DbMessage::ReservedOptions as well
- */
- enum InsertOptions {
-        /** With multi-insert, keep processing inserts if one fails */
- InsertOption_ContinueOnError = 1 << 0
- };
-
- class DBClientBase;
-
- /**
- * ConnectionString handles parsing different ways to connect to mongo and determining method
- * samples:
- * server
- * server:port
- * foo/server:port,server:port SET
- * server,server,server SYNC
- *
-     * typical use
- * string errmsg,
- * ConnectionString cs = ConnectionString::parse( url , errmsg );
- * if ( ! cs.isValid() ) throw "bad: " + errmsg;
- * DBClientBase * conn = cs.connect( errmsg );
- */
- class ConnectionString {
- public:
- enum ConnectionType { INVALID , MASTER , PAIR , SET , SYNC };
-
- ConnectionString() {
- _type = INVALID;
- }
-
- ConnectionString( const HostAndPort& server ) {
- _type = MASTER;
- _servers.push_back( server );
- _finishInit();
- }
-
- ConnectionString( ConnectionType type , const string& s , const string& setName = "" ) {
- _type = type;
- _setName = setName;
- _fillServers( s );
-
- switch ( _type ) {
- case MASTER:
- assert( _servers.size() == 1 );
- break;
- case SET:
- assert( _setName.size() );
- assert( _servers.size() >= 1 ); // 1 is ok since we can derive
- break;
- case PAIR:
- assert( _servers.size() == 2 );
- break;
- default:
- assert( _servers.size() > 0 );
- }
-
- _finishInit();
- }
-
- ConnectionString( const string& s , ConnectionType favoredMultipleType ) {
- _type = INVALID;
-
- _fillServers( s );
- if ( _type != INVALID ) {
- // set already
- }
- else if ( _servers.size() == 1 ) {
- _type = MASTER;
- }
- else {
- _type = favoredMultipleType;
- assert( _type == SET || _type == SYNC );
- }
- _finishInit();
- }
-
- bool isValid() const { return _type != INVALID; }
-
- string toString() const { return _string; }
-
- DBClientBase* connect( string& errmsg, double socketTimeout = 0 ) const;
-
- string getSetName() const { return _setName; }
-
- vector<HostAndPort> getServers() const { return _servers; }
-
- ConnectionType type() const { return _type; }
-
- static ConnectionString parse( const string& url , string& errmsg );
-
- static string typeToString( ConnectionType type );
-
- private:
-
- void _fillServers( string s );
- void _finishInit();
-
- ConnectionType _type;
- vector<HostAndPort> _servers;
- string _string;
- string _setName;
- };
-
- /**
- * controls how much a clients cares about writes
- * default is NORMAL
- */
- enum WriteConcern {
- W_NONE = 0 , // TODO: not every connection type fully supports this
- W_NORMAL = 1
- // TODO SAFE = 2
- };
-
- class BSONObj;
- class ScopedDbConnection;
- class DBClientCursor;
- class DBClientCursorBatchIterator;
-
- /** Represents a Mongo query expression. Typically one uses the QUERY(...) macro to construct a Query object.
- Examples:
- QUERY( "age" << 33 << "school" << "UCLA" ).sort("name")
- QUERY( "age" << GT << 30 << LT << 50 )
- */
- class Query {
- public:
- BSONObj obj;
- Query() : obj(BSONObj()) { }
- Query(const BSONObj& b) : obj(b) { }
- Query(const string &json) :
- obj(fromjson(json)) { }
- Query(const char * json) :
- obj(fromjson(json)) { }
-
- /** Add a sort (ORDER BY) criteria to the query expression.
- @param sortPattern the sort order template. For example to order by name ascending, time descending:
- { name : 1, ts : -1 }
- i.e.
- BSON( "name" << 1 << "ts" << -1 )
- or
- fromjson(" name : 1, ts : -1 ")
- */
- Query& sort(const BSONObj& sortPattern);
-
- /** Add a sort (ORDER BY) criteria to the query expression.
- This version of sort() assumes you want to sort on a single field.
- @param asc = 1 for ascending order
- asc = -1 for descending order
- */
- Query& sort(const string &field, int asc = 1) { sort( BSON( field << asc ) ); return *this; }
-
- /** Provide a hint to the query.
- @param keyPattern Key pattern for the index to use.
- Example:
- hint("{ts:1}")
- */
- Query& hint(BSONObj keyPattern);
- Query& hint(const string &jsonKeyPatt) { return hint(fromjson(jsonKeyPatt)); }
-
- /** Provide min and/or max index limits for the query.
- min <= x < max
- */
- Query& minKey(const BSONObj &val);
- /**
- max is exclusive
- */
- Query& maxKey(const BSONObj &val);
-
- /** Return explain information about execution of this query instead of the actual query results.
- Normally it is easier to use the mongo shell to run db.find(...).explain().
- */
- Query& explain();
-
- /** Use snapshot mode for the query. Snapshot mode assures no duplicates are returned, or objects missed, which were
- present at both the start and end of the query's execution (if an object is new during the query, or deleted during
- the query, it may or may not be returned, even with snapshot mode).
-
- Note that short query responses (less than 1MB) are always effectively snapshotted.
-
- Currently, snapshot mode may not be used with sorting or explicit hints.
- */
- Query& snapshot();
-
- /** Queries to the Mongo database support a $where parameter option which contains
- a javascript function that is evaluated to see whether objects being queried match
- its criteria. Use this helper to append such a function to a query object.
- Your query may also contain other traditional Mongo query terms.
-
- @param jscode The javascript function to evaluate against each potential object
- match. The function must return true for matched objects. Use the this
- variable to inspect the current object.
- @param scope SavedContext for the javascript object. List in a BSON object any
- variables you would like defined when the jscode executes. One can think
- of these as "bind variables".
-
- Examples:
- conn.findOne("test.coll", Query("{a:3}").where("this.b == 2 || this.c == 3"));
- Query badBalance = Query().where("this.debits - this.credits < 0");
- */
- Query& where(const string &jscode, BSONObj scope);
- Query& where(const string &jscode) { return where(jscode, BSONObj()); }
-
- /**
- * @return true if this query has an orderby, hint, or some other field
- */
- bool isComplex( bool * hasDollar = 0 ) const;
-
- BSONObj getFilter() const;
- BSONObj getSort() const;
- BSONObj getHint() const;
- bool isExplain() const;
-
- string toString() const;
- operator string() const { return toString(); }
- private:
- void makeComplex();
- template< class T >
- void appendComplex( const char *fieldName, const T& val ) {
- makeComplex();
- BSONObjBuilder b;
- b.appendElements(obj);
- b.append(fieldName, val);
- obj = b.obj();
- }
- };
-
- /**
- * Represents a full query description, including all options required for the query to be passed on
- * to other hosts
- */
- class QuerySpec {
-
- string _ns;
- int _ntoskip;
- int _ntoreturn;
- int _options;
- BSONObj _query;
- BSONObj _fields;
- Query _queryObj;
-
- public:
-
- QuerySpec( const string& ns,
- const BSONObj& query, const BSONObj& fields,
- int ntoskip, int ntoreturn, int options )
- : _ns( ns ), _ntoskip( ntoskip ), _ntoreturn( ntoreturn ), _options( options ),
- _query( query.getOwned() ), _fields( fields.getOwned() ) , _queryObj( _query ) {
- }
-
- QuerySpec() {}
-
- bool isEmpty() const { return _ns.size() == 0; }
-
- bool isExplain() const { return _queryObj.isExplain(); }
- BSONObj filter() const { return _queryObj.getFilter(); }
-
- BSONObj hint() const { return _queryObj.getHint(); }
- BSONObj sort() const { return _queryObj.getSort(); }
- BSONObj query() const { return _query; }
- BSONObj fields() const { return _fields; }
- BSONObj* fieldsData() { return &_fields; }
-
-        // don't love this, but needed downstream
- const BSONObj* fieldsPtr() const { return &_fields; }
-
- string ns() const { return _ns; }
- int ntoskip() const { return _ntoskip; }
- int ntoreturn() const { return _ntoreturn; }
- int options() const { return _options; }
-
- void setFields( BSONObj& o ) { _fields = o.getOwned(); }
-
- string toString() const {
- return str::stream() << "QSpec " <<
- BSON( "ns" << _ns << "n2skip" << _ntoskip << "n2return" << _ntoreturn << "options" << _options
- << "query" << _query << "fields" << _fields );
- }
-
- };
-
-
- /** Typically one uses the QUERY(...) macro to construct a Query object.
- Example: QUERY( "age" << 33 << "school" << "UCLA" )
- */
-#define QUERY(x) mongo::Query( BSON(x) )
-
- // Useful utilities for namespaces
- /** @return the database name portion of an ns string */
- string nsGetDB( const string &ns );
-
- /** @return the collection name portion of an ns string */
- string nsGetCollection( const string &ns );
-
- /**
- interface that handles communication with the db
- */
- class DBConnector {
- public:
- virtual ~DBConnector() {}
- /** actualServer is set to the actual server where they call went if there was a choice (SlaveOk) */
- virtual bool call( Message &toSend, Message &response, bool assertOk=true , string * actualServer = 0 ) = 0;
- virtual void say( Message &toSend, bool isRetry = false , string * actualServer = 0 ) = 0;
- virtual void sayPiggyBack( Message &toSend ) = 0;
- /* used by QueryOption_Exhaust. To use that your subclass must implement this. */
- virtual bool recv( Message& m ) { assert(false); return false; }
- // In general, for lazy queries, we'll need to say, recv, then checkResponse
- virtual void checkResponse( const char* data, int nReturned, bool* retry = NULL, string* targetHost = NULL ) {
- if( retry ) *retry = false; if( targetHost ) *targetHost = "";
- }
- virtual bool lazySupported() const = 0;
- };
-
- /**
- The interface that any db connection should implement
- */
- class DBClientInterface : boost::noncopyable {
- public:
- virtual auto_ptr<DBClientCursor> query(const string &ns, Query query, int nToReturn = 0, int nToSkip = 0,
- const BSONObj *fieldsToReturn = 0, int queryOptions = 0 , int batchSize = 0 ) = 0;
-
- virtual void insert( const string &ns, BSONObj obj , int flags=0) = 0;
-
- virtual void insert( const string &ns, const vector< BSONObj >& v , int flags=0) = 0;
-
- virtual void remove( const string &ns , Query query, bool justOne = 0 ) = 0;
-
- virtual void update( const string &ns , Query query , BSONObj obj , bool upsert = 0 , bool multi = 0 ) = 0;
-
- virtual ~DBClientInterface() { }
-
- /**
- @return a single object that matches the query. if none do, then the object is empty
- @throws AssertionException
- */
- virtual BSONObj findOne(const string &ns, const Query& query, const BSONObj *fieldsToReturn = 0, int queryOptions = 0);
-
- /** query N objects from the database into an array. makes sense mostly when you want a small number of results. if a huge number, use
- query() and iterate the cursor.
- */
- void findN(vector<BSONObj>& out, const string&ns, Query query, int nToReturn, int nToSkip = 0, const BSONObj *fieldsToReturn = 0, int queryOptions = 0);
-
- virtual string getServerAddress() const = 0;
-
- /** don't use this - called automatically by DBClientCursor for you */
- virtual auto_ptr<DBClientCursor> getMore( const string &ns, long long cursorId, int nToReturn = 0, int options = 0 ) = 0;
- };
-
- /**
- DB "commands"
- Basically just invocations of connection.$cmd.findOne({...});
- */
- class DBClientWithCommands : public DBClientInterface {
- set<string> _seenIndexes;
- public:
- /** controls how chatty the client is about network errors & such. See log.h */
- int _logLevel;
-
- DBClientWithCommands() : _logLevel(0), _cachedAvailableOptions( (enum QueryOptions)0 ), _haveCachedAvailableOptions(false) { }
-
- /** helper function. run a simple command where the command expression is simply
- { command : 1 }
- @param info -- where to put result object. may be null if caller doesn't need that info
- @param command -- command name
- @return true if the command returned "ok".
- */
- bool simpleCommand(const string &dbname, BSONObj *info, const string &command);
-
- /** Run a database command. Database commands are represented as BSON objects. Common database
- commands have prebuilt helper functions -- see below. If a helper is not available you can
- directly call runCommand.
-
- @param dbname database name. Use "admin" for global administrative commands.
- @param cmd the command object to execute. For example, { ismaster : 1 }
- @param info the result object the database returns. Typically has { ok : ..., errmsg : ... } fields
- set.
- @param options see enum QueryOptions - normally not needed to run a command
- @return true if the command returned "ok".
- */
- virtual bool runCommand(const string &dbname, const BSONObj& cmd, BSONObj &info, int options=0);
-
- /** Authorize access to a particular database.
- Authentication is separate for each database on the server -- you may authenticate for any
- number of databases on a single connection.
- The "admin" database is special and once authenticated provides access to all databases on the
- server.
- @param digestPassword if password is plain text, set this to true. otherwise assumed to be pre-digested
- @param[out] authLevel level of authentication for the given user
- @return true if successful
- */
- virtual bool auth(const string &dbname, const string &username, const string &pwd, string& errmsg, bool digestPassword = true, Auth::Level * level = NULL);
-
- /** count number of objects in collection ns that match the query criteria specified
- throws UserAssertion if database returns an error
- */
- virtual unsigned long long count(const string &ns, const BSONObj& query = BSONObj(), int options=0, int limit=0, int skip=0 );
-
- string createPasswordDigest( const string &username , const string &clearTextPassword );
-
- /** returns true in isMaster parm if this db is the current master
- of a replica pair.
-
- pass in info for more details e.g.:
- { "ismaster" : 1.0 , "msg" : "not paired" , "ok" : 1.0 }
-
- returns true if command invoked successfully.
- */
- virtual bool isMaster(bool& isMaster, BSONObj *info=0);
-
- /**
- Create a new collection in the database. Normally, collection creation is automatic. You would
- use this function if you wish to specify special options on creation.
-
- If the collection already exists, no action occurs.
-
- @param ns fully qualified collection name
- @param size desired initial extent size for the collection.
- Must be <= 1000000000 for normal collections.
- For fixed size (capped) collections, this size is the total/max size of the
- collection.
- @param capped if true, this is a fixed size collection (where old data rolls out).
- @param max maximum number of objects if capped (optional).
-
- returns true if successful.
- */
- bool createCollection(const string &ns, long long size = 0, bool capped = false, int max = 0, BSONObj *info = 0);
-
- /** Get error result from the last write operation (insert/update/delete) on this connection.
- @return error message text, or empty string if no error.
- */
- string getLastError(bool fsync = false, bool j = false, int w = 0, int wtimeout = 0);
-
- /** Get error result from the last write operation (insert/update/delete) on this connection.
- @return full error object.
-
- If "w" is -1, wait for propagation to majority of nodes.
- If "wtimeout" is 0, the operation will block indefinitely if needed.
- */
- virtual BSONObj getLastErrorDetailed(bool fsync = false, bool j = false, int w = 0, int wtimeout = 0);
-
- /** Can be called with the returned value from getLastErrorDetailed to extract an error string.
- If all you need is the string, just call getLastError() instead.
- */
- static string getLastErrorString( const BSONObj& res );
-
- /** Return the last error which has occurred, even if not the very last operation.
-
- @return { err : <error message>, nPrev : <how_many_ops_back_occurred>, ok : 1 }
-
- result.err will be null if no error has occurred.
- */
- BSONObj getPrevError();
-
- /** Reset the previous error state for this connection (accessed via getLastError and
- getPrevError). Useful when performing several operations at once and then checking
- for an error after attempting all operations.
- */
- bool resetError() { return simpleCommand("admin", 0, "reseterror"); }
-
- /** Delete the specified collection. */
- virtual bool dropCollection( const string &ns ) {
- string db = nsGetDB( ns );
- string coll = nsGetCollection( ns );
- uassert( 10011 , "no collection name", coll.size() );
-
- BSONObj info;
-
- bool res = runCommand( db.c_str() , BSON( "drop" << coll ) , info );
- resetIndexCache();
- return res;
- }
-
- /** Perform a repair and compaction of the specified database. May take a long time to run. Disk space
- must be available equal to the size of the database while repairing.
- */
- bool repairDatabase(const string &dbname, BSONObj *info = 0) {
- return simpleCommand(dbname, info, "repairDatabase");
- }
-
- /** Copy database from one server or name to another server or name.
-
- Generally, you should dropDatabase() first as otherwise the copied information will MERGE
- into whatever data is already present in this database.
-
- For security reasons this function only works when you are authorized to access the "admin" db. However,
- if you have access to said db, you can copy any database from one place to another.
- TODO: this needs enhancement to be more flexible in terms of security.
-
- This method provides a way to "rename" a database by copying it to a new db name and
- location. The copy is "repaired" and compacted.
-
- fromdb database name from which to copy.
- todb database name to copy to.
- fromhost hostname of the database (and optionally, ":port") from which to
- copy the data. copies from self if "".
-
- returns true if successful
- */
- bool copyDatabase(const string &fromdb, const string &todb, const string &fromhost = "", BSONObj *info = 0);
-
- /** The Mongo database provides built-in performance profiling capabilities. Uset setDbProfilingLevel()
- to enable. Profiling information is then written to the system.profile collection, which one can
- then query.
- */
- enum ProfilingLevel {
- ProfileOff = 0,
- ProfileSlow = 1, // log very slow (>100ms) operations
- ProfileAll = 2
-
- };
- bool setDbProfilingLevel(const string &dbname, ProfilingLevel level, BSONObj *info = 0);
- bool getDbProfilingLevel(const string &dbname, ProfilingLevel& level, BSONObj *info = 0);
-
-
- /** This implicitly converts from char*, string, and BSONObj to be an argument to mapreduce
- You shouldn't need to explicitly construct this
- */
- struct MROutput {
- MROutput(const char* collection) : out(BSON("replace" << collection)) {}
- MROutput(const string& collection) : out(BSON("replace" << collection)) {}
- MROutput(const BSONObj& obj) : out(obj) {}
-
- BSONObj out;
- };
- static MROutput MRInline;
-
- /** Run a map/reduce job on the server.
-
- See http://www.mongodb.org/display/DOCS/MapReduce
-
- ns namespace (db+collection name) of input data
- jsmapf javascript map function code
- jsreducef javascript reduce function code.
- query optional query filter for the input
- output either a string collection name or an object representing output type
- if not specified uses inline output type
-
- returns a result object which contains:
- { result : <collection_name>,
- numObjects : <number_of_objects_scanned>,
- timeMillis : <job_time>,
- ok : <1_if_ok>,
- [, err : <errmsg_if_error>]
- }
-
- For example one might call:
- result.getField("ok").trueValue()
- on the result to check if ok.
- */
- BSONObj mapreduce(const string &ns, const string &jsmapf, const string &jsreducef, BSONObj query = BSONObj(), MROutput output = MRInline);
-
- /** Run javascript code on the database server.
- dbname database SavedContext in which the code runs. The javascript variable 'db' will be assigned
- to this database when the function is invoked.
- jscode source code for a javascript function.
- info the command object which contains any information on the invocation result including
- the return value and other information. If an error occurs running the jscode, error
- information will be in info. (try "out() << info.toString()")
- retValue return value from the jscode function.
- args args to pass to the jscode function. when invoked, the 'args' variable will be defined
- for use by the jscode.
-
- returns true if runs ok.
-
- See testDbEval() in dbclient.cpp for an example of usage.
- */
- bool eval(const string &dbname, const string &jscode, BSONObj& info, BSONElement& retValue, BSONObj *args = 0);
-
- /** validate a collection, checking for errors and reporting back statistics.
- this operation is slow and blocking.
- */
- bool validate( const string &ns , bool scandata=true ) {
- BSONObj cmd = BSON( "validate" << nsGetCollection( ns ) << "scandata" << scandata );
- BSONObj info;
- return runCommand( nsGetDB( ns ).c_str() , cmd , info );
- }
-
- /* The following helpers are simply more convenient forms of eval() for certain common cases */
-
- /* invocation with no return value of interest -- with or without one simple parameter */
- bool eval(const string &dbname, const string &jscode);
- template< class T >
- bool eval(const string &dbname, const string &jscode, T parm1) {
- BSONObj info;
- BSONElement retValue;
- BSONObjBuilder b;
- b.append("0", parm1);
- BSONObj args = b.done();
- return eval(dbname, jscode, info, retValue, &args);
- }
-
- /** eval invocation with one parm to server and one numeric field (either int or double) returned */
- template< class T, class NumType >
- bool eval(const string &dbname, const string &jscode, T parm1, NumType& ret) {
- BSONObj info;
- BSONElement retValue;
- BSONObjBuilder b;
- b.append("0", parm1);
- BSONObj args = b.done();
- if ( !eval(dbname, jscode, info, retValue, &args) )
- return false;
- ret = (NumType) retValue.number();
- return true;
- }
-
- /**
- get a list of all the current databases
- uses the { listDatabases : 1 } command.
- throws on error
- */
- list<string> getDatabaseNames();
-
- /**
- get a list of all the current collections in db
- */
- list<string> getCollectionNames( const string& db );
-
- bool exists( const string& ns );
-
- /** Create an index if it does not already exist.
- ensureIndex calls are remembered so it is safe/fast to call this function many
- times in your code.
- @param ns collection to be indexed
- @param keys the "key pattern" for the index. e.g., { name : 1 }
- @param unique if true, indicates that key uniqueness should be enforced for this index
- @param name if not specified, it will be created from the keys automatically (which is recommended)
- @param cache if set to false, the index cache for the connection won't remember this call
- @param background build index in the background (see mongodb docs/wiki for details)
- @param v index version. leave at default value. (unit tests set this parameter.)
- @return whether or not sent message to db.
- should be true on first call, false on subsequent unless resetIndexCache was called
- */
- virtual bool ensureIndex( const string &ns , BSONObj keys , bool unique = false, const string &name = "",
- bool cache = true, bool background = false, int v = -1 );
-
- /**
- clears the index cache, so the subsequent call to ensureIndex for any index will go to the server
- */
- virtual void resetIndexCache();
-
- virtual auto_ptr<DBClientCursor> getIndexes( const string &ns );
-
- virtual void dropIndex( const string& ns , BSONObj keys );
- virtual void dropIndex( const string& ns , const string& indexName );
-
- /**
- drops all indexes for the collection
- */
- virtual void dropIndexes( const string& ns );
-
- virtual void reIndex( const string& ns );
-
- string genIndexName( const BSONObj& keys );
-
- /** Erase / drop an entire database */
- virtual bool dropDatabase(const string &dbname, BSONObj *info = 0) {
- bool ret = simpleCommand(dbname, info, "dropDatabase");
- resetIndexCache();
- return ret;
- }
-
- virtual string toString() = 0;
-
- protected:
- /** if the result of a command is ok*/
- bool isOk(const BSONObj&);
-
- /** if the element contains a not master error */
- bool isNotMasterErrorString( const BSONElement& e );
-
- BSONObj _countCmd(const string &ns, const BSONObj& query, int options, int limit, int skip );
-
- /**
- * Look up the options available on this client. Caches the answer from
- * _lookupAvailableOptions(), below.
- */
- QueryOptions availableOptions();
-
- virtual QueryOptions _lookupAvailableOptions();
-
- private:
- enum QueryOptions _cachedAvailableOptions;
- bool _haveCachedAvailableOptions;
- };
-
- /**
- abstract class that implements the core db operations
- */
- class DBClientBase : public DBClientWithCommands, public DBConnector {
- protected:
- WriteConcern _writeConcern;
-
- public:
- DBClientBase() {
- _writeConcern = W_NORMAL;
- }
-
- WriteConcern getWriteConcern() const { return _writeConcern; }
- void setWriteConcern( WriteConcern w ) { _writeConcern = w; }
-
- /** send a query to the database.
- @param ns namespace to query, format is <dbname>.<collectname>[.<collectname>]*
- @param query query to perform on the collection. this is a BSONObj (binary JSON)
- You may format as
- { query: { ... }, orderby: { ... } }
- to specify a sort order.
- @param nToReturn n to return (i.e., limit). 0 = unlimited
- @param nToSkip start with the nth item
- @param fieldsToReturn optional template of which fields to select. if unspecified, returns all fields
- @param queryOptions see options enum at top of this file
-
- @return cursor. 0 if error (connection failure)
- @throws AssertionException
- */
- virtual auto_ptr<DBClientCursor> query(const string &ns, Query query, int nToReturn = 0, int nToSkip = 0,
- const BSONObj *fieldsToReturn = 0, int queryOptions = 0 , int batchSize = 0 );
-
-
- /** Uses QueryOption_Exhaust, when available.
-
- Exhaust mode sends back all data queries as fast as possible, with no back-and-forth for
- OP_GETMORE. If you are certain you will exhaust the query, it could be useful.
-
- Use the DBClientCursorBatchIterator version, below, if you want to do items in large
- blocks, perhaps to avoid granular locking and such.
- */
- virtual unsigned long long query( boost::function<void(const BSONObj&)> f,
- const string& ns,
- Query query,
- const BSONObj *fieldsToReturn = 0,
- int queryOptions = 0 );
-
- virtual unsigned long long query( boost::function<void(DBClientCursorBatchIterator&)> f,
- const string& ns,
- Query query,
- const BSONObj *fieldsToReturn = 0,
- int queryOptions = 0 );
-
-
- /** don't use this - called automatically by DBClientCursor for you
- @param cursorId id of cursor to retrieve
- @return an handle to a previously allocated cursor
- @throws AssertionException
- */
- virtual auto_ptr<DBClientCursor> getMore( const string &ns, long long cursorId, int nToReturn = 0, int options = 0 );
-
- /**
- insert an object into the database
- */
- virtual void insert( const string &ns , BSONObj obj , int flags=0);
-
- /**
- insert a vector of objects into the database
- */
- virtual void insert( const string &ns, const vector< BSONObj >& v , int flags=0);
-
- /**
- remove matching objects from the database
- @param justOne if this true, then once a single match is found will stop
- */
- virtual void remove( const string &ns , Query q , bool justOne = 0 );
-
- /**
- updates objects matching query
- */
- virtual void update( const string &ns , Query query , BSONObj obj , bool upsert = false , bool multi = false );
-
- virtual bool isFailed() const = 0;
-
- virtual void killCursor( long long cursorID ) = 0;
-
- virtual bool callRead( Message& toSend , Message& response ) = 0;
- // virtual bool callWrite( Message& toSend , Message& response ) = 0; // TODO: add this if needed
-
- virtual ConnectionString::ConnectionType type() const = 0;
-
- virtual double getSoTimeout() const = 0;
-
- }; // DBClientBase
-
- class DBClientReplicaSet;
-
- class ConnectException : public UserException {
- public:
- ConnectException(string msg) : UserException(9000,msg) { }
- };
-
- /**
- A basic connection to the database.
- This is the main entry point for talking to a simple Mongo setup
- */
- class DBClientConnection : public DBClientBase {
- public:
- using DBClientBase::query;
-
- /**
- @param _autoReconnect if true, automatically reconnect on a connection failure
- @param cp used by DBClientReplicaSet. You do not need to specify this parameter
- @param timeout tcp timeout in seconds - this is for read/write, not connect.
- Connect timeout is fixed, but short, at 5 seconds.
- */
- DBClientConnection(bool _autoReconnect=false, DBClientReplicaSet* cp=0, double so_timeout=0) :
- clientSet(cp), _failed(false), autoReconnect(_autoReconnect), lastReconnectTry(0), _so_timeout(so_timeout) {
- _numConnections++;
- }
-
- virtual ~DBClientConnection() {
- _numConnections--;
- }
-
- /** Connect to a Mongo database server.
-
- If autoReconnect is true, you can try to use the DBClientConnection even when
- false was returned -- it will try to connect again.
-
- @param serverHostname host to connect to. can include port number ( 127.0.0.1 , 127.0.0.1:5555 )
- If you use IPv6 you must add a port number ( ::1:27017 )
- @param errmsg any relevant error message will appended to the string
- @deprecated please use HostAndPort
- @return false if fails to connect.
- */
- virtual bool connect(const char * hostname, string& errmsg) {
- // TODO: remove this method
- HostAndPort t( hostname );
- return connect( t , errmsg );
- }
-
- /** Connect to a Mongo database server.
-
- If autoReconnect is true, you can try to use the DBClientConnection even when
- false was returned -- it will try to connect again.
-
- @param server server to connect to.
- @param errmsg any relevant error message will appended to the string
- @return false if fails to connect.
- */
- virtual bool connect(const HostAndPort& server, string& errmsg);
-
- /** Connect to a Mongo database server. Exception throwing version.
- Throws a UserException if cannot connect.
-
- If autoReconnect is true, you can try to use the DBClientConnection even when
- false was returned -- it will try to connect again.
-
- @param serverHostname host to connect to. can include port number ( 127.0.0.1 , 127.0.0.1:5555 )
- */
- void connect(const string& serverHostname) {
- string errmsg;
- if( !connect(HostAndPort(serverHostname), errmsg) )
- throw ConnectException(string("can't connect ") + errmsg);
- }
-
- virtual bool auth(const string &dbname, const string &username, const string &pwd, string& errmsg, bool digestPassword = true, Auth::Level* level=NULL);
-
- virtual auto_ptr<DBClientCursor> query(const string &ns, Query query=Query(), int nToReturn = 0, int nToSkip = 0,
- const BSONObj *fieldsToReturn = 0, int queryOptions = 0 , int batchSize = 0 ) {
- checkConnection();
- return DBClientBase::query( ns, query, nToReturn, nToSkip, fieldsToReturn, queryOptions , batchSize );
- }
-
- virtual unsigned long long query( boost::function<void(DBClientCursorBatchIterator &)> f,
- const string& ns,
- Query query,
- const BSONObj *fieldsToReturn,
- int queryOptions );
-
- virtual bool runCommand(const string &dbname, const BSONObj& cmd, BSONObj &info, int options=0);
-
- /**
- @return true if this connection is currently in a failed state. When autoreconnect is on,
- a connection will transition back to an ok state after reconnecting.
- */
- bool isFailed() const { return _failed; }
-
- MessagingPort& port() { assert(p); return *p; }
-
- string toStringLong() const {
- stringstream ss;
- ss << _serverString;
- if ( _failed ) ss << " failed";
- return ss.str();
- }
-
- /** Returns the address of the server */
- string toString() { return _serverString; }
-
- string getServerAddress() const { return _serverString; }
-
- virtual void killCursor( long long cursorID );
- virtual bool callRead( Message& toSend , Message& response ) { return call( toSend , response ); }
- virtual void say( Message &toSend, bool isRetry = false , string * actualServer = 0 );
- virtual bool recv( Message& m );
- virtual void checkResponse( const char *data, int nReturned, bool* retry = NULL, string* host = NULL );
- virtual bool call( Message &toSend, Message &response, bool assertOk = true , string * actualServer = 0 );
- virtual ConnectionString::ConnectionType type() const { return ConnectionString::MASTER; }
- void setSoTimeout(double to) { _so_timeout = to; }
- double getSoTimeout() const { return _so_timeout; }
-
- virtual bool lazySupported() const { return true; }
-
- static int getNumConnections() {
- return _numConnections;
- }
-
- static void setLazyKillCursor( bool lazy ) { _lazyKillCursor = lazy; }
- static bool getLazyKillCursor() { return _lazyKillCursor; }
-
- protected:
- friend class SyncClusterConnection;
- virtual void sayPiggyBack( Message &toSend );
-
- DBClientReplicaSet *clientSet;
- boost::scoped_ptr<MessagingPort> p;
- boost::scoped_ptr<SockAddr> server;
- bool _failed;
- const bool autoReconnect;
- time_t lastReconnectTry;
- HostAndPort _server; // remember for reconnects
- string _serverString;
- void _checkConnection();
-
- // throws SocketException if in failed state and not reconnecting or if waiting to reconnect
- void checkConnection() { if( _failed ) _checkConnection(); }
-
- map< string, pair<string,string> > authCache;
- double _so_timeout;
- bool _connect( string& errmsg );
-
- static AtomicUInt _numConnections;
- static bool _lazyKillCursor; // lazy means we piggy back kill cursors on next op
-
-#ifdef MONGO_SSL
- static SSLManager* sslManager();
- static SSLManager* _sslManager;
-#endif
- };
-
- /** pings server to check if it's up
- */
- bool serverAlive( const string &uri );
-
- DBClientBase * createDirectClient();
-
- BSONElement getErrField( const BSONObj& result );
- bool hasErrField( const BSONObj& result );
-
- inline std::ostream& operator<<( std::ostream &s, const Query &q ) {
- return s << q.toString();
- }
-
-} // namespace mongo
-
-#include "dbclientcursor.h"
-#include "dbclient_rs.h"
-#include "undef_macros.h"
+#include "mongo/client/undef_macros.h"
diff --git a/src/mongo/client/dbclient_rs.cpp b/src/mongo/client/dbclient_rs.cpp
index 3cfbc82137f..ba69ca337c8 100644
--- a/src/mongo/client/dbclient_rs.cpp
+++ b/src/mongo/client/dbclient_rs.cpp
@@ -15,18 +15,22 @@
* limitations under the License.
*/
-#include "pch.h"
-#include "dbclient.h"
-#include "../bson/util/builder.h"
-#include "../db/jsobj.h"
-#include "../db/json.h"
-#include "../db/dbmessage.h"
-#include "connpool.h"
-#include "dbclient_rs.h"
-#include "../util/background.h"
-#include "../util/timer.h"
+#include "mongo/pch.h"
+
+#include "mongo/client/dbclient_rs.h"
+
#include <fstream>
+#include "mongo/bson/util/builder.h"
+#include "mongo/client/connpool.h"
+#include "mongo/client/dbclient.h"
+#include "mongo/client/dbclientcursor.h"
+#include "mongo/db/dbmessage.h"
+#include "mongo/db/jsobj.h"
+#include "mongo/db/json.h"
+#include "mongo/util/background.h"
+#include "mongo/util/timer.h"
+
namespace mongo {
// --------------------------------
diff --git a/src/mongo/client/dbclient_rs.h b/src/mongo/client/dbclient_rs.h
index 8baffe941b2..6d415e5ab27 100644
--- a/src/mongo/client/dbclient_rs.h
+++ b/src/mongo/client/dbclient_rs.h
@@ -17,8 +17,15 @@
#pragma once
-#include "../pch.h"
-#include "dbclient.h"
+#include "mongo/pch.h"
+
+#include <boost/function.hpp>
+#include <boost/shared_ptr.hpp>
+#include <set>
+#include <utility>
+
+#include "mongo/client/dbclientinterface.h"
+#include "mongo/util/net/hostandport.h"
namespace mongo {
diff --git a/src/mongo/client/dbclientcursor.cpp b/src/mongo/client/dbclientcursor.cpp
index dcf86818dc6..0f7a4e3ae2c 100644
--- a/src/mongo/client/dbclientcursor.cpp
+++ b/src/mongo/client/dbclientcursor.cpp
@@ -15,13 +15,16 @@
* limitations under the License.
*/
-#include "pch.h"
-#include "dbclient.h"
-#include "../db/dbmessage.h"
-#include "../db/cmdline.h"
-#include "connpool.h"
-#include "../s/shard.h"
-#include "../s/util.h"
+#include "mongo/pch.h"
+
+#include "mongo/client/dbclientcursor.h"
+
+#include "mongo/client/connpool.h"
+#include "mongo/client/dbclient.h"
+#include "mongo/db/cmdline.h"
+#include "mongo/db/dbmessage.h"
+#include "mongo/s/shard.h"
+#include "mongo/s/util.h"
namespace mongo {
diff --git a/src/mongo/client/dbclientcursor.h b/src/mongo/client/dbclientcursor.h
index d7661438516..4f2ff2c7916 100644
--- a/src/mongo/client/dbclientcursor.h
+++ b/src/mongo/client/dbclientcursor.h
@@ -17,12 +17,16 @@
#pragma once
-#include "../pch.h"
-#include "../util/net/message.h"
-#include "../db/jsobj.h"
-#include "../db/json.h"
+#include "mongo/pch.h"
+
#include <stack>
+#include "mongo/client/dbclientinterface.h"
+#include "mongo/db/jsobj.h"
+#include "mongo/db/json.h"
+#include "mongo/util/assert_util.h"
+#include "mongo/util/net/message.h"
+
namespace mongo {
class AScopedConnection;
diff --git a/src/mongo/client/dbclientinterface.h b/src/mongo/client/dbclientinterface.h
new file mode 100644
index 00000000000..77d6a39c4e8
--- /dev/null
+++ b/src/mongo/client/dbclientinterface.h
@@ -0,0 +1,1056 @@
+/** @file dbclientinterface.h
+
+ Core MongoDB C++ driver interfaces are defined here.
+*/
+
+/* Copyright 2009 10gen Inc.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+#pragma once
+
+#include "mongo/pch.h"
+
+#include "mongo/db/authlevel.h"
+#include "mongo/db/jsobj.h"
+#include "mongo/util/net/message.h"
+#include "mongo/util/net/message_port.h"
+
+namespace mongo {
+
+ /** the query field 'options' can have these bits set: */
+ enum QueryOptions {
+ /** Tailable means cursor is not closed when the last data is retrieved. rather, the cursor marks
+ the final object's position. you can resume using the cursor later, from where it was located,
+ if more data were received. Set on dbQuery and dbGetMore.
+
+ like any "latent cursor", the cursor may become invalid at some point -- for example if that
+ final object it references were deleted. Thus, you should be prepared to requery if you get back
+ ResultFlag_CursorNotFound.
+ */
+ QueryOption_CursorTailable = 1 << 1,
+
+ /** allow query of replica slave. normally these return an error except for namespace "local".
+ */
+ QueryOption_SlaveOk = 1 << 2,
+
+ // findingStart mode is used to find the first operation of interest when
+ // we are scanning through a repl log. For efficiency in the common case,
+ // where the first operation of interest is closer to the tail than the head,
+ // we start from the tail of the log and work backwards until we find the
+ // first operation of interest. Then we scan forward from that first operation,
+ // actually returning results to the client. During the findingStart phase,
+ // we release the db mutex occasionally to avoid blocking the db process for
+ // an extended period of time.
+ QueryOption_OplogReplay = 1 << 3,
+
+ /** The server normally times out idle cursors after an inactivity period to prevent excess memory use.
+ Set this option to prevent that.
+ */
+ QueryOption_NoCursorTimeout = 1 << 4,
+
+ /** Use with QueryOption_CursorTailable. If we are at the end of the data, block for a while rather
+ than returning no data. After a timeout period, we do return as normal.
+ */
+ QueryOption_AwaitData = 1 << 5,
+
+ /** Stream the data down full blast in multiple "more" packages, on the assumption that the client
+ will fully read all data queried. Faster when you are pulling a lot of data and know you want to
+ pull it all down. Note: it is not allowed to not read all the data unless you close the connection.
+
+ Use the query( boost::function<void(const BSONObj&)> f, ... ) version of the connection's query()
+ method, and it will take care of all the details for you.
+ */
+ QueryOption_Exhaust = 1 << 6,
+
+ /** When sharded, this means it's ok to return partial results
+ Usually we will fail a query if all required shards aren't up
+ If this is set, it'll be a partial result set
+ */
+ QueryOption_PartialResults = 1 << 7 ,
+
+ QueryOption_AllSupported = QueryOption_CursorTailable | QueryOption_SlaveOk | QueryOption_OplogReplay | QueryOption_NoCursorTimeout | QueryOption_AwaitData | QueryOption_Exhaust | QueryOption_PartialResults
+
+ };
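+
+ /* A minimal sketch of using these option bits (illustrative only -- it assumes
+ a connected DBClientConnection "conn", a capped collection "local.log", and
+ that dbclientcursor.h is included for cursor iteration):
+
+ auto_ptr<DBClientCursor> c = conn.query( "local.log", Query(), 0, 0, 0,
+ QueryOption_CursorTailable | QueryOption_AwaitData );
+ while ( c->more() )
+ cout << c->next().toString() << endl;
+ */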
+
+ enum UpdateOptions {
+ /** Upsert - that is, insert the item if no matching item is found. */
+ UpdateOption_Upsert = 1 << 0,
+
+ /** Update multiple documents (if multiple documents match query expression).
+ (Default is update a single document and stop.) */
+ UpdateOption_Multi = 1 << 1,
+
+ /** flag from mongo saying this update went everywhere */
+ UpdateOption_Broadcast = 1 << 2
+ };
+
+ enum RemoveOptions {
+ /** only delete one matching document */
+ RemoveOption_JustOne = 1 << 0,
+
+ /** flag from mongo saying this remove went everywhere */
+ RemoveOption_Broadcast = 1 << 1
+ };
+
+
+ /**
+ * need to put in DbMessage::ReservedOptions as well
+ */
+ enum InsertOptions {
+ /** With multi-insert, keep processing inserts if one fails */
+ InsertOption_ContinueOnError = 1 << 0
+ };
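+
+ /* Sketch of the write flags above (illustrative; assumes a connected
+ DBClientConnection "conn" and the usual unique _id index on "test.c"):
+
+ vector<BSONObj> docs;
+ docs.push_back( BSON( "_id" << 1 ) );
+ docs.push_back( BSON( "_id" << 1 ) ); // duplicate key -- this insert fails
+ docs.push_back( BSON( "_id" << 2 ) );
+ // without the flag the batch stops at the duplicate; with it, _id:2 is still inserted
+ conn.insert( "test.c", docs, InsertOption_ContinueOnError );
+ */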
+
+ class DBClientBase;
+
+ /**
+ * ConnectionString handles parsing different ways to connect to mongo and determining the connection type
+ * samples:
+ * server
+ * server:port
+ * foo/server:port,server:port SET
+ * server,server,server SYNC
+ *
+ * typical use:
+ * string errmsg;
+ * ConnectionString cs = ConnectionString::parse( url , errmsg );
+ * if ( ! cs.isValid() ) throw "bad: " + errmsg;
+ * DBClientBase * conn = cs.connect( errmsg );
+ */
+ class ConnectionString {
+ public:
+ enum ConnectionType { INVALID , MASTER , PAIR , SET , SYNC };
+
+ ConnectionString() {
+ _type = INVALID;
+ }
+
+ ConnectionString( const HostAndPort& server ) {
+ _type = MASTER;
+ _servers.push_back( server );
+ _finishInit();
+ }
+
+ ConnectionString( ConnectionType type , const string& s , const string& setName = "" ) {
+ _type = type;
+ _setName = setName;
+ _fillServers( s );
+
+ switch ( _type ) {
+ case MASTER:
+ assert( _servers.size() == 1 );
+ break;
+ case SET:
+ assert( _setName.size() );
+ assert( _servers.size() >= 1 ); // 1 is ok since we can derive
+ break;
+ case PAIR:
+ assert( _servers.size() == 2 );
+ break;
+ default:
+ assert( _servers.size() > 0 );
+ }
+
+ _finishInit();
+ }
+
+ ConnectionString( const string& s , ConnectionType favoredMultipleType ) {
+ _type = INVALID;
+
+ _fillServers( s );
+ if ( _type != INVALID ) {
+ // set already
+ }
+ else if ( _servers.size() == 1 ) {
+ _type = MASTER;
+ }
+ else {
+ _type = favoredMultipleType;
+ assert( _type == SET || _type == SYNC );
+ }
+ _finishInit();
+ }
+
+ bool isValid() const { return _type != INVALID; }
+
+ string toString() const { return _string; }
+
+ DBClientBase* connect( string& errmsg, double socketTimeout = 0 ) const;
+
+ string getSetName() const { return _setName; }
+
+ vector<HostAndPort> getServers() const { return _servers; }
+
+ ConnectionType type() const { return _type; }
+
+ static ConnectionString parse( const string& url , string& errmsg );
+
+ static string typeToString( ConnectionType type );
+
+ private:
+
+ void _fillServers( string s );
+ void _finishInit();
+
+ ConnectionType _type;
+ vector<HostAndPort> _servers;
+ string _string;
+ string _setName;
+ };
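+
+ /* Expanded form of the "typical use" shown above (illustrative; the url and
+ the error handling are placeholders):
+
+ string errmsg;
+ ConnectionString cs = ConnectionString::parse( "foo/a.example.com:27017,b.example.com:27017", errmsg );
+ if ( !cs.isValid() ) {
+ cout << "bad url: " << errmsg << endl;
+ }
+ else {
+ DBClientBase * conn = cs.connect( errmsg ); // "foo/..." parses as type SET
+ if ( ! conn )
+ cout << "connect failed: " << errmsg << endl;
+ }
+ */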
+
+ /**
+ * controls how much a client cares about writes
+ * default is NORMAL
+ */
+ enum WriteConcern {
+ W_NONE = 0 , // TODO: not every connection type fully supports this
+ W_NORMAL = 1
+ // TODO SAFE = 2
+ };
+
+ class BSONObj;
+ class ScopedDbConnection;
+ class DBClientCursor;
+ class DBClientCursorBatchIterator;
+
+ /** Represents a Mongo query expression. Typically one uses the QUERY(...) macro to construct a Query object.
+ Examples:
+ QUERY( "age" << 33 << "school" << "UCLA" ).sort("name")
+ QUERY( "age" << GT << 30 << LT << 50 )
+ */
+ class Query {
+ public:
+ BSONObj obj;
+ Query() : obj(BSONObj()) { }
+ Query(const BSONObj& b) : obj(b) { }
+ Query(const string &json);
+ Query(const char * json);
+
+ /** Add a sort (ORDER BY) criteria to the query expression.
+ @param sortPattern the sort order template. For example to order by name ascending, time descending:
+ { name : 1, ts : -1 }
+ i.e.
+ BSON( "name" << 1 << "ts" << -1 )
+ or
+ fromjson(" name : 1, ts : -1 ")
+ */
+ Query& sort(const BSONObj& sortPattern);
+
+ /** Add a sort (ORDER BY) criteria to the query expression.
+ This version of sort() assumes you want to sort on a single field.
+ @param asc = 1 for ascending order
+ asc = -1 for descending order
+ */
+ Query& sort(const string &field, int asc = 1) { sort( BSON( field << asc ) ); return *this; }
+
+ /** Provide a hint to the query.
+ @param keyPattern Key pattern for the index to use.
+ Example:
+ hint("{ts:1}")
+ */
+ Query& hint(BSONObj keyPattern);
+ Query& hint(const string &jsonKeyPatt);
+
+ /** Provide min and/or max index limits for the query.
+ min <= x < max
+ */
+ Query& minKey(const BSONObj &val);
+ /**
+ max is exclusive
+ */
+ Query& maxKey(const BSONObj &val);
+
+ /** Return explain information about execution of this query instead of the actual query results.
+ Normally it is easier to use the mongo shell to run db.find(...).explain().
+ */
+ Query& explain();
+
+ /** Use snapshot mode for the query. Snapshot mode assures no duplicates are returned, or objects missed, which were
+ present at both the start and end of the query's execution (if an object is new during the query, or deleted during
+ the query, it may or may not be returned, even with snapshot mode).
+
+ Note that short query responses (less than 1MB) are always effectively snapshotted.
+
+ Currently, snapshot mode may not be used with sorting or explicit hints.
+ */
+ Query& snapshot();
+
+ /** Queries to the Mongo database support a $where parameter option which contains
+ a javascript function that is evaluated to see whether objects being queried match
+ its criteria. Use this helper to append such a function to a query object.
+ Your query may also contain other traditional Mongo query terms.
+
+ @param jscode The javascript function to evaluate against each potential object
+ match. The function must return true for matched objects. Use the this
+ variable to inspect the current object.
+ @param scope context for the javascript object. List in a BSON object any
+ variables you would like defined when the jscode executes. One can think
+ of these as "bind variables".
+
+ Examples:
+ conn.findOne("test.coll", Query("{a:3}").where("this.b == 2 || this.c == 3"));
+ Query badBalance = Query().where("this.debits - this.credits < 0");
+ */
+ Query& where(const string &jscode, BSONObj scope);
+ Query& where(const string &jscode) { return where(jscode, BSONObj()); }
+
+ /**
+ * @return true if this query has an orderby, hint, or some other field
+ */
+ bool isComplex( bool * hasDollar = 0 ) const;
+
+ BSONObj getFilter() const;
+ BSONObj getSort() const;
+ BSONObj getHint() const;
+ bool isExplain() const;
+
+ string toString() const;
+ operator string() const { return toString(); }
+ private:
+ void makeComplex();
+ template< class T >
+ void appendComplex( const char *fieldName, const T& val ) {
+ makeComplex();
+ BSONObjBuilder b;
+ b.appendElements(obj);
+ b.append(fieldName, val);
+ obj = b.obj();
+ }
+ };
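+
+ /* Sketch of composing a Query via the chainable modifiers (illustrative):
+
+ Query q = Query( BSON( "age" << 33 ) )
+ .sort( "name" ) // ascending by name
+ .hint( BSON( "age" << 1 ) );
+ // q.obj now holds the complex form { query : {...}, orderby : {...}, ... }
+ */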
+
+ /**
+ * Represents a full query description, including all options required for the query to be passed on
+ * to other hosts
+ */
+ class QuerySpec {
+
+ string _ns;
+ int _ntoskip;
+ int _ntoreturn;
+ int _options;
+ BSONObj _query;
+ BSONObj _fields;
+ Query _queryObj;
+
+ public:
+
+ QuerySpec( const string& ns,
+ const BSONObj& query, const BSONObj& fields,
+ int ntoskip, int ntoreturn, int options )
+ : _ns( ns ), _ntoskip( ntoskip ), _ntoreturn( ntoreturn ), _options( options ),
+ _query( query.getOwned() ), _fields( fields.getOwned() ) , _queryObj( _query ) {
+ }
+
+ QuerySpec() {}
+
+ bool isEmpty() const { return _ns.size() == 0; }
+
+ bool isExplain() const { return _queryObj.isExplain(); }
+ BSONObj filter() const { return _queryObj.getFilter(); }
+
+ BSONObj hint() const { return _queryObj.getHint(); }
+ BSONObj sort() const { return _queryObj.getSort(); }
+ BSONObj query() const { return _query; }
+ BSONObj fields() const { return _fields; }
+ BSONObj* fieldsData() { return &_fields; }
+
+ // don't love this, but needed downstream
+ const BSONObj* fieldsPtr() const { return &_fields; }
+
+ string ns() const { return _ns; }
+ int ntoskip() const { return _ntoskip; }
+ int ntoreturn() const { return _ntoreturn; }
+ int options() const { return _options; }
+
+ void setFields( BSONObj& o ) { _fields = o.getOwned(); }
+
+ string toString() const {
+ return str::stream() << "QSpec " <<
+ BSON( "ns" << _ns << "n2skip" << _ntoskip << "n2return" << _ntoreturn << "options" << _options
+ << "query" << _query << "fields" << _fields );
+ }
+
+ };
+
+
+ /** Typically one uses the QUERY(...) macro to construct a Query object.
+ Example: QUERY( "age" << 33 << "school" << "UCLA" )
+ */
+#define QUERY(x) mongo::Query( BSON(x) )
+
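+ /* The macro in action (illustrative; assumes a connected client "conn"):
+
+ BSONObj doc = conn.findOne( "test.people", QUERY( "age" << 33 << "school" << "UCLA" ) );
+ if ( doc.isEmpty() )
+ cout << "no match" << endl;
+ */
+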
+ // Useful utilities for namespaces
+ /** @return the database name portion of an ns string */
+ string nsGetDB( const string &ns );
+
+ /** @return the collection name portion of an ns string */
+ string nsGetCollection( const string &ns );
+
+ /**
+ interface that handles communication with the db
+ */
+ class DBConnector {
+ public:
+ virtual ~DBConnector() {}
+ /** actualServer is set to the actual server the call went to if there was a choice (SlaveOk) */
+ virtual bool call( Message &toSend, Message &response, bool assertOk=true , string * actualServer = 0 ) = 0;
+ virtual void say( Message &toSend, bool isRetry = false , string * actualServer = 0 ) = 0;
+ virtual void sayPiggyBack( Message &toSend ) = 0;
+ /* used by QueryOption_Exhaust. To use that your subclass must implement this. */
+ virtual bool recv( Message& m ) { assert(false); return false; }
+ // In general, for lazy queries, we'll need to say, recv, then checkResponse
+ virtual void checkResponse( const char* data, int nReturned, bool* retry = NULL, string* targetHost = NULL ) {
+ if( retry ) *retry = false; if( targetHost ) *targetHost = "";
+ }
+ virtual bool lazySupported() const = 0;
+ };
+
+ /**
+ The interface that any db connection should implement
+ */
+ class DBClientInterface : boost::noncopyable {
+ public:
+ virtual auto_ptr<DBClientCursor> query(const string &ns, Query query, int nToReturn = 0, int nToSkip = 0,
+ const BSONObj *fieldsToReturn = 0, int queryOptions = 0 , int batchSize = 0 ) = 0;
+
+ virtual void insert( const string &ns, BSONObj obj , int flags=0) = 0;
+
+ virtual void insert( const string &ns, const vector< BSONObj >& v , int flags=0) = 0;
+
+ virtual void remove( const string &ns , Query query, bool justOne = 0 ) = 0;
+
+ virtual void update( const string &ns , Query query , BSONObj obj , bool upsert = 0 , bool multi = 0 ) = 0;
+
+ virtual ~DBClientInterface() { }
+
+ /**
+ @return a single object that matches the query. if none do, then the object is empty
+ @throws AssertionException
+ */
+ virtual BSONObj findOne(const string &ns, const Query& query, const BSONObj *fieldsToReturn = 0, int queryOptions = 0);
+
+ /** query N objects from the database into an array. makes sense mostly when you want a small number of results. if a huge number, use
+ query() and iterate the cursor.
+ */
+ void findN(vector<BSONObj>& out, const string&ns, Query query, int nToReturn, int nToSkip = 0, const BSONObj *fieldsToReturn = 0, int queryOptions = 0);
+
+ virtual string getServerAddress() const = 0;
+
+ /** don't use this - called automatically by DBClientCursor for you */
+ virtual auto_ptr<DBClientCursor> getMore( const string &ns, long long cursorId, int nToReturn = 0, int options = 0 ) = 0;
+ };
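+
+ /* Sketch of findN (illustrative; "conn" is any concrete implementation of
+ this interface):
+
+ vector<BSONObj> out;
+ conn.findN( out, "test.people", QUERY( "age" << 33 ), 10 );
+ for ( size_t i = 0; i < out.size(); i++ )
+ cout << out[i].toString() << endl;
+ */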
+
+ /**
+ DB "commands"
+ Basically just invocations of connection.$cmd.findOne({...});
+ */
+ class DBClientWithCommands : public DBClientInterface {
+ set<string> _seenIndexes;
+ public:
+ /** controls how chatty the client is about network errors & such. See log.h */
+ int _logLevel;
+
+ DBClientWithCommands() : _logLevel(0), _cachedAvailableOptions( (enum QueryOptions)0 ), _haveCachedAvailableOptions(false) { }
+
+ /** helper function. run a simple command where the command expression is simply
+ { command : 1 }
+ @param info -- where to put result object. may be null if caller doesn't need that info
+ @param command -- command name
+ @return true if the command returned "ok".
+ */
+ bool simpleCommand(const string &dbname, BSONObj *info, const string &command);
+
+ /** Run a database command. Database commands are represented as BSON objects. Common database
+ commands have prebuilt helper functions -- see below. If a helper is not available you can
+ directly call runCommand.
+
+ @param dbname database name. Use "admin" for global administrative commands.
+ @param cmd the command object to execute. For example, { ismaster : 1 }
+ @param info the result object the database returns. Typically has { ok : ..., errmsg : ... } fields
+ set.
+ @param options see enum QueryOptions - normally not needed to run a command
+ @return true if the command returned "ok".
+ */
+ virtual bool runCommand(const string &dbname, const BSONObj& cmd, BSONObj &info, int options=0);
+
+ /** Authorize access to a particular database.
+ Authentication is separate for each database on the server -- you may authenticate for any
+ number of databases on a single connection.
+ The "admin" database is special and once authenticated provides access to all databases on the
+ server.
+ @param digestPassword if password is plain text, set this to true. otherwise assumed to be pre-digested
+ @param[out] level level of authentication for the given user
+ @return true if successful
+ */
+ virtual bool auth(const string &dbname, const string &username, const string &pwd, string& errmsg, bool digestPassword = true, Auth::Level * level = NULL);
+
+ /** count number of objects in collection ns that match the query criteria specified
+ throws UserAssertion if database returns an error
+ */
+ virtual unsigned long long count(const string &ns, const BSONObj& query = BSONObj(), int options=0, int limit=0, int skip=0 );
+
+ string createPasswordDigest( const string &username , const string &clearTextPassword );
+
+ /** returns true in isMaster parm if this db is the current master
+ of a replica pair.
+
+ pass in info for more details e.g.:
+ { "ismaster" : 1.0 , "msg" : "not paired" , "ok" : 1.0 }
+
+ returns true if command invoked successfully.
+ */
+ virtual bool isMaster(bool& isMaster, BSONObj *info=0);
+
+ /**
+ Create a new collection in the database. Normally, collection creation is automatic. You would
+ use this function if you wish to specify special options on creation.
+
+ If the collection already exists, no action occurs.
+
+ @param ns fully qualified collection name
+ @param size desired initial extent size for the collection.
+ Must be <= 1000000000 for normal collections.
+ For fixed size (capped) collections, this size is the total/max size of the
+ collection.
+ @param capped if true, this is a fixed size collection (where old data rolls out).
+ @param max maximum number of objects if capped (optional).
+
+ returns true if successful.
+ */
+ bool createCollection(const string &ns, long long size = 0, bool capped = false, int max = 0, BSONObj *info = 0);
+
+ /** Get error result from the last write operation (insert/update/delete) on this connection.
+ @return error message text, or empty string if no error.
+ */
+ string getLastError(bool fsync = false, bool j = false, int w = 0, int wtimeout = 0);
+
+ /** Get error result from the last write operation (insert/update/delete) on this connection.
+ @return full error object.
+
+ If "w" is -1, wait for propagation to majority of nodes.
+ If "wtimeout" is 0, the operation will block indefinitely if needed.
+ */
+ virtual BSONObj getLastErrorDetailed(bool fsync = false, bool j = false, int w = 0, int wtimeout = 0);
+
+ /** Can be called with the returned value from getLastErrorDetailed to extract an error string.
+ If all you need is the string, just call getLastError() instead.
+ */
+ static string getLastErrorString( const BSONObj& res );
+
+ /** Return the last error which has occurred, even if not the very last operation.
+
+ @return { err : <error message>, nPrev : <how_many_ops_back_occurred>, ok : 1 }
+
+ result.err will be null if no error has occurred.
+ */
+ BSONObj getPrevError();
+
+ /** Reset the previous error state for this connection (accessed via getLastError and
+ getPrevError). Useful when performing several operations at once and then checking
+ for an error after attempting all operations.
+ */
+ bool resetError() { return simpleCommand("admin", 0, "reseterror"); }
+
+ /** Delete the specified collection. */
+ virtual bool dropCollection( const string &ns ) {
+ string db = nsGetDB( ns );
+ string coll = nsGetCollection( ns );
+ uassert( 10011 , "no collection name", coll.size() );
+
+ BSONObj info;
+
+ bool res = runCommand( db.c_str() , BSON( "drop" << coll ) , info );
+ resetIndexCache();
+ return res;
+ }
+
+ /** Perform a repair and compaction of the specified database. May take a long time to run. Disk space
+ must be available equal to the size of the database while repairing.
+ */
+ bool repairDatabase(const string &dbname, BSONObj *info = 0) {
+ return simpleCommand(dbname, info, "repairDatabase");
+ }
+
+ /** Copy database from one server or name to another server or name.
+
+ Generally, you should dropDatabase() first as otherwise the copied information will MERGE
+ into whatever data is already present in this database.
+
+ For security reasons this function only works when you are authorized to access the "admin" db. However,
+ if you have access to said db, you can copy any database from one place to another.
+ TODO: this needs enhancement to be more flexible in terms of security.
+
+ This method provides a way to "rename" a database by copying it to a new db name and
+ location. The copy is "repaired" and compacted.
+
+ fromdb database name from which to copy.
+ todb database name to copy to.
+ fromhost hostname of the database (and optionally, ":port") from which to
+ copy the data. copies from self if "".
+
+ returns true if successful
+ */
+ bool copyDatabase(const string &fromdb, const string &todb, const string &fromhost = "", BSONObj *info = 0);
+
+ /** The Mongo database provides built-in performance profiling capabilities. Use setDbProfilingLevel()
+ to enable. Profiling information is then written to the system.profile collection, which one can
+ then query.
+ */
+ enum ProfilingLevel {
+ ProfileOff = 0,
+ ProfileSlow = 1, // log very slow (>100ms) operations
+ ProfileAll = 2
+
+ };
+ bool setDbProfilingLevel(const string &dbname, ProfilingLevel level, BSONObj *info = 0);
+ bool getDbProfilingLevel(const string &dbname, ProfilingLevel& level, BSONObj *info = 0);
+
+
+ /** This implicitly converts from char*, string, and BSONObj to be an argument to mapreduce
+ You shouldn't need to explicitly construct this
+ */
+ struct MROutput {
+ MROutput(const char* collection) : out(BSON("replace" << collection)) {}
+ MROutput(const string& collection) : out(BSON("replace" << collection)) {}
+ MROutput(const BSONObj& obj) : out(obj) {}
+
+ BSONObj out;
+ };
+ static MROutput MRInline;
+
+ /** Run a map/reduce job on the server.
+
+ See http://www.mongodb.org/display/DOCS/MapReduce
+
+ ns namespace (db+collection name) of input data
+ jsmapf javascript map function code
+ jsreducef javascript reduce function code.
+ query optional query filter for the input
+ output either a string collection name or an object representing output type
+ if not specified uses inline output type
+
+ returns a result object which contains:
+ { result : <collection_name>,
+ numObjects : <number_of_objects_scanned>,
+ timeMillis : <job_time>,
+ ok : <1_if_ok>,
+ [, err : <errmsg_if_error>]
+ }
+
+ For example one might call:
+ result.getField("ok").trueValue()
+ on the result to check if ok.
+ */
+ BSONObj mapreduce(const string &ns, const string &jsmapf, const string &jsreducef, BSONObj query = BSONObj(), MROutput output = MRInline);
+
+ /** Run javascript code on the database server.
+ dbname database context in which the code runs. The javascript variable 'db' will be assigned
+ to this database when the function is invoked.
+ jscode source code for a javascript function.
+ info the command object which contains any information on the invocation result including
+ the return value and other information. If an error occurs running the jscode, error
+ information will be in info. (try "out() << info.toString()")
+ retValue return value from the jscode function.
+ args args to pass to the jscode function. when invoked, the 'args' variable will be defined
+ for use by the jscode.
+
+ returns true if runs ok.
+
+ See testDbEval() in dbclient.cpp for an example of usage.
+ */
+ bool eval(const string &dbname, const string &jscode, BSONObj& info, BSONElement& retValue, BSONObj *args = 0);
+
+ /** validate a collection, checking for errors and reporting back statistics.
+ this operation is slow and blocking.
+ */
+ bool validate( const string &ns , bool scandata=true ) {
+ BSONObj cmd = BSON( "validate" << nsGetCollection( ns ) << "scandata" << scandata );
+ BSONObj info;
+ return runCommand( nsGetDB( ns ).c_str() , cmd , info );
+ }
+
+ /* The following helpers are simply more convenient forms of eval() for certain common cases */
+
+ /* invocation with no return value of interest -- with or without one simple parameter */
+ bool eval(const string &dbname, const string &jscode);
+ template< class T >
+ bool eval(const string &dbname, const string &jscode, T parm1) {
+ BSONObj info;
+ BSONElement retValue;
+ BSONObjBuilder b;
+ b.append("0", parm1);
+ BSONObj args = b.done();
+ return eval(dbname, jscode, info, retValue, &args);
+ }
+
+ /** eval invocation with one parm to server and one numeric field (either int or double) returned */
+ template< class T, class NumType >
+ bool eval(const string &dbname, const string &jscode, T parm1, NumType& ret) {
+ BSONObj info;
+ BSONElement retValue;
+ BSONObjBuilder b;
+ b.append("0", parm1);
+ BSONObj args = b.done();
+ if ( !eval(dbname, jscode, info, retValue, &args) )
+ return false;
+ ret = (NumType) retValue.number();
+ return true;
+ }
+
+ /**
+ get a list of all the current databases
+ uses the { listDatabases : 1 } command.
+ throws on error
+ */
+ list<string> getDatabaseNames();
+
+ /**
+ get a list of all the current collections in db
+ */
+ list<string> getCollectionNames( const string& db );
+
+ bool exists( const string& ns );
+
+ /** Create an index if it does not already exist.
+ ensureIndex calls are remembered so it is safe/fast to call this function many
+ times in your code.
+ @param ns collection to be indexed
+ @param keys the "key pattern" for the index. e.g., { name : 1 }
+ @param unique if true, indicates that key uniqueness should be enforced for this index
+ @param name if not specified, it will be created from the keys automatically (which is recommended)
+ @param cache if set to false, the index cache for the connection won't remember this call
+ @param background build index in the background (see mongodb docs/wiki for details)
+ @param v index version. leave at default value. (unit tests set this parameter.)
+ @return whether or not a message was sent to the db.
+ should be true on first call, false on subsequent unless resetIndexCache was called
+ */
+ virtual bool ensureIndex( const string &ns , BSONObj keys , bool unique = false, const string &name = "",
+ bool cache = true, bool background = false, int v = -1 );
+
+ /**
+ clears the index cache, so the subsequent call to ensureIndex for any index will go to the server
+ */
+ virtual void resetIndexCache();
+
+ virtual auto_ptr<DBClientCursor> getIndexes( const string &ns );
+
+ virtual void dropIndex( const string& ns , BSONObj keys );
+ virtual void dropIndex( const string& ns , const string& indexName );
+
+ /**
+ drops all indexes for the collection
+ */
+ virtual void dropIndexes( const string& ns );
+
+ virtual void reIndex( const string& ns );
+
+ string genIndexName( const BSONObj& keys );
+
+ /** Erase / drop an entire database */
+ virtual bool dropDatabase(const string &dbname, BSONObj *info = 0) {
+ bool ret = simpleCommand(dbname, info, "dropDatabase");
+ resetIndexCache();
+ return ret;
+ }
+
+ virtual string toString() = 0;
+
+ protected:
+ /** if the result of a command is ok*/
+ bool isOk(const BSONObj&);
+
+ /** if the element contains a not master error */
+ bool isNotMasterErrorString( const BSONElement& e );
+
+ BSONObj _countCmd(const string &ns, const BSONObj& query, int options, int limit, int skip );
+
+ /**
+ * Look up the options available on this client. Caches the answer from
+ * _lookupAvailableOptions(), below.
+ */
+ QueryOptions availableOptions();
+
+ virtual QueryOptions _lookupAvailableOptions();
+
+ private:
+ enum QueryOptions _cachedAvailableOptions;
+ bool _haveCachedAvailableOptions;
+ };
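+
+ /* Sketch of the command helpers above (illustrative; assumes a connected
+ DBClientConnection "conn"):
+
+ BSONObj info;
+ if ( conn.runCommand( "admin", BSON( "ismaster" << 1 ), info ) )
+ cout << info.toString() << endl;
+
+ conn.ensureIndex( "test.people", BSON( "name" << 1 ) ); // remembered; repeat calls skip the server
+
+ string err = conn.getLastError();
+ if ( !err.empty() )
+ cout << "last write failed: " << err << endl;
+ */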
+
+ /**
+ abstract class that implements the core db operations
+ */
+ class DBClientBase : public DBClientWithCommands, public DBConnector {
+ protected:
+ WriteConcern _writeConcern;
+
+ public:
+ DBClientBase() {
+ _writeConcern = W_NORMAL;
+ }
+
+ WriteConcern getWriteConcern() const { return _writeConcern; }
+ void setWriteConcern( WriteConcern w ) { _writeConcern = w; }
+
+ /** send a query to the database.
+ @param ns namespace to query, format is <dbname>.<collectname>[.<collectname>]*
+ @param query query to perform on the collection. this is a BSONObj (binary JSON)
+ You may format as
+ { query: { ... }, orderby: { ... } }
+ to specify a sort order.
+ @param nToReturn n to return (i.e., limit). 0 = unlimited
+ @param nToSkip start with the nth item
+ @param fieldsToReturn optional template of which fields to select. if unspecified, returns all fields
+ @param queryOptions see options enum at top of this file
+
+ @return cursor. 0 if error (connection failure)
+ @throws AssertionException
+ */
+ virtual auto_ptr<DBClientCursor> query(const string &ns, Query query, int nToReturn = 0, int nToSkip = 0,
+ const BSONObj *fieldsToReturn = 0, int queryOptions = 0 , int batchSize = 0 );
+
+
+ /** Uses QueryOption_Exhaust, when available.
+
+ Exhaust mode sends back all query data as fast as possible, with no back-and-forth for
+ OP_GETMORE. If you are certain you will exhaust the query, it could be useful.
+
+ Use the DBClientCursorBatchIterator version, below, if you want to do items in large
+ blocks, perhaps to avoid granular locking and such.
+ */
+ virtual unsigned long long query( boost::function<void(const BSONObj&)> f,
+ const string& ns,
+ Query query,
+ const BSONObj *fieldsToReturn = 0,
+ int queryOptions = 0 );
+
+ virtual unsigned long long query( boost::function<void(DBClientCursorBatchIterator&)> f,
+ const string& ns,
+ Query query,
+ const BSONObj *fieldsToReturn = 0,
+ int queryOptions = 0 );
+
+
+ /** don't use this - called automatically by DBClientCursor for you
+ @param cursorId id of cursor to retrieve
+ @return a handle to a previously allocated cursor
+ @throws AssertionException
+ */
+ virtual auto_ptr<DBClientCursor> getMore( const string &ns, long long cursorId, int nToReturn = 0, int options = 0 );
+
+ /**
+ insert an object into the database
+ */
+ virtual void insert( const string &ns , BSONObj obj , int flags=0);
+
+ /**
+ insert a vector of objects into the database
+ */
+ virtual void insert( const string &ns, const vector< BSONObj >& v , int flags=0);
+
+ /**
+ remove matching objects from the database
+ @param justOne if this is true, the remove stops after the first matching document
+ */
+ virtual void remove( const string &ns , Query q , bool justOne = 0 );
+
+ /**
+ updates objects matching query
+ */
+ virtual void update( const string &ns , Query query , BSONObj obj , bool upsert = false , bool multi = false );
+
+ virtual bool isFailed() const = 0;
+
+ virtual void killCursor( long long cursorID ) = 0;
+
+ virtual bool callRead( Message& toSend , Message& response ) = 0;
+ // virtual bool callWrite( Message& toSend , Message& response ) = 0; // TODO: add this if needed
+
+ virtual ConnectionString::ConnectionType type() const = 0;
+
+ virtual double getSoTimeout() const = 0;
+
+ }; // DBClientBase
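+
+ /* A CRUD round trip through the core operations (illustrative; assumes a
+ connected DBClientConnection "conn"):
+
+ conn.insert( "test.people", BSON( "name" << "Joe" << "age" << 33 ) );
+ conn.update( "test.people", QUERY( "name" << "Joe" ),
+ BSON( "$inc" << BSON( "age" << 1 ) ), false /*upsert*/, false /*multi*/ );
+ conn.remove( "test.people", QUERY( "name" << "Joe" ), true /*justOne*/ );
+ */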
+
+ class DBClientReplicaSet;
+
+ class ConnectException : public UserException {
+ public:
+ ConnectException(string msg) : UserException(9000,msg) { }
+ };
+
+ /**
+ A basic connection to the database.
+ This is the main entry point for talking to a simple Mongo setup
+ */
+ class DBClientConnection : public DBClientBase {
+ public:
+ using DBClientBase::query;
+
+ /**
+ @param _autoReconnect if true, automatically reconnect on a connection failure
+ @param cp used by DBClientReplicaSet. You do not need to specify this parameter
+ @param so_timeout tcp timeout in seconds - this is for read/write, not connect.
+ Connect timeout is fixed, but short, at 5 seconds.
+ */
+ DBClientConnection(bool _autoReconnect=false, DBClientReplicaSet* cp=0, double so_timeout=0) :
+ clientSet(cp), _failed(false), autoReconnect(_autoReconnect), lastReconnectTry(0), _so_timeout(so_timeout) {
+ _numConnections++;
+ }
+
+ virtual ~DBClientConnection() {
+ _numConnections--;
+ }
+
+ /** Connect to a Mongo database server.
+
+ If autoReconnect is true, you can try to use the DBClientConnection even when
+ false was returned -- it will try to connect again.
+
+ @param hostname host to connect to. Can include a port number ( 127.0.0.1 , 127.0.0.1:5555 ).
+ If you use IPv6 you must add a port number ( ::1:27017 ).
+ @param errmsg any relevant error message will be appended to the string
+ @deprecated please use HostAndPort
+ @return false if fails to connect.
+ */
+ virtual bool connect(const char * hostname, string& errmsg) {
+ // TODO: remove this method
+ HostAndPort t( hostname );
+ return connect( t , errmsg );
+ }
+
+ /** Connect to a Mongo database server.
+
+ If autoReconnect is true, you can try to use the DBClientConnection even when
+ false was returned -- it will try to connect again.
+
+ @param server server to connect to.
+ @param errmsg any relevant error message will be appended to the string
+ @return false if fails to connect.
+ */
+ virtual bool connect(const HostAndPort& server, string& errmsg);
+
+ /** Connect to a Mongo database server. Exception throwing version.
+ Throws a UserException if it cannot connect.
+
+ If autoReconnect is true, you can keep using the DBClientConnection even after a
+ failed connect attempt -- it will try to connect again on subsequent operations.
+
+ @param serverHostname host to connect to. Can include a port number ( 127.0.0.1 , 127.0.0.1:5555 )
+ */
+ void connect(const string& serverHostname) {
+ string errmsg;
+ if( !connect(HostAndPort(serverHostname), errmsg) )
+ throw ConnectException(string("can't connect ") + errmsg);
+ }
+
+ virtual bool auth(const string &dbname, const string &username, const string &pwd, string& errmsg, bool digestPassword = true, Auth::Level* level=NULL);
+
+ virtual auto_ptr<DBClientCursor> query(const string &ns, Query query=Query(), int nToReturn = 0, int nToSkip = 0,
+ const BSONObj *fieldsToReturn = 0, int queryOptions = 0 , int batchSize = 0 ) {
+ checkConnection();
+ return DBClientBase::query( ns, query, nToReturn, nToSkip, fieldsToReturn, queryOptions , batchSize );
+ }
+
+ virtual unsigned long long query( boost::function<void(DBClientCursorBatchIterator &)> f,
+ const string& ns,
+ Query query,
+ const BSONObj *fieldsToReturn,
+ int queryOptions );
+
+ virtual bool runCommand(const string &dbname, const BSONObj& cmd, BSONObj &info, int options=0);
+
+ /**
+ @return true if this connection is currently in a failed state. When autoReconnect is on,
+ a connection will transition back to an ok state after reconnecting.
+ */
+ bool isFailed() const { return _failed; }
+
+ MessagingPort& port() { assert(p); return *p; }
+
+ string toStringLong() const {
+ stringstream ss;
+ ss << _serverString;
+ if ( _failed ) ss << " failed";
+ return ss.str();
+ }
+
+ /** Returns the address of the server */
+ string toString() { return _serverString; }
+
+ string getServerAddress() const { return _serverString; }
+
+ virtual void killCursor( long long cursorID );
+ virtual bool callRead( Message& toSend , Message& response ) { return call( toSend , response ); }
+ virtual void say( Message &toSend, bool isRetry = false , string * actualServer = 0 );
+ virtual bool recv( Message& m );
+ virtual void checkResponse( const char *data, int nReturned, bool* retry = NULL, string* host = NULL );
+ virtual bool call( Message &toSend, Message &response, bool assertOk = true , string * actualServer = 0 );
+ virtual ConnectionString::ConnectionType type() const { return ConnectionString::MASTER; }
+ void setSoTimeout(double to) { _so_timeout = to; }
+ double getSoTimeout() const { return _so_timeout; }
+
+ virtual bool lazySupported() const { return true; }
+
+ static int getNumConnections() {
+ return _numConnections;
+ }
+
+ static void setLazyKillCursor( bool lazy ) { _lazyKillCursor = lazy; }
+ static bool getLazyKillCursor() { return _lazyKillCursor; }
+
+ protected:
+ friend class SyncClusterConnection;
+ virtual void sayPiggyBack( Message &toSend );
+
+ DBClientReplicaSet *clientSet;
+ boost::scoped_ptr<MessagingPort> p;
+ boost::scoped_ptr<SockAddr> server;
+ bool _failed;
+ const bool autoReconnect;
+ time_t lastReconnectTry;
+ HostAndPort _server; // remember for reconnects
+ string _serverString;
+ void _checkConnection();
+
+ // throws SocketException if in failed state and not reconnecting or if waiting to reconnect
+ void checkConnection() { if( _failed ) _checkConnection(); }
+
+ map< string, pair<string,string> > authCache;
+ double _so_timeout;
+ bool _connect( string& errmsg );
+
+ static AtomicUInt _numConnections;
+ static bool _lazyKillCursor; // lazy means we piggy back kill cursors on next op
+
+#ifdef MONGO_SSL
+ static SSLManager* sslManager();
+ static SSLManager* _sslManager;
+#endif
+ };
+
+ /** pings server to check if it's up
+ */
+ bool serverAlive( const string &uri );
+
+ DBClientBase * createDirectClient();
+
+ BSONElement getErrField( const BSONObj& result );
+ bool hasErrField( const BSONObj& result );
+
+ inline std::ostream& operator<<( std::ostream &s, const Query &q ) {
+ return s << q.toString();
+ }
+
+} // namespace mongo
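For orientation, here is a minimal end-to-end sketch of the interface declared above
(not part of this patch). It assumes a mongod listening on 127.0.0.1:27017; the
collection name test.demo is illustrative:

    #include <iostream>
    #include <memory>
    #include "mongo/client/dbclient.h"

    using namespace std;
    using namespace mongo;

    int main() {
        DBClientConnection conn( /*autoReconnect*/ true );
        string errmsg;
        if ( !conn.connect( HostAndPort( "127.0.0.1:27017" ), errmsg ) ) {
            cout << "couldn't connect: " << errmsg << endl;
            return 1;
        }
        conn.insert( "test.demo", BSON( "name" << "ada" << "num" << 1 ) );
        // Query's sort() produces the { query: {...}, orderby: {...} } form
        // described in the query() documentation above.
        auto_ptr<DBClientCursor> cur =
            conn.query( "test.demo", Query().sort( "num" ), /*nToReturn*/ 10 );
        while ( cur->more() )
            cout << cur->next().jsonString() << endl;
        return 0;
    }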
diff --git a/src/mongo/client/distlock.cpp b/src/mongo/client/distlock.cpp
index 5e30f4ad52c..7316ba063cc 100644
--- a/src/mongo/client/distlock.cpp
+++ b/src/mongo/client/distlock.cpp
@@ -15,9 +15,13 @@
* limitations under the License.
*/
-#include "pch.h"
-#include "dbclient.h"
-#include "distlock.h"
+#include "mongo/pch.h"
+
+#include "mongo/client/distlock.h"
+
+#include "mongo/client/dbclient.h"
+#include "mongo/client/dbclientcursor.h"
+
namespace mongo {
diff --git a/src/mongo/client/examples/first.cpp b/src/mongo/client/examples/first.cpp
index 047ff1914b7..01428bc977a 100644
--- a/src/mongo/client/examples/first.cpp
+++ b/src/mongo/client/examples/first.cpp
@@ -21,7 +21,7 @@
#include <iostream>
-#include "client/dbclient.h"
+#include "mongo/client/dbclient.h"
using namespace std;
diff --git a/src/mongo/client/examples/second.cpp b/src/mongo/client/examples/second.cpp
index 6cc2111580f..2126e5f8418 100644
--- a/src/mongo/client/examples/second.cpp
+++ b/src/mongo/client/examples/second.cpp
@@ -18,6 +18,7 @@
#include <iostream>
#include "client/dbclient.h"
+#include "client/connpool.h"
using namespace std;
using namespace mongo;
@@ -31,26 +32,23 @@ int main( int argc, const char **argv ) {
port = argv[ 2 ];
}
- DBClientConnection conn;
- string errmsg;
- if ( ! conn.connect( string( "127.0.0.1:" ) + port , errmsg ) ) {
- cout << "couldn't connect : " << errmsg << endl;
- throw -11;
- }
+ ScopedDbConnection conn( string( "127.0.0.1:" ) + port );
const char * ns = "test.second";
- conn.remove( ns , BSONObj() );
+ conn->remove( ns , BSONObj() );
- conn.insert( ns , BSON( "name" << "eliot" << "num" << 17 ) );
- conn.insert( ns , BSON( "name" << "sara" << "num" << 24 ) );
+ conn->insert( ns , BSON( "name" << "eliot" << "num" << 17 ) );
+ conn->insert( ns , BSON( "name" << "sara" << "num" << 24 ) );
- auto_ptr<DBClientCursor> cursor = conn.query( ns , BSONObj() );
+ auto_ptr<DBClientCursor> cursor = conn->query( ns , BSONObj() );
cout << "using cursor" << endl;
while ( cursor->more() ) {
BSONObj obj = cursor->next();
cout << "\t" << obj.jsonString() << endl;
}
- conn.ensureIndex( ns , BSON( "name" << 1 << "num" << -1 ) );
+ conn->ensureIndex( ns , BSON( "name" << 1 << "num" << -1 ) );
+
+ conn.done();
}
diff --git a/src/mongo/client/gridfs.cpp b/src/mongo/client/gridfs.cpp
index 7dcb1d5bcb1..b3f23a07277 100644
--- a/src/mongo/client/gridfs.cpp
+++ b/src/mongo/client/gridfs.cpp
@@ -15,13 +15,15 @@
* limitations under the License.
*/
-#include "pch.h"
+#include "mongo/pch.h"
+
+#include <boost/smart_ptr.hpp>
#include <fcntl.h>
-#include <utility>
#include <fstream>
+#include <utility>
-#include "gridfs.h"
-#include <boost/smart_ptr.hpp>
+#include "mongo/client/gridfs.h"
+#include "mongo/client/dbclientcursor.h"
#if defined(_WIN32)
#include <io.h>
diff --git a/src/mongo/client/parallel.h b/src/mongo/client/parallel.h
index a968464910f..f7ad47d9dd1 100644
--- a/src/mongo/client/parallel.h
+++ b/src/mongo/client/parallel.h
@@ -21,13 +21,17 @@
#pragma once
-#include "../pch.h"
-#include "dbclient.h"
-#include "redef_macros.h"
-#include "../db/dbmessage.h"
-#include "../db/matcher.h"
-#include "../util/concurrency/mvar.h"
-#include "../s/util.h"
+#include "mongo/pch.h"
+
+#include "mongo/client/dbclient.h"
+
+#include "mongo/client/redef_macros.h"
+
+#include "mongo/db/dbmessage.h"
+#include "mongo/db/matcher.h"
+#include "mongo/db/namespacestring.h"
+#include "mongo/s/util.h"
+#include "mongo/util/concurrency/mvar.h"
namespace mongo {
@@ -462,4 +466,4 @@ namespace mongo {
}
-#include "undef_macros.h"
+#include "mongo/client/undef_macros.h"
diff --git a/src/mongo/client/syncclusterconnection.cpp b/src/mongo/client/syncclusterconnection.cpp
index fbb93dc8af2..f9262ab6240 100644
--- a/src/mongo/client/syncclusterconnection.cpp
+++ b/src/mongo/client/syncclusterconnection.cpp
@@ -16,9 +16,12 @@
*/
-#include "pch.h"
-#include "syncclusterconnection.h"
-#include "../db/dbmessage.h"
+#include "mongo/pch.h"
+
+#include "mongo/client/syncclusterconnection.h"
+
+#include "mongo/client/dbclientcursor.h"
+#include "mongo/db/dbmessage.h"
// error codes 8000-8009
diff --git a/src/mongo/db/authlevel.h b/src/mongo/db/authlevel.h
new file mode 100644
index 00000000000..af0a5665424
--- /dev/null
+++ b/src/mongo/db/authlevel.h
@@ -0,0 +1,43 @@
+// mongo/db/authlevel.h
+
+/**
+ * Copyright (C) 2009 10gen Inc.
+ *
+ * This program is free software: you can redistribute it and/or modify
+ * it under the terms of the GNU Affero General Public License, version 3,
+ * as published by the Free Software Foundation.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ * GNU Affero General Public License for more details.
+ *
+ * You should have received a copy of the GNU Affero General Public License
+ * along with this program. If not, see <http://www.gnu.org/licenses/>.
+ */
+
+#pragma once
+
+#include <string>
+
+namespace mongo {
+
+ /*
+ * access level for a particular db.
+ * levels:
+ * 0 : none
+ * 1 : read
+ * 2 : write
+ */
+ struct Auth {
+
+ enum Level { NONE = 0 ,
+ READ = 1 ,
+ WRITE = 2 };
+
+ Auth() : level( NONE ) {}
+
+ Level level;
+ string user;
+ };
+} // namespace mongo
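A hypothetical usage sketch for the new Auth struct (the helpers below are
illustrative, not part of this patch); because the Level values are ordered
NONE < READ < WRITE, access checks reduce to comparisons:

    #include "mongo/db/authlevel.h"

    namespace mongo {
        // Illustrative helpers only: write access implies read access,
        // matching the numeric ordering of the Level enum.
        inline bool hasReadAccess( const Auth& a )  { return a.level >= Auth::READ; }
        inline bool hasWriteAccess( const Auth& a ) { return a.level >= Auth::WRITE; }
    }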
diff --git a/src/mongo/db/client.h b/src/mongo/db/client.h
index c18642ee96e..a277a97ec89 100644
--- a/src/mongo/db/client.h
+++ b/src/mongo/db/client.h
@@ -34,6 +34,7 @@
#include "../util/net/message_port.h"
#include "../util/concurrency/rwlock.h"
#include "d_concurrency.h"
+#include "mongo/util/paths.h"
namespace mongo {
diff --git a/src/mongo/db/d_concurrency.cpp b/src/mongo/db/d_concurrency.cpp
index 049b8948682..55ed6f389da 100644
--- a/src/mongo/db/d_concurrency.cpp
+++ b/src/mongo/db/d_concurrency.cpp
@@ -12,6 +12,7 @@
#include "d_globals.h"
#include "mongomutex.h"
#include "server.h"
+#include "dur.h"
// oplog locking
// no top level read locks
diff --git a/src/mongo/db/database.h b/src/mongo/db/database.h
index a7867e20e8c..7cac667a6f5 100644
--- a/src/mongo/db/database.h
+++ b/src/mongo/db/database.h
@@ -18,8 +18,8 @@
#pragma once
-#include "cmdline.h"
-#include "namespace.h"
+#include "mongo/db/cmdline.h"
+#include "mongo/db/namespace_details.h"
namespace mongo {
diff --git a/src/mongo/db/dbmessage.h b/src/mongo/db/dbmessage.h
index a789bff849c..ad5aea2cdff 100644
--- a/src/mongo/db/dbmessage.h
+++ b/src/mongo/db/dbmessage.h
@@ -18,7 +18,6 @@
#pragma once
-#include "diskloc.h"
#include "jsobj.h"
#include "namespace-inl.h"
#include "../util/net/message.h"
diff --git a/src/mongo/db/dur_journal.cpp b/src/mongo/db/dur_journal.cpp
index 43825bf25e8..7f1e4351c46 100644
--- a/src/mongo/db/dur_journal.cpp
+++ b/src/mongo/db/dur_journal.cpp
@@ -38,6 +38,7 @@
#include "../util/compress.h"
#include "../util/progress_meter.h"
#include "../server.h"
+#include "../util/mmap.h"
using namespace mongoutils;
diff --git a/src/mongo/db/extsort.h b/src/mongo/db/extsort.h
index 8c9c173989c..c292ed12ad6 100644
--- a/src/mongo/db/extsort.h
+++ b/src/mongo/db/extsort.h
@@ -18,11 +18,14 @@
#pragma once
-#include "../pch.h"
-#include "jsobj.h"
-#include "namespace-inl.h"
-#include "curop-inl.h"
-#include "../util/array.h"
+#include "mongo/pch.h"
+
+#include "mongo/db/index.h"
+#include "mongo/db/jsobj.h"
+#include "mongo/db/namespace-inl.h"
+#include "mongo/db/curop-inl.h"
+#include "mongo/util/array.h"
+#include "mongo/util/mmap.h"
namespace mongo {
diff --git a/src/mongo/db/index.h b/src/mongo/db/index.h
index d297f8a4ca1..4418f2ad382 100644
--- a/src/mongo/db/index.h
+++ b/src/mongo/db/index.h
@@ -23,6 +23,7 @@
#include "jsobj.h"
#include "indexkey.h"
#include "key.h"
+#include "namespace.h"
namespace mongo {
diff --git a/src/mongo/db/instance.h b/src/mongo/db/instance.h
index cf9698a95da..090250ace0a 100644
--- a/src/mongo/db/instance.h
+++ b/src/mongo/db/instance.h
@@ -20,7 +20,7 @@
#pragma once
-#include "../client/dbclient.h"
+#include "mongo/client/dbclient.h"
#include "curop-inl.h"
#include "security.h"
#include "cmdline.h"
diff --git a/src/mongo/db/namespace-inl.h b/src/mongo/db/namespace-inl.h
index a621a229546..c18f681e0b9 100644
--- a/src/mongo/db/namespace-inl.h
+++ b/src/mongo/db/namespace-inl.h
@@ -18,7 +18,7 @@
#pragma once
-#include "namespace.h"
+#include "mongo/db/namespace.h"
namespace mongo {
@@ -70,63 +70,4 @@ namespace mongo {
return old + "." + local;
}
- inline IndexDetails& NamespaceDetails::idx(int idxNo, bool missingExpected ) {
- if( idxNo < NIndexesBase ) {
- IndexDetails& id = _indexes[idxNo];
- return id;
- }
- Extra *e = extra();
- if ( ! e ) {
- if ( missingExpected )
- throw MsgAssertionException( 13283 , "Missing Extra" );
- massert(14045, "missing Extra", e);
- }
- int i = idxNo - NIndexesBase;
- if( i >= NIndexesExtra ) {
- e = e->next(this);
- if ( ! e ) {
- if ( missingExpected )
- throw MsgAssertionException( 14823 , "missing extra" );
- massert(14824, "missing Extra", e);
- }
- i -= NIndexesExtra;
- }
- return e->details[i];
- }
-
- inline int NamespaceDetails::idxNo(IndexDetails& idx) {
- IndexIterator i = ii();
- while( i.more() ) {
- if( &i.next() == &idx )
- return i.pos()-1;
- }
- massert( 10349 , "E12000 idxNo fails", false);
- return -1;
- }
-
- inline int NamespaceDetails::findIndexByKeyPattern(const BSONObj& keyPattern) {
- IndexIterator i = ii();
- while( i.more() ) {
- if( i.next().keyPattern() == keyPattern )
- return i.pos()-1;
- }
- return -1;
- }
-
- // @return offset in indexes[]
- inline int NamespaceDetails::findIndexByName(const char *name) {
- IndexIterator i = ii();
- while( i.more() ) {
- if ( strcmp(i.next().info.obj().getStringField("name"),name) == 0 )
- return i.pos()-1;
- }
- return -1;
- }
-
- inline NamespaceDetails::IndexIterator::IndexIterator(NamespaceDetails *_d) {
- d = _d;
- i = 0;
- n = d->nIndexes;
- }
-
-}
+} // namespace mongo
diff --git a/src/mongo/db/namespace.cpp b/src/mongo/db/namespace.cpp
index c84afa824e6..77a45fe8da1 100644
--- a/src/mongo/db/namespace.cpp
+++ b/src/mongo/db/namespace.cpp
@@ -16,788 +16,16 @@
* along with this program. If not, see <http://www.gnu.org/licenses/>.
*/
-#include "pch.h"
-#include "pdfile.h"
-#include "db.h"
-#include "mongommf.h"
-#include "../util/hashtab.h"
-#include "../scripting/engine.h"
-#include "btree.h"
-#include <algorithm>
-#include <list>
-#include "json.h"
-#include "ops/delete.h"
+#include "mongo/db/namespace.h"
-#include <boost/filesystem/operations.hpp>
+#include <boost/static_assert.hpp>
-namespace mongo {
-
- BOOST_STATIC_ASSERT( sizeof(Namespace) == 128 );
-
- BSONObj idKeyPattern = fromjson("{\"_id\":1}");
-
- /* deleted lists -- linked lists of deleted records -- are placed in 'buckets' of various sizes
- so you can look for a deleterecord about the right size.
- */
- int bucketSizes[] = {
- 32, 64, 128, 256, 0x200, 0x400, 0x800, 0x1000, 0x2000, 0x4000,
- 0x8000, 0x10000, 0x20000, 0x40000, 0x80000, 0x100000, 0x200000,
- 0x400000, 0x800000
- };
-
- NamespaceDetails::NamespaceDetails( const DiskLoc &loc, bool _capped ) {
- /* be sure to initialize new fields here -- doesn't default to zeroes the way we use it */
- firstExtent = lastExtent = capExtent = loc;
- stats.datasize = stats.nrecords = 0;
- lastExtentSize = 0;
- nIndexes = 0;
- capped = _capped;
- max = 0x7fffffff;
- paddingFactor = 1.0;
- flags = 0;
- capFirstNewRecord = DiskLoc();
- // Signal that we are on first allocation iteration through extents.
- capFirstNewRecord.setInvalid();
- // For capped case, signal that we are doing initial extent allocation.
- if ( capped )
- cappedLastDelRecLastExtent().setInvalid();
- assert( sizeof(dataFileVersion) == 2 );
- dataFileVersion = 0;
- indexFileVersion = 0;
- multiKeyIndexBits = 0;
- reservedA = 0;
- extraOffset = 0;
- indexBuildInProgress = 0;
- reservedB = 0;
- capped2.cc2_ptr = 0;
- capped2.fileNumber = 0;
- memset(reserved, 0, sizeof(reserved));
- }
-
- bool NamespaceIndex::exists() const {
- return !boost::filesystem::exists(path());
- }
-
- boost::filesystem::path NamespaceIndex::path() const {
- boost::filesystem::path ret( dir_ );
- if ( directoryperdb )
- ret /= database_;
- ret /= ( database_ + ".ns" );
- return ret;
- }
-
- void NamespaceIndex::maybeMkdir() const {
- if ( !directoryperdb )
- return;
- boost::filesystem::path dir( dir_ );
- dir /= database_;
- if ( !boost::filesystem::exists( dir ) )
- MONGO_BOOST_CHECK_EXCEPTION_WITH_MSG( boost::filesystem::create_directory( dir ), "create dir for db " );
- }
-
- unsigned lenForNewNsFiles = 16 * 1024 * 1024;
-
-#if defined(_DEBUG)
- void NamespaceDetails::dump(const Namespace& k) {
- if( !cmdLine.dur )
- cout << "ns offsets which follow will not display correctly with --journal disabled" << endl;
-
- size_t ofs = 1; // 1 is sentinel that the find call below failed
- privateViews.find(this, /*out*/ofs);
-
- cout << "ns" << hex << setw(8) << ofs << ' ';
- cout << k.toString() << '\n';
-
- if( k.isExtra() ) {
- cout << "ns\t extra" << endl;
- return;
- }
-
- cout << "ns " << firstExtent.toString() << ' ' << lastExtent.toString() << " nidx:" << nIndexes << '\n';
- cout << "ns " << stats.datasize << ' ' << stats.nrecords << ' ' << nIndexes << '\n';
- cout << "ns " << capped << ' ' << paddingFactor << ' ' << flags << ' ' << dataFileVersion << '\n';
- cout << "ns " << multiKeyIndexBits << ' ' << indexBuildInProgress << '\n';
- cout << "ns " << (int) reserved[0] << ' ' << (int) reserved[59];
- cout << endl;
- }
-#endif
-
- void NamespaceDetails::onLoad(const Namespace& k) {
-
- if( k.isExtra() ) {
- /* overflow storage for indexes - so don't treat as a NamespaceDetails object. */
- return;
- }
-
- if( indexBuildInProgress || capped2.cc2_ptr ) {
- assertInWriteLock();
- if( indexBuildInProgress ) {
- log() << "indexBuildInProgress was " << indexBuildInProgress << " for " << k << ", indicating an abnormal db shutdown" << endl;
- getDur().writingInt( indexBuildInProgress ) = 0;
- }
- if( capped2.cc2_ptr )
- *getDur().writing(&capped2.cc2_ptr) = 0;
- }
- }
-
- static void namespaceOnLoadCallback(const Namespace& k, NamespaceDetails& v) {
- v.onLoad(k);
- }
-
- bool checkNsFilesOnLoad = true;
-
- NOINLINE_DECL void NamespaceIndex::_init() {
- assert( !ht );
-
- Lock::assertWriteLocked(database_);
-
- /* if someone manually deleted the datafiles for a database,
- we need to be sure to clear any cached info for the database in
- local.*.
- */
- /*
- if ( "local" != database_ ) {
- DBInfo i(database_.c_str());
- i.dbDropped();
- }
- */
-
- unsigned long long len = 0;
- boost::filesystem::path nsPath = path();
- string pathString = nsPath.string();
- void *p = 0;
- if( boost::filesystem::exists(nsPath) ) {
- if( f.open(pathString, true) ) {
- len = f.length();
- if ( len % (1024*1024) != 0 ) {
- log() << "bad .ns file: " << pathString << endl;
- uassert( 10079 , "bad .ns file length, cannot open database", len % (1024*1024) == 0 );
- }
- p = f.getView();
- }
- }
- else {
- // use lenForNewNsFiles, we are making a new database
- massert( 10343, "bad lenForNewNsFiles", lenForNewNsFiles >= 1024*1024 );
- maybeMkdir();
- unsigned long long l = lenForNewNsFiles;
- if( f.create(pathString, l, true) ) {
- getDur().createdFile(pathString, l); // always a new file
- len = l;
- assert( len == lenForNewNsFiles );
- p = f.getView();
- }
- }
-
- if ( p == 0 ) {
- /** TODO: this shouldn't terminate? */
- log() << "error couldn't open file " << pathString << " terminating" << endl;
- dbexit( EXIT_FS );
- }
-
-
- assert( len <= 0x7fffffff );
- ht = new HashTable<Namespace,NamespaceDetails>(p, (int) len, "namespace index");
- if( checkNsFilesOnLoad )
- ht->iterAll(namespaceOnLoadCallback);
- }
-
- static void namespaceGetNamespacesCallback( const Namespace& k , NamespaceDetails& v , void * extra ) {
- list<string> * l = (list<string>*)extra;
- if ( ! k.hasDollarSign() )
- l->push_back( (string)k );
- }
- void NamespaceIndex::getNamespaces( list<string>& tofill , bool onlyCollections ) const {
- assert( onlyCollections ); // TODO: need to implement this
- // need boost::bind or something to make this less ugly
-
- if ( ht )
- ht->iterAll( namespaceGetNamespacesCallback , (void*)&tofill );
- }
-
- void NamespaceDetails::addDeletedRec(DeletedRecord *d, DiskLoc dloc) {
- BOOST_STATIC_ASSERT( sizeof(NamespaceDetails::Extra) <= sizeof(NamespaceDetails) );
-
- {
- Record *r = (Record *) getDur().writingPtr(d, sizeof(Record));
- d = &r->asDeleted();
- // defensive code: try to make us notice if we reference a deleted record
- (unsigned&) (r->data) = 0xeeeeeeee;
- }
- DEBUGGING log() << "TEMP: add deleted rec " << dloc.toString() << ' ' << hex << d->extentOfs << endl;
- if ( capped ) {
- if ( !cappedLastDelRecLastExtent().isValid() ) {
- // Initial extent allocation. Insert at end.
- d->nextDeleted = DiskLoc();
- if ( cappedListOfAllDeletedRecords().isNull() )
- getDur().writingDiskLoc( cappedListOfAllDeletedRecords() ) = dloc;
- else {
- DiskLoc i = cappedListOfAllDeletedRecords();
- for (; !i.drec()->nextDeleted.isNull(); i = i.drec()->nextDeleted )
- ;
- i.drec()->nextDeleted.writing() = dloc;
- }
- }
- else {
- d->nextDeleted = cappedFirstDeletedInCurExtent();
- getDur().writingDiskLoc( cappedFirstDeletedInCurExtent() ) = dloc;
- // always compact() after this so order doesn't matter
- }
- }
- else {
- int b = bucket(d->lengthWithHeaders);
- DiskLoc& list = deletedList[b];
- DiskLoc oldHead = list;
- getDur().writingDiskLoc(list) = dloc;
- d->nextDeleted = oldHead;
- }
- }
-
- /* predetermine location of the next alloc without actually doing it.
- if cannot predetermine returns null (so still call alloc() then)
- */
- DiskLoc NamespaceDetails::allocWillBeAt(const char *ns, int lenToAlloc) {
- if ( !capped ) {
- lenToAlloc = (lenToAlloc + 3) & 0xfffffffc;
- return __stdAlloc(lenToAlloc, true);
- }
- return DiskLoc();
- }
-
- /** allocate space for a new record from deleted lists.
- @param lenToAlloc is WITH header
- @param extentLoc OUT returns the extent location
- @return null diskloc if no room - allocate a new extent then
- */
- DiskLoc NamespaceDetails::alloc(const char *ns, int lenToAlloc, DiskLoc& extentLoc) {
- {
- // align very slightly.
- // note that if doing more coarse-grained quantization (really just if it isn't always
- // a constant amount but if it varied by record size) then that quantization should
- // NOT be done here but rather in __stdAlloc so that we can grab a deletedrecord that
- // is just big enough if we happen to run into one.
- lenToAlloc = (lenToAlloc + 3) & 0xfffffffc;
- }
-
- DiskLoc loc = _alloc(ns, lenToAlloc);
- if ( loc.isNull() )
- return loc;
-
- const DeletedRecord *r = loc.drec();
- //r = getDur().writing(r);
-
- /* note we want to grab from the front so our next pointers on disk tend
- to go in a forward direction which is important for performance. */
- int regionlen = r->lengthWithHeaders;
- extentLoc.set(loc.a(), r->extentOfs);
- assert( r->extentOfs < loc.getOfs() );
-
- DEBUGGING out() << "TEMP: alloc() returns " << loc.toString() << ' ' << ns << " lentoalloc:" << lenToAlloc << " ext:" << extentLoc.toString() << endl;
-
- int left = regionlen - lenToAlloc;
- if ( capped == 0 ) {
- if ( left < 24 || left < (lenToAlloc >> 3) ) {
- // you get the whole thing.
- return loc;
- }
- }
-
- /* split off some for further use. */
- getDur().writingInt(r->lengthWithHeaders) = lenToAlloc;
- DiskLoc newDelLoc = loc;
- newDelLoc.inc(lenToAlloc);
- DeletedRecord *newDel = DataFileMgr::makeDeletedRecord(newDelLoc, left);
- DeletedRecord *newDelW = getDur().writing(newDel);
- newDelW->extentOfs = r->extentOfs;
- newDelW->lengthWithHeaders = left;
- newDelW->nextDeleted.Null();
-
- addDeletedRec(newDel, newDelLoc);
-
- return loc;
- }
-
- /* for non-capped collections.
- @param peekOnly just look up where and don't reserve
- returned item is out of the deleted list upon return
- */
- DiskLoc NamespaceDetails::__stdAlloc(int len, bool peekOnly) {
- DiskLoc *prev;
- DiskLoc *bestprev = 0;
- DiskLoc bestmatch;
- int bestmatchlen = 0x7fffffff;
- int b = bucket(len);
- DiskLoc cur = deletedList[b];
- prev = &deletedList[b];
- int extra = 5; // look for a better fit, a little.
- int chain = 0;
- while ( 1 ) {
- {
- int a = cur.a();
- if ( a < -1 || a >= 100000 ) {
- problem() << "~~ Assertion - cur out of range in _alloc() " << cur.toString() <<
- " a:" << a << " b:" << b << " chain:" << chain << '\n';
- sayDbContext();
- if ( cur == *prev )
- prev->Null();
- cur.Null();
- }
- }
- if ( cur.isNull() ) {
- // move to next bucket. if we were doing "extra", just break
- if ( bestmatchlen < 0x7fffffff )
- break;
- b++;
- if ( b > MaxBucket ) {
- // out of space. alloc a new extent.
- return DiskLoc();
- }
- cur = deletedList[b];
- prev = &deletedList[b];
- continue;
- }
- DeletedRecord *r = cur.drec();
- if ( r->lengthWithHeaders >= len &&
- r->lengthWithHeaders < bestmatchlen ) {
- bestmatchlen = r->lengthWithHeaders;
- bestmatch = cur;
- bestprev = prev;
- }
- if ( bestmatchlen < 0x7fffffff && --extra <= 0 )
- break;
- if ( ++chain > 30 && b < MaxBucket ) {
- // too slow, force move to next bucket to grab a big chunk
- //b++;
- chain = 0;
- cur.Null();
- }
- else {
- /*this defensive check only made sense for the mmap storage engine:
- if ( r->nextDeleted.getOfs() == 0 ) {
- problem() << "~~ Assertion - bad nextDeleted " << r->nextDeleted.toString() <<
- " b:" << b << " chain:" << chain << ", fixing.\n";
- r->nextDeleted.Null();
- }*/
- cur = r->nextDeleted;
- prev = &r->nextDeleted;
- }
- }
-
- /* unlink ourself from the deleted list */
- if( !peekOnly ) {
- const DeletedRecord *bmr = bestmatch.drec();
- *getDur().writing(bestprev) = bmr->nextDeleted;
- bmr->nextDeleted.writing().setInvalid(); // defensive.
- assert(bmr->extentOfs < bestmatch.getOfs());
- }
-
- return bestmatch;
- }
-
- void NamespaceDetails::dumpDeleted(set<DiskLoc> *extents) {
- for ( int i = 0; i < Buckets; i++ ) {
- DiskLoc dl = deletedList[i];
- while ( !dl.isNull() ) {
- DeletedRecord *r = dl.drec();
- DiskLoc extLoc(dl.a(), r->extentOfs);
- if ( extents == 0 || extents->count(extLoc) <= 0 ) {
- out() << " bucket " << i << endl;
- out() << " " << dl.toString() << " ext:" << extLoc.toString();
- if ( extents && extents->count(extLoc) <= 0 )
- out() << '?';
- out() << " len:" << r->lengthWithHeaders << endl;
- }
- dl = r->nextDeleted;
- }
- }
- }
-
- DiskLoc NamespaceDetails::firstRecord( const DiskLoc &startExtent ) const {
- for (DiskLoc i = startExtent.isNull() ? firstExtent : startExtent;
- !i.isNull(); i = i.ext()->xnext ) {
- if ( !i.ext()->firstRecord.isNull() )
- return i.ext()->firstRecord;
- }
- return DiskLoc();
- }
+#include "mongo/db/namespacestring.h"
- DiskLoc NamespaceDetails::lastRecord( const DiskLoc &startExtent ) const {
- for (DiskLoc i = startExtent.isNull() ? lastExtent : startExtent;
- !i.isNull(); i = i.ext()->xprev ) {
- if ( !i.ext()->lastRecord.isNull() )
- return i.ext()->lastRecord;
- }
- return DiskLoc();
- }
-
- int n_complaints_cap = 0;
- void NamespaceDetails::maybeComplain( const char *ns, int len ) const {
- if ( ++n_complaints_cap < 8 ) {
- out() << "couldn't make room for new record (len: " << len << ") in capped ns " << ns << '\n';
- int i = 0;
- for ( DiskLoc e = firstExtent; !e.isNull(); e = e.ext()->xnext, ++i ) {
- out() << " Extent " << i;
- if ( e == capExtent )
- out() << " (capExtent)";
- out() << '\n';
- out() << " magic: " << hex << e.ext()->magic << dec << " extent->ns: " << e.ext()->nsDiagnostic.toString() << '\n';
- out() << " fr: " << e.ext()->firstRecord.toString() <<
- " lr: " << e.ext()->lastRecord.toString() << " extent->len: " << e.ext()->length << '\n';
- }
- assert( len * 5 > lastExtentSize ); // assume it is unusually large record; if not, something is broken
- }
- }
-
- /* alloc with capped table handling. */
- DiskLoc NamespaceDetails::_alloc(const char *ns, int len) {
- if ( !capped )
- return __stdAlloc(len, false);
-
- return cappedAlloc(ns,len);
- }
-
- void NamespaceIndex::kill_ns(const char *ns) {
- Lock::assertWriteLocked(ns);
- if ( !ht )
- return;
- Namespace n(ns);
- ht->kill(n);
-
- for( int i = 0; i<=1; i++ ) {
- try {
- Namespace extra(n.extraName(i).c_str());
- ht->kill(extra);
- }
- catch(DBException&) {
- dlog(3) << "caught exception in kill_ns" << endl;
- }
- }
- }
-
- void NamespaceIndex::add_ns(const char *ns, DiskLoc& loc, bool capped) {
- NamespaceDetails details( loc, capped );
- add_ns( ns, details );
- }
- void NamespaceIndex::add_ns( const char *ns, const NamespaceDetails &details ) {
- Lock::assertWriteLocked(ns);
- init();
- Namespace n(ns);
- uassert( 10081 , "too many namespaces/collections", ht->put(n, details));
- }
-
- /* extra space for indexes when more than 10 */
- NamespaceDetails::Extra* NamespaceIndex::newExtra(const char *ns, int i, NamespaceDetails *d) {
- Lock::assertWriteLocked(ns);
- assert( i >= 0 && i <= 1 );
- Namespace n(ns);
- Namespace extra(n.extraName(i).c_str()); // throws userexception if ns name too long
-
- massert( 10350 , "allocExtra: base ns missing?", d );
- massert( 10351 , "allocExtra: extra already exists", ht->get(extra) == 0 );
-
- NamespaceDetails::Extra temp;
- temp.init();
- uassert( 10082 , "allocExtra: too many namespaces/collections", ht->put(extra, (NamespaceDetails&) temp));
- NamespaceDetails::Extra *e = (NamespaceDetails::Extra *) ht->get(extra);
- return e;
- }
- NamespaceDetails::Extra* NamespaceDetails::allocExtra(const char *ns, int nindexessofar) {
- NamespaceIndex *ni = nsindex(ns);
- int i = (nindexessofar - NIndexesBase) / NIndexesExtra;
- Extra *e = ni->newExtra(ns, i, this);
- long ofs = e->ofsFrom(this);
- if( i == 0 ) {
- assert( extraOffset == 0 );
- *getDur().writing(&extraOffset) = ofs;
- assert( extra() == e );
- }
- else {
- Extra *hd = extra();
- assert( hd->next(this) == 0 );
- hd->setNext(ofs);
- }
- return e;
- }
-
- /* you MUST call when adding an index. see pdfile.cpp */
- IndexDetails& NamespaceDetails::addIndex(const char *thisns, bool resetTransient) {
- IndexDetails *id;
- try {
- id = &idx(nIndexes,true);
- }
- catch(DBException&) {
- allocExtra(thisns, nIndexes);
- id = &idx(nIndexes,false);
- }
-
- (*getDur().writing(&nIndexes))++;
- if ( resetTransient )
- NamespaceDetailsTransient::get(thisns).addedIndex();
- return *id;
- }
-
- // must be called when renaming a NS to fix up extra
- void NamespaceDetails::copyingFrom(const char *thisns, NamespaceDetails *src) {
- extraOffset = 0; // we are a copy -- the old value is wrong. fixing it up below.
- Extra *se = src->extra();
- int n = NIndexesBase;
- if( se ) {
- Extra *e = allocExtra(thisns, n);
- while( 1 ) {
- n += NIndexesExtra;
- e->copy(this, *se);
- se = se->next(src);
- if( se == 0 ) break;
- Extra *nxt = allocExtra(thisns, n);
- e->setNext( nxt->ofsFrom(this) );
- e = nxt;
- }
- assert( extraOffset );
- }
- }
-
- /* returns index of the first index in which the field is present. -1 if not present.
- (aug08 - this method not currently used)
- */
- int NamespaceDetails::fieldIsIndexed(const char *fieldName) {
- massert( 10346 , "not implemented", false);
- /*
- for ( int i = 0; i < nIndexes; i++ ) {
- IndexDetails& idx = indexes[i];
- BSONObj idxKey = idx.info.obj().getObjectField("key"); // e.g., { ts : -1 }
- if ( !idxKey.getField(fieldName).eoo() )
- return i;
- }*/
- return -1;
- }
-
- long long NamespaceDetails::storageSize( int * numExtents , BSONArrayBuilder * extentInfo ) const {
- Extent * e = firstExtent.ext();
- assert( e );
-
- long long total = 0;
- int n = 0;
- while ( e ) {
- total += e->length;
- n++;
-
- if ( extentInfo ) {
- extentInfo->append( BSON( "len" << e->length << "loc: " << e->myLoc.toBSONObj() ) );
- }
-
- e = e->getNextExtent();
- }
-
- if ( numExtents )
- *numExtents = n;
-
- return total;
- }
-
- NamespaceDetails *NamespaceDetails::writingWithExtra() {
- vector< pair< long long, unsigned > > writeRanges;
- writeRanges.push_back( make_pair( 0, sizeof( NamespaceDetails ) ) );
- for( Extra *e = extra(); e; e = e->next( this ) ) {
- writeRanges.push_back( make_pair( (char*)e - (char*)this, sizeof( Extra ) ) );
- }
- return reinterpret_cast< NamespaceDetails* >( getDur().writingRangesAtOffsets( this, writeRanges ) );
- }
-
- /* ------------------------------------------------------------------------- */
-
- SimpleMutex NamespaceDetailsTransient::_qcMutex("qc");
- SimpleMutex NamespaceDetailsTransient::_isMutex("is");
- map< string, shared_ptr< NamespaceDetailsTransient > > NamespaceDetailsTransient::_nsdMap;
- typedef map< string, shared_ptr< NamespaceDetailsTransient > >::iterator ouriter;
-
- void NamespaceDetailsTransient::reset() {
- Lock::assertWriteLocked(_ns);
- clearQueryCache();
- _keysComputed = false;
- _indexSpecs.clear();
- }
-
- /*static*/ NOINLINE_DECL NamespaceDetailsTransient& NamespaceDetailsTransient::make_inlock(const char *ns) {
- shared_ptr< NamespaceDetailsTransient > &t = _nsdMap[ ns ];
- assert( t.get() == 0 );
- Database *database = cc().database();
- assert( database );
- if( _nsdMap.size() % 20000 == 10000 ) {
- // so we notice if insanely large #s
- log() << "opening namespace " << ns << endl;
- log() << _nsdMap.size() << " namespaces in nsdMap" << endl;
- }
- t.reset( new NamespaceDetailsTransient(database, ns) );
- return *t;
- }
-
- // note with repair there could be two databases with the same ns name.
- // that is NOT handled here yet! TODO
- // repair may not use nsdt though not sure. anyway, requires work.
- NamespaceDetailsTransient::NamespaceDetailsTransient(Database *db, const char *ns) :
- _ns(ns), _keysComputed(false), _qcWriteCount()
- {
- dassert(db);
- }
-
- NamespaceDetailsTransient::~NamespaceDetailsTransient() {
- }
-
- void NamespaceDetailsTransient::clearForPrefix(const char *prefix) {
- SimpleMutex::scoped_lock lk(_qcMutex);
- vector< string > found;
- for( ouriter i = _nsdMap.begin(); i != _nsdMap.end(); ++i ) {
- if ( strncmp( i->first.c_str(), prefix, strlen( prefix ) ) == 0 ) {
- found.push_back( i->first );
- Lock::assertWriteLocked(i->first);
- }
- }
- for( vector< string >::iterator i = found.begin(); i != found.end(); ++i ) {
- _nsdMap[ *i ].reset();
- }
- }
-
- void NamespaceDetailsTransient::eraseForPrefix(const char *prefix) {
- SimpleMutex::scoped_lock lk(_qcMutex);
- vector< string > found;
- for( ouriter i = _nsdMap.begin(); i != _nsdMap.end(); ++i ) {
- if ( strncmp( i->first.c_str(), prefix, strlen( prefix ) ) == 0 ) {
- found.push_back( i->first );
- Lock::assertWriteLocked(i->first);
- }
- }
- for( vector< string >::iterator i = found.begin(); i != found.end(); ++i ) {
- _nsdMap.erase(*i);
- }
- }
-
- void NamespaceDetailsTransient::computeIndexKeys() {
- _keysComputed = true;
- _indexKeys.clear();
- NamespaceDetails *d = nsdetails(_ns.c_str());
- if ( ! d )
- return;
- NamespaceDetails::IndexIterator i = d->ii();
- while( i.more() )
- i.next().keyPattern().getFieldNames(_indexKeys);
- }
-
-
- /* ------------------------------------------------------------------------- */
-
- /* add a new namespace to the system catalog (<dbname>.system.namespaces).
- options: { capped : ..., size : ... }
- */
- void addNewNamespaceToCatalog(const char *ns, const BSONObj *options = 0) {
- LOG(1) << "New namespace: " << ns << endl;
- if ( strstr(ns, "system.namespaces") ) {
- // system.namespaces holds all the others, so it is not explicitly listed in the catalog.
- // TODO: fix above should not be strstr!
- return;
- }
-
- BSONObjBuilder b;
- b.append("name", ns);
- if ( options )
- b.append("options", *options);
- BSONObj j = b.done();
- char database[256];
- nsToDatabase(ns, database);
- string s = string(database) + ".system.namespaces";
- theDataFileMgr.insert(s.c_str(), j.objdata(), j.objsize(), true);
- }
-
- void renameNamespace( const char *from, const char *to, bool stayTemp) {
- NamespaceIndex *ni = nsindex( from );
- assert( ni );
- assert( ni->details( from ) );
- assert( ! ni->details( to ) );
-
- // Our namespace and index details will move to a different
- // memory location. The only references to namespace and
- // index details across commands are in cursors and nsd
- // transient (including query cache) so clear these.
- ClientCursor::invalidate( from );
- NamespaceDetailsTransient::eraseForPrefix( from );
-
- NamespaceDetails *details = ni->details( from );
- ni->add_ns( to, *details );
- NamespaceDetails *todetails = ni->details( to );
- try {
- todetails->copyingFrom(to, details); // fixes extraOffset
- }
- catch( DBException& ) {
- // could end up here if .ns is full - if so try to clean up / roll back a little
- ni->kill_ns(to);
- throw;
- }
- ni->kill_ns( from );
- details = todetails;
-
- BSONObj oldSpec;
- char database[MaxDatabaseNameLen];
- nsToDatabase(from, database);
- string s = database;
- s += ".system.namespaces";
- assert( Helpers::findOne( s.c_str(), BSON( "name" << from ), oldSpec ) );
-
- BSONObjBuilder newSpecB;
- BSONObjIterator i( oldSpec.getObjectField( "options" ) );
- while( i.more() ) {
- BSONElement e = i.next();
- if ( strcmp( e.fieldName(), "create" ) != 0 ) {
- if (stayTemp || (strcmp(e.fieldName(), "temp") != 0))
- newSpecB.append( e );
- }
- else {
- newSpecB << "create" << to;
- }
- }
- BSONObj newSpec = newSpecB.done();
- addNewNamespaceToCatalog( to, newSpec.isEmpty() ? 0 : &newSpec );
-
- deleteObjects( s.c_str(), BSON( "name" << from ), false, false, true );
- // oldSpec variable no longer valid memory
-
- BSONObj oldIndexSpec;
- s = database;
- s += ".system.indexes";
- while( Helpers::findOne( s.c_str(), BSON( "ns" << from ), oldIndexSpec ) ) {
- BSONObjBuilder newIndexSpecB;
- BSONObjIterator i( oldIndexSpec );
- while( i.more() ) {
- BSONElement e = i.next();
- if ( strcmp( e.fieldName(), "ns" ) != 0 )
- newIndexSpecB.append( e );
- else
- newIndexSpecB << "ns" << to;
- }
- BSONObj newIndexSpec = newIndexSpecB.done();
- DiskLoc newIndexSpecLoc = theDataFileMgr.insert( s.c_str(), newIndexSpec.objdata(), newIndexSpec.objsize(), true, false );
- int indexI = details->findIndexByName( oldIndexSpec.getStringField( "name" ) );
- IndexDetails &indexDetails = details->idx(indexI);
- string oldIndexNs = indexDetails.indexNamespace();
- indexDetails.info = newIndexSpecLoc;
- string newIndexNs = indexDetails.indexNamespace();
-
- renameIndexNamespace( oldIndexNs.c_str(), newIndexNs.c_str() );
- deleteObjects( s.c_str(), oldIndexSpec.getOwned(), true, false, true );
- }
- }
-
- bool legalClientSystemNS( const string& ns , bool write ) {
- if( ns == "local.system.replset" ) return true;
-
- if ( ns.find( ".system.users" ) != string::npos )
- return true;
-
- if ( ns.find( ".system.js" ) != string::npos ) {
- if ( write )
- Scope::storedFuncMod();
- return true;
- }
-
- return false;
- }
+namespace mongo {
+namespace {
+BOOST_STATIC_ASSERT( sizeof(Namespace) == 128 );
+BOOST_STATIC_ASSERT( Namespace::MaxNsLen == MaxDatabaseNameLen );
+} // namespace
+} // namespace mongo
-} // namespace mongo
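The deleted-record bucketing that leaves namespace.cpp here is easy to restate; the
standalone sketch below (not part of this patch) mirrors the bucketSizes table
removed above and the bucket() lookup removed from namespace.h below, where
bucket(n) picks the first bucket whose nominal size exceeds n:

    #include <cassert>

    const int Buckets = 19;
    int bucketSizes[Buckets] = {
        32, 64, 128, 256, 0x200, 0x400, 0x800, 0x1000, 0x2000, 0x4000,
        0x8000, 0x10000, 0x20000, 0x40000, 0x80000, 0x100000, 0x200000,
        0x400000, 0x800000
    };

    int bucket( int n ) {
        for ( int i = 0; i < Buckets; i++ )
            if ( bucketSizes[i] > n )
                return i;
        return Buckets - 1;
    }

    int main() {
        assert( bucket( 100 ) == 2 ); // 128 is the first size greater than 100
        assert( bucket( 32 ) == 1 );  // a record exactly at a bucket size moves up
        return 0;
    }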
diff --git a/src/mongo/db/namespace.h b/src/mongo/db/namespace.h
index 0e2042940c8..b0907a58acc 100644
--- a/src/mongo/db/namespace.h
+++ b/src/mongo/db/namespace.h
@@ -18,25 +18,14 @@
#pragma once
-#include "../pch.h"
-#include "namespacestring.h"
-#include "jsobj.h"
-#include "querypattern.h"
-#include "diskloc.h"
-#include "../util/hashtab.h"
-#include "mongommf.h"
-#include "d_concurrency.h"
-#include "queryoptimizer.h"
-#include "queryoptimizercursor.h"
+#include "mongo/pch.h"
-namespace mongo {
+#include <cstring>
+#include <string>
- class Database;
+namespace mongo {
#pragma pack(1)
- /* This helper class is used to make the HashMap below in NamespaceIndex e.g. see line:
- HashTable<Namespace,NamespaceDetails> *ht;
- */
class Namespace {
public:
explicit Namespace(const char *ns) { *this = ns; }
@@ -50,8 +39,8 @@ namespace mongo {
size_t size() const { return strlen( buf ); }
- string toString() const { return (string) buf; }
- operator string() const { return (string) buf; }
+ string toString() const { return buf; }
+ operator string() const { return buf; }
/* NamespaceDetails::Extra was added after fact to allow chaining of data blocks to support more than 10 indexes
(more than 10 IndexDetails). It's a bit hacky because of this late addition with backward
@@ -70,585 +59,4 @@ namespace mongo {
};
#pragma pack()
- BOOST_STATIC_ASSERT( Namespace::MaxNsLen == MaxDatabaseNameLen );
-
-} // namespace mongo
-
-#include "index.h"
-
-namespace mongo {
-
- /** @return true if a client can modify this namespace even though it is under ".system."
- For example <dbname>.system.users is ok for regular clients to update.
- @param write used when .system.js
- */
- bool legalClientSystemNS( const string& ns , bool write );
-
- /* deleted lists -- linked lists of deleted records -- are placed in 'buckets' of various sizes
- so you can look for a deleterecord about the right size.
- */
- const int Buckets = 19;
- const int MaxBucket = 18;
-
- extern int bucketSizes[];
-
-#pragma pack(1)
- /* NamespaceDetails : this is the "header" for a collection that has all its details.
- It's in the .ns file and this is a memory mapped region (thus the pack pragma above).
- */
- class NamespaceDetails {
- public:
- enum { NIndexesMax = 64, NIndexesExtra = 30, NIndexesBase = 10 };
-
- /*-------- data fields, as present on disk : */
- DiskLoc firstExtent;
- DiskLoc lastExtent;
- /* NOTE: capped collections v1 override the meaning of deletedList.
- deletedList[0] points to a list of free records (DeletedRecord's) for all extents in
- the capped namespace.
- deletedList[1] points to the last record in the prev extent. When the "current extent"
- changes, this value is updated. !deletedList[1].isValid() when this value is not
- yet computed.
- */
- DiskLoc deletedList[Buckets];
- // ofs 168 (8 byte aligned)
- struct Stats {
- // datasize and nrecords MUST Be adjacent code assumes!
- long long datasize; // this includes padding, but not record headers
- long long nrecords;
- } stats;
- int lastExtentSize;
- int nIndexes;
- private:
- // ofs 192
- IndexDetails _indexes[NIndexesBase];
- public:
- // ofs 352 (16 byte aligned)
- int capped;
- int max; // max # of objects for a capped table. TODO: should this be 64 bit?
- double paddingFactor; // 1.0 = no padding.
- // ofs 386 (16)
- int flags;
- DiskLoc capExtent;
- DiskLoc capFirstNewRecord;
- unsigned short dataFileVersion; // NamespaceDetails version. So we can do backward compatibility in the future. See filever.h
- unsigned short indexFileVersion;
- unsigned long long multiKeyIndexBits;
- private:
- // ofs 400 (16)
- unsigned long long reservedA;
- long long extraOffset; // where the $extra info is located (bytes relative to this)
- public:
- int indexBuildInProgress; // 1 if in prog
- unsigned reservedB;
- // ofs 424 (8)
- struct Capped2 {
- unsigned long long cc2_ptr; // see capped.cpp
- unsigned fileNumber;
- } capped2;
- char reserved[60];
- /*-------- end data 496 bytes */
-
- explicit NamespaceDetails( const DiskLoc &loc, bool _capped );
-
- class Extra {
- long long _next;
- public:
- IndexDetails details[NIndexesExtra];
- private:
- unsigned reserved2;
- unsigned reserved3;
- Extra(const Extra&) { assert(false); }
- Extra& operator=(const Extra& r) { assert(false); return *this; }
- public:
- Extra() { }
- long ofsFrom(NamespaceDetails *d) {
- return ((char *) this) - ((char *) d);
- }
- void init() { memset(this, 0, sizeof(Extra)); }
- Extra* next(NamespaceDetails *d) {
- if( _next == 0 ) return 0;
- return (Extra*) (((char *) d) + _next);
- }
- void setNext(long ofs) { *getDur().writing(&_next) = ofs; }
- void copy(NamespaceDetails *d, const Extra& e) {
- memcpy(this, &e, sizeof(Extra));
- _next = 0;
- }
- };
- Extra* extra() {
- if( extraOffset == 0 ) return 0;
- return (Extra *) (((char *) this) + extraOffset);
- }
- /* add extra space for indexes when more than 10 */
- Extra* allocExtra(const char *ns, int nindexessofar);
- void copyingFrom(const char *thisns, NamespaceDetails *src); // must be called when renaming a NS to fix up extra
-
- /* called when loaded from disk */
- void onLoad(const Namespace& k);
-
- /* dump info on this namespace. for debugging. */
- void dump(const Namespace& k);
-
- /* dump info on all extents for this namespace. for debugging. */
- void dumpExtents();
-
- private:
- Extent *theCapExtent() const { return capExtent.ext(); }
- void advanceCapExtent( const char *ns );
- DiskLoc __capAlloc(int len);
- DiskLoc cappedAlloc(const char *ns, int len);
- DiskLoc &cappedFirstDeletedInCurExtent();
- bool nextIsInCapExtent( const DiskLoc &dl ) const;
-
- public:
- DiskLoc& cappedListOfAllDeletedRecords() { return deletedList[0]; }
- DiskLoc& cappedLastDelRecLastExtent() { return deletedList[1]; }
- void cappedDumpDelInfo();
- bool capLooped() const { return capped && capFirstNewRecord.isValid(); }
- bool inCapExtent( const DiskLoc &dl ) const;
- void cappedCheckMigrate();
- /**
- * Truncate documents newer than the document at 'end' from the capped
- * collection. The collection cannot be completely emptied using this
- * function. An assertion will be thrown if that is attempted.
- * @param inclusive - Truncate 'end' as well iff true
- */
- void cappedTruncateAfter(const char *ns, DiskLoc end, bool inclusive);
- /** Remove all documents from the capped collection */
- void emptyCappedCollection(const char *ns);
-
- /* when a background index build is in progress, we don't count the index in nIndexes until
- complete, yet need to still use it in _indexRecord() - thus we use this function for that.
- */
- int nIndexesBeingBuilt() const { return nIndexes + indexBuildInProgress; }
-
- /* NOTE: be careful with flags. are we manipulating them in read locks? if so,
- this isn't thread safe. TODO
- */
- enum NamespaceFlags {
- Flag_HaveIdIndex = 1 << 0 // set when we have _id index (ONLY if ensureIdIndex was called -- 0 if that has never been called)
- };
-
- IndexDetails& idx(int idxNo, bool missingExpected = false );
-
- /** get the IndexDetails for the index currently being built in the background. (there is at most one) */
- IndexDetails& inProgIdx() {
- DEV assert(indexBuildInProgress);
- return idx(nIndexes);
- }
-
- class IndexIterator {
- public:
- int pos() { return i; } // note this is the next one to come
- bool more() { return i < n; }
- IndexDetails& next() { return d->idx(i++); }
- private:
- friend class NamespaceDetails;
- int i, n;
- NamespaceDetails *d;
- IndexIterator(NamespaceDetails *_d);
- };
-
- IndexIterator ii() { return IndexIterator(this); }
-
- /* hackish - find our index # in the indexes array */
- int idxNo(IndexDetails& idx);
-
- /* multikey indexes are indexes where there are more than one key in the index
- for a single document. see multikey in wiki.
- for these, we have to do some dedup work on queries.
- */
- bool isMultikey(int i) const { return (multiKeyIndexBits & (((unsigned long long) 1) << i)) != 0; }
- void setIndexIsMultikey(int i) {
- dassert( i < NIndexesMax );
- unsigned long long x = ((unsigned long long) 1) << i;
- if( multiKeyIndexBits & x ) return;
- *getDur().writing(&multiKeyIndexBits) |= x;
- }
- void clearIndexIsMultikey(int i) {
- dassert( i < NIndexesMax );
- unsigned long long x = ((unsigned long long) 1) << i;
- if( (multiKeyIndexBits & x) == 0 ) return;
- *getDur().writing(&multiKeyIndexBits) &= ~x;
- }
-
- /* add a new index. does not add to system.indexes etc. - just to NamespaceDetails.
- caller must populate returned object.
- */
- IndexDetails& addIndex(const char *thisns, bool resetTransient=true);
-
- void aboutToDeleteAnIndex() {
- *getDur().writing(&flags) = flags & ~Flag_HaveIdIndex;
- }
-
- /* returns index of the first index in which the field is present. -1 if not present. */
- int fieldIsIndexed(const char *fieldName);
-
- /* called to indicate that an update fit in place.
- fits also called on an insert -- idea there is that if you had some mix and then went to
- pure inserts it would adapt and PF would trend to 1.0. note update calls insert on a move
- so there is a double count there that must be adjusted for below.
-
- todo: greater sophistication could be helpful and added later. for example the absolute
- size of documents might be considered -- in some cases smaller ones are more likely
- to grow than larger ones in the same collection? (not always)
- */
- void paddingFits() {
- MONGO_SOMETIMES(sometimes, 4) { // do this on a sampled basis to journal less
- double x = paddingFactor - 0.001;
- if ( x >= 1.0 ) {
- *getDur().writing(&paddingFactor) = x;
- }
- }
- }
- void paddingTooSmall() {
- MONGO_SOMETIMES(sometimes, 4) { // do this on a sampled basis to journal less
- /* the more indexes we have, the higher the cost of a move. so we take that into
- account herein. note on a move that insert() calls paddingFits(), thus
- here for example with no inserts and nIndexes = 1 we have
- .001*4-.001 or a 3:1 ratio to non moves -> 75% nonmoves. insert heavy
- can pushes this down considerably. further tweaking will be a good idea but
- this should be an adequate starting point.
- */
- double N = min(nIndexes,7) + 3;
- double x = paddingFactor + (0.001 * N);
- if ( x <= 2.0 ) {
- *getDur().writing(&paddingFactor) = x;
- }
- }
- }
-
- // @return offset in indexes[]
- int findIndexByName(const char *name);
-
- // @return offset in indexes[]
- int findIndexByKeyPattern(const BSONObj& keyPattern);
-
- void findIndexByType( const string& name , vector<int>& matches ) {
- IndexIterator i = ii();
- while ( i.more() ) {
- if ( i.next().getSpec().getTypeName() == name )
- matches.push_back( i.pos() - 1 );
- }
- }
-
- /* @return -1 = not found
- generally id is first index, so not that expensive an operation (assuming present).
- */
- int findIdIndex() {
- IndexIterator i = ii();
- while( i.more() ) {
- if( i.next().isIdIndex() )
- return i.pos()-1;
- }
- return -1;
- }
-
- bool haveIdIndex() {
- return (flags & NamespaceDetails::Flag_HaveIdIndex) || findIdIndex() >= 0;
- }
-
- /* return which "deleted bucket" for this size object */
- static int bucket(int n) {
- for ( int i = 0; i < Buckets; i++ )
- if ( bucketSizes[i] > n )
- return i;
- return Buckets-1;
- }
-
- /* predetermine location of the next alloc without actually doing it.
- if cannot predetermine returns null (so still call alloc() then)
- */
- DiskLoc allocWillBeAt(const char *ns, int lenToAlloc);
-
- /* allocate a new record. lenToAlloc includes headers. */
- DiskLoc alloc(const char *ns, int lenToAlloc, DiskLoc& extentLoc);
-
- /* add a given record to the deleted chains for this NS */
- void addDeletedRec(DeletedRecord *d, DiskLoc dloc);
- void dumpDeleted(set<DiskLoc> *extents = 0);
- // Start from firstExtent by default.
- DiskLoc firstRecord( const DiskLoc &startExtent = DiskLoc() ) const;
- // Start from lastExtent by default.
- DiskLoc lastRecord( const DiskLoc &startExtent = DiskLoc() ) const;
- long long storageSize( int * numExtents = 0 , BSONArrayBuilder * extentInfo = 0 ) const;
-
- int averageObjectSize() {
- if ( stats.nrecords == 0 )
- return 5;
- return (int) (stats.datasize / stats.nrecords);
- }
-
- NamespaceDetails *writingWithoutExtra() {
- return ( NamespaceDetails* ) getDur().writingPtr( this, sizeof( NamespaceDetails ) );
- }
- /** Make all linked Extra objects writeable as well */
- NamespaceDetails *writingWithExtra();
-
- private:
- DiskLoc _alloc(const char *ns, int len);
- void maybeComplain( const char *ns, int len ) const;
- DiskLoc __stdAlloc(int len, bool willBeAt);
- void compact(); // combine adjacent deleted records
- friend class NamespaceIndex;
- struct ExtraOld {
- // note we could use this field for more chaining later, so don't waste it:
- unsigned long long reserved1;
- IndexDetails details[NIndexesExtra];
- unsigned reserved2;
- unsigned reserved3;
- };
- /** Update cappedLastDelRecLastExtent() after capExtent changed in cappedTruncateAfter() */
- void cappedTruncateLastDelUpdate();
- BOOST_STATIC_ASSERT( NIndexesMax <= NIndexesBase + NIndexesExtra*2 );
- BOOST_STATIC_ASSERT( NIndexesMax <= 64 ); // multiKey bits
- BOOST_STATIC_ASSERT( sizeof(NamespaceDetails::ExtraOld) == 496 );
- BOOST_STATIC_ASSERT( sizeof(NamespaceDetails::Extra) == 496 );
- }; // NamespaceDetails
-#pragma pack()
-
- /* NamespaceDetailsTransient
-
- these are things we know / compute about a namespace that are transient -- things
- we don't actually store in the .ns file. so mainly caching of frequently used
- information.
-
- CAUTION: Are you maintaining this properly on a collection drop()? A dropdatabase()? Be careful.
- The current field "allIndexKeys" may have too many keys in it on such an occurrence;
- as currently used that does not cause anything terrible to happen.
-
- todo: cleanup code, need abstractions and separation
- */
- // todo: multiple db's with the same name (repairDatbase) is not handled herein. that may be
- // the way to go, if not used by repair, but need some sort of enforcement / asserts.
- class NamespaceDetailsTransient : boost::noncopyable {
- BOOST_STATIC_ASSERT( sizeof(NamespaceDetails) == 496 );
-
- //Database *database;
- const string _ns;
- void reset();
- static std::map< string, shared_ptr< NamespaceDetailsTransient > > _nsdMap;
-
- NamespaceDetailsTransient(Database*,const char *ns);
- public:
- ~NamespaceDetailsTransient();
- void addedIndex() { reset(); }
- void deletedIndex() { reset(); }
- /* Drop cached information on all namespaces beginning with the specified prefix.
- Can be useful as index namespaces share the same start as the regular collection.
- SLOW - sequential scan of all NamespaceDetailsTransient objects */
- static void clearForPrefix(const char *prefix);
- static void eraseForPrefix(const char *prefix);
-
- /**
- * @return a cursor interface to the query optimizer. The implementation may utilize a
- * single query plan or interleave results from multiple query plans before settling on a
- * single query plan. Note that the schema of currKey() documents, indexKeyPattern(), the
- * matcher(), and the isMultiKey() nature of the cursor may change over the course of
- * iteration.
- *
- * @param query - Query used to select indexes and populate matchers; not copied if unowned
- * (see bsonobj.h).
- *
- * @param order - Required ordering spec for documents produced by this cursor, empty object
- * default indicates no order requirement. If no index exists that satisfies the required
- * sort order, an empty shared_ptr is returned unless parsedQuery is also provided. This is
- * not copied if unowned.
- *
- * @param planPolicy - A policy for selecting query plans - see queryoptimizercursor.h
- *
- * @param simpleEqualityMatch - Set to true for certain simple queries - see
- * queryoptimizer.cpp.
- *
- * @param parsedQuery - Additional query parameters, as from a client query request. If
- * specified, the resulting cursor may return results from out of order plans. See
- * queryoptimizercursor.h for information on handling these results.
- *
- * @param singlePlanSummary - Query plan summary information that may be provided when a
- * cursor running a single plan is returned.
- *
- * The returned cursor may @throw inside of advance() or recoverFromYield() in certain error
- * cases, for example if a capped overrun occurred during a yield. This indicates that the
- * cursor was unable to perform a complete scan.
- *
- * This is a work in progress. Partial list of features not yet implemented through this
- * interface:
- *
- * - covered indexes
- * - in memory sorting
- */
- static shared_ptr<Cursor> getCursor( const char *ns, const BSONObj &query,
- const BSONObj &order = BSONObj(),
- const QueryPlanSelectionPolicy &planPolicy =
- QueryPlanSelectionPolicy::any(),
- bool *simpleEqualityMatch = 0,
- const ParsedQuery *parsedQuery = 0,
- QueryPlan::Summary *singlePlanSummary = 0 );
-
- /**
- * @return a single cursor that may work well for the given query. A $or style query will
- * produce a single cursor, not a MultiCursor.
- * It is possible no cursor is returned if the sort is not supported by an index. Clients are responsible
- * for checking this if they are not sure an index for a sort exists, and defaulting to a non-sort if
- * no suitable indices exist.
- */
- static shared_ptr<Cursor> bestGuessCursor( const char *ns, const BSONObj &query, const BSONObj &sort );
-
- /* indexKeys() cache ---------------------------------------------------- */
- /* assumed to be in write lock for this */
- private:
- bool _keysComputed;
- set<string> _indexKeys;
- void computeIndexKeys();
- public:
- /* get set of index keys for this namespace. handy to quickly check if a given
- field is indexed (Note it might be a secondary component of a compound index.)
- */
- set<string>& indexKeys() {
- DEV Lock::assertWriteLocked(_ns);
- if ( !_keysComputed )
- computeIndexKeys();
- return _indexKeys;
- }
-
- /* IndexSpec caching */
- private:
- map<const IndexDetails*,IndexSpec> _indexSpecs;
- static SimpleMutex _isMutex;
- public:
- const IndexSpec& getIndexSpec( const IndexDetails * details ) {
- IndexSpec& spec = _indexSpecs[details];
- if ( ! spec._finishedInit ) {
- SimpleMutex::scoped_lock lk(_isMutex);
- if ( ! spec._finishedInit ) {
- spec.reset( details );
- assert( spec._finishedInit );
- }
- }
- return spec;
- }
-
- /* query cache (for query optimizer) ------------------------------------- */
- private:
- int _qcWriteCount;
- map< QueryPattern, pair< BSONObj, long long > > _qcCache;
- static NamespaceDetailsTransient& make_inlock(const char *ns);
- public:
- static SimpleMutex _qcMutex;
-
- /* you must be in the qcMutex when calling this.
- A NamespaceDetailsTransient object will not go out of scope on you if you are
- d.dbMutex.atLeastReadLocked(), so you do't have to stay locked.
- Creates a NamespaceDetailsTransient before returning if one DNE.
- todo: avoid creating too many on erroneous ns queries.
- */
- static NamespaceDetailsTransient& get_inlock(const char *ns);
-
- static NamespaceDetailsTransient& get(const char *ns) {
- // todo : _qcMutex will create bottlenecks in our parallelism
- SimpleMutex::scoped_lock lk(_qcMutex);
- return get_inlock(ns);
- }
-
- void clearQueryCache() { // public for unit tests
- _qcCache.clear();
- _qcWriteCount = 0;
- }
- /* you must notify the cache if you are doing writes, as query plan optimality will change */
- void notifyOfWriteOp() {
- if ( _qcCache.empty() )
- return;
- if ( ++_qcWriteCount >= 100 )
- clearQueryCache();
- }
- BSONObj indexForPattern( const QueryPattern &pattern ) {
- return _qcCache[ pattern ].first;
- }
- long long nScannedForPattern( const QueryPattern &pattern ) {
- return _qcCache[ pattern ].second;
- }
- void registerIndexForPattern( const QueryPattern &pattern, const BSONObj &indexKey, long long nScanned ) {
- _qcCache[ pattern ] = make_pair( indexKey, nScanned );
- }
-
- }; /* NamespaceDetailsTransient */
-
- inline NamespaceDetailsTransient& NamespaceDetailsTransient::get_inlock(const char *ns) {
- std::map< string, shared_ptr< NamespaceDetailsTransient > >::iterator i = _nsdMap.find(ns);
- if( i != _nsdMap.end() &&
- i->second.get() ) { // could be null ptr from clearForPrefix
- return *i->second;
- }
- return make_inlock(ns);
- }
-
- /* NamespaceIndex is the ".ns" file you see in the data directory. It is the "system catalog"
- if you will: at least the core parts. (Additional info in system.* collections.)
- */
- class NamespaceIndex {
- public:
- NamespaceIndex(const string &dir, const string &database) :
- ht( 0 ), dir_( dir ), database_( database ) {}
-
- /* returns true if new db will be created if we init lazily */
- bool exists() const;
-
- void init() {
- if( !ht )
- _init();
- }
-
- void add_ns(const char *ns, DiskLoc& loc, bool capped);
- void add_ns( const char *ns, const NamespaceDetails &details );
-
- NamespaceDetails* details(const char *ns) {
- if ( !ht )
- return 0;
- Namespace n(ns);
- NamespaceDetails *d = ht->get(n);
- if ( d && d->capped )
- d->cappedCheckMigrate();
- return d;
- }
-
- void kill_ns(const char *ns);
-
- bool find(const char *ns, DiskLoc& loc) {
- NamespaceDetails *l = details(ns);
- if ( l ) {
- loc = l->firstExtent;
- return true;
- }
- return false;
- }
-
- bool allocated() const { return ht != 0; }
-
- void getNamespaces( list<string>& tofill , bool onlyCollections = true ) const;
-
- NamespaceDetails::Extra* newExtra(const char *ns, int n, NamespaceDetails *d);
-
- boost::filesystem::path path() const;
-
- unsigned long long fileLength() const { return f.length(); }
-
- private:
- void _init();
- void maybeMkdir() const;
-
- MongoMMF f;
- HashTable<Namespace,NamespaceDetails> *ht;
- string dir_;
- string database_;
- };
-
- extern string dbpath; // --dbpath parm
- extern bool directoryperdb;
-
- // Rename a namespace within current 'client' db.
- // (Arguments should include db name)
- void renameNamespace( const char *from, const char *to, bool stayTemp);
-
-
} // namespace mongo
diff --git a/src/mongo/db/namespace_details-inl.h b/src/mongo/db/namespace_details-inl.h
new file mode 100644
index 00000000000..96f85e13a13
--- /dev/null
+++ b/src/mongo/db/namespace_details-inl.h
@@ -0,0 +1,84 @@
+// @file namespace_details-inl.h
+
+/**
+* Copyright (C) 2009 10gen Inc.
+*
+* This program is free software: you can redistribute it and/or modify
+* it under the terms of the GNU Affero General Public License, version 3,
+* as published by the Free Software Foundation.
+*
+* This program is distributed in the hope that it will be useful,
+* but WITHOUT ANY WARRANTY; without even the implied warranty of
+* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+* GNU Affero General Public License for more details.
+*
+* You should have received a copy of the GNU Affero General Public License
+* along with this program. If not, see <http://www.gnu.org/licenses/>.
+*/
+
+#pragma once
+
+#include "mongo/db/namespace_details.h"
+
+namespace mongo {
+
+ inline IndexDetails& NamespaceDetails::idx(int idxNo, bool missingExpected ) {
+ if( idxNo < NIndexesBase ) {
+ IndexDetails& id = _indexes[idxNo];
+ return id;
+ }
+ Extra *e = extra();
+ if ( ! e ) {
+ if ( missingExpected )
+ throw MsgAssertionException( 13283 , "Missing Extra" );
+ massert(14045, "missing Extra", e);
+ }
+ int i = idxNo - NIndexesBase;
+ if( i >= NIndexesExtra ) {
+ e = e->next(this);
+ if ( ! e ) {
+ if ( missingExpected )
+ throw MsgAssertionException( 14823 , "missing extra" );
+ massert(14824, "missing Extra", e);
+ }
+ i -= NIndexesExtra;
+ }
+ return e->details[i];
+ }
+
+ inline int NamespaceDetails::idxNo(IndexDetails& idx) {
+ IndexIterator i = ii();
+ while( i.more() ) {
+ if( &i.next() == &idx )
+ return i.pos()-1;
+ }
+ massert( 10349 , "E12000 idxNo fails", false);
+ return -1;
+ }
+
+ inline int NamespaceDetails::findIndexByKeyPattern(const BSONObj& keyPattern) {
+ IndexIterator i = ii();
+ while( i.more() ) {
+ if( i.next().keyPattern() == keyPattern )
+ return i.pos()-1;
+ }
+ return -1;
+ }
+
+ // @return offset in indexes[]
+ inline int NamespaceDetails::findIndexByName(const char *name) {
+ IndexIterator i = ii();
+ while( i.more() ) {
+ if ( strcmp(i.next().info.obj().getStringField("name"),name) == 0 )
+ return i.pos()-1;
+ }
+ return -1;
+ }
+
+ inline NamespaceDetails::IndexIterator::IndexIterator(NamespaceDetails *_d) {
+ d = _d;
+ i = 0;
+ n = d->nIndexes;
+ }
+
+}
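A minimal usage sketch of the IndexIterator accessors defined above (illustration only, not part of this patch; the namespace string is hypothetical and the caller is assumed to hold the usual lock):

    // Enumerate a collection's indexes the same way findIndexByName() does.
    NamespaceDetails *d = nsdetails("test.foo");   // hypothetical namespace
    if ( d ) {
        NamespaceDetails::IndexIterator it = d->ii();
        while ( it.more() ) {
            IndexDetails& id = it.next();
            // it.pos() - 1 is the offset of 'id' in the indexes[] array
            log() << "index " << it.pos() - 1 << ": "
                  << id.info.obj().getStringField("name") << endl;
        }
    }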
diff --git a/src/mongo/db/namespace_details.cpp b/src/mongo/db/namespace_details.cpp
new file mode 100644
index 00000000000..2e5d3757d56
--- /dev/null
+++ b/src/mongo/db/namespace_details.cpp
@@ -0,0 +1,801 @@
+// namespace_details.cpp
+
+/**
+* Copyright (C) 2008 10gen Inc.
+*
+* This program is free software: you can redistribute it and/or modify
+* it under the terms of the GNU Affero General Public License, version 3,
+* as published by the Free Software Foundation.
+*
+* This program is distributed in the hope that it will be useful,
+* but WITHOUT ANY WARRANTY; without even the implied warranty of
+* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+* GNU Affero General Public License for more details.
+*
+* You should have received a copy of the GNU Affero General Public License
+* along with this program. If not, see <http://www.gnu.org/licenses/>.
+*/
+
+#include "pch.h"
+#include "pdfile.h"
+#include "db.h"
+#include "mongommf.h"
+#include "../util/hashtab.h"
+#include "../scripting/engine.h"
+#include "btree.h"
+#include <algorithm>
+#include <list>
+#include "json.h"
+#include "ops/delete.h"
+
+#include <boost/filesystem/operations.hpp>
+
+namespace mongo {
+
+ BSONObj idKeyPattern = fromjson("{\"_id\":1}");
+
+    /* deleted lists -- linked lists of deleted records -- are placed in 'buckets' of various sizes
+       so you can look for a DeletedRecord of about the right size.
+    */
+ int bucketSizes[] = {
+ 32, 64, 128, 256, 0x200, 0x400, 0x800, 0x1000, 0x2000, 0x4000,
+ 0x8000, 0x10000, 0x20000, 0x40000, 0x80000, 0x100000, 0x200000,
+ 0x400000, 0x800000
+ };
+
+ NamespaceDetails::NamespaceDetails( const DiskLoc &loc, bool _capped ) {
+        /* be sure to initialize new fields here -- memory is not zeroed by default the way we use this */
+ firstExtent = lastExtent = capExtent = loc;
+ stats.datasize = stats.nrecords = 0;
+ lastExtentSize = 0;
+ nIndexes = 0;
+ capped = _capped;
+ max = 0x7fffffff;
+ paddingFactor = 1.0;
+ flags = 0;
+ capFirstNewRecord = DiskLoc();
+ // Signal that we are on first allocation iteration through extents.
+ capFirstNewRecord.setInvalid();
+ // For capped case, signal that we are doing initial extent allocation.
+ if ( capped )
+ cappedLastDelRecLastExtent().setInvalid();
+ assert( sizeof(dataFileVersion) == 2 );
+ dataFileVersion = 0;
+ indexFileVersion = 0;
+ multiKeyIndexBits = 0;
+ reservedA = 0;
+ extraOffset = 0;
+ indexBuildInProgress = 0;
+ reservedB = 0;
+ capped2.cc2_ptr = 0;
+ capped2.fileNumber = 0;
+ memset(reserved, 0, sizeof(reserved));
+ }
+
+ bool NamespaceIndex::exists() const {
+ return !boost::filesystem::exists(path());
+ }
+
+ boost::filesystem::path NamespaceIndex::path() const {
+ boost::filesystem::path ret( dir_ );
+ if ( directoryperdb )
+ ret /= database_;
+ ret /= ( database_ + ".ns" );
+ return ret;
+ }
+
+ void NamespaceIndex::maybeMkdir() const {
+ if ( !directoryperdb )
+ return;
+ boost::filesystem::path dir( dir_ );
+ dir /= database_;
+ if ( !boost::filesystem::exists( dir ) )
+ MONGO_BOOST_CHECK_EXCEPTION_WITH_MSG( boost::filesystem::create_directory( dir ), "create dir for db " );
+ }
+
+ unsigned lenForNewNsFiles = 16 * 1024 * 1024;
+
+#if defined(_DEBUG)
+ void NamespaceDetails::dump(const Namespace& k) {
+ if( !cmdLine.dur )
+ cout << "ns offsets which follow will not display correctly with --journal disabled" << endl;
+
+ size_t ofs = 1; // 1 is sentinel that the find call below failed
+ privateViews.find(this, /*out*/ofs);
+
+ cout << "ns" << hex << setw(8) << ofs << ' ';
+ cout << k.toString() << '\n';
+
+ if( k.isExtra() ) {
+ cout << "ns\t extra" << endl;
+ return;
+ }
+
+ cout << "ns " << firstExtent.toString() << ' ' << lastExtent.toString() << " nidx:" << nIndexes << '\n';
+ cout << "ns " << stats.datasize << ' ' << stats.nrecords << ' ' << nIndexes << '\n';
+ cout << "ns " << capped << ' ' << paddingFactor << ' ' << flags << ' ' << dataFileVersion << '\n';
+ cout << "ns " << multiKeyIndexBits << ' ' << indexBuildInProgress << '\n';
+ cout << "ns " << (int) reserved[0] << ' ' << (int) reserved[59];
+ cout << endl;
+ }
+#endif
+
+ void NamespaceDetails::onLoad(const Namespace& k) {
+
+ if( k.isExtra() ) {
+ /* overflow storage for indexes - so don't treat as a NamespaceDetails object. */
+ return;
+ }
+
+ if( indexBuildInProgress || capped2.cc2_ptr ) {
+ assertInWriteLock();
+ if( indexBuildInProgress ) {
+ log() << "indexBuildInProgress was " << indexBuildInProgress << " for " << k << ", indicating an abnormal db shutdown" << endl;
+ getDur().writingInt( indexBuildInProgress ) = 0;
+ }
+ if( capped2.cc2_ptr )
+ *getDur().writing(&capped2.cc2_ptr) = 0;
+ }
+ }
+
+ static void namespaceOnLoadCallback(const Namespace& k, NamespaceDetails& v) {
+ v.onLoad(k);
+ }
+
+ bool checkNsFilesOnLoad = true;
+
+ NOINLINE_DECL void NamespaceIndex::_init() {
+ assert( !ht );
+
+ Lock::assertWriteLocked(database_);
+
+ /* if someone manually deleted the datafiles for a database,
+ we need to be sure to clear any cached info for the database in
+ local.*.
+ */
+ /*
+ if ( "local" != database_ ) {
+ DBInfo i(database_.c_str());
+ i.dbDropped();
+ }
+ */
+
+ unsigned long long len = 0;
+ boost::filesystem::path nsPath = path();
+ string pathString = nsPath.string();
+ void *p = 0;
+ if( boost::filesystem::exists(nsPath) ) {
+ if( f.open(pathString, true) ) {
+ len = f.length();
+ if ( len % (1024*1024) != 0 ) {
+ log() << "bad .ns file: " << pathString << endl;
+ uassert( 10079 , "bad .ns file length, cannot open database", len % (1024*1024) == 0 );
+ }
+ p = f.getView();
+ }
+ }
+ else {
+ // use lenForNewNsFiles, we are making a new database
+ massert( 10343, "bad lenForNewNsFiles", lenForNewNsFiles >= 1024*1024 );
+ maybeMkdir();
+ unsigned long long l = lenForNewNsFiles;
+ if( f.create(pathString, l, true) ) {
+ getDur().createdFile(pathString, l); // always a new file
+ len = l;
+ assert( len == lenForNewNsFiles );
+ p = f.getView();
+ }
+ }
+
+ if ( p == 0 ) {
+ /** TODO: this shouldn't terminate? */
+ log() << "error couldn't open file " << pathString << " terminating" << endl;
+ dbexit( EXIT_FS );
+ }
+
+
+ assert( len <= 0x7fffffff );
+ ht = new HashTable<Namespace,NamespaceDetails>(p, (int) len, "namespace index");
+ if( checkNsFilesOnLoad )
+ ht->iterAll(namespaceOnLoadCallback);
+ }
+
+ static void namespaceGetNamespacesCallback( const Namespace& k , NamespaceDetails& v , void * extra ) {
+ list<string> * l = (list<string>*)extra;
+ if ( ! k.hasDollarSign() )
+ l->push_back( (string)k );
+ }
+ void NamespaceIndex::getNamespaces( list<string>& tofill , bool onlyCollections ) const {
+ assert( onlyCollections ); // TODO: need to implement this
+ // need boost::bind or something to make this less ugly
+
+ if ( ht )
+ ht->iterAll( namespaceGetNamespacesCallback , (void*)&tofill );
+ }
+
+ void NamespaceDetails::addDeletedRec(DeletedRecord *d, DiskLoc dloc) {
+ BOOST_STATIC_ASSERT( sizeof(NamespaceDetails::Extra) <= sizeof(NamespaceDetails) );
+
+ {
+ Record *r = (Record *) getDur().writingPtr(d, sizeof(Record));
+ d = &r->asDeleted();
+ // defensive code: try to make us notice if we reference a deleted record
+ (unsigned&) (r->data) = 0xeeeeeeee;
+ }
+ DEBUGGING log() << "TEMP: add deleted rec " << dloc.toString() << ' ' << hex << d->extentOfs << endl;
+ if ( capped ) {
+ if ( !cappedLastDelRecLastExtent().isValid() ) {
+ // Initial extent allocation. Insert at end.
+ d->nextDeleted = DiskLoc();
+ if ( cappedListOfAllDeletedRecords().isNull() )
+ getDur().writingDiskLoc( cappedListOfAllDeletedRecords() ) = dloc;
+ else {
+ DiskLoc i = cappedListOfAllDeletedRecords();
+ for (; !i.drec()->nextDeleted.isNull(); i = i.drec()->nextDeleted )
+ ;
+ i.drec()->nextDeleted.writing() = dloc;
+ }
+ }
+ else {
+ d->nextDeleted = cappedFirstDeletedInCurExtent();
+ getDur().writingDiskLoc( cappedFirstDeletedInCurExtent() ) = dloc;
+ // always compact() after this so order doesn't matter
+ }
+ }
+ else {
+ int b = bucket(d->lengthWithHeaders);
+ DiskLoc& list = deletedList[b];
+ DiskLoc oldHead = list;
+ getDur().writingDiskLoc(list) = dloc;
+ d->nextDeleted = oldHead;
+ }
+ }
+
+    /* predetermine the location of the next alloc without actually doing it.
+       if it cannot be predetermined, returns null (so still call alloc() in that case)
+    */
+ DiskLoc NamespaceDetails::allocWillBeAt(const char *ns, int lenToAlloc) {
+ if ( !capped ) {
+ lenToAlloc = (lenToAlloc + 3) & 0xfffffffc;
+ return __stdAlloc(lenToAlloc, true);
+ }
+ return DiskLoc();
+ }
+
+ /** allocate space for a new record from deleted lists.
+ @param lenToAlloc is WITH header
+ @param extentLoc OUT returns the extent location
+ @return null diskloc if no room - allocate a new extent then
+ */
+ DiskLoc NamespaceDetails::alloc(const char *ns, int lenToAlloc, DiskLoc& extentLoc) {
+ {
+ // align very slightly.
+ // note that if doing more coarse-grained quantization (really just if it isn't always
+ // a constant amount but if it varied by record size) then that quantization should
+            // NOT be done here but rather in __stdAlloc so that we can grab a DeletedRecord that
+ // is just big enough if we happen to run into one.
+ lenToAlloc = (lenToAlloc + 3) & 0xfffffffc;
+ }
+
+ DiskLoc loc = _alloc(ns, lenToAlloc);
+ if ( loc.isNull() )
+ return loc;
+
+ const DeletedRecord *r = loc.drec();
+ //r = getDur().writing(r);
+
+ /* note we want to grab from the front so our next pointers on disk tend
+ to go in a forward direction which is important for performance. */
+ int regionlen = r->lengthWithHeaders;
+ extentLoc.set(loc.a(), r->extentOfs);
+ assert( r->extentOfs < loc.getOfs() );
+
+ DEBUGGING out() << "TEMP: alloc() returns " << loc.toString() << ' ' << ns << " lentoalloc:" << lenToAlloc << " ext:" << extentLoc.toString() << endl;
+
+ int left = regionlen - lenToAlloc;
+ if ( capped == 0 ) {
+ if ( left < 24 || left < (lenToAlloc >> 3) ) {
+ // you get the whole thing.
+ return loc;
+ }
+ }
+
+ /* split off some for further use. */
+ getDur().writingInt(r->lengthWithHeaders) = lenToAlloc;
+ DiskLoc newDelLoc = loc;
+ newDelLoc.inc(lenToAlloc);
+ DeletedRecord *newDel = DataFileMgr::makeDeletedRecord(newDelLoc, left);
+ DeletedRecord *newDelW = getDur().writing(newDel);
+ newDelW->extentOfs = r->extentOfs;
+ newDelW->lengthWithHeaders = left;
+ newDelW->nextDeleted.Null();
+
+ addDeletedRec(newDel, newDelLoc);
+
+ return loc;
+ }
+
+    /* for non-capped collections.
+       @param peekOnly just look up the location and don't reserve it
+       otherwise the returned item has been unlinked from the deleted list upon return
+    */
+ DiskLoc NamespaceDetails::__stdAlloc(int len, bool peekOnly) {
+ DiskLoc *prev;
+ DiskLoc *bestprev = 0;
+ DiskLoc bestmatch;
+ int bestmatchlen = 0x7fffffff;
+ int b = bucket(len);
+ DiskLoc cur = deletedList[b];
+ prev = &deletedList[b];
+        int extra = 5; // look a little further for a better fit
+ int chain = 0;
+ while ( 1 ) {
+ {
+ int a = cur.a();
+ if ( a < -1 || a >= 100000 ) {
+ problem() << "~~ Assertion - cur out of range in _alloc() " << cur.toString() <<
+ " a:" << a << " b:" << b << " chain:" << chain << '\n';
+ sayDbContext();
+ if ( cur == *prev )
+ prev->Null();
+ cur.Null();
+ }
+ }
+ if ( cur.isNull() ) {
+ // move to next bucket. if we were doing "extra", just break
+ if ( bestmatchlen < 0x7fffffff )
+ break;
+ b++;
+ if ( b > MaxBucket ) {
+ // out of space. alloc a new extent.
+ return DiskLoc();
+ }
+ cur = deletedList[b];
+ prev = &deletedList[b];
+ continue;
+ }
+ DeletedRecord *r = cur.drec();
+ if ( r->lengthWithHeaders >= len &&
+ r->lengthWithHeaders < bestmatchlen ) {
+ bestmatchlen = r->lengthWithHeaders;
+ bestmatch = cur;
+ bestprev = prev;
+ }
+ if ( bestmatchlen < 0x7fffffff && --extra <= 0 )
+ break;
+ if ( ++chain > 30 && b < MaxBucket ) {
+ // too slow, force move to next bucket to grab a big chunk
+ //b++;
+ chain = 0;
+ cur.Null();
+ }
+ else {
+ /*this defensive check only made sense for the mmap storage engine:
+ if ( r->nextDeleted.getOfs() == 0 ) {
+ problem() << "~~ Assertion - bad nextDeleted " << r->nextDeleted.toString() <<
+ " b:" << b << " chain:" << chain << ", fixing.\n";
+ r->nextDeleted.Null();
+ }*/
+ cur = r->nextDeleted;
+ prev = &r->nextDeleted;
+ }
+ }
+
+ /* unlink ourself from the deleted list */
+ if( !peekOnly ) {
+ const DeletedRecord *bmr = bestmatch.drec();
+ *getDur().writing(bestprev) = bmr->nextDeleted;
+ bmr->nextDeleted.writing().setInvalid(); // defensive.
+ assert(bmr->extentOfs < bestmatch.getOfs());
+ }
+
+ return bestmatch;
+ }
+
+ void NamespaceDetails::dumpDeleted(set<DiskLoc> *extents) {
+ for ( int i = 0; i < Buckets; i++ ) {
+ DiskLoc dl = deletedList[i];
+ while ( !dl.isNull() ) {
+ DeletedRecord *r = dl.drec();
+ DiskLoc extLoc(dl.a(), r->extentOfs);
+ if ( extents == 0 || extents->count(extLoc) <= 0 ) {
+ out() << " bucket " << i << endl;
+ out() << " " << dl.toString() << " ext:" << extLoc.toString();
+ if ( extents && extents->count(extLoc) <= 0 )
+ out() << '?';
+ out() << " len:" << r->lengthWithHeaders << endl;
+ }
+ dl = r->nextDeleted;
+ }
+ }
+ }
+
+ DiskLoc NamespaceDetails::firstRecord( const DiskLoc &startExtent ) const {
+ for (DiskLoc i = startExtent.isNull() ? firstExtent : startExtent;
+ !i.isNull(); i = i.ext()->xnext ) {
+ if ( !i.ext()->firstRecord.isNull() )
+ return i.ext()->firstRecord;
+ }
+ return DiskLoc();
+ }
+
+ DiskLoc NamespaceDetails::lastRecord( const DiskLoc &startExtent ) const {
+ for (DiskLoc i = startExtent.isNull() ? lastExtent : startExtent;
+ !i.isNull(); i = i.ext()->xprev ) {
+ if ( !i.ext()->lastRecord.isNull() )
+ return i.ext()->lastRecord;
+ }
+ return DiskLoc();
+ }
+
+ int n_complaints_cap = 0;
+ void NamespaceDetails::maybeComplain( const char *ns, int len ) const {
+ if ( ++n_complaints_cap < 8 ) {
+ out() << "couldn't make room for new record (len: " << len << ") in capped ns " << ns << '\n';
+ int i = 0;
+ for ( DiskLoc e = firstExtent; !e.isNull(); e = e.ext()->xnext, ++i ) {
+ out() << " Extent " << i;
+ if ( e == capExtent )
+ out() << " (capExtent)";
+ out() << '\n';
+ out() << " magic: " << hex << e.ext()->magic << dec << " extent->ns: " << e.ext()->nsDiagnostic.toString() << '\n';
+ out() << " fr: " << e.ext()->firstRecord.toString() <<
+ " lr: " << e.ext()->lastRecord.toString() << " extent->len: " << e.ext()->length << '\n';
+ }
+            assert( len * 5 > lastExtentSize ); // assume it is an unusually large record; if not, something is broken
+ }
+ }
+
+ /* alloc with capped table handling. */
+ DiskLoc NamespaceDetails::_alloc(const char *ns, int len) {
+ if ( !capped )
+ return __stdAlloc(len, false);
+
+ return cappedAlloc(ns,len);
+ }
+
+ void NamespaceIndex::kill_ns(const char *ns) {
+ Lock::assertWriteLocked(ns);
+ if ( !ht )
+ return;
+ Namespace n(ns);
+ ht->kill(n);
+
+ for( int i = 0; i<=1; i++ ) {
+ try {
+ Namespace extra(n.extraName(i).c_str());
+ ht->kill(extra);
+ }
+ catch(DBException&) {
+ dlog(3) << "caught exception in kill_ns" << endl;
+ }
+ }
+ }
+
+ void NamespaceIndex::add_ns(const char *ns, DiskLoc& loc, bool capped) {
+ NamespaceDetails details( loc, capped );
+ add_ns( ns, details );
+ }
+ void NamespaceIndex::add_ns( const char *ns, const NamespaceDetails &details ) {
+ Lock::assertWriteLocked(ns);
+ init();
+ Namespace n(ns);
+ uassert( 10081 , "too many namespaces/collections", ht->put(n, details));
+ }
+
+ /* extra space for indexes when more than 10 */
+ NamespaceDetails::Extra* NamespaceIndex::newExtra(const char *ns, int i, NamespaceDetails *d) {
+ Lock::assertWriteLocked(ns);
+ assert( i >= 0 && i <= 1 );
+ Namespace n(ns);
+ Namespace extra(n.extraName(i).c_str()); // throws userexception if ns name too long
+
+ massert( 10350 , "allocExtra: base ns missing?", d );
+ massert( 10351 , "allocExtra: extra already exists", ht->get(extra) == 0 );
+
+ NamespaceDetails::Extra temp;
+ temp.init();
+ uassert( 10082 , "allocExtra: too many namespaces/collections", ht->put(extra, (NamespaceDetails&) temp));
+ NamespaceDetails::Extra *e = (NamespaceDetails::Extra *) ht->get(extra);
+ return e;
+ }
+ NamespaceDetails::Extra* NamespaceDetails::allocExtra(const char *ns, int nindexessofar) {
+ NamespaceIndex *ni = nsindex(ns);
+ int i = (nindexessofar - NIndexesBase) / NIndexesExtra;
+ Extra *e = ni->newExtra(ns, i, this);
+ long ofs = e->ofsFrom(this);
+ if( i == 0 ) {
+ assert( extraOffset == 0 );
+ *getDur().writing(&extraOffset) = ofs;
+ assert( extra() == e );
+ }
+ else {
+ Extra *hd = extra();
+ assert( hd->next(this) == 0 );
+ hd->setNext(ofs);
+ }
+ return e;
+ }
+
+ /* you MUST call when adding an index. see pdfile.cpp */
+ IndexDetails& NamespaceDetails::addIndex(const char *thisns, bool resetTransient) {
+ IndexDetails *id;
+ try {
+ id = &idx(nIndexes,true);
+ }
+ catch(DBException&) {
+ allocExtra(thisns, nIndexes);
+ id = &idx(nIndexes,false);
+ }
+
+ (*getDur().writing(&nIndexes))++;
+ if ( resetTransient )
+ NamespaceDetailsTransient::get(thisns).addedIndex();
+ return *id;
+ }
+
+ // must be called when renaming a NS to fix up extra
+ void NamespaceDetails::copyingFrom(const char *thisns, NamespaceDetails *src) {
+ extraOffset = 0; // we are a copy -- the old value is wrong. fixing it up below.
+ Extra *se = src->extra();
+ int n = NIndexesBase;
+ if( se ) {
+ Extra *e = allocExtra(thisns, n);
+ while( 1 ) {
+ n += NIndexesExtra;
+ e->copy(this, *se);
+ se = se->next(src);
+ if( se == 0 ) break;
+ Extra *nxt = allocExtra(thisns, n);
+ e->setNext( nxt->ofsFrom(this) );
+ e = nxt;
+ }
+ assert( extraOffset );
+ }
+ }
+
+ /* returns index of the first index in which the field is present. -1 if not present.
+ (aug08 - this method not currently used)
+ */
+ int NamespaceDetails::fieldIsIndexed(const char *fieldName) {
+ massert( 10346 , "not implemented", false);
+ /*
+ for ( int i = 0; i < nIndexes; i++ ) {
+ IndexDetails& idx = indexes[i];
+ BSONObj idxKey = idx.info.obj().getObjectField("key"); // e.g., { ts : -1 }
+ if ( !idxKey.getField(fieldName).eoo() )
+ return i;
+ }*/
+ return -1;
+ }
+
+ long long NamespaceDetails::storageSize( int * numExtents , BSONArrayBuilder * extentInfo ) const {
+ Extent * e = firstExtent.ext();
+ assert( e );
+
+ long long total = 0;
+ int n = 0;
+ while ( e ) {
+ total += e->length;
+ n++;
+
+ if ( extentInfo ) {
+                extentInfo->append( BSON( "len" << e->length << "loc" << e->myLoc.toBSONObj() ) );
+ }
+
+ e = e->getNextExtent();
+ }
+
+ if ( numExtents )
+ *numExtents = n;
+
+ return total;
+ }
+
+ NamespaceDetails *NamespaceDetails::writingWithExtra() {
+ vector< pair< long long, unsigned > > writeRanges;
+ writeRanges.push_back( make_pair( 0, sizeof( NamespaceDetails ) ) );
+ for( Extra *e = extra(); e; e = e->next( this ) ) {
+ writeRanges.push_back( make_pair( (char*)e - (char*)this, sizeof( Extra ) ) );
+ }
+ return reinterpret_cast< NamespaceDetails* >( getDur().writingRangesAtOffsets( this, writeRanges ) );
+ }
+
+ /* ------------------------------------------------------------------------- */
+
+ SimpleMutex NamespaceDetailsTransient::_qcMutex("qc");
+ SimpleMutex NamespaceDetailsTransient::_isMutex("is");
+ map< string, shared_ptr< NamespaceDetailsTransient > > NamespaceDetailsTransient::_nsdMap;
+ typedef map< string, shared_ptr< NamespaceDetailsTransient > >::iterator ouriter;
+
+ void NamespaceDetailsTransient::reset() {
+ Lock::assertWriteLocked(_ns);
+ clearQueryCache();
+ _keysComputed = false;
+ _indexSpecs.clear();
+ }
+
+ /*static*/ NOINLINE_DECL NamespaceDetailsTransient& NamespaceDetailsTransient::make_inlock(const char *ns) {
+ shared_ptr< NamespaceDetailsTransient > &t = _nsdMap[ ns ];
+ assert( t.get() == 0 );
+ Database *database = cc().database();
+ assert( database );
+ if( _nsdMap.size() % 20000 == 10000 ) {
+            // log occasionally so we notice insanely large #s
+ log() << "opening namespace " << ns << endl;
+ log() << _nsdMap.size() << " namespaces in nsdMap" << endl;
+ }
+ t.reset( new NamespaceDetailsTransient(database, ns) );
+ return *t;
+ }
+
+    // note that with repair there could be two databases with the same ns name.
+    // that is NOT handled here yet! TODO
+    // repair may not use nsdt, though we are not sure; in any case this requires work.
+ NamespaceDetailsTransient::NamespaceDetailsTransient(Database *db, const char *ns) :
+ _ns(ns), _keysComputed(false), _qcWriteCount()
+ {
+ dassert(db);
+ }
+
+ NamespaceDetailsTransient::~NamespaceDetailsTransient() {
+ }
+
+ void NamespaceDetailsTransient::clearForPrefix(const char *prefix) {
+ SimpleMutex::scoped_lock lk(_qcMutex);
+ vector< string > found;
+ for( ouriter i = _nsdMap.begin(); i != _nsdMap.end(); ++i ) {
+ if ( strncmp( i->first.c_str(), prefix, strlen( prefix ) ) == 0 ) {
+ found.push_back( i->first );
+ Lock::assertWriteLocked(i->first);
+ }
+ }
+ for( vector< string >::iterator i = found.begin(); i != found.end(); ++i ) {
+ _nsdMap[ *i ].reset();
+ }
+ }
+
+ void NamespaceDetailsTransient::eraseForPrefix(const char *prefix) {
+ SimpleMutex::scoped_lock lk(_qcMutex);
+ vector< string > found;
+ for( ouriter i = _nsdMap.begin(); i != _nsdMap.end(); ++i ) {
+ if ( strncmp( i->first.c_str(), prefix, strlen( prefix ) ) == 0 ) {
+ found.push_back( i->first );
+ Lock::assertWriteLocked(i->first);
+ }
+ }
+ for( vector< string >::iterator i = found.begin(); i != found.end(); ++i ) {
+ _nsdMap.erase(*i);
+ }
+ }
+
+ void NamespaceDetailsTransient::computeIndexKeys() {
+ _keysComputed = true;
+ _indexKeys.clear();
+ NamespaceDetails *d = nsdetails(_ns.c_str());
+ if ( ! d )
+ return;
+ NamespaceDetails::IndexIterator i = d->ii();
+ while( i.more() )
+ i.next().keyPattern().getFieldNames(_indexKeys);
+ }
+
+
+ /* ------------------------------------------------------------------------- */
+
+ /* add a new namespace to the system catalog (<dbname>.system.namespaces).
+ options: { capped : ..., size : ... }
+ */
+ void addNewNamespaceToCatalog(const char *ns, const BSONObj *options = 0) {
+ LOG(1) << "New namespace: " << ns << endl;
+ if ( strstr(ns, "system.namespaces") ) {
+ // system.namespaces holds all the others, so it is not explicitly listed in the catalog.
+            // TODO: fix the check above -- it should not use strstr!
+ return;
+ }
+
+ BSONObjBuilder b;
+ b.append("name", ns);
+ if ( options )
+ b.append("options", *options);
+ BSONObj j = b.done();
+ char database[256];
+ nsToDatabase(ns, database);
+ string s = string(database) + ".system.namespaces";
+ theDataFileMgr.insert(s.c_str(), j.objdata(), j.objsize(), true);
+ }
+
+ void renameNamespace( const char *from, const char *to, bool stayTemp) {
+ NamespaceIndex *ni = nsindex( from );
+ assert( ni );
+ assert( ni->details( from ) );
+ assert( ! ni->details( to ) );
+
+ // Our namespace and index details will move to a different
+ // memory location. The only references to namespace and
+ // index details across commands are in cursors and nsd
+ // transient (including query cache) so clear these.
+ ClientCursor::invalidate( from );
+ NamespaceDetailsTransient::eraseForPrefix( from );
+
+ NamespaceDetails *details = ni->details( from );
+ ni->add_ns( to, *details );
+ NamespaceDetails *todetails = ni->details( to );
+ try {
+ todetails->copyingFrom(to, details); // fixes extraOffset
+ }
+ catch( DBException& ) {
+ // could end up here if .ns is full - if so try to clean up / roll back a little
+ ni->kill_ns(to);
+ throw;
+ }
+ ni->kill_ns( from );
+ details = todetails;
+
+ BSONObj oldSpec;
+ char database[MaxDatabaseNameLen];
+ nsToDatabase(from, database);
+ string s = database;
+ s += ".system.namespaces";
+ assert( Helpers::findOne( s.c_str(), BSON( "name" << from ), oldSpec ) );
+
+ BSONObjBuilder newSpecB;
+ BSONObjIterator i( oldSpec.getObjectField( "options" ) );
+ while( i.more() ) {
+ BSONElement e = i.next();
+ if ( strcmp( e.fieldName(), "create" ) != 0 ) {
+ if (stayTemp || (strcmp(e.fieldName(), "temp") != 0))
+ newSpecB.append( e );
+ }
+ else {
+ newSpecB << "create" << to;
+ }
+ }
+ BSONObj newSpec = newSpecB.done();
+ addNewNamespaceToCatalog( to, newSpec.isEmpty() ? 0 : &newSpec );
+
+ deleteObjects( s.c_str(), BSON( "name" << from ), false, false, true );
+        // the oldSpec variable no longer points to valid memory
+
+ BSONObj oldIndexSpec;
+ s = database;
+ s += ".system.indexes";
+ while( Helpers::findOne( s.c_str(), BSON( "ns" << from ), oldIndexSpec ) ) {
+ BSONObjBuilder newIndexSpecB;
+ BSONObjIterator i( oldIndexSpec );
+ while( i.more() ) {
+ BSONElement e = i.next();
+ if ( strcmp( e.fieldName(), "ns" ) != 0 )
+ newIndexSpecB.append( e );
+ else
+ newIndexSpecB << "ns" << to;
+ }
+ BSONObj newIndexSpec = newIndexSpecB.done();
+ DiskLoc newIndexSpecLoc = theDataFileMgr.insert( s.c_str(), newIndexSpec.objdata(), newIndexSpec.objsize(), true, false );
+ int indexI = details->findIndexByName( oldIndexSpec.getStringField( "name" ) );
+ IndexDetails &indexDetails = details->idx(indexI);
+ string oldIndexNs = indexDetails.indexNamespace();
+ indexDetails.info = newIndexSpecLoc;
+ string newIndexNs = indexDetails.indexNamespace();
+
+ renameIndexNamespace( oldIndexNs.c_str(), newIndexNs.c_str() );
+ deleteObjects( s.c_str(), oldIndexSpec.getOwned(), true, false, true );
+ }
+ }
+
+ bool legalClientSystemNS( const string& ns , bool write ) {
+ if( ns == "local.system.replset" ) return true;
+
+ if ( ns.find( ".system.users" ) != string::npos )
+ return true;
+
+ if ( ns.find( ".system.js" ) != string::npos ) {
+ if ( write )
+ Scope::storedFuncMod();
+ return true;
+ }
+
+ return false;
+ }
+
+} // namespace mongo
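The free list behavior in addDeletedRec() and __stdAlloc() above follows from the bucket rule. Here is a standalone sketch (illustration only, not part of this patch) that reproduces bucketSizes[] above and NamespaceDetails::bucket() from namespace_details.h, plus the 4-byte rounding done in alloc():

    #include <iostream>

    // Mirrors bucketSizes[] above and NamespaceDetails::bucket(); sketch only.
    static const int Buckets = 19;
    static const int bucketSizes[Buckets] = {
        32, 64, 128, 256, 0x200, 0x400, 0x800, 0x1000, 0x2000, 0x4000,
        0x8000, 0x10000, 0x20000, 0x40000, 0x80000, 0x100000, 0x200000,
        0x400000, 0x800000
    };

    // first bucket whose size is strictly larger than the record length
    static int bucket(int n) {
        for ( int i = 0; i < Buckets; i++ )
            if ( bucketSizes[i] > n )
                return i;
        return Buckets - 1; // oversized records share the last bucket
    }

    int main() {
        std::cout << bucket(31)      << std::endl; // 0  (first size > 31 is 32)
        std::cout << bucket(500)     << std::endl; // 4  (first size > 500 is 0x200)
        std::cout << bucket(9000000) << std::endl; // 18 (larger than every size)

        // alloc() and allocWillBeAt() first round the length up to a 4-byte multiple:
        int lenToAlloc = 501;
        lenToAlloc = (lenToAlloc + 3) & 0xfffffffc;
        std::cout << lenToAlloc << std::endl;      // 504
        return 0;
    }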
diff --git a/src/mongo/db/namespace_details.h b/src/mongo/db/namespace_details.h
new file mode 100644
index 00000000000..83aa8bc5e36
--- /dev/null
+++ b/src/mongo/db/namespace_details.h
@@ -0,0 +1,610 @@
+// namespace_details.h
+
+/**
+* Copyright (C) 2008 10gen Inc.
+*
+* This program is free software: you can redistribute it and/or modify
+* it under the terms of the GNU Affero General Public License, version 3,
+* as published by the Free Software Foundation.
+*
+* This program is distributed in the hope that it will be useful,
+* but WITHOUT ANY WARRANTY; without even the implied warranty of
+* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+* GNU Affero General Public License for more details.
+*
+* You should have received a copy of the GNU Affero General Public License
+* along with this program. If not, see <http://www.gnu.org/licenses/>.
+*/
+
+#pragma once
+
+#include "mongo/pch.h"
+
+#include "mongo/db/d_concurrency.h"
+#include "mongo/db/diskloc.h"
+#include "mongo/db/index.h"
+#include "mongo/db/jsobj.h"
+#include "mongo/db/mongommf.h"
+#include "mongo/db/namespace.h"
+#include "mongo/db/queryoptimizer.h"
+#include "mongo/db/queryoptimizercursor.h"
+#include "mongo/db/querypattern.h"
+#include "mongo/util/hashtab.h"
+
+namespace mongo {
+ class Database;
+
+ /** @return true if a client can modify this namespace even though it is under ".system."
+ For example <dbname>.system.users is ok for regular clients to update.
+ @param write used when .system.js
+ */
+ bool legalClientSystemNS( const string& ns , bool write );
+
+    /* deleted lists -- linked lists of deleted records -- are placed in 'buckets' of various sizes
+       so you can look for a DeletedRecord of about the right size.
+    */
+ const int Buckets = 19;
+ const int MaxBucket = 18;
+
+ extern int bucketSizes[];
+
+#pragma pack(1)
+ /* NamespaceDetails : this is the "header" for a collection that has all its details.
+ It's in the .ns file and this is a memory mapped region (thus the pack pragma above).
+ */
+ class NamespaceDetails {
+ public:
+ enum { NIndexesMax = 64, NIndexesExtra = 30, NIndexesBase = 10 };
+
+ /*-------- data fields, as present on disk : */
+ DiskLoc firstExtent;
+ DiskLoc lastExtent;
+ /* NOTE: capped collections v1 override the meaning of deletedList.
+ deletedList[0] points to a list of free records (DeletedRecord's) for all extents in
+ the capped namespace.
+ deletedList[1] points to the last record in the prev extent. When the "current extent"
+ changes, this value is updated. !deletedList[1].isValid() when this value is not
+ yet computed.
+ */
+ DiskLoc deletedList[Buckets];
+ // ofs 168 (8 byte aligned)
+ struct Stats {
+            // datasize and nrecords MUST be adjacent -- code assumes this!
+ long long datasize; // this includes padding, but not record headers
+ long long nrecords;
+ } stats;
+ int lastExtentSize;
+ int nIndexes;
+ private:
+ // ofs 192
+ IndexDetails _indexes[NIndexesBase];
+ public:
+ // ofs 352 (16 byte aligned)
+ int capped;
+ int max; // max # of objects for a capped table. TODO: should this be 64 bit?
+ double paddingFactor; // 1.0 = no padding.
+ // ofs 386 (16)
+ int flags;
+ DiskLoc capExtent;
+ DiskLoc capFirstNewRecord;
+ unsigned short dataFileVersion; // NamespaceDetails version. So we can do backward compatibility in the future. See filever.h
+ unsigned short indexFileVersion;
+ unsigned long long multiKeyIndexBits;
+ private:
+ // ofs 400 (16)
+ unsigned long long reservedA;
+ long long extraOffset; // where the $extra info is located (bytes relative to this)
+ public:
+ int indexBuildInProgress; // 1 if in prog
+ unsigned reservedB;
+ // ofs 424 (8)
+ struct Capped2 {
+ unsigned long long cc2_ptr; // see capped.cpp
+ unsigned fileNumber;
+ } capped2;
+ char reserved[60];
+ /*-------- end data 496 bytes */
+
+ explicit NamespaceDetails( const DiskLoc &loc, bool _capped );
+
+ class Extra {
+ long long _next;
+ public:
+ IndexDetails details[NIndexesExtra];
+ private:
+ unsigned reserved2;
+ unsigned reserved3;
+ Extra(const Extra&) { assert(false); }
+ Extra& operator=(const Extra& r) { assert(false); return *this; }
+ public:
+ Extra() { }
+ long ofsFrom(NamespaceDetails *d) {
+ return ((char *) this) - ((char *) d);
+ }
+ void init() { memset(this, 0, sizeof(Extra)); }
+ Extra* next(NamespaceDetails *d) {
+ if( _next == 0 ) return 0;
+ return (Extra*) (((char *) d) + _next);
+ }
+ void setNext(long ofs) { *getDur().writing(&_next) = ofs; }
+ void copy(NamespaceDetails *d, const Extra& e) {
+ memcpy(this, &e, sizeof(Extra));
+ _next = 0;
+ }
+ };
+ Extra* extra() {
+ if( extraOffset == 0 ) return 0;
+ return (Extra *) (((char *) this) + extraOffset);
+ }
+ /* add extra space for indexes when more than 10 */
+ Extra* allocExtra(const char *ns, int nindexessofar);
+ void copyingFrom(const char *thisns, NamespaceDetails *src); // must be called when renaming a NS to fix up extra
+
+ /* called when loaded from disk */
+ void onLoad(const Namespace& k);
+
+ /* dump info on this namespace. for debugging. */
+ void dump(const Namespace& k);
+
+ /* dump info on all extents for this namespace. for debugging. */
+ void dumpExtents();
+
+ private:
+ Extent *theCapExtent() const { return capExtent.ext(); }
+ void advanceCapExtent( const char *ns );
+ DiskLoc __capAlloc(int len);
+ DiskLoc cappedAlloc(const char *ns, int len);
+ DiskLoc &cappedFirstDeletedInCurExtent();
+ bool nextIsInCapExtent( const DiskLoc &dl ) const;
+
+ public:
+ DiskLoc& cappedListOfAllDeletedRecords() { return deletedList[0]; }
+ DiskLoc& cappedLastDelRecLastExtent() { return deletedList[1]; }
+ void cappedDumpDelInfo();
+ bool capLooped() const { return capped && capFirstNewRecord.isValid(); }
+ bool inCapExtent( const DiskLoc &dl ) const;
+ void cappedCheckMigrate();
+ /**
+ * Truncate documents newer than the document at 'end' from the capped
+ * collection. The collection cannot be completely emptied using this
+ * function. An assertion will be thrown if that is attempted.
+ * @param inclusive - Truncate 'end' as well iff true
+ */
+ void cappedTruncateAfter(const char *ns, DiskLoc end, bool inclusive);
+ /** Remove all documents from the capped collection */
+ void emptyCappedCollection(const char *ns);
+
+ /* when a background index build is in progress, we don't count the index in nIndexes until
+ complete, yet need to still use it in _indexRecord() - thus we use this function for that.
+ */
+ int nIndexesBeingBuilt() const { return nIndexes + indexBuildInProgress; }
+
+ /* NOTE: be careful with flags. are we manipulating them in read locks? if so,
+ this isn't thread safe. TODO
+ */
+ enum NamespaceFlags {
+ Flag_HaveIdIndex = 1 << 0 // set when we have _id index (ONLY if ensureIdIndex was called -- 0 if that has never been called)
+ };
+
+ IndexDetails& idx(int idxNo, bool missingExpected = false );
+
+ /** get the IndexDetails for the index currently being built in the background. (there is at most one) */
+ IndexDetails& inProgIdx() {
+ DEV assert(indexBuildInProgress);
+ return idx(nIndexes);
+ }
+
+ class IndexIterator {
+ public:
+ int pos() { return i; } // note this is the next one to come
+ bool more() { return i < n; }
+ IndexDetails& next() { return d->idx(i++); }
+ private:
+ friend class NamespaceDetails;
+ int i, n;
+ NamespaceDetails *d;
+ IndexIterator(NamespaceDetails *_d);
+ };
+
+ IndexIterator ii() { return IndexIterator(this); }
+
+ /* hackish - find our index # in the indexes array */
+ int idxNo(IndexDetails& idx);
+
+        /* multikey indexes are indexes where there is more than one key in the index
+ for a single document. see multikey in wiki.
+ for these, we have to do some dedup work on queries.
+ */
+ bool isMultikey(int i) const { return (multiKeyIndexBits & (((unsigned long long) 1) << i)) != 0; }
+ void setIndexIsMultikey(int i) {
+ dassert( i < NIndexesMax );
+ unsigned long long x = ((unsigned long long) 1) << i;
+ if( multiKeyIndexBits & x ) return;
+ *getDur().writing(&multiKeyIndexBits) |= x;
+ }
+ void clearIndexIsMultikey(int i) {
+ dassert( i < NIndexesMax );
+ unsigned long long x = ((unsigned long long) 1) << i;
+ if( (multiKeyIndexBits & x) == 0 ) return;
+ *getDur().writing(&multiKeyIndexBits) &= ~x;
+ }
+
+ /* add a new index. does not add to system.indexes etc. - just to NamespaceDetails.
+ caller must populate returned object.
+ */
+ IndexDetails& addIndex(const char *thisns, bool resetTransient=true);
+
+ void aboutToDeleteAnIndex() {
+ *getDur().writing(&flags) = flags & ~Flag_HaveIdIndex;
+ }
+
+ /* returns index of the first index in which the field is present. -1 if not present. */
+ int fieldIsIndexed(const char *fieldName);
+
+        /* called to indicate that an update fit in place.
+             this is also called on an insert -- the idea is that if you had some mix and then went to
+             pure inserts, it would adapt and PF would trend to 1.0. note that update calls insert on a
+             move, so there is a double count there that must be adjusted for below.
+
+ todo: greater sophistication could be helpful and added later. for example the absolute
+ size of documents might be considered -- in some cases smaller ones are more likely
+ to grow than larger ones in the same collection? (not always)
+ */
+ void paddingFits() {
+ MONGO_SOMETIMES(sometimes, 4) { // do this on a sampled basis to journal less
+ double x = paddingFactor - 0.001;
+ if ( x >= 1.0 ) {
+ *getDur().writing(&paddingFactor) = x;
+ }
+ }
+ }
+ void paddingTooSmall() {
+ MONGO_SOMETIMES(sometimes, 4) { // do this on a sampled basis to journal less
+ /* the more indexes we have, the higher the cost of a move. so we take that into
+ account herein. note on a move that insert() calls paddingFits(), thus
+ here for example with no inserts and nIndexes = 1 we have
+               .001*4-.001 or a 3:1 ratio to non moves -> 75% nonmoves. insert-heavy workloads
+               can push this down considerably. further tweaking will be a good idea but
+ this should be an adequate starting point.
+ */
+ double N = min(nIndexes,7) + 3;
+ double x = paddingFactor + (0.001 * N);
+ if ( x <= 2.0 ) {
+ *getDur().writing(&paddingFactor) = x;
+ }
+ }
+ }
+
+ // @return offset in indexes[]
+ int findIndexByName(const char *name);
+
+ // @return offset in indexes[]
+ int findIndexByKeyPattern(const BSONObj& keyPattern);
+
+ void findIndexByType( const string& name , vector<int>& matches ) {
+ IndexIterator i = ii();
+ while ( i.more() ) {
+ if ( i.next().getSpec().getTypeName() == name )
+ matches.push_back( i.pos() - 1 );
+ }
+ }
+
+ /* @return -1 = not found
+             generally the _id index is first, so this is not an expensive operation (assuming it is present).
+ */
+ int findIdIndex() {
+ IndexIterator i = ii();
+ while( i.more() ) {
+ if( i.next().isIdIndex() )
+ return i.pos()-1;
+ }
+ return -1;
+ }
+
+ bool haveIdIndex() {
+ return (flags & NamespaceDetails::Flag_HaveIdIndex) || findIdIndex() >= 0;
+ }
+
+        /* return which "deleted bucket" to use for an object of this size */
+ static int bucket(int n) {
+ for ( int i = 0; i < Buckets; i++ )
+ if ( bucketSizes[i] > n )
+ return i;
+ return Buckets-1;
+ }
+
+        /* predetermine the location of the next alloc without actually doing it.
+           if it cannot be predetermined, returns null (so still call alloc() in that case)
+        */
+ DiskLoc allocWillBeAt(const char *ns, int lenToAlloc);
+
+ /* allocate a new record. lenToAlloc includes headers. */
+ DiskLoc alloc(const char *ns, int lenToAlloc, DiskLoc& extentLoc);
+
+ /* add a given record to the deleted chains for this NS */
+ void addDeletedRec(DeletedRecord *d, DiskLoc dloc);
+ void dumpDeleted(set<DiskLoc> *extents = 0);
+ // Start from firstExtent by default.
+ DiskLoc firstRecord( const DiskLoc &startExtent = DiskLoc() ) const;
+ // Start from lastExtent by default.
+ DiskLoc lastRecord( const DiskLoc &startExtent = DiskLoc() ) const;
+ long long storageSize( int * numExtents = 0 , BSONArrayBuilder * extentInfo = 0 ) const;
+
+ int averageObjectSize() {
+ if ( stats.nrecords == 0 )
+ return 5;
+ return (int) (stats.datasize / stats.nrecords);
+ }
+
+ NamespaceDetails *writingWithoutExtra() {
+ return ( NamespaceDetails* ) getDur().writingPtr( this, sizeof( NamespaceDetails ) );
+ }
+ /** Make all linked Extra objects writeable as well */
+ NamespaceDetails *writingWithExtra();
+
+ private:
+ DiskLoc _alloc(const char *ns, int len);
+ void maybeComplain( const char *ns, int len ) const;
+        DiskLoc __stdAlloc(int len, bool peekOnly);
+ void compact(); // combine adjacent deleted records
+ friend class NamespaceIndex;
+ struct ExtraOld {
+ // note we could use this field for more chaining later, so don't waste it:
+ unsigned long long reserved1;
+ IndexDetails details[NIndexesExtra];
+ unsigned reserved2;
+ unsigned reserved3;
+ };
+ /** Update cappedLastDelRecLastExtent() after capExtent changed in cappedTruncateAfter() */
+ void cappedTruncateLastDelUpdate();
+ BOOST_STATIC_ASSERT( NIndexesMax <= NIndexesBase + NIndexesExtra*2 );
+ BOOST_STATIC_ASSERT( NIndexesMax <= 64 ); // multiKey bits
+ BOOST_STATIC_ASSERT( sizeof(NamespaceDetails::ExtraOld) == 496 );
+ BOOST_STATIC_ASSERT( sizeof(NamespaceDetails::Extra) == 496 );
+ }; // NamespaceDetails
+#pragma pack()
+
+ /* NamespaceDetailsTransient
+
+ these are things we know / compute about a namespace that are transient -- things
+ we don't actually store in the .ns file. so mainly caching of frequently used
+ information.
+
+       CAUTION: Are you maintaining this properly on a collection drop()? A dropDatabase()? Be careful.
+ The current field "allIndexKeys" may have too many keys in it on such an occurrence;
+ as currently used that does not cause anything terrible to happen.
+
+ todo: cleanup code, need abstractions and separation
+ */
+    // todo: multiple db's with the same name (repairDatabase) is not handled herein. that may be
+ // the way to go, if not used by repair, but need some sort of enforcement / asserts.
+ class NamespaceDetailsTransient : boost::noncopyable {
+ BOOST_STATIC_ASSERT( sizeof(NamespaceDetails) == 496 );
+
+ //Database *database;
+ const string _ns;
+ void reset();
+ static std::map< string, shared_ptr< NamespaceDetailsTransient > > _nsdMap;
+
+ NamespaceDetailsTransient(Database*,const char *ns);
+ public:
+ ~NamespaceDetailsTransient();
+ void addedIndex() { reset(); }
+ void deletedIndex() { reset(); }
+ /* Drop cached information on all namespaces beginning with the specified prefix.
+           Can be useful since index namespaces share the same prefix as the regular collection name.
+ SLOW - sequential scan of all NamespaceDetailsTransient objects */
+ static void clearForPrefix(const char *prefix);
+ static void eraseForPrefix(const char *prefix);
+
+ /**
+ * @return a cursor interface to the query optimizer. The implementation may utilize a
+ * single query plan or interleave results from multiple query plans before settling on a
+ * single query plan. Note that the schema of currKey() documents, indexKeyPattern(), the
+ * matcher(), and the isMultiKey() nature of the cursor may change over the course of
+ * iteration.
+ *
+ * @param query - Query used to select indexes and populate matchers; not copied if unowned
+ * (see bsonobj.h).
+ *
+ * @param order - Required ordering spec for documents produced by this cursor, empty object
+ * default indicates no order requirement. If no index exists that satisfies the required
+ * sort order, an empty shared_ptr is returned unless parsedQuery is also provided. This is
+ * not copied if unowned.
+ *
+ * @param planPolicy - A policy for selecting query plans - see queryoptimizercursor.h
+ *
+ * @param simpleEqualityMatch - Set to true for certain simple queries - see
+ * queryoptimizer.cpp.
+ *
+ * @param parsedQuery - Additional query parameters, as from a client query request. If
+ * specified, the resulting cursor may return results from out of order plans. See
+ * queryoptimizercursor.h for information on handling these results.
+ *
+ * @param singlePlanSummary - Query plan summary information that may be provided when a
+ * cursor running a single plan is returned.
+ *
+ * The returned cursor may @throw inside of advance() or recoverFromYield() in certain error
+ * cases, for example if a capped overrun occurred during a yield. This indicates that the
+ * cursor was unable to perform a complete scan.
+ *
+ * This is a work in progress. Partial list of features not yet implemented through this
+ * interface:
+ *
+ * - covered indexes
+ * - in memory sorting
+ */
+ static shared_ptr<Cursor> getCursor( const char *ns, const BSONObj &query,
+ const BSONObj &order = BSONObj(),
+ const QueryPlanSelectionPolicy &planPolicy =
+ QueryPlanSelectionPolicy::any(),
+ bool *simpleEqualityMatch = 0,
+ const ParsedQuery *parsedQuery = 0,
+ QueryPlan::Summary *singlePlanSummary = 0 );
+
+ /**
+ * @return a single cursor that may work well for the given query. A $or style query will
+ * produce a single cursor, not a MultiCursor.
+         * It is possible that no cursor is returned if the sort is not supported by an index.
+         * Clients are responsible for checking this when they are not sure an index for the sort
+         * exists, and for falling back to an unsorted query if no suitable indices exist.
+ */
+ static shared_ptr<Cursor> bestGuessCursor( const char *ns, const BSONObj &query, const BSONObj &sort );
+
+ /* indexKeys() cache ---------------------------------------------------- */
+ /* assumed to be in write lock for this */
+ private:
+ bool _keysComputed;
+ set<string> _indexKeys;
+ void computeIndexKeys();
+ public:
+ /* get set of index keys for this namespace. handy to quickly check if a given
+ field is indexed (Note it might be a secondary component of a compound index.)
+ */
+ set<string>& indexKeys() {
+ DEV Lock::assertWriteLocked(_ns);
+ if ( !_keysComputed )
+ computeIndexKeys();
+ return _indexKeys;
+ }
+
+ /* IndexSpec caching */
+ private:
+ map<const IndexDetails*,IndexSpec> _indexSpecs;
+ static SimpleMutex _isMutex;
+ public:
+ const IndexSpec& getIndexSpec( const IndexDetails * details ) {
+ IndexSpec& spec = _indexSpecs[details];
+ if ( ! spec._finishedInit ) {
+ SimpleMutex::scoped_lock lk(_isMutex);
+ if ( ! spec._finishedInit ) {
+ spec.reset( details );
+ assert( spec._finishedInit );
+ }
+ }
+ return spec;
+ }
+
+ /* query cache (for query optimizer) ------------------------------------- */
+ private:
+ int _qcWriteCount;
+ map< QueryPattern, pair< BSONObj, long long > > _qcCache;
+ static NamespaceDetailsTransient& make_inlock(const char *ns);
+ public:
+ static SimpleMutex _qcMutex;
+
+ /* you must be in the qcMutex when calling this.
+ A NamespaceDetailsTransient object will not go out of scope on you if you are
+           d.dbMutex.atLeastReadLocked(), so you don't have to stay locked.
+           Creates a NamespaceDetailsTransient before returning if one does not exist.
+ todo: avoid creating too many on erroneous ns queries.
+ */
+ static NamespaceDetailsTransient& get_inlock(const char *ns);
+
+ static NamespaceDetailsTransient& get(const char *ns) {
+ // todo : _qcMutex will create bottlenecks in our parallelism
+ SimpleMutex::scoped_lock lk(_qcMutex);
+ return get_inlock(ns);
+ }
+
+ void clearQueryCache() { // public for unit tests
+ _qcCache.clear();
+ _qcWriteCount = 0;
+ }
+ /* you must notify the cache if you are doing writes, as query plan optimality will change */
+ void notifyOfWriteOp() {
+ if ( _qcCache.empty() )
+ return;
+ if ( ++_qcWriteCount >= 100 )
+ clearQueryCache();
+ }
+ BSONObj indexForPattern( const QueryPattern &pattern ) {
+ return _qcCache[ pattern ].first;
+ }
+ long long nScannedForPattern( const QueryPattern &pattern ) {
+ return _qcCache[ pattern ].second;
+ }
+ void registerIndexForPattern( const QueryPattern &pattern, const BSONObj &indexKey, long long nScanned ) {
+ _qcCache[ pattern ] = make_pair( indexKey, nScanned );
+ }
+
+ }; /* NamespaceDetailsTransient */
+
+ inline NamespaceDetailsTransient& NamespaceDetailsTransient::get_inlock(const char *ns) {
+ std::map< string, shared_ptr< NamespaceDetailsTransient > >::iterator i = _nsdMap.find(ns);
+ if( i != _nsdMap.end() &&
+ i->second.get() ) { // could be null ptr from clearForPrefix
+ return *i->second;
+ }
+ return make_inlock(ns);
+ }
+
+ /* NamespaceIndex is the ".ns" file you see in the data directory. It is the "system catalog"
+ if you will: at least the core parts. (Additional info in system.* collections.)
+ */
+ class NamespaceIndex {
+ public:
+ NamespaceIndex(const string &dir, const string &database) :
+ ht( 0 ), dir_( dir ), database_( database ) {}
+
+        /* returns true if a new db will be created when we init lazily (i.e. the .ns file does not yet exist) */
+ bool exists() const;
+
+ void init() {
+ if( !ht )
+ _init();
+ }
+
+ void add_ns(const char *ns, DiskLoc& loc, bool capped);
+ void add_ns( const char *ns, const NamespaceDetails &details );
+
+ NamespaceDetails* details(const char *ns) {
+ if ( !ht )
+ return 0;
+ Namespace n(ns);
+ NamespaceDetails *d = ht->get(n);
+ if ( d && d->capped )
+ d->cappedCheckMigrate();
+ return d;
+ }
+
+ void kill_ns(const char *ns);
+
+ bool find(const char *ns, DiskLoc& loc) {
+ NamespaceDetails *l = details(ns);
+ if ( l ) {
+ loc = l->firstExtent;
+ return true;
+ }
+ return false;
+ }
+
+ bool allocated() const { return ht != 0; }
+
+ void getNamespaces( list<string>& tofill , bool onlyCollections = true ) const;
+
+ NamespaceDetails::Extra* newExtra(const char *ns, int n, NamespaceDetails *d);
+
+ boost::filesystem::path path() const;
+
+ unsigned long long fileLength() const { return f.length(); }
+
+ private:
+ void _init();
+ void maybeMkdir() const;
+
+ MongoMMF f;
+ HashTable<Namespace,NamespaceDetails> *ht;
+ string dir_;
+ string database_;
+ };
+
+ extern string dbpath; // --dbpath parm
+ extern bool directoryperdb;
+
+ // Rename a namespace within current 'client' db.
+ // (Arguments should include db name)
+ void renameNamespace( const char *from, const char *to, bool stayTemp);
+
+
+} // namespace mongo
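The paddingFactor comments in the class above compress a fair amount of arithmetic into prose. A standalone sketch (illustration only, not part of this patch) of the paddingFits()/paddingTooSmall() rule, with the MONGO_SOMETIMES sampling and getDur() journaling omitted:

    #include <algorithm>
    #include <cstdio>

    // Sketch of the padding feedback rule; sampling and journaling omitted.
    struct PaddingSim {
        double paddingFactor; // 1.0 = no padding; kept within [1.0, 2.0]
        int nIndexes;

        void paddingFits() {                      // an update fit in place
            double x = paddingFactor - 0.001;
            if ( x >= 1.0 ) paddingFactor = x;    // never drops below 1.0
        }
        void paddingTooSmall() {                  // an update forced a move
            double N = std::min(nIndexes, 7) + 3; // moves cost more with more indexes
            double x = paddingFactor + 0.001 * N;
            if ( x <= 2.0 ) paddingFactor = x;    // capped at 2.0
        }
    };

    int main() {
        PaddingSim s = { 1.5, 1 }; // start mid-range with a single index
        // Per the comment above: with nIndexes = 1 a move adds 0.004, the
        // insert performed by the move calls paddingFits() (-0.001), and three
        // plain in-place fits (-0.003) balance it, i.e. stable at ~75% non-moves.
        for ( int i = 0; i < 1000; i++ ) {
            if ( i % 4 == 0 ) { s.paddingTooSmall(); s.paddingFits(); }
            else s.paddingFits();
        }
        std::printf("paddingFactor ~ %.3f\n", s.paddingFactor); // stays near 1.50
        return 0;
    }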
diff --git a/src/mongo/db/pdfile.h b/src/mongo/db/pdfile.h
index ccab3eb8945..8520fb11af2 100644
--- a/src/mongo/db/pdfile.h
+++ b/src/mongo/db/pdfile.h
@@ -25,14 +25,16 @@
#pragma once
-#include "../pch.h"
-#include "../util/mmap.h"
-#include "diskloc.h"
-#include "jsobjmanipulator.h"
-#include "namespace-inl.h"
-#include "client.h"
-#include "mongommf.h"
-#include "memconcept.h"
+#include "mongo/db/client.h"
+#include "mongo/db/diskloc.h"
+#include "mongo/db/jsobjmanipulator.h"
+#include "mongo/db/memconcept.h"
+#include "mongo/db/mongommf.h"
+#include "mongo/db/namespace-inl.h"
+#include "mongo/db/namespace_details-inl.h"
+#include "mongo/db/namespacestring.h"
+#include "mongo/pch.h"
+#include "mongo/util/mmap.h"
namespace mongo {
diff --git a/src/mongo/db/security.h b/src/mongo/db/security.h
index f193f305def..625a3e116bc 100755
--- a/src/mongo/db/security.h
+++ b/src/mongo/db/security.h
@@ -18,31 +18,16 @@
#pragma once
-#include "nonce.h"
-#include "concurrency.h"
-#include "security_common.h"
-#include "../util/concurrency/spin_lock.h"
+#include "mongo/db/authlevel.h"
+#include "mongo/db/concurrency.h"
+#include "mongo/db/nonce.h"
+#include "mongo/db/security_common.h"
+#include "mongo/util/concurrency/spin_lock.h"
// this is used by both mongos and mongod
namespace mongo {
- /*
- * for a particular db
- * levels
- * 0 : none
- * 1 : read
- * 2 : write
- */
- struct Auth {
-
- enum Level { NONE = 0 , READ = 1 , WRITE = 2 };
-
- Auth() { level = NONE; }
- Level level;
- string user;
- };
-
class AuthenticationInfo : boost::noncopyable {
public:
bool isLocalHost;
diff --git a/src/mongo/s/shard.h b/src/mongo/s/shard.h
index 6b52c58a932..e30cd79841e 100644
--- a/src/mongo/s/shard.h
+++ b/src/mongo/s/shard.h
@@ -18,8 +18,10 @@
#pragma once
-#include "../pch.h"
-#include "../client/connpool.h"
+#include "mongo/pch.h"
+
+#include "mongo/client/connpool.h"
+#include "mongo/client/dbclient_rs.h"
namespace mongo {
diff --git a/src/mongo/s/strategy_shard.cpp b/src/mongo/s/strategy_shard.cpp
index 97d51890615..4d971859d99 100644
--- a/src/mongo/s/strategy_shard.cpp
+++ b/src/mongo/s/strategy_shard.cpp
@@ -16,16 +16,17 @@
// strategy_sharded.cpp
-#include "pch.h"
-#include "request.h"
-#include "chunk.h"
-#include "cursors.h"
-#include "stats.h"
-#include "client.h"
-#include "../bson/util/builder.h"
-
-#include "../client/connpool.h"
-#include "../db/commands.h"
+#include "mongo/pch.h"
+
+#include "mongo/bson/util/builder.h"
+#include "mongo/client/connpool.h"
+#include "mongo/db/commands.h"
+#include "mongo/db/index.h"
+#include "mongo/s/client.h"
+#include "mongo/s/cursors.h"
+#include "mongo/s/request.h"
+#include "mongo/s/stats.h"
+#include "mongo/s/chunk.h"
// error codes 8010-8040
diff --git a/src/mongo/tools/restore.cpp b/src/mongo/tools/restore.cpp
index 82cc99f8395..eaa4ea77dcb 100644
--- a/src/mongo/tools/restore.cpp
+++ b/src/mongo/tools/restore.cpp
@@ -16,19 +16,20 @@
* along with this program. If not, see <http://www.gnu.org/licenses/>.
*/
-#include "../pch.h"
-#include "../client/dbclient.h"
-#include "../util/mmap.h"
-#include "../util/version.h"
-#include "tool.h"
+#include "mongo/pch.h"
-#include <boost/program_options.hpp>
-#include <boost/filesystem/operations.hpp>
#include <boost/filesystem/convenience.hpp>
-
+#include <boost/filesystem/operations.hpp>
+#include <boost/program_options.hpp>
#include <fcntl.h>
-#include <set>
#include <fstream>
+#include <set>
+
+#include "mongo/client/dbclient.h"
+#include "mongo/db/namespacestring.h"
+#include "mongo/tools/tool.h"
+#include "mongo/util/mmap.h"
+#include "mongo/util/version.h"
using namespace mongo;
diff --git a/src/mongo/tools/tool.cpp b/src/mongo/tools/tool.cpp
index 767debbf947..eafae9cdfd0 100644
--- a/src/mongo/tools/tool.cpp
+++ b/src/mongo/tools/tool.cpp
@@ -16,16 +16,17 @@
// Tool.cpp
-#include "tool.h"
+#include "mongo/tools/tool.h"
#include <fstream>
#include <iostream>
#include "pcrecpp.h"
-#include "util/file_allocator.h"
-#include "util/password.h"
-#include "util/version.h"
+#include "mongo/db/namespace_details.h"
+#include "mongo/util/file_allocator.h"
+#include "mongo/util/password.h"
+#include "mongo/util/version.h"
#include <boost/filesystem/operations.hpp>
diff --git a/src/mongo/util/mmap.cpp b/src/mongo/util/mmap.cpp
index 85af905584c..a3911f83d75 100755
--- a/src/mongo/util/mmap.cpp
+++ b/src/mongo/util/mmap.cpp
@@ -15,16 +15,19 @@
* limitations under the License.
*/
-#include "pch.h"
-#include "mmap.h"
-#include "processinfo.h"
-#include "concurrency/rwlock.h"
-#include "../db/namespace.h"
-#include "../db/cmdline.h"
-#include "progress_meter.h"
+#include "mongo/pch.h"
+
+#include "mongo/util/mmap.h"
#include <boost/filesystem/operations.hpp>
+#include "mongo/db/cmdline.h"
+#include "mongo/db/namespace.h"
+#include "mongo/util/concurrency/rwlock.h"
+#include "mongo/util/mongoutils/str.h"
+#include "mongo/util/processinfo.h"
+#include "mongo/util/progress_meter.h"
+
namespace mongo {
set<MongoFile*> MongoFile::mmfiles;
@@ -58,7 +61,7 @@ namespace mongo {
l = boost::filesystem::file_size( filename );
}
catch(boost::filesystem::filesystem_error& e) {
- uasserted(15922, str::stream() << "couldn't get file length when opening mapping " << filename << ' ' << e.what() );
+ uasserted(15922, mongoutils::str::stream() << "couldn't get file length when opening mapping " << filename << ' ' << e.what() );
}
return map( filename , l );
}
@@ -68,7 +71,7 @@ namespace mongo {
l = boost::filesystem::file_size( filename );
}
catch(boost::filesystem::filesystem_error& e) {
- uasserted(15923, str::stream() << "couldn't get file length when opening mapping " << filename << ' ' << e.what() );
+ uasserted(15923, mongoutils::str::stream() << "couldn't get file length when opening mapping " << filename << ' ' << e.what() );
}
return map( filename , l, options );
}
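Both hunks above qualify the string builder as mongoutils::str::stream(), presumably because the shorter str:: alias is no longer in scope after the include cleanup. The idiom itself is small: a temporary that accumulates operator<< arguments and converts to std::string. A rough standalone sketch of the pattern (not mongoutils' actual implementation):

// Minimal sketch of the str::stream() idiom used in the uasserted() calls.
#include <iostream>
#include <sstream>
#include <string>

class stream {
public:
    template <typename T>
    stream& operator<<(const T& v) { ss_ << v; return *this; }
    operator std::string() const { return ss_.str(); }
private:
    std::ostringstream ss_;
};

int main() {
    std::string msg = stream() << "couldn't get file length when opening mapping "
                               << "data.ns" << ' ' << 42;
    std::cout << msg << std::endl;
    return 0;
}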
diff --git a/src/mongo/util/version.h b/src/mongo/util/version.h
index 64f8b140fd5..fcccc1494ab 100644
--- a/src/mongo/util/version.h
+++ b/src/mongo/util/version.h
@@ -3,21 +3,21 @@
#include <string>
+#include "mongo/bson/stringdata.h"
+
namespace mongo {
struct BSONArray;
- using std::string;
-
// mongo version
extern const char versionString[];
extern const BSONArray versionArray;
- string mongodVersion();
+ std::string mongodVersion();
int versionCmp(StringData rhs, StringData lhs); // like strcmp
const char * gitVersion();
void printGitVersion();
- string sysInfo();
+ std::string sysInfo();
void printSysInfo();
void show_warnings();
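versionCmp is documented only as "like strcmp". For intuition, a hypothetical dotted-version comparison with the same return convention; a real implementation would also need to handle pre-release suffixes such as "-rc0", which this sketch ignores:

// Toy strcmp-style comparison of dotted version strings ("2.0.2" vs "2.1");
// illustrative only, not mongo's actual versionCmp.
#include <cstdlib>
#include <iostream>
#include <sstream>
#include <string>
#include <vector>

static std::vector<long> parts(const std::string& v) {
    std::vector<long> out;
    std::istringstream ss(v);
    std::string tok;
    while (std::getline(ss, tok, '.'))
        out.push_back(std::atol(tok.c_str()));
    return out;
}

// Returns <0, 0 or >0 like strcmp; missing components compare as 0,
// so "2.0" == "2.0.0".
int toyVersionCmp(const std::string& a, const std::string& b) {
    std::vector<long> pa = parts(a), pb = parts(b);
    size_t n = pa.size() > pb.size() ? pa.size() : pb.size();
    for (size_t i = 0; i < n; ++i) {
        long x = i < pa.size() ? pa[i] : 0;
        long y = i < pb.size() ? pb[i] : 0;
        if (x != y) return x < y ? -1 : 1;
    }
    return 0;
}

int main() {
    std::cout << toyVersionCmp("2.0.2", "2.1") << "\n"; // -1
    std::cout << toyVersionCmp("2.0", "2.0.0") << "\n"; // 0
    return 0;
}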