summaryrefslogtreecommitdiff
path: root/src/dbreg/dbreg.c
diff options
context:
space:
mode:
Diffstat (limited to 'src/dbreg/dbreg.c')
-rw-r--r--src/dbreg/dbreg.c1012
1 files changed, 1012 insertions, 0 deletions
diff --git a/src/dbreg/dbreg.c b/src/dbreg/dbreg.c
new file mode 100644
index 00000000..5067edac
--- /dev/null
+++ b/src/dbreg/dbreg.c
@@ -0,0 +1,1012 @@
+/*-
+ * See the file LICENSE for redistribution information.
+ *
+ * Copyright (c) 1996, 2012 Oracle and/or its affiliates. All rights reserved.
+ *
+ * $Id$
+ */
+
+#include "db_config.h"
+
+#include "db_int.h"
+#include "dbinc/db_page.h"
+#include "dbinc/log.h"
+#include "dbinc/txn.h"
+#include "dbinc/db_am.h"
+
+static int __dbreg_push_id __P((ENV *, int32_t));
+static int __dbreg_pop_id __P((ENV *, int32_t *));
+static int __dbreg_pluck_id __P((ENV *, int32_t));
+
+/*
+ * The dbreg subsystem, as its name implies, registers database handles so
+ * that we can associate log messages with them without logging a filename
+ * or a full, unique DB ID. Instead, we assign each dbp an int32_t which is
+ * easy and cheap to log, and use this subsystem to map back and forth.
+ *
+ * Overview of how dbreg ids are managed:
+ *
+ * OPEN
+ * dbreg_setup (Creates FNAME struct.)
+ * dbreg_new_id (Assigns new ID to dbp and logs it. May be postponed
+ * until we attempt to log something else using that dbp, if the dbp
+ * was opened on a replication client.)
+ *
+ * CLOSE
+ * dbreg_close_id (Logs closure of dbp/revocation of ID.)
+ * dbreg_revoke_id (As name implies, revokes ID.)
+ * dbreg_teardown (Destroys FNAME.)
+ *
+ * RECOVERY
+ * dbreg_setup
+ * dbreg_assign_id (Assigns a particular ID we have in the log to a dbp.)
+ *
+ * sometimes: dbreg_revoke_id; dbreg_teardown
+ * other times: normal close path
+ *
+ * A note about locking:
+ *
+ * FNAME structures are referenced only by their corresponding dbp's
+ * until they have a valid id.
+ *
+ * Once they have a valid id, they must get linked into the log
+ * region list so they can get logged on checkpoints.
+ *
+ * An FNAME that may/does have a valid id must be accessed under
+ * protection of the mtx_filelist, with the following exception:
+ *
+ * We don't want to have to grab the mtx_filelist on every log
+ * record, and it should be safe not to do so when we're just
+ * looking at the id, because once allocated, the id should
+ * not change under a handle until the handle is closed.
+ *
+ * If a handle is closed during an attempt by another thread to
+ * log with it, well, the application doing the close deserves to
+ * go down in flames and a lot else is about to fail anyway.
+ *
+ * When in the course of logging we encounter an invalid id
+ * and go to allocate it lazily, we *do* need to check again
+ * after grabbing the mutex, because it's possible to race with
+ * another thread that has also decided that it needs to allocate
+ * a id lazily.
+ *
+ * See SR #5623 for further discussion of the new dbreg design.
+ */
+
+/*
+ * __dbreg_setup --
+ * Allocate and initialize an FNAME structure. The FNAME structures
+ * live in the log shared region and map one-to-one with open database handles.
+ * When the handle needs to be logged, the FNAME should have a valid fid
+ * allocated. If the handle currently isn't logged, it still has an FNAME
+ * entry. If we later discover that the handle needs to be logged, we can
+ * allocate a id for it later. (This happens when the handle is on a
+ * replication client that later becomes a master.)
+ *
+ * PUBLIC: int __dbreg_setup __P((DB *, const char *, const char *, u_int32_t));
+ */
+int
+__dbreg_setup(dbp, fname, dname, create_txnid)
+ DB *dbp;
+ const char *fname, *dname;
+ u_int32_t create_txnid;
+{
+ DB_LOG *dblp;
+ ENV *env;
+ FNAME *fnp;
+#ifdef HAVE_STATISTICS
+ LOG *lp;
+#endif
+ REGINFO *infop;
+ int ret;
+ size_t len;
+ void *p;
+
+ env = dbp->env;
+ dblp = env->lg_handle;
+ infop = &dblp->reginfo;
+
+ fnp = NULL;
+ p = NULL;
+
+ /* Allocate an FNAME and, if necessary, a buffer for the name itself. */
+ LOG_SYSTEM_LOCK(env);
+ if ((ret = __env_alloc(infop, sizeof(FNAME), &fnp)) != 0)
+ goto err;
+
+#ifdef HAVE_STATISTICS
+ lp = dblp->reginfo.primary;
+ if (++lp->stat.st_nfileid > lp->stat.st_maxnfileid)
+ lp->stat.st_maxnfileid = lp->stat.st_nfileid;
+#endif
+
+ memset(fnp, 0, sizeof(FNAME));
+ if (fname == NULL)
+ fnp->fname_off = INVALID_ROFF;
+ else {
+ len = strlen(fname) + 1;
+ if ((ret = __env_alloc(infop, len, &p)) != 0)
+ goto err;
+ fnp->fname_off = R_OFFSET(infop, p);
+ memcpy(p, fname, len);
+ }
+ if (dname == NULL)
+ fnp->dname_off = INVALID_ROFF;
+ else {
+ len = strlen(dname) + 1;
+ if ((ret = __env_alloc(infop, len, &p)) != 0)
+ goto err;
+ fnp->dname_off = R_OFFSET(infop, p);
+ memcpy(p, dname, len);
+ }
+ LOG_SYSTEM_UNLOCK(env);
+
+ /*
+ * Fill in all the remaining info that we'll need later to register
+ * the file, if we use it for logging.
+ */
+ fnp->id = fnp->old_id = DB_LOGFILEID_INVALID;
+ fnp->s_type = dbp->type;
+ memcpy(fnp->ufid, dbp->fileid, DB_FILE_ID_LEN);
+ fnp->meta_pgno = dbp->meta_pgno;
+ fnp->create_txnid = create_txnid;
+ dbp->dbenv->thread_id(dbp->dbenv, &fnp->pid, NULL);
+
+ if (F_ISSET(dbp, DB_AM_INMEM))
+ F_SET(fnp, DB_FNAME_INMEM);
+ if (F_ISSET(dbp, DB_AM_RECOVER))
+ F_SET(fnp, DB_FNAME_RECOVER);
+ /*
+ * The DB is BIGENDed if its bytes are swapped XOR
+ * the machine is bigended
+ */
+ if ((F_ISSET(dbp, DB_AM_SWAP) != 0) ^
+ (F_ISSET(env, ENV_LITTLEENDIAN) == 0))
+ F_SET(fnp, DBREG_BIGEND);
+ if (F_ISSET(dbp, DB_AM_CHKSUM))
+ F_SET(fnp, DBREG_CHKSUM);
+ if (F_ISSET(dbp, DB_AM_ENCRYPT))
+ F_SET(fnp, DBREG_ENCRYPT);
+ if (F2_ISSET(dbp, DB2_AM_EXCL))
+ F_SET(fnp, DBREG_EXCL);
+ fnp->txn_ref = 1;
+ fnp->mutex = dbp->mutex;
+
+ dbp->log_filename = fnp;
+
+ return (0);
+
+err: LOG_SYSTEM_UNLOCK(env);
+ if (ret == ENOMEM)
+ __db_errx(env, DB_STR("1501",
+ "Logging region out of memory; you may need to increase its size"));
+
+ return (ret);
+}
+
+/*
+ * __dbreg_teardown --
+ * Destroy a DB handle's FNAME struct. This is only called when closing
+ * the DB.
+ *
+ * PUBLIC: int __dbreg_teardown __P((DB *));
+ */
+int
+__dbreg_teardown(dbp)
+ DB *dbp;
+{
+ int ret;
+
+ /*
+ * We may not have an FNAME if we were never opened. This is not an
+ * error.
+ */
+ if (dbp->log_filename == NULL)
+ return (0);
+
+ ret = __dbreg_teardown_int(dbp->env, dbp->log_filename);
+
+ /* We freed the copy of the mutex from the FNAME. */
+ dbp->log_filename = NULL;
+ dbp->mutex = MUTEX_INVALID;
+
+ return (ret);
+}
+
+/*
+ * __dbreg_teardown_int --
+ * Destroy an FNAME struct.
+ *
+ * PUBLIC: int __dbreg_teardown_int __P((ENV *, FNAME *));
+ */
+int
+__dbreg_teardown_int(env, fnp)
+ ENV *env;
+ FNAME *fnp;
+{
+ DB_LOG *dblp;
+#ifdef HAVE_STATISTICS
+ LOG *lp;
+#endif
+ REGINFO *infop;
+ int ret;
+
+ if (F_ISSET(fnp, DB_FNAME_NOTLOGGED))
+ return (0);
+ dblp = env->lg_handle;
+ infop = &dblp->reginfo;
+#ifdef HAVE_STATISTICS
+ lp = dblp->reginfo.primary;
+#endif
+
+ DB_ASSERT(env, fnp->id == DB_LOGFILEID_INVALID);
+ ret = __mutex_free(env, &fnp->mutex);
+
+ LOG_SYSTEM_LOCK(env);
+ if (fnp->fname_off != INVALID_ROFF)
+ __env_alloc_free(infop, R_ADDR(infop, fnp->fname_off));
+ if (fnp->dname_off != INVALID_ROFF)
+ __env_alloc_free(infop, R_ADDR(infop, fnp->dname_off));
+ __env_alloc_free(infop, fnp);
+ STAT(lp->stat.st_nfileid--);
+ LOG_SYSTEM_UNLOCK(env);
+
+ return (ret);
+}
+
+/*
+ * __dbreg_new_id --
+ * Get an unused dbreg id to this database handle.
+ * Used as a wrapper to acquire the mutex and
+ * only set the id on success.
+ *
+ * PUBLIC: int __dbreg_new_id __P((DB *, DB_TXN *));
+ */
+int
+__dbreg_new_id(dbp, txn)
+ DB *dbp;
+ DB_TXN *txn;
+{
+ DB_LOG *dblp;
+ ENV *env;
+ FNAME *fnp;
+ LOG *lp;
+ int32_t id;
+ int ret;
+
+ env = dbp->env;
+ dblp = env->lg_handle;
+ lp = dblp->reginfo.primary;
+ fnp = dbp->log_filename;
+
+ /* The mtx_filelist protects the FNAME list and id management. */
+ MUTEX_LOCK(env, lp->mtx_filelist);
+ if (fnp->id != DB_LOGFILEID_INVALID) {
+ MUTEX_UNLOCK(env, lp->mtx_filelist);
+ return (0);
+ }
+ if ((ret = __dbreg_get_id(dbp, txn, &id)) == 0)
+ fnp->id = id;
+ MUTEX_UNLOCK(env, lp->mtx_filelist);
+ return (ret);
+}
+
+/*
+ * __dbreg_get_id --
+ * Assign an unused dbreg id to this database handle.
+ * Assume the caller holds the mtx_filelist locked. Assume the
+ * caller will set the fnp->id field with the id we return.
+ *
+ * PUBLIC: int __dbreg_get_id __P((DB *, DB_TXN *, int32_t *));
+ */
+int
+__dbreg_get_id(dbp, txn, idp)
+ DB *dbp;
+ DB_TXN *txn;
+ int32_t *idp;
+{
+ DB_LOG *dblp;
+ ENV *env;
+ FNAME *fnp;
+ LOG *lp;
+ int32_t id;
+ int ret;
+
+ env = dbp->env;
+ dblp = env->lg_handle;
+ lp = dblp->reginfo.primary;
+ fnp = dbp->log_filename;
+
+ /*
+ * It's possible that after deciding we needed to call this function,
+ * someone else allocated an ID before we grabbed the lock. Check
+ * to make sure there was no race and we have something useful to do.
+ */
+ /* Get an unused ID from the free list. */
+ if ((ret = __dbreg_pop_id(env, &id)) != 0)
+ goto err;
+
+ /* If no ID was found, allocate a new one. */
+ if (id == DB_LOGFILEID_INVALID)
+ id = lp->fid_max++;
+
+ /* If the file is durable (i.e., not, not-durable), mark it as such. */
+ if (!F_ISSET(dbp, DB_AM_NOT_DURABLE))
+ F_SET(fnp, DB_FNAME_DURABLE);
+
+ /* Hook the FNAME into the list of open files. */
+ SH_TAILQ_INSERT_HEAD(&lp->fq, fnp, q, __fname);
+
+ /*
+ * Log the registry. We should only request a new ID in situations
+ * where logging is reasonable.
+ */
+ DB_ASSERT(env, !F_ISSET(dbp, DB_AM_RECOVER));
+
+ if ((ret = __dbreg_log_id(dbp, txn, id, 0)) != 0)
+ goto err;
+
+ /*
+ * Once we log the create_txnid, we need to make sure we never
+ * log it again (as might happen if this is a replication client
+ * that later upgrades to a master).
+ */
+ fnp->create_txnid = TXN_INVALID;
+
+ DB_ASSERT(env, dbp->type == fnp->s_type);
+ DB_ASSERT(env, dbp->meta_pgno == fnp->meta_pgno);
+
+ if ((ret = __dbreg_add_dbentry(env, dblp, dbp, id)) != 0)
+ goto err;
+ /*
+ * If we have a successful call, set the ID. Otherwise
+ * we have to revoke it and remove it from all the lists
+ * it has been added to, and return an invalid id.
+ */
+err:
+ if (ret != 0 && id != DB_LOGFILEID_INVALID) {
+ (void)__dbreg_revoke_id(dbp, 1, id);
+ id = DB_LOGFILEID_INVALID;
+ }
+ *idp = id;
+ return (ret);
+}
+
+/*
+ * __dbreg_assign_id --
+ * Assign a particular dbreg id to this database handle.
+ *
+ * PUBLIC: int __dbreg_assign_id __P((DB *, int32_t, int));
+ */
+int
+__dbreg_assign_id(dbp, id, deleted)
+ DB *dbp;
+ int32_t id;
+ int deleted;
+{
+ DB *close_dbp;
+ DB_LOG *dblp;
+ ENV *env;
+ FNAME *close_fnp, *fnp;
+ LOG *lp;
+ int ret;
+
+ env = dbp->env;
+ dblp = env->lg_handle;
+ lp = dblp->reginfo.primary;
+ fnp = dbp->log_filename;
+
+ close_dbp = NULL;
+ close_fnp = NULL;
+
+ /* The mtx_filelist protects the FNAME list and id management. */
+ MUTEX_LOCK(env, lp->mtx_filelist);
+
+ /* We should only call this on DB handles that have no ID. */
+ DB_ASSERT(env, fnp->id == DB_LOGFILEID_INVALID);
+
+ /*
+ * Make sure there isn't already a file open with this ID. There can
+ * be in recovery, if we're recovering across a point where an ID got
+ * reused.
+ */
+ if (__dbreg_id_to_fname(dblp, id, 1, &close_fnp) == 0) {
+ /*
+ * We want to save off any dbp we have open with this id. We
+ * can't safely close it now, because we hold the mtx_filelist,
+ * but we should be able to rely on it being open in this
+ * process, and we're running recovery, so no other thread
+ * should muck with it if we just put off closing it until
+ * we're ready to return.
+ *
+ * Once we have the dbp, revoke its id; we're about to
+ * reuse it.
+ */
+ ret = __dbreg_id_to_db(env, NULL, &close_dbp, id, 0);
+ if (ret == ENOENT) {
+ ret = 0;
+ goto cont;
+ } else if (ret != 0)
+ goto err;
+
+ if ((ret = __dbreg_revoke_id(close_dbp, 1,
+ DB_LOGFILEID_INVALID)) != 0)
+ goto err;
+ }
+
+ /*
+ * Remove this ID from the free list, if it's there, and make sure
+ * we don't allocate it anew.
+ */
+cont: if ((ret = __dbreg_pluck_id(env, id)) != 0)
+ goto err;
+ if (id >= lp->fid_max)
+ lp->fid_max = id + 1;
+
+ /* Now go ahead and assign the id to our dbp. */
+ fnp->id = id;
+ /* If the file is durable (i.e., not, not-durable), mark it as such. */
+ if (!F_ISSET(dbp, DB_AM_NOT_DURABLE))
+ F_SET(fnp, DB_FNAME_DURABLE);
+ SH_TAILQ_INSERT_HEAD(&lp->fq, fnp, q, __fname);
+
+ /*
+ * If we get an error adding the dbentry, revoke the id.
+ * We void the return value since we want to retain and
+ * return the original error in ret anyway.
+ */
+ if ((ret = __dbreg_add_dbentry(env, dblp, dbp, id)) != 0)
+ (void)__dbreg_revoke_id(dbp, 1, id);
+ else
+ dblp->dbentry[id].deleted = deleted;
+
+err: MUTEX_UNLOCK(env, lp->mtx_filelist);
+
+ /* There's nothing useful that our caller can do if this close fails. */
+ if (close_dbp != NULL)
+ (void)__db_close(close_dbp, NULL, DB_NOSYNC);
+
+ return (ret);
+}
+
+/*
+ * __dbreg_revoke_id --
+ * Take a log id away from a dbp, in preparation for closing it,
+ * but without logging the close.
+ *
+ * PUBLIC: int __dbreg_revoke_id __P((DB *, int, int32_t));
+ */
+int
+__dbreg_revoke_id(dbp, have_lock, force_id)
+ DB *dbp;
+ int have_lock;
+ int32_t force_id;
+{
+ DB_REP *db_rep;
+ ENV *env;
+ int push;
+
+ env = dbp->env;
+
+ /*
+ * If we are not in recovery but the file was opened for a recovery
+ * operation, then this process aborted a transaction for another
+ * process and the id may still be in use, so don't reuse this id.
+ * If our fid generation in replication has changed, this fid
+ * should not be reused
+ */
+ db_rep = env->rep_handle;
+ push = (!F_ISSET(dbp, DB_AM_RECOVER) || IS_RECOVERING(env)) &&
+ (!REP_ON(env) || ((REP *)db_rep->region)->gen == dbp->fid_gen);
+
+ return (__dbreg_revoke_id_int(dbp->env,
+ dbp->log_filename, have_lock, push, force_id));
+}
+/*
+ * __dbreg_revoke_id_int --
+ * Revoke a log, in preparation for closing it, but without logging
+ * the close.
+ *
+ * PUBLIC: int __dbreg_revoke_id_int
+ * PUBLIC: __P((ENV *, FNAME *, int, int, int32_t));
+ */
+int
+__dbreg_revoke_id_int(env, fnp, have_lock, push, force_id)
+ ENV *env;
+ FNAME *fnp;
+ int have_lock, push;
+ int32_t force_id;
+{
+ DB_LOG *dblp;
+ LOG *lp;
+ int32_t id;
+ int ret;
+
+ dblp = env->lg_handle;
+ lp = dblp->reginfo.primary;
+ ret = 0;
+
+ /* If we lack an ID, this is a null-op. */
+ if (fnp == NULL)
+ return (0);
+
+ /*
+ * If we have a force_id, we had an error after allocating
+ * the id, and putting it on the fq list, but before we
+ * finished setting up fnp. So, if we have a force_id use it.
+ */
+ if (force_id != DB_LOGFILEID_INVALID)
+ id = force_id;
+ else if (fnp->id == DB_LOGFILEID_INVALID) {
+ if (fnp->old_id == DB_LOGFILEID_INVALID)
+ return (0);
+ id = fnp->old_id;
+ } else
+ id = fnp->id;
+ if (!have_lock)
+ MUTEX_LOCK(env, lp->mtx_filelist);
+
+ fnp->id = DB_LOGFILEID_INVALID;
+ fnp->old_id = DB_LOGFILEID_INVALID;
+
+ /* Remove the FNAME from the list of open files. */
+ SH_TAILQ_REMOVE(&lp->fq, fnp, q, __fname);
+
+ /*
+ * This FNAME may be for a DBP which is already closed. Its ID may
+ * still be in use by an aborting transaction. If not,
+ * remove this id from the dbentry table and push it onto the
+ * free list.
+ */
+ if ((ret = __dbreg_rem_dbentry(dblp, id)) == 0 && push)
+ ret = __dbreg_push_id(env, id);
+
+ if (!have_lock)
+ MUTEX_UNLOCK(env, lp->mtx_filelist);
+ return (ret);
+}
+
+/*
+ * __dbreg_close_id --
+ * Take a dbreg id away from a dbp that we're closing, and log
+ * the unregistry if the refcount goes to 0.
+ *
+ * PUBLIC: int __dbreg_close_id __P((DB *, DB_TXN *, u_int32_t));
+ */
+int
+__dbreg_close_id(dbp, txn, op)
+ DB *dbp;
+ DB_TXN *txn;
+ u_int32_t op;
+{
+ DB_LOG *dblp;
+ ENV *env;
+ FNAME *fnp;
+ LOG *lp;
+ int ret, t_ret;
+
+ env = dbp->env;
+ dblp = env->lg_handle;
+ lp = dblp->reginfo.primary;
+ fnp = dbp->log_filename;
+
+ /* If we lack an ID, this is a null-op. */
+ if (fnp == NULL)
+ return (0);
+
+ if (fnp->id == DB_LOGFILEID_INVALID) {
+ ret = __dbreg_revoke_id(dbp, 0, DB_LOGFILEID_INVALID);
+ goto done;
+ }
+
+ /*
+ * If we are the last reference to this db then we need to log it
+ * as closed. Otherwise the last transaction will do the logging.
+ * Remove the DBP from the db entry table since it can nolonger
+ * be used. If we abort it will have to be reopened.
+ */
+ ret = 0;
+ DB_ASSERT(env, fnp->txn_ref > 0);
+ if (fnp->txn_ref > 1) {
+ MUTEX_LOCK(env, dbp->mutex);
+ if (fnp->txn_ref > 1) {
+ if ((t_ret = __dbreg_rem_dbentry(
+ env->lg_handle, fnp->id)) != 0 && ret == 0)
+ ret = t_ret;
+
+ /*
+ * The DB handle has been closed in the logging system.
+ * Transactions may still have a ref to this name.
+ * Mark it so that if recovery reopens the file id
+ * the transaction will not close the wrong handle.
+ */
+ F_SET(fnp, DB_FNAME_CLOSED);
+ fnp->txn_ref--;
+ MUTEX_UNLOCK(env, dbp->mutex);
+ /* The mutex now lives only in the FNAME. */
+ dbp->mutex = MUTEX_INVALID;
+ dbp->log_filename = NULL;
+ goto no_log;
+ }
+ }
+ MUTEX_LOCK(env, lp->mtx_filelist);
+
+ if ((ret = __dbreg_log_close(env, fnp, txn, op)) != 0)
+ goto err;
+ ret = __dbreg_revoke_id(dbp, 1, DB_LOGFILEID_INVALID);
+
+err: MUTEX_UNLOCK(env, lp->mtx_filelist);
+
+done: if ((t_ret = __dbreg_teardown(dbp)) != 0 && ret == 0)
+ ret = t_ret;
+no_log:
+ return (ret);
+}
+/*
+ * __dbreg_close_id_int --
+ * Close down a dbreg id and log the unregistry. This is called only
+ * when a transaction has the last ref to the fname.
+ *
+ * PUBLIC: int __dbreg_close_id_int __P((ENV *, FNAME *, u_int32_t, int));
+ */
+int
+__dbreg_close_id_int(env, fnp, op, locked)
+ ENV *env;
+ FNAME *fnp;
+ u_int32_t op;
+ int locked;
+{
+ DB_LOG *dblp;
+ LOG *lp;
+ int ret, t_ret;
+
+ DB_ASSERT(env, fnp->txn_ref == 1);
+ dblp = env->lg_handle;
+ lp = dblp->reginfo.primary;
+
+ if (fnp->id == DB_LOGFILEID_INVALID)
+ return (__dbreg_revoke_id_int(env,
+ fnp, locked, 1, DB_LOGFILEID_INVALID));
+
+ if (F_ISSET(fnp, DB_FNAME_RECOVER))
+ return (__dbreg_close_file(env, fnp));
+ /*
+ * If log_close fails then it will mark the name DB_FNAME_NOTLOGGED
+ * and the id must persist.
+ */
+ if (!locked)
+ MUTEX_LOCK(env, lp->mtx_filelist);
+ if ((ret = __dbreg_log_close(env, fnp, NULL, op)) != 0)
+ goto err;
+
+ ret = __dbreg_revoke_id_int(env, fnp, 1, 1, DB_LOGFILEID_INVALID);
+
+err: if (!locked)
+ MUTEX_UNLOCK(env, lp->mtx_filelist);
+
+ if ((t_ret = __dbreg_teardown_int(env, fnp)) != 0 && ret == 0)
+ ret = t_ret;
+ return (ret);
+}
+
+/*
+ * __dbreg_failchk --
+ *
+ * Look for entries that belong to dead processes and either close them
+ * out or, if there are pending transactions, just remove the mutex which
+ * will get discarded later.
+ *
+ * PUBLIC: int __dbreg_failchk __P((ENV *));
+ */
+int
+__dbreg_failchk(env)
+ ENV *env;
+{
+ DB_ENV *dbenv;
+ DB_LOG *dblp;
+ FNAME *fnp, *nnp;
+ LOG *lp;
+ int ret, t_ret;
+ char buf[DB_THREADID_STRLEN];
+ db_threadid_t unused;
+
+ if ((dblp = env->lg_handle) == NULL)
+ return (0);
+
+ DB_THREADID_INIT(unused);
+
+ lp = dblp->reginfo.primary;
+ dbenv = env->dbenv;
+ ret = 0;
+
+ MUTEX_LOCK(env, lp->mtx_filelist);
+ for (fnp = SH_TAILQ_FIRST(&lp->fq, __fname); fnp != NULL; fnp = nnp) {
+ nnp = SH_TAILQ_NEXT(fnp, q, __fname);
+ if (dbenv->is_alive(dbenv,
+ fnp->pid, unused, DB_MUTEX_PROCESS_ONLY))
+ continue;
+ MUTEX_LOCK(env, fnp->mutex);
+ __db_msg(env, DB_STR_A("1502",
+ "Freeing log information for process: %s, (ref %lu)",
+ "%s %lu"),
+ dbenv->thread_id_string(dbenv, fnp->pid, unused, buf),
+ (u_long)fnp->txn_ref);
+ if (fnp->txn_ref > 1 || F_ISSET(fnp, DB_FNAME_CLOSED)) {
+ if (!F_ISSET(fnp, DB_FNAME_CLOSED)) {
+ fnp->txn_ref--;
+ F_SET(fnp, DB_FNAME_CLOSED);
+ }
+ MUTEX_UNLOCK(env, fnp->mutex);
+ fnp->mutex = MUTEX_INVALID;
+ fnp->pid = 0;
+ } else {
+ F_SET(fnp, DB_FNAME_CLOSED);
+ if ((t_ret = __dbreg_close_id_int(env,
+ fnp, DBREG_CLOSE, 1)) && ret == 0)
+ ret = t_ret;
+ }
+ }
+
+ MUTEX_UNLOCK(env, lp->mtx_filelist);
+ return (ret);
+}
+/*
+ * __dbreg_log_close --
+ *
+ * Log a close of a database. Called when closing a file or when a
+ * replication client is becoming a master. That closes all the
+ * files it previously had open.
+ *
+ * Assumes caller holds the lp->mutex_filelist lock already.
+ *
+ * PUBLIC: int __dbreg_log_close __P((ENV *, FNAME *,
+ * PUBLIC: DB_TXN *, u_int32_t));
+ */
+int
+__dbreg_log_close(env, fnp, txn, op)
+ ENV *env;
+ FNAME *fnp;
+ DB_TXN *txn;
+ u_int32_t op;
+{
+ DBT fid_dbt, r_name, *dbtp;
+ DB_LOG *dblp;
+ DB_LSN r_unused;
+ int ret;
+
+ dblp = env->lg_handle;
+ ret = 0;
+
+ if (fnp->fname_off == INVALID_ROFF)
+ dbtp = NULL;
+ else {
+ memset(&r_name, 0, sizeof(r_name));
+ r_name.data = R_ADDR(&dblp->reginfo, fnp->fname_off);
+ r_name.size = (u_int32_t)strlen((char *)r_name.data) + 1;
+ dbtp = &r_name;
+ }
+ memset(&fid_dbt, 0, sizeof(fid_dbt));
+ fid_dbt.data = fnp->ufid;
+ fid_dbt.size = DB_FILE_ID_LEN;
+ if ((ret = __dbreg_register_log(env, txn, &r_unused,
+ F_ISSET(fnp, DB_FNAME_DURABLE) ? 0 : DB_LOG_NOT_DURABLE,
+ op, dbtp, &fid_dbt, fnp->id,
+ fnp->s_type, fnp->meta_pgno, TXN_INVALID)) != 0) {
+ /*
+ * We are trying to close, but the log write failed.
+ * Unfortunately, close needs to plow forward, because
+ * the application can't do anything with the handle.
+ * Make the entry in the shared memory region so that
+ * when we close the environment, we know that this
+ * happened. Also, make sure we remove this from the
+ * per-process table, so that we don't try to close it
+ * later.
+ */
+ F_SET(fnp, DB_FNAME_NOTLOGGED);
+ (void)__dbreg_rem_dbentry(dblp, fnp->id);
+ }
+ return (ret);
+}
+
+/*
+ * __dbreg_push_id and __dbreg_pop_id --
+ * Dbreg ids from closed files are kept on a stack in shared memory
+ * for recycling. (We want to reuse them as much as possible because each
+ * process keeps open files in an array by ID.) Push them to the stack and
+ * pop them from it, managing memory as appropriate.
+ *
+ * The stack is protected by the mtx_filelist, and both functions assume it
+ * is already locked.
+ */
+static int
+__dbreg_push_id(env, id)
+ ENV *env;
+ int32_t id;
+{
+ DB_LOG *dblp;
+ LOG *lp;
+ REGINFO *infop;
+ int32_t *stack, *newstack;
+ int ret;
+
+ dblp = env->lg_handle;
+ infop = &dblp->reginfo;
+ lp = infop->primary;
+
+ if (id == lp->fid_max - 1) {
+ lp->fid_max--;
+ return (0);
+ }
+
+ /* Check if we have room on the stack. */
+ if (lp->free_fid_stack == INVALID_ROFF ||
+ lp->free_fids_alloced <= lp->free_fids + 1) {
+ LOG_SYSTEM_LOCK(env);
+ if ((ret = __env_alloc(infop,
+ (lp->free_fids_alloced + 20) * sizeof(u_int32_t),
+ &newstack)) != 0) {
+ LOG_SYSTEM_UNLOCK(env);
+ return (ret);
+ }
+
+ if (lp->free_fid_stack != INVALID_ROFF) {
+ stack = R_ADDR(infop, lp->free_fid_stack);
+ memcpy(newstack, stack,
+ lp->free_fids_alloced * sizeof(u_int32_t));
+ __env_alloc_free(infop, stack);
+ }
+ lp->free_fid_stack = R_OFFSET(infop, newstack);
+ lp->free_fids_alloced += 20;
+ LOG_SYSTEM_UNLOCK(env);
+ }
+
+ stack = R_ADDR(infop, lp->free_fid_stack);
+ stack[lp->free_fids++] = id;
+ return (0);
+}
+
+static int
+__dbreg_pop_id(env, id)
+ ENV *env;
+ int32_t *id;
+{
+ DB_LOG *dblp;
+ LOG *lp;
+ int32_t *stack;
+
+ dblp = env->lg_handle;
+ lp = dblp->reginfo.primary;
+
+ /* Do we have anything to pop? */
+ if (lp->free_fid_stack != INVALID_ROFF && lp->free_fids > 0) {
+ stack = R_ADDR(&dblp->reginfo, lp->free_fid_stack);
+ *id = stack[--lp->free_fids];
+ } else
+ *id = DB_LOGFILEID_INVALID;
+
+ return (0);
+}
+
+/*
+ * __dbreg_pluck_id --
+ * Remove a particular dbreg id from the stack of free ids. This is
+ * used when we open a file, as in recovery, with a specific ID that might
+ * be on the stack.
+ *
+ * Returns success whether or not the particular id was found, and like
+ * push and pop, assumes that the mtx_filelist is locked.
+ */
+static int
+__dbreg_pluck_id(env, id)
+ ENV *env;
+ int32_t id;
+{
+ DB_LOG *dblp;
+ LOG *lp;
+ int32_t *stack;
+ u_int i;
+
+ dblp = env->lg_handle;
+ lp = dblp->reginfo.primary;
+
+ if (id >= lp->fid_max)
+ return (0);
+
+ /* Do we have anything to look at? */
+ if (lp->free_fid_stack != INVALID_ROFF) {
+ stack = R_ADDR(&dblp->reginfo, lp->free_fid_stack);
+ for (i = 0; i < lp->free_fids; i++)
+ if (id == stack[i]) {
+ /*
+ * Found it. Overwrite it with the top
+ * id (which may harmlessly be itself),
+ * and shorten the stack by one.
+ */
+ stack[i] = stack[lp->free_fids - 1];
+ lp->free_fids--;
+ return (0);
+ }
+ }
+
+ return (0);
+}
+
+/*
+ * __dbreg_log_id --
+ * Used for in-memory named files. They are created in mpool and
+ * are given id's early in the open process so that we can read and
+ * create pages in the mpool for the files. However, at the time that
+ * the mpf is created, the file may not be fully created and/or its
+ * meta-data may not be fully known, so we can't do a full dbregister.
+ * This is a routine exported that will log a complete dbregister
+ * record that will allow for both recovery and replication.
+ *
+ * PUBLIC: int __dbreg_log_id __P((DB *, DB_TXN *, int32_t, int));
+ */
+int
+__dbreg_log_id(dbp, txn, id, needlock)
+ DB *dbp;
+ DB_TXN *txn;
+ int32_t id;
+ int needlock;
+{
+ DBT fid_dbt, r_name;
+ DB_LOG *dblp;
+ DB_LSN unused;
+ ENV *env;
+ FNAME *fnp;
+ LOG *lp;
+ u_int32_t op;
+ int i, ret;
+
+ env = dbp->env;
+ dblp = env->lg_handle;
+ lp = dblp->reginfo.primary;
+ fnp = dbp->log_filename;
+
+ /*
+ * Verify that the fnp has been initialized, by seeing if it
+ * has any non-zero bytes in it.
+ */
+ for (i = 0; i < DB_FILE_ID_LEN; i++)
+ if (fnp->ufid[i] != 0)
+ break;
+ if (i == DB_FILE_ID_LEN)
+ memcpy(fnp->ufid, dbp->fileid, DB_FILE_ID_LEN);
+
+ if (fnp->s_type == DB_UNKNOWN)
+ fnp->s_type = dbp->type;
+
+ /*
+ * Log the registry. We should only request a new ID in situations
+ * where logging is reasonable.
+ */
+ memset(&fid_dbt, 0, sizeof(fid_dbt));
+ memset(&r_name, 0, sizeof(r_name));
+
+ if (needlock)
+ MUTEX_LOCK(env, lp->mtx_filelist);
+
+ if (fnp->fname_off != INVALID_ROFF) {
+ r_name.data = R_ADDR(&dblp->reginfo, fnp->fname_off);
+ r_name.size = (u_int32_t)strlen((char *)r_name.data) + 1;
+ }
+
+ fid_dbt.data = dbp->fileid;
+ fid_dbt.size = DB_FILE_ID_LEN;
+
+ op = !F_ISSET(dbp, DB_AM_OPEN_CALLED) ? DBREG_PREOPEN :
+ (F_ISSET(dbp, DB_AM_INMEM) ?
+ (F2_ISSET(dbp, DB2_AM_EXCL) ? DBREG_XREOPEN : DBREG_REOPEN):
+ (F2_ISSET(dbp, DB2_AM_EXCL) ? DBREG_XOPEN : DBREG_OPEN));
+ ret = __dbreg_register_log(env, txn, &unused,
+ F_ISSET(dbp, DB_AM_NOT_DURABLE) ? DB_LOG_NOT_DURABLE : 0,
+ op | F_ISSET(fnp, DB_FNAME_DBREG_MASK),
+ r_name.size == 0 ? NULL : &r_name, &fid_dbt, id,
+ fnp->s_type, fnp->meta_pgno, fnp->create_txnid);
+
+ if (needlock)
+ MUTEX_UNLOCK(env, lp->mtx_filelist);
+
+ return (ret);
+}