summary refs log tree commit diff
path: root/bdb/db/db_overflow.c
diff options
context:
space:
mode:
Diffstat (limited to 'bdb/db/db_overflow.c')
-rw-r--r-- bdb/db/db_overflow.c 213
1 files changed, 129 insertions, 84 deletions
diff --git a/bdb/db/db_overflow.c b/bdb/db/db_overflow.c
index 54f0a03aafe..27dcb41a2ff 100644
--- a/bdb/db/db_overflow.c
+++ b/bdb/db/db_overflow.c
@@ -1,7 +1,7 @@
/*-
* See the file LICENSE for redistribution information.
*
- * Copyright (c) 1996, 1997, 1998, 1999, 2000
+ * Copyright (c) 1996-2002
* Sleepycat Software. All rights reserved.
*/
/*
@@ -43,7 +43,7 @@
#include "db_config.h"
#ifndef lint
-static const char revid[] = "$Id: db_overflow.c,v 11.21 2000/11/30 00:58:32 ubell Exp $";
+static const char revid[] = "$Id: db_overflow.c,v 11.46 2002/08/08 03:57:48 bostic Exp $";
#endif /* not lint */
#ifndef NO_SYSTEM_INCLUDES
@@ -53,9 +53,9 @@ static const char revid[] = "$Id: db_overflow.c,v 11.21 2000/11/30 00:58:32 ubel
#endif
#include "db_int.h"
-#include "db_page.h"
-#include "db_am.h"
-#include "db_verify.h"
+#include "dbinc/db_page.h"
+#include "dbinc/db_am.h"
+#include "dbinc/db_verify.h"
/*
* Big key/data code.
@@ -83,6 +83,7 @@ __db_goff(dbp, dbt, tlen, pgno, bpp, bpsz)
u_int32_t *bpsz;
{
DB_ENV *dbenv;
+ DB_MPOOLFILE *mpf;
PAGE *h;
db_indx_t bytes;
u_int32_t curoff, needed, start;
@@ -90,6 +91,7 @@ __db_goff(dbp, dbt, tlen, pgno, bpp, bpsz)
int ret;
dbenv = dbp->dbenv;
+ mpf = dbp->mpf;
/*
* Check if the buffer is big enough; if it is not and we are
@@ -99,7 +101,12 @@ __db_goff(dbp, dbt, tlen, pgno, bpp, bpsz)
*/
if (F_ISSET(dbt, DB_DBT_PARTIAL)) {
start = dbt->doff;
- needed = dbt->dlen;
+ if (start > tlen)
+ needed = 0;
+ else if (dbt->dlen > tlen - start)
+ needed = tlen - start;
+ else
+ needed = dbt->dlen;
} else {
start = 0;
needed = tlen;
@@ -112,15 +119,13 @@ __db_goff(dbp, dbt, tlen, pgno, bpp, bpsz)
return (ENOMEM);
}
} else if (F_ISSET(dbt, DB_DBT_MALLOC)) {
- if ((ret = __os_malloc(dbenv,
- needed, dbp->db_malloc, &dbt->data)) != 0)
+ if ((ret = __os_umalloc(dbenv, needed, &dbt->data)) != 0)
return (ret);
} else if (F_ISSET(dbt, DB_DBT_REALLOC)) {
- if ((ret = __os_realloc(dbenv,
- needed, dbp->db_realloc, &dbt->data)) != 0)
+ if ((ret = __os_urealloc(dbenv, needed, &dbt->data)) != 0)
return (ret);
} else if (*bpsz == 0 || *bpsz < needed) {
- if ((ret = __os_realloc(dbenv, needed, NULL, bpp)) != 0)
+ if ((ret = __os_realloc(dbenv, needed, bpp)) != 0)
return (ret);
*bpsz = needed;
dbt->data = *bpp;
@@ -133,13 +138,12 @@ __db_goff(dbp, dbt, tlen, pgno, bpp, bpsz)
*/
dbt->size = needed;
for (curoff = 0, p = dbt->data; pgno != PGNO_INVALID && needed > 0;) {
- if ((ret = memp_fget(dbp->mpf, &pgno, 0, &h)) != 0) {
- (void)__db_pgerr(dbp, pgno);
+ if ((ret = mpf->get(mpf, &pgno, 0, &h)) != 0)
return (ret);
- }
+
/* Check if we need any bytes from this page. */
if (curoff + OV_LEN(h) >= start) {
- src = (u_int8_t *)h + P_OVERHEAD;
+ src = (u_int8_t *)h + P_OVERHEAD(dbp);
bytes = OV_LEN(h);
if (start > curoff) {
src += start - curoff;
@@ -153,7 +157,7 @@ __db_goff(dbp, dbt, tlen, pgno, bpp, bpsz)
}
curoff += OV_LEN(h);
pgno = h->next_pgno;
- memp_fput(dbp->mpf, h, 0);
+ (void)mpf->put(mpf, h, 0);
}
return (0);
}
@@ -171,13 +175,14 @@ __db_poff(dbc, dbt, pgnop)
db_pgno_t *pgnop;
{
DB *dbp;
- PAGE *pagep, *lastp;
- DB_LSN new_lsn, null_lsn;
DBT tmp_dbt;
+ DB_LSN new_lsn, null_lsn;
+ DB_MPOOLFILE *mpf;
+ PAGE *pagep, *lastp;
db_indx_t pagespace;
u_int32_t sz;
u_int8_t *p;
- int ret;
+ int ret, t_ret;
/*
* Allocate pages and copy the key/data item into them. Calculate the
@@ -185,8 +190,10 @@ __db_poff(dbc, dbt, pgnop)
* item.
*/
dbp = dbc->dbp;
- pagespace = P_MAXSPACE(dbp->pgsize);
+ mpf = dbp->mpf;
+ pagespace = P_MAXSPACE(dbp, dbp->pgsize);
+ ret = 0;
lastp = NULL;
for (p = dbt->data,
sz = dbt->size; sz > 0; p += pagespace, sz -= pagespace) {
@@ -203,30 +210,36 @@ __db_poff(dbc, dbt, pgnop)
* have a partial record.
*/
if ((ret = __db_new(dbc, P_OVERFLOW, &pagep)) != 0)
- return (ret);
- if (DB_LOGGING(dbc)) {
+ break;
+ if (DBC_LOGGING(dbc)) {
tmp_dbt.data = p;
tmp_dbt.size = pagespace;
ZERO_LSN(null_lsn);
- if ((ret = __db_big_log(dbp->dbenv, dbc->txn,
- &new_lsn, 0, DB_ADD_BIG, dbp->log_fileid,
- PGNO(pagep), lastp ? PGNO(lastp) : PGNO_INVALID,
+ if ((ret = __db_big_log(dbp, dbc->txn,
+ &new_lsn, 0, DB_ADD_BIG, PGNO(pagep),
+ lastp ? PGNO(lastp) : PGNO_INVALID,
PGNO_INVALID, &tmp_dbt, &LSN(pagep),
lastp == NULL ? &null_lsn : &LSN(lastp),
- &null_lsn)) != 0)
- return (ret);
+ &null_lsn)) != 0) {
+ if (lastp != NULL)
+ (void)mpf->put(mpf,
+ lastp, DB_MPOOL_DIRTY);
+ lastp = pagep;
+ break;
+ }
+ } else
+ LSN_NOT_LOGGED(new_lsn);
- /* Move lsn onto page. */
- if (lastp)
- LSN(lastp) = new_lsn;
- LSN(pagep) = new_lsn;
- }
+ /* Move LSN onto page. */
+ if (lastp != NULL)
+ LSN(lastp) = new_lsn;
+ LSN(pagep) = new_lsn;
P_INIT(pagep, dbp->pgsize,
PGNO(pagep), PGNO_INVALID, PGNO_INVALID, 0, P_OVERFLOW);
OV_LEN(pagep) = pagespace;
OV_REF(pagep) = 1;
- memcpy((u_int8_t *)pagep + P_OVERHEAD, p, pagespace);
+ memcpy((u_int8_t *)pagep + P_OVERHEAD(dbp), p, pagespace);
/*
* If this is the first entry, update the user's info.
@@ -238,12 +251,14 @@ __db_poff(dbc, dbt, pgnop)
else {
lastp->next_pgno = PGNO(pagep);
pagep->prev_pgno = PGNO(lastp);
- (void)memp_fput(dbp->mpf, lastp, DB_MPOOL_DIRTY);
+ (void)mpf->put(mpf, lastp, DB_MPOOL_DIRTY);
}
lastp = pagep;
}
- (void)memp_fput(dbp->mpf, lastp, DB_MPOOL_DIRTY);
- return (0);
+ if (lastp != NULL &&
+ (t_ret = mpf->put(mpf, lastp, DB_MPOOL_DIRTY)) != 0 && ret == 0)
+ ret = t_ret;
+ return (ret);
}
/*
@@ -259,23 +274,29 @@ __db_ovref(dbc, pgno, adjust)
int32_t adjust;
{
DB *dbp;
+ DB_MPOOLFILE *mpf;
PAGE *h;
int ret;
dbp = dbc->dbp;
- if ((ret = memp_fget(dbp->mpf, &pgno, 0, &h)) != 0) {
- (void)__db_pgerr(dbp, pgno);
+ mpf = dbp->mpf;
+
+ if ((ret = mpf->get(mpf, &pgno, 0, &h)) != 0) {
+ __db_pgerr(dbp, pgno, ret);
return (ret);
}
- if (DB_LOGGING(dbc))
- if ((ret = __db_ovref_log(dbp->dbenv, dbc->txn,
- &LSN(h), 0, dbp->log_fileid, h->pgno, adjust,
- &LSN(h))) != 0)
+ if (DBC_LOGGING(dbc)) {
+ if ((ret = __db_ovref_log(dbp,
+ dbc->txn, &LSN(h), 0, h->pgno, adjust, &LSN(h))) != 0) {
+ (void)mpf->put(mpf, h, 0);
return (ret);
+ }
+ } else
+ LSN_NOT_LOGGED(LSN(h));
OV_REF(h) += adjust;
- (void)memp_fput(dbp->mpf, h, DB_MPOOL_DIRTY);
+ (void)mpf->put(mpf, h, DB_MPOOL_DIRTY);
return (0);
}
@@ -293,13 +314,16 @@ __db_doff(dbc, pgno)
DB *dbp;
PAGE *pagep;
DB_LSN null_lsn;
+ DB_MPOOLFILE *mpf;
DBT tmp_dbt;
int ret;
dbp = dbc->dbp;
+ mpf = dbp->mpf;
+
do {
- if ((ret = memp_fget(dbp->mpf, &pgno, 0, &pagep)) != 0) {
- (void)__db_pgerr(dbp, pgno);
+ if ((ret = mpf->get(mpf, &pgno, 0, &pagep)) != 0) {
+ __db_pgerr(dbp, pgno, ret);
return (ret);
}
@@ -309,20 +333,24 @@ __db_doff(dbc, pgno)
* decrement the reference count and return.
*/
if (OV_REF(pagep) > 1) {
- (void)memp_fput(dbp->mpf, pagep, 0);
+ (void)mpf->put(mpf, pagep, 0);
return (__db_ovref(dbc, pgno, -1));
}
- if (DB_LOGGING(dbc)) {
- tmp_dbt.data = (u_int8_t *)pagep + P_OVERHEAD;
+ if (DBC_LOGGING(dbc)) {
+ tmp_dbt.data = (u_int8_t *)pagep + P_OVERHEAD(dbp);
tmp_dbt.size = OV_LEN(pagep);
ZERO_LSN(null_lsn);
- if ((ret = __db_big_log(dbp->dbenv, dbc->txn,
- &LSN(pagep), 0, DB_REM_BIG, dbp->log_fileid,
- PGNO(pagep), PREV_PGNO(pagep), NEXT_PGNO(pagep),
- &tmp_dbt, &LSN(pagep), &null_lsn, &null_lsn)) != 0)
+ if ((ret = __db_big_log(dbp, dbc->txn,
+ &LSN(pagep), 0, DB_REM_BIG,
+ PGNO(pagep), PREV_PGNO(pagep),
+ NEXT_PGNO(pagep), &tmp_dbt,
+ &LSN(pagep), &null_lsn, &null_lsn)) != 0) {
+ (void)mpf->put(mpf, pagep, 0);
return (ret);
- }
+ }
+ } else
+ LSN_NOT_LOGGED(LSN(pagep));
pgno = pagep->next_pgno;
if ((ret = __db_free(dbc, pagep)) != 0)
return (ret);
@@ -352,13 +380,16 @@ __db_moff(dbp, dbt, pgno, tlen, cmpfunc, cmpp)
u_int32_t tlen;
int (*cmpfunc) __P((DB *, const DBT *, const DBT *)), *cmpp;
{
- PAGE *pagep;
DBT local_dbt;
+ DB_MPOOLFILE *mpf;
+ PAGE *pagep;
void *buf;
u_int32_t bufsize, cmp_bytes, key_left;
u_int8_t *p1, *p2;
int ret;
+ mpf = dbp->mpf;
+
/*
* If there is a user-specified comparison function, build a
* contiguous copy of the key, and call it.
@@ -373,27 +404,27 @@ __db_moff(dbp, dbt, pgno, tlen, cmpfunc, cmpp)
return (ret);
/* Pass the key as the first argument */
*cmpp = cmpfunc(dbp, dbt, &local_dbt);
- __os_free(buf, bufsize);
+ __os_free(dbp->dbenv, buf);
return (0);
}
/* While there are both keys to compare. */
for (*cmpp = 0, p1 = dbt->data,
key_left = dbt->size; key_left > 0 && pgno != PGNO_INVALID;) {
- if ((ret = memp_fget(dbp->mpf, &pgno, 0, &pagep)) != 0)
+ if ((ret = mpf->get(mpf, &pgno, 0, &pagep)) != 0)
return (ret);
cmp_bytes = OV_LEN(pagep) < key_left ? OV_LEN(pagep) : key_left;
tlen -= cmp_bytes;
key_left -= cmp_bytes;
- for (p2 =
- (u_int8_t *)pagep + P_OVERHEAD; cmp_bytes-- > 0; ++p1, ++p2)
+ for (p2 = (u_int8_t *)pagep + P_OVERHEAD(dbp);
+ cmp_bytes-- > 0; ++p1, ++p2)
if (*p1 != *p2) {
*cmpp = (long)*p1 - (long)*p2;
break;
}
pgno = NEXT_PGNO(pagep);
- if ((ret = memp_fput(dbp->mpf, pagep, 0)) != 0)
+ if ((ret = mpf->put(mpf, pagep, 0)) != 0)
return (ret);
if (*cmpp != 0)
return (0);
@@ -440,7 +471,7 @@ __db_vrfy_overflow(dbp, vdp, h, pgno, flags)
pip->refcount = OV_REF(h);
if (pip->refcount < 1) {
EPRINT((dbp->dbenv,
- "Overflow page %lu has zero reference count",
+ "Page %lu: overflow page has zero reference count",
(u_long)pgno));
isbad = 1;
}
@@ -448,7 +479,7 @@ __db_vrfy_overflow(dbp, vdp, h, pgno, flags)
/* Just store for now. */
pip->olen = HOFFSET(h);
-err: if ((t_ret = __db_vrfy_putpageinfo(vdp, pip)) != 0)
+err: if ((t_ret = __db_vrfy_putpageinfo(dbp->dbenv, vdp, pip)) != 0)
ret = t_ret;
return ((ret == 0 && isbad == 1) ? DB_VERIFY_BAD : ret);
}
@@ -495,7 +526,7 @@ __db_vrfy_ovfl_structure(dbp, vdp, pgno, tlen, flags)
if (pip->type != P_OVERFLOW) {
EPRINT((dbp->dbenv,
- "Overflow page %lu of invalid type",
+ "Page %lu: overflow page of invalid type %lu",
(u_long)pgno, (u_long)pip->type));
ret = DB_VERIFY_BAD;
goto err; /* Unsafe to continue. */
@@ -504,7 +535,8 @@ __db_vrfy_ovfl_structure(dbp, vdp, pgno, tlen, flags)
prev = pip->prev_pgno;
if (prev != PGNO_INVALID) {
EPRINT((dbp->dbenv,
- "First overflow page %lu has a prev_pgno", (u_long)pgno));
+ "Page %lu: first page in overflow chain has a prev_pgno %lu",
+ (u_long)pgno, (u_long)prev));
isbad = 1;
}
@@ -543,7 +575,7 @@ __db_vrfy_ovfl_structure(dbp, vdp, pgno, tlen, flags)
*/
if ((u_int32_t)p > refcount) {
EPRINT((dbp->dbenv,
- "Page %lu encountered twice in overflow traversal",
+ "Page %lu: encountered twice in overflow traversal",
(u_long)pgno));
ret = DB_VERIFY_BAD;
goto err;
@@ -571,19 +603,20 @@ __db_vrfy_ovfl_structure(dbp, vdp, pgno, tlen, flags)
if (!IS_VALID_PGNO(next)) {
DB_ASSERT(0);
EPRINT((dbp->dbenv,
- "Overflow page %lu has bad next_pgno",
- (u_long)pgno));
+ "Page %lu: bad next_pgno %lu on overflow page",
+ (u_long)pgno, (u_long)next));
ret = DB_VERIFY_BAD;
goto err;
}
- if ((ret = __db_vrfy_putpageinfo(vdp, pip)) != 0 ||
+ if ((ret = __db_vrfy_putpageinfo(dbp->dbenv, vdp, pip)) != 0 ||
(ret = __db_vrfy_getpageinfo(vdp, next, &pip)) != 0)
return (ret);
if (pip->prev_pgno != pgno) {
EPRINT((dbp->dbenv,
- "Overflow page %lu has bogus prev_pgno value",
- (u_long)next));
+ "Page %lu: bad prev_pgno %lu on overflow page (should be %lu)",
+ (u_long)next, (u_long)pip->prev_pgno,
+ (u_long)pgno));
isbad = 1;
/*
* It's safe to continue because we have separate
@@ -597,10 +630,11 @@ __db_vrfy_ovfl_structure(dbp, vdp, pgno, tlen, flags)
if (tlen > 0) {
isbad = 1;
EPRINT((dbp->dbenv,
- "Overflow item incomplete on page %lu", (u_long)pgno));
+ "Page %lu: overflow item incomplete", (u_long)pgno));
}
-err: if ((t_ret = __db_vrfy_putpageinfo(vdp, pip)) != 0 && ret == 0)
+err: if ((t_ret =
+ __db_vrfy_putpageinfo(dbp->dbenv, vdp, pip)) != 0 && ret == 0)
ret = t_ret;
return ((ret == 0 && isbad == 1) ? DB_VERIFY_BAD : ret);
}
@@ -622,13 +656,15 @@ __db_safe_goff(dbp, vdp, pgno, dbt, buf, flags)
void **buf;
u_int32_t flags;
{
+ DB_MPOOLFILE *mpf;
PAGE *h;
- int ret, err_ret;
+ int ret, t_ret;
u_int32_t bytesgot, bytes;
u_int8_t *src, *dest;
- ret = DB_VERIFY_BAD;
- err_ret = 0;
+ mpf = dbp->mpf;
+ h = NULL;
+ ret = t_ret = 0;
bytesgot = bytes = 0;
while ((pgno != PGNO_INVALID) && (IS_VALID_PGNO(pgno))) {
@@ -639,7 +675,7 @@ __db_safe_goff(dbp, vdp, pgno, dbt, buf, flags)
if ((ret = __db_salvage_markdone(vdp, pgno)) != 0)
break;
- if ((ret = memp_fget(dbp->mpf, &pgno, 0, &h)) != 0)
+ if ((ret = mpf->get(mpf, &pgno, 0, &h)) != 0)
break;
/*
@@ -651,14 +687,14 @@ __db_safe_goff(dbp, vdp, pgno, dbt, buf, flags)
break;
}
- src = (u_int8_t *)h + P_OVERHEAD;
+ src = (u_int8_t *)h + P_OVERHEAD(dbp);
bytes = OV_LEN(h);
- if (bytes + P_OVERHEAD > dbp->pgsize)
- bytes = dbp->pgsize - P_OVERHEAD;
+ if (bytes + P_OVERHEAD(dbp) > dbp->pgsize)
+ bytes = dbp->pgsize - P_OVERHEAD(dbp);
if ((ret = __os_realloc(dbp->dbenv,
- bytesgot + bytes, 0, buf)) != 0)
+ bytesgot + bytes, buf)) != 0)
break;
dest = (u_int8_t *)*buf + bytesgot;
@@ -667,15 +703,24 @@ __db_safe_goff(dbp, vdp, pgno, dbt, buf, flags)
memcpy(dest, src, bytes);
pgno = NEXT_PGNO(h);
- /* Not much we can do here--we don't want to quit. */
- if ((ret = memp_fput(dbp->mpf, h, 0)) != 0)
- err_ret = ret;
+
+ if ((ret = mpf->put(mpf, h, 0)) != 0)
+ break;
+ h = NULL;
}
- if (ret == 0) {
+ /*
+ * If we're being aggressive, salvage a partial datum if there
+ * was an error somewhere along the way.
+ */
+ if (ret == 0 || LF_ISSET(DB_AGGRESSIVE)) {
dbt->size = bytesgot;
dbt->data = *buf;
}
- return ((err_ret != 0 && ret == 0) ? err_ret : ret);
+ /* If we broke out on error, don't leave pages pinned. */
+ if (h != NULL && (t_ret = mpf->put(mpf, h, 0)) != 0 && ret == 0)
+ ret = t_ret;
+
+ return (ret);
}