1997-08-27 20:26:10 +00:00
|
|
|
/*-
 * See the file LICENSE for redistribution information.
 *
 * Copyright (c) 1996, 1997, 1998
 *	Sleepycat Software.  All rights reserved.
 */
/*
 * Copyright (c) 1990, 1993, 1994, 1995, 1996
 *	Keith Bostic.  All rights reserved.
 */
/*
 * Copyright (c) 1990, 1993
 *	The Regents of the University of California.  All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. All advertising materials mentioning features or use of this software
 *    must display the following acknowledgement:
 *	This product includes software developed by the University of
 *	California, Berkeley and its contributors.
 * 4. Neither the name of the University nor the names of its contributors
 *    may be used to endorse or promote products derived from this software
 *    without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */
|
|
|
|
|
|
|
|
#include "config.h"
|
|
|
|
|
|
|
|
#ifndef lint
|
1998-06-09 15:16:55 +00:00
|
|
|
static const char sccsid[] = "@(#)bt_rsearch.c 10.15 (Sleepycat) 5/6/98";
|
1997-08-27 20:26:10 +00:00
|
|
|
#endif /* not lint */
|
|
|
|
|
|
|
|
#ifndef NO_SYSTEM_INCLUDES
|
|
|
|
#include <sys/types.h>
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#include "db_int.h"
|
|
|
|
#include "db_page.h"
|
|
|
|
#include "btree.h"
|
|
|
|
|
|
|
|
/*
|
|
|
|
* __bam_rsearch --
|
|
|
|
* Search a btree for a record number.
|
|
|
|
*
|
1998-06-09 15:16:55 +00:00
|
|
|
* PUBLIC: int __bam_rsearch __P((DB *, db_recno_t *, u_int32_t, int, int *));
|
1997-08-27 20:26:10 +00:00
|
|
|
*/
|
|
|
|
int
|
|
|
|
__bam_rsearch(dbp, recnop, flags, stop, exactp)
|
|
|
|
DB *dbp;
|
|
|
|
db_recno_t *recnop;
|
1998-06-09 15:16:55 +00:00
|
|
|
u_int32_t flags;
|
1997-08-27 20:26:10 +00:00
|
|
|
int stop, *exactp;
|
|
|
|
{
|
|
|
|
BINTERNAL *bi;
|
|
|
|
BTREE *t;
|
|
|
|
DB_LOCK lock;
|
|
|
|
PAGE *h;
|
|
|
|
RINTERNAL *ri;
|
|
|
|
db_indx_t indx, top;
|
|
|
|
db_pgno_t pg;
|
1998-06-09 15:16:55 +00:00
|
|
|
db_recno_t i, recno, total;
|
1997-08-27 20:26:10 +00:00
|
|
|
int isappend, ret, stack;
|
|
|
|
|
|
|
|
t = dbp->internal;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* We test for groups of flags, S_APPEND is the only one that can be
|
|
|
|
* OR'd into the set. Clear it now so that the tests for equality
|
|
|
|
* will work.
|
|
|
|
*/
|
|
|
|
if ((isappend = LF_ISSET(S_APPEND)) != 0)
|
|
|
|
LF_CLR(S_APPEND);
|
|
|
|
|
|
|
|
/*
|
|
|
|
* There are several ways we search a btree tree. The flags argument
|
|
|
|
* specifies if we're acquiring read or write locks and if we are
|
|
|
|
* locking pairs of pages. See btree.h for more details.
|
|
|
|
*
|
|
|
|
* If write-locking pages, we need to know whether or not to acquire a
|
|
|
|
* write lock on a page before getting it. This depends on how deep it
|
|
|
|
* is in tree, which we don't know until we acquire the root page. So,
|
|
|
|
* if we need to lock the root page we may have to upgrade it later,
|
|
|
|
* because we won't get the correct lock initially.
|
|
|
|
*
|
|
|
|
* Retrieve the root page.
|
|
|
|
*/
|
|
|
|
pg = PGNO_ROOT;
|
|
|
|
if ((ret = __bam_lget(dbp, 0, PGNO_ROOT,
|
|
|
|
flags == S_INSERT || flags == S_DELETE ?
|
|
|
|
DB_LOCK_WRITE : DB_LOCK_READ, &lock)) != 0)
|
|
|
|
return (ret);
|
|
|
|
if ((ret = __bam_pget(dbp, &h, &pg, 0)) != 0) {
|
|
|
|
(void)__BT_LPUT(dbp, lock);
|
|
|
|
return (ret);
|
|
|
|
}
|
|
|
|
total = RE_NREC(h);
|
|
|
|
|
|
|
|
/*
|
|
|
|
* If appending to the tree, set the record number now -- we have the
|
|
|
|
* root page locked.
|
|
|
|
*
|
|
|
|
* Delete only deletes exact matches, read only returns exact matches.
|
|
|
|
* Note, this is different from __bam_search(), which returns non-exact
|
|
|
|
* matches for read.
|
|
|
|
*
|
|
|
|
* The record may not exist. We can only return the correct location
|
|
|
|
* for the record immediately after the last record in the tree, so do
|
|
|
|
* a fast check now.
|
|
|
|
*/
|
|
|
|
if (isappend) {
|
|
|
|
*exactp = 0;
|
|
|
|
*recnop = recno = total + 1;
|
|
|
|
} else {
|
|
|
|
recno = *recnop;
|
|
|
|
if (recno <= total)
|
|
|
|
*exactp = 1;
|
|
|
|
else {
|
|
|
|
*exactp = 0;
|
1998-06-09 15:16:55 +00:00
|
|
|
if (!PAST_END_OK(flags) || recno > total + 1) {
|
1997-08-27 20:26:10 +00:00
|
|
|
(void)memp_fput(dbp->mpf, h, 0);
|
|
|
|
(void)__BT_LPUT(dbp, lock);
|
|
|
|
return (DB_NOTFOUND);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Decide if we're building a stack based on the operation. */
|
|
|
|
BT_STK_CLR(t);
|
|
|
|
stack = flags == S_DELETE || flags == S_INSERT;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Decide if we need to save this page; if we do, write lock it, and
|
|
|
|
* start to build a stack.
|
|
|
|
*/
|
|
|
|
if (LF_ISSET(S_PARENT) && (u_int8_t)(stop + 1) >= h->level) {
|
|
|
|
(void)memp_fput(dbp->mpf, h, 0);
|
|
|
|
if ((ret = __bam_lget(dbp, 1, pg, DB_LOCK_WRITE, &lock)) != 0)
|
|
|
|
return (ret);
|
|
|
|
if ((ret = __bam_pget(dbp, &h, &pg, 0)) != 0) {
|
|
|
|
(void)__BT_LPUT(dbp, lock);
|
|
|
|
return (ret);
|
|
|
|
}
|
|
|
|
stack = 1;
|
|
|
|
}
|
|
|
|
|
1998-06-09 15:16:55 +00:00
|
|
|
/*
|
|
|
|
* !!!
|
|
|
|
* Record numbers in the tree are 0-based, but the recno is
|
|
|
|
* 1-based. All of the calculations below have to take this
|
|
|
|
* into account.
|
|
|
|
*/
|
1997-08-27 20:26:10 +00:00
|
|
|
for (total = 0;;) {
|
|
|
|
switch (TYPE(h)) {
|
|
|
|
case P_LBTREE:
|
1998-06-09 15:16:55 +00:00
|
|
|
recno -= total;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* There may be logically deleted records on the page,
|
|
|
|
* walk the page correcting for them. The record may
|
|
|
|
* not exist if there are enough deleted records in the
|
|
|
|
* page.
|
|
|
|
*/
|
|
|
|
if (recno <= NUM_ENT(h))
|
|
|
|
for (i = recno - 1;; --i) {
|
|
|
|
if (B_DISSET(GET_BKEYDATA(h,
|
|
|
|
i * P_INDX + O_INDX)->type))
|
|
|
|
++recno;
|
|
|
|
if (i == 0)
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
if (recno > NUM_ENT(h)) {
|
|
|
|
*exactp = 0;
|
|
|
|
if (!PAST_END_OK(flags) ||
|
|
|
|
recno > (db_recno_t)(NUM_ENT(h) + 1)) {
|
|
|
|
ret = DB_NOTFOUND;
|
|
|
|
goto err;
|
|
|
|
}
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Correct from 1-based to 0-based for a page offset. */
|
|
|
|
--recno;
|
|
|
|
BT_STK_ENTER(t, h, recno * P_INDX, lock, ret);
|
1997-08-27 20:26:10 +00:00
|
|
|
return (ret);
|
|
|
|
case P_IBTREE:
|
|
|
|
for (indx = 0, top = NUM_ENT(h);;) {
|
|
|
|
bi = GET_BINTERNAL(h, indx);
|
1998-06-09 15:16:55 +00:00
|
|
|
if (++indx == top || total + bi->nrecs >= recno)
|
1997-08-27 20:26:10 +00:00
|
|
|
break;
|
|
|
|
total += bi->nrecs;
|
|
|
|
}
|
|
|
|
pg = bi->pgno;
|
|
|
|
break;
|
|
|
|
case P_LRECNO:
|
1998-06-09 15:16:55 +00:00
|
|
|
recno -= total;
|
|
|
|
|
|
|
|
/* Correct from 1-based to 0-based for a page offset. */
|
|
|
|
--recno;
|
|
|
|
BT_STK_ENTER(t, h, recno, lock, ret);
|
1997-08-27 20:26:10 +00:00
|
|
|
return (ret);
|
|
|
|
case P_IRECNO:
|
|
|
|
for (indx = 0, top = NUM_ENT(h);;) {
|
|
|
|
ri = GET_RINTERNAL(h, indx);
|
1998-06-09 15:16:55 +00:00
|
|
|
if (++indx == top || total + ri->nrecs >= recno)
|
1997-08-27 20:26:10 +00:00
|
|
|
break;
|
|
|
|
total += ri->nrecs;
|
|
|
|
}
|
|
|
|
pg = ri->pgno;
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
return (__db_pgfmt(dbp, h->pgno));
|
|
|
|
}
|
|
|
|
--indx;
|
|
|
|
|
|
|
|
if (stack) {
|
|
|
|
/* Return if this is the lowest page wanted. */
|
|
|
|
if (LF_ISSET(S_PARENT) && stop == h->level) {
|
|
|
|
BT_STK_ENTER(t, h, indx, lock, ret);
|
|
|
|
return (ret);
|
|
|
|
}
|
|
|
|
BT_STK_PUSH(t, h, indx, lock, ret);
|
|
|
|
if (ret)
|
|
|
|
goto err;
|
|
|
|
|
|
|
|
if ((ret = __bam_lget(dbp, 0, pg,
|
|
|
|
LF_ISSET(S_WRITE) ? DB_LOCK_WRITE : DB_LOCK_READ,
|
|
|
|
&lock)) != 0)
|
|
|
|
goto err;
|
|
|
|
} else {
|
|
|
|
(void)memp_fput(dbp->mpf, h, 0);
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Decide if we want to return a pointer to the next
|
|
|
|
* page in the stack. If we do, write lock it and
|
|
|
|
* never unlock it.
|
|
|
|
*/
|
|
|
|
if (LF_ISSET(S_PARENT) &&
|
|
|
|
(u_int8_t)(stop + 1) >= (u_int8_t)(h->level - 1))
|
|
|
|
stack = 1;
|
|
|
|
|
|
|
|
if ((ret = __bam_lget(dbp, 1, pg,
|
|
|
|
LF_ISSET(S_WRITE) ? DB_LOCK_WRITE : DB_LOCK_READ,
|
|
|
|
&lock)) != 0)
|
|
|
|
goto err;
|
|
|
|
}
|
|
|
|
|
|
|
|
if ((ret = __bam_pget(dbp, &h, &pg, 0)) != 0)
|
|
|
|
goto err;
|
|
|
|
}
|
|
|
|
/* NOTREACHED */
|
|
|
|
|
|
|
|
err: BT_STK_POP(t);
|
|
|
|
__bam_stkrel(dbp);
|
|
|
|
return (ret);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* __bam_adjust --
|
|
|
|
* Adjust the tree after adding or deleting a record.
|
|
|
|
*
|
1998-06-09 15:16:55 +00:00
|
|
|
* PUBLIC: int __bam_adjust __P((DB *, BTREE *, int32_t));
|
1997-08-27 20:26:10 +00:00
|
|
|
*/
|
|
|
|
int
|
|
|
|
__bam_adjust(dbp, t, adjust)
|
|
|
|
DB *dbp;
|
|
|
|
BTREE *t;
|
1998-06-09 15:16:55 +00:00
|
|
|
int32_t adjust;
|
1997-08-27 20:26:10 +00:00
|
|
|
{
|
|
|
|
EPG *epg;
|
|
|
|
PAGE *h;
|
|
|
|
int ret;
|
|
|
|
|
|
|
|
/* Update the record counts for the tree. */
|
|
|
|
for (epg = t->bt_sp; epg <= t->bt_csp; ++epg) {
|
|
|
|
h = epg->page;
|
|
|
|
if (TYPE(h) == P_IBTREE || TYPE(h) == P_IRECNO) {
|
|
|
|
if (DB_LOGGING(dbp) &&
|
|
|
|
(ret = __bam_cadjust_log(dbp->dbenv->lg_info,
|
|
|
|
dbp->txn, &LSN(h), 0, dbp->log_fileid,
|
|
|
|
PGNO(h), &LSN(h), (u_int32_t)epg->indx,
|
1998-06-09 15:16:55 +00:00
|
|
|
adjust, 1)) != 0)
|
1997-08-27 20:26:10 +00:00
|
|
|
return (ret);
|
|
|
|
|
|
|
|
if (TYPE(h) == P_IBTREE)
|
|
|
|
GET_BINTERNAL(h, epg->indx)->nrecs += adjust;
|
|
|
|
else
|
|
|
|
GET_RINTERNAL(h, epg->indx)->nrecs += adjust;
|
|
|
|
|
|
|
|
if (PGNO(h) == PGNO_ROOT)
|
|
|
|
RE_NREC_ADJ(h, adjust);
|
|
|
|
|
|
|
|
if ((ret = memp_fset(dbp->mpf, h, DB_MPOOL_DIRTY)) != 0)
|
|
|
|
return (ret);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return (0);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* __bam_nrecs --
|
|
|
|
* Return the number of records in the tree.
|
|
|
|
*
|
|
|
|
* PUBLIC: int __bam_nrecs __P((DB *, db_recno_t *));
|
|
|
|
*/
|
|
|
|
int
|
|
|
|
__bam_nrecs(dbp, rep)
|
|
|
|
DB *dbp;
|
|
|
|
db_recno_t *rep;
|
|
|
|
{
|
|
|
|
DB_LOCK lock;
|
|
|
|
PAGE *h;
|
|
|
|
db_pgno_t pgno;
|
|
|
|
int ret;
|
|
|
|
|
|
|
|
pgno = PGNO_ROOT;
|
|
|
|
if ((ret = __bam_lget(dbp, 0, pgno, DB_LOCK_READ, &lock)) != 0)
|
|
|
|
return (ret);
|
|
|
|
if ((ret = __bam_pget(dbp, &h, &pgno, 0)) != 0)
|
|
|
|
return (ret);
|
|
|
|
|
|
|
|
*rep = RE_NREC(h);
|
|
|
|
|
|
|
|
(void)memp_fput(dbp->mpf, h, 0);
|
|
|
|
(void)__BT_TLPUT(dbp, lock);
|
|
|
|
|
|
|
|
return (0);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* __bam_total --
|
|
|
|
* Return the number of records below a page.
|
|
|
|
*
|
|
|
|
* PUBLIC: db_recno_t __bam_total __P((PAGE *));
|
|
|
|
*/
|
|
|
|
db_recno_t
|
|
|
|
__bam_total(h)
|
|
|
|
PAGE *h;
|
|
|
|
{
|
1998-06-09 15:16:55 +00:00
|
|
|
db_recno_t nrecs;
|
|
|
|
db_indx_t indx, top;
|
|
|
|
|
|
|
|
nrecs = 0;
|
|
|
|
top = NUM_ENT(h);
|
1997-08-27 20:26:10 +00:00
|
|
|
|
|
|
|
switch (TYPE(h)) {
|
|
|
|
case P_LBTREE:
|
1998-06-09 15:16:55 +00:00
|
|
|
/* Check for logically deleted records. */
|
|
|
|
for (indx = 0; indx < top; indx += P_INDX)
|
|
|
|
if (!B_DISSET(GET_BKEYDATA(h, indx + O_INDX)->type))
|
|
|
|
++nrecs;
|
1997-08-27 20:26:10 +00:00
|
|
|
break;
|
|
|
|
case P_IBTREE:
|
1998-06-09 15:16:55 +00:00
|
|
|
for (indx = 0; indx < top; indx += O_INDX)
|
|
|
|
nrecs += GET_BINTERNAL(h, indx)->nrecs;
|
1997-08-27 20:26:10 +00:00
|
|
|
break;
|
|
|
|
case P_LRECNO:
|
1998-06-09 15:16:55 +00:00
|
|
|
nrecs = NUM_ENT(h);
|
1997-08-27 20:26:10 +00:00
|
|
|
break;
|
|
|
|
case P_IRECNO:
|
1998-06-09 15:16:55 +00:00
|
|
|
for (indx = 0; indx < top; indx += O_INDX)
|
|
|
|
nrecs += GET_RINTERNAL(h, indx)->nrecs;
|
1997-08-27 20:26:10 +00:00
|
|
|
break;
|
|
|
|
}
|
1998-06-09 15:16:55 +00:00
|
|
|
|
|
|
|
return (nrecs);
|
1997-08-27 20:26:10 +00:00
|
|
|
}
|