xref: /freebsd/lib/libc/db/btree/bt_utils.c (revision 8a16b7a18f5d0b031f09832fd7752fba717e2a97)
158f0484fSRodney W. Grimes /*-
2*8a16b7a1SPedro F. Giffuni  * SPDX-License-Identifier: BSD-3-Clause
3*8a16b7a1SPedro F. Giffuni  *
4ef5d438eSPaul Traina  * Copyright (c) 1990, 1993, 1994
558f0484fSRodney W. Grimes  *	The Regents of the University of California.  All rights reserved.
658f0484fSRodney W. Grimes  *
758f0484fSRodney W. Grimes  * This code is derived from software contributed to Berkeley by
858f0484fSRodney W. Grimes  * Mike Olson.
958f0484fSRodney W. Grimes  *
1058f0484fSRodney W. Grimes  * Redistribution and use in source and binary forms, with or without
1158f0484fSRodney W. Grimes  * modification, are permitted provided that the following conditions
1258f0484fSRodney W. Grimes  * are met:
1358f0484fSRodney W. Grimes  * 1. Redistributions of source code must retain the above copyright
1458f0484fSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer.
1558f0484fSRodney W. Grimes  * 2. Redistributions in binary form must reproduce the above copyright
1658f0484fSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer in the
1758f0484fSRodney W. Grimes  *    documentation and/or other materials provided with the distribution.
18fbbd9655SWarner Losh  * 3. Neither the name of the University nor the names of its contributors
1958f0484fSRodney W. Grimes  *    may be used to endorse or promote products derived from this software
2058f0484fSRodney W. Grimes  *    without specific prior written permission.
2158f0484fSRodney W. Grimes  *
2258f0484fSRodney W. Grimes  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
2358f0484fSRodney W. Grimes  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
2458f0484fSRodney W. Grimes  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
2558f0484fSRodney W. Grimes  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
2658f0484fSRodney W. Grimes  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
2758f0484fSRodney W. Grimes  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
2858f0484fSRodney W. Grimes  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
2958f0484fSRodney W. Grimes  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
3058f0484fSRodney W. Grimes  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
3158f0484fSRodney W. Grimes  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
3258f0484fSRodney W. Grimes  * SUCH DAMAGE.
3358f0484fSRodney W. Grimes  */
3458f0484fSRodney W. Grimes 
3558f0484fSRodney W. Grimes #if defined(LIBC_SCCS) && !defined(lint)
36ef5d438eSPaul Traina static char sccsid[] = "@(#)bt_utils.c	8.8 (Berkeley) 7/20/94";
3758f0484fSRodney W. Grimes #endif /* LIBC_SCCS and not lint */
388fb3f3f6SDavid E. O'Brien #include <sys/cdefs.h>
398fb3f3f6SDavid E. O'Brien __FBSDID("$FreeBSD$");
4058f0484fSRodney W. Grimes 
4158f0484fSRodney W. Grimes #include <sys/param.h>
4258f0484fSRodney W. Grimes 
4358f0484fSRodney W. Grimes #include <stdio.h>
4458f0484fSRodney W. Grimes #include <stdlib.h>
4558f0484fSRodney W. Grimes #include <string.h>
4658f0484fSRodney W. Grimes 
4758f0484fSRodney W. Grimes #include <db.h>
4858f0484fSRodney W. Grimes #include "btree.h"
4958f0484fSRodney W. Grimes 
5058f0484fSRodney W. Grimes /*
51ef5d438eSPaul Traina  * __bt_ret --
52ef5d438eSPaul Traina  *	Build return key/data pair.
5358f0484fSRodney W. Grimes  *
5458f0484fSRodney W. Grimes  * Parameters:
5558f0484fSRodney W. Grimes  *	t:	tree
56ef5d438eSPaul Traina  *	e:	key/data pair to be returned
5758f0484fSRodney W. Grimes  *	key:	user's key structure (NULL if not to be filled in)
58ef5d438eSPaul Traina  *	rkey:	memory area to hold key
59ef5d438eSPaul Traina  *	data:	user's data structure (NULL if not to be filled in)
60ef5d438eSPaul Traina  *	rdata:	memory area to hold data
61ef5d438eSPaul Traina  *       copy:	always copy the key/data item
6258f0484fSRodney W. Grimes  *
6358f0484fSRodney W. Grimes  * Returns:
6458f0484fSRodney W. Grimes  *	RET_SUCCESS, RET_ERROR.
6558f0484fSRodney W. Grimes  */
6658f0484fSRodney W. Grimes int
670ac22237SXin LI __bt_ret(BTREE *t, EPG *e, DBT *key, DBT *rkey, DBT *data, DBT *rdata, int copy)
6858f0484fSRodney W. Grimes {
69ef5d438eSPaul Traina 	BLEAF *bl;
70ef5d438eSPaul Traina 	void *p;
7158f0484fSRodney W. Grimes 
7258f0484fSRodney W. Grimes 	bl = GETBLEAF(e->page, e->index);
7358f0484fSRodney W. Grimes 
7458f0484fSRodney W. Grimes 	/*
75ef5d438eSPaul Traina 	 * We must copy big keys/data to make them contigous.  Otherwise,
76ef5d438eSPaul Traina 	 * leave the page pinned and don't copy unless the user specified
7758f0484fSRodney W. Grimes 	 * concurrent access.
7858f0484fSRodney W. Grimes 	 */
79ef5d438eSPaul Traina 	if (key == NULL)
80ef5d438eSPaul Traina 		goto dataonly;
81ef5d438eSPaul Traina 
82ef5d438eSPaul Traina 	if (bl->flags & P_BIGKEY) {
83ef5d438eSPaul Traina 		if (__ovfl_get(t, bl->bytes,
84ef5d438eSPaul Traina 		    &key->size, &rkey->data, &rkey->size))
85ef5d438eSPaul Traina 			return (RET_ERROR);
86ef5d438eSPaul Traina 		key->data = rkey->data;
87ef5d438eSPaul Traina 	} else if (copy || F_ISSET(t, B_DB_LOCK)) {
88ef5d438eSPaul Traina 		if (bl->ksize > rkey->size) {
897ccf00dfSXin LI 			p = realloc(rkey->data, bl->ksize);
90ef5d438eSPaul Traina 			if (p == NULL)
91ef5d438eSPaul Traina 				return (RET_ERROR);
92ef5d438eSPaul Traina 			rkey->data = p;
93ef5d438eSPaul Traina 			rkey->size = bl->ksize;
94ef5d438eSPaul Traina 		}
95ef5d438eSPaul Traina 		memmove(rkey->data, bl->bytes, bl->ksize);
96ef5d438eSPaul Traina 		key->size = bl->ksize;
97ef5d438eSPaul Traina 		key->data = rkey->data;
98ef5d438eSPaul Traina 	} else {
99ef5d438eSPaul Traina 		key->size = bl->ksize;
100ef5d438eSPaul Traina 		key->data = bl->bytes;
101ef5d438eSPaul Traina 	}
102ef5d438eSPaul Traina 
103ef5d438eSPaul Traina dataonly:
104ef5d438eSPaul Traina 	if (data == NULL)
105ef5d438eSPaul Traina 		return (RET_SUCCESS);
106ef5d438eSPaul Traina 
10758f0484fSRodney W. Grimes 	if (bl->flags & P_BIGDATA) {
10858f0484fSRodney W. Grimes 		if (__ovfl_get(t, bl->bytes + bl->ksize,
109ef5d438eSPaul Traina 		    &data->size, &rdata->data, &rdata->size))
11058f0484fSRodney W. Grimes 			return (RET_ERROR);
111ef5d438eSPaul Traina 		data->data = rdata->data;
112ef5d438eSPaul Traina 	} else if (copy || F_ISSET(t, B_DB_LOCK)) {
11358f0484fSRodney W. Grimes 		/* Use +1 in case the first record retrieved is 0 length. */
114ef5d438eSPaul Traina 		if (bl->dsize + 1 > rdata->size) {
1157ccf00dfSXin LI 			p = realloc(rdata->data, bl->dsize + 1);
116ef5d438eSPaul Traina 			if (p == NULL)
11758f0484fSRodney W. Grimes 				return (RET_ERROR);
118ef5d438eSPaul Traina 			rdata->data = p;
119ef5d438eSPaul Traina 			rdata->size = bl->dsize + 1;
12058f0484fSRodney W. Grimes 		}
121ef5d438eSPaul Traina 		memmove(rdata->data, bl->bytes + bl->ksize, bl->dsize);
12258f0484fSRodney W. Grimes 		data->size = bl->dsize;
123ef5d438eSPaul Traina 		data->data = rdata->data;
12458f0484fSRodney W. Grimes 	} else {
12558f0484fSRodney W. Grimes 		data->size = bl->dsize;
12658f0484fSRodney W. Grimes 		data->data = bl->bytes + bl->ksize;
12758f0484fSRodney W. Grimes 	}
12858f0484fSRodney W. Grimes 
12958f0484fSRodney W. Grimes 	return (RET_SUCCESS);
13058f0484fSRodney W. Grimes }
13158f0484fSRodney W. Grimes 
13258f0484fSRodney W. Grimes /*
13358f0484fSRodney W. Grimes  * __BT_CMP -- Compare a key to a given record.
13458f0484fSRodney W. Grimes  *
13558f0484fSRodney W. Grimes  * Parameters:
13658f0484fSRodney W. Grimes  *	t:	tree
13758f0484fSRodney W. Grimes  *	k1:	DBT pointer of first arg to comparison
13858f0484fSRodney W. Grimes  *	e:	pointer to EPG for comparison
13958f0484fSRodney W. Grimes  *
14058f0484fSRodney W. Grimes  * Returns:
14158f0484fSRodney W. Grimes  *	< 0 if k1 is < record
14258f0484fSRodney W. Grimes  *	= 0 if k1 is = record
14358f0484fSRodney W. Grimes  *	> 0 if k1 is > record
14458f0484fSRodney W. Grimes  */
14558f0484fSRodney W. Grimes int
1460ac22237SXin LI __bt_cmp(BTREE *t, const DBT *k1, EPG *e)
14758f0484fSRodney W. Grimes {
14858f0484fSRodney W. Grimes 	BINTERNAL *bi;
14958f0484fSRodney W. Grimes 	BLEAF *bl;
15058f0484fSRodney W. Grimes 	DBT k2;
15158f0484fSRodney W. Grimes 	PAGE *h;
15258f0484fSRodney W. Grimes 	void *bigkey;
15358f0484fSRodney W. Grimes 
15458f0484fSRodney W. Grimes 	/*
15558f0484fSRodney W. Grimes 	 * The left-most key on internal pages, at any level of the tree, is
15658f0484fSRodney W. Grimes 	 * guaranteed by the following code to be less than any user key.
15758f0484fSRodney W. Grimes 	 * This saves us from having to update the leftmost key on an internal
15858f0484fSRodney W. Grimes 	 * page when the user inserts a new key in the tree smaller than
15958f0484fSRodney W. Grimes 	 * anything we've yet seen.
16058f0484fSRodney W. Grimes 	 */
16158f0484fSRodney W. Grimes 	h = e->page;
16258f0484fSRodney W. Grimes 	if (e->index == 0 && h->prevpg == P_INVALID && !(h->flags & P_BLEAF))
16358f0484fSRodney W. Grimes 		return (1);
16458f0484fSRodney W. Grimes 
16558f0484fSRodney W. Grimes 	bigkey = NULL;
16658f0484fSRodney W. Grimes 	if (h->flags & P_BLEAF) {
16758f0484fSRodney W. Grimes 		bl = GETBLEAF(h, e->index);
16858f0484fSRodney W. Grimes 		if (bl->flags & P_BIGKEY)
16958f0484fSRodney W. Grimes 			bigkey = bl->bytes;
17058f0484fSRodney W. Grimes 		else {
17158f0484fSRodney W. Grimes 			k2.data = bl->bytes;
17258f0484fSRodney W. Grimes 			k2.size = bl->ksize;
17358f0484fSRodney W. Grimes 		}
17458f0484fSRodney W. Grimes 	} else {
17558f0484fSRodney W. Grimes 		bi = GETBINTERNAL(h, e->index);
17658f0484fSRodney W. Grimes 		if (bi->flags & P_BIGKEY)
17758f0484fSRodney W. Grimes 			bigkey = bi->bytes;
17858f0484fSRodney W. Grimes 		else {
17958f0484fSRodney W. Grimes 			k2.data = bi->bytes;
18058f0484fSRodney W. Grimes 			k2.size = bi->ksize;
18158f0484fSRodney W. Grimes 		}
18258f0484fSRodney W. Grimes 	}
18358f0484fSRodney W. Grimes 
18458f0484fSRodney W. Grimes 	if (bigkey) {
18558f0484fSRodney W. Grimes 		if (__ovfl_get(t, bigkey,
186ef5d438eSPaul Traina 		    &k2.size, &t->bt_rdata.data, &t->bt_rdata.size))
18758f0484fSRodney W. Grimes 			return (RET_ERROR);
188ef5d438eSPaul Traina 		k2.data = t->bt_rdata.data;
18958f0484fSRodney W. Grimes 	}
19058f0484fSRodney W. Grimes 	return ((*t->bt_cmp)(k1, &k2));
19158f0484fSRodney W. Grimes }
19258f0484fSRodney W. Grimes 
19358f0484fSRodney W. Grimes /*
19458f0484fSRodney W. Grimes  * __BT_DEFCMP -- Default comparison routine.
19558f0484fSRodney W. Grimes  *
19658f0484fSRodney W. Grimes  * Parameters:
19758f0484fSRodney W. Grimes  *	a:	DBT #1
19858f0484fSRodney W. Grimes  *	b:	DBT #2
19958f0484fSRodney W. Grimes  *
20058f0484fSRodney W. Grimes  * Returns:
20158f0484fSRodney W. Grimes  *	< 0 if a is < b
20258f0484fSRodney W. Grimes  *	= 0 if a is = b
20358f0484fSRodney W. Grimes  *	> 0 if a is > b
20458f0484fSRodney W. Grimes  */
20558f0484fSRodney W. Grimes int
2060ac22237SXin LI __bt_defcmp(const DBT *a, const DBT *b)
20758f0484fSRodney W. Grimes {
2088fb3f3f6SDavid E. O'Brien 	size_t len;
2098fb3f3f6SDavid E. O'Brien 	u_char *p1, *p2;
21058f0484fSRodney W. Grimes 
21158f0484fSRodney W. Grimes 	/*
21258f0484fSRodney W. Grimes 	 * XXX
21358f0484fSRodney W. Grimes 	 * If a size_t doesn't fit in an int, this routine can lose.
2149d5abbddSJens Schweikhardt 	 * What we need is an integral type which is guaranteed to be
21558f0484fSRodney W. Grimes 	 * larger than a size_t, and there is no such thing.
21658f0484fSRodney W. Grimes 	 */
21758f0484fSRodney W. Grimes 	len = MIN(a->size, b->size);
21858f0484fSRodney W. Grimes 	for (p1 = a->data, p2 = b->data; len--; ++p1, ++p2)
21958f0484fSRodney W. Grimes 		if (*p1 != *p2)
22058f0484fSRodney W. Grimes 			return ((int)*p1 - (int)*p2);
22158f0484fSRodney W. Grimes 	return ((int)a->size - (int)b->size);
22258f0484fSRodney W. Grimes }
22358f0484fSRodney W. Grimes 
22458f0484fSRodney W. Grimes /*
22558f0484fSRodney W. Grimes  * __BT_DEFPFX -- Default prefix routine.
22658f0484fSRodney W. Grimes  *
22758f0484fSRodney W. Grimes  * Parameters:
22858f0484fSRodney W. Grimes  *	a:	DBT #1
22958f0484fSRodney W. Grimes  *	b:	DBT #2
23058f0484fSRodney W. Grimes  *
23158f0484fSRodney W. Grimes  * Returns:
23258f0484fSRodney W. Grimes  *	Number of bytes needed to distinguish b from a.
23358f0484fSRodney W. Grimes  */
23458f0484fSRodney W. Grimes size_t
2350ac22237SXin LI __bt_defpfx(const DBT *a, const DBT *b)
23658f0484fSRodney W. Grimes {
2378fb3f3f6SDavid E. O'Brien 	u_char *p1, *p2;
2388fb3f3f6SDavid E. O'Brien 	size_t cnt, len;
23958f0484fSRodney W. Grimes 
24058f0484fSRodney W. Grimes 	cnt = 1;
24158f0484fSRodney W. Grimes 	len = MIN(a->size, b->size);
24258f0484fSRodney W. Grimes 	for (p1 = a->data, p2 = b->data; len--; ++p1, ++p2, ++cnt)
24358f0484fSRodney W. Grimes 		if (*p1 != *p2)
24458f0484fSRodney W. Grimes 			return (cnt);
24558f0484fSRodney W. Grimes 
24658f0484fSRodney W. Grimes 	/* a->size must be <= b->size, or they wouldn't be in this order. */
24758f0484fSRodney W. Grimes 	return (a->size < b->size ? a->size + 1 : a->size);
24858f0484fSRodney W. Grimes }
249