xref: /titanic_52/usr/src/tools/ctf/cvt/strtab.c (revision 7c478bd95313f5f23a4c958a745db2134aa03244)
1*7c478bd9Sstevel@tonic-gate /*
2*7c478bd9Sstevel@tonic-gate  * CDDL HEADER START
3*7c478bd9Sstevel@tonic-gate  *
4*7c478bd9Sstevel@tonic-gate  * The contents of this file are subject to the terms of the
5*7c478bd9Sstevel@tonic-gate  * Common Development and Distribution License, Version 1.0 only
6*7c478bd9Sstevel@tonic-gate  * (the "License").  You may not use this file except in compliance
7*7c478bd9Sstevel@tonic-gate  * with the License.
8*7c478bd9Sstevel@tonic-gate  *
9*7c478bd9Sstevel@tonic-gate  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
10*7c478bd9Sstevel@tonic-gate  * or http://www.opensolaris.org/os/licensing.
11*7c478bd9Sstevel@tonic-gate  * See the License for the specific language governing permissions
12*7c478bd9Sstevel@tonic-gate  * and limitations under the License.
13*7c478bd9Sstevel@tonic-gate  *
14*7c478bd9Sstevel@tonic-gate  * When distributing Covered Code, include this CDDL HEADER in each
15*7c478bd9Sstevel@tonic-gate  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
16*7c478bd9Sstevel@tonic-gate  * If applicable, add the following below this CDDL HEADER, with the
17*7c478bd9Sstevel@tonic-gate  * fields enclosed by brackets "[]" replaced with your own identifying
18*7c478bd9Sstevel@tonic-gate  * information: Portions Copyright [yyyy] [name of copyright owner]
19*7c478bd9Sstevel@tonic-gate  *
20*7c478bd9Sstevel@tonic-gate  * CDDL HEADER END
21*7c478bd9Sstevel@tonic-gate  */
22*7c478bd9Sstevel@tonic-gate /*
23*7c478bd9Sstevel@tonic-gate  * Copyright (c) 2001 by Sun Microsystems, Inc.
24*7c478bd9Sstevel@tonic-gate  * All rights reserved.
25*7c478bd9Sstevel@tonic-gate  */
26*7c478bd9Sstevel@tonic-gate 
27*7c478bd9Sstevel@tonic-gate #pragma ident	"%Z%%M%	%I%	%E% SMI"
28*7c478bd9Sstevel@tonic-gate 
29*7c478bd9Sstevel@tonic-gate #include <sys/types.h>
30*7c478bd9Sstevel@tonic-gate #include <sys/sysmacros.h>
31*7c478bd9Sstevel@tonic-gate #include <strings.h>
32*7c478bd9Sstevel@tonic-gate #include <stdlib.h>
33*7c478bd9Sstevel@tonic-gate #include <stdio.h>
34*7c478bd9Sstevel@tonic-gate 
35*7c478bd9Sstevel@tonic-gate #include "strtab.h"
36*7c478bd9Sstevel@tonic-gate #include "memory.h"
37*7c478bd9Sstevel@tonic-gate 
38*7c478bd9Sstevel@tonic-gate #define	STRTAB_HASHSZ	211		/* use a prime number of hash buckets */
39*7c478bd9Sstevel@tonic-gate #define	STRTAB_BUFSZ	(64 * 1024)	/* use 64K data buffers by default */
40*7c478bd9Sstevel@tonic-gate 
41*7c478bd9Sstevel@tonic-gate static void
42*7c478bd9Sstevel@tonic-gate strtab_grow(strtab_t *sp)
43*7c478bd9Sstevel@tonic-gate {
44*7c478bd9Sstevel@tonic-gate 	sp->str_nbufs++;
45*7c478bd9Sstevel@tonic-gate 	sp->str_bufs = xrealloc(sp->str_bufs, sp->str_nbufs * sizeof (char *));
46*7c478bd9Sstevel@tonic-gate 	sp->str_ptr = xmalloc(sp->str_bufsz);
47*7c478bd9Sstevel@tonic-gate 	sp->str_bufs[sp->str_nbufs - 1] = sp->str_ptr;
48*7c478bd9Sstevel@tonic-gate }
49*7c478bd9Sstevel@tonic-gate 
50*7c478bd9Sstevel@tonic-gate void
51*7c478bd9Sstevel@tonic-gate strtab_create(strtab_t *sp)
52*7c478bd9Sstevel@tonic-gate {
53*7c478bd9Sstevel@tonic-gate 	sp->str_hash = xcalloc(STRTAB_HASHSZ * sizeof (strhash_t *));
54*7c478bd9Sstevel@tonic-gate 	sp->str_hashsz = STRTAB_HASHSZ;
55*7c478bd9Sstevel@tonic-gate 	sp->str_bufs = NULL;
56*7c478bd9Sstevel@tonic-gate 	sp->str_ptr = NULL;
57*7c478bd9Sstevel@tonic-gate 	sp->str_nbufs = 0;
58*7c478bd9Sstevel@tonic-gate 	sp->str_bufsz = STRTAB_BUFSZ;
59*7c478bd9Sstevel@tonic-gate 	sp->str_nstrs = 1;
60*7c478bd9Sstevel@tonic-gate 	sp->str_size = 1;
61*7c478bd9Sstevel@tonic-gate 
62*7c478bd9Sstevel@tonic-gate 	strtab_grow(sp);
63*7c478bd9Sstevel@tonic-gate 	*sp->str_ptr++ = '\0';
64*7c478bd9Sstevel@tonic-gate }
65*7c478bd9Sstevel@tonic-gate 
66*7c478bd9Sstevel@tonic-gate void
67*7c478bd9Sstevel@tonic-gate strtab_destroy(strtab_t *sp)
68*7c478bd9Sstevel@tonic-gate {
69*7c478bd9Sstevel@tonic-gate 	strhash_t *hp, *hq;
70*7c478bd9Sstevel@tonic-gate 	ulong_t i;
71*7c478bd9Sstevel@tonic-gate 
72*7c478bd9Sstevel@tonic-gate 	for (i = 0; i < sp->str_hashsz; i++) {
73*7c478bd9Sstevel@tonic-gate 		for (hp = sp->str_hash[i]; hp != NULL; hp = hq) {
74*7c478bd9Sstevel@tonic-gate 			hq = hp->str_next;
75*7c478bd9Sstevel@tonic-gate 			free(hp);
76*7c478bd9Sstevel@tonic-gate 		}
77*7c478bd9Sstevel@tonic-gate 	}
78*7c478bd9Sstevel@tonic-gate 
79*7c478bd9Sstevel@tonic-gate 	for (i = 0; i < sp->str_nbufs; i++)
80*7c478bd9Sstevel@tonic-gate 		free(sp->str_bufs[i]);
81*7c478bd9Sstevel@tonic-gate 
82*7c478bd9Sstevel@tonic-gate 	free(sp->str_hash);
83*7c478bd9Sstevel@tonic-gate 	free(sp->str_bufs);
84*7c478bd9Sstevel@tonic-gate }
85*7c478bd9Sstevel@tonic-gate 
86*7c478bd9Sstevel@tonic-gate static ulong_t
87*7c478bd9Sstevel@tonic-gate strtab_hash(const char *key, size_t *len)
88*7c478bd9Sstevel@tonic-gate {
89*7c478bd9Sstevel@tonic-gate 	ulong_t g, h = 0;
90*7c478bd9Sstevel@tonic-gate 	const char *p;
91*7c478bd9Sstevel@tonic-gate 	size_t n = 0;
92*7c478bd9Sstevel@tonic-gate 
93*7c478bd9Sstevel@tonic-gate 	for (p = key; *p != '\0'; p++, n++) {
94*7c478bd9Sstevel@tonic-gate 		h = (h << 4) + *p;
95*7c478bd9Sstevel@tonic-gate 
96*7c478bd9Sstevel@tonic-gate 		if ((g = (h & 0xf0000000)) != 0) {
97*7c478bd9Sstevel@tonic-gate 			h ^= (g >> 24);
98*7c478bd9Sstevel@tonic-gate 			h ^= g;
99*7c478bd9Sstevel@tonic-gate 		}
100*7c478bd9Sstevel@tonic-gate 	}
101*7c478bd9Sstevel@tonic-gate 
102*7c478bd9Sstevel@tonic-gate 	*len = n;
103*7c478bd9Sstevel@tonic-gate 	return (h);
104*7c478bd9Sstevel@tonic-gate }
105*7c478bd9Sstevel@tonic-gate 
106*7c478bd9Sstevel@tonic-gate static int
107*7c478bd9Sstevel@tonic-gate strtab_compare(strtab_t *sp, strhash_t *hp, const char *str, size_t len)
108*7c478bd9Sstevel@tonic-gate {
109*7c478bd9Sstevel@tonic-gate 	ulong_t b = hp->str_buf;
110*7c478bd9Sstevel@tonic-gate 	const char *buf = hp->str_data;
111*7c478bd9Sstevel@tonic-gate 	size_t resid, n;
112*7c478bd9Sstevel@tonic-gate 	int rv;
113*7c478bd9Sstevel@tonic-gate 
114*7c478bd9Sstevel@tonic-gate 	while (len != 0) {
115*7c478bd9Sstevel@tonic-gate 		if (buf == sp->str_bufs[b] + sp->str_bufsz)
116*7c478bd9Sstevel@tonic-gate 			buf = sp->str_bufs[++b];
117*7c478bd9Sstevel@tonic-gate 
118*7c478bd9Sstevel@tonic-gate 		resid = sp->str_bufs[b] + sp->str_bufsz - buf;
119*7c478bd9Sstevel@tonic-gate 		n = MIN(resid, len);
120*7c478bd9Sstevel@tonic-gate 
121*7c478bd9Sstevel@tonic-gate 		if ((rv = strncmp(buf, str, n)) != 0)
122*7c478bd9Sstevel@tonic-gate 			return (rv);
123*7c478bd9Sstevel@tonic-gate 
124*7c478bd9Sstevel@tonic-gate 		buf += n;
125*7c478bd9Sstevel@tonic-gate 		str += n;
126*7c478bd9Sstevel@tonic-gate 		len -= n;
127*7c478bd9Sstevel@tonic-gate 	}
128*7c478bd9Sstevel@tonic-gate 
129*7c478bd9Sstevel@tonic-gate 	return (0);
130*7c478bd9Sstevel@tonic-gate }
131*7c478bd9Sstevel@tonic-gate 
132*7c478bd9Sstevel@tonic-gate static void
133*7c478bd9Sstevel@tonic-gate strtab_copyin(strtab_t *sp, const char *str, size_t len)
134*7c478bd9Sstevel@tonic-gate {
135*7c478bd9Sstevel@tonic-gate 	ulong_t b = sp->str_nbufs - 1;
136*7c478bd9Sstevel@tonic-gate 	size_t resid, n;
137*7c478bd9Sstevel@tonic-gate 
138*7c478bd9Sstevel@tonic-gate 	while (len != 0) {
139*7c478bd9Sstevel@tonic-gate 		if (sp->str_ptr == sp->str_bufs[b] + sp->str_bufsz) {
140*7c478bd9Sstevel@tonic-gate 			strtab_grow(sp);
141*7c478bd9Sstevel@tonic-gate 			b++;
142*7c478bd9Sstevel@tonic-gate 		}
143*7c478bd9Sstevel@tonic-gate 
144*7c478bd9Sstevel@tonic-gate 		resid = sp->str_bufs[b] + sp->str_bufsz - sp->str_ptr;
145*7c478bd9Sstevel@tonic-gate 		n = MIN(resid, len);
146*7c478bd9Sstevel@tonic-gate 		bcopy(str, sp->str_ptr, n);
147*7c478bd9Sstevel@tonic-gate 
148*7c478bd9Sstevel@tonic-gate 		sp->str_ptr += n;
149*7c478bd9Sstevel@tonic-gate 		str += n;
150*7c478bd9Sstevel@tonic-gate 		len -= n;
151*7c478bd9Sstevel@tonic-gate 	}
152*7c478bd9Sstevel@tonic-gate }
153*7c478bd9Sstevel@tonic-gate 
154*7c478bd9Sstevel@tonic-gate size_t
155*7c478bd9Sstevel@tonic-gate strtab_insert(strtab_t *sp, const char *str)
156*7c478bd9Sstevel@tonic-gate {
157*7c478bd9Sstevel@tonic-gate 	strhash_t *hp;
158*7c478bd9Sstevel@tonic-gate 	size_t len;
159*7c478bd9Sstevel@tonic-gate 	ulong_t h;
160*7c478bd9Sstevel@tonic-gate 
161*7c478bd9Sstevel@tonic-gate 	if (str == NULL || str[0] == '\0')
162*7c478bd9Sstevel@tonic-gate 		return (0); /* we keep a \0 at offset 0 to simplify things */
163*7c478bd9Sstevel@tonic-gate 
164*7c478bd9Sstevel@tonic-gate 	h = strtab_hash(str, &len) % sp->str_hashsz;
165*7c478bd9Sstevel@tonic-gate 
166*7c478bd9Sstevel@tonic-gate 	/*
167*7c478bd9Sstevel@tonic-gate 	 * If the string is already in our hash table, just return the offset
168*7c478bd9Sstevel@tonic-gate 	 * of the existing string element and do not add a duplicate string.
169*7c478bd9Sstevel@tonic-gate 	 */
170*7c478bd9Sstevel@tonic-gate 	for (hp = sp->str_hash[h]; hp != NULL; hp = hp->str_next) {
171*7c478bd9Sstevel@tonic-gate 		if (strtab_compare(sp, hp, str, len + 1) == 0)
172*7c478bd9Sstevel@tonic-gate 			return (hp->str_off);
173*7c478bd9Sstevel@tonic-gate 	}
174*7c478bd9Sstevel@tonic-gate 
175*7c478bd9Sstevel@tonic-gate 	/*
176*7c478bd9Sstevel@tonic-gate 	 * Create a new hash bucket, initialize it, and insert it at the front
177*7c478bd9Sstevel@tonic-gate 	 * of the hash chain for the appropriate bucket.
178*7c478bd9Sstevel@tonic-gate 	 */
179*7c478bd9Sstevel@tonic-gate 	hp = xmalloc(sizeof (strhash_t));
180*7c478bd9Sstevel@tonic-gate 
181*7c478bd9Sstevel@tonic-gate 	hp->str_data = sp->str_ptr;
182*7c478bd9Sstevel@tonic-gate 	hp->str_buf = sp->str_nbufs - 1;
183*7c478bd9Sstevel@tonic-gate 	hp->str_off = sp->str_size;
184*7c478bd9Sstevel@tonic-gate 	hp->str_len = len;
185*7c478bd9Sstevel@tonic-gate 	hp->str_next = sp->str_hash[h];
186*7c478bd9Sstevel@tonic-gate 
187*7c478bd9Sstevel@tonic-gate 	sp->str_hash[h] = hp;
188*7c478bd9Sstevel@tonic-gate 
189*7c478bd9Sstevel@tonic-gate 	/*
190*7c478bd9Sstevel@tonic-gate 	 * Now copy the string data into our buffer list, and then update
191*7c478bd9Sstevel@tonic-gate 	 * the global counts of strings and bytes.  Return str's byte offset.
192*7c478bd9Sstevel@tonic-gate 	 */
193*7c478bd9Sstevel@tonic-gate 	strtab_copyin(sp, str, len + 1);
194*7c478bd9Sstevel@tonic-gate 	sp->str_nstrs++;
195*7c478bd9Sstevel@tonic-gate 	sp->str_size += len + 1;
196*7c478bd9Sstevel@tonic-gate 
197*7c478bd9Sstevel@tonic-gate 	return (hp->str_off);
198*7c478bd9Sstevel@tonic-gate }
199*7c478bd9Sstevel@tonic-gate 
200*7c478bd9Sstevel@tonic-gate size_t
201*7c478bd9Sstevel@tonic-gate strtab_size(const strtab_t *sp)
202*7c478bd9Sstevel@tonic-gate {
203*7c478bd9Sstevel@tonic-gate 	return (sp->str_size);
204*7c478bd9Sstevel@tonic-gate }
205*7c478bd9Sstevel@tonic-gate 
206*7c478bd9Sstevel@tonic-gate ssize_t
207*7c478bd9Sstevel@tonic-gate strtab_write(const strtab_t *sp,
208*7c478bd9Sstevel@tonic-gate     ssize_t (*func)(const void *, size_t, void *), void *priv)
209*7c478bd9Sstevel@tonic-gate {
210*7c478bd9Sstevel@tonic-gate 	ssize_t res, total = 0;
211*7c478bd9Sstevel@tonic-gate 	ulong_t i;
212*7c478bd9Sstevel@tonic-gate 	size_t n;
213*7c478bd9Sstevel@tonic-gate 
214*7c478bd9Sstevel@tonic-gate 	for (i = 0; i < sp->str_nbufs; i++, total += res) {
215*7c478bd9Sstevel@tonic-gate 		if (i == sp->str_nbufs - 1)
216*7c478bd9Sstevel@tonic-gate 			n = sp->str_ptr - sp->str_bufs[i];
217*7c478bd9Sstevel@tonic-gate 		else
218*7c478bd9Sstevel@tonic-gate 			n = sp->str_bufsz;
219*7c478bd9Sstevel@tonic-gate 
220*7c478bd9Sstevel@tonic-gate 		if ((res = func(sp->str_bufs[i], n, priv)) <= 0)
221*7c478bd9Sstevel@tonic-gate 			break;
222*7c478bd9Sstevel@tonic-gate 	}
223*7c478bd9Sstevel@tonic-gate 
224*7c478bd9Sstevel@tonic-gate 	if (total == 0 && sp->str_size != 0)
225*7c478bd9Sstevel@tonic-gate 		return (-1);
226*7c478bd9Sstevel@tonic-gate 
227*7c478bd9Sstevel@tonic-gate 	return (total);
228*7c478bd9Sstevel@tonic-gate }
229*7c478bd9Sstevel@tonic-gate 
230*7c478bd9Sstevel@tonic-gate void
231*7c478bd9Sstevel@tonic-gate strtab_print(const strtab_t *sp)
232*7c478bd9Sstevel@tonic-gate {
233*7c478bd9Sstevel@tonic-gate 	const strhash_t *hp;
234*7c478bd9Sstevel@tonic-gate 	ulong_t i;
235*7c478bd9Sstevel@tonic-gate 
236*7c478bd9Sstevel@tonic-gate 	for (i = 0; i < sp->str_hashsz; i++) {
237*7c478bd9Sstevel@tonic-gate 		for (hp = sp->str_hash[i]; hp != NULL; hp = hp->str_next) {
238*7c478bd9Sstevel@tonic-gate 			const char *buf = hp->str_data;
239*7c478bd9Sstevel@tonic-gate 			ulong_t b = hp->str_buf;
240*7c478bd9Sstevel@tonic-gate 			size_t resid, len, n;
241*7c478bd9Sstevel@tonic-gate 
242*7c478bd9Sstevel@tonic-gate 			(void) printf("[%lu] %lu \"", (ulong_t)hp->str_off, b);
243*7c478bd9Sstevel@tonic-gate 
244*7c478bd9Sstevel@tonic-gate 			for (len = hp->str_len; len != 0; len -= n) {
245*7c478bd9Sstevel@tonic-gate 				if (buf == sp->str_bufs[b] + sp->str_bufsz)
246*7c478bd9Sstevel@tonic-gate 					buf = sp->str_bufs[++b];
247*7c478bd9Sstevel@tonic-gate 
248*7c478bd9Sstevel@tonic-gate 				resid = sp->str_bufs[b] + sp->str_bufsz - buf;
249*7c478bd9Sstevel@tonic-gate 				n = MIN(resid, len);
250*7c478bd9Sstevel@tonic-gate 
251*7c478bd9Sstevel@tonic-gate 				(void) printf("%.*s", (int)n, buf);
252*7c478bd9Sstevel@tonic-gate 				buf += n;
253*7c478bd9Sstevel@tonic-gate 			}
254*7c478bd9Sstevel@tonic-gate 
255*7c478bd9Sstevel@tonic-gate 			(void) printf("\"\n");
256*7c478bd9Sstevel@tonic-gate 		}
257*7c478bd9Sstevel@tonic-gate 	}
258*7c478bd9Sstevel@tonic-gate }
259