xref: /freebsd/contrib/tcsh/tc.str.c (revision 9bd497b8354567454e075076d40c996e21bd6095)
1 /* $Header: /p/tcsh/cvsroot/tcsh/tc.str.c,v 3.30 2009/06/25 21:27:38 christos Exp $ */
2 /*
3  * tc.str.c: Short string package
4  * 	     This has been a lesson of how to write buggy code!
5  */
6 /*-
7  * Copyright (c) 1980, 1991 The Regents of the University of California.
8  * All rights reserved.
9  *
10  * Redistribution and use in source and binary forms, with or without
11  * modification, are permitted provided that the following conditions
12  * are met:
13  * 1. Redistributions of source code must retain the above copyright
14  *    notice, this list of conditions and the following disclaimer.
15  * 2. Redistributions in binary form must reproduce the above copyright
16  *    notice, this list of conditions and the following disclaimer in the
17  *    documentation and/or other materials provided with the distribution.
18  * 3. Neither the name of the University nor the names of its contributors
19  *    may be used to endorse or promote products derived from this software
20  *    without specific prior written permission.
21  *
22  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
23  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
24  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
25  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
26  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
27  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
28  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
29  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
30  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
31  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
32  * SUCH DAMAGE.
33  */
34 #include "sh.h"
35 
36 #include <limits.h>
37 
38 RCSID("$tcsh: tc.str.c,v 3.30 2009/06/25 21:27:38 christos Exp $")
39 
/* Step by which the static conversion buffers in this file are enlarged. */
#define MALLOC_INCR	128
/*
 * Extra room allocated beyond the nominal buffer size: enough for one
 * complete multibyte character when wide strings are in use, nothing
 * otherwise.
 */
#ifndef WIDE_STRINGS
#define MALLOC_SURPLUS	0
#else
#define MALLOC_SURPLUS	MB_LEN_MAX /* Space for one multibyte character */
#endif
46 
47 #ifdef WIDE_STRINGS
48 size_t
49 one_mbtowc(wchar_t *pwc, const char *s, size_t n)
50 {
51     int len;
52 
53     len = rt_mbtowc(pwc, s, n);
54     if (len == -1) {
55         reset_mbtowc();
56 	*pwc = (unsigned char)*s | INVALID_BYTE;
57     }
58     if (len <= 0)
59 	len = 1;
60     return len;
61 }
62 
63 size_t
64 one_wctomb(char *s, wchar_t wchar)
65 {
66     int len;
67 
68     if (wchar & INVALID_BYTE) {
69 	s[0] = wchar & 0xFF;
70 	len = 1;
71     } else {
72 	len = wctomb(s, wchar);
73 	if (len == -1)
74 	    s[0] = wchar;
75 	if (len <= 0)
76 	    len = 1;
77     }
78     return len;
79 }
80 
/*
 * "Round-trip" mbtowc(): decode one character from s (at most n bytes)
 * into *pwc, then encode it again with wctomb() and require that the
 * result is byte-for-byte the same as the input.
 *
 * Returns what mbtowc() returned, except that a positive length whose
 * re-encoding differs from the input is turned into -1.
 */
int
rt_mbtowc(wchar_t *pwc, const char *s, size_t n)
{
    char roundtrip[MB_LEN_MAX];
    int consumed;

    consumed = mbtowc(pwc, s, n);
    if (consumed <= 0)
	return consumed;
    if (wctomb(roundtrip, *pwc) != consumed)
	return -1;
    if (memcmp(s, roundtrip, consumed) != 0)
	return -1;
    return consumed;
}
92 #endif
93 
94 #ifdef SHORT_STRINGS
95 Char  **
96 blk2short(char **src)
97 {
98     size_t     n;
99     Char **sdst, **dst;
100 
101     /*
102      * Count
103      */
104     for (n = 0; src[n] != NULL; n++)
105 	continue;
106     sdst = dst = xmalloc((n + 1) * sizeof(Char *));
107 
108     for (; *src != NULL; src++)
109 	*dst++ = SAVE(*src);
110     *dst = NULL;
111     return (sdst);
112 }
113 
114 char  **
115 short2blk(Char **src)
116 {
117     size_t     n;
118     char **sdst, **dst;
119 
120     /*
121      * Count
122      */
123     for (n = 0; src[n] != NULL; n++)
124 	continue;
125     sdst = dst = xmalloc((n + 1) * sizeof(char *));
126 
127     for (; *src != NULL; src++)
128 	*dst++ = strsave(short2str(*src));
129     *dst = NULL;
130     return (sdst);
131 }
132 
133 Char   *
134 str2short(const char *src)
135 {
136     static struct Strbuf buf; /* = Strbuf_INIT; */
137 
138     if (src == NULL)
139 	return (NULL);
140 
141     buf.len = 0;
142     while (*src) {
143 	Char wc;
144 
145 	src += one_mbtowc(&wc, src, MB_LEN_MAX);
146 	Strbuf_append1(&buf, wc);
147     }
148     Strbuf_terminate(&buf);
149     return buf.s;
150 }
151 
152 char   *
153 short2str(const Char *src)
154 {
155     static char *sdst = NULL;
156     static size_t dstsize = 0;
157     char *dst, *edst;
158 
159     if (src == NULL)
160 	return (NULL);
161 
162     if (sdst == NULL) {
163 	dstsize = MALLOC_INCR;
164 	sdst = xmalloc((dstsize + MALLOC_SURPLUS) * sizeof(char));
165     }
166     dst = sdst;
167     edst = &dst[dstsize];
168     while (*src) {
169 	dst += one_wctomb(dst, *src & CHAR);
170 	src++;
171 	if (dst >= edst) {
172 	    char *wdst = dst;
173 	    char *wedst = edst;
174 
175 	    dstsize += MALLOC_INCR;
176 	    sdst = xrealloc(sdst, (dstsize + MALLOC_SURPLUS) * sizeof(char));
177 	    edst = &sdst[dstsize];
178 	    dst = &edst[-MALLOC_INCR];
179 	    while (wdst > wedst) {
180 		dst++;
181 		wdst--;
182 	    }
183 	}
184     }
185     *dst = 0;
186     return (sdst);
187 }
188 
189 #ifndef WIDE_STRINGS
190 Char   *
191 s_strcpy(Char *dst, const Char *src)
192 {
193     Char *sdst;
194 
195     sdst = dst;
196     while ((*dst++ = *src++) != '\0')
197 	continue;
198     return (sdst);
199 }
200 
201 Char   *
202 s_strncpy(Char *dst, const Char *src, size_t n)
203 {
204     Char *sdst;
205 
206     if (n == 0)
207 	return(dst);
208 
209     sdst = dst;
210     do
211 	if ((*dst++ = *src++) == '\0') {
212 	    while (--n != 0)
213 		*dst++ = '\0';
214 	    return(sdst);
215 	}
216     while (--n != 0);
217     return (sdst);
218 }
219 
220 Char   *
221 s_strcat(Char *dst, const Char *src)
222 {
223     Strcpy(Strend(dst), src);
224     return dst;
225 }
226 
227 #ifdef NOTUSED
228 Char   *
229 s_strncat(Char *dst, const Char *src, size_t n)
230 {
231     Char *sdst;
232 
233     if (n == 0)
234 	return (dst);
235 
236     sdst = dst;
237 
238     while (*dst)
239 	dst++;
240 
241     do
242 	if ((*dst++ = *src++) == '\0')
243 	    return(sdst);
244     while (--n != 0)
245 	continue;
246 
247     *dst = '\0';
248     return (sdst);
249 }
250 
251 #endif
252 
253 Char   *
254 s_strchr(const Char *str, int ch)
255 {
256     do
257 	if (*str == ch)
258 	    return ((Char *)(intptr_t)str);
259     while (*str++);
260     return (NULL);
261 }
262 
263 Char   *
264 s_strrchr(const Char *str, int ch)
265 {
266     const Char *rstr;
267 
268     rstr = NULL;
269     do
270 	if (*str == ch)
271 	    rstr = str;
272     while (*str++);
273     return ((Char *)(intptr_t)rstr);
274 }
275 
276 size_t
277 s_strlen(const Char *str)
278 {
279     size_t n;
280 
281     for (n = 0; *str++; n++)
282 	continue;
283     return (n);
284 }
285 
286 int
287 s_strcmp(const Char *str1, const Char *str2)
288 {
289     for (; *str1 && *str1 == *str2; str1++, str2++)
290 	continue;
291     /*
292      * The following case analysis is necessary so that characters which look
293      * negative collate low against normal characters but high against the
294      * end-of-string NUL.
295      */
296     if (*str1 == '\0' && *str2 == '\0')
297 	return (0);
298     else if (*str1 == '\0')
299 	return (-1);
300     else if (*str2 == '\0')
301 	return (1);
302     else
303 	return (*str1 - *str2);
304 }
305 
306 int
307 s_strncmp(const Char *str1, const Char *str2, size_t n)
308 {
309     if (n == 0)
310 	return (0);
311     do {
312 	if (*str1 != *str2) {
313 	    /*
314 	     * The following case analysis is necessary so that characters
315 	     * which look negative collate low against normal characters
316 	     * but high against the end-of-string NUL.
317 	     */
318 	    if (*str1 == '\0')
319 		return (-1);
320 	    else if (*str2 == '\0')
321 		return (1);
322 	    else
323 		return (*str1 - *str2);
324 	}
325         if (*str1 == '\0')
326 	    return(0);
327 	str1++, str2++;
328     } while (--n != 0);
329     return(0);
330 }
331 #endif /* not WIDE_STRINGS */
332 
333 int
334 s_strcasecmp(const Char *str1, const Char *str2)
335 {
336 #ifdef WIDE_STRINGS
337     wchar_t l1 = 0, l2 = 0;
338     for (; *str1 && ((*str1 == *str2 && (l1 = l2 = 0) == 0) ||
339 	(l1 = towlower(*str1)) == (l2 = towlower(*str2))); str1++, str2++)
340 	continue;
341 
342 #else
343     unsigned char c1, c2, l1 = 0, l2 = 0;
344     for (; *str1 && ((*str1 == *str2 && (l1 = l2 = 0) == 0) ||
345 	((c1 = (unsigned char)*str1) == *str1 &&
346 	 (c2 = (unsigned char)*str2) == *str2 &&
347 	(l1 = tolower(c1)) == (l2 = tolower(c2)))); str1++, str2++)
348 	continue;
349 #endif
350     /*
351      * The following case analysis is necessary so that characters which look
352      * negative collate low against normal characters but high against the
353      * end-of-string NUL.
354      */
355     if (*str1 == '\0' && *str2 == '\0')
356 	return (0);
357     else if (*str1 == '\0')
358 	return (-1);
359     else if (*str2 == '\0')
360 	return (1);
361     else if (l1 == l2)	/* They are zero when they are equal */
362 	return (*str1 - *str2);
363     else
364 	return (l1 - l2);
365 }
366 
367 Char   *
368 s_strnsave(const Char *s, size_t len)
369 {
370     Char *n;
371 
372     n = xmalloc((len + 1) * sizeof (*n));
373     memcpy(n, s, len * sizeof (*n));
374     n[len] = '\0';
375     return n;
376 }
377 
378 Char   *
379 s_strsave(const Char *s)
380 {
381     Char   *n;
382     size_t size;
383 
384     if (s == NULL)
385 	s = STRNULL;
386     size = (Strlen(s) + 1) * sizeof(*n);
387     n = xmalloc(size);
388     memcpy(n, s, size);
389     return (n);
390 }
391 
392 Char   *
393 s_strspl(const Char *cp, const Char *dp)
394 {
395     Char *res, *ep;
396     const Char *p, *q;
397 
398     if (!cp)
399 	cp = STRNULL;
400     if (!dp)
401 	dp = STRNULL;
402     for (p = cp; *p++;)
403 	continue;
404     for (q = dp; *q++;)
405 	continue;
406     res = xmalloc(((p - cp) + (q - dp) - 1) * sizeof(Char));
407     for (ep = res, q = cp; (*ep++ = *q++) != '\0';)
408 	continue;
409     for (ep--, q = dp; (*ep++ = *q++) != '\0';)
410 	continue;
411     return (res);
412 }
413 
414 Char   *
415 s_strend(const Char *cp)
416 {
417     if (!cp)
418 	return ((Char *)(intptr_t) cp);
419     while (*cp)
420 	cp++;
421     return ((Char *)(intptr_t) cp);
422 }
423 
424 Char   *
425 s_strstr(const Char *s, const Char *t)
426 {
427     do {
428 	const Char *ss = s;
429 	const Char *tt = t;
430 
431 	do
432 	    if (*tt == '\0')
433 		return ((Char *)(intptr_t) s);
434 	while (*ss++ == *tt++);
435     } while (*s++ != '\0');
436     return (NULL);
437 }
438 
439 #else /* !SHORT_STRINGS */
/*
 * Copy s into a function-static buffer, run strip() on the copy and return
 * it.  The buffer only ever grows and is reused on every call, so the
 * returned pointer is only valid until the next call.  Returns NULL when
 * s is NULL.
 */
char *
caching_strip(const char *s)
{
    static char *cache = NULL;
    static size_t cache_size = 0;
    size_t need;

    if (s == NULL)
      return NULL;

    need = strlen(s) + 1;
    if (need > cache_size) {
	cache = xrealloc(cache, need);
	cache_size = need;
    }
    memcpy(cache, s, need);
    strip(cache);
    return cache;
}
458 #endif
459 
460 char   *
461 short2qstr(const Char *src)
462 {
463     static char *sdst = NULL;
464     static size_t dstsize = 0;
465     char *dst, *edst;
466 
467     if (src == NULL)
468 	return (NULL);
469 
470     if (sdst == NULL) {
471 	dstsize = MALLOC_INCR;
472 	sdst = xmalloc((dstsize + MALLOC_SURPLUS) * sizeof(char));
473     }
474     dst = sdst;
475     edst = &dst[dstsize];
476     while (*src) {
477 	if (*src & QUOTE) {
478 	    *dst++ = '\\';
479 	    if (dst == edst) {
480 		dstsize += MALLOC_INCR;
481 		sdst = xrealloc(sdst,
482 				(dstsize + MALLOC_SURPLUS) * sizeof(char));
483 		edst = &sdst[dstsize];
484 		dst = &edst[-MALLOC_INCR];
485 	    }
486 	}
487 	dst += one_wctomb(dst, *src & CHAR);
488 	src++;
489 	if (dst >= edst) {
490 	    ptrdiff_t i = dst - edst;
491 	    dstsize += MALLOC_INCR;
492 	    sdst = xrealloc(sdst, (dstsize + MALLOC_SURPLUS) * sizeof(char));
493 	    edst = &sdst[dstsize];
494 	    dst = &edst[-MALLOC_INCR + i];
495 	}
496     }
497     *dst = 0;
498     return (sdst);
499 }
500 
501 struct blk_buf *
502 bb_alloc()
503 {
504     return xcalloc(1, sizeof(struct blk_buf));
505 }
506 
507 static void
508 bb_store(struct blk_buf *bb, Char *str)
509 {
510     if (bb->len == bb->size) { /* Keep space for terminating NULL */
511 	if (bb->size == 0)
512 	    bb->size = 16; /* Arbitrary */
513 	else
514 	    bb->size *= 2;
515 	bb->vec = xrealloc(bb->vec, bb->size * sizeof (*bb->vec));
516     }
517     bb->vec[bb->len] = str;
518 }
519 
520 void
521 bb_append(struct blk_buf *bb, Char *str)
522 {
523     bb_store(bb, str);
524     bb->len++;
525 }
526 
527 void
528 bb_cleanup(void *xbb)
529 {
530     struct blk_buf *bb;
531     size_t i;
532 
533     bb = xbb;
534     for (i = 0; i < bb->len; i++)
535 	xfree(bb->vec[i]);
536     xfree(bb->vec);
537 }
538 
/*
 * Release a block buffer completely: its contents via bb_cleanup(), then
 * the header itself.
 */
void
bb_free(void *bb)
{
    void *header = bb;

    bb_cleanup(header);
    xfree(header);
}
545 
546 Char **
547 bb_finish(struct blk_buf *bb)
548 {
549     bb_store(bb, NULL);
550     return xrealloc(bb->vec, (bb->len + 1) * sizeof (*bb->vec));
551 }
552 
553 #define DO_STRBUF(STRBUF, CHAR, STRLEN)				\
554 								\
555 struct STRBUF *							\
556 STRBUF##_alloc(void)						\
557 {								\
558     return xcalloc(1, sizeof(struct STRBUF));			\
559 }								\
560 								\
561 static void							\
562 STRBUF##_store1(struct STRBUF *buf, CHAR c)			\
563 {								\
564     if (buf->size == buf->len) {				\
565 	if (buf->size == 0)					\
566 	    buf->size = 64; /* Arbitrary */			\
567 	else							\
568 	    buf->size *= 2;					\
569 	buf->s = xrealloc(buf->s, buf->size * sizeof(*buf->s));	\
570     }								\
571     buf->s[buf->len] = c;					\
572 }								\
573 								\
574 /* Like strbuf_append1(buf, '\0'), but don't advance len */	\
575 void								\
576 STRBUF##_terminate(struct STRBUF *buf)				\
577 {								\
578     STRBUF##_store1(buf, '\0');					\
579 }								\
580 								\
581 void								\
582 STRBUF##_append1(struct STRBUF *buf, CHAR c)			\
583 {								\
584     STRBUF##_store1(buf, c);					\
585     buf->len++;							\
586 }								\
587 								\
588 void								\
589 STRBUF##_appendn(struct STRBUF *buf, const CHAR *s, size_t len)	\
590 {								\
591     if (buf->size < buf->len + len) {				\
592 	if (buf->size == 0)					\
593 	    buf->size = 64; /* Arbitrary */			\
594 	while (buf->size < buf->len + len)			\
595 	    buf->size *= 2;					\
596 	buf->s = xrealloc(buf->s, buf->size * sizeof(*buf->s));	\
597     }								\
598     memcpy(buf->s + buf->len, s, len * sizeof(*buf->s));	\
599     buf->len += len;						\
600 }								\
601 								\
602 void								\
603 STRBUF##_append(struct STRBUF *buf, const CHAR *s)		\
604 {								\
605     STRBUF##_appendn(buf, s, STRLEN(s));			\
606 }								\
607 								\
608 CHAR *								\
609 STRBUF##_finish(struct STRBUF *buf)				\
610 {								\
611     STRBUF##_append1(buf, 0);					\
612     return xrealloc(buf->s, buf->len * sizeof(*buf->s));	\
613 }								\
614 								\
615 void								\
616 STRBUF##_cleanup(void *xbuf)					\
617 {								\
618     struct STRBUF *buf;						\
619 								\
620     buf = xbuf;							\
621     xfree(buf->s);						\
622 }								\
623 								\
624 void								\
625 STRBUF##_free(void *xbuf)					\
626 {								\
627     STRBUF##_cleanup(xbuf);					\
628     xfree(xbuf);						\
629 }								\
630 								\
631 const struct STRBUF STRBUF##_init /* = STRBUF##_INIT; */
632 
633 DO_STRBUF(strbuf, char, strlen);
634 DO_STRBUF(Strbuf, Char, Strlen);
635