xref: /freebsd/contrib/tcsh/glob.c (revision f4dc9bf43457515e5c88d1400d4f5ff70a82d9c7)
1 /*
2  * Copyright (c) 1989 The Regents of the University of California.
3  * All rights reserved.
4  *
5  * This code is derived from software contributed to Berkeley by
6  * Guido van Rossum.
7  *
8  * Redistribution and use in source and binary forms, with or without
9  * modification, are permitted provided that the following conditions
10  * are met:
11  * 1. Redistributions of source code must retain the above copyright
12  *    notice, this list of conditions and the following disclaimer.
13  * 2. Redistributions in binary form must reproduce the above copyright
14  *    notice, this list of conditions and the following disclaimer in the
15  *    documentation and/or other materials provided with the distribution.
16  * 3. Neither the name of the University nor the names of its contributors
17  *    may be used to endorse or promote products derived from this software
18  *    without specific prior written permission.
19  *
20  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
21  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
22  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
23  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
24  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
25  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
26  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
27  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
28  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
29  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
30  * SUCH DAMAGE.
31  */
32 #if defined(LIBC_SCCS) && !defined(lint)
33 static char sccsid[] = "@(#)glob.c	5.12 (Berkeley) 6/24/91";
34 #endif /* LIBC_SCCS and not lint */
35 /*
36  * Glob: the interface is a superset of the one defined in POSIX 1003.2,
37  * draft 9.
38  *
39  * The [!...] convention to negate a range is supported (SysV, Posix, ksh).
40  *
41  * Optional extra services, controlled by flags not defined by POSIX:
42  *
43  * GLOB_QUOTE:
44  *	Escaping convention: \ inhibits any special meaning the following
45  *	character might have (except \ at end of string is retained).
46  * GLOB_MAGCHAR:
47  *	Set in gl_flags if pattern contained a globbing character.
48  * GLOB_ALTNOT:
49  *	Use ^ instead of ! for "not".
50  * gl_matchc:
51  *	Number of matches in the current invocation of glob.
52  */
53 
54 #ifdef WINNT_NATIVE
55 	#pragma warning(disable:4244)
56 #endif /* WINNT_NATIVE */
57 
58 #define Char __Char
59 #include "sh.h"
60 #include "glob.h"
61 
62 #undef Char
63 #undef QUOTE
64 #undef TILDE
65 #undef META
66 #undef ismeta
67 #undef Strchr
68 
69 #ifndef S_ISDIR
70 #define S_ISDIR(a)	(((a) & S_IFMT) == S_IFDIR)
71 #endif
72 
73 #if !defined(S_ISLNK) && defined(S_IFLNK)
74 #define S_ISLNK(a)	(((a) & S_IFMT) == S_IFLNK)
75 #endif
76 
77 #if !defined(S_ISLNK) && !defined(lstat)
78 #define lstat stat
79 #endif
80 
81 typedef unsigned short Char;
82 
83 static	int	 glob1 		(Char *, glob_t *, int);
84 static	int	 glob2		(struct strbuf *, const Char *, glob_t *, int);
85 static	int	 glob3		(struct strbuf *, const Char *, const Char *,
86 				 const Char *, glob_t *, int);
87 static	void	 globextend	(const char *, glob_t *);
88 static	int	 match		(const char *, const Char *, const Char *,
89 				 int);
90 static	int	 compare	(const void *, const void *);
91 static 	DIR	*Opendir	(const char *);
92 #ifdef S_IFLNK
93 static	int	 Lstat		(const char *, struct stat *);
94 #endif
95 static	int	 Stat		(const char *, struct stat *sb);
96 static 	Char 	*Strchr		(Char *, int);
97 #ifdef DEBUG
98 static	void	 qprintf	(const Char *);
99 #endif
100 
/* Plain characters that have a meaning in a pattern or a path. */
#define	EOS		'\0'
#define	SEP		'/'
#define	DOT		'.'
#define	DOLLAR		'$'
#define	TILDE		'~'
#define	UNDERSCORE	'_'
#define	QUOTE		'\\'
#define	STAR		'*'
#define	QUESTION	'?'
#define	LBRACKET	'['
#define	RBRACKET	']'
#define	RANGE		'-'
#define	NOT		'!'
#define	ALTNOT		'^'

/* Flag bits and masks applied to a compiled pattern character. */
#define	M_META		0x8000	/* character is a glob operator */
#define	M_PROTECT	0x4000	/* character was quoted in the source pattern */
#define	M_MASK		0xffff	/* every bit of a pattern character */
#define	M_ASCII		0x00ff	/* just the character byte, flags removed */

/* Helpers to build, strip and test the flag bits. */
#define	META(c)		((c)|M_META)
#define	LCHAR(c)	((c)&M_ASCII)
#define	ismeta(c)	(((c)&M_META) != 0)

/* The compiled forms of the glob operators. */
#define	M_ALL		META('*')
#define	M_ONE		META('?')
#define	M_SET		META('[')
#define	M_END		META(']')
#define	M_RNG		META('-')
#define	M_NOT		META('!')
#define	M_ALTNOT	META('^')
131 
132 int
133 globcharcoll(__Char c1, __Char c2, int cs)
134 {
135 #if defined(NLS) && defined(LC_COLLATE) && defined(HAVE_STRCOLL)
136 # if defined(WIDE_STRINGS)
137     wchar_t s1[2], s2[2];
138 
139     if (c1 == c2)
140 	return (0);
141     if (cs) {
142 	c1 = towlower(c1);
143 	c2 = towlower(c2);
144     } else {
145 #ifndef __FreeBSD__
146 	/* This should not be here, but I'll rather leave it in than engage in
147 	   a LC_COLLATE flamewar about a shell I don't use... */
148 	if (iswlower(c1) && iswupper(c2))
149 	    return (1);
150 	if (iswupper(c1) && iswlower(c2))
151 	    return (-1);
152 #endif
153     }
154     s1[0] = c1;
155     s2[0] = c2;
156     s1[1] = s2[1] = '\0';
157 #ifdef __FreeBSD__
158     return wcscmp(s1, s2);
159 #else
160     return wcscoll(s1, s2);
161 #endif
162 # else /* not WIDE_STRINGS */
163     char s1[2], s2[2];
164 
165     if (c1 == c2)
166 	return (0);
167     /*
168      * From kevin lyda <kevin@suberic.net>:
169      * strcoll does not guarantee case sorting, so we pre-process now:
170      */
171     if (cs) {
172 	c1 = islower(c1) ? c1 : tolower(c1);
173 	c2 = islower(c2) ? c2 : tolower(c2);
174     } else {
175 	if (islower(c1) && isupper(c2))
176 	    return (1);
177 	if (isupper(c1) && islower(c2))
178 	    return (-1);
179     }
180     s1[0] = c1;
181     s2[0] = c2;
182     s1[1] = s2[1] = '\0';
183     return strcoll(s1, s2);
184 # endif
185 #else
186     return (c1 - c2);
187 #endif
188 }
189 
190 /*
191  * Need to dodge two kernel bugs:
192  * opendir("") != opendir(".")
193  * NAMEI_BUG: on plain files trailing slashes are ignored in some kernels.
194  *            POSIX specifies that they should be ignored in directories.
195  */
196 
/*
 * opendir() wrapper: an empty name opens the current directory.  On HP-UX
 * the name is first checked with stat() and anything that is not a
 * directory is refused, because opendir() can hang on some device files.
 * Returns the open stream, or NULL on failure.
 */
static DIR *
Opendir(const char *str)
{
    if (*str == '\0')
	return opendir(".");

#if defined(hpux) || defined(__hpux)
    {
	struct stat st;

	if (stat(str, &st) == -1 || !S_ISDIR(st.st_mode))
	    return NULL;
    }
#endif

    return opendir(str);
}
215 
#ifdef S_IFLNK
/*
 * lstat() wrapper.  Returns what lstat() returns, except that with
 * NAMEI_BUG defined a successful call on a name ending in '/' that turns
 * out not to be a directory is reported as a failure (-1).
 *
 * When symbolic links are not available, Lstat is simply an alias of Stat.
 */
static int
Lstat(const char *fn, struct stat *sb)
{
    int st;

    st = lstat(fn, sb);
# ifdef NAMEI_BUG
    /* Only look at *sb when lstat() actually filled it in. */
    if (st == 0 && *fn != 0 && strend(fn)[-1] == '/' &&
	!S_ISDIR(sb->st_mode))
	st = -1;
# endif	/* NAMEI_BUG */
    return st;
}
#else
#define Lstat Stat
#endif /* S_IFLNK */
232 
/*
 * stat() wrapper.  Returns what stat() returns, except that with
 * NAMEI_BUG defined a successful call on a name ending in '/' that turns
 * out not to be a directory is reported as a failure (-1).
 */
static int
Stat(const char *fn, struct stat *sb)
{
    int st;

    st = stat(fn, sb);
#ifdef NAMEI_BUG
    /* Only look at *sb when stat() actually filled it in. */
    if (st == 0 && *fn != 0 && strend(fn)[-1] == '/' &&
	!S_ISDIR(sb->st_mode))
	st = -1;
#endif /* NAMEI_BUG */
    return st;
}
245 
246 static Char *
247 Strchr(Char *str, int ch)
248 {
249     do
250 	if (*str == ch)
251 	    return (str);
252     while (*str++);
253     return (NULL);
254 }
255 
#ifdef DEBUG
/*
 * Debug dump of a compiled pattern, printed as three lines: the character
 * bytes, a '"' under each protected (quoted) character, and a '_' under
 * each meta character.
 */
static void
qprintf(const Char *s)
{
    const Char *cur;

    /* line 1: the characters with their flag bits removed */
    cur = s;
    while (*cur) {
	printf("%c", *cur & 0xff);
	cur++;
    }
    printf("\n");

    /* line 2: marks the characters carrying M_PROTECT */
    cur = s;
    while (*cur) {
	printf("%c", *cur & M_PROTECT ? '"' : ' ');
	cur++;
    }
    printf("\n");

    /* line 3: marks the characters carrying M_META */
    cur = s;
    while (*cur) {
	printf("%c", *cur & M_META ? '_' : ' ');
	cur++;
    }
    printf("\n");
}
#endif /* DEBUG */
273 
/*
 * qsort() callback ordering two path names.  Each argument points to a
 * `char *' element of the result vector.  Uses strcoll() when NLS support
 * with strcoll() is compiled in and strcmp() otherwise.
 */
static int
compare(const void *p, const void *q)
{
    const char *lhs = *(char *const *) p;
    const char *rhs = *(char *const *) q;

#if defined(NLS) && defined(HAVE_STRCOLL)
    return strcoll(lhs, rhs);
#else
    return strcmp(lhs, rhs);
#endif /* NLS && HAVE_STRCOLL */
}
283 
284 /*
285  * The main glob() routine: compiles the pattern (optionally processing
286  * quotes), calls glob1() to do the real pattern matching, and finally
287  * sorts the list (unless unsorted operation is requested).  Returns 0
288  * if things went well, nonzero if errors occurred.  It is not an error
289  * to find no matches.
290  */
291 int
292 glob(const char *pattern, int flags, int (*errfunc) (const char *, int),
293      glob_t *pglob)
294 {
295     int     err, oldpathc;
296     Char *bufnext, m_not;
297     const unsigned char *patnext;
298     int     c, not;
299     Char *qpatnext, *patbuf;
300     int     no_match;
301 
302     patnext = (const unsigned char *) pattern;
303     if (!(flags & GLOB_APPEND)) {
304 	pglob->gl_pathc = 0;
305 	pglob->gl_pathv = NULL;
306 	if (!(flags & GLOB_DOOFFS))
307 	    pglob->gl_offs = 0;
308     }
309     pglob->gl_flags = flags & ~GLOB_MAGCHAR;
310     pglob->gl_errfunc = errfunc;
311     oldpathc = pglob->gl_pathc;
312     pglob->gl_matchc = 0;
313 
314     if (pglob->gl_flags & GLOB_ALTNOT) {
315 	not = ALTNOT;
316 	m_not = M_ALTNOT;
317     }
318     else {
319 	not = NOT;
320 	m_not = M_NOT;
321     }
322 
323     patbuf = xmalloc((strlen(pattern) + 1) * sizeof(*patbuf));
324     bufnext = patbuf;
325 
326     no_match = *patnext == not;
327     if (no_match)
328 	patnext++;
329 
330     if (flags & GLOB_QUOTE) {
331 	/* Protect the quoted characters */
332 	while ((c = *patnext++) != EOS) {
333 #ifdef WIDE_STRINGS
334 	    int len;
335 
336 	    len = mblen((const char *)(patnext - 1), MB_LEN_MAX);
337 	    if (len == -1)
338 		TCSH_IGNORE(mblen(NULL, 0));
339 	    else if (len > 1) {
340 		*bufnext++ = (Char) c;
341 		while (--len != 0)
342 		    *bufnext++ = (Char) (*patnext++ | M_PROTECT);
343 	    } else
344 #endif /* WIDE_STRINGS */
345 	    if (c == QUOTE) {
346 		if ((c = *patnext++) == EOS) {
347 		    c = QUOTE;
348 		    --patnext;
349 		}
350 		*bufnext++ = (Char) (c | M_PROTECT);
351 	    }
352 	    else
353 		*bufnext++ = (Char) c;
354 	}
355     }
356     else
357 	while ((c = *patnext++) != EOS)
358 	    *bufnext++ = (Char) c;
359     *bufnext = EOS;
360 
361     bufnext = patbuf;
362     qpatnext = patbuf;
363     while ((c = *qpatnext++) != EOS) {
364 	switch (c) {
365 	case LBRACKET:
366 	    c = *qpatnext;
367 	    if (c == not)
368 		++qpatnext;
369 	    if (*qpatnext == EOS ||
370 		Strchr(qpatnext + 1, RBRACKET) == NULL) {
371 		*bufnext++ = LBRACKET;
372 		if (c == not)
373 		    --qpatnext;
374 		break;
375 	    }
376 	    pglob->gl_flags |= GLOB_MAGCHAR;
377 	    *bufnext++ = M_SET;
378 	    if (c == not)
379 		*bufnext++ = m_not;
380 	    c = *qpatnext++;
381 	    do {
382 		*bufnext++ = LCHAR(c);
383 		if (*qpatnext == RANGE &&
384 		    (c = qpatnext[1]) != RBRACKET) {
385 		    *bufnext++ = M_RNG;
386 		    *bufnext++ = LCHAR(c);
387 		    qpatnext += 2;
388 		}
389 	    } while ((c = *qpatnext++) != RBRACKET);
390 	    *bufnext++ = M_END;
391 	    break;
392 	case QUESTION:
393 	    pglob->gl_flags |= GLOB_MAGCHAR;
394 	    *bufnext++ = M_ONE;
395 	    break;
396 	case STAR:
397 	    pglob->gl_flags |= GLOB_MAGCHAR;
398 	    /* collapse adjacent stars to one [or three if globstar],
399 	     * to avoid exponential behavior
400 	     */
401 	    if (bufnext == patbuf || bufnext[-1] != M_ALL ||
402 	       ((flags & GLOB_STAR) != 0 &&
403 		 (bufnext - 1 == patbuf || bufnext[-2] != M_ALL ||
404 		 bufnext - 2 == patbuf || bufnext[-3] != M_ALL)))
405 		*bufnext++ = M_ALL;
406 	    break;
407 	default:
408 	    *bufnext++ = LCHAR(c);
409 	    break;
410 	}
411     }
412     *bufnext = EOS;
413 #ifdef DEBUG
414     qprintf(patbuf);
415 #endif
416 
417     if ((err = glob1(patbuf, pglob, no_match)) != 0) {
418 	xfree(patbuf);
419 	return (err);
420     }
421 
422     /*
423      * If there was no match we are going to append the pattern
424      * if GLOB_NOCHECK was specified or if GLOB_NOMAGIC was specified
425      * and the pattern did not contain any magic characters
426      * GLOB_NOMAGIC is there just for compatibility with csh.
427      */
428     if (pglob->gl_pathc == oldpathc &&
429 	((flags & GLOB_NOCHECK) ||
430 	 ((flags & GLOB_NOMAGIC) && !(pglob->gl_flags & GLOB_MAGCHAR)))) {
431 	if (!(flags & GLOB_QUOTE))
432 	    globextend(pattern, pglob);
433 	else {
434 	    char *copy, *dest;
435 	    const char *src;
436 
437 	    /* copy pattern, interpreting quotes */
438 	    copy = xmalloc(strlen(pattern) + 1);
439 	    dest = copy;
440 	    src = pattern;
441 	    while (*src != EOS) {
442 		if (*src == QUOTE) {
443 		    if (*++src == EOS)
444 			--src;
445 		}
446 		*dest++ = *src++;
447 	    }
448 	    *dest = EOS;
449 	    globextend(copy, pglob);
450 	    xfree(copy);
451 	}
452 	xfree(patbuf);
453 	return 0;
454     }
455     else if (!(flags & GLOB_NOSORT) && (pglob->gl_pathc != oldpathc))
456 	qsort(pglob->gl_pathv + pglob->gl_offs + oldpathc,
457 	      pglob->gl_pathc - oldpathc, sizeof(char *), compare);
458     xfree(patbuf);
459     return (0);
460 }
461 
462 static int
463 glob1(Char *pattern, glob_t *pglob, int no_match)
464 {
465     struct strbuf pathbuf = strbuf_INIT;
466     int err;
467 
468     /*
469      * a null pathname is invalid -- POSIX 1003.1 sect. 2.4.
470      */
471     if (*pattern == EOS)
472 	return (0);
473     err = glob2(&pathbuf, pattern, pglob, no_match);
474     xfree(pathbuf.s);
475     return err;
476 }
477 
478 /*
479  * functions glob2 and glob3 are mutually recursive; there is one level
480  * of recursion for each segment in the pattern that contains one or
481  * more meta characters.
482  */
483 static int
484 glob2(struct strbuf *pathbuf, const Char *pattern, glob_t *pglob, int no_match)
485 {
486     struct stat sbuf;
487     int anymeta;
488     const Char *p;
489     size_t orig_len;
490 
491     /*
492      * loop over pattern segments until end of pattern or until segment with
493      * meta character found.
494      */
495     anymeta = 0;
496     for (;;) {
497 	if (*pattern == EOS) {	/* end of pattern? */
498 	    strbuf_terminate(pathbuf);
499 
500 	    if (Lstat(pathbuf->s, &sbuf))
501 		return (0);
502 
503 	    if (((pglob->gl_flags & GLOB_MARK) &&
504 		 pathbuf->s[pathbuf->len - 1] != SEP) &&
505 		(S_ISDIR(sbuf.st_mode)
506 #ifdef S_IFLNK
507 		 || (S_ISLNK(sbuf.st_mode) &&
508 		     (Stat(pathbuf->s, &sbuf) == 0) &&
509 		     S_ISDIR(sbuf.st_mode))
510 #endif
511 		 )) {
512 		strbuf_append1(pathbuf, SEP);
513 		strbuf_terminate(pathbuf);
514 	    }
515 	    ++pglob->gl_matchc;
516 	    globextend(pathbuf->s, pglob);
517 	    return 0;
518 	}
519 
520 	/* find end of next segment, tentatively copy to pathbuf */
521 	p = pattern;
522 	orig_len = pathbuf->len;
523 	while (*p != EOS && *p != SEP) {
524 	    if (ismeta(*p))
525 		anymeta = 1;
526 	    strbuf_append1(pathbuf, *p++);
527 	}
528 
529 	if (!anymeta) {		/* no expansion, do next segment */
530 	    pattern = p;
531 	    while (*pattern == SEP)
532 		strbuf_append1(pathbuf, *pattern++);
533 	}
534 	else {			/* need expansion, recurse */
535 	    pathbuf->len = orig_len;
536 	    return (glob3(pathbuf, pattern, p, pattern, pglob, no_match));
537 	}
538     }
539     /* NOTREACHED */
540 }
541 
542 static size_t
543 One_Char_mbtowc(__Char *pwc, const Char *s, size_t n)
544 {
545 #ifdef WIDE_STRINGS
546     char buf[MB_LEN_MAX], *p;
547 
548     if (n > MB_LEN_MAX)
549 	n = MB_LEN_MAX;
550     p = buf;
551     while (p < buf + n && (*p++ = LCHAR(*s++)) != 0)
552 	;
553     return one_mbtowc(pwc, buf, n);
554 #else
555     *pwc = *s & CHAR;
556     return 1;
557 #endif
558 }
559 
560 static int
561 glob3(struct strbuf *pathbuf, const Char *pattern, const Char *restpattern,
562       const Char *pglobstar, glob_t *pglob, int no_match)
563 {
564     DIR    *dirp;
565     struct dirent *dp;
566     struct stat sbuf;
567     int     err;
568     Char m_not = (pglob->gl_flags & GLOB_ALTNOT) ? M_ALTNOT : M_NOT;
569     size_t orig_len;
570     int globstar = 0;
571     int chase_symlinks = 0;
572     const Char *termstar = NULL;
573 
574     strbuf_terminate(pathbuf);
575     orig_len = pathbuf->len;
576     errno = err = 0;
577 
578     while (pglobstar < restpattern) {
579 	__Char wc;
580 	size_t width = One_Char_mbtowc(&wc, pglobstar, MB_LEN_MAX);
581 	if ((pglobstar[0] & M_MASK) == M_ALL &&
582 	    (pglobstar[width] & M_MASK) == M_ALL) {
583 	    globstar = 1;
584 	    chase_symlinks = (pglobstar[2 * width] & M_MASK) == M_ALL;
585 	    termstar = pglobstar + (2 + chase_symlinks) * width;
586 	    break;
587 	}
588         pglobstar += width;
589     }
590 
591     if (globstar) {
592 	err = pglobstar==pattern && termstar==restpattern ?
593 		*restpattern == EOS ?
594 		glob2(pathbuf, restpattern - 1, pglob, no_match) :
595 		glob2(pathbuf, restpattern + 1, pglob, no_match) :
596 		glob3(pathbuf, pattern, restpattern, termstar, pglob, no_match);
597 	if (err)
598 	    return err;
599 	pathbuf->len = orig_len;
600 	strbuf_terminate(pathbuf);
601     }
602 
603     if (*pathbuf->s && (Lstat(pathbuf->s, &sbuf) || !S_ISDIR(sbuf.st_mode)
604 #ifdef S_IFLINK
605 	     && ((globstar && !chase_symlinks) || !S_ISLNK(sbuf.st_mode))
606 #endif
607 	))
608 	return 0;
609 
610     if (!(dirp = Opendir(pathbuf->s))) {
611 	/* todo: don't call for ENOENT or ENOTDIR? */
612 	if ((pglob->gl_errfunc && (*pglob->gl_errfunc) (pathbuf->s, errno)) ||
613 	    (pglob->gl_flags & GLOB_ERR))
614 	    return (GLOB_ABEND);
615 	else
616 	    return (0);
617     }
618 
619     /* search directory for matching names */
620     while ((dp = readdir(dirp)) != NULL) {
621 	/* initial DOT must be matched literally */
622 	if (dp->d_name[0] == DOT && *pattern != DOT)
623 	    if (!(pglob->gl_flags & GLOB_DOT) || !dp->d_name[1] ||
624 		(dp->d_name[1] == DOT && !dp->d_name[2]))
625 		continue; /*unless globdot and not . or .. */
626 	pathbuf->len = orig_len;
627 	strbuf_append(pathbuf, dp->d_name);
628 	strbuf_terminate(pathbuf);
629 
630 	if (globstar) {
631 #ifdef S_IFLNK
632 	    if (!chase_symlinks &&
633 		(Lstat(pathbuf->s, &sbuf) || S_ISLNK(sbuf.st_mode)))
634 		    continue;
635 #endif
636 	    if (match(pathbuf->s + orig_len, pattern, termstar,
637 		(int)m_not) == no_match)
638 		    continue;
639 	    strbuf_append1(pathbuf, SEP);
640 	    strbuf_terminate(pathbuf);
641 	    if ((err = glob2(pathbuf, pglobstar, pglob, no_match)) != 0)
642 		break;
643 	} else {
644 	    if (match(pathbuf->s + orig_len, pattern, restpattern,
645 		(int) m_not) == no_match)
646 		continue;
647 	    if ((err = glob2(pathbuf, restpattern, pglob, no_match)) != 0)
648 		break;
649 	}
650     }
651     /* todo: check error from readdir? */
652     closedir(dirp);
653     return (err);
654 }
655 
656 
657 /*
658  * Extend the gl_pathv member of a glob_t structure to accomodate a new item,
659  * add the new item, and update gl_pathc.
660  *
661  * This assumes the BSD realloc, which only copies the block when its size
662  * crosses a power-of-two boundary; for v7 realloc, this would cause quadratic
663  * behavior.
664  *
665  * Return 0 if new item added, error code if memory couldn't be allocated.
666  *
667  * Invariant of the glob_t structure:
668  *	Either gl_pathc is zero and gl_pathv is NULL; or gl_pathc > 0 and
669  *	 gl_pathv points to (gl_offs + gl_pathc + 1) items.
670  */
671 static void
672 globextend(const char *path, glob_t *pglob)
673 {
674     char **pathv;
675     int i;
676     size_t newsize;
677 
678     newsize = sizeof(*pathv) * (2 + pglob->gl_pathc + pglob->gl_offs);
679     pathv = xrealloc(pglob->gl_pathv, newsize);
680 
681     if (pglob->gl_pathv == NULL && pglob->gl_offs > 0) {
682 	/* first time around -- clear initial gl_offs items */
683 	pathv += pglob->gl_offs;
684 	for (i = pglob->gl_offs; --i >= 0;)
685 	    *--pathv = NULL;
686     }
687     pglob->gl_pathv = pathv;
688 
689     pathv[pglob->gl_offs + pglob->gl_pathc++] = strsave(path);
690     pathv[pglob->gl_offs + pglob->gl_pathc] = NULL;
691 }
692 
693 /*
694  * pattern matching function for filenames.  Each occurrence of the *
695  * pattern causes a recursion level.
696  */
697 static  int
698 match(const char *name, const Char *pat, const Char *patend, int m_not)
699 {
700     int ok, negate_range;
701     Char c;
702 
703     while (pat < patend) {
704 	size_t lwk;
705 	__Char wc, wk;
706 
707 	c = *pat; /* Only for M_MASK bits */
708 	pat += One_Char_mbtowc(&wc, pat, MB_LEN_MAX);
709 	lwk = one_mbtowc(&wk, name, MB_LEN_MAX);
710 	switch (c & M_MASK) {
711 	case M_ALL:
712 	    while (pat < patend && (*pat & M_MASK) == M_ALL)  /* eat consecutive '*' */
713 		pat += One_Char_mbtowc(&wc, pat, MB_LEN_MAX);
714 	    if (pat == patend)
715 	        return (1);
716 	    while (!match(name, pat, patend, m_not)) {
717 		if (*name == EOS)
718 		    return (0);
719 		name += lwk;
720 		lwk = one_mbtowc(&wk, name, MB_LEN_MAX);
721 	    }
722 	    return (1);
723 	case M_ONE:
724 	    if (*name == EOS)
725 		return (0);
726 	    name += lwk;
727 	    break;
728 	case M_SET:
729 	    ok = 0;
730 	    if (*name == EOS)
731 		return (0);
732 	    name += lwk;
733 	    if ((negate_range = ((*pat & M_MASK) == m_not)) != 0)
734 		++pat;
735 	    while ((*pat & M_MASK) != M_END) {
736 		pat += One_Char_mbtowc(&wc, pat, MB_LEN_MAX);
737 		if ((*pat & M_MASK) == M_RNG) {
738 		    __Char wc2;
739 
740 		    pat++;
741 		    pat += One_Char_mbtowc(&wc2, pat, MB_LEN_MAX);
742 		    if (globcharcoll(wc, wk, 0) <= 0 &&
743 			globcharcoll(wk, wc2, 0) <= 0)
744 			ok = 1;
745 		} else if (wc == wk)
746 		    ok = 1;
747 	    }
748 	    pat += One_Char_mbtowc(&wc, pat, MB_LEN_MAX);
749 	    if (ok == negate_range)
750 		return (0);
751 	    break;
752 	default:
753 	    if (*name == EOS || samecase(wk) != samecase(wc))
754 		return (0);
755 	    name += lwk;
756 	    break;
757 	}
758     }
759     return (*name == EOS);
760 }
761 
762 /* free allocated data belonging to a glob_t structure */
763 void
764 globfree(glob_t *pglob)
765 {
766     int i;
767     char **pp;
768 
769     if (pglob->gl_pathv != NULL) {
770 	pp = pglob->gl_pathv + pglob->gl_offs;
771 	for (i = pglob->gl_pathc; i--; ++pp)
772 	    if (*pp)
773 		xfree(*pp), *pp = NULL;
774 	xfree(pglob->gl_pathv), pglob->gl_pathv = NULL;
775     }
776 }
777