1*7c478bd9Sstevel@tonic-gate /*
2*7c478bd9Sstevel@tonic-gate * CDDL HEADER START
3*7c478bd9Sstevel@tonic-gate *
4*7c478bd9Sstevel@tonic-gate * The contents of this file are subject to the terms of the
5*7c478bd9Sstevel@tonic-gate * Common Development and Distribution License, Version 1.0 only
6*7c478bd9Sstevel@tonic-gate * (the "License"). You may not use this file except in compliance
7*7c478bd9Sstevel@tonic-gate * with the License.
8*7c478bd9Sstevel@tonic-gate *
9*7c478bd9Sstevel@tonic-gate * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
10*7c478bd9Sstevel@tonic-gate * or http://www.opensolaris.org/os/licensing.
11*7c478bd9Sstevel@tonic-gate * See the License for the specific language governing permissions
12*7c478bd9Sstevel@tonic-gate * and limitations under the License.
13*7c478bd9Sstevel@tonic-gate *
14*7c478bd9Sstevel@tonic-gate * When distributing Covered Code, include this CDDL HEADER in each
15*7c478bd9Sstevel@tonic-gate * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
16*7c478bd9Sstevel@tonic-gate * If applicable, add the following below this CDDL HEADER, with the
17*7c478bd9Sstevel@tonic-gate * fields enclosed by brackets "[]" replaced with your own identifying
18*7c478bd9Sstevel@tonic-gate * information: Portions Copyright [yyyy] [name of copyright owner]
19*7c478bd9Sstevel@tonic-gate *
20*7c478bd9Sstevel@tonic-gate * CDDL HEADER END
21*7c478bd9Sstevel@tonic-gate */
22*7c478bd9Sstevel@tonic-gate /*
23*7c478bd9Sstevel@tonic-gate * Copyright (c) 1997, by Sun Microsystems, Inc.
24*7c478bd9Sstevel@tonic-gate * All rights reserved.
25*7c478bd9Sstevel@tonic-gate */
26*7c478bd9Sstevel@tonic-gate
27*7c478bd9Sstevel@tonic-gate /* Copyright (c) 1984, 1986, 1987, 1988, 1989 AT&T */
28*7c478bd9Sstevel@tonic-gate /* All Rights Reserved */
29*7c478bd9Sstevel@tonic-gate
30*7c478bd9Sstevel@tonic-gate
31*7c478bd9Sstevel@tonic-gate /* Portions Copyright(c) 1988, Sun Microsystems Inc. */
32*7c478bd9Sstevel@tonic-gate /* All Rights Reserved */
33*7c478bd9Sstevel@tonic-gate
34*7c478bd9Sstevel@tonic-gate #pragma ident "%Z%%M% %I% %E% SMI" /* SVr4.0 1.1 */
35*7c478bd9Sstevel@tonic-gate
36*7c478bd9Sstevel@tonic-gate /*LINTLIBRARY*/
37*7c478bd9Sstevel@tonic-gate
38*7c478bd9Sstevel@tonic-gate /*
39*7c478bd9Sstevel@tonic-gate * routines to do regular expression matching
40*7c478bd9Sstevel@tonic-gate *
41*7c478bd9Sstevel@tonic-gate * Entry points:
42*7c478bd9Sstevel@tonic-gate *
43*7c478bd9Sstevel@tonic-gate * re_comp(s)
44*7c478bd9Sstevel@tonic-gate * char *s;
45*7c478bd9Sstevel@tonic-gate * ... returns 0 if the string s was compiled successfully,
46*7c478bd9Sstevel@tonic-gate * a pointer to an error message otherwise.
47*7c478bd9Sstevel@tonic-gate * If passed 0 or a null string returns without changing
48*7c478bd9Sstevel@tonic-gate * the currently compiled re (see note 11 below).
49*7c478bd9Sstevel@tonic-gate *
50*7c478bd9Sstevel@tonic-gate * re_exec(s)
51*7c478bd9Sstevel@tonic-gate * char *s;
52*7c478bd9Sstevel@tonic-gate * ... returns 1 if the string s matches the last compiled regular
53*7c478bd9Sstevel@tonic-gate * expression,
54*7c478bd9Sstevel@tonic-gate * 0 if the string s failed to match the last compiled
55*7c478bd9Sstevel@tonic-gate * regular expression, and
56*7c478bd9Sstevel@tonic-gate * -1 if the compiled regular expression was invalid
57*7c478bd9Sstevel@tonic-gate * (indicating an internal error).
58*7c478bd9Sstevel@tonic-gate *
59*7c478bd9Sstevel@tonic-gate * The strings passed to both re_comp and re_exec may have trailing or
60*7c478bd9Sstevel@tonic-gate * embedded newline characters; they are terminated by nulls.
61*7c478bd9Sstevel@tonic-gate *
62*7c478bd9Sstevel@tonic-gate * The identity of the author of these routines is lost in antiquity;
63*7c478bd9Sstevel@tonic-gate * this is essentially the same as the re code in the original V6 ed.
64*7c478bd9Sstevel@tonic-gate *
65*7c478bd9Sstevel@tonic-gate * The regular expressions recognized are described below. This description
66*7c478bd9Sstevel@tonic-gate * is essentially the same as that for ed.
67*7c478bd9Sstevel@tonic-gate *
68*7c478bd9Sstevel@tonic-gate * A regular expression specifies a set of strings of characters.
69*7c478bd9Sstevel@tonic-gate * A member of this set of strings is said to be matched by
70*7c478bd9Sstevel@tonic-gate * the regular expression. In the following specification for
71*7c478bd9Sstevel@tonic-gate * regular expressions the word `character' means any character but NUL.
72*7c478bd9Sstevel@tonic-gate *
73*7c478bd9Sstevel@tonic-gate * 1. Any character except a special character matches itself.
74*7c478bd9Sstevel@tonic-gate * Special characters are the regular expression delimiter plus
75*7c478bd9Sstevel@tonic-gate * \ [ . and sometimes ^ * $.
76*7c478bd9Sstevel@tonic-gate * 2. A . matches any character.
77*7c478bd9Sstevel@tonic-gate * 3. A \ followed by any character except a digit or ( )
78*7c478bd9Sstevel@tonic-gate * matches that character.
79*7c478bd9Sstevel@tonic-gate * 4. A nonempty string s bracketed [s] (or [^s]) matches any
80*7c478bd9Sstevel@tonic-gate * character in (or not in) s. In s, \ has no special meaning,
81*7c478bd9Sstevel@tonic-gate * and ] may only appear as the first letter. A substring
82*7c478bd9Sstevel@tonic-gate * a-b, with a and b in ascending ASCII order, stands for
83*7c478bd9Sstevel@tonic-gate * the inclusive range of ASCII characters.
84*7c478bd9Sstevel@tonic-gate * 5. A regular expression of form 1-4 followed by * matches a
85*7c478bd9Sstevel@tonic-gate * sequence of 0 or more matches of the regular expression.
86*7c478bd9Sstevel@tonic-gate * 6. A regular expression, x, of form 1-8, bracketed \(x\)
87*7c478bd9Sstevel@tonic-gate * matches what x matches.
88*7c478bd9Sstevel@tonic-gate * 7. A \ followed by a digit n matches a copy of the string that the
89*7c478bd9Sstevel@tonic-gate * bracketed regular expression beginning with the nth \( matched.
90*7c478bd9Sstevel@tonic-gate * 8. A regular expression of form 1-8, x, followed by a regular
91*7c478bd9Sstevel@tonic-gate * expression of form 1-7, y matches a match for x followed by
92*7c478bd9Sstevel@tonic-gate * a match for y, with the x match being as long as possible
93*7c478bd9Sstevel@tonic-gate * while still permitting a y match.
94*7c478bd9Sstevel@tonic-gate * 9. A regular expression of form 1-8 preceded by ^ (or followed
95*7c478bd9Sstevel@tonic-gate * by $), is constrained to matches that begin at the left
96*7c478bd9Sstevel@tonic-gate * (or end at the right) end of a line.
97*7c478bd9Sstevel@tonic-gate * 10. A regular expression of form 1-9 picks out the longest among
98*7c478bd9Sstevel@tonic-gate * the leftmost matches in a line.
99*7c478bd9Sstevel@tonic-gate * 11. An empty regular expression stands for a copy of the last
100*7c478bd9Sstevel@tonic-gate * regular expression encountered.
101*7c478bd9Sstevel@tonic-gate */
102*7c478bd9Sstevel@tonic-gate
103*7c478bd9Sstevel@tonic-gate #include <sys/types.h>
104*7c478bd9Sstevel@tonic-gate #include <stdlib.h>
105*7c478bd9Sstevel@tonic-gate #include <stddef.h>
106*7c478bd9Sstevel@tonic-gate
107*7c478bd9Sstevel@tonic-gate /*
108*7c478bd9Sstevel@tonic-gate * constants for re's
109*7c478bd9Sstevel@tonic-gate */
110*7c478bd9Sstevel@tonic-gate #define CBRA 1
111*7c478bd9Sstevel@tonic-gate #define CCHR 2
112*7c478bd9Sstevel@tonic-gate #define CDOT 4
113*7c478bd9Sstevel@tonic-gate #define CCL 6
114*7c478bd9Sstevel@tonic-gate #define NCCL 8
115*7c478bd9Sstevel@tonic-gate #define CDOL 10
116*7c478bd9Sstevel@tonic-gate #define CEOF 11
117*7c478bd9Sstevel@tonic-gate #define CKET 12
118*7c478bd9Sstevel@tonic-gate #define CBACK 18
119*7c478bd9Sstevel@tonic-gate
120*7c478bd9Sstevel@tonic-gate #define CSTAR 01
121*7c478bd9Sstevel@tonic-gate
122*7c478bd9Sstevel@tonic-gate #define ESIZE 512
123*7c478bd9Sstevel@tonic-gate #define NBRA 9
124*7c478bd9Sstevel@tonic-gate
125*7c478bd9Sstevel@tonic-gate static struct re_globals {
126*7c478bd9Sstevel@tonic-gate char _expbuf[ESIZE];
127*7c478bd9Sstevel@tonic-gate char *_braslist[NBRA], *_braelist[NBRA];
128*7c478bd9Sstevel@tonic-gate char _circf;
129*7c478bd9Sstevel@tonic-gate } *re_globals;
130*7c478bd9Sstevel@tonic-gate #define expbuf (_re->_expbuf)
131*7c478bd9Sstevel@tonic-gate #define braslist (_re->_braslist)
132*7c478bd9Sstevel@tonic-gate #define braelist (_re->_braelist)
133*7c478bd9Sstevel@tonic-gate #define circf (_re->_circf)
134*7c478bd9Sstevel@tonic-gate
135*7c478bd9Sstevel@tonic-gate /*
136*7c478bd9Sstevel@tonic-gate * forward declarations
137*7c478bd9Sstevel@tonic-gate */
138*7c478bd9Sstevel@tonic-gate static int backref(int, char *);
139*7c478bd9Sstevel@tonic-gate static int advance(char *, char *);
140*7c478bd9Sstevel@tonic-gate static int cclass(char *, char, int);
141*7c478bd9Sstevel@tonic-gate
142*7c478bd9Sstevel@tonic-gate /*
143*7c478bd9Sstevel@tonic-gate * compile the regular expression argument into a dfa
144*7c478bd9Sstevel@tonic-gate */
145*7c478bd9Sstevel@tonic-gate char *
re_comp(char * sp)146*7c478bd9Sstevel@tonic-gate re_comp(char *sp)
147*7c478bd9Sstevel@tonic-gate {
148*7c478bd9Sstevel@tonic-gate char c;
149*7c478bd9Sstevel@tonic-gate struct re_globals *_re = re_globals;
150*7c478bd9Sstevel@tonic-gate char *ep;
151*7c478bd9Sstevel@tonic-gate int cclcnt, numbra = 0;
152*7c478bd9Sstevel@tonic-gate char *lastep = 0;
153*7c478bd9Sstevel@tonic-gate char bracket[NBRA];
154*7c478bd9Sstevel@tonic-gate char *bracketp = &bracket[0];
155*7c478bd9Sstevel@tonic-gate char *retoolong = "Regular expression too long";
156*7c478bd9Sstevel@tonic-gate
157*7c478bd9Sstevel@tonic-gate if (_re == 0) {
158*7c478bd9Sstevel@tonic-gate _re = (struct re_globals *)calloc(1, sizeof (*_re));
159*7c478bd9Sstevel@tonic-gate if (_re == 0)
160*7c478bd9Sstevel@tonic-gate return ("Out of memory");
161*7c478bd9Sstevel@tonic-gate re_globals = _re;
162*7c478bd9Sstevel@tonic-gate }
163*7c478bd9Sstevel@tonic-gate ep = expbuf;
164*7c478bd9Sstevel@tonic-gate
165*7c478bd9Sstevel@tonic-gate #define comerr(msg) {expbuf[0] = 0; return (msg); }
166*7c478bd9Sstevel@tonic-gate
167*7c478bd9Sstevel@tonic-gate if (sp == 0 || *sp == '\0') {
168*7c478bd9Sstevel@tonic-gate if (*ep == 0)
169*7c478bd9Sstevel@tonic-gate return ("No previous regular expression");
170*7c478bd9Sstevel@tonic-gate return (0);
171*7c478bd9Sstevel@tonic-gate }
172*7c478bd9Sstevel@tonic-gate if (*sp == '^') {
173*7c478bd9Sstevel@tonic-gate circf = 1;
174*7c478bd9Sstevel@tonic-gate sp++;
175*7c478bd9Sstevel@tonic-gate }
176*7c478bd9Sstevel@tonic-gate else
177*7c478bd9Sstevel@tonic-gate circf = 0;
178*7c478bd9Sstevel@tonic-gate for (;;) {
179*7c478bd9Sstevel@tonic-gate if (ep >= &expbuf[ESIZE])
180*7c478bd9Sstevel@tonic-gate comerr(retoolong);
181*7c478bd9Sstevel@tonic-gate if ((c = *sp++) == '\0') {
182*7c478bd9Sstevel@tonic-gate if (bracketp != bracket)
183*7c478bd9Sstevel@tonic-gate comerr("unmatched \\(");
184*7c478bd9Sstevel@tonic-gate *ep++ = CEOF;
185*7c478bd9Sstevel@tonic-gate *ep++ = 0;
186*7c478bd9Sstevel@tonic-gate return (0);
187*7c478bd9Sstevel@tonic-gate }
188*7c478bd9Sstevel@tonic-gate if (c != '*')
189*7c478bd9Sstevel@tonic-gate lastep = ep;
190*7c478bd9Sstevel@tonic-gate switch (c) {
191*7c478bd9Sstevel@tonic-gate
192*7c478bd9Sstevel@tonic-gate case '.':
193*7c478bd9Sstevel@tonic-gate *ep++ = CDOT;
194*7c478bd9Sstevel@tonic-gate continue;
195*7c478bd9Sstevel@tonic-gate
196*7c478bd9Sstevel@tonic-gate case '*':
197*7c478bd9Sstevel@tonic-gate if (lastep == 0 || *lastep == CBRA || *lastep == CKET)
198*7c478bd9Sstevel@tonic-gate goto defchar;
199*7c478bd9Sstevel@tonic-gate *lastep |= CSTAR;
200*7c478bd9Sstevel@tonic-gate continue;
201*7c478bd9Sstevel@tonic-gate
202*7c478bd9Sstevel@tonic-gate case '$':
203*7c478bd9Sstevel@tonic-gate if (*sp != '\0')
204*7c478bd9Sstevel@tonic-gate goto defchar;
205*7c478bd9Sstevel@tonic-gate *ep++ = CDOL;
206*7c478bd9Sstevel@tonic-gate continue;
207*7c478bd9Sstevel@tonic-gate
208*7c478bd9Sstevel@tonic-gate case '[':
209*7c478bd9Sstevel@tonic-gate *ep++ = CCL;
210*7c478bd9Sstevel@tonic-gate *ep++ = 0;
211*7c478bd9Sstevel@tonic-gate cclcnt = 1;
212*7c478bd9Sstevel@tonic-gate if ((c = *sp++) == '^') {
213*7c478bd9Sstevel@tonic-gate c = *sp++;
214*7c478bd9Sstevel@tonic-gate ep[-2] = NCCL;
215*7c478bd9Sstevel@tonic-gate }
216*7c478bd9Sstevel@tonic-gate do {
217*7c478bd9Sstevel@tonic-gate if (c == '\0')
218*7c478bd9Sstevel@tonic-gate comerr("missing ]");
219*7c478bd9Sstevel@tonic-gate if (c == '-' && ep [-1] != 0) {
220*7c478bd9Sstevel@tonic-gate if ((c = *sp++) == ']') {
221*7c478bd9Sstevel@tonic-gate *ep++ = '-';
222*7c478bd9Sstevel@tonic-gate cclcnt++;
223*7c478bd9Sstevel@tonic-gate break;
224*7c478bd9Sstevel@tonic-gate }
225*7c478bd9Sstevel@tonic-gate while (ep[-1] < c) {
226*7c478bd9Sstevel@tonic-gate *ep = ep[-1] + 1;
227*7c478bd9Sstevel@tonic-gate ep++;
228*7c478bd9Sstevel@tonic-gate cclcnt++;
229*7c478bd9Sstevel@tonic-gate if (ep >= &expbuf[ESIZE])
230*7c478bd9Sstevel@tonic-gate comerr(retoolong);
231*7c478bd9Sstevel@tonic-gate }
232*7c478bd9Sstevel@tonic-gate }
233*7c478bd9Sstevel@tonic-gate *ep++ = c;
234*7c478bd9Sstevel@tonic-gate cclcnt++;
235*7c478bd9Sstevel@tonic-gate if (ep >= &expbuf[ESIZE])
236*7c478bd9Sstevel@tonic-gate comerr(retoolong);
237*7c478bd9Sstevel@tonic-gate } while ((c = *sp++) != ']');
238*7c478bd9Sstevel@tonic-gate lastep[1] = (char)cclcnt;
239*7c478bd9Sstevel@tonic-gate continue;
240*7c478bd9Sstevel@tonic-gate
241*7c478bd9Sstevel@tonic-gate case '\\':
242*7c478bd9Sstevel@tonic-gate if ((c = *sp++) == '(') {
243*7c478bd9Sstevel@tonic-gate if (numbra >= NBRA)
244*7c478bd9Sstevel@tonic-gate comerr("too many \\(\\) pairs");
245*7c478bd9Sstevel@tonic-gate *bracketp++ = (char)numbra;
246*7c478bd9Sstevel@tonic-gate *ep++ = CBRA;
247*7c478bd9Sstevel@tonic-gate *ep++ = numbra++;
248*7c478bd9Sstevel@tonic-gate continue;
249*7c478bd9Sstevel@tonic-gate }
250*7c478bd9Sstevel@tonic-gate if (c == ')') {
251*7c478bd9Sstevel@tonic-gate if (bracketp <= bracket)
252*7c478bd9Sstevel@tonic-gate comerr("unmatched \\)");
253*7c478bd9Sstevel@tonic-gate *ep++ = CKET;
254*7c478bd9Sstevel@tonic-gate *ep++ = *--bracketp;
255*7c478bd9Sstevel@tonic-gate continue;
256*7c478bd9Sstevel@tonic-gate }
257*7c478bd9Sstevel@tonic-gate if (c >= '1' && c < ('1' + NBRA)) {
258*7c478bd9Sstevel@tonic-gate *ep++ = CBACK;
259*7c478bd9Sstevel@tonic-gate *ep++ = c - '1';
260*7c478bd9Sstevel@tonic-gate continue;
261*7c478bd9Sstevel@tonic-gate }
262*7c478bd9Sstevel@tonic-gate *ep++ = CCHR;
263*7c478bd9Sstevel@tonic-gate *ep++ = c;
264*7c478bd9Sstevel@tonic-gate continue;
265*7c478bd9Sstevel@tonic-gate
266*7c478bd9Sstevel@tonic-gate defchar:
267*7c478bd9Sstevel@tonic-gate default:
268*7c478bd9Sstevel@tonic-gate *ep++ = CCHR;
269*7c478bd9Sstevel@tonic-gate *ep++ = c;
270*7c478bd9Sstevel@tonic-gate }
271*7c478bd9Sstevel@tonic-gate }
272*7c478bd9Sstevel@tonic-gate }
273*7c478bd9Sstevel@tonic-gate
274*7c478bd9Sstevel@tonic-gate /*
275*7c478bd9Sstevel@tonic-gate * match the argument string against the compiled re
276*7c478bd9Sstevel@tonic-gate */
277*7c478bd9Sstevel@tonic-gate int
re_exec(char * p1)278*7c478bd9Sstevel@tonic-gate re_exec(char *p1)
279*7c478bd9Sstevel@tonic-gate {
280*7c478bd9Sstevel@tonic-gate struct re_globals *_re = re_globals;
281*7c478bd9Sstevel@tonic-gate char *p2;
282*7c478bd9Sstevel@tonic-gate int c;
283*7c478bd9Sstevel@tonic-gate int rv;
284*7c478bd9Sstevel@tonic-gate
285*7c478bd9Sstevel@tonic-gate if (_re == 0)
286*7c478bd9Sstevel@tonic-gate return (0);
287*7c478bd9Sstevel@tonic-gate p2 = expbuf;
288*7c478bd9Sstevel@tonic-gate for (c = 0; c < NBRA; c++) {
289*7c478bd9Sstevel@tonic-gate braslist[c] = 0;
290*7c478bd9Sstevel@tonic-gate braelist[c] = 0;
291*7c478bd9Sstevel@tonic-gate }
292*7c478bd9Sstevel@tonic-gate if (circf)
293*7c478bd9Sstevel@tonic-gate return ((advance(p1, p2)));
294*7c478bd9Sstevel@tonic-gate /*
295*7c478bd9Sstevel@tonic-gate * fast check for first character
296*7c478bd9Sstevel@tonic-gate */
297*7c478bd9Sstevel@tonic-gate if (*p2 == CCHR) {
298*7c478bd9Sstevel@tonic-gate c = p2[1];
299*7c478bd9Sstevel@tonic-gate do {
300*7c478bd9Sstevel@tonic-gate if (*p1 != c)
301*7c478bd9Sstevel@tonic-gate continue;
302*7c478bd9Sstevel@tonic-gate if (rv = advance(p1, p2))
303*7c478bd9Sstevel@tonic-gate return (rv);
304*7c478bd9Sstevel@tonic-gate } while (*p1++);
305*7c478bd9Sstevel@tonic-gate return (0);
306*7c478bd9Sstevel@tonic-gate }
307*7c478bd9Sstevel@tonic-gate /*
308*7c478bd9Sstevel@tonic-gate * regular algorithm
309*7c478bd9Sstevel@tonic-gate */
310*7c478bd9Sstevel@tonic-gate do
311*7c478bd9Sstevel@tonic-gate if (rv = advance(p1, p2))
312*7c478bd9Sstevel@tonic-gate return (rv);
313*7c478bd9Sstevel@tonic-gate while (*p1++);
314*7c478bd9Sstevel@tonic-gate return (0);
315*7c478bd9Sstevel@tonic-gate }
316*7c478bd9Sstevel@tonic-gate
317*7c478bd9Sstevel@tonic-gate /*
318*7c478bd9Sstevel@tonic-gate * try to match the next thing in the dfa
319*7c478bd9Sstevel@tonic-gate */
320*7c478bd9Sstevel@tonic-gate static int
advance(char * lp,char * ep)321*7c478bd9Sstevel@tonic-gate advance(char *lp, char *ep)
322*7c478bd9Sstevel@tonic-gate {
323*7c478bd9Sstevel@tonic-gate char *curlp;
324*7c478bd9Sstevel@tonic-gate int i;
325*7c478bd9Sstevel@tonic-gate ptrdiff_t ct;
326*7c478bd9Sstevel@tonic-gate int rv;
327*7c478bd9Sstevel@tonic-gate struct re_globals *_re = re_globals;
328*7c478bd9Sstevel@tonic-gate
329*7c478bd9Sstevel@tonic-gate for (;;)
330*7c478bd9Sstevel@tonic-gate switch (*ep++) {
331*7c478bd9Sstevel@tonic-gate
332*7c478bd9Sstevel@tonic-gate case CCHR:
333*7c478bd9Sstevel@tonic-gate if (*ep++ == *lp++)
334*7c478bd9Sstevel@tonic-gate continue;
335*7c478bd9Sstevel@tonic-gate return (0);
336*7c478bd9Sstevel@tonic-gate
337*7c478bd9Sstevel@tonic-gate case CDOT:
338*7c478bd9Sstevel@tonic-gate if (*lp++)
339*7c478bd9Sstevel@tonic-gate continue;
340*7c478bd9Sstevel@tonic-gate return (0);
341*7c478bd9Sstevel@tonic-gate
342*7c478bd9Sstevel@tonic-gate case CDOL:
343*7c478bd9Sstevel@tonic-gate if (*lp == '\0')
344*7c478bd9Sstevel@tonic-gate continue;
345*7c478bd9Sstevel@tonic-gate return (0);
346*7c478bd9Sstevel@tonic-gate
347*7c478bd9Sstevel@tonic-gate case CEOF:
348*7c478bd9Sstevel@tonic-gate return (1);
349*7c478bd9Sstevel@tonic-gate
350*7c478bd9Sstevel@tonic-gate case CCL:
351*7c478bd9Sstevel@tonic-gate if (cclass(ep, *lp++, 1)) {
352*7c478bd9Sstevel@tonic-gate ep += *ep;
353*7c478bd9Sstevel@tonic-gate continue;
354*7c478bd9Sstevel@tonic-gate }
355*7c478bd9Sstevel@tonic-gate return (0);
356*7c478bd9Sstevel@tonic-gate
357*7c478bd9Sstevel@tonic-gate case NCCL:
358*7c478bd9Sstevel@tonic-gate if (cclass(ep, *lp++, 0)) {
359*7c478bd9Sstevel@tonic-gate ep += *ep;
360*7c478bd9Sstevel@tonic-gate continue;
361*7c478bd9Sstevel@tonic-gate }
362*7c478bd9Sstevel@tonic-gate return (0);
363*7c478bd9Sstevel@tonic-gate
364*7c478bd9Sstevel@tonic-gate case CBRA:
365*7c478bd9Sstevel@tonic-gate braslist[*ep++] = lp;
366*7c478bd9Sstevel@tonic-gate continue;
367*7c478bd9Sstevel@tonic-gate
368*7c478bd9Sstevel@tonic-gate case CKET:
369*7c478bd9Sstevel@tonic-gate braelist[*ep++] = lp;
370*7c478bd9Sstevel@tonic-gate continue;
371*7c478bd9Sstevel@tonic-gate
372*7c478bd9Sstevel@tonic-gate case CBACK:
373*7c478bd9Sstevel@tonic-gate if (braelist[i = *ep++] == 0)
374*7c478bd9Sstevel@tonic-gate return (-1);
375*7c478bd9Sstevel@tonic-gate if (backref(i, lp)) {
376*7c478bd9Sstevel@tonic-gate lp += braelist[i] - braslist[i];
377*7c478bd9Sstevel@tonic-gate continue;
378*7c478bd9Sstevel@tonic-gate }
379*7c478bd9Sstevel@tonic-gate return (0);
380*7c478bd9Sstevel@tonic-gate
381*7c478bd9Sstevel@tonic-gate case CBACK|CSTAR:
382*7c478bd9Sstevel@tonic-gate if (braelist[i = *ep++] == 0)
383*7c478bd9Sstevel@tonic-gate return (-1);
384*7c478bd9Sstevel@tonic-gate curlp = lp;
385*7c478bd9Sstevel@tonic-gate ct = braelist[i] - braslist[i];
386*7c478bd9Sstevel@tonic-gate while (backref(i, lp))
387*7c478bd9Sstevel@tonic-gate lp += ct;
388*7c478bd9Sstevel@tonic-gate while (lp >= curlp) {
389*7c478bd9Sstevel@tonic-gate if (rv = advance(lp, ep))
390*7c478bd9Sstevel@tonic-gate return (rv);
391*7c478bd9Sstevel@tonic-gate lp -= ct;
392*7c478bd9Sstevel@tonic-gate }
393*7c478bd9Sstevel@tonic-gate continue;
394*7c478bd9Sstevel@tonic-gate
395*7c478bd9Sstevel@tonic-gate case CDOT|CSTAR:
396*7c478bd9Sstevel@tonic-gate curlp = lp;
397*7c478bd9Sstevel@tonic-gate while (*lp++)
398*7c478bd9Sstevel@tonic-gate ;
399*7c478bd9Sstevel@tonic-gate goto star;
400*7c478bd9Sstevel@tonic-gate
401*7c478bd9Sstevel@tonic-gate case CCHR|CSTAR:
402*7c478bd9Sstevel@tonic-gate curlp = lp;
403*7c478bd9Sstevel@tonic-gate while (*lp++ == *ep)
404*7c478bd9Sstevel@tonic-gate ;
405*7c478bd9Sstevel@tonic-gate ep++;
406*7c478bd9Sstevel@tonic-gate goto star;
407*7c478bd9Sstevel@tonic-gate
408*7c478bd9Sstevel@tonic-gate case CCL|CSTAR:
409*7c478bd9Sstevel@tonic-gate case NCCL|CSTAR:
410*7c478bd9Sstevel@tonic-gate curlp = lp;
411*7c478bd9Sstevel@tonic-gate while (cclass(ep, *lp++, ep[-1] == (CCL|CSTAR)))
412*7c478bd9Sstevel@tonic-gate ;
413*7c478bd9Sstevel@tonic-gate ep += *ep;
414*7c478bd9Sstevel@tonic-gate goto star;
415*7c478bd9Sstevel@tonic-gate
416*7c478bd9Sstevel@tonic-gate star:
417*7c478bd9Sstevel@tonic-gate do {
418*7c478bd9Sstevel@tonic-gate lp--;
419*7c478bd9Sstevel@tonic-gate if (rv = advance(lp, ep))
420*7c478bd9Sstevel@tonic-gate return (rv);
421*7c478bd9Sstevel@tonic-gate } while (lp > curlp);
422*7c478bd9Sstevel@tonic-gate return (0);
423*7c478bd9Sstevel@tonic-gate
424*7c478bd9Sstevel@tonic-gate default:
425*7c478bd9Sstevel@tonic-gate return (-1);
426*7c478bd9Sstevel@tonic-gate }
427*7c478bd9Sstevel@tonic-gate }
428*7c478bd9Sstevel@tonic-gate
429*7c478bd9Sstevel@tonic-gate static int
backref(int i,char * lp)430*7c478bd9Sstevel@tonic-gate backref(int i, char *lp)
431*7c478bd9Sstevel@tonic-gate {
432*7c478bd9Sstevel@tonic-gate char *bp;
433*7c478bd9Sstevel@tonic-gate struct re_globals *_re = re_globals;
434*7c478bd9Sstevel@tonic-gate
435*7c478bd9Sstevel@tonic-gate bp = braslist[i];
436*7c478bd9Sstevel@tonic-gate while (*bp++ == *lp++)
437*7c478bd9Sstevel@tonic-gate if (bp >= braelist[i])
438*7c478bd9Sstevel@tonic-gate return (1);
439*7c478bd9Sstevel@tonic-gate return (0);
440*7c478bd9Sstevel@tonic-gate }
441*7c478bd9Sstevel@tonic-gate
442*7c478bd9Sstevel@tonic-gate static int
cclass(char * set,char c,int af)443*7c478bd9Sstevel@tonic-gate cclass(char *set, char c, int af)
444*7c478bd9Sstevel@tonic-gate {
445*7c478bd9Sstevel@tonic-gate int n;
446*7c478bd9Sstevel@tonic-gate
447*7c478bd9Sstevel@tonic-gate if (c == 0)
448*7c478bd9Sstevel@tonic-gate return (0);
449*7c478bd9Sstevel@tonic-gate n = *set++;
450*7c478bd9Sstevel@tonic-gate while (--n)
451*7c478bd9Sstevel@tonic-gate if (*set++ == c)
452*7c478bd9Sstevel@tonic-gate return (af);
453*7c478bd9Sstevel@tonic-gate return (! af);
454*7c478bd9Sstevel@tonic-gate }
455