xref: /illumos-gate/usr/src/contrib/ast/src/cmd/ksh93/include/lexstates.h (revision c7b656fc7125adc5888ce934f1a3433da4b1bbc5)
1b30d1939SAndy Fiddaman /***********************************************************************
2b30d1939SAndy Fiddaman *                                                                      *
3b30d1939SAndy Fiddaman *               This software is part of the ast package               *
4b30d1939SAndy Fiddaman *          Copyright (c) 1982-2011 AT&T Intellectual Property          *
5b30d1939SAndy Fiddaman *                      and is licensed under the                       *
6b30d1939SAndy Fiddaman *                 Eclipse Public License, Version 1.0                  *
7b30d1939SAndy Fiddaman *                    by AT&T Intellectual Property                     *
8b30d1939SAndy Fiddaman *                                                                      *
9b30d1939SAndy Fiddaman *                A copy of the License is available at                 *
10b30d1939SAndy Fiddaman *          http://www.eclipse.org/org/documents/epl-v10.html           *
11b30d1939SAndy Fiddaman *         (with md5 checksum b35adb5213ca9657e911e9befb180842)         *
12b30d1939SAndy Fiddaman *                                                                      *
13b30d1939SAndy Fiddaman *              Information and Software Systems Research               *
14b30d1939SAndy Fiddaman *                            AT&T Research                             *
15b30d1939SAndy Fiddaman *                           Florham Park NJ                            *
16b30d1939SAndy Fiddaman *                                                                      *
17b30d1939SAndy Fiddaman *                  David Korn <dgk@research.att.com>                   *
18b30d1939SAndy Fiddaman *                                                                      *
19b30d1939SAndy Fiddaman ***********************************************************************/
20b30d1939SAndy Fiddaman #pragma prototyped
21b30d1939SAndy Fiddaman #ifndef S_BREAK
22b30d1939SAndy Fiddaman #define S_BREAK	1	/* end of token */
23b30d1939SAndy Fiddaman #define S_EOF	2	/* end of buffer */
24b30d1939SAndy Fiddaman #define S_NL	3	/* new-line when not a token */
25b30d1939SAndy Fiddaman #define S_RES	4	/* first character of reserved word */
26b30d1939SAndy Fiddaman #define S_NAME	5	/* other identifier characters */
27b30d1939SAndy Fiddaman #define S_REG	6	/* non-special characters */
28b30d1939SAndy Fiddaman #define S_TILDE	7	/* first char is tilde */
29b30d1939SAndy Fiddaman #define S_PUSH	8
30b30d1939SAndy Fiddaman #define S_POP	9
31b30d1939SAndy Fiddaman #define S_BRACT	10
32b30d1939SAndy Fiddaman #define S_LIT	11	/* literal quote character */
33b30d1939SAndy Fiddaman #define S_NLTOK	12	/* new-line token */
34b30d1939SAndy Fiddaman #define S_OP	13	/* operator character */
35b30d1939SAndy Fiddaman #define S_PAT	14	/* pattern characters * and ? */
36b30d1939SAndy Fiddaman #define S_EPAT	15	/* pattern char when followed by ( */
37b30d1939SAndy Fiddaman #define S_EQ	16	/* assignment character */
38b30d1939SAndy Fiddaman #define S_COM	17	/* comment character */
39b30d1939SAndy Fiddaman #define S_MOD1	18	/* ${...} modifier character - old quoting */
40b30d1939SAndy Fiddaman #define S_MOD2	19	/* ${...} modifier character - new quoting */
41b30d1939SAndy Fiddaman #define S_ERR	20	/* invalid character in ${...} */
42b30d1939SAndy Fiddaman #define S_SPC1	21	/* special prefix characters after $ */
43b30d1939SAndy Fiddaman #define S_SPC2	22	/* special characters after $ */
44b30d1939SAndy Fiddaman #define S_DIG	23	/* digit character after $*/
45b30d1939SAndy Fiddaman #define S_ALP	24	/* alpahbetic character after $ */
46b30d1939SAndy Fiddaman #define S_LBRA	25	/* left brace after $ */
47b30d1939SAndy Fiddaman #define S_RBRA	26	/* right brace after $ */
48b30d1939SAndy Fiddaman #define S_PAR	27	/* set for $( */
49b30d1939SAndy Fiddaman #define S_ENDCH	28	/* macro expansion terminator */
50b30d1939SAndy Fiddaman #define S_SLASH	29	/* / character terminates ~ expansion  */
51b30d1939SAndy Fiddaman #define S_COLON	30	/* for character : */
52b30d1939SAndy Fiddaman #define S_LABEL	31	/* for goto label */
53b30d1939SAndy Fiddaman #define S_EDOL	32	/* ends $identifier */
54b30d1939SAndy Fiddaman #define S_BRACE	33	/* left brace */
55b30d1939SAndy Fiddaman #define S_DOT	34	/* . char */
56b30d1939SAndy Fiddaman #define S_META	35	/* | & ; < > inside ${...} reserved for future use */
57b30d1939SAndy Fiddaman #define S_SPACE	S_BREAK	/* IFS space characters */
58b30d1939SAndy Fiddaman #define S_DELIM	S_RES	/* IFS delimter characters */
59b30d1939SAndy Fiddaman #define S_MBYTE S_NAME	/* IFS first byte of multi-byte char */
60b30d1939SAndy Fiddaman #define S_BLNK	36	/* space or tab */
61b30d1939SAndy Fiddaman /* The following must be the highest numbered states */
62b30d1939SAndy Fiddaman #define S_QUOTE	37	/* double quote character */
63b30d1939SAndy Fiddaman #define S_GRAVE	38	/* old comsub character */
64b30d1939SAndy Fiddaman #define S_ESC	39	/* escape character */
65b30d1939SAndy Fiddaman #define S_DOL	40	/* $ subsitution character */
66b30d1939SAndy Fiddaman #define S_ESC2	41	/* escape character inside '...' */
67b30d1939SAndy Fiddaman 
68b30d1939SAndy Fiddaman /* These are the lexical state table names */
69b30d1939SAndy Fiddaman #define ST_BEGIN	0
70b30d1939SAndy Fiddaman #define ST_NAME		1
71b30d1939SAndy Fiddaman #define ST_NORM		2
72b30d1939SAndy Fiddaman #define ST_LIT		3
73b30d1939SAndy Fiddaman #define ST_QUOTE	4
74b30d1939SAndy Fiddaman #define ST_NESTED	5
75b30d1939SAndy Fiddaman #define ST_DOL		6
76b30d1939SAndy Fiddaman #define ST_BRACE	7
77b30d1939SAndy Fiddaman #define ST_DOLNAME	8
78b30d1939SAndy Fiddaman #define ST_MACRO	9
79b30d1939SAndy Fiddaman #define ST_QNEST	10
80b30d1939SAndy Fiddaman #define ST_NONE		11
81b30d1939SAndy Fiddaman 
82b30d1939SAndy Fiddaman #include "FEATURE/locale"
83b30d1939SAndy Fiddaman 
84b30d1939SAndy Fiddaman #if _hdr_wchar
85b30d1939SAndy Fiddaman #   include <wchar.h>
86b30d1939SAndy Fiddaman #   if _hdr_wctype
87b30d1939SAndy Fiddaman #       include <wctype.h>
88b30d1939SAndy Fiddaman #       undef  isalpha
89b30d1939SAndy Fiddaman #       define isalpha(x)      iswalpha(x)
90b30d1939SAndy Fiddaman #       if defined(iswblank) || _lib_iswblank
91b30d1939SAndy Fiddaman #           undef  isblank
92b30d1939SAndy Fiddaman #           define isblank(x)      iswblank(x)
93b30d1939SAndy Fiddaman #       else
94b30d1939SAndy Fiddaman #           if _lib_wctype && _lib_iswctype
95b30d1939SAndy Fiddaman #               define _lib_iswblank	-1
96b30d1939SAndy Fiddaman #               undef  isblank
97b30d1939SAndy Fiddaman #	        define isblank(x)	local_iswblank(x)
98b30d1939SAndy Fiddaman 	        extern int		local_iswblank(wchar_t);
99b30d1939SAndy Fiddaman #           endif
100b30d1939SAndy Fiddaman #       endif
101b30d1939SAndy Fiddaman #   endif
102b30d1939SAndy Fiddaman #endif
103b30d1939SAndy Fiddaman #ifndef isblank
104b30d1939SAndy Fiddaman #   define isblank(x)      ((x)==' '||(x)=='\t')
105b30d1939SAndy Fiddaman #endif
106b30d1939SAndy Fiddaman 
107b30d1939SAndy Fiddaman #undef LEN
108b30d1939SAndy Fiddaman #if SHOPT_MULTIBYTE
109b30d1939SAndy Fiddaman #   define LEN		_Fcin.fclen
110b30d1939SAndy Fiddaman #   define isaname(c)	((c)>0x7f?isalpha(c): sh_lexstates[ST_NAME][(c)]==0)
111b30d1939SAndy Fiddaman #   define isaletter(c)	((c)>0x7f?isalpha(c): sh_lexstates[ST_DOL][(c)]==S_ALP && (c)!='.')
112b30d1939SAndy Fiddaman #else
113b30d1939SAndy Fiddaman #   undef mbwide
114b30d1939SAndy Fiddaman #   define mbwide()	(0)
115b30d1939SAndy Fiddaman #   define LEN		1
116b30d1939SAndy Fiddaman #   define isaname(c)	(sh_lexstates[ST_NAME][c]==0)
117b30d1939SAndy Fiddaman #   define isaletter(c)	(sh_lexstates[ST_DOL][c]==S_ALP && (c)!='.')
118b30d1939SAndy Fiddaman #endif
119b30d1939SAndy Fiddaman #define STATE(s,c)	(s[mbwide()?((c=fcmbget(&LEN)),LEN>1?'a':c):(c=fcget())])
120b30d1939SAndy Fiddaman #define isadigit(c)	(sh_lexstates[ST_DOL][c]==S_DIG)
121b30d1939SAndy Fiddaman #define isastchar(c)	((c)=='@' || (c)=='*')
122b30d1939SAndy Fiddaman #define isexp(c)	(sh_lexstates[ST_MACRO][c]==S_PAT||(c)=='$'||(c)=='`')
123b30d1939SAndy Fiddaman #define ismeta(c)	(sh_lexstates[ST_NAME][c]==S_BREAK)
124b30d1939SAndy Fiddaman 
125b30d1939SAndy Fiddaman extern char *sh_lexstates[ST_NONE];
126b30d1939SAndy Fiddaman extern const char *sh_lexrstates[ST_NONE];
127b30d1939SAndy Fiddaman extern const char e_lexversion[];
128b30d1939SAndy Fiddaman extern const char e_lexspace[];
129b30d1939SAndy Fiddaman extern const char e_lexslash[];
130b30d1939SAndy Fiddaman extern const char e_lexlabignore[];
131b30d1939SAndy Fiddaman extern const char e_lexlabunknown[];
132b30d1939SAndy Fiddaman extern const char e_lexsyntax1[];
133b30d1939SAndy Fiddaman extern const char e_lexsyntax2[];
134b30d1939SAndy Fiddaman extern const char e_lexsyntax3[];
135b30d1939SAndy Fiddaman extern const char e_lexsyntax4[];
136b30d1939SAndy Fiddaman extern const char e_lexsyntax5[];
137b30d1939SAndy Fiddaman extern const char e_lexwarnvar[];
138b30d1939SAndy Fiddaman extern const char e_lexobsolete1[];
139b30d1939SAndy Fiddaman extern const char e_lexobsolete2[];
140b30d1939SAndy Fiddaman extern const char e_lexobsolete3[];
141b30d1939SAndy Fiddaman extern const char e_lexobsolete4[];
142*c7b656fcSAndy Fiddaman extern const char e_lexobsolete4b[];
143b30d1939SAndy Fiddaman extern const char e_lexobsolete5[];
144b30d1939SAndy Fiddaman extern const char e_lexobsolete6[];
145b30d1939SAndy Fiddaman extern const char e_lexnonstandard[];
146b30d1939SAndy Fiddaman extern const char e_lexusebrace[];
147b30d1939SAndy Fiddaman extern const char e_lexusequote[];
148b30d1939SAndy Fiddaman extern const char e_lexescape[];
149b30d1939SAndy Fiddaman extern const char e_lexquote[];
150b30d1939SAndy Fiddaman extern const char e_lexnested[];
151b30d1939SAndy Fiddaman extern const char e_lexbadchar[];
152b30d1939SAndy Fiddaman extern const char e_lexlongquote[];
153b30d1939SAndy Fiddaman extern const char e_lexfuture[];
154b30d1939SAndy Fiddaman extern const char e_lexzerobyte[];
155b30d1939SAndy Fiddaman extern const char e_lexemptyfor[];
156b30d1939SAndy Fiddaman extern const char e_lextypeset[];
157b30d1939SAndy Fiddaman extern const char e_lexcharclass[];
158b30d1939SAndy Fiddaman #endif
159