1 /* $Header: /src/pub/tcsh/sh.char.h,v 3.18 2001/03/18 19:06:29 christos Exp $ */ 2 /* 3 * sh.char.h: Table for spotting special characters quickly 4 * Makes for very obscure but efficient coding. 5 */ 6 /*- 7 * Copyright (c) 1980, 1991 The Regents of the University of California. 8 * All rights reserved. 9 * 10 * Redistribution and use in source and binary forms, with or without 11 * modification, are permitted provided that the following conditions 12 * are met: 13 * 1. Redistributions of source code must retain the above copyright 14 * notice, this list of conditions and the following disclaimer. 15 * 2. Redistributions in binary form must reproduce the above copyright 16 * notice, this list of conditions and the following disclaimer in the 17 * documentation and/or other materials provided with the distribution. 18 * 3. All advertising materials mentioning features or use of this software 19 * must display the following acknowledgement: 20 * This product includes software developed by the University of 21 * California, Berkeley and its contributors. 22 * 4. Neither the name of the University nor the names of its contributors 23 * may be used to endorse or promote products derived from this software 24 * without specific prior written permission. 25 * 26 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 27 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 28 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 29 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 30 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 31 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 32 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 33 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 34 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 35 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 36 * SUCH DAMAGE. 37 */ 38 #ifndef _h_sh_char 39 #define _h_sh_char 40 #if defined(NeXT) && defined(NLS) 41 # include <appkit/NXCType.h> 42 #else 43 # include <ctype.h> 44 #endif 45 46 typedef unsigned char tcshuc; 47 #ifdef _MINIX 48 # undef _SP 49 #endif /* _MINIX */ 50 extern unsigned short _cmap[]; 51 #if defined(DSPMBYTE) 52 extern unsigned short _mbmap[]; 53 # define CHECK_MBYTEVAR STRdspmbyte 54 #endif 55 extern unsigned short _cmap_c[]; 56 extern unsigned short _cmap_mbyte[]; 57 extern short _enable_mbdisp; 58 extern unsigned short _mbmap[]; 59 extern unsigned short _mbmap_euc[]; 60 extern unsigned short _mbmap_sjis[]; 61 extern unsigned short _mbmap_big5[]; 62 /* VARIABLE Check str */ 63 /* same compiler require #define even not define DSPMBYTE */ 64 #define _MB1 0x0001 65 #define _MB2 0x0002 66 67 #ifndef NLS 68 extern tcshuc _cmap_lower[], _cmap_upper[]; 69 70 #endif 71 72 #define _QF 0x0001 /* '" (Forward quotes) */ 73 #define _QB 0x0002 /* ` (Backquote) */ 74 #define _SP 0x0004 /* space and tab */ 75 #define _NL 0x0008 /* \n */ 76 #define _META 0x0010 /* lex meta characters, sp #'`";&<>()|\t\n */ 77 #define _GLOB 0x0020 /* glob characters, *?{[` */ 78 #define _ESC 0x0040 /* \ */ 79 #define _DOL 0x0080 /* $ */ 80 #define _DIG 0x0100 /* 0-9 */ 81 #define _LET 0x0200 /* a-z, A-Z, _ */ 82 #define _UP 0x0400 /* A-Z */ 83 #define _DOW 0x0800 /* a-z */ 84 #define _XD 0x1000 /* 0-9, a-f, A-F */ 85 #define _CMD 0x2000 /* lex end of command chars, ;&(|` */ 86 #define _CTR 0x4000 /* control */ 87 #define _PUN 0x8000 /* punctuation */ 88 89 #if defined(SHORT_STRINGS) && defined(KANJI) 90 # define ASC(ch) ch 91 # define CTL_ESC(ch) ch 92 # define cmap(c, bits) \ 93 ((((c) & QUOTE) || ((c & 0x80) && adrof(STRnokanji))) ? \ 94 0 : (_cmap[(tcshuc)(c)] & (bits))) 95 #else /* SHORT_STRINGS && KANJI */ 96 # ifdef IS_ASCII 97 # define ASC(ch) ch 98 # define CTL_ESC(ch) ch 99 # define cmap(c, bits) \ 100 (((c) & QUOTE) ? 0 : (_cmap[(tcshuc)(c)] & (bits))) 101 # else /* IS_ASCII */ 102 /* "BS2000 OSD" is a POSIX on a main frame using a EBCDIC char set */ 103 /* "OS/390 USS" is a POSIX on a main frame using an IBM1047 char set */ 104 extern unsigned short _toascii[256]; 105 extern unsigned short _toebcdic[256]; 106 107 /* mainly for comparisons if (ASC(ch)=='\177')... */ 108 # define ASC(ch) _toascii[(tcshuc)ch] 109 110 /* Literal escapes ('\010') must be mapped to EBCDIC, 111 * for C-Escapes ('\b'), the compiler already does it. 112 */ 113 # define CTL_ESC(ch) _toebcdic[(tcshuc)ch] 114 115 # define cmap(c, bits) \ 116 (((c) & QUOTE) ? 0 : (_cmap[_toascii[(tcshuc)(c)]] & (bits))) 117 # endif /* IS_ASCII */ 118 #endif /* SHORT_STRINGS && KANJI */ 119 120 #define isglob(c) cmap(c, _GLOB) 121 #define isspc(c) cmap(c, _SP) 122 #define ismeta(c) cmap(c, _META) 123 #define iscmdmeta(c) cmap(c, _CMD) 124 #define letter(c) (((Char)(c) & QUOTE) ? 0 : \ 125 (isalpha((tcshuc) (c)) || (c) == '_')) 126 #define alnum(c) (((Char)(c) & QUOTE) ? 0 : \ 127 (isalnum((tcshuc) (c)) || (c) == '_')) 128 129 #if defined(DSPMBYTE) 130 # define IsmbyteU(c) (Ismbyte1((Char)(c))||(Ismbyte2((Char)(c))&&((c)&0200))) 131 #endif 132 133 #ifdef NLS 134 # ifdef NeXT 135 # define Isspace(c) (((Char)(c) & QUOTE) ? 0 : NXIsSpace((unsigned) (c))) 136 # define Isdigit(c) (((Char)(c) & QUOTE) ? 0 : NXIsDigit((unsigned) (c))) 137 # define Isalpha(c) (((Char)(c) & QUOTE) ? 0 : NXIsAlpha((unsigned) (c))) 138 # define Islower(c) (((Char)(c) & QUOTE) ? 0 : NXIsLower((unsigned) (c))) 139 # define Isupper(c) (((Char)(c) & QUOTE) ? 0 : NXIsUpper((unsigned) (c))) 140 # define Tolower(c) (((Char)(c) & QUOTE) ? 0 : NXToLower((unsigned) (c))) 141 # define Toupper(c) (((Char)(c) & QUOTE) ? 0 : NXToUpper((unsigned) (c))) 142 # define Isxdigit(c) (((Char)(c) & QUOTE) ? 0 : NXIsXDigit((unsigned) (c))) 143 #if defined(DSPMBYTE) 144 # define IscntrlM(c) (((Char)(c) & QUOTE) ? 0 : NXIsCntrl((unsigned) (c))) 145 # define Iscntrl(c) ( (IscntrlM(c)) && !(_enable_mbdisp&&(IsmbyteU((c)))) ) 146 # define IsprintM(c) (((Char)(c) & QUOTE) ? 0 : NXIsPrint((unsigned) (c))) 147 # define Isprint(c) ( (IsprintM(c)) || (_enable_mbdisp&&(IsmbyteU((c)))) ) 148 #else 149 # define Isalnum(c) (((Char)(c) & QUOTE) ? 0 : NXIsAlNum((unsigned) (c))) 150 # define Iscntrl(c) (((Char)(c) & QUOTE) ? 0 : NXIsCntrl((unsigned) (c))) 151 # define Isprint(c) (((Char)(c) & QUOTE) ? 0 : NXIsPrint((unsigned) (c))) 152 #endif /* !defined(DSPMBYTE) */ 153 # define Ispunct(c) (((Char)(c) & QUOTE) ? 0 : NXIsPunct((unsigned) (c))) 154 # else /* !NeXT */ 155 # ifndef WINNT_NATIVE 156 # define Isspace(c) (((Char)(c) & QUOTE) ? 0 : isspace((tcshuc) (c))) 157 # define Isdigit(c) (((Char)(c) & QUOTE) ? 0 : isdigit((tcshuc) (c))) 158 # define Isalpha(c) (((Char)(c) & QUOTE) ? 0 : isalpha((tcshuc) (c))) 159 # define Islower(c) (((Char)(c) & QUOTE) ? 0 : islower((tcshuc) (c))) 160 # define Isupper(c) (((Char)(c) & QUOTE) ? 0 : isupper((tcshuc) (c))) 161 # define Tolower(c) (((Char)(c) & QUOTE) ? 0 : tolower((tcshuc) (c))) 162 # define Toupper(c) (((Char)(c) & QUOTE) ? 0 : toupper((tcshuc) (c))) 163 # define Isxdigit(c) (((Char)(c) & QUOTE) ? 0 : isxdigit((tcshuc) (c))) 164 # define Isalnum(c) (((Char)(c) & QUOTE) ? 0 : isalnum((tcshuc) (c))) 165 #if defined(DSPMBYTE) 166 # define IscntrlM(c) (((Char)(c) & QUOTE) ? 0 : iscntrl((tcshuc) (c))) 167 # define Iscntrl(c) ( (IscntrlM(c)) && !(_enable_mbdisp&&(IsmbyteU((c)))) ) 168 #else 169 # define Iscntrl(c) (((Char)(c) & QUOTE) ? 0 : iscntrl((tcshuc) (c))) 170 #endif /* !defined(DSPMBYTE) */ 171 # if SOLARIS2 == 24 172 /* 173 * From <casper@fwi.uva.nl> Casper Dik: 174 * In Solaris 2.4, isprint('\t') returns true after setlocal(LC_ALL,""). 175 * This breaks commandline editing when you include tabs. 176 * (This is in the en_US locale). 177 */ 178 #if defined(DSPMBYTE) 179 # define IsprintM(c) (((Char)(c) & QUOTE) ? 0 : \ 180 (isprint((tcshuc) (c)) && (c) != '\t')) 181 #else 182 # define Isprint(c) (((Char)(c) & QUOTE) ? 0 : \ 183 (isprint((tcshuc) (c)) && (c) != '\t')) 184 #endif /* !defined(DSPMBYTE) */ 185 # else 186 #if defined(DSPMBYTE) 187 # define IsprintM(c) (((Char)(c) & QUOTE) ? 0 : isprint((tcshuc) (c))) 188 #else 189 # define Isprint(c) (((Char)(c) & QUOTE) ? 0 : isprint((tcshuc) (c))) 190 #endif /* !defined(DSPMBYTE) */ 191 # endif /* SOLARIS2 == 24 */ 192 #if defined(DSPMBYTE) 193 # define Isprint(c) ( (IsprintM(c)) || (_enable_mbdisp&&(IsmbyteU((c)))) ) 194 #endif /* !defined(DSPMBYTE) */ 195 # define Ispunct(c) (((Char)(c) & QUOTE) ? 0 : ispunct((tcshuc) (c))) 196 # else /* WINNT_NATIVE */ 197 # define Isspace(c) (((Char)(c) & QUOTE) ? 0 : isspace( oem_it((tcshuc)(c)))) 198 # define Isdigit(c) (((Char)(c) & QUOTE) ? 0 : isdigit( oem_it((tcshuc)(c)))) 199 # define Isalpha(c) (((Char)(c) & QUOTE) ? 0 : isalpha( oem_it((tcshuc)(c)))) 200 # define Islower(c) (((Char)(c) & QUOTE) ? 0 : islower( oem_it((tcshuc)(c)))) 201 # define Isupper(c) (((Char)(c) & QUOTE) ? 0 : isupper( oem_it((tcshuc)(c)))) 202 # define Tolower(c) (((Char)(c) & QUOTE) ? 0 : tolower( oem_it((tcshuc)(c)))) 203 # define Toupper(c) (((Char)(c) & QUOTE) ? 0 : toupper( oem_it((tcshuc)(c)))) 204 # define Isxdigit(c)(((Char)(c) & QUOTE) ? 0 : isxdigit(oem_it((tcshuc)(c)))) 205 # define Isalnum(c) (((Char)(c) & QUOTE) ? 0 : isalnum( oem_it((tcshuc)(c)))) 206 # define Ispunct(c) (((Char)(c) & QUOTE) ? 0 : ispunct( oem_it((tcshuc)(c)))) 207 #if defined(DSPMBYTE) 208 # define IscntrlM(c) (((Char)(c) & QUOTE) ? 0 : iscntrl( oem_it((tcshuc)(c)))) 209 # define Iscntrl(c) ( (IscntrlM(c)) && !(_enable_mbdisp&&(IsmbyteU((c)))) ) 210 # define IsprintM(c) (((Char)(c) & QUOTE) ? 0 : isprint( oem_it((tcshuc)(c)))) 211 # define Isprint(c) ( (IsprintM(c)) || (_enable_mbdisp&&(IsmbyteU((c)))) ) 212 #else 213 # define Iscntrl(c) (((Char)(c) & QUOTE) ? 0 : iscntrl( oem_it((tcshuc)(c)))) 214 # define Isprint(c) (((Char)(c) & QUOTE) ? 0 : isprint( oem_it((tcshuc)(c)))) 215 #endif /* !defined(DSPMBYTE) */ 216 # endif /* WINNT_NATIVE */ 217 # endif /* !NeXT */ 218 #else /* !NLS */ 219 # define Isspace(c) cmap(c, _SP|_NL) 220 # define Isdigit(c) cmap(c, _DIG) 221 # define Isalpha(c) (cmap(c,_LET) && !(((c) & META) && AsciiOnly)) 222 # define Islower(c) (cmap(c,_DOW) && !(((c) & META) && AsciiOnly)) 223 # define Isupper(c) (cmap(c, _UP) && !(((c) & META) && AsciiOnly)) 224 # ifdef IS_ASCII 225 # define Tolower(c) (_cmap_lower[(tcshuc)(c)]) 226 # define Toupper(c) (_cmap_upper[(tcshuc)(c)]) 227 # else 228 /* "BS2000 OSD" is a POSIX on a main frame using a EBCDIC char set */ 229 # define Tolower(c) (_cmap_lower[_toascii[(tcshuc)(c)]]) 230 # define Toupper(c) (_cmap_upper[_toascii[(tcshuc)(c)]]) 231 # endif 232 # define Isxdigit(c) cmap(c, _XD) 233 # define Isalnum(c) (cmap(c, _DIG|_LET) && !(((Char)(c) & META) && AsciiOnly)) 234 #if defined(DSPMBYTE) 235 # define IscntrlM(c) (cmap(c,_CTR) && !(((c) & META) && AsciiOnly)) 236 # define Iscntrl(c) ( (IscntrlM(c)) && !(_enable_mbdisp&&(IsmbyteU((c)))) ) 237 # define IsprintM(c) (!cmap(c,_CTR) && !(((c) & META) && AsciiOnly)) 238 # define Isprint(c) ( (IsprintM(c)) || (_enable_mbdisp&&(IsmbyteU((c)))) ) 239 #else 240 # define Iscntrl(c) (cmap(c,_CTR) && !(((c) & META) && AsciiOnly)) 241 # define Isprint(c) (!cmap(c,_CTR) && !(((c) & META) && AsciiOnly)) 242 #endif /* !defined(DSPMBYTE) */ 243 # define Ispunct(c) (cmap(c,_PUN) && !(((c) & META) && AsciiOnly)) 244 245 #endif /* !NLS */ 246 247 #if defined(DSPMBYTE) 248 # define Ismbyte1(c) ((_mbmap[(c) & 0377] & _MB1) ? 1 : 0) 249 # define Ismbyte2(c) ((_mbmap[(c) & 0377] & _MB2) ? 1 : 0) 250 #endif 251 252 #endif /* _h_sh_char */ 253