xref: /illumos-gate/usr/src/lib/libc/port/locale/table.c (revision 94ddd0900a8838f62bba15e270649a42f4ef9f81)
1 /*
2  * Copyright 2013 Garrett D'Amore <garrett@damore.org>
3  * Copyright 2017 Nexenta Systems, Inc.
4  * Copyright (c) 1993
5  *	The Regents of the University of California.  All rights reserved.
6  *
7  * This code is derived from software contributed to Berkeley by
8  * Paul Borman at Krystal Technologies.
9  *
10  * Redistribution and use in source and binary forms, with or without
11  * modification, are permitted provided that the following conditions
12  * are met:
13  * 1. Redistributions of source code must retain the above copyright
14  *    notice, this list of conditions and the following disclaimer.
15  * 2. Redistributions in binary form must reproduce the above copyright
16  *    notice, this list of conditions and the following disclaimer in the
17  *    documentation and/or other materials provided with the distribution.
18  * 4. Neither the name of the University nor the names of its contributors
19  *    may be used to endorse or promote products derived from this software
20  *    without specific prior written permission.
21  *
22  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
23  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
24  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
25  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
26  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
27  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
28  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
29  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
30  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
31  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
32  * SUCH DAMAGE.
33  */
34 
35 #include "lint.h"
36 #include <ctype.h>
37 #include <wchar.h>
38 #include "runetype.h"
39 #include "mblocal.h"
40 #include "_ctype.h"
41 
42 #define	_DEFRUNETYPE { \
43 	/* 00 */ \
44 	_CTYPE_C, \
45 	_CTYPE_C, \
46 	_CTYPE_C, \
47 	_CTYPE_C, \
48 	_CTYPE_C, \
49 	_CTYPE_C, \
50 	_CTYPE_C, \
51 	_CTYPE_C, \
52 	/* 08 */ \
53 	_CTYPE_C, \
54 	_CTYPE_C|_CTYPE_S|_CTYPE_B, \
55 	_CTYPE_C|_CTYPE_S, \
56 	_CTYPE_C|_CTYPE_S, \
57 	_CTYPE_C|_CTYPE_S, \
58 	_CTYPE_C|_CTYPE_S, \
59 	_CTYPE_C, \
60 	_CTYPE_C, \
61 	/* 10 */ \
62 	_CTYPE_C, \
63 	_CTYPE_C, \
64 	_CTYPE_C, \
65 	_CTYPE_C, \
66 	_CTYPE_C, \
67 	_CTYPE_C, \
68 	_CTYPE_C, \
69 	_CTYPE_C, \
70 	/* 18 */ \
71 	_CTYPE_C, \
72 	_CTYPE_C, \
73 	_CTYPE_C, \
74 	_CTYPE_C, \
75 	_CTYPE_C, \
76 	_CTYPE_C, \
77 	_CTYPE_C, \
78 	_CTYPE_C, \
79 	/* 20 */ \
80 	_CTYPE_S|_CTYPE_B|_CTYPE_R, \
81 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
82 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
83 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
84 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
85 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
86 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
87 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
88 	/* 28 */ \
89 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
90 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
91 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
92 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
93 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
94 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
95 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
96 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
97 	/* 30 */ \
98 	_CTYPE_D|_CTYPE_R|_CTYPE_G|_CTYPE_X, \
99 	_CTYPE_D|_CTYPE_R|_CTYPE_G|_CTYPE_X, \
100 	_CTYPE_D|_CTYPE_R|_CTYPE_G|_CTYPE_X, \
101 	_CTYPE_D|_CTYPE_R|_CTYPE_G|_CTYPE_X, \
102 	_CTYPE_D|_CTYPE_R|_CTYPE_G|_CTYPE_X, \
103 	_CTYPE_D|_CTYPE_R|_CTYPE_G|_CTYPE_X, \
104 	_CTYPE_D|_CTYPE_R|_CTYPE_G|_CTYPE_X, \
105 	_CTYPE_D|_CTYPE_R|_CTYPE_G|_CTYPE_X, \
106 	/* 38 */ \
107 	_CTYPE_D|_CTYPE_R|_CTYPE_G|_CTYPE_X, \
108 	_CTYPE_D|_CTYPE_R|_CTYPE_G|_CTYPE_X, \
109 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
110 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
111 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
112 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
113 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
114 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
115 	/* 40 */ \
116 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
117 	_CTYPE_U|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
118 	_CTYPE_U|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
119 	_CTYPE_U|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
120 	_CTYPE_U|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
121 	_CTYPE_U|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
122 	_CTYPE_U|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
123 	_CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
124 	/* 48 */ \
125 	_CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
126 	_CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
127 	_CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
128 	_CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
129 	_CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
130 	_CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
131 	_CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
132 	_CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
133 	/* 50 */ \
134 	_CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
135 	_CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
136 	_CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
137 	_CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
138 	_CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
139 	_CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
140 	_CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
141 	_CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
142 	/* 58 */ \
143 	_CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
144 	_CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
145 	_CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
146 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
147 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
148 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
149 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
150 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
151 	/* 60 */ \
152 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
153 	_CTYPE_L|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
154 	_CTYPE_L|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
155 	_CTYPE_L|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
156 	_CTYPE_L|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
157 	_CTYPE_L|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
158 	_CTYPE_L|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
159 	_CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
160 	/* 68 */ \
161 	_CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
162 	_CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
163 	_CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
164 	_CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
165 	_CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
166 	_CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
167 	_CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
168 	_CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
169 	/* 70 */ \
170 	_CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
171 	_CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
172 	_CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
173 	_CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
174 	_CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
175 	_CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
176 	_CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
177 	_CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
178 	/* 78 */ \
179 	_CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
180 	_CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
181 	_CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
182 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
183 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
184 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
185 	_CTYPE_P|_CTYPE_R|_CTYPE_G, \
186 	_CTYPE_C, \
187 }
188 
189 #define	_DEFMAPLOWER { \
190 	0x00,	0x01,	0x02,	0x03,	0x04,	0x05,	0x06,	0x07, \
191 	0x08,	0x09,	0x0a,	0x0b,	0x0c,	0x0d,	0x0e,	0x0f, \
192 	0x10,	0x11,	0x12,	0x13,	0x14,	0x15,	0x16,	0x17, \
193 	0x18,	0x19,	0x1a,	0x1b,	0x1c,	0x1d,	0x1e,	0x1f, \
194 	0x20,	0x21,	0x22,	0x23,	0x24,	0x25,	0x26,	0x27, \
195 	0x28,	0x29,	0x2a,	0x2b,	0x2c,	0x2d,	0x2e,	0x2f, \
196 	0x30,	0x31,	0x32,	0x33,	0x34,	0x35,	0x36,	0x37, \
197 	0x38,	0x39,	0x3a,	0x3b,	0x3c,	0x3d,	0x3e,	0x3f, \
198 	0x40,	'a',	'b',	'c',	'd',	'e',	'f',	'g', \
199 	'h',	'i',	'j',	'k',	'l',	'm',	'n',	'o', \
200 	'p',	'q',	'r',	's',	't',	'u',	'v',	'w', \
201 	'x',	'y',	'z',	0x5b,	0x5c,	0x5d,	0x5e,	0x5f, \
202 	0x60,	'a',	'b',	'c',	'd',	'e',	'f',	'g', \
203 	'h',	'i',	'j',	'k',	'l',	'm',	'n',	'o', \
204 	'p',	'q',	'r',	's',	't',	'u',	'v',	'w', \
205 	'x',	'y',	'z',	0x7b,	0x7c,	0x7d,	0x7e,	0x7f, \
206 	0x80,	0x81,	0x82,	0x83,	0x84,	0x85,	0x86,	0x87, \
207 	0x88,	0x89,	0x8a,	0x8b,	0x8c,	0x8d,	0x8e,	0x8f, \
208 	0x90,	0x91,	0x92,	0x93,	0x94,	0x95,	0x96,	0x97, \
209 	0x98,	0x99,	0x9a,	0x9b,	0x9c,	0x9d,	0x9e,	0x9f, \
210 	0xa0,	0xa1,	0xa2,	0xa3,	0xa4,	0xa5,	0xa6,	0xa7, \
211 	0xa8,	0xa9,	0xaa,	0xab,	0xac,	0xad,	0xae,	0xaf, \
212 	0xb0,	0xb1,	0xb2,	0xb3,	0xb4,	0xb5,	0xb6,	0xb7, \
213 	0xb8,	0xb9,	0xba,	0xbb,	0xbc,	0xbd,	0xbe,	0xbf, \
214 	0xc0,	0xc1,	0xc2,	0xc3,	0xc4,	0xc5,	0xc6,	0xc7, \
215 	0xc8,	0xc9,	0xca,	0xcb,	0xcc,	0xcd,	0xce,	0xcf, \
216 	0xd0,	0xd1,	0xd2,	0xd3,	0xd4,	0xd5,	0xd6,	0xd7, \
217 	0xd8,	0xd9,	0xda,	0xdb,	0xdc,	0xdd,	0xde,	0xdf, \
218 	0xe0,	0xe1,	0xe2,	0xe3,	0xe4,	0xe5,	0xe6,	0xe7, \
219 	0xe8,	0xe9,	0xea,	0xeb,	0xec,	0xed,	0xee,	0xef, \
220 	0xf0,	0xf1,	0xf2,	0xf3,	0xf4,	0xf5,	0xf6,	0xf7, \
221 	0xf8,	0xf9,	0xfa,	0xfb,	0xfc,	0xfd,	0xfe,	0xff, \
222 }
223 
224 #define	_DEFMAPUPPER { \
225 	0x00,	0x01,	0x02,	0x03,	0x04,	0x05,	0x06,	0x07, \
226 	0x08,	0x09,	0x0a,	0x0b,	0x0c,	0x0d,	0x0e,	0x0f, \
227 	0x10,	0x11,	0x12,	0x13,	0x14,	0x15,	0x16,	0x17, \
228 	0x18,	0x19,	0x1a,	0x1b,	0x1c,	0x1d,	0x1e,	0x1f, \
229 	0x20,	0x21,	0x22,	0x23,	0x24,	0x25,	0x26,	0x27, \
230 	0x28,	0x29,	0x2a,	0x2b,	0x2c,	0x2d,	0x2e,	0x2f, \
231 	0x30,	0x31,	0x32,	0x33,	0x34,	0x35,	0x36,	0x37, \
232 	0x38,	0x39,	0x3a,	0x3b,	0x3c,	0x3d,	0x3e,	0x3f, \
233 	0x40,	'A',	'B',	'C',	'D',	'E',	'F',	'G', \
234 	'H',	'I',	'J',	'K',	'L',	'M',	'N',	'O', \
235 	'P',	'Q',	'R',	'S',	'T',	'U',	'V',	'W', \
236 	'X',	'Y',	'Z',	0x5b,	0x5c,	0x5d,	0x5e,	0x5f, \
237 	0x60,	'A',	'B',	'C',	'D',	'E',	'F',	'G', \
238 	'H',	'I',	'J',	'K',	'L',	'M',	'N',	'O', \
239 	'P',	'Q',	'R',	'S',	'T',	'U',	'V',	'W', \
240 	'X',	'Y',	'Z',	0x7b,	0x7c,	0x7d,	0x7e,	0x7f, \
241 	0x80,	0x81,	0x82,	0x83,	0x84,	0x85,	0x86,	0x87, \
242 	0x88,	0x89,	0x8a,	0x8b,	0x8c,	0x8d,	0x8e,	0x8f, \
243 	0x90,	0x91,	0x92,	0x93,	0x94,	0x95,	0x96,	0x97, \
244 	0x98,	0x99,	0x9a,	0x9b,	0x9c,	0x9d,	0x9e,	0x9f, \
245 	0xa0,	0xa1,	0xa2,	0xa3,	0xa4,	0xa5,	0xa6,	0xa7, \
246 	0xa8,	0xa9,	0xaa,	0xab,	0xac,	0xad,	0xae,	0xaf, \
247 	0xb0,	0xb1,	0xb2,	0xb3,	0xb4,	0xb5,	0xb6,	0xb7, \
248 	0xb8,	0xb9,	0xba,	0xbb,	0xbc,	0xbd,	0xbe,	0xbf, \
249 	0xc0,	0xc1,	0xc2,	0xc3,	0xc4,	0xc5,	0xc6,	0xc7, \
250 	0xc8,	0xc9,	0xca,	0xcb,	0xcc,	0xcd,	0xce,	0xcf, \
251 	0xd0,	0xd1,	0xd2,	0xd3,	0xd4,	0xd5,	0xd6,	0xd7, \
252 	0xd8,	0xd9,	0xda,	0xdb,	0xdc,	0xdd,	0xde,	0xdf, \
253 	0xe0,	0xe1,	0xe2,	0xe3,	0xe4,	0xe5,	0xe6,	0xe7, \
254 	0xe8,	0xe9,	0xea,	0xeb,	0xec,	0xed,	0xee,	0xef, \
255 	0xf0,	0xf1,	0xf2,	0xf3,	0xf4,	0xf5,	0xf6,	0xf7, \
256 	0xf8,	0xf9,	0xfa,	0xfb,	0xfc,	0xfd,	0xfe,	0xff, \
257 }
258 
259 _RuneLocale _DefaultRuneLocale = {
260 	_RUNE_MAGIC_1,
261 	"NONE",
262 	_DEFRUNETYPE,
263 	_DEFMAPLOWER,
264 	_DEFMAPUPPER,
265 };
266 
267 /*
268  * __ctype_mask, __trans_lower, and __trans_upper come from former _ctype.c and
269  * have to stay pointers for binary compatibility, so we provide separate
270  * storage for them, initialized to "C" locale contents by default.
271  */
272 static unsigned int ___ctype_mask[_CACHED_RUNES] = _DEFRUNETYPE;
273 unsigned int *__ctype_mask = ___ctype_mask;
274 
275 static int ___trans_lower[_CACHED_RUNES] = _DEFMAPLOWER;
276 int *__trans_lower = ___trans_lower;
277 
278 static int ___trans_upper[_CACHED_RUNES] = _DEFMAPUPPER;
279 int *__trans_upper = ___trans_upper;
280