xref: /freebsd/lib/libiconv_modules/EUC/citrus_euc.c (revision 6be3386466ab79a84b48429ae66244f21526d3df)
1 /* $FreeBSD$ */
2 /*	$NetBSD: citrus_euc.c,v 1.14 2009/01/11 02:46:24 christos Exp $	*/
3 
4 /*-
5  * Copyright (c)2002 Citrus Project,
6  * All rights reserved.
7  *
8  * Redistribution and use in source and binary forms, with or without
9  * modification, are permitted provided that the following conditions
10  * are met:
11  * 1. Redistributions of source code must retain the above copyright
12  *    notice, this list of conditions and the following disclaimer.
13  * 2. Redistributions in binary form must reproduce the above copyright
14  *    notice, this list of conditions and the following disclaimer in the
15  *    documentation and/or other materials provided with the distribution.
16  *
17  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
18  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
21  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
23  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
24  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
26  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
27  * SUCH DAMAGE.
28  */
29 
30 /*-
31  * SPDX-License-Identifier: BSD-3-Clause
32  *
33  * Copyright (c) 1993
34  *	The Regents of the University of California.  All rights reserved.
35  *
36  * This code is derived from software contributed to Berkeley by
37  * Paul Borman at Krystal Technologies.
38  *
39  * Redistribution and use in source and binary forms, with or without
40  * modification, are permitted provided that the following conditions
41  * are met:
42  * 1. Redistributions of source code must retain the above copyright
43  *    notice, this list of conditions and the following disclaimer.
44  * 2. Redistributions in binary form must reproduce the above copyright
45  *    notice, this list of conditions and the following disclaimer in the
46  *    documentation and/or other materials provided with the distribution.
47  * 3. Neither the name of the University nor the names of its contributors
48  *    may be used to endorse or promote products derived from this software
49  *    without specific prior written permission.
50  *
51  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
52  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
53  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
54  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
55  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
56  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
57  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
58  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
59  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
60  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
61  * SUCH DAMAGE.
62  */
63 
64 #include <sys/cdefs.h>
65 #include <sys/types.h>
66 
67 #include <assert.h>
68 #include <errno.h>
69 #include <limits.h>
70 #include <stddef.h>
71 #include <stdio.h>
72 #include <stdlib.h>
73 #include <string.h>
74 #include <wchar.h>
75 
76 #include "citrus_namespace.h"
77 #include "citrus_bcs.h"
78 #include "citrus_types.h"
79 #include "citrus_module.h"
80 #include "citrus_stdenc.h"
81 #include "citrus_euc.h"
82 
83 
84 /* ----------------------------------------------------------------------
85  * private definitions used by the templates
86  */
87 
/*
 * Conversion state for one (possibly incomplete) multibyte character.
 *
 * chlen is the number of bytes of the current character that have been
 * collected in ch so far; 0 means that no character is pending.
 *
 * ch has to hold the longest sequence a configuration can describe:
 * _citrus_EUC_parse_variable() accepts per-codeset byte counts of up to 4
 * and _citrus_EUC_mbrtowc_priv() stores that many bytes here, so a
 * smaller buffer would be written past its end for 4-byte codesets.
 *
 * NOTE(review): where int is 4-byte aligned the fourth byte takes the
 * place of what used to be padding, so sizeof(_EUCState) should not
 * change -- confirm for unusual targets.
 */
typedef struct {
	int	 chlen;
	char	 ch[4];
} _EUCState;
92 
/*
 * Per-encoding parameters, filled in by _citrus_EUC_parse_variable().
 * bits[] and count[] are indexed by the codeset number (0-3) returned by
 * _citrus_EUC_cs().
 */
93 typedef struct {
94 	wchar_t		 bits[4];	/* tag OR-ed into wide chars of each codeset */
95 	wchar_t		 mask;		/* wide-char bits that carry the codeset tag */
96 	unsigned	 count[4];	/* bytes per character in each codeset */
97 	unsigned	 mb_cur_max;	/* largest value found in count[] */
98 } _EUCEncodingInfo;
99 
/* Lead bytes that _citrus_EUC_cs() maps to codesets 2 and 3 (single shifts). */
100 #define	_SS2	0x008e
101 #define	_SS3	0x008f
102 
/*
 * Accessors for the encoding info and per-function state inside a
 * combined object.  NOTE(review): that object's layout is not declared in
 * this file; presumably it comes from the stdenc template -- confirm.
 */
103 #define _CEI_TO_EI(_cei_)		(&(_cei_)->ei)
104 #define _CEI_TO_STATE(_cei_, _func_)	(_cei_)->states.s_##_func_
105 
/*
 * Names and properties of this encoding, expressed through generic macro
 * names.  NOTE(review): presumably consumed by citrus_stdenc_template.h,
 * which is included at the end of the file -- confirm.
 */
106 #define _FUNCNAME(m)			_citrus_EUC_##m
107 #define _ENCODING_INFO			_EUCEncodingInfo
108 #define _ENCODING_STATE			_EUCState
109 #define _ENCODING_MB_CUR_MAX(_ei_)	(_ei_)->mb_cur_max
/* EUC keeps no shift state between characters. */
110 #define _ENCODING_IS_STATE_DEPENDENT	0
111 #define _STATE_NEEDS_EXPLICIT_INIT(_ps_)	0
112 
113 
114 static __inline int
115 _citrus_EUC_cs(unsigned int c)
116 {
117 
118 	c &= 0xff;
119 
120 	return ((c & 0x80) ? c == _SS3 ? 3 : c == _SS2 ? 2 : 1 : 0);
121 }
122 
123 static __inline int
124 _citrus_EUC_parse_variable(_EUCEncodingInfo *ei, const void *var,
125     size_t lenvar __unused)
126 {
127 	char *e;
128 	const char *v;
129 	int x;
130 
131 	/* parse variable string */
132 	if (!var)
133 		return (EFTYPE);
134 
135 	v = (const char *)var;
136 
137 	while (*v == ' ' || *v == '\t')
138 		++v;
139 
140 	ei->mb_cur_max = 1;
141 	for (x = 0; x < 4; ++x) {
142 		ei->count[x] = (int)_bcs_strtol(v, (char **)&e, 0);
143 		if (v == e || !(v = e) || ei->count[x] < 1 || ei->count[x] > 4) {
144 			return (EFTYPE);
145 		}
146 		if (ei->mb_cur_max < ei->count[x])
147 			ei->mb_cur_max = ei->count[x];
148 		while (*v == ' ' || *v == '\t')
149 			++v;
150 		ei->bits[x] = (int)_bcs_strtol(v, (char **)&e, 0);
151 		if (v == e || !(v = e)) {
152 			return (EFTYPE);
153 		}
154 		while (*v == ' ' || *v == '\t')
155 			++v;
156 	}
157 	ei->mask = (int)_bcs_strtol(v, (char **)&e, 0);
158 	if (v == e || !(v = e)) {
159 		return (EFTYPE);
160 	}
161 
162 	return (0);
163 }
164 
165 
166 static __inline void
167 /*ARGSUSED*/
168 _citrus_EUC_init_state(_EUCEncodingInfo *ei __unused, _EUCState *s)
169 {
170 
171 	memset(s, 0, sizeof(*s));
172 }
173 
/*
 * Disabled code: the two helpers below are compiled out by "#if 0".
 * They copy a whole _EUCState to and from an untyped buffer.
 */
174 #if 0
/* Copy the state *s byte for byte into the buffer at pspriv. */
175 static __inline void
176 /*ARGSUSED*/
177 _citrus_EUC_pack_state(_EUCEncodingInfo *ei __unused, void *pspriv,
178     const _EUCState *s)
179 {
180 
181 	memcpy(pspriv, (const void *)s, sizeof(*s));
182 }
183 
/* Copy a state byte for byte from the buffer at pspriv into *s. */
184 static __inline void
185 /*ARGSUSED*/
186 _citrus_EUC_unpack_state(_EUCEncodingInfo *ei __unused, _EUCState *s,
187     const void *pspriv)
188 {
189 
190 	memcpy((void *)s, pspriv, sizeof(*s));
191 }
192 #endif
193 
194 static int
195 _citrus_EUC_mbrtowc_priv(_EUCEncodingInfo *ei, wchar_t *pwc, char **s,
196     size_t n, _EUCState *psenc, size_t *nresult)
197 {
198 	wchar_t wchar;
199 	int c, chlenbak, cs, len;
200 	char *s0, *s1 = NULL;
201 
202 	s0 = *s;
203 
204 	if (s0 == NULL) {
205 		_citrus_EUC_init_state(ei, psenc);
206 		*nresult = 0; /* state independent */
207 		return (0);
208 	}
209 
210 	chlenbak = psenc->chlen;
211 
212 	/* make sure we have the first byte in the buffer */
213 	switch (psenc->chlen) {
214 	case 0:
215 		if (n < 1)
216 			goto restart;
217 		psenc->ch[0] = *s0++;
218 		psenc->chlen = 1;
219 		n--;
220 		break;
221 	case 1:
222 	case 2:
223 		break;
224 	default:
225 		/* illgeal state */
226 		goto encoding_error;
227 	}
228 
229 	c = ei->count[cs = _citrus_EUC_cs(psenc->ch[0] & 0xff)];
230 	if (c == 0)
231 		goto encoding_error;
232 	while (psenc->chlen < c) {
233 		if (n < 1)
234 			goto restart;
235 		psenc->ch[psenc->chlen] = *s0++;
236 		psenc->chlen++;
237 		n--;
238 	}
239 	*s = s0;
240 
241 	switch (cs) {
242 	case 3:
243 	case 2:
244 		/* skip SS2/SS3 */
245 		len = c - 1;
246 		s1 = &psenc->ch[1];
247 		break;
248 	case 1:
249 	case 0:
250 		len = c;
251 		s1 = &psenc->ch[0];
252 		break;
253 	default:
254 		goto encoding_error;
255 	}
256 	wchar = 0;
257 	while (len-- > 0)
258 		wchar = (wchar << 8) | (*s1++ & 0xff);
259 	wchar = (wchar & ~ei->mask) | ei->bits[cs];
260 
261 	psenc->chlen = 0;
262 	if (pwc)
263 		*pwc = wchar;
264 	*nresult = wchar ? (size_t)(c - chlenbak) : 0;
265 	return (0);
266 
267 encoding_error:
268 	psenc->chlen = 0;
269 	*nresult = (size_t)-1;
270 	return (EILSEQ);
271 
272 restart:
273 	*nresult = (size_t)-2;
274 	*s = s0;
275 	return (0);
276 }
277 
278 static int
279 _citrus_EUC_wcrtomb_priv(_EUCEncodingInfo *ei, char *s, size_t n, wchar_t wc,
280     _EUCState *psenc __unused, size_t *nresult)
281 {
282 	wchar_t m, nm;
283 	unsigned int cs;
284 	int ret;
285 	short i;
286 
287 	m = wc & ei->mask;
288 	nm = wc & ~m;
289 
290 	for (cs = 0; cs < sizeof(ei->count) / sizeof(ei->count[0]); cs++)
291 		if (m == ei->bits[cs])
292 			break;
293 	/* fallback case - not sure if it is necessary */
294 	if (cs == sizeof(ei->count) / sizeof(ei->count[0]))
295 		cs = 1;
296 
297 	i = ei->count[cs];
298 	if (n < (unsigned)i) {
299 		ret = E2BIG;
300 		goto err;
301 	}
302 	m = (cs) ? 0x80 : 0x00;
303 	switch (cs) {
304 	case 2:
305 		*s++ = _SS2;
306 		i--;
307 		break;
308 	case 3:
309 		*s++ = _SS3;
310 		i--;
311 		break;
312 	}
313 
314 	while (i-- > 0)
315 		*s++ = ((nm >> (i << 3)) & 0xff) | m;
316 
317 	*nresult = (size_t)ei->count[cs];
318 	return (0);
319 
320 err:
321 	*nresult = (size_t)-1;
322 	return (ret);
323 }
324 
325 static __inline int
326 /*ARGSUSED*/
327 _citrus_EUC_stdenc_wctocs(_EUCEncodingInfo * __restrict ei,
328     _csid_t * __restrict csid, _index_t * __restrict idx, wchar_t wc)
329 {
330 	wchar_t m, nm;
331 
332 	m = wc & ei->mask;
333 	nm = wc & ~m;
334 
335 	*csid = (_citrus_csid_t)m;
336 	*idx  = (_citrus_index_t)nm;
337 
338 	return (0);
339 }
340 
341 static __inline int
342 /*ARGSUSED*/
343 _citrus_EUC_stdenc_cstowc(_EUCEncodingInfo * __restrict ei,
344     wchar_t * __restrict wc, _csid_t csid, _index_t idx)
345 {
346 
347 	if ((csid & ~ei->mask) != 0 || (idx & ei->mask) != 0)
348 		return (EINVAL);
349 
350 	*wc = (wchar_t)csid | (wchar_t)idx;
351 
352 	return (0);
353 }
354 
355 static __inline int
356 /*ARGSUSED*/
357 _citrus_EUC_stdenc_get_state_desc_generic(_EUCEncodingInfo * __restrict ei __unused,
358     _EUCState * __restrict psenc, int * __restrict rstate)
359 {
360 
361 	*rstate = (psenc->chlen == 0) ? _STDENC_SDGEN_INITIAL :
362 	    _STDENC_SDGEN_INCOMPLETE_CHAR;
363 	return (0);
364 }
365 
366 static int
367 /*ARGSUSED*/
368 _citrus_EUC_encoding_module_init(_EUCEncodingInfo * __restrict ei,
369     const void * __restrict var, size_t lenvar)
370 {
371 
372 	return (_citrus_EUC_parse_variable(ei, var, lenvar));
373 }
374 
375 static void
376 /*ARGSUSED*/
377 _citrus_EUC_encoding_module_uninit(_EUCEncodingInfo * __restrict ei __unused)
378 {
379 
380 }
381 
382 /* ----------------------------------------------------------------------
383  * public interface for stdenc
384  */
385 
/*
 * NOTE(review): these two macros are defined outside this file;
 * presumably they declare the stdenc entry points for the EUC module and
 * define its operations table -- confirm in citrus_stdenc.h.
 */
386 _CITRUS_STDENC_DECLS(EUC);
387 _CITRUS_STDENC_DEF_OPS(EUC);
388 
/*
 * Included last, after the _FUNCNAME / _ENCODING_* macros and the private
 * functions above have been defined.  NOTE(review): presumably the
 * template builds the generic entry points on top of them -- confirm.
 */
389 #include "citrus_stdenc_template.h"
390