xref: /freebsd/lib/libc/locale/mskanji.c (revision 3823d5e198425b4f5e5a80267d195769d1063773)
1 /*
2  * Copyright (c) 2002-2004 Tim J. Robbins. All rights reserved.
3  *
4  *    ja_JP.SJIS locale table for BSD4.4/rune
5  *    version 1.0
6  *    (C) Sin'ichiro MIYATANI / Phase One, Inc
7  *    May 12, 1995
8  *
9  * Copyright (c) 2011 The FreeBSD Foundation
10  * All rights reserved.
11  * Portions of this software were developed by David Chisnall
12  * under sponsorship from the FreeBSD Foundation.
13  *
14  * Redistribution and use in source and binary forms, with or without
15  * modification, are permitted provided that the following conditions
16  * are met:
17  * 1. Redistributions of source code must retain the above copyright
18  *    notice, this list of conditions and the following disclaimer.
19  * 2. Redistributions in binary form must reproduce the above copyright
20  *    notice, this list of conditions and the following disclaimer in the
21  *    documentation and/or other materials provided with the distribution.
22  * 3. All advertising materials mentioning features or use of this software
23  *    must display the following acknowledgement:
24  *      This product includes software developed by Phase One, Inc.
25  * 4. The name of Phase One, Inc. may be used to endorse or promote products
26  *    derived from this software without specific prior written permission.
27  *
28  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
29  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
30  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
31  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
32  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
33  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
34  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
35  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
36  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
37  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
38  * SUCH DAMAGE.
39  */
40 
41 #if defined(LIBC_SCCS) && !defined(lint)
42 static char sccsid[] = "@(#)mskanji.c	1.0 (Phase One) 5/5/95";
43 #endif /* LIBC_SCCS and not lint */
44 #include <sys/cdefs.h>
45 __FBSDID("$FreeBSD$");
46 
47 #include <sys/types.h>
48 #include <errno.h>
49 #include <runetype.h>
50 #include <stdlib.h>
51 #include <string.h>
52 #include <wchar.h>
53 #include "mblocal.h"
54 
55 extern int __mb_sb_limit;
56 
/*
 * File-private conversion routines.  They are defined further down and are
 * installed into the locale's ctype structure by _MSKanji_init().
 */
static int	_MSKanji_mbsinit(const mbstate_t *ps);
static size_t	_MSKanji_mbrtowc(wchar_t * __restrict pwc,
		    const char * __restrict s, size_t n,
		    mbstate_t * __restrict ps);
static size_t	_MSKanji_wcrtomb(char * __restrict s, wchar_t wc,
		    mbstate_t * __restrict ps);
62 
/*
 * Conversion state for this encoding.  The converters in this file access
 * the caller's mbstate_t through a cast to this type, so it has to fit
 * inside an mbstate_t.
 */
typedef struct {
	/*
	 * Lead byte saved by _MSKanji_mbrtowc() when the input ended before
	 * the second byte of a two-byte character; 0 means initial state.
	 */
	wchar_t	ch;
} _MSKanjiState;
66 
67 int
68 _MSKanji_init(struct xlocale_ctype *l, _RuneLocale *rl)
69 {
70 
71 	l->__mbrtowc = _MSKanji_mbrtowc;
72 	l->__wcrtomb = _MSKanji_wcrtomb;
73 	l->__mbsinit = _MSKanji_mbsinit;
74 	l->runes = rl;
75 	l->__mb_cur_max = 2;
76 	l->__mb_sb_limit = 256;
77 	return (0);
78 }
79 
80 static int
81 _MSKanji_mbsinit(const mbstate_t *ps)
82 {
83 
84 	return (ps == NULL || ((const _MSKanjiState *)ps)->ch == 0);
85 }
86 
87 static size_t
88 _MSKanji_mbrtowc(wchar_t * __restrict pwc, const char * __restrict s, size_t n,
89     mbstate_t * __restrict ps)
90 {
91 	_MSKanjiState *ms;
92 	wchar_t wc;
93 
94 	ms = (_MSKanjiState *)ps;
95 
96 	if ((ms->ch & ~0xFF) != 0) {
97 		/* Bad conversion state. */
98 		errno = EINVAL;
99 		return ((size_t)-1);
100 	}
101 
102 	if (s == NULL) {
103 		s = "";
104 		n = 1;
105 		pwc = NULL;
106 	}
107 
108 	if (n == 0)
109 		/* Incomplete multibyte sequence */
110 		return ((size_t)-2);
111 
112 	if (ms->ch != 0) {
113 		if (*s == '\0') {
114 			errno = EILSEQ;
115 			return ((size_t)-1);
116 		}
117 		wc = (ms->ch << 8) | (*s & 0xFF);
118 		if (pwc != NULL)
119 			*pwc = wc;
120 		ms->ch = 0;
121 		return (1);
122 	}
123 	wc = *s++ & 0xff;
124 	if ((wc > 0x80 && wc < 0xa0) || (wc >= 0xe0 && wc < 0xfd)) {
125 		if (n < 2) {
126 			/* Incomplete multibyte sequence */
127 			ms->ch = wc;
128 			return ((size_t)-2);
129 		}
130 		if (*s == '\0') {
131 			errno = EILSEQ;
132 			return ((size_t)-1);
133 		}
134 		wc = (wc << 8) | (*s++ & 0xff);
135 		if (pwc != NULL)
136 			*pwc = wc;
137 		return (2);
138 	} else {
139 		if (pwc != NULL)
140 			*pwc = wc;
141 		return (wc == L'\0' ? 0 : 1);
142 	}
143 }
144 
145 static size_t
146 _MSKanji_wcrtomb(char * __restrict s, wchar_t wc, mbstate_t * __restrict ps)
147 {
148 	_MSKanjiState *ms;
149 	int len, i;
150 
151 	ms = (_MSKanjiState *)ps;
152 
153 	if (ms->ch != 0) {
154 		errno = EINVAL;
155 		return ((size_t)-1);
156 	}
157 
158 	if (s == NULL)
159 		/* Reset to initial shift state (no-op) */
160 		return (1);
161 	len = (wc > 0x100) ? 2 : 1;
162 	for (i = len; i-- > 0; )
163 		*s++ = wc >> (i << 3);
164 	return (len);
165 }
166