xref: /illumos-gate/usr/src/lib/libc/port/locale/mskanji.c (revision 2ad72058bc680e30f084e9f9ba8ceb0f77386821)
1 /*
2  * Copyright (c) 2002-2004 Tim J. Robbins. All rights reserved.
3  *
4  *    ja_JP.SJIS locale table for BSD4.4/rune
5  *    version 1.0
6  *    (C) Sin'ichiro MIYATANI / Phase One, Inc
7  *    May 12, 1995
8  *
9  * Redistribution and use in source and binary forms, with or without
10  * modification, are permitted provided that the following conditions
11  * are met:
12  * 1. Redistributions of source code must retain the above copyright
13  *    notice, this list of conditions and the following disclaimer.
14  * 2. Redistributions in binary form must reproduce the above copyright
15  *    notice, this list of conditions and the following disclaimer in the
16  *    documentation and/or other materials provided with the distribution.
17  * 3. All advertising materials mentioning features or use of this software
18  *    must display the following acknowledgement:
19  *      This product includes software developed by Phase One, Inc.
20  * 4. The name of Phase One, Inc. may be used to endorse or promote products
21  *    derived from this software without specific prior written permission.
22  *
23  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
24  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
25  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
26  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
27  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
28  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
29  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
30  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
31  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
32  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
33  * SUCH DAMAGE.
34  */
35 
36 /*
37  * Copyright 2010 Nexenta Systems, Inc.  All rights reserved.
38  * Use is subject to license terms.
39  */
40 
41 #include "lint.h"
42 #include <sys/types.h>
43 #include <errno.h>
44 #include "runetype.h"
45 #include <stdlib.h>
46 #include <string.h>
47 #include <wchar.h>
48 #include "mblocal.h"
49 
50 static size_t	_MSKanji_mbrtowc(wchar_t *_RESTRICT_KYWD,
51 		    const char *_RESTRICT_KYWD,
52 		    size_t, mbstate_t *_RESTRICT_KYWD);
53 static int	_MSKanji_mbsinit(const mbstate_t *);
54 static size_t	_MSKanji_wcrtomb(char *_RESTRICT_KYWD, wchar_t,
55 		    mbstate_t *_RESTRICT_KYWD);
56 
/*
 * Conversion state kept inside the caller's mbstate_t (the routines in
 * this file cast the mbstate_t pointer to this type).
 *
 * ch is 0 in the initial state.  _MSKanji_mbrtowc() stores the lead byte
 * of a two-byte character here when the input ends before the trail byte,
 * and clears it again once the character has been completed.
 */
typedef struct {
	wchar_t	ch;	/* pending lead byte, or 0 when nothing is saved */
} _MSKanjiState;
60 
61 int
62 _MSKanji_init(_RuneLocale *rl)
63 {
64 
65 	__mbrtowc = _MSKanji_mbrtowc;
66 	__wcrtomb = _MSKanji_wcrtomb;
67 	__mbsinit = _MSKanji_mbsinit;
68 	_CurrentRuneLocale = rl;
69 	__ctype[520] = 2;
70 	charset_is_ascii = 0;
71 	return (0);
72 }
73 
74 static int
75 _MSKanji_mbsinit(const mbstate_t *ps)
76 {
77 
78 	return (ps == NULL || ((const _MSKanjiState *)ps)->ch == 0);
79 }
80 
81 static size_t
82 _MSKanji_mbrtowc(wchar_t *_RESTRICT_KYWD pwc, const char *_RESTRICT_KYWD s,
83     size_t n, mbstate_t *_RESTRICT_KYWD ps)
84 {
85 	_MSKanjiState *ms;
86 	wchar_t wc;
87 
88 	ms = (_MSKanjiState *)ps;
89 
90 	if ((ms->ch & ~0xFF) != 0) {
91 		/* Bad conversion state. */
92 		errno = EINVAL;
93 		return ((size_t)-1);
94 	}
95 
96 	if (s == NULL) {
97 		s = "";
98 		n = 1;
99 		pwc = NULL;
100 	}
101 
102 	if (n == 0)
103 		/* Incomplete multibyte sequence */
104 		return ((size_t)-2);
105 
106 	if (ms->ch != 0) {
107 		if (*s == '\0') {
108 			errno = EILSEQ;
109 			return ((size_t)-1);
110 		}
111 		wc = (ms->ch << 8) | (*s & 0xFF);
112 		if (pwc != NULL)
113 			*pwc = wc;
114 		ms->ch = 0;
115 		return (1);
116 	}
117 	wc = *s++ & 0xff;
118 	if ((wc > 0x80 && wc < 0xa0) || (wc >= 0xe0 && wc < 0xfd)) {
119 		if (n < 2) {
120 			/* Incomplete multibyte sequence */
121 			ms->ch = wc;
122 			return ((size_t)-2);
123 		}
124 		if (*s == '\0') {
125 			errno = EILSEQ;
126 			return ((size_t)-1);
127 		}
128 		wc = (wc << 8) | (*s++ & 0xff);
129 		if (pwc != NULL)
130 			*pwc = wc;
131 		return (2);
132 	} else {
133 		if (pwc != NULL)
134 			*pwc = wc;
135 		return (wc == L'\0' ? 0 : 1);
136 	}
137 }
138 
139 static size_t
140 _MSKanji_wcrtomb(char *_RESTRICT_KYWD s, wchar_t wc,
141     mbstate_t *_RESTRICT_KYWD ps)
142 {
143 	_MSKanjiState *ms;
144 	int len, i;
145 
146 	ms = (_MSKanjiState *)ps;
147 
148 	if (ms->ch != 0) {
149 		errno = EINVAL;
150 		return ((size_t)-1);
151 	}
152 
153 	if (s == NULL)
154 		/* Reset to initial shift state (no-op) */
155 		return (1);
156 	len = (wc > 0x100) ? 2 : 1;
157 	for (i = len; i-- > 0; )
158 		*s++ = wc >> (i << 3);
159 	return (len);
160 }
161