xref: /illumos-gate/usr/src/lib/iconv_modules/ja/common/EUC-JIS-2004_TO_Unicode.c (revision 16d8656330ae5622ec32e5007f62145ebafdc50f)
/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License (the "License").
 * You may not use this file except in compliance with the License.
 *
 * You can obtain a copy of the license at src/OPENSOLARIS.LICENSE
 * or http://www.opensolaris.org/os/licensing.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */
/*
 * Copyright 2007 Sun Microsystems, Inc.  All rights reserved.
 * Use is subject to license terms.
 */


27*16d86563SAlexander Pyhalov #include <stdlib.h>
28*16d86563SAlexander Pyhalov #include <errno.h>
29*16d86563SAlexander Pyhalov #include <euc.h>
30*16d86563SAlexander Pyhalov #include "japanese.h"
31*16d86563SAlexander Pyhalov #include "jfp_iconv_unicode.h"
32*16d86563SAlexander Pyhalov 
33*16d86563SAlexander Pyhalov #define	JFP_J2U_ICONV_X0213
34*16d86563SAlexander Pyhalov #include "jfp_jis_to_ucs2.h"
35*16d86563SAlexander Pyhalov 
/*
 * iconv module entry point: create a conversion descriptor.
 *
 * Simply forwards to _icv_open_unicode() with an argument of (size_t)0 and
 * returns whatever that function returns.  The meaning of the argument and
 * of the returned pointer is defined by _icv_open_unicode(), which is not
 * part of this file.
 */
void *
_icv_open(void)
{
	return (_icv_open_unicode((size_t)0));
}

/*
 * iconv module entry point: release a conversion descriptor.
 *
 * cd is handed unchanged to _icv_close_unicode(); this function adds no
 * behaviour of its own.
 */
void
_icv_close(void *cd)
{
	_icv_close_unicode(cd);
}

49*16d86563SAlexander Pyhalov size_t
_icv_iconv(void * cd,char ** inbuf,size_t * inbytesleft,char ** outbuf,size_t * outbytesleft)50*16d86563SAlexander Pyhalov _icv_iconv(void *cd, char **inbuf, size_t *inbytesleft,
51*16d86563SAlexander Pyhalov 				char **outbuf, size_t *outbytesleft)
52*16d86563SAlexander Pyhalov {
53*16d86563SAlexander Pyhalov 	unsigned int	u32;		/* UTF-32 */
54*16d86563SAlexander Pyhalov 	unsigned short	e16;		/* 16-bit EUC */
55*16d86563SAlexander Pyhalov 	unsigned char	ic1, ic2, ic3;	/* 1st, 2nd, and 3rd bytes of a char */
56*16d86563SAlexander Pyhalov 	size_t		rv = (size_t)0;	/* return value of this function */
57*16d86563SAlexander Pyhalov 
58*16d86563SAlexander Pyhalov 	unsigned char	*ip;
59*16d86563SAlexander Pyhalov         size_t		ileft;
60*16d86563SAlexander Pyhalov 	char		*op;
61*16d86563SAlexander Pyhalov         size_t		oleft;
62*16d86563SAlexander Pyhalov 
63*16d86563SAlexander Pyhalov 	/*
64*16d86563SAlexander Pyhalov 	 * If inbuf and/or *inbuf are NULL, reset conversion descriptor
65*16d86563SAlexander Pyhalov 	 * and put escape sequence if needed.
66*16d86563SAlexander Pyhalov 	 */
67*16d86563SAlexander Pyhalov 	if ((inbuf == NULL) || (*inbuf == NULL)) {
68*16d86563SAlexander Pyhalov 		_icv_reset_unicode(cd);
69*16d86563SAlexander Pyhalov 		return ((size_t)0);
70*16d86563SAlexander Pyhalov 	}
71*16d86563SAlexander Pyhalov 
72*16d86563SAlexander Pyhalov 	ip = (unsigned char *)*inbuf;
73*16d86563SAlexander Pyhalov 	ileft = *inbytesleft;
74*16d86563SAlexander Pyhalov 	op = *outbuf;
75*16d86563SAlexander Pyhalov 	oleft = *outbytesleft;
76*16d86563SAlexander Pyhalov 
77*16d86563SAlexander Pyhalov 	while (ileft != 0) {
78*16d86563SAlexander Pyhalov 		NGET(ic1, "never fail here"); /* get 1st byte */
79*16d86563SAlexander Pyhalov 
80*16d86563SAlexander Pyhalov 		if (ISASC(ic1)) { /* CS0; 1 byte */
81*16d86563SAlexander Pyhalov 			u32 = (unsigned int)_jfp_tbl_jisx0201roman_to_ucs2[ic1];
82*16d86563SAlexander Pyhalov 			PUTU(u32, "CS0");
83*16d86563SAlexander Pyhalov 		} else if (ISCS1(ic1)) { /* JIS X 0213 plane 1; 2 bytes */
84*16d86563SAlexander Pyhalov 			NGET(ic2, "CS1-2");
85*16d86563SAlexander Pyhalov 			if (ISCS1(ic2)) { /* 2nd byte check passed */
86*16d86563SAlexander Pyhalov 				e16 = (ic1 << 8) | ic2;
87*16d86563SAlexander Pyhalov 				u32 = (unsigned int)_jfp_tbl_jisx0208_to_ucs2[
88*16d86563SAlexander Pyhalov 					(ic1 - 0xa1) * 94 + (ic2 - 0xa1)];
89*16d86563SAlexander Pyhalov 				if (IFHISUR(u32)) {
90*16d86563SAlexander Pyhalov 					u32 = _jfp_lookup_x0213_nonbmp(
91*16d86563SAlexander Pyhalov 						e16, u32);
92*16d86563SAlexander Pyhalov 					PUTU(u32, "CS1->NONBMP");
93*16d86563SAlexander Pyhalov 				} else if (u32 == 0xffff) {
94*16d86563SAlexander Pyhalov 					/* need to compose */
95*16d86563SAlexander Pyhalov 					unsigned int	u32_2;
96*16d86563SAlexander Pyhalov 					u32 = _jfp_lookup_x0213_compose(
97*16d86563SAlexander Pyhalov 						e16, &u32_2);
98*16d86563SAlexander Pyhalov 					PUTU(u32, "CS1->CP1");
99*16d86563SAlexander Pyhalov 					PUTU(u32_2, "CS1->CP2");
100*16d86563SAlexander Pyhalov 				} else {
101*16d86563SAlexander Pyhalov 					PUTU(u32, "CS1->BMP");
102*16d86563SAlexander Pyhalov 				}
103*16d86563SAlexander Pyhalov 			} else { /* 2nd byte check failed */
104*16d86563SAlexander Pyhalov 				RETERROR(EILSEQ, "CS1-2")
105*16d86563SAlexander Pyhalov 			}
106*16d86563SAlexander Pyhalov 		} else if (ic1 == SS2) { /* JIS X 0201 Kana; 2 bytes */
107*16d86563SAlexander Pyhalov 			NGET(ic2, "CS2-2");
108*16d86563SAlexander Pyhalov 			if (ISCS2(ic2)) { /* 2nd byte check passed */
109*16d86563SAlexander Pyhalov 				u32 = (unsigned int)
110*16d86563SAlexander Pyhalov 				_jfp_tbl_jisx0201kana_to_ucs2[ic2 - 0xa1];
111*16d86563SAlexander Pyhalov 				PUTU(u32, "CS2->Kana");
112*16d86563SAlexander Pyhalov 			} else { /* 2nd byte check failed */
113*16d86563SAlexander Pyhalov 				RETERROR(EILSEQ, "CS2-2")
114*16d86563SAlexander Pyhalov 			}
115*16d86563SAlexander Pyhalov 		} else if (ic1 == SS3) { /* JIS X 0213 plane 2; 3 bytes */
116*16d86563SAlexander Pyhalov 			NGET(ic2, "CS3-2");
117*16d86563SAlexander Pyhalov 			if (ISCS3(ic2)) { /* 2nd byte check passed */
118*16d86563SAlexander Pyhalov 				NGET(ic3, "CS3-3");
119*16d86563SAlexander Pyhalov 				if (ISCS3(ic3)) { /* 3rd byte check passed */
120*16d86563SAlexander Pyhalov 					e16 = (ic2 << 8) | (ic3 & 0x7f);
121*16d86563SAlexander Pyhalov 					u32 = (unsigned int)
122*16d86563SAlexander Pyhalov 					_jfp_tbl_jisx0213p2_to_ucs2[
123*16d86563SAlexander Pyhalov 					(ic2 - 0xa1) * 94 + (ic3 - 0xa1)];
124*16d86563SAlexander Pyhalov 					if (IFHISUR(u32)) {
125*16d86563SAlexander Pyhalov 						u32 = _jfp_lookup_x0213_nonbmp(
126*16d86563SAlexander Pyhalov 						e16, u32);
127*16d86563SAlexander Pyhalov 						PUTU(u32, "CS3->NONBMP");
128*16d86563SAlexander Pyhalov 					} else {
129*16d86563SAlexander Pyhalov 						PUTU(u32, "CS3->BMP");
130*16d86563SAlexander Pyhalov 					}
131*16d86563SAlexander Pyhalov 				} else { /* 3rd byte check failed */
132*16d86563SAlexander Pyhalov 					RETERROR(EILSEQ, "CS3-3")
133*16d86563SAlexander Pyhalov 				}
134*16d86563SAlexander Pyhalov 			} else { /* 2nd byte check failed */
135*16d86563SAlexander Pyhalov 				RETERROR(EILSEQ, "CS3-2")
136*16d86563SAlexander Pyhalov 			}
137*16d86563SAlexander Pyhalov 		} else if (ISC1CTRLEUC(ic1)) { /* C1 control; 1 byte */
138*16d86563SAlexander Pyhalov 			u32 = ic1;
139*16d86563SAlexander Pyhalov 			PUTU(u32, "E2BIG C1CTRL");
140*16d86563SAlexander Pyhalov 		} else { /* 1st byte check failed */
141*16d86563SAlexander Pyhalov 			RETERROR(EILSEQ, "CS?-1")
142*16d86563SAlexander Pyhalov 		}
143*16d86563SAlexander Pyhalov 
144*16d86563SAlexander Pyhalov 		/*
145*16d86563SAlexander Pyhalov 		 * One character successfully converted so update
146*16d86563SAlexander Pyhalov 		 * values outside of this function's stack.
147*16d86563SAlexander Pyhalov 		 */
148*16d86563SAlexander Pyhalov 		*inbuf = (char *)ip;
149*16d86563SAlexander Pyhalov 		*inbytesleft = ileft;
150*16d86563SAlexander Pyhalov 		*outbuf = op;
151*16d86563SAlexander Pyhalov 		*outbytesleft = oleft;
152*16d86563SAlexander Pyhalov 	}
153*16d86563SAlexander Pyhalov 
154*16d86563SAlexander Pyhalov ret:
155*16d86563SAlexander Pyhalov 	DEBUGPRINTERROR
156*16d86563SAlexander Pyhalov 
157*16d86563SAlexander Pyhalov 	/*
158*16d86563SAlexander Pyhalov 	 * Return value for successful return is not defined by XPG
159*16d86563SAlexander Pyhalov 	 * so return same as *inbytesleft as existing codes do.
160*16d86563SAlexander Pyhalov 	 */
161*16d86563SAlexander Pyhalov 	return ((rv == (size_t)-1) ? rv : *inbytesleft);
162*16d86563SAlexander Pyhalov }
163