1ad30f8e7SGabor Kovesdan /* $FreeBSD$ */ 2ad30f8e7SGabor Kovesdan /* $NetBSD: citrus_mskanji.c,v 1.13 2008/06/14 16:01:08 tnozaki Exp $ */ 3ad30f8e7SGabor Kovesdan 4ad30f8e7SGabor Kovesdan /*- 5*5e53a4f9SPedro F. Giffuni * SPDX-License-Identifier: BSD-2-Clause 6*5e53a4f9SPedro F. Giffuni * 7ad30f8e7SGabor Kovesdan * Copyright (c)2002 Citrus Project, 8ad30f8e7SGabor Kovesdan * All rights reserved. 9ad30f8e7SGabor Kovesdan * 10ad30f8e7SGabor Kovesdan * Redistribution and use in source and binary forms, with or without 11ad30f8e7SGabor Kovesdan * modification, are permitted provided that the following conditions 12ad30f8e7SGabor Kovesdan * are met: 13ad30f8e7SGabor Kovesdan * 1. Redistributions of source code must retain the above copyright 14ad30f8e7SGabor Kovesdan * notice, this list of conditions and the following disclaimer. 15ad30f8e7SGabor Kovesdan * 2. Redistributions in binary form must reproduce the above copyright 16ad30f8e7SGabor Kovesdan * notice, this list of conditions and the following disclaimer in the 17ad30f8e7SGabor Kovesdan * documentation and/or other materials provided with the distribution. 18ad30f8e7SGabor Kovesdan * 19ad30f8e7SGabor Kovesdan * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 20ad30f8e7SGabor Kovesdan * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 21ad30f8e7SGabor Kovesdan * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 22ad30f8e7SGabor Kovesdan * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 23ad30f8e7SGabor Kovesdan * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 24ad30f8e7SGabor Kovesdan * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 25ad30f8e7SGabor Kovesdan * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 26ad30f8e7SGabor Kovesdan * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 27ad30f8e7SGabor Kovesdan * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 28ad30f8e7SGabor Kovesdan * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 29ad30f8e7SGabor Kovesdan * SUCH DAMAGE. 30ad30f8e7SGabor Kovesdan */ 31ad30f8e7SGabor Kovesdan 32ad30f8e7SGabor Kovesdan /* 33ad30f8e7SGabor Kovesdan * ja_JP.SJIS locale table for BSD4.4/rune 34ad30f8e7SGabor Kovesdan * version 1.0 35ad30f8e7SGabor Kovesdan * (C) Sin'ichiro MIYATANI / Phase One, Inc 36ad30f8e7SGabor Kovesdan * May 12, 1995 37ad30f8e7SGabor Kovesdan * 38ad30f8e7SGabor Kovesdan * Redistribution and use in source and binary forms, with or without 39ad30f8e7SGabor Kovesdan * modification, are permitted provided that the following conditions 40ad30f8e7SGabor Kovesdan * are met: 41ad30f8e7SGabor Kovesdan * 1. Redistributions of source code must retain the above copyright 42ad30f8e7SGabor Kovesdan * notice, this list of conditions and the following disclaimer. 43ad30f8e7SGabor Kovesdan * 2. Redistributions in binary form must reproduce the above copyright 44ad30f8e7SGabor Kovesdan * notice, this list of conditions and the following disclaimer in the 45ad30f8e7SGabor Kovesdan * documentation and/or other materials provided with the distribution. 46ad30f8e7SGabor Kovesdan * 3. All advertising materials mentioning features or use of this software 47ad30f8e7SGabor Kovesdan * must display the following acknowledgement: 48ad30f8e7SGabor Kovesdan * This product includes software developed by Phase One, Inc. 49ad30f8e7SGabor Kovesdan * 4. The name of Phase One, Inc. may be used to endorse or promote products 50ad30f8e7SGabor Kovesdan * derived from this software without specific prior written permission. 51ad30f8e7SGabor Kovesdan * 52ad30f8e7SGabor Kovesdan * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 53ad30f8e7SGabor Kovesdan * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 54ad30f8e7SGabor Kovesdan * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 55ad30f8e7SGabor Kovesdan * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 56ad30f8e7SGabor Kovesdan * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 57ad30f8e7SGabor Kovesdan * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 58ad30f8e7SGabor Kovesdan * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 59ad30f8e7SGabor Kovesdan * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 60ad30f8e7SGabor Kovesdan * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 61ad30f8e7SGabor Kovesdan * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 62ad30f8e7SGabor Kovesdan * SUCH DAMAGE. 63ad30f8e7SGabor Kovesdan */ 64ad30f8e7SGabor Kovesdan 65ad30f8e7SGabor Kovesdan 66ad30f8e7SGabor Kovesdan #include <sys/cdefs.h> 67ad30f8e7SGabor Kovesdan #include <sys/types.h> 68ad30f8e7SGabor Kovesdan 69ad30f8e7SGabor Kovesdan #include <assert.h> 70ad30f8e7SGabor Kovesdan #include <errno.h> 71ad30f8e7SGabor Kovesdan #include <limits.h> 72ad30f8e7SGabor Kovesdan #include <stdbool.h> 73ad30f8e7SGabor Kovesdan #include <stddef.h> 74ad30f8e7SGabor Kovesdan #include <stdio.h> 75ad30f8e7SGabor Kovesdan #include <stdlib.h> 76ad30f8e7SGabor Kovesdan #include <string.h> 77ad30f8e7SGabor Kovesdan #include <wchar.h> 78ad30f8e7SGabor Kovesdan 79ad30f8e7SGabor Kovesdan #include "citrus_namespace.h" 80ad30f8e7SGabor Kovesdan #include "citrus_types.h" 81ad30f8e7SGabor Kovesdan #include "citrus_bcs.h" 82ad30f8e7SGabor Kovesdan #include "citrus_module.h" 83ad30f8e7SGabor Kovesdan #include "citrus_stdenc.h" 84ad30f8e7SGabor Kovesdan #include "citrus_mskanji.h" 85ad30f8e7SGabor Kovesdan 86ad30f8e7SGabor Kovesdan 87ad30f8e7SGabor Kovesdan /* ---------------------------------------------------------------------- 88ad30f8e7SGabor Kovesdan * private stuffs used by templates 89ad30f8e7SGabor Kovesdan */ 90ad30f8e7SGabor Kovesdan 91ad30f8e7SGabor Kovesdan typedef struct _MSKanjiState { 92ad30f8e7SGabor Kovesdan int chlen; 93ad30f8e7SGabor Kovesdan char ch[2]; 94ad30f8e7SGabor Kovesdan } _MSKanjiState; 95ad30f8e7SGabor Kovesdan 96ad30f8e7SGabor Kovesdan typedef struct { 97ad30f8e7SGabor Kovesdan int mode; 98ad30f8e7SGabor Kovesdan #define MODE_JIS2004 1 99ad30f8e7SGabor Kovesdan } _MSKanjiEncodingInfo; 100ad30f8e7SGabor Kovesdan 101ad30f8e7SGabor Kovesdan #define _CEI_TO_EI(_cei_) (&(_cei_)->ei) 102ad30f8e7SGabor Kovesdan #define _CEI_TO_STATE(_cei_, _func_) (_cei_)->states.s_##_func_ 103ad30f8e7SGabor Kovesdan 104ad30f8e7SGabor Kovesdan #define _FUNCNAME(m) _citrus_MSKanji_##m 105ad30f8e7SGabor Kovesdan #define _ENCODING_INFO _MSKanjiEncodingInfo 106ad30f8e7SGabor Kovesdan #define _ENCODING_STATE _MSKanjiState 107ad30f8e7SGabor Kovesdan #define _ENCODING_MB_CUR_MAX(_ei_) 2 108ad30f8e7SGabor Kovesdan #define _ENCODING_IS_STATE_DEPENDENT 0 109ad30f8e7SGabor Kovesdan #define _STATE_NEEDS_EXPLICIT_INIT(_ps_) 0 110ad30f8e7SGabor Kovesdan 111ad30f8e7SGabor Kovesdan 112ad30f8e7SGabor Kovesdan static bool 113ad30f8e7SGabor Kovesdan _mskanji1(int c) 114ad30f8e7SGabor Kovesdan { 115ad30f8e7SGabor Kovesdan 116ad30f8e7SGabor Kovesdan return ((c >= 0x81 && c <= 0x9f) || (c >= 0xe0 && c <= 0xfc)); 117ad30f8e7SGabor Kovesdan } 118ad30f8e7SGabor Kovesdan 119ad30f8e7SGabor Kovesdan static bool 120ad30f8e7SGabor Kovesdan _mskanji2(int c) 121ad30f8e7SGabor Kovesdan { 122ad30f8e7SGabor Kovesdan 123ad30f8e7SGabor Kovesdan return ((c >= 0x40 && c <= 0x7e) || (c >= 0x80 && c <= 0xfc)); 124ad30f8e7SGabor Kovesdan } 125ad30f8e7SGabor Kovesdan 126ad30f8e7SGabor Kovesdan static __inline void 127ad30f8e7SGabor Kovesdan /*ARGSUSED*/ 128ad30f8e7SGabor Kovesdan _citrus_MSKanji_init_state(_MSKanjiEncodingInfo * __restrict ei __unused, 129ad30f8e7SGabor Kovesdan _MSKanjiState * __restrict s) 130ad30f8e7SGabor Kovesdan { 131ad30f8e7SGabor Kovesdan 132ad30f8e7SGabor Kovesdan s->chlen = 0; 133ad30f8e7SGabor Kovesdan } 134ad30f8e7SGabor Kovesdan 135b61949ddSDimitry Andric #if 0 136ad30f8e7SGabor Kovesdan static __inline void 137ad30f8e7SGabor Kovesdan /*ARGSUSED*/ 138ad30f8e7SGabor Kovesdan _citrus_MSKanji_pack_state(_MSKanjiEncodingInfo * __restrict ei __unused, 139ad30f8e7SGabor Kovesdan void * __restrict pspriv, const _MSKanjiState * __restrict s) 140ad30f8e7SGabor Kovesdan { 141ad30f8e7SGabor Kovesdan 142ad30f8e7SGabor Kovesdan memcpy(pspriv, (const void *)s, sizeof(*s)); 143ad30f8e7SGabor Kovesdan } 144ad30f8e7SGabor Kovesdan 145ad30f8e7SGabor Kovesdan static __inline void 146ad30f8e7SGabor Kovesdan /*ARGSUSED*/ 147ad30f8e7SGabor Kovesdan _citrus_MSKanji_unpack_state(_MSKanjiEncodingInfo * __restrict ei __unused, 148ad30f8e7SGabor Kovesdan _MSKanjiState * __restrict s, const void * __restrict pspriv) 149ad30f8e7SGabor Kovesdan { 150ad30f8e7SGabor Kovesdan 151ad30f8e7SGabor Kovesdan memcpy((void *)s, pspriv, sizeof(*s)); 152ad30f8e7SGabor Kovesdan } 153b61949ddSDimitry Andric #endif 154ad30f8e7SGabor Kovesdan 155ad30f8e7SGabor Kovesdan static int 156ad30f8e7SGabor Kovesdan /*ARGSUSED*/ 157ad30f8e7SGabor Kovesdan _citrus_MSKanji_mbrtowc_priv(_MSKanjiEncodingInfo * __restrict ei, 1581243a98eSTijl Coosemans wchar_t * __restrict pwc, char ** __restrict s, size_t n, 159ad30f8e7SGabor Kovesdan _MSKanjiState * __restrict psenc, size_t * __restrict nresult) 160ad30f8e7SGabor Kovesdan { 1611243a98eSTijl Coosemans char *s0; 162ad30f8e7SGabor Kovesdan wchar_t wchar; 163ad30f8e7SGabor Kovesdan int chlenbak, len; 164ad30f8e7SGabor Kovesdan 165ad30f8e7SGabor Kovesdan s0 = *s; 166ad30f8e7SGabor Kovesdan 167ad30f8e7SGabor Kovesdan if (s0 == NULL) { 168ad30f8e7SGabor Kovesdan _citrus_MSKanji_init_state(ei, psenc); 169ad30f8e7SGabor Kovesdan *nresult = 0; /* state independent */ 170ad30f8e7SGabor Kovesdan return (0); 171ad30f8e7SGabor Kovesdan } 172ad30f8e7SGabor Kovesdan 173ad30f8e7SGabor Kovesdan chlenbak = psenc->chlen; 174ad30f8e7SGabor Kovesdan 175ad30f8e7SGabor Kovesdan /* make sure we have the first byte in the buffer */ 176ad30f8e7SGabor Kovesdan switch (psenc->chlen) { 177ad30f8e7SGabor Kovesdan case 0: 178ad30f8e7SGabor Kovesdan if (n < 1) 179ad30f8e7SGabor Kovesdan goto restart; 180ad30f8e7SGabor Kovesdan psenc->ch[0] = *s0++; 181ad30f8e7SGabor Kovesdan psenc->chlen = 1; 182ad30f8e7SGabor Kovesdan n--; 183ad30f8e7SGabor Kovesdan break; 184ad30f8e7SGabor Kovesdan case 1: 185ad30f8e7SGabor Kovesdan break; 186ad30f8e7SGabor Kovesdan default: 187ad30f8e7SGabor Kovesdan /* illegal state */ 188ad30f8e7SGabor Kovesdan goto encoding_error; 189ad30f8e7SGabor Kovesdan } 190ad30f8e7SGabor Kovesdan 191ad30f8e7SGabor Kovesdan len = _mskanji1(psenc->ch[0] & 0xff) ? 2 : 1; 192ad30f8e7SGabor Kovesdan while (psenc->chlen < len) { 193ad30f8e7SGabor Kovesdan if (n < 1) 194ad30f8e7SGabor Kovesdan goto restart; 195ad30f8e7SGabor Kovesdan psenc->ch[psenc->chlen] = *s0++; 196ad30f8e7SGabor Kovesdan psenc->chlen++; 197ad30f8e7SGabor Kovesdan n--; 198ad30f8e7SGabor Kovesdan } 199ad30f8e7SGabor Kovesdan 200ad30f8e7SGabor Kovesdan *s = s0; 201ad30f8e7SGabor Kovesdan 202ad30f8e7SGabor Kovesdan switch (len) { 203ad30f8e7SGabor Kovesdan case 1: 204ad30f8e7SGabor Kovesdan wchar = psenc->ch[0] & 0xff; 205ad30f8e7SGabor Kovesdan break; 206ad30f8e7SGabor Kovesdan case 2: 207ad30f8e7SGabor Kovesdan if (!_mskanji2(psenc->ch[1] & 0xff)) 208ad30f8e7SGabor Kovesdan goto encoding_error; 209ad30f8e7SGabor Kovesdan wchar = ((psenc->ch[0] & 0xff) << 8) | (psenc->ch[1] & 0xff); 210ad30f8e7SGabor Kovesdan break; 211ad30f8e7SGabor Kovesdan default: 212ad30f8e7SGabor Kovesdan /* illegal state */ 213ad30f8e7SGabor Kovesdan goto encoding_error; 214ad30f8e7SGabor Kovesdan } 215ad30f8e7SGabor Kovesdan 216ad30f8e7SGabor Kovesdan psenc->chlen = 0; 217ad30f8e7SGabor Kovesdan 218ad30f8e7SGabor Kovesdan if (pwc) 219ad30f8e7SGabor Kovesdan *pwc = wchar; 220ad30f8e7SGabor Kovesdan *nresult = wchar ? len - chlenbak : 0; 221ad30f8e7SGabor Kovesdan return (0); 222ad30f8e7SGabor Kovesdan 223ad30f8e7SGabor Kovesdan encoding_error: 224ad30f8e7SGabor Kovesdan psenc->chlen = 0; 225ad30f8e7SGabor Kovesdan *nresult = (size_t)-1; 226ad30f8e7SGabor Kovesdan return (EILSEQ); 227ad30f8e7SGabor Kovesdan 228ad30f8e7SGabor Kovesdan restart: 229ad30f8e7SGabor Kovesdan *nresult = (size_t)-2; 230ad30f8e7SGabor Kovesdan *s = s0; 231ad30f8e7SGabor Kovesdan return (0); 232ad30f8e7SGabor Kovesdan } 233ad30f8e7SGabor Kovesdan 234ad30f8e7SGabor Kovesdan 235ad30f8e7SGabor Kovesdan static int 236ad30f8e7SGabor Kovesdan _citrus_MSKanji_wcrtomb_priv(_MSKanjiEncodingInfo * __restrict ei __unused, 237ad30f8e7SGabor Kovesdan char * __restrict s, size_t n, wchar_t wc, 238ad30f8e7SGabor Kovesdan _MSKanjiState * __restrict psenc __unused, size_t * __restrict nresult) 239ad30f8e7SGabor Kovesdan { 240ad30f8e7SGabor Kovesdan int ret; 241ad30f8e7SGabor Kovesdan 242ad30f8e7SGabor Kovesdan /* check invalid sequence */ 243ad30f8e7SGabor Kovesdan if (wc & ~0xffff) { 244ad30f8e7SGabor Kovesdan ret = EILSEQ; 245ad30f8e7SGabor Kovesdan goto err; 246ad30f8e7SGabor Kovesdan } 247ad30f8e7SGabor Kovesdan 248ad30f8e7SGabor Kovesdan if (wc & 0xff00) { 249ad30f8e7SGabor Kovesdan if (n < 2) { 250ad30f8e7SGabor Kovesdan ret = E2BIG; 251ad30f8e7SGabor Kovesdan goto err; 252ad30f8e7SGabor Kovesdan } 253ad30f8e7SGabor Kovesdan 254ad30f8e7SGabor Kovesdan s[0] = (wc >> 8) & 0xff; 255ad30f8e7SGabor Kovesdan s[1] = wc & 0xff; 256ad30f8e7SGabor Kovesdan if (!_mskanji1(s[0] & 0xff) || !_mskanji2(s[1] & 0xff)) { 257ad30f8e7SGabor Kovesdan ret = EILSEQ; 258ad30f8e7SGabor Kovesdan goto err; 259ad30f8e7SGabor Kovesdan } 260ad30f8e7SGabor Kovesdan 261ad30f8e7SGabor Kovesdan *nresult = 2; 262ad30f8e7SGabor Kovesdan return (0); 263ad30f8e7SGabor Kovesdan } else { 264ad30f8e7SGabor Kovesdan if (n < 1) { 265ad30f8e7SGabor Kovesdan ret = E2BIG; 266ad30f8e7SGabor Kovesdan goto err; 267ad30f8e7SGabor Kovesdan } 268ad30f8e7SGabor Kovesdan 269ad30f8e7SGabor Kovesdan s[0] = wc & 0xff; 270ad30f8e7SGabor Kovesdan if (_mskanji1(s[0] & 0xff)) { 271ad30f8e7SGabor Kovesdan ret = EILSEQ; 272ad30f8e7SGabor Kovesdan goto err; 273ad30f8e7SGabor Kovesdan } 274ad30f8e7SGabor Kovesdan 275ad30f8e7SGabor Kovesdan *nresult = 1; 276ad30f8e7SGabor Kovesdan return (0); 277ad30f8e7SGabor Kovesdan } 278ad30f8e7SGabor Kovesdan 279ad30f8e7SGabor Kovesdan err: 280ad30f8e7SGabor Kovesdan *nresult = (size_t)-1; 281ad30f8e7SGabor Kovesdan return (ret); 282ad30f8e7SGabor Kovesdan } 283ad30f8e7SGabor Kovesdan 284ad30f8e7SGabor Kovesdan 285ad30f8e7SGabor Kovesdan static __inline int 286ad30f8e7SGabor Kovesdan /*ARGSUSED*/ 287ad30f8e7SGabor Kovesdan _citrus_MSKanji_stdenc_wctocs(_MSKanjiEncodingInfo * __restrict ei, 288ad30f8e7SGabor Kovesdan _csid_t * __restrict csid, _index_t * __restrict idx, wchar_t wc) 289ad30f8e7SGabor Kovesdan { 290ad30f8e7SGabor Kovesdan _index_t col, row; 291ad30f8e7SGabor Kovesdan int offset; 292ad30f8e7SGabor Kovesdan 293ad30f8e7SGabor Kovesdan if ((_wc_t)wc < 0x80) { 294ad30f8e7SGabor Kovesdan /* ISO-646 */ 295ad30f8e7SGabor Kovesdan *csid = 0; 296ad30f8e7SGabor Kovesdan *idx = (_index_t)wc; 297ad30f8e7SGabor Kovesdan } else if ((_wc_t)wc < 0x100) { 298ad30f8e7SGabor Kovesdan /* KANA */ 299ad30f8e7SGabor Kovesdan *csid = 1; 300ad30f8e7SGabor Kovesdan *idx = (_index_t)wc & 0x7F; 301ad30f8e7SGabor Kovesdan } else { 302ad30f8e7SGabor Kovesdan /* Kanji (containing Gaiji zone) */ 303ad30f8e7SGabor Kovesdan /* 304ad30f8e7SGabor Kovesdan * 94^2 zone (contains a part of Gaiji (0xED40 - 0xEEFC)): 305ad30f8e7SGabor Kovesdan * 0x8140 - 0x817E -> 0x2121 - 0x215F 306ad30f8e7SGabor Kovesdan * 0x8180 - 0x819E -> 0x2160 - 0x217E 307ad30f8e7SGabor Kovesdan * 0x819F - 0x81FC -> 0x2221 - 0x227E 308ad30f8e7SGabor Kovesdan * 309ad30f8e7SGabor Kovesdan * 0x8240 - 0x827E -> 0x2321 - 0x235F 310ad30f8e7SGabor Kovesdan * ... 311ad30f8e7SGabor Kovesdan * 0x9F9F - 0x9FFc -> 0x5E21 - 0x5E7E 312ad30f8e7SGabor Kovesdan * 313ad30f8e7SGabor Kovesdan * 0xE040 - 0xE07E -> 0x5F21 - 0x5F5F 314ad30f8e7SGabor Kovesdan * ... 315ad30f8e7SGabor Kovesdan * 0xEF9F - 0xEFFC -> 0x7E21 - 0x7E7E 316ad30f8e7SGabor Kovesdan * 317ad30f8e7SGabor Kovesdan * extended Gaiji zone: 318ad30f8e7SGabor Kovesdan * 0xF040 - 0xFCFC 319ad30f8e7SGabor Kovesdan * 320ad30f8e7SGabor Kovesdan * JIS X0213-plane2: 321ad30f8e7SGabor Kovesdan * 0xF040 - 0xF09E -> 0x2121 - 0x217E 322ad30f8e7SGabor Kovesdan * 0xF140 - 0xF19E -> 0x2321 - 0x237E 323ad30f8e7SGabor Kovesdan * ... 324ad30f8e7SGabor Kovesdan * 0xF240 - 0xF29E -> 0x2521 - 0x257E 325ad30f8e7SGabor Kovesdan * 326ad30f8e7SGabor Kovesdan * 0xF09F - 0xF0FC -> 0x2821 - 0x287E 327ad30f8e7SGabor Kovesdan * 0xF29F - 0xF2FC -> 0x2C21 - 0x2C7E 328ad30f8e7SGabor Kovesdan * ... 329ad30f8e7SGabor Kovesdan * 0xF44F - 0xF49E -> 0x2F21 - 0x2F7E 330ad30f8e7SGabor Kovesdan * 331ad30f8e7SGabor Kovesdan * 0xF49F - 0xF4FC -> 0x6E21 - 0x6E7E 332ad30f8e7SGabor Kovesdan * ... 333ad30f8e7SGabor Kovesdan * 0xFC9F - 0xFCFC -> 0x7E21 - 0x7E7E 334ad30f8e7SGabor Kovesdan */ 335ad30f8e7SGabor Kovesdan row = ((_wc_t)wc >> 8) & 0xFF; 336ad30f8e7SGabor Kovesdan col = (_wc_t)wc & 0xFF; 337ad30f8e7SGabor Kovesdan if (!_mskanji1(row) || !_mskanji2(col)) 338ad30f8e7SGabor Kovesdan return (EILSEQ); 339ad30f8e7SGabor Kovesdan if ((ei->mode & MODE_JIS2004) == 0 || row < 0xF0) { 340ad30f8e7SGabor Kovesdan *csid = 2; 341ad30f8e7SGabor Kovesdan offset = 0x81; 342ad30f8e7SGabor Kovesdan } else { 343ad30f8e7SGabor Kovesdan *csid = 3; 344ad30f8e7SGabor Kovesdan if ((_wc_t)wc <= 0xF49E) { 345ad30f8e7SGabor Kovesdan offset = (_wc_t)wc >= 0xF29F || 346ad30f8e7SGabor Kovesdan ((_wc_t)wc >= 0xF09F && 347ad30f8e7SGabor Kovesdan (_wc_t)wc <= 0xF0FC) ? 0xED : 0xF0; 348ad30f8e7SGabor Kovesdan } else 349ad30f8e7SGabor Kovesdan offset = 0xCE; 350ad30f8e7SGabor Kovesdan } 351ad30f8e7SGabor Kovesdan row -= offset; 352ad30f8e7SGabor Kovesdan if (row >= 0x5F) 353ad30f8e7SGabor Kovesdan row -= 0x40; 354ad30f8e7SGabor Kovesdan row = row * 2 + 0x21; 355ad30f8e7SGabor Kovesdan col -= 0x1F; 356ad30f8e7SGabor Kovesdan if (col >= 0x61) 357ad30f8e7SGabor Kovesdan col -= 1; 358ad30f8e7SGabor Kovesdan if (col > 0x7E) { 359ad30f8e7SGabor Kovesdan row += 1; 360ad30f8e7SGabor Kovesdan col -= 0x5E; 361ad30f8e7SGabor Kovesdan } 362ad30f8e7SGabor Kovesdan *idx = ((_index_t)row << 8) | col; 363ad30f8e7SGabor Kovesdan } 364ad30f8e7SGabor Kovesdan 365ad30f8e7SGabor Kovesdan return (0); 366ad30f8e7SGabor Kovesdan } 367ad30f8e7SGabor Kovesdan 368ad30f8e7SGabor Kovesdan static __inline int 369ad30f8e7SGabor Kovesdan /*ARGSUSED*/ 370ad30f8e7SGabor Kovesdan _citrus_MSKanji_stdenc_cstowc(_MSKanjiEncodingInfo * __restrict ei, 371ad30f8e7SGabor Kovesdan wchar_t * __restrict wc, _csid_t csid, _index_t idx) 372ad30f8e7SGabor Kovesdan { 373ad30f8e7SGabor Kovesdan uint32_t col, row; 374ad30f8e7SGabor Kovesdan int offset; 375ad30f8e7SGabor Kovesdan 376ad30f8e7SGabor Kovesdan switch (csid) { 377ad30f8e7SGabor Kovesdan case 0: 378ad30f8e7SGabor Kovesdan /* ISO-646 */ 379ad30f8e7SGabor Kovesdan if (idx >= 0x80) 380ad30f8e7SGabor Kovesdan return (EILSEQ); 381ad30f8e7SGabor Kovesdan *wc = (wchar_t)idx; 382ad30f8e7SGabor Kovesdan break; 383ad30f8e7SGabor Kovesdan case 1: 384ad30f8e7SGabor Kovesdan /* kana */ 385ad30f8e7SGabor Kovesdan if (idx >= 0x80) 386ad30f8e7SGabor Kovesdan return (EILSEQ); 387ad30f8e7SGabor Kovesdan *wc = (wchar_t)idx + 0x80; 388ad30f8e7SGabor Kovesdan break; 389ad30f8e7SGabor Kovesdan case 3: 390ad30f8e7SGabor Kovesdan if ((ei->mode & MODE_JIS2004) == 0) 391ad30f8e7SGabor Kovesdan return (EILSEQ); 392ad30f8e7SGabor Kovesdan /*FALLTHROUGH*/ 393ad30f8e7SGabor Kovesdan case 2: 394ad30f8e7SGabor Kovesdan /* kanji */ 395ad30f8e7SGabor Kovesdan row = (idx >> 8); 396ad30f8e7SGabor Kovesdan if (row < 0x21) 397ad30f8e7SGabor Kovesdan return (EILSEQ); 398ad30f8e7SGabor Kovesdan if (csid == 3) { 399ad30f8e7SGabor Kovesdan if (row <= 0x2F) 400ad30f8e7SGabor Kovesdan offset = (row == 0x22 || row >= 0x26) ? 401ad30f8e7SGabor Kovesdan 0xED : 0xF0; 402ad30f8e7SGabor Kovesdan else if (row >= 0x4D && row <= 0x7E) 403ad30f8e7SGabor Kovesdan offset = 0xCE; 404ad30f8e7SGabor Kovesdan else 405ad30f8e7SGabor Kovesdan return (EILSEQ); 406ad30f8e7SGabor Kovesdan } else { 407ad30f8e7SGabor Kovesdan if (row > 0x97) 408ad30f8e7SGabor Kovesdan return (EILSEQ); 409ad30f8e7SGabor Kovesdan offset = (row < 0x5F) ? 0x81 : 0xC1; 410ad30f8e7SGabor Kovesdan } 411ad30f8e7SGabor Kovesdan col = idx & 0xFF; 412ad30f8e7SGabor Kovesdan if (col < 0x21 || col > 0x7E) 413ad30f8e7SGabor Kovesdan return (EILSEQ); 414ad30f8e7SGabor Kovesdan row -= 0x21; col -= 0x21; 415ad30f8e7SGabor Kovesdan if ((row & 1) == 0) { 416ad30f8e7SGabor Kovesdan col += 0x40; 417ad30f8e7SGabor Kovesdan if (col >= 0x7F) 418ad30f8e7SGabor Kovesdan col += 1; 419ad30f8e7SGabor Kovesdan } else 420ad30f8e7SGabor Kovesdan col += 0x9F; 421ad30f8e7SGabor Kovesdan row = row / 2 + offset; 422ad30f8e7SGabor Kovesdan *wc = ((wchar_t)row << 8) | col; 423ad30f8e7SGabor Kovesdan break; 424ad30f8e7SGabor Kovesdan default: 425ad30f8e7SGabor Kovesdan return (EILSEQ); 426ad30f8e7SGabor Kovesdan } 427ad30f8e7SGabor Kovesdan 428ad30f8e7SGabor Kovesdan return (0); 429ad30f8e7SGabor Kovesdan } 430ad30f8e7SGabor Kovesdan 431ad30f8e7SGabor Kovesdan static __inline int 432ad30f8e7SGabor Kovesdan /*ARGSUSED*/ 433ad30f8e7SGabor Kovesdan _citrus_MSKanji_stdenc_get_state_desc_generic(_MSKanjiEncodingInfo * __restrict ei __unused, 434ad30f8e7SGabor Kovesdan _MSKanjiState * __restrict psenc, int * __restrict rstate) 435ad30f8e7SGabor Kovesdan { 436ad30f8e7SGabor Kovesdan 437ad30f8e7SGabor Kovesdan *rstate = (psenc->chlen == 0) ? _STDENC_SDGEN_INITIAL : 438ad30f8e7SGabor Kovesdan _STDENC_SDGEN_INCOMPLETE_CHAR; 439ad30f8e7SGabor Kovesdan return (0); 440ad30f8e7SGabor Kovesdan } 441ad30f8e7SGabor Kovesdan 442ad30f8e7SGabor Kovesdan static int 443ad30f8e7SGabor Kovesdan /*ARGSUSED*/ 444ad30f8e7SGabor Kovesdan _citrus_MSKanji_encoding_module_init(_MSKanjiEncodingInfo * __restrict ei, 445ad30f8e7SGabor Kovesdan const void * __restrict var, size_t lenvar) 446ad30f8e7SGabor Kovesdan { 447ad30f8e7SGabor Kovesdan const char *p; 448ad30f8e7SGabor Kovesdan 449ad30f8e7SGabor Kovesdan p = var; 450ad30f8e7SGabor Kovesdan memset((void *)ei, 0, sizeof(*ei)); 451ad30f8e7SGabor Kovesdan while (lenvar > 0) { 452ad30f8e7SGabor Kovesdan switch (_bcs_toupper(*p)) { 453ad30f8e7SGabor Kovesdan case 'J': 454ad30f8e7SGabor Kovesdan MATCH(JIS2004, ei->mode |= MODE_JIS2004); 455ad30f8e7SGabor Kovesdan break; 456ad30f8e7SGabor Kovesdan } 457ad30f8e7SGabor Kovesdan ++p; 458ad30f8e7SGabor Kovesdan --lenvar; 459ad30f8e7SGabor Kovesdan } 460ad30f8e7SGabor Kovesdan 461ad30f8e7SGabor Kovesdan return (0); 462ad30f8e7SGabor Kovesdan } 463ad30f8e7SGabor Kovesdan 464ad30f8e7SGabor Kovesdan static void 465ad30f8e7SGabor Kovesdan _citrus_MSKanji_encoding_module_uninit(_MSKanjiEncodingInfo *ei __unused) 466ad30f8e7SGabor Kovesdan { 467ad30f8e7SGabor Kovesdan 468ad30f8e7SGabor Kovesdan } 469ad30f8e7SGabor Kovesdan 470ad30f8e7SGabor Kovesdan /* ---------------------------------------------------------------------- 471ad30f8e7SGabor Kovesdan * public interface for stdenc 472ad30f8e7SGabor Kovesdan */ 473ad30f8e7SGabor Kovesdan 474ad30f8e7SGabor Kovesdan _CITRUS_STDENC_DECLS(MSKanji); 475ad30f8e7SGabor Kovesdan _CITRUS_STDENC_DEF_OPS(MSKanji); 476ad30f8e7SGabor Kovesdan 477ad30f8e7SGabor Kovesdan #include "citrus_stdenc_template.h" 478