1ad30f8e7SGabor Kovesdan /* $FreeBSD$ */ 29ca40936STijl Coosemans /* $NetBSD: citrus_iso2022.c,v 1.20 2010/12/07 22:01:45 joerg Exp $ */ 3ad30f8e7SGabor Kovesdan 4ad30f8e7SGabor Kovesdan /*- 5*5e53a4f9SPedro F. Giffuni * SPDX-License-Identifier: BSD-2-Clause 6*5e53a4f9SPedro F. Giffuni * 7ad30f8e7SGabor Kovesdan * Copyright (c)1999, 2002 Citrus Project, 8ad30f8e7SGabor Kovesdan * All rights reserved. 9ad30f8e7SGabor Kovesdan * 10ad30f8e7SGabor Kovesdan * Redistribution and use in source and binary forms, with or without 11ad30f8e7SGabor Kovesdan * modification, are permitted provided that the following conditions 12ad30f8e7SGabor Kovesdan * are met: 13ad30f8e7SGabor Kovesdan * 1. Redistributions of source code must retain the above copyright 14ad30f8e7SGabor Kovesdan * notice, this list of conditions and the following disclaimer. 15ad30f8e7SGabor Kovesdan * 2. Redistributions in binary form must reproduce the above copyright 16ad30f8e7SGabor Kovesdan * notice, this list of conditions and the following disclaimer in the 17ad30f8e7SGabor Kovesdan * documentation and/or other materials provided with the distribution. 18ad30f8e7SGabor Kovesdan * 19ad30f8e7SGabor Kovesdan * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 20ad30f8e7SGabor Kovesdan * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 21ad30f8e7SGabor Kovesdan * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 22ad30f8e7SGabor Kovesdan * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 23ad30f8e7SGabor Kovesdan * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 24ad30f8e7SGabor Kovesdan * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 25ad30f8e7SGabor Kovesdan * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 26ad30f8e7SGabor Kovesdan * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 27ad30f8e7SGabor Kovesdan * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 28ad30f8e7SGabor Kovesdan * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 29ad30f8e7SGabor Kovesdan * SUCH DAMAGE. 30ad30f8e7SGabor Kovesdan * 31ad30f8e7SGabor Kovesdan * $Citrus: xpg4dl/FreeBSD/lib/libc/locale/iso2022.c,v 1.23 2001/06/21 01:51:44 yamt Exp $ 32ad30f8e7SGabor Kovesdan */ 33ad30f8e7SGabor Kovesdan 34ad30f8e7SGabor Kovesdan #include <sys/cdefs.h> 35ad30f8e7SGabor Kovesdan #include <sys/types.h> 36ad30f8e7SGabor Kovesdan 37ad30f8e7SGabor Kovesdan #include <assert.h> 38ad30f8e7SGabor Kovesdan #include <errno.h> 39ad30f8e7SGabor Kovesdan #include <limits.h> 40ad30f8e7SGabor Kovesdan #include <stdbool.h> 41ad30f8e7SGabor Kovesdan #include <stddef.h> 42ad30f8e7SGabor Kovesdan #include <stdio.h> 43ad30f8e7SGabor Kovesdan #include <stdlib.h> 44ad30f8e7SGabor Kovesdan #include <string.h> 45ad30f8e7SGabor Kovesdan #include <wchar.h> 46ad30f8e7SGabor Kovesdan 47ad30f8e7SGabor Kovesdan #include "citrus_namespace.h" 48ad30f8e7SGabor Kovesdan #include "citrus_types.h" 49ad30f8e7SGabor Kovesdan #include "citrus_module.h" 50ad30f8e7SGabor Kovesdan #include "citrus_stdenc.h" 51ad30f8e7SGabor Kovesdan #include "citrus_iso2022.h" 52ad30f8e7SGabor Kovesdan 53ad30f8e7SGabor Kovesdan 54ad30f8e7SGabor Kovesdan /* ---------------------------------------------------------------------- 55ad30f8e7SGabor Kovesdan * private stuffs used by templates 56ad30f8e7SGabor Kovesdan */ 57ad30f8e7SGabor Kovesdan 58ad30f8e7SGabor Kovesdan 59ad30f8e7SGabor Kovesdan /* 60ad30f8e7SGabor Kovesdan * wchar_t mappings: 61ad30f8e7SGabor Kovesdan * ASCII (ESC ( B) 00000000 00000000 00000000 0xxxxxxx 62ad30f8e7SGabor Kovesdan * iso-8859-1 (ESC , A) 00000000 00000000 00000000 1xxxxxxx 63ad30f8e7SGabor Kovesdan * 94 charset (ESC ( F) 0fffffff 00000000 00000000 0xxxxxxx 64ad30f8e7SGabor Kovesdan * 94 charset (ESC ( M F) 0fffffff 1mmmmmmm 00000000 0xxxxxxx 65ad30f8e7SGabor Kovesdan * 96 charset (ESC , F) 0fffffff 00000000 00000000 1xxxxxxx 66ad30f8e7SGabor Kovesdan * 96 charset (ESC , M F) 0fffffff 1mmmmmmm 00000000 1xxxxxxx 67ad30f8e7SGabor Kovesdan * 94x94 charset (ESC $ ( F) 0fffffff 00000000 0xxxxxxx 0xxxxxxx 68ad30f8e7SGabor Kovesdan * 96x96 charset (ESC $ , F) 0fffffff 00000000 0xxxxxxx 1xxxxxxx 69ad30f8e7SGabor Kovesdan * 94x94 charset (ESC & V ESC $ ( F) 70ad30f8e7SGabor Kovesdan * 0fffffff 1vvvvvvv 0xxxxxxx 0xxxxxxx 71ad30f8e7SGabor Kovesdan * 94x94x94 charset (ESC $ ( F) 0fffffff 0xxxxxxx 0xxxxxxx 0xxxxxxx 72ad30f8e7SGabor Kovesdan * 96x96x96 charset (ESC $ , F) 0fffffff 0xxxxxxx 0xxxxxxx 1xxxxxxx 73ad30f8e7SGabor Kovesdan * reserved for UCS4 co-existence (UCS4 is 31bit encoding thanks to mohta bit) 74ad30f8e7SGabor Kovesdan * 1xxxxxxx xxxxxxxx xxxxxxxx xxxxxxxx 75ad30f8e7SGabor Kovesdan */ 76ad30f8e7SGabor Kovesdan 77ad30f8e7SGabor Kovesdan #define CS94 (0U) 78ad30f8e7SGabor Kovesdan #define CS96 (1U) 79ad30f8e7SGabor Kovesdan #define CS94MULTI (2U) 80ad30f8e7SGabor Kovesdan #define CS96MULTI (3U) 81ad30f8e7SGabor Kovesdan 82ad30f8e7SGabor Kovesdan typedef struct { 83ad30f8e7SGabor Kovesdan unsigned char type; 849ca40936STijl Coosemans unsigned char final; 859ca40936STijl Coosemans unsigned char interm; 86ad30f8e7SGabor Kovesdan unsigned char vers; 87ad30f8e7SGabor Kovesdan } _ISO2022Charset; 88ad30f8e7SGabor Kovesdan 89ad30f8e7SGabor Kovesdan static const _ISO2022Charset ascii = { CS94, 'B', '\0', '\0' }; 90ad30f8e7SGabor Kovesdan static const _ISO2022Charset iso88591 = { CS96, 'A', '\0', '\0' }; 91ad30f8e7SGabor Kovesdan 92ad30f8e7SGabor Kovesdan typedef struct { 93ad30f8e7SGabor Kovesdan _ISO2022Charset g[4]; 94ad30f8e7SGabor Kovesdan /* need 3 bits to hold -1, 0, ..., 3 */ 95ad30f8e7SGabor Kovesdan int gl:3, 96ad30f8e7SGabor Kovesdan gr:3, 97ad30f8e7SGabor Kovesdan singlegl:3, 98ad30f8e7SGabor Kovesdan singlegr:3; 99ad30f8e7SGabor Kovesdan char ch[7]; /* longest escape sequence (ESC & V ESC $ ( F) */ 100ad30f8e7SGabor Kovesdan size_t chlen; 101ad30f8e7SGabor Kovesdan int flags; 102ad30f8e7SGabor Kovesdan #define _ISO2022STATE_FLAG_INITIALIZED 1 103ad30f8e7SGabor Kovesdan } _ISO2022State; 104ad30f8e7SGabor Kovesdan 105ad30f8e7SGabor Kovesdan typedef struct { 106ad30f8e7SGabor Kovesdan _ISO2022Charset *recommend[4]; 107ad30f8e7SGabor Kovesdan size_t recommendsize[4]; 108ad30f8e7SGabor Kovesdan _ISO2022Charset initg[4]; 109ad30f8e7SGabor Kovesdan int maxcharset; 110ad30f8e7SGabor Kovesdan int flags; 111ad30f8e7SGabor Kovesdan #define F_8BIT 0x0001 112ad30f8e7SGabor Kovesdan #define F_NOOLD 0x0002 113ad30f8e7SGabor Kovesdan #define F_SI 0x0010 /*0F*/ 114ad30f8e7SGabor Kovesdan #define F_SO 0x0020 /*0E*/ 115ad30f8e7SGabor Kovesdan #define F_LS0 0x0010 /*0F*/ 116ad30f8e7SGabor Kovesdan #define F_LS1 0x0020 /*0E*/ 117ad30f8e7SGabor Kovesdan #define F_LS2 0x0040 /*ESC n*/ 118ad30f8e7SGabor Kovesdan #define F_LS3 0x0080 /*ESC o*/ 119ad30f8e7SGabor Kovesdan #define F_LS1R 0x0100 /*ESC ~*/ 120ad30f8e7SGabor Kovesdan #define F_LS2R 0x0200 /*ESC }*/ 121ad30f8e7SGabor Kovesdan #define F_LS3R 0x0400 /*ESC |*/ 122ad30f8e7SGabor Kovesdan #define F_SS2 0x0800 /*ESC N*/ 123ad30f8e7SGabor Kovesdan #define F_SS3 0x1000 /*ESC O*/ 124ad30f8e7SGabor Kovesdan #define F_SS2R 0x2000 /*8E*/ 125ad30f8e7SGabor Kovesdan #define F_SS3R 0x4000 /*8F*/ 126ad30f8e7SGabor Kovesdan } _ISO2022EncodingInfo; 127ad30f8e7SGabor Kovesdan 128ad30f8e7SGabor Kovesdan #define _CEI_TO_EI(_cei_) (&(_cei_)->ei) 129ad30f8e7SGabor Kovesdan #define _CEI_TO_STATE(_cei_, _func_) (_cei_)->states.s_##_func_ 130ad30f8e7SGabor Kovesdan 131ad30f8e7SGabor Kovesdan #define _FUNCNAME(m) _citrus_ISO2022_##m 132ad30f8e7SGabor Kovesdan #define _ENCODING_INFO _ISO2022EncodingInfo 133ad30f8e7SGabor Kovesdan #define _ENCODING_STATE _ISO2022State 134ad30f8e7SGabor Kovesdan #define _ENCODING_MB_CUR_MAX(_ei_) MB_LEN_MAX 135ad30f8e7SGabor Kovesdan #define _ENCODING_IS_STATE_DEPENDENT 1 136ad30f8e7SGabor Kovesdan #define _STATE_NEEDS_EXPLICIT_INIT(_ps_) \ 137ad30f8e7SGabor Kovesdan (!((_ps_)->flags & _ISO2022STATE_FLAG_INITIALIZED)) 138ad30f8e7SGabor Kovesdan 139ad30f8e7SGabor Kovesdan 140ad30f8e7SGabor Kovesdan #define _ISO2022INVALID (wchar_t)-1 141ad30f8e7SGabor Kovesdan 142ad30f8e7SGabor Kovesdan static __inline bool isc0(__uint8_t x) 143ad30f8e7SGabor Kovesdan { 144ad30f8e7SGabor Kovesdan 145ad30f8e7SGabor Kovesdan return ((x & 0x1f) == x); 146ad30f8e7SGabor Kovesdan } 147ad30f8e7SGabor Kovesdan 148ad30f8e7SGabor Kovesdan static __inline bool isc1(__uint8_t x) 149ad30f8e7SGabor Kovesdan { 150ad30f8e7SGabor Kovesdan 151ad30f8e7SGabor Kovesdan return (0x80 <= x && x <= 0x9f); 152ad30f8e7SGabor Kovesdan } 153ad30f8e7SGabor Kovesdan 154ad30f8e7SGabor Kovesdan static __inline bool iscntl(__uint8_t x) 155ad30f8e7SGabor Kovesdan { 156ad30f8e7SGabor Kovesdan 157ad30f8e7SGabor Kovesdan return (isc0(x) || isc1(x) || x == 0x7f); 158ad30f8e7SGabor Kovesdan } 159ad30f8e7SGabor Kovesdan 160ad30f8e7SGabor Kovesdan static __inline bool is94(__uint8_t x) 161ad30f8e7SGabor Kovesdan { 162ad30f8e7SGabor Kovesdan 163ad30f8e7SGabor Kovesdan return (0x21 <= x && x <= 0x7e); 164ad30f8e7SGabor Kovesdan } 165ad30f8e7SGabor Kovesdan 166ad30f8e7SGabor Kovesdan static __inline bool is96(__uint8_t x) 167ad30f8e7SGabor Kovesdan { 168ad30f8e7SGabor Kovesdan 169ad30f8e7SGabor Kovesdan return (0x20 <= x && x <= 0x7f); 170ad30f8e7SGabor Kovesdan } 171ad30f8e7SGabor Kovesdan 172ad30f8e7SGabor Kovesdan static __inline bool isecma(__uint8_t x) 173ad30f8e7SGabor Kovesdan { 174ad30f8e7SGabor Kovesdan 175ad30f8e7SGabor Kovesdan return (0x30 <= x && x <= 0x7f); 176ad30f8e7SGabor Kovesdan } 177ad30f8e7SGabor Kovesdan 178ad30f8e7SGabor Kovesdan static __inline bool isinterm(__uint8_t x) 179ad30f8e7SGabor Kovesdan { 180ad30f8e7SGabor Kovesdan 181ad30f8e7SGabor Kovesdan return (0x20 <= x && x <= 0x2f); 182ad30f8e7SGabor Kovesdan } 183ad30f8e7SGabor Kovesdan 184ad30f8e7SGabor Kovesdan static __inline bool isthree(__uint8_t x) 185ad30f8e7SGabor Kovesdan { 186ad30f8e7SGabor Kovesdan 187ad30f8e7SGabor Kovesdan return (0x60 <= x && x <= 0x6f); 188ad30f8e7SGabor Kovesdan } 189ad30f8e7SGabor Kovesdan 190ad30f8e7SGabor Kovesdan static __inline int 191ad30f8e7SGabor Kovesdan getcs(const char * __restrict p, _ISO2022Charset * __restrict cs) 192ad30f8e7SGabor Kovesdan { 193ad30f8e7SGabor Kovesdan 194ad30f8e7SGabor Kovesdan if (!strncmp(p, "94$", 3) && p[3] && !p[4]) { 195ad30f8e7SGabor Kovesdan cs->final = (unsigned char)(p[3] & 0xff); 196ad30f8e7SGabor Kovesdan cs->interm = '\0'; 197ad30f8e7SGabor Kovesdan cs->vers = '\0'; 198ad30f8e7SGabor Kovesdan cs->type = CS94MULTI; 199ad30f8e7SGabor Kovesdan } else if (!strncmp(p, "96$", 3) && p[3] && !p[4]) { 200ad30f8e7SGabor Kovesdan cs->final = (unsigned char)(p[3] & 0xff); 201ad30f8e7SGabor Kovesdan cs->interm = '\0'; 202ad30f8e7SGabor Kovesdan cs->vers = '\0'; 203ad30f8e7SGabor Kovesdan cs->type = CS96MULTI; 204ad30f8e7SGabor Kovesdan } else if (!strncmp(p, "94", 2) && p[2] && !p[3]) { 205ad30f8e7SGabor Kovesdan cs->final = (unsigned char)(p[2] & 0xff); 206ad30f8e7SGabor Kovesdan cs->interm = '\0'; 207ad30f8e7SGabor Kovesdan cs->vers = '\0'; 208ad30f8e7SGabor Kovesdan cs->type = CS94; 209ad30f8e7SGabor Kovesdan } else if (!strncmp(p, "96", 2) && p[2] && !p[3]) { 210ad30f8e7SGabor Kovesdan cs->final = (unsigned char )(p[2] & 0xff); 211ad30f8e7SGabor Kovesdan cs->interm = '\0'; 212ad30f8e7SGabor Kovesdan cs->vers = '\0'; 213ad30f8e7SGabor Kovesdan cs->type = CS96; 214ad30f8e7SGabor Kovesdan } else 215ad30f8e7SGabor Kovesdan return (1); 216ad30f8e7SGabor Kovesdan 217ad30f8e7SGabor Kovesdan return (0); 218ad30f8e7SGabor Kovesdan } 219ad30f8e7SGabor Kovesdan 220ad30f8e7SGabor Kovesdan 221ad30f8e7SGabor Kovesdan #define _NOTMATCH 0 222ad30f8e7SGabor Kovesdan #define _MATCH 1 223ad30f8e7SGabor Kovesdan #define _PARSEFAIL 2 224ad30f8e7SGabor Kovesdan 225ad30f8e7SGabor Kovesdan static __inline int 226ad30f8e7SGabor Kovesdan get_recommend(_ISO2022EncodingInfo * __restrict ei, 227ad30f8e7SGabor Kovesdan const char * __restrict token) 228ad30f8e7SGabor Kovesdan { 229ad30f8e7SGabor Kovesdan _ISO2022Charset cs, *p; 230ad30f8e7SGabor Kovesdan int i; 231ad30f8e7SGabor Kovesdan 232ad30f8e7SGabor Kovesdan if (!strchr("0123", token[0]) || token[1] != '=') 233ad30f8e7SGabor Kovesdan return (_NOTMATCH); 234ad30f8e7SGabor Kovesdan 235ad30f8e7SGabor Kovesdan if (getcs(&token[2], &cs) == 0) 236ad30f8e7SGabor Kovesdan ; 237ad30f8e7SGabor Kovesdan else if (!strcmp(&token[2], "94")) { 238ad30f8e7SGabor Kovesdan cs.final = (unsigned char)(token[4]); 239ad30f8e7SGabor Kovesdan cs.interm = '\0'; 240ad30f8e7SGabor Kovesdan cs.vers = '\0'; 241ad30f8e7SGabor Kovesdan cs.type = CS94; 242ad30f8e7SGabor Kovesdan } else if (!strcmp(&token[2], "96")) { 243ad30f8e7SGabor Kovesdan cs.final = (unsigned char)(token[4]); 244ad30f8e7SGabor Kovesdan cs.interm = '\0'; 245ad30f8e7SGabor Kovesdan cs.vers = '\0'; 246ad30f8e7SGabor Kovesdan cs.type = CS96; 247ad30f8e7SGabor Kovesdan } else if (!strcmp(&token[2], "94$")) { 248ad30f8e7SGabor Kovesdan cs.final = (unsigned char)(token[5]); 249ad30f8e7SGabor Kovesdan cs.interm = '\0'; 250ad30f8e7SGabor Kovesdan cs.vers = '\0'; 251ad30f8e7SGabor Kovesdan cs.type = CS94MULTI; 252ad30f8e7SGabor Kovesdan } else if (!strcmp(&token[2], "96$")) { 253ad30f8e7SGabor Kovesdan cs.final = (unsigned char)(token[5]); 254ad30f8e7SGabor Kovesdan cs.interm = '\0'; 255ad30f8e7SGabor Kovesdan cs.vers = '\0'; 256ad30f8e7SGabor Kovesdan cs.type = CS96MULTI; 257ad30f8e7SGabor Kovesdan } else 258ad30f8e7SGabor Kovesdan return (_PARSEFAIL); 259ad30f8e7SGabor Kovesdan 260ad30f8e7SGabor Kovesdan i = token[0] - '0'; 261ad30f8e7SGabor Kovesdan if (!ei->recommend[i]) 262ad30f8e7SGabor Kovesdan ei->recommend[i] = malloc(sizeof(_ISO2022Charset)); 263ad30f8e7SGabor Kovesdan else { 264efa8af7cSPedro F. Giffuni p = reallocarray(ei->recommend[i], ei->recommendsize[i] + 1, 265efa8af7cSPedro F. Giffuni sizeof(_ISO2022Charset)); 266ad30f8e7SGabor Kovesdan if (!p) 267ad30f8e7SGabor Kovesdan return (_PARSEFAIL); 268ad30f8e7SGabor Kovesdan ei->recommend[i] = p; 269ad30f8e7SGabor Kovesdan } 270ad30f8e7SGabor Kovesdan if (!ei->recommend[i]) 271ad30f8e7SGabor Kovesdan return (_PARSEFAIL); 272ad30f8e7SGabor Kovesdan ei->recommendsize[i]++; 273ad30f8e7SGabor Kovesdan 274ad30f8e7SGabor Kovesdan (ei->recommend[i] + (ei->recommendsize[i] - 1))->final = cs.final; 275ad30f8e7SGabor Kovesdan (ei->recommend[i] + (ei->recommendsize[i] - 1))->interm = cs.interm; 276ad30f8e7SGabor Kovesdan (ei->recommend[i] + (ei->recommendsize[i] - 1))->vers = cs.vers; 277ad30f8e7SGabor Kovesdan (ei->recommend[i] + (ei->recommendsize[i] - 1))->type = cs.type; 278ad30f8e7SGabor Kovesdan 279ad30f8e7SGabor Kovesdan return (_MATCH); 280ad30f8e7SGabor Kovesdan } 281ad30f8e7SGabor Kovesdan 282ad30f8e7SGabor Kovesdan static __inline int 283ad30f8e7SGabor Kovesdan get_initg(_ISO2022EncodingInfo * __restrict ei, 284ad30f8e7SGabor Kovesdan const char * __restrict token) 285ad30f8e7SGabor Kovesdan { 286ad30f8e7SGabor Kovesdan _ISO2022Charset cs; 287ad30f8e7SGabor Kovesdan 288ad30f8e7SGabor Kovesdan if (strncmp("INIT", &token[0], 4) || 289ad30f8e7SGabor Kovesdan !strchr("0123", token[4]) || 290ad30f8e7SGabor Kovesdan token[5] != '=') 291ad30f8e7SGabor Kovesdan return (_NOTMATCH); 292ad30f8e7SGabor Kovesdan 293ad30f8e7SGabor Kovesdan if (getcs(&token[6], &cs) != 0) 294ad30f8e7SGabor Kovesdan return (_PARSEFAIL); 295ad30f8e7SGabor Kovesdan 296ad30f8e7SGabor Kovesdan ei->initg[token[4] - '0'].type = cs.type; 297ad30f8e7SGabor Kovesdan ei->initg[token[4] - '0'].final = cs.final; 298ad30f8e7SGabor Kovesdan ei->initg[token[4] - '0'].interm = cs.interm; 299ad30f8e7SGabor Kovesdan ei->initg[token[4] - '0'].vers = cs.vers; 300ad30f8e7SGabor Kovesdan 301ad30f8e7SGabor Kovesdan return (_MATCH); 302ad30f8e7SGabor Kovesdan } 303ad30f8e7SGabor Kovesdan 304ad30f8e7SGabor Kovesdan static __inline int 305ad30f8e7SGabor Kovesdan get_max(_ISO2022EncodingInfo * __restrict ei, 306ad30f8e7SGabor Kovesdan const char * __restrict token) 307ad30f8e7SGabor Kovesdan { 308ad30f8e7SGabor Kovesdan if (!strcmp(token, "MAX1")) 309ad30f8e7SGabor Kovesdan ei->maxcharset = 1; 310ad30f8e7SGabor Kovesdan else if (!strcmp(token, "MAX2")) 311ad30f8e7SGabor Kovesdan ei->maxcharset = 2; 312ad30f8e7SGabor Kovesdan else if (!strcmp(token, "MAX3")) 313ad30f8e7SGabor Kovesdan ei->maxcharset = 3; 314ad30f8e7SGabor Kovesdan else 315ad30f8e7SGabor Kovesdan return (_NOTMATCH); 316ad30f8e7SGabor Kovesdan 317ad30f8e7SGabor Kovesdan return (_MATCH); 318ad30f8e7SGabor Kovesdan } 319ad30f8e7SGabor Kovesdan 320ad30f8e7SGabor Kovesdan 321ad30f8e7SGabor Kovesdan static __inline int 322ad30f8e7SGabor Kovesdan get_flags(_ISO2022EncodingInfo * __restrict ei, 323ad30f8e7SGabor Kovesdan const char * __restrict token) 324ad30f8e7SGabor Kovesdan { 325ad30f8e7SGabor Kovesdan static struct { 326ad30f8e7SGabor Kovesdan const char *tag; 327ad30f8e7SGabor Kovesdan int flag; 328ad30f8e7SGabor Kovesdan } const tags[] = { 329ad30f8e7SGabor Kovesdan { "DUMMY", 0 }, 330ad30f8e7SGabor Kovesdan { "8BIT", F_8BIT }, 331ad30f8e7SGabor Kovesdan { "NOOLD", F_NOOLD }, 332ad30f8e7SGabor Kovesdan { "SI", F_SI }, 333ad30f8e7SGabor Kovesdan { "SO", F_SO }, 334ad30f8e7SGabor Kovesdan { "LS0", F_LS0 }, 335ad30f8e7SGabor Kovesdan { "LS1", F_LS1 }, 336ad30f8e7SGabor Kovesdan { "LS2", F_LS2 }, 337ad30f8e7SGabor Kovesdan { "LS3", F_LS3 }, 338ad30f8e7SGabor Kovesdan { "LS1R", F_LS1R }, 339ad30f8e7SGabor Kovesdan { "LS2R", F_LS2R }, 340ad30f8e7SGabor Kovesdan { "LS3R", F_LS3R }, 341ad30f8e7SGabor Kovesdan { "SS2", F_SS2 }, 342ad30f8e7SGabor Kovesdan { "SS3", F_SS3 }, 343ad30f8e7SGabor Kovesdan { "SS2R", F_SS2R }, 344ad30f8e7SGabor Kovesdan { "SS3R", F_SS3R }, 345ad30f8e7SGabor Kovesdan { NULL, 0 } 346ad30f8e7SGabor Kovesdan }; 347ad30f8e7SGabor Kovesdan int i; 348ad30f8e7SGabor Kovesdan 349ad30f8e7SGabor Kovesdan for (i = 0; tags[i].tag; i++) 350ad30f8e7SGabor Kovesdan if (!strcmp(token, tags[i].tag)) { 351ad30f8e7SGabor Kovesdan ei->flags |= tags[i].flag; 352ad30f8e7SGabor Kovesdan return (_MATCH); 353ad30f8e7SGabor Kovesdan } 354ad30f8e7SGabor Kovesdan 355ad30f8e7SGabor Kovesdan return (_NOTMATCH); 356ad30f8e7SGabor Kovesdan } 357ad30f8e7SGabor Kovesdan 358ad30f8e7SGabor Kovesdan 359ad30f8e7SGabor Kovesdan static __inline int 360ad30f8e7SGabor Kovesdan _citrus_ISO2022_parse_variable(_ISO2022EncodingInfo * __restrict ei, 361ad30f8e7SGabor Kovesdan const void * __restrict var, size_t lenvar __unused) 362ad30f8e7SGabor Kovesdan { 363ad30f8e7SGabor Kovesdan char const *e, *v; 364ad30f8e7SGabor Kovesdan char buf[20]; 365ad30f8e7SGabor Kovesdan size_t len; 366ad30f8e7SGabor Kovesdan int i, ret; 367ad30f8e7SGabor Kovesdan 368ad30f8e7SGabor Kovesdan /* 369ad30f8e7SGabor Kovesdan * parse VARIABLE section. 370ad30f8e7SGabor Kovesdan */ 371ad30f8e7SGabor Kovesdan 372ad30f8e7SGabor Kovesdan if (!var) 373ad30f8e7SGabor Kovesdan return (EFTYPE); 374ad30f8e7SGabor Kovesdan 375ad30f8e7SGabor Kovesdan v = (const char *) var; 376ad30f8e7SGabor Kovesdan 377ad30f8e7SGabor Kovesdan /* initialize structure */ 378ad30f8e7SGabor Kovesdan ei->maxcharset = 0; 379ad30f8e7SGabor Kovesdan for (i = 0; i < 4; i++) { 380ad30f8e7SGabor Kovesdan ei->recommend[i] = NULL; 381ad30f8e7SGabor Kovesdan ei->recommendsize[i] = 0; 382ad30f8e7SGabor Kovesdan } 383ad30f8e7SGabor Kovesdan ei->flags = 0; 384ad30f8e7SGabor Kovesdan 385ad30f8e7SGabor Kovesdan while (*v) { 386ad30f8e7SGabor Kovesdan while (*v == ' ' || *v == '\t') 387ad30f8e7SGabor Kovesdan ++v; 388ad30f8e7SGabor Kovesdan 389ad30f8e7SGabor Kovesdan /* find the token */ 390ad30f8e7SGabor Kovesdan e = v; 391ad30f8e7SGabor Kovesdan while (*e && *e != ' ' && *e != '\t') 392ad30f8e7SGabor Kovesdan ++e; 393ad30f8e7SGabor Kovesdan 394ad30f8e7SGabor Kovesdan len = e - v; 395ad30f8e7SGabor Kovesdan if (len == 0) 396ad30f8e7SGabor Kovesdan break; 397ad30f8e7SGabor Kovesdan if (len >= sizeof(buf)) 398ad30f8e7SGabor Kovesdan goto parsefail; 399ad30f8e7SGabor Kovesdan snprintf(buf, sizeof(buf), "%.*s", (int)len, v); 400ad30f8e7SGabor Kovesdan 401ad30f8e7SGabor Kovesdan if ((ret = get_recommend(ei, buf)) != _NOTMATCH) 402ad30f8e7SGabor Kovesdan ; 403ad30f8e7SGabor Kovesdan else if ((ret = get_initg(ei, buf)) != _NOTMATCH) 404ad30f8e7SGabor Kovesdan ; 405ad30f8e7SGabor Kovesdan else if ((ret = get_max(ei, buf)) != _NOTMATCH) 406ad30f8e7SGabor Kovesdan ; 407ad30f8e7SGabor Kovesdan else if ((ret = get_flags(ei, buf)) != _NOTMATCH) 408ad30f8e7SGabor Kovesdan ; 409ad30f8e7SGabor Kovesdan else 410ad30f8e7SGabor Kovesdan ret = _PARSEFAIL; 411ad30f8e7SGabor Kovesdan if (ret == _PARSEFAIL) 412ad30f8e7SGabor Kovesdan goto parsefail; 413ad30f8e7SGabor Kovesdan v = e; 414ad30f8e7SGabor Kovesdan 415ad30f8e7SGabor Kovesdan } 416ad30f8e7SGabor Kovesdan 417ad30f8e7SGabor Kovesdan return (0); 418ad30f8e7SGabor Kovesdan 419ad30f8e7SGabor Kovesdan parsefail: 420ad30f8e7SGabor Kovesdan free(ei->recommend[0]); 421ad30f8e7SGabor Kovesdan free(ei->recommend[1]); 422ad30f8e7SGabor Kovesdan free(ei->recommend[2]); 423ad30f8e7SGabor Kovesdan free(ei->recommend[3]); 424ad30f8e7SGabor Kovesdan 425ad30f8e7SGabor Kovesdan return (EFTYPE); 426ad30f8e7SGabor Kovesdan } 427ad30f8e7SGabor Kovesdan 428ad30f8e7SGabor Kovesdan static __inline void 429ad30f8e7SGabor Kovesdan /*ARGSUSED*/ 430ad30f8e7SGabor Kovesdan _citrus_ISO2022_init_state(_ISO2022EncodingInfo * __restrict ei, 431ad30f8e7SGabor Kovesdan _ISO2022State * __restrict s) 432ad30f8e7SGabor Kovesdan { 433ad30f8e7SGabor Kovesdan int i; 434ad30f8e7SGabor Kovesdan 435ad30f8e7SGabor Kovesdan memset(s, 0, sizeof(*s)); 436ad30f8e7SGabor Kovesdan s->gl = 0; 437ad30f8e7SGabor Kovesdan s->gr = (ei->flags & F_8BIT) ? 1 : -1; 438ad30f8e7SGabor Kovesdan 439ad30f8e7SGabor Kovesdan for (i = 0; i < 4; i++) 440ad30f8e7SGabor Kovesdan if (ei->initg[i].final) { 441ad30f8e7SGabor Kovesdan s->g[i].type = ei->initg[i].type; 442ad30f8e7SGabor Kovesdan s->g[i].final = ei->initg[i].final; 443ad30f8e7SGabor Kovesdan s->g[i].interm = ei->initg[i].interm; 444ad30f8e7SGabor Kovesdan } 445ad30f8e7SGabor Kovesdan s->singlegl = s->singlegr = -1; 446ad30f8e7SGabor Kovesdan s->flags |= _ISO2022STATE_FLAG_INITIALIZED; 447ad30f8e7SGabor Kovesdan } 448ad30f8e7SGabor Kovesdan 449b61949ddSDimitry Andric #if 0 450ad30f8e7SGabor Kovesdan static __inline void 451ad30f8e7SGabor Kovesdan /*ARGSUSED*/ 452ad30f8e7SGabor Kovesdan _citrus_ISO2022_pack_state(_ISO2022EncodingInfo * __restrict ei __unused, 453ad30f8e7SGabor Kovesdan void * __restrict pspriv, const _ISO2022State * __restrict s) 454ad30f8e7SGabor Kovesdan { 455ad30f8e7SGabor Kovesdan 456ad30f8e7SGabor Kovesdan memcpy(pspriv, (const void *)s, sizeof(*s)); 457ad30f8e7SGabor Kovesdan } 458ad30f8e7SGabor Kovesdan 459ad30f8e7SGabor Kovesdan static __inline void 460ad30f8e7SGabor Kovesdan /*ARGSUSED*/ 461ad30f8e7SGabor Kovesdan _citrus_ISO2022_unpack_state(_ISO2022EncodingInfo * __restrict ei __unused, 462ad30f8e7SGabor Kovesdan _ISO2022State * __restrict s, const void * __restrict pspriv) 463ad30f8e7SGabor Kovesdan { 464ad30f8e7SGabor Kovesdan 465ad30f8e7SGabor Kovesdan memcpy((void *)s, pspriv, sizeof(*s)); 466ad30f8e7SGabor Kovesdan } 467b61949ddSDimitry Andric #endif 468ad30f8e7SGabor Kovesdan 469ad30f8e7SGabor Kovesdan static int 470ad30f8e7SGabor Kovesdan /*ARGSUSED*/ 471ad30f8e7SGabor Kovesdan _citrus_ISO2022_encoding_module_init(_ISO2022EncodingInfo * __restrict ei, 472ad30f8e7SGabor Kovesdan const void * __restrict var, size_t lenvar) 473ad30f8e7SGabor Kovesdan { 474ad30f8e7SGabor Kovesdan 475ad30f8e7SGabor Kovesdan return (_citrus_ISO2022_parse_variable(ei, var, lenvar)); 476ad30f8e7SGabor Kovesdan } 477ad30f8e7SGabor Kovesdan 478ad30f8e7SGabor Kovesdan static void 479ad30f8e7SGabor Kovesdan /*ARGSUSED*/ 480ad30f8e7SGabor Kovesdan _citrus_ISO2022_encoding_module_uninit(_ISO2022EncodingInfo *ei __unused) 481ad30f8e7SGabor Kovesdan { 482ad30f8e7SGabor Kovesdan 483ad30f8e7SGabor Kovesdan } 484ad30f8e7SGabor Kovesdan 485ad30f8e7SGabor Kovesdan #define ESC '\033' 486ad30f8e7SGabor Kovesdan #define ECMA -1 487ad30f8e7SGabor Kovesdan #define INTERM -2 488ad30f8e7SGabor Kovesdan #define OECMA -3 489ad30f8e7SGabor Kovesdan static const struct seqtable { 490ad30f8e7SGabor Kovesdan int type; 491ad30f8e7SGabor Kovesdan int csoff; 492ad30f8e7SGabor Kovesdan int finaloff; 493ad30f8e7SGabor Kovesdan int intermoff; 494ad30f8e7SGabor Kovesdan int versoff; 495ad30f8e7SGabor Kovesdan int len; 496ad30f8e7SGabor Kovesdan int chars[10]; 497ad30f8e7SGabor Kovesdan } seqtable[] = { 498ad30f8e7SGabor Kovesdan /* G0 94MULTI special */ 499ad30f8e7SGabor Kovesdan { CS94MULTI, -1, 2, -1, -1, 3, { ESC, '$', OECMA }, }, 500ad30f8e7SGabor Kovesdan /* G0 94MULTI special with version identification */ 501ad30f8e7SGabor Kovesdan { CS94MULTI, -1, 5, -1, 2, 6, { ESC, '&', ECMA, ESC, '$', OECMA }, }, 502ad30f8e7SGabor Kovesdan /* G? 94 */ 503ad30f8e7SGabor Kovesdan { CS94, 1, 2, -1, -1, 3, { ESC, CS94, ECMA, }, }, 504ad30f8e7SGabor Kovesdan /* G? 94 with 2nd intermediate char */ 505ad30f8e7SGabor Kovesdan { CS94, 1, 3, 2, -1, 4, { ESC, CS94, INTERM, ECMA, }, }, 506ad30f8e7SGabor Kovesdan /* G? 96 */ 507ad30f8e7SGabor Kovesdan { CS96, 1, 2, -1, -1, 3, { ESC, CS96, ECMA, }, }, 508ad30f8e7SGabor Kovesdan /* G? 96 with 2nd intermediate char */ 509ad30f8e7SGabor Kovesdan { CS96, 1, 3, 2, -1, 4, { ESC, CS96, INTERM, ECMA, }, }, 510ad30f8e7SGabor Kovesdan /* G? 94MULTI */ 511ad30f8e7SGabor Kovesdan { CS94MULTI, 2, 3, -1, -1, 4, { ESC, '$', CS94, ECMA, }, }, 512ad30f8e7SGabor Kovesdan /* G? 96MULTI */ 513ad30f8e7SGabor Kovesdan { CS96MULTI, 2, 3, -1, -1, 4, { ESC, '$', CS96, ECMA, }, }, 514ad30f8e7SGabor Kovesdan /* G? 94MULTI with version specification */ 515ad30f8e7SGabor Kovesdan { CS94MULTI, 5, 6, -1, 2, 7, { ESC, '&', ECMA, ESC, '$', CS94, ECMA, }, }, 516ad30f8e7SGabor Kovesdan /* LS2/3 */ 517ad30f8e7SGabor Kovesdan { -1, -1, -1, -1, -1, 2, { ESC, 'n', }, }, 518ad30f8e7SGabor Kovesdan { -1, -1, -1, -1, -1, 2, { ESC, 'o', }, }, 519ad30f8e7SGabor Kovesdan /* LS1/2/3R */ 520ad30f8e7SGabor Kovesdan { -1, -1, -1, -1, -1, 2, { ESC, '~', }, }, 521ad30f8e7SGabor Kovesdan { -1, -1, -1, -1, -1, 2, { ESC, /*{*/ '}', }, }, 522ad30f8e7SGabor Kovesdan { -1, -1, -1, -1, -1, 2, { ESC, '|', }, }, 523ad30f8e7SGabor Kovesdan /* SS2/3 */ 524ad30f8e7SGabor Kovesdan { -1, -1, -1, -1, -1, 2, { ESC, 'N', }, }, 525ad30f8e7SGabor Kovesdan { -1, -1, -1, -1, -1, 2, { ESC, 'O', }, }, 526ad30f8e7SGabor Kovesdan /* end of records */ 527ad30f8e7SGabor Kovesdan // { 0, } 528ad30f8e7SGabor Kovesdan { 0, 0, 0, 0, 0, 0, { ESC, 0, }, } 529ad30f8e7SGabor Kovesdan }; 530ad30f8e7SGabor Kovesdan 531ad30f8e7SGabor Kovesdan static int 532ad30f8e7SGabor Kovesdan seqmatch(const char * __restrict s, size_t n, 533ad30f8e7SGabor Kovesdan const struct seqtable * __restrict sp) 534ad30f8e7SGabor Kovesdan { 535ad30f8e7SGabor Kovesdan const int *p; 536ad30f8e7SGabor Kovesdan 537ad30f8e7SGabor Kovesdan p = sp->chars; 538ad30f8e7SGabor Kovesdan while ((size_t)(p - sp->chars) < n && p - sp->chars < sp->len) { 539ad30f8e7SGabor Kovesdan switch (*p) { 540ad30f8e7SGabor Kovesdan case ECMA: 541ad30f8e7SGabor Kovesdan if (!isecma(*s)) 542ad30f8e7SGabor Kovesdan goto terminate; 543ad30f8e7SGabor Kovesdan break; 544ad30f8e7SGabor Kovesdan case OECMA: 545ad30f8e7SGabor Kovesdan if (*s && strchr("@AB", *s)) 546ad30f8e7SGabor Kovesdan break; 547ad30f8e7SGabor Kovesdan else 548ad30f8e7SGabor Kovesdan goto terminate; 549ad30f8e7SGabor Kovesdan case INTERM: 550ad30f8e7SGabor Kovesdan if (!isinterm(*s)) 551ad30f8e7SGabor Kovesdan goto terminate; 552ad30f8e7SGabor Kovesdan break; 553ad30f8e7SGabor Kovesdan case CS94: 554ad30f8e7SGabor Kovesdan if (*s && strchr("()*+", *s)) 555ad30f8e7SGabor Kovesdan break; 556ad30f8e7SGabor Kovesdan else 557ad30f8e7SGabor Kovesdan goto terminate; 558ad30f8e7SGabor Kovesdan case CS96: 559ad30f8e7SGabor Kovesdan if (*s && strchr(",-./", *s)) 560ad30f8e7SGabor Kovesdan break; 561ad30f8e7SGabor Kovesdan else 562ad30f8e7SGabor Kovesdan goto terminate; 563ad30f8e7SGabor Kovesdan default: 564ad30f8e7SGabor Kovesdan if (*s != *p) 565ad30f8e7SGabor Kovesdan goto terminate; 566ad30f8e7SGabor Kovesdan break; 567ad30f8e7SGabor Kovesdan } 568ad30f8e7SGabor Kovesdan 569ad30f8e7SGabor Kovesdan p++; 570ad30f8e7SGabor Kovesdan s++; 571ad30f8e7SGabor Kovesdan } 572ad30f8e7SGabor Kovesdan 573ad30f8e7SGabor Kovesdan terminate: 574ad30f8e7SGabor Kovesdan return (p - sp->chars); 575ad30f8e7SGabor Kovesdan } 576ad30f8e7SGabor Kovesdan 577ad30f8e7SGabor Kovesdan static wchar_t 578ad30f8e7SGabor Kovesdan _ISO2022_sgetwchar(_ISO2022EncodingInfo * __restrict ei __unused, 5791243a98eSTijl Coosemans char * __restrict string, size_t n, char ** __restrict result, 580ad30f8e7SGabor Kovesdan _ISO2022State * __restrict psenc) 581ad30f8e7SGabor Kovesdan { 582ad30f8e7SGabor Kovesdan const struct seqtable *sp; 583ad30f8e7SGabor Kovesdan wchar_t wchar = 0; 584ad30f8e7SGabor Kovesdan int i, cur, nmatch; 585ad30f8e7SGabor Kovesdan 586ad30f8e7SGabor Kovesdan while (1) { 587ad30f8e7SGabor Kovesdan /* SI/SO */ 588ad30f8e7SGabor Kovesdan if (1 <= n && string[0] == '\017') { 589ad30f8e7SGabor Kovesdan psenc->gl = 0; 590ad30f8e7SGabor Kovesdan string++; 591ad30f8e7SGabor Kovesdan n--; 592ad30f8e7SGabor Kovesdan continue; 593ad30f8e7SGabor Kovesdan } 594ad30f8e7SGabor Kovesdan if (1 <= n && string[0] == '\016') { 595ad30f8e7SGabor Kovesdan psenc->gl = 1; 596ad30f8e7SGabor Kovesdan string++; 597ad30f8e7SGabor Kovesdan n--; 598ad30f8e7SGabor Kovesdan continue; 599ad30f8e7SGabor Kovesdan } 600ad30f8e7SGabor Kovesdan 601ad30f8e7SGabor Kovesdan /* SS2/3R */ 602ad30f8e7SGabor Kovesdan if (1 <= n && string[0] && strchr("\217\216", string[0])) { 603ad30f8e7SGabor Kovesdan psenc->singlegl = psenc->singlegr = 604ad30f8e7SGabor Kovesdan (string[0] - '\216') + 2; 605ad30f8e7SGabor Kovesdan string++; 606ad30f8e7SGabor Kovesdan n--; 607ad30f8e7SGabor Kovesdan continue; 608ad30f8e7SGabor Kovesdan } 609ad30f8e7SGabor Kovesdan 610ad30f8e7SGabor Kovesdan /* eat the letter if this is not ESC */ 611ad30f8e7SGabor Kovesdan if (1 <= n && string[0] != '\033') 612ad30f8e7SGabor Kovesdan break; 613ad30f8e7SGabor Kovesdan 614ad30f8e7SGabor Kovesdan /* look for a perfect match from escape sequences */ 615ad30f8e7SGabor Kovesdan for (sp = &seqtable[0]; sp->len; sp++) { 616ad30f8e7SGabor Kovesdan nmatch = seqmatch(string, n, sp); 617ad30f8e7SGabor Kovesdan if (sp->len == nmatch && n >= (size_t)(sp->len)) 618ad30f8e7SGabor Kovesdan break; 619ad30f8e7SGabor Kovesdan } 620ad30f8e7SGabor Kovesdan 621ad30f8e7SGabor Kovesdan if (!sp->len) 622ad30f8e7SGabor Kovesdan goto notseq; 623ad30f8e7SGabor Kovesdan 624ad30f8e7SGabor Kovesdan if (sp->type != -1) { 625ad30f8e7SGabor Kovesdan if (sp->csoff == -1) 626ad30f8e7SGabor Kovesdan i = 0; 627ad30f8e7SGabor Kovesdan else { 628ad30f8e7SGabor Kovesdan switch (sp->type) { 629ad30f8e7SGabor Kovesdan case CS94: 630ad30f8e7SGabor Kovesdan case CS94MULTI: 631ad30f8e7SGabor Kovesdan i = string[sp->csoff] - '('; 632ad30f8e7SGabor Kovesdan break; 633ad30f8e7SGabor Kovesdan case CS96: 634ad30f8e7SGabor Kovesdan case CS96MULTI: 635ad30f8e7SGabor Kovesdan i = string[sp->csoff] - ','; 636ad30f8e7SGabor Kovesdan break; 637ad30f8e7SGabor Kovesdan default: 638ad30f8e7SGabor Kovesdan return (_ISO2022INVALID); 639ad30f8e7SGabor Kovesdan } 640ad30f8e7SGabor Kovesdan } 641ad30f8e7SGabor Kovesdan psenc->g[i].type = sp->type; 642ad30f8e7SGabor Kovesdan psenc->g[i].final = '\0'; 643ad30f8e7SGabor Kovesdan psenc->g[i].interm = '\0'; 644ad30f8e7SGabor Kovesdan psenc->g[i].vers = '\0'; 645ad30f8e7SGabor Kovesdan /* sp->finaloff must not be -1 */ 646ad30f8e7SGabor Kovesdan if (sp->finaloff != -1) 647ad30f8e7SGabor Kovesdan psenc->g[i].final = string[sp->finaloff]; 648ad30f8e7SGabor Kovesdan if (sp->intermoff != -1) 649ad30f8e7SGabor Kovesdan psenc->g[i].interm = string[sp->intermoff]; 650ad30f8e7SGabor Kovesdan if (sp->versoff != -1) 651ad30f8e7SGabor Kovesdan psenc->g[i].vers = string[sp->versoff]; 652ad30f8e7SGabor Kovesdan 653ad30f8e7SGabor Kovesdan string += sp->len; 654ad30f8e7SGabor Kovesdan n -= sp->len; 655ad30f8e7SGabor Kovesdan continue; 656ad30f8e7SGabor Kovesdan } 657ad30f8e7SGabor Kovesdan 658ad30f8e7SGabor Kovesdan /* LS2/3 */ 659ad30f8e7SGabor Kovesdan if (2 <= n && string[0] == '\033' && 660ad30f8e7SGabor Kovesdan string[1] && strchr("no", string[1])) { 661ad30f8e7SGabor Kovesdan psenc->gl = string[1] - 'n' + 2; 662ad30f8e7SGabor Kovesdan string += 2; 663ad30f8e7SGabor Kovesdan n -= 2; 664ad30f8e7SGabor Kovesdan continue; 665ad30f8e7SGabor Kovesdan } 666ad30f8e7SGabor Kovesdan 667ad30f8e7SGabor Kovesdan /* LS1/2/3R */ 668ad30f8e7SGabor Kovesdan /* XXX: { for vi showmatch */ 669ad30f8e7SGabor Kovesdan if (2 <= n && string[0] == '\033' && 670ad30f8e7SGabor Kovesdan string[1] && strchr("~}|", string[1])) { 671ad30f8e7SGabor Kovesdan psenc->gr = 3 - (string[1] - '|'); 672ad30f8e7SGabor Kovesdan string += 2; 673ad30f8e7SGabor Kovesdan n -= 2; 674ad30f8e7SGabor Kovesdan continue; 675ad30f8e7SGabor Kovesdan } 676ad30f8e7SGabor Kovesdan 677ad30f8e7SGabor Kovesdan /* SS2/3 */ 678ad30f8e7SGabor Kovesdan if (2 <= n && string[0] == '\033' && string[1] && 679ad30f8e7SGabor Kovesdan strchr("NO", string[1])) { 680ad30f8e7SGabor Kovesdan psenc->singlegl = (string[1] - 'N') + 2; 681ad30f8e7SGabor Kovesdan string += 2; 682ad30f8e7SGabor Kovesdan n -= 2; 683ad30f8e7SGabor Kovesdan continue; 684ad30f8e7SGabor Kovesdan } 685ad30f8e7SGabor Kovesdan 686ad30f8e7SGabor Kovesdan notseq: 687ad30f8e7SGabor Kovesdan /* 688ad30f8e7SGabor Kovesdan * if we've got an unknown escape sequence, eat the ESC at the 689ad30f8e7SGabor Kovesdan * head. otherwise, wait till full escape sequence comes. 690ad30f8e7SGabor Kovesdan */ 691ad30f8e7SGabor Kovesdan for (sp = &seqtable[0]; sp->len; sp++) { 692ad30f8e7SGabor Kovesdan nmatch = seqmatch(string, n, sp); 693ad30f8e7SGabor Kovesdan if (!nmatch) 694ad30f8e7SGabor Kovesdan continue; 695ad30f8e7SGabor Kovesdan 696ad30f8e7SGabor Kovesdan /* 697ad30f8e7SGabor Kovesdan * if we are in the middle of escape sequence, 698ad30f8e7SGabor Kovesdan * we still need to wait for more characters to come 699ad30f8e7SGabor Kovesdan */ 700ad30f8e7SGabor Kovesdan if (n < (size_t)(sp->len)) { 701ad30f8e7SGabor Kovesdan if ((size_t)(nmatch) == n) { 702ad30f8e7SGabor Kovesdan if (result) 703ad30f8e7SGabor Kovesdan *result = string; 704ad30f8e7SGabor Kovesdan return (_ISO2022INVALID); 705ad30f8e7SGabor Kovesdan } 706ad30f8e7SGabor Kovesdan } else { 707ad30f8e7SGabor Kovesdan if (nmatch == sp->len) { 708ad30f8e7SGabor Kovesdan /* this case should not happen */ 709ad30f8e7SGabor Kovesdan goto eat; 710ad30f8e7SGabor Kovesdan } 711ad30f8e7SGabor Kovesdan } 712ad30f8e7SGabor Kovesdan } 713ad30f8e7SGabor Kovesdan 714ad30f8e7SGabor Kovesdan break; 715ad30f8e7SGabor Kovesdan } 716ad30f8e7SGabor Kovesdan 717ad30f8e7SGabor Kovesdan eat: 718ad30f8e7SGabor Kovesdan /* no letter to eat */ 719ad30f8e7SGabor Kovesdan if (n < 1) { 720ad30f8e7SGabor Kovesdan if (result) 721ad30f8e7SGabor Kovesdan *result = string; 722ad30f8e7SGabor Kovesdan return (_ISO2022INVALID); 723ad30f8e7SGabor Kovesdan } 724ad30f8e7SGabor Kovesdan 725ad30f8e7SGabor Kovesdan /* normal chars. always eat C0/C1 as is. */ 726ad30f8e7SGabor Kovesdan if (iscntl(*string & 0xff)) 727ad30f8e7SGabor Kovesdan cur = -1; 728ad30f8e7SGabor Kovesdan else if (*string & 0x80) 729ad30f8e7SGabor Kovesdan cur = (psenc->singlegr == -1) ? psenc->gr : psenc->singlegr; 730ad30f8e7SGabor Kovesdan else 731ad30f8e7SGabor Kovesdan cur = (psenc->singlegl == -1) ? psenc->gl : psenc->singlegl; 732ad30f8e7SGabor Kovesdan 733ad30f8e7SGabor Kovesdan if (cur == -1) { 734ad30f8e7SGabor Kovesdan asis: 735ad30f8e7SGabor Kovesdan wchar = *string++ & 0xff; 736ad30f8e7SGabor Kovesdan if (result) 737ad30f8e7SGabor Kovesdan *result = string; 738ad30f8e7SGabor Kovesdan /* reset single shift state */ 739ad30f8e7SGabor Kovesdan psenc->singlegr = psenc->singlegl = -1; 740ad30f8e7SGabor Kovesdan return (wchar); 741ad30f8e7SGabor Kovesdan } 742ad30f8e7SGabor Kovesdan 743ad30f8e7SGabor Kovesdan /* length error check */ 744ad30f8e7SGabor Kovesdan switch (psenc->g[cur].type) { 745ad30f8e7SGabor Kovesdan case CS94MULTI: 746ad30f8e7SGabor Kovesdan case CS96MULTI: 747ad30f8e7SGabor Kovesdan if (!isthree(psenc->g[cur].final)) { 748ad30f8e7SGabor Kovesdan if (2 <= n && 749ad30f8e7SGabor Kovesdan (string[0] & 0x80) == (string[1] & 0x80)) 750ad30f8e7SGabor Kovesdan break; 751ad30f8e7SGabor Kovesdan } else { 752ad30f8e7SGabor Kovesdan if (3 <= n && 753ad30f8e7SGabor Kovesdan (string[0] & 0x80) == (string[1] & 0x80) && 754ad30f8e7SGabor Kovesdan (string[0] & 0x80) == (string[2] & 0x80)) 755ad30f8e7SGabor Kovesdan break; 756ad30f8e7SGabor Kovesdan } 757ad30f8e7SGabor Kovesdan 758ad30f8e7SGabor Kovesdan /* we still need to wait for more characters to come */ 759ad30f8e7SGabor Kovesdan if (result) 760ad30f8e7SGabor Kovesdan *result = string; 761ad30f8e7SGabor Kovesdan return (_ISO2022INVALID); 762ad30f8e7SGabor Kovesdan 763ad30f8e7SGabor Kovesdan case CS94: 764ad30f8e7SGabor Kovesdan case CS96: 765ad30f8e7SGabor Kovesdan if (1 <= n) 766ad30f8e7SGabor Kovesdan break; 767ad30f8e7SGabor Kovesdan 768ad30f8e7SGabor Kovesdan /* we still need to wait for more characters to come */ 769ad30f8e7SGabor Kovesdan if (result) 770ad30f8e7SGabor Kovesdan *result = string; 771ad30f8e7SGabor Kovesdan return (_ISO2022INVALID); 772ad30f8e7SGabor Kovesdan } 773ad30f8e7SGabor Kovesdan 774ad30f8e7SGabor Kovesdan /* range check */ 775ad30f8e7SGabor Kovesdan switch (psenc->g[cur].type) { 776ad30f8e7SGabor Kovesdan case CS94: 777ad30f8e7SGabor Kovesdan if (!(is94(string[0] & 0x7f))) 778ad30f8e7SGabor Kovesdan goto asis; 779ad30f8e7SGabor Kovesdan case CS96: 780ad30f8e7SGabor Kovesdan if (!(is96(string[0] & 0x7f))) 781ad30f8e7SGabor Kovesdan goto asis; 782ad30f8e7SGabor Kovesdan break; 783ad30f8e7SGabor Kovesdan case CS94MULTI: 784ad30f8e7SGabor Kovesdan if (!(is94(string[0] & 0x7f) && is94(string[1] & 0x7f))) 785ad30f8e7SGabor Kovesdan goto asis; 786ad30f8e7SGabor Kovesdan break; 787ad30f8e7SGabor Kovesdan case CS96MULTI: 788ad30f8e7SGabor Kovesdan if (!(is96(string[0] & 0x7f) && is96(string[1] & 0x7f))) 789ad30f8e7SGabor Kovesdan goto asis; 790ad30f8e7SGabor Kovesdan break; 791ad30f8e7SGabor Kovesdan } 792ad30f8e7SGabor Kovesdan 793ad30f8e7SGabor Kovesdan /* extract the character. */ 794ad30f8e7SGabor Kovesdan switch (psenc->g[cur].type) { 795ad30f8e7SGabor Kovesdan case CS94: 796ad30f8e7SGabor Kovesdan /* special case for ASCII. */ 797ad30f8e7SGabor Kovesdan if (psenc->g[cur].final == 'B' && !psenc->g[cur].interm) { 798ad30f8e7SGabor Kovesdan wchar = *string++; 799ad30f8e7SGabor Kovesdan wchar &= 0x7f; 800ad30f8e7SGabor Kovesdan break; 801ad30f8e7SGabor Kovesdan } 802ad30f8e7SGabor Kovesdan wchar = psenc->g[cur].final; 803ad30f8e7SGabor Kovesdan wchar = (wchar << 8); 804ad30f8e7SGabor Kovesdan wchar |= (psenc->g[cur].interm ? (0x80 | psenc->g[cur].interm) : 0); 805ad30f8e7SGabor Kovesdan wchar = (wchar << 8); 806ad30f8e7SGabor Kovesdan wchar = (wchar << 8) | (*string++ & 0x7f); 807ad30f8e7SGabor Kovesdan break; 808ad30f8e7SGabor Kovesdan case CS96: 809ad30f8e7SGabor Kovesdan /* special case for ISO-8859-1. */ 810ad30f8e7SGabor Kovesdan if (psenc->g[cur].final == 'A' && !psenc->g[cur].interm) { 811ad30f8e7SGabor Kovesdan wchar = *string++; 812ad30f8e7SGabor Kovesdan wchar &= 0x7f; 813ad30f8e7SGabor Kovesdan wchar |= 0x80; 814ad30f8e7SGabor Kovesdan break; 815ad30f8e7SGabor Kovesdan } 816ad30f8e7SGabor Kovesdan wchar = psenc->g[cur].final; 817ad30f8e7SGabor Kovesdan wchar = (wchar << 8); 818ad30f8e7SGabor Kovesdan wchar |= (psenc->g[cur].interm ? (0x80 | psenc->g[cur].interm) : 0); 819ad30f8e7SGabor Kovesdan wchar = (wchar << 8); 820ad30f8e7SGabor Kovesdan wchar = (wchar << 8) | (*string++ & 0x7f); 821ad30f8e7SGabor Kovesdan wchar |= 0x80; 822ad30f8e7SGabor Kovesdan break; 823ad30f8e7SGabor Kovesdan case CS94MULTI: 824ad30f8e7SGabor Kovesdan case CS96MULTI: 825ad30f8e7SGabor Kovesdan wchar = psenc->g[cur].final; 826ad30f8e7SGabor Kovesdan wchar = (wchar << 8); 827ad30f8e7SGabor Kovesdan if (isthree(psenc->g[cur].final)) 828ad30f8e7SGabor Kovesdan wchar |= (*string++ & 0x7f); 829ad30f8e7SGabor Kovesdan wchar = (wchar << 8) | (*string++ & 0x7f); 830ad30f8e7SGabor Kovesdan wchar = (wchar << 8) | (*string++ & 0x7f); 831ad30f8e7SGabor Kovesdan if (psenc->g[cur].type == CS96MULTI) 832ad30f8e7SGabor Kovesdan wchar |= 0x80; 833ad30f8e7SGabor Kovesdan break; 834ad30f8e7SGabor Kovesdan } 835ad30f8e7SGabor Kovesdan 836ad30f8e7SGabor Kovesdan if (result) 837ad30f8e7SGabor Kovesdan *result = string; 838ad30f8e7SGabor Kovesdan /* reset single shift state */ 839ad30f8e7SGabor Kovesdan psenc->singlegr = psenc->singlegl = -1; 840ad30f8e7SGabor Kovesdan return (wchar); 841ad30f8e7SGabor Kovesdan } 842ad30f8e7SGabor Kovesdan 843ad30f8e7SGabor Kovesdan 844ad30f8e7SGabor Kovesdan 845ad30f8e7SGabor Kovesdan static int 846ad30f8e7SGabor Kovesdan _citrus_ISO2022_mbrtowc_priv(_ISO2022EncodingInfo * __restrict ei, 8471243a98eSTijl Coosemans wchar_t * __restrict pwc, char ** __restrict s, 848ad30f8e7SGabor Kovesdan size_t n, _ISO2022State * __restrict psenc, size_t * __restrict nresult) 849ad30f8e7SGabor Kovesdan { 8501243a98eSTijl Coosemans char *p, *result, *s0; 851ad30f8e7SGabor Kovesdan wchar_t wchar; 852ad30f8e7SGabor Kovesdan int c, chlenbak; 853ad30f8e7SGabor Kovesdan 854ad30f8e7SGabor Kovesdan if (*s == NULL) { 855ad30f8e7SGabor Kovesdan _citrus_ISO2022_init_state(ei, psenc); 856ad30f8e7SGabor Kovesdan *nresult = _ENCODING_IS_STATE_DEPENDENT; 857ad30f8e7SGabor Kovesdan return (0); 858ad30f8e7SGabor Kovesdan } 859ad30f8e7SGabor Kovesdan s0 = *s; 860ad30f8e7SGabor Kovesdan c = 0; 861ad30f8e7SGabor Kovesdan chlenbak = psenc->chlen; 862ad30f8e7SGabor Kovesdan 863ad30f8e7SGabor Kovesdan /* 864ad30f8e7SGabor Kovesdan * if we have something in buffer, use that. 865ad30f8e7SGabor Kovesdan * otherwise, skip here 866ad30f8e7SGabor Kovesdan */ 867ad30f8e7SGabor Kovesdan if (psenc->chlen > sizeof(psenc->ch)) { 868ad30f8e7SGabor Kovesdan /* illgeal state */ 869ad30f8e7SGabor Kovesdan _citrus_ISO2022_init_state(ei, psenc); 870ad30f8e7SGabor Kovesdan goto encoding_error; 871ad30f8e7SGabor Kovesdan } 872ad30f8e7SGabor Kovesdan if (psenc->chlen == 0) 873ad30f8e7SGabor Kovesdan goto emptybuf; 874ad30f8e7SGabor Kovesdan 875ad30f8e7SGabor Kovesdan /* buffer is not empty */ 876ad30f8e7SGabor Kovesdan p = psenc->ch; 877ad30f8e7SGabor Kovesdan while (psenc->chlen < sizeof(psenc->ch)) { 878ad30f8e7SGabor Kovesdan if (n > 0) { 879ad30f8e7SGabor Kovesdan psenc->ch[psenc->chlen++] = *s0++; 880ad30f8e7SGabor Kovesdan n--; 881ad30f8e7SGabor Kovesdan } 882ad30f8e7SGabor Kovesdan 883ad30f8e7SGabor Kovesdan wchar = _ISO2022_sgetwchar(ei, p, psenc->chlen - (p-psenc->ch), 884ad30f8e7SGabor Kovesdan &result, psenc); 885ad30f8e7SGabor Kovesdan c += result - p; 886ad30f8e7SGabor Kovesdan if (wchar != _ISO2022INVALID) { 887ad30f8e7SGabor Kovesdan if (psenc->chlen > (size_t)c) 888ad30f8e7SGabor Kovesdan memmove(psenc->ch, result, psenc->chlen - c); 889ad30f8e7SGabor Kovesdan if (psenc->chlen < (size_t)c) 890ad30f8e7SGabor Kovesdan psenc->chlen = 0; 891ad30f8e7SGabor Kovesdan else 892ad30f8e7SGabor Kovesdan psenc->chlen -= c; 893ad30f8e7SGabor Kovesdan goto output; 894ad30f8e7SGabor Kovesdan } 895ad30f8e7SGabor Kovesdan 896ad30f8e7SGabor Kovesdan if (n == 0) { 897ad30f8e7SGabor Kovesdan if ((size_t)(result - p) == psenc->chlen) 898ad30f8e7SGabor Kovesdan /* complete shift sequence. */ 899ad30f8e7SGabor Kovesdan psenc->chlen = 0; 900ad30f8e7SGabor Kovesdan goto restart; 901ad30f8e7SGabor Kovesdan } 902ad30f8e7SGabor Kovesdan 903ad30f8e7SGabor Kovesdan p = result; 904ad30f8e7SGabor Kovesdan } 905ad30f8e7SGabor Kovesdan 906ad30f8e7SGabor Kovesdan /* escape sequence too long? */ 907ad30f8e7SGabor Kovesdan goto encoding_error; 908ad30f8e7SGabor Kovesdan 909ad30f8e7SGabor Kovesdan emptybuf: 910ad30f8e7SGabor Kovesdan wchar = _ISO2022_sgetwchar(ei, s0, n, &result, psenc); 911ad30f8e7SGabor Kovesdan if (wchar != _ISO2022INVALID) { 912ad30f8e7SGabor Kovesdan c += result - s0; 913ad30f8e7SGabor Kovesdan psenc->chlen = 0; 914ad30f8e7SGabor Kovesdan s0 = result; 915ad30f8e7SGabor Kovesdan goto output; 916ad30f8e7SGabor Kovesdan } 917ad30f8e7SGabor Kovesdan if (result > s0) { 918ad30f8e7SGabor Kovesdan c += (result - s0); 919ad30f8e7SGabor Kovesdan n -= (result - s0); 920ad30f8e7SGabor Kovesdan s0 = result; 921ad30f8e7SGabor Kovesdan if (n > 0) 922ad30f8e7SGabor Kovesdan goto emptybuf; 923ad30f8e7SGabor Kovesdan /* complete shift sequence. */ 924ad30f8e7SGabor Kovesdan goto restart; 925ad30f8e7SGabor Kovesdan } 926ad30f8e7SGabor Kovesdan n += c; 927ad30f8e7SGabor Kovesdan if (n < sizeof(psenc->ch)) { 928ad30f8e7SGabor Kovesdan memcpy(psenc->ch, s0 - c, n); 929ad30f8e7SGabor Kovesdan psenc->chlen = n; 930ad30f8e7SGabor Kovesdan s0 = result; 931ad30f8e7SGabor Kovesdan goto restart; 932ad30f8e7SGabor Kovesdan } 933ad30f8e7SGabor Kovesdan 934ad30f8e7SGabor Kovesdan /* escape sequence too long? */ 935ad30f8e7SGabor Kovesdan 936ad30f8e7SGabor Kovesdan encoding_error: 937ad30f8e7SGabor Kovesdan psenc->chlen = 0; 938ad30f8e7SGabor Kovesdan *nresult = (size_t)-1; 939ad30f8e7SGabor Kovesdan return (EILSEQ); 940ad30f8e7SGabor Kovesdan 941ad30f8e7SGabor Kovesdan output: 942ad30f8e7SGabor Kovesdan *s = s0; 943ad30f8e7SGabor Kovesdan if (pwc) 944ad30f8e7SGabor Kovesdan *pwc = wchar; 945ad30f8e7SGabor Kovesdan *nresult = wchar ? c - chlenbak : 0; 946ad30f8e7SGabor Kovesdan return (0); 947ad30f8e7SGabor Kovesdan 948ad30f8e7SGabor Kovesdan restart: 949ad30f8e7SGabor Kovesdan *s = s0; 950ad30f8e7SGabor Kovesdan *nresult = (size_t)-2; 951ad30f8e7SGabor Kovesdan 952ad30f8e7SGabor Kovesdan return (0); 953ad30f8e7SGabor Kovesdan } 954ad30f8e7SGabor Kovesdan 955ad30f8e7SGabor Kovesdan static int 956ad30f8e7SGabor Kovesdan recommendation(_ISO2022EncodingInfo * __restrict ei, 957ad30f8e7SGabor Kovesdan _ISO2022Charset * __restrict cs) 958ad30f8e7SGabor Kovesdan { 959ad30f8e7SGabor Kovesdan _ISO2022Charset *recommend; 960ad30f8e7SGabor Kovesdan size_t j; 961ad30f8e7SGabor Kovesdan int i; 962ad30f8e7SGabor Kovesdan 963ad30f8e7SGabor Kovesdan /* first, try a exact match. */ 964ad30f8e7SGabor Kovesdan for (i = 0; i < 4; i++) { 965ad30f8e7SGabor Kovesdan recommend = ei->recommend[i]; 966ad30f8e7SGabor Kovesdan for (j = 0; j < ei->recommendsize[i]; j++) { 967ad30f8e7SGabor Kovesdan if (cs->type != recommend[j].type) 968ad30f8e7SGabor Kovesdan continue; 969ad30f8e7SGabor Kovesdan if (cs->final != recommend[j].final) 970ad30f8e7SGabor Kovesdan continue; 971ad30f8e7SGabor Kovesdan if (cs->interm != recommend[j].interm) 972ad30f8e7SGabor Kovesdan continue; 973ad30f8e7SGabor Kovesdan 974ad30f8e7SGabor Kovesdan return (i); 975ad30f8e7SGabor Kovesdan } 976ad30f8e7SGabor Kovesdan } 977ad30f8e7SGabor Kovesdan 978ad30f8e7SGabor Kovesdan /* then, try a wildcard match over final char. */ 979ad30f8e7SGabor Kovesdan for (i = 0; i < 4; i++) { 980ad30f8e7SGabor Kovesdan recommend = ei->recommend[i]; 981ad30f8e7SGabor Kovesdan for (j = 0; j < ei->recommendsize[i]; j++) { 982ad30f8e7SGabor Kovesdan if (cs->type != recommend[j].type) 983ad30f8e7SGabor Kovesdan continue; 984ad30f8e7SGabor Kovesdan if (cs->final && (cs->final != recommend[j].final)) 985ad30f8e7SGabor Kovesdan continue; 986ad30f8e7SGabor Kovesdan if (cs->interm && (cs->interm != recommend[j].interm)) 987ad30f8e7SGabor Kovesdan continue; 988ad30f8e7SGabor Kovesdan 989ad30f8e7SGabor Kovesdan return (i); 990ad30f8e7SGabor Kovesdan } 991ad30f8e7SGabor Kovesdan } 992ad30f8e7SGabor Kovesdan 993ad30f8e7SGabor Kovesdan /* there's no recommendation. make a guess. */ 994ad30f8e7SGabor Kovesdan if (ei->maxcharset == 0) { 995ad30f8e7SGabor Kovesdan return (0); 996ad30f8e7SGabor Kovesdan } else { 997ad30f8e7SGabor Kovesdan switch (cs->type) { 998ad30f8e7SGabor Kovesdan case CS94: 999ad30f8e7SGabor Kovesdan case CS94MULTI: 1000ad30f8e7SGabor Kovesdan return (0); 1001ad30f8e7SGabor Kovesdan case CS96: 1002ad30f8e7SGabor Kovesdan case CS96MULTI: 1003ad30f8e7SGabor Kovesdan return (1); 1004ad30f8e7SGabor Kovesdan } 1005ad30f8e7SGabor Kovesdan } 1006ad30f8e7SGabor Kovesdan return (0); 1007ad30f8e7SGabor Kovesdan } 1008ad30f8e7SGabor Kovesdan 1009ad30f8e7SGabor Kovesdan static int 1010ad30f8e7SGabor Kovesdan _ISO2022_sputwchar(_ISO2022EncodingInfo * __restrict ei, wchar_t wc, 1011ad30f8e7SGabor Kovesdan char * __restrict string, size_t n, char ** __restrict result, 1012ad30f8e7SGabor Kovesdan _ISO2022State * __restrict psenc, size_t * __restrict nresult) 1013ad30f8e7SGabor Kovesdan { 1014ad30f8e7SGabor Kovesdan _ISO2022Charset cs; 1015ad30f8e7SGabor Kovesdan char *p; 1016ad30f8e7SGabor Kovesdan char tmp[MB_LEN_MAX]; 1017ad30f8e7SGabor Kovesdan size_t len; 1018ad30f8e7SGabor Kovesdan int bit8, i = 0, target; 1019ad30f8e7SGabor Kovesdan unsigned char mask; 1020ad30f8e7SGabor Kovesdan 1021ad30f8e7SGabor Kovesdan if (isc0(wc & 0xff)) { 1022ad30f8e7SGabor Kovesdan /* go back to INIT0 or ASCII on control chars */ 1023ad30f8e7SGabor Kovesdan cs = ei->initg[0].final ? ei->initg[0] : ascii; 1024ad30f8e7SGabor Kovesdan } else if (isc1(wc & 0xff)) { 1025ad30f8e7SGabor Kovesdan /* go back to INIT1 or ISO-8859-1 on control chars */ 1026ad30f8e7SGabor Kovesdan cs = ei->initg[1].final ? ei->initg[1] : iso88591; 1027ad30f8e7SGabor Kovesdan } else if (!(wc & ~0xff)) { 1028ad30f8e7SGabor Kovesdan if (wc & 0x80) { 1029ad30f8e7SGabor Kovesdan /* special treatment for ISO-8859-1 */ 1030ad30f8e7SGabor Kovesdan cs = iso88591; 1031ad30f8e7SGabor Kovesdan } else { 1032ad30f8e7SGabor Kovesdan /* special treatment for ASCII */ 1033ad30f8e7SGabor Kovesdan cs = ascii; 1034ad30f8e7SGabor Kovesdan } 1035ad30f8e7SGabor Kovesdan } else { 1036ad30f8e7SGabor Kovesdan cs.final = (wc >> 24) & 0x7f; 1037ad30f8e7SGabor Kovesdan if ((wc >> 16) & 0x80) 1038ad30f8e7SGabor Kovesdan cs.interm = (wc >> 16) & 0x7f; 1039ad30f8e7SGabor Kovesdan else 1040ad30f8e7SGabor Kovesdan cs.interm = '\0'; 1041ad30f8e7SGabor Kovesdan if (wc & 0x80) 1042ad30f8e7SGabor Kovesdan cs.type = (wc & 0x00007f00) ? CS96MULTI : CS96; 1043ad30f8e7SGabor Kovesdan else 1044ad30f8e7SGabor Kovesdan cs.type = (wc & 0x00007f00) ? CS94MULTI : CS94; 1045ad30f8e7SGabor Kovesdan } 1046ad30f8e7SGabor Kovesdan target = recommendation(ei, &cs); 1047ad30f8e7SGabor Kovesdan p = tmp; 1048ad30f8e7SGabor Kovesdan bit8 = ei->flags & F_8BIT; 1049ad30f8e7SGabor Kovesdan 1050ad30f8e7SGabor Kovesdan /* designate the charset onto the target plane(G0/1/2/3). */ 1051ad30f8e7SGabor Kovesdan if (psenc->g[target].type == cs.type && 1052ad30f8e7SGabor Kovesdan psenc->g[target].final == cs.final && 1053ad30f8e7SGabor Kovesdan psenc->g[target].interm == cs.interm) 1054ad30f8e7SGabor Kovesdan goto planeok; 1055ad30f8e7SGabor Kovesdan 1056ad30f8e7SGabor Kovesdan *p++ = '\033'; 1057ad30f8e7SGabor Kovesdan if (cs.type == CS94MULTI || cs.type == CS96MULTI) 1058ad30f8e7SGabor Kovesdan *p++ = '$'; 1059ad30f8e7SGabor Kovesdan if (target == 0 && cs.type == CS94MULTI && strchr("@AB", cs.final) && 1060ad30f8e7SGabor Kovesdan !cs.interm && !(ei->flags & F_NOOLD)) 1061ad30f8e7SGabor Kovesdan ; 1062ad30f8e7SGabor Kovesdan else if (cs.type == CS94 || cs.type == CS94MULTI) 1063ad30f8e7SGabor Kovesdan *p++ = "()*+"[target]; 1064ad30f8e7SGabor Kovesdan else 1065ad30f8e7SGabor Kovesdan *p++ = ",-./"[target]; 1066ad30f8e7SGabor Kovesdan if (cs.interm) 1067ad30f8e7SGabor Kovesdan *p++ = cs.interm; 1068ad30f8e7SGabor Kovesdan *p++ = cs.final; 1069ad30f8e7SGabor Kovesdan 1070ad30f8e7SGabor Kovesdan psenc->g[target].type = cs.type; 1071ad30f8e7SGabor Kovesdan psenc->g[target].final = cs.final; 1072ad30f8e7SGabor Kovesdan psenc->g[target].interm = cs.interm; 1073ad30f8e7SGabor Kovesdan 1074ad30f8e7SGabor Kovesdan planeok: 1075ad30f8e7SGabor Kovesdan /* invoke the plane onto GL or GR. */ 1076ad30f8e7SGabor Kovesdan if (psenc->gl == target) 1077ad30f8e7SGabor Kovesdan goto sideok; 1078ad30f8e7SGabor Kovesdan if (bit8 && psenc->gr == target) 1079ad30f8e7SGabor Kovesdan goto sideok; 1080ad30f8e7SGabor Kovesdan 1081ad30f8e7SGabor Kovesdan if (target == 0 && (ei->flags & F_LS0)) { 1082ad30f8e7SGabor Kovesdan *p++ = '\017'; 1083ad30f8e7SGabor Kovesdan psenc->gl = 0; 1084ad30f8e7SGabor Kovesdan } else if (target == 1 && (ei->flags & F_LS1)) { 1085ad30f8e7SGabor Kovesdan *p++ = '\016'; 1086ad30f8e7SGabor Kovesdan psenc->gl = 1; 1087ad30f8e7SGabor Kovesdan } else if (target == 2 && (ei->flags & F_LS2)) { 1088ad30f8e7SGabor Kovesdan *p++ = '\033'; 1089ad30f8e7SGabor Kovesdan *p++ = 'n'; 1090ad30f8e7SGabor Kovesdan psenc->gl = 2; 1091ad30f8e7SGabor Kovesdan } else if (target == 3 && (ei->flags & F_LS3)) { 1092ad30f8e7SGabor Kovesdan *p++ = '\033'; 1093ad30f8e7SGabor Kovesdan *p++ = 'o'; 1094ad30f8e7SGabor Kovesdan psenc->gl = 3; 1095ad30f8e7SGabor Kovesdan } else if (bit8 && target == 1 && (ei->flags & F_LS1R)) { 1096ad30f8e7SGabor Kovesdan *p++ = '\033'; 1097ad30f8e7SGabor Kovesdan *p++ = '~'; 1098ad30f8e7SGabor Kovesdan psenc->gr = 1; 1099ad30f8e7SGabor Kovesdan } else if (bit8 && target == 2 && (ei->flags & F_LS2R)) { 1100ad30f8e7SGabor Kovesdan *p++ = '\033'; 1101ad30f8e7SGabor Kovesdan /*{*/ 1102ad30f8e7SGabor Kovesdan *p++ = '}'; 1103ad30f8e7SGabor Kovesdan psenc->gr = 2; 1104ad30f8e7SGabor Kovesdan } else if (bit8 && target == 3 && (ei->flags & F_LS3R)) { 1105ad30f8e7SGabor Kovesdan *p++ = '\033'; 1106ad30f8e7SGabor Kovesdan *p++ = '|'; 1107ad30f8e7SGabor Kovesdan psenc->gr = 3; 1108ad30f8e7SGabor Kovesdan } else if (target == 2 && (ei->flags & F_SS2)) { 1109ad30f8e7SGabor Kovesdan *p++ = '\033'; 1110ad30f8e7SGabor Kovesdan *p++ = 'N'; 1111ad30f8e7SGabor Kovesdan psenc->singlegl = 2; 1112ad30f8e7SGabor Kovesdan } else if (target == 3 && (ei->flags & F_SS3)) { 1113ad30f8e7SGabor Kovesdan *p++ = '\033'; 1114ad30f8e7SGabor Kovesdan *p++ = 'O'; 1115ad30f8e7SGabor Kovesdan psenc->singlegl = 3; 1116ad30f8e7SGabor Kovesdan } else if (bit8 && target == 2 && (ei->flags & F_SS2R)) { 1117ad30f8e7SGabor Kovesdan *p++ = '\216'; 1118ad30f8e7SGabor Kovesdan *p++ = 'N'; 1119ad30f8e7SGabor Kovesdan psenc->singlegl = psenc->singlegr = 2; 1120ad30f8e7SGabor Kovesdan } else if (bit8 && target == 3 && (ei->flags & F_SS3R)) { 1121ad30f8e7SGabor Kovesdan *p++ = '\217'; 1122ad30f8e7SGabor Kovesdan *p++ = 'O'; 1123ad30f8e7SGabor Kovesdan psenc->singlegl = psenc->singlegr = 3; 1124ad30f8e7SGabor Kovesdan } else 1125ad30f8e7SGabor Kovesdan goto ilseq; 1126ad30f8e7SGabor Kovesdan 1127ad30f8e7SGabor Kovesdan sideok: 1128ad30f8e7SGabor Kovesdan if (psenc->singlegl == target) 1129ad30f8e7SGabor Kovesdan mask = 0x00; 1130ad30f8e7SGabor Kovesdan else if (psenc->singlegr == target) 1131ad30f8e7SGabor Kovesdan mask = 0x80; 1132ad30f8e7SGabor Kovesdan else if (psenc->gl == target) 1133ad30f8e7SGabor Kovesdan mask = 0x00; 1134ad30f8e7SGabor Kovesdan else if ((ei->flags & F_8BIT) && psenc->gr == target) 1135ad30f8e7SGabor Kovesdan mask = 0x80; 1136ad30f8e7SGabor Kovesdan else 1137ad30f8e7SGabor Kovesdan goto ilseq; 1138ad30f8e7SGabor Kovesdan 1139ad30f8e7SGabor Kovesdan switch (cs.type) { 1140ad30f8e7SGabor Kovesdan case CS94: 1141ad30f8e7SGabor Kovesdan case CS96: 1142ad30f8e7SGabor Kovesdan i = 1; 1143ad30f8e7SGabor Kovesdan break; 1144ad30f8e7SGabor Kovesdan case CS94MULTI: 1145ad30f8e7SGabor Kovesdan case CS96MULTI: 1146ad30f8e7SGabor Kovesdan i = !iscntl(wc & 0xff) ? 1147ad30f8e7SGabor Kovesdan (isthree(cs.final) ? 3 : 2) : 1; 1148ad30f8e7SGabor Kovesdan break; 1149ad30f8e7SGabor Kovesdan } 1150ad30f8e7SGabor Kovesdan while (i-- > 0) 1151ad30f8e7SGabor Kovesdan *p++ = ((wc >> (i << 3)) & 0x7f) | mask; 1152ad30f8e7SGabor Kovesdan 1153ad30f8e7SGabor Kovesdan /* reset single shift state */ 1154ad30f8e7SGabor Kovesdan psenc->singlegl = psenc->singlegr = -1; 1155ad30f8e7SGabor Kovesdan 1156ad30f8e7SGabor Kovesdan len = (size_t)(p - tmp); 1157ad30f8e7SGabor Kovesdan if (n < len) { 1158ad30f8e7SGabor Kovesdan if (result) 1159ad30f8e7SGabor Kovesdan *result = (char *)0; 1160ad30f8e7SGabor Kovesdan *nresult = (size_t)-1; 1161ad30f8e7SGabor Kovesdan return (E2BIG); 1162ad30f8e7SGabor Kovesdan } 1163ad30f8e7SGabor Kovesdan if (result) 1164ad30f8e7SGabor Kovesdan *result = string + len; 1165ad30f8e7SGabor Kovesdan memcpy(string, tmp, len); 1166ad30f8e7SGabor Kovesdan *nresult = len; 1167ad30f8e7SGabor Kovesdan 1168ad30f8e7SGabor Kovesdan return (0); 1169ad30f8e7SGabor Kovesdan 1170ad30f8e7SGabor Kovesdan ilseq: 1171ad30f8e7SGabor Kovesdan *nresult = (size_t)-1; 1172ad30f8e7SGabor Kovesdan return (EILSEQ); 1173ad30f8e7SGabor Kovesdan } 1174ad30f8e7SGabor Kovesdan 1175ad30f8e7SGabor Kovesdan static int 1176ad30f8e7SGabor Kovesdan _citrus_ISO2022_put_state_reset(_ISO2022EncodingInfo * __restrict ei, 1177ad30f8e7SGabor Kovesdan char * __restrict s, size_t n, _ISO2022State * __restrict psenc, 1178ad30f8e7SGabor Kovesdan size_t * __restrict nresult) 1179ad30f8e7SGabor Kovesdan { 1180ad30f8e7SGabor Kovesdan char *result; 1181ad30f8e7SGabor Kovesdan char buf[MB_LEN_MAX]; 1182ad30f8e7SGabor Kovesdan size_t len; 1183ad30f8e7SGabor Kovesdan int ret; 1184ad30f8e7SGabor Kovesdan 1185ad30f8e7SGabor Kovesdan /* XXX state will be modified after this operation... */ 1186ad30f8e7SGabor Kovesdan ret = _ISO2022_sputwchar(ei, L'\0', buf, sizeof(buf), &result, psenc, 1187ad30f8e7SGabor Kovesdan &len); 1188ad30f8e7SGabor Kovesdan if (ret) { 1189ad30f8e7SGabor Kovesdan *nresult = len; 1190ad30f8e7SGabor Kovesdan return (ret); 1191ad30f8e7SGabor Kovesdan } 1192ad30f8e7SGabor Kovesdan 1193ad30f8e7SGabor Kovesdan if (sizeof(buf) < len || n < len-1) { 1194ad30f8e7SGabor Kovesdan /* XXX should recover state? */ 1195ad30f8e7SGabor Kovesdan *nresult = (size_t)-1; 1196ad30f8e7SGabor Kovesdan return (E2BIG); 1197ad30f8e7SGabor Kovesdan } 1198ad30f8e7SGabor Kovesdan 1199ad30f8e7SGabor Kovesdan memcpy(s, buf, len - 1); 1200ad30f8e7SGabor Kovesdan *nresult = len - 1; 1201ad30f8e7SGabor Kovesdan return (0); 1202ad30f8e7SGabor Kovesdan } 1203ad30f8e7SGabor Kovesdan 1204ad30f8e7SGabor Kovesdan static int 1205ad30f8e7SGabor Kovesdan _citrus_ISO2022_wcrtomb_priv(_ISO2022EncodingInfo * __restrict ei, 1206ad30f8e7SGabor Kovesdan char * __restrict s, size_t n, wchar_t wc, 1207ad30f8e7SGabor Kovesdan _ISO2022State * __restrict psenc, size_t * __restrict nresult) 1208ad30f8e7SGabor Kovesdan { 1209ad30f8e7SGabor Kovesdan char *result; 1210ad30f8e7SGabor Kovesdan char buf[MB_LEN_MAX]; 1211ad30f8e7SGabor Kovesdan size_t len; 1212ad30f8e7SGabor Kovesdan int ret; 1213ad30f8e7SGabor Kovesdan 1214ad30f8e7SGabor Kovesdan /* XXX state will be modified after this operation... */ 1215ad30f8e7SGabor Kovesdan ret = _ISO2022_sputwchar(ei, wc, buf, sizeof(buf), &result, psenc, 1216ad30f8e7SGabor Kovesdan &len); 1217ad30f8e7SGabor Kovesdan if (ret) { 1218ad30f8e7SGabor Kovesdan *nresult = len; 1219ad30f8e7SGabor Kovesdan return (ret); 1220ad30f8e7SGabor Kovesdan } 1221ad30f8e7SGabor Kovesdan 1222ad30f8e7SGabor Kovesdan if (sizeof(buf) < len || n < len) { 1223ad30f8e7SGabor Kovesdan /* XXX should recover state? */ 1224ad30f8e7SGabor Kovesdan *nresult = (size_t)-1; 1225ad30f8e7SGabor Kovesdan return (E2BIG); 1226ad30f8e7SGabor Kovesdan } 1227ad30f8e7SGabor Kovesdan 1228ad30f8e7SGabor Kovesdan memcpy(s, buf, len); 1229ad30f8e7SGabor Kovesdan *nresult = len; 1230ad30f8e7SGabor Kovesdan return (0); 1231ad30f8e7SGabor Kovesdan } 1232ad30f8e7SGabor Kovesdan 1233ad30f8e7SGabor Kovesdan static __inline int 1234ad30f8e7SGabor Kovesdan /*ARGSUSED*/ 1235ad30f8e7SGabor Kovesdan _citrus_ISO2022_stdenc_wctocs(_ISO2022EncodingInfo * __restrict ei __unused, 1236ad30f8e7SGabor Kovesdan _csid_t * __restrict csid, _index_t * __restrict idx, wchar_t wc) 1237ad30f8e7SGabor Kovesdan { 1238ad30f8e7SGabor Kovesdan wchar_t m, nm; 1239ad30f8e7SGabor Kovesdan 1240ad30f8e7SGabor Kovesdan m = wc & 0x7FFF8080; 1241ad30f8e7SGabor Kovesdan nm = wc & 0x007F7F7F; 1242ad30f8e7SGabor Kovesdan if (m & 0x00800000) 1243ad30f8e7SGabor Kovesdan nm &= 0x00007F7F; 1244ad30f8e7SGabor Kovesdan else 1245ad30f8e7SGabor Kovesdan m &= 0x7F008080; 1246ad30f8e7SGabor Kovesdan if (nm & 0x007F0000) { 1247ad30f8e7SGabor Kovesdan /* ^3 mark */ 1248ad30f8e7SGabor Kovesdan m |= 0x007F0000; 1249ad30f8e7SGabor Kovesdan } else if (nm & 0x00007F00) { 1250ad30f8e7SGabor Kovesdan /* ^2 mark */ 1251ad30f8e7SGabor Kovesdan m |= 0x00007F00; 1252ad30f8e7SGabor Kovesdan } 1253ad30f8e7SGabor Kovesdan *csid = (_csid_t)m; 1254ad30f8e7SGabor Kovesdan *idx = (_index_t)nm; 1255ad30f8e7SGabor Kovesdan 1256ad30f8e7SGabor Kovesdan return (0); 1257ad30f8e7SGabor Kovesdan } 1258ad30f8e7SGabor Kovesdan 1259ad30f8e7SGabor Kovesdan static __inline int 1260ad30f8e7SGabor Kovesdan /*ARGSUSED*/ 1261ad30f8e7SGabor Kovesdan _citrus_ISO2022_stdenc_cstowc(_ISO2022EncodingInfo * __restrict ei __unused, 1262ad30f8e7SGabor Kovesdan wchar_t * __restrict wc, _csid_t csid, _index_t idx) 1263ad30f8e7SGabor Kovesdan { 1264ad30f8e7SGabor Kovesdan 1265ad30f8e7SGabor Kovesdan *wc = (wchar_t)(csid & 0x7F808080) | (wchar_t)idx; 1266ad30f8e7SGabor Kovesdan 1267ad30f8e7SGabor Kovesdan return (0); 1268ad30f8e7SGabor Kovesdan } 1269ad30f8e7SGabor Kovesdan 1270ad30f8e7SGabor Kovesdan static __inline int 1271ad30f8e7SGabor Kovesdan /*ARGSUSED*/ 1272ad30f8e7SGabor Kovesdan _citrus_ISO2022_stdenc_get_state_desc_generic(_ISO2022EncodingInfo * __restrict ei __unused, 1273ad30f8e7SGabor Kovesdan _ISO2022State * __restrict psenc, int * __restrict rstate) 1274ad30f8e7SGabor Kovesdan { 1275ad30f8e7SGabor Kovesdan 1276ad30f8e7SGabor Kovesdan if (psenc->chlen == 0) { 1277ad30f8e7SGabor Kovesdan /* XXX: it should distinguish initial and stable. */ 1278ad30f8e7SGabor Kovesdan *rstate = _STDENC_SDGEN_STABLE; 1279ad30f8e7SGabor Kovesdan } else 1280ad30f8e7SGabor Kovesdan *rstate = (psenc->ch[0] == '\033') ? 1281ad30f8e7SGabor Kovesdan _STDENC_SDGEN_INCOMPLETE_SHIFT : 1282ad30f8e7SGabor Kovesdan _STDENC_SDGEN_INCOMPLETE_CHAR; 1283ad30f8e7SGabor Kovesdan return (0); 1284ad30f8e7SGabor Kovesdan } 1285ad30f8e7SGabor Kovesdan 1286ad30f8e7SGabor Kovesdan /* ---------------------------------------------------------------------- 1287ad30f8e7SGabor Kovesdan * public interface for stdenc 1288ad30f8e7SGabor Kovesdan */ 1289ad30f8e7SGabor Kovesdan 1290ad30f8e7SGabor Kovesdan _CITRUS_STDENC_DECLS(ISO2022); 1291ad30f8e7SGabor Kovesdan _CITRUS_STDENC_DEF_OPS(ISO2022); 1292ad30f8e7SGabor Kovesdan 1293ad30f8e7SGabor Kovesdan #include "citrus_stdenc_template.h" 1294