1 /* 2 * Copyright (c) 2002-2004 Tim J. Robbins. All rights reserved. 3 * Copyright (c) 1993 4 * The Regents of the University of California. All rights reserved. 5 * 6 * This code is derived from software contributed to Berkeley by 7 * Paul Borman at Krystal Technologies. 8 * 9 * Redistribution and use in source and binary forms, with or without 10 * modification, are permitted provided that the following conditions 11 * are met: 12 * 1. Redistributions of source code must retain the above copyright 13 * notice, this list of conditions and the following disclaimer. 14 * 2. Redistributions in binary form must reproduce the above copyright 15 * notice, this list of conditions and the following disclaimer in the 16 * documentation and/or other materials provided with the distribution. 17 * 4. Neither the name of the University nor the names of its contributors 18 * may be used to endorse or promote products derived from this software 19 * without specific prior written permission. 20 * 21 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 22 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 23 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 24 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 25 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 26 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 27 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 28 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 29 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 30 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 31 * SUCH DAMAGE. 32 */ 33 34 /* 35 * Copyright 2010 Nexenta Systems, Inc. All rights reserved. 36 * Use is subject to license terms. 37 */ 38 39 #include "lint.h" 40 #include <sys/types.h> 41 #include <errno.h> 42 #include "runetype.h" 43 #include <stdlib.h> 44 #include <string.h> 45 #include <wchar.h> 46 #include "mblocal.h" 47 48 static size_t _GBK_mbrtowc(wchar_t *_RESTRICT_KYWD, 49 const char *_RESTRICT_KYWD, 50 size_t, mbstate_t *_RESTRICT_KYWD); 51 static int _GBK_mbsinit(const mbstate_t *); 52 static size_t _GBK_wcrtomb(char *_RESTRICT_KYWD, wchar_t, 53 mbstate_t *_RESTRICT_KYWD); 54 55 typedef struct { 56 wchar_t ch; 57 } _GBKState; 58 59 int 60 _GBK_init(_RuneLocale *rl) 61 { 62 63 __mbrtowc = _GBK_mbrtowc; 64 __wcrtomb = _GBK_wcrtomb; 65 __mbsinit = _GBK_mbsinit; 66 _CurrentRuneLocale = rl; 67 __ctype[520] = 2; 68 charset_is_ascii = 0; 69 return (0); 70 } 71 72 static int 73 _GBK_mbsinit(const mbstate_t *ps) 74 { 75 76 return (ps == NULL || ((const _GBKState *)ps)->ch == 0); 77 } 78 79 static int 80 _gbk_check(uint_t c) 81 { 82 83 c &= 0xff; 84 return ((c >= 0x81 && c <= 0xfe) ? 2 : 1); 85 } 86 87 static size_t 88 _GBK_mbrtowc(wchar_t *_RESTRICT_KYWD pwc, const char *_RESTRICT_KYWD s, 89 size_t n, mbstate_t *_RESTRICT_KYWD ps) 90 { 91 _GBKState *gs; 92 wchar_t wc; 93 size_t len; 94 95 gs = (_GBKState *)ps; 96 97 if ((gs->ch & ~0xFF) != 0) { 98 /* Bad conversion state. */ 99 errno = EINVAL; 100 return ((size_t)-1); 101 } 102 103 if (s == NULL) { 104 s = ""; 105 n = 1; 106 pwc = NULL; 107 } 108 109 if (n == 0) 110 /* Incomplete multibyte sequence */ 111 return ((size_t)-2); 112 113 if (gs->ch != 0) { 114 if (*s == '\0') { 115 errno = EILSEQ; 116 return ((size_t)-1); 117 } 118 wc = (gs->ch << 8) | (*s & 0xFF); 119 if (pwc != NULL) 120 *pwc = wc; 121 gs->ch = 0; 122 return (1); 123 } 124 125 len = (size_t)_gbk_check(*s); 126 wc = *s++ & 0xff; 127 if (len == 2) { 128 if (n < 2) { 129 /* Incomplete multibyte sequence */ 130 gs->ch = wc; 131 return ((size_t)-2); 132 } 133 if (*s == '\0') { 134 errno = EILSEQ; 135 return ((size_t)-1); 136 } 137 wc = (wc << 8) | (*s++ & 0xff); 138 if (pwc != NULL) 139 *pwc = wc; 140 return (2); 141 } else { 142 if (pwc != NULL) 143 *pwc = wc; 144 return (wc == L'\0' ? 0 : 1); 145 } 146 } 147 148 static size_t 149 _GBK_wcrtomb(char *_RESTRICT_KYWD s, wchar_t wc, mbstate_t *_RESTRICT_KYWD ps) 150 { 151 _GBKState *gs; 152 153 gs = (_GBKState *)ps; 154 155 if (gs->ch != 0) { 156 errno = EINVAL; 157 return ((size_t)-1); 158 } 159 160 if (s == NULL) 161 /* Reset to initial shift state (no-op) */ 162 return (1); 163 if (wc & 0x8000) { 164 *s++ = (wc >> 8) & 0xff; 165 *s = wc & 0xff; 166 return (2); 167 } 168 *s = wc & 0xff; 169 return (1); 170 } 171