1 /* $Header: /p/tcsh/cvsroot/tcsh/tc.nls.c,v 3.23 2010/02/12 22:17:20 christos Exp $ */ 2 /* 3 * tc.nls.c: NLS handling 4 */ 5 /*- 6 * Copyright (c) 1980, 1991 The Regents of the University of California. 7 * All rights reserved. 8 * 9 * Redistribution and use in source and binary forms, with or without 10 * modification, are permitted provided that the following conditions 11 * are met: 12 * 1. Redistributions of source code must retain the above copyright 13 * notice, this list of conditions and the following disclaimer. 14 * 2. Redistributions in binary form must reproduce the above copyright 15 * notice, this list of conditions and the following disclaimer in the 16 * documentation and/or other materials provided with the distribution. 17 * 3. Neither the name of the University nor the names of its contributors 18 * may be used to endorse or promote products derived from this software 19 * without specific prior written permission. 20 * 21 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 22 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 23 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 24 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 25 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 26 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 27 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 28 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 29 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 30 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 31 * SUCH DAMAGE. 32 */ 33 #include "sh.h" 34 35 RCSID("$tcsh: tc.nls.c,v 3.23 2010/02/12 22:17:20 christos Exp $") 36 37 38 #ifdef WIDE_STRINGS 39 # ifdef HAVE_WCWIDTH 40 # ifdef UTF16_STRINGS 41 int 42 xwcwidth (wint_t wchar) 43 { 44 wchar_t ws[2]; 45 46 if (wchar <= 0xffff) 47 return wcwidth ((wchar_t) wchar); 48 /* UTF-16 systems can't handle these values directly in calls to wcwidth. 49 However, they can handle them as surrogate pairs in calls to wcswidth. 50 What we do here is to convert UTF-32 values >= 0x10000 into surrogate 51 pairs and compute the width by calling wcswidth. */ 52 wchar -= 0x10000; 53 ws[0] = 0xd800 | (wchar >> 10); 54 ws[1] = 0xdc00 | (wchar & 0x3ff); 55 return wcswidth (ws, 2); 56 } 57 # else 58 #define xwcwidth wcwidth 59 # endif /* !UTF16_STRINGS */ 60 # endif /* HAVE_WCWIDTH */ 61 62 int 63 NLSWidth(Char c) 64 { 65 # ifdef HAVE_WCWIDTH 66 int l; 67 if (c & INVALID_BYTE) 68 return 1; 69 l = xwcwidth((wchar_t) c); 70 return l >= 0 ? l : 0; 71 # else 72 return iswprint(c) != 0; 73 # endif 74 } 75 76 int 77 NLSStringWidth(const Char *s) 78 { 79 int w = 0, l; 80 Char c; 81 82 while (*s) { 83 c = *s++; 84 #ifdef HAVE_WCWIDTH 85 if ((l = xwcwidth((wchar_t) c)) < 0) 86 l = 2; 87 #else 88 l = iswprint(c) != 0; 89 #endif 90 w += l; 91 } 92 return w; 93 } 94 #endif 95 96 Char * 97 NLSChangeCase(const Char *p, int mode) 98 { 99 Char c, *n, c2 = 0; 100 const Char *op = p; 101 102 for (; (c = *p) != 0; p++) { 103 if (mode == 0 && Islower(c)) { 104 c2 = Toupper(c); 105 break; 106 } else if (mode && Isupper(c)) { 107 c2 = Tolower(c); 108 break; 109 } 110 } 111 if (!*p) 112 return 0; 113 n = Strsave(op); 114 n[p - op] = c2; 115 return n; 116 } 117 118 int 119 NLSClassify(Char c, int nocomb) 120 { 121 int w; 122 if (c & INVALID_BYTE) 123 return NLSCLASS_ILLEGAL; 124 w = NLSWidth(c); 125 if ((w > 0 && !(Iscntrl(c) && (c & CHAR) < 0x100)) || (Isprint(c) && !nocomb)) 126 return w; 127 if (Iscntrl(c) && (c & CHAR) < 0x100) { 128 if (c == '\n') 129 return NLSCLASS_NL; 130 if (c == '\t') 131 return NLSCLASS_TAB; 132 return NLSCLASS_CTRL; 133 } 134 #ifdef WIDE_STRINGS 135 if (c >= 0x1000000) 136 return NLSCLASS_ILLEGAL4; 137 if (c >= 0x10000) 138 return NLSCLASS_ILLEGAL3; 139 #endif 140 if (c >= 0x100) 141 return NLSCLASS_ILLEGAL2; 142 return NLSCLASS_ILLEGAL; 143 } 144