xref: /freebsd/lib/libc/locale/setrunelocale.c (revision e8d8bef961a50d4dc22501cde4fb9fb0be1b2532)
1 /*-
2  * SPDX-License-Identifier: BSD-3-Clause
3  *
4  * Copyright (c) 1993
5  *	The Regents of the University of California.  All rights reserved.
6  *
7  * This code is derived from software contributed to Berkeley by
8  * Paul Borman at Krystal Technologies.
9  *
10  * Copyright (c) 2011 The FreeBSD Foundation
11  * All rights reserved.
12  * Portions of this software were developed by David Chisnall
13  * under sponsorship from the FreeBSD Foundation.
14  *
15  * Redistribution and use in source and binary forms, with or without
16  * modification, are permitted provided that the following conditions
17  * are met:
18  * 1. Redistributions of source code must retain the above copyright
19  *    notice, this list of conditions and the following disclaimer.
20  * 2. Redistributions in binary form must reproduce the above copyright
21  *    notice, this list of conditions and the following disclaimer in the
22  *    documentation and/or other materials provided with the distribution.
23  * 3. Neither the name of the University nor the names of its contributors
24  *    may be used to endorse or promote products derived from this software
25  *    without specific prior written permission.
26  *
27  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
28  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
29  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
30  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
31  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
32  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
33  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
34  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
35  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
36  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
37  * SUCH DAMAGE.
38  */
39 
40 #include <sys/cdefs.h>
41 __FBSDID("$FreeBSD$");
42 
43 #define	__RUNETYPE_INTERNAL 1
44 
45 #include <runetype.h>
46 #include <errno.h>
47 #include <limits.h>
48 #include <string.h>
49 #include <stdio.h>
50 #include <stdlib.h>
51 #include <unistd.h>
52 #include <wchar.h>
53 #include "ldpart.h"
54 #include "mblocal.h"
55 #include "setlocale.h"
56 
57 #undef _CurrentRuneLocale
58 extern _RuneLocale const *_CurrentRuneLocale;
59 /*
60  * A cached version of the runes for this thread.  Used by ctype.h
61  */
62 _Thread_local const _RuneLocale *_ThreadRuneLocale;
63 
64 extern int __mb_sb_limit;
65 
66 extern _RuneLocale	*_Read_RuneMagi(const char *);
67 
68 static int		__setrunelocale(struct xlocale_ctype *l, const char *);
69 
70 static void
71 destruct_ctype(void *v)
72 {
73 	struct xlocale_ctype *l = v;
74 
75 	if (&_DefaultRuneLocale != l->runes)
76 		free(l->runes);
77 	free(l);
78 }
79 
80 const _RuneLocale *
81 __getCurrentRuneLocale(void)
82 {
83 
84 	return (XLOCALE_CTYPE(__get_locale())->runes);
85 }
86 
87 static void
88 free_runes(_RuneLocale *rl)
89 {
90 	if ((rl != &_DefaultRuneLocale) && (rl)) {
91 		free(rl);
92 	}
93 }
94 
95 static int
96 __setrunelocale(struct xlocale_ctype *l, const char *encoding)
97 {
98 	_RuneLocale *rl;
99 	int ret;
100 	char *path;
101 	struct xlocale_ctype saved = *l;
102 
103 	/*
104 	 * The "C" and "POSIX" locale are always here.
105 	 */
106 	if (strcmp(encoding, "C") == 0 || strcmp(encoding, "POSIX") == 0) {
107 		free_runes(saved.runes);
108 		(void) _none_init(l, (_RuneLocale*)&_DefaultRuneLocale);
109 		return (0);
110 	}
111 
112 	/* Range checking not needed, encoding length already checked before */
113 	if (asprintf(&path, "%s/%s/LC_CTYPE", _PathLocale, encoding) == -1)
114 		return (errno);
115 
116 	if ((rl = _Read_RuneMagi(path)) == NULL) {
117 		free(path);
118 		errno = EINVAL;
119 		return (errno);
120 	}
121 	free(path);
122 
123 	l->__mbrtowc = NULL;
124 	l->__mbsinit = NULL;
125 	l->__mbsnrtowcs = NULL;
126 	l->__wcrtomb = NULL;
127 	l->__wcsnrtombs = NULL;
128 
129 	rl->__sputrune = NULL;
130 	rl->__sgetrune = NULL;
131 	if (strcmp(rl->__encoding, "NONE:US-ASCII") == 0)
132 		ret = _ascii_init(l, rl);
133 	else if (strncmp(rl->__encoding, "NONE", 4) == 0)
134 		ret = _none_init(l, rl);
135 	else if (strcmp(rl->__encoding, "UTF-8") == 0)
136 		ret = _UTF8_init(l, rl);
137 	else if (strcmp(rl->__encoding, "EUC-CN") == 0)
138 		ret = _EUC_CN_init(l, rl);
139 	else if (strcmp(rl->__encoding, "EUC-JP") == 0)
140 		ret = _EUC_JP_init(l, rl);
141 	else if (strcmp(rl->__encoding, "EUC-KR") == 0)
142 		ret = _EUC_KR_init(l, rl);
143 	else if (strcmp(rl->__encoding, "EUC-TW") == 0)
144 		ret = _EUC_TW_init(l, rl);
145 	else if (strcmp(rl->__encoding, "GB18030") == 0)
146 		ret = _GB18030_init(l, rl);
147 	else if (strcmp(rl->__encoding, "GB2312") == 0)
148 		ret = _GB2312_init(l, rl);
149 	else if (strcmp(rl->__encoding, "GBK") == 0)
150 		ret = _GBK_init(l, rl);
151 	else if (strcmp(rl->__encoding, "BIG5") == 0)
152 		ret = _BIG5_init(l, rl);
153 	else if (strcmp(rl->__encoding, "MSKanji") == 0)
154 		ret = _MSKanji_init(l, rl);
155 	else
156 		ret = EFTYPE;
157 
158 	if (ret == 0) {
159 		/* Free the old runes if it exists. */
160 		free_runes(saved.runes);
161 		/* Reset the mbstates */
162 		memset(&l->c16rtomb, 0, sizeof(l->c16rtomb));
163 		memset(&l->c32rtomb, 0, sizeof(l->c32rtomb));
164 		memset(&l->mblen, 0, sizeof(l->mblen));
165 		memset(&l->mbrlen, 0, sizeof(l->mbrlen));
166 		memset(&l->mbrtoc16, 0, sizeof(l->mbrtoc16));
167 		memset(&l->mbrtoc32, 0, sizeof(l->mbrtoc32));
168 		memset(&l->mbrtowc, 0, sizeof(l->mbrtowc));
169 		memset(&l->mbsnrtowcs, 0, sizeof(l->mbsnrtowcs));
170 		memset(&l->mbsrtowcs, 0, sizeof(l->mbsrtowcs));
171 		memset(&l->mbtowc, 0, sizeof(l->mbtowc));
172 		memset(&l->wcrtomb, 0, sizeof(l->wcrtomb));
173 		memset(&l->wcsnrtombs, 0, sizeof(l->wcsnrtombs));
174 		memset(&l->wcsrtombs, 0, sizeof(l->wcsrtombs));
175 		memset(&l->wctomb, 0, sizeof(l->wctomb));
176 	} else {
177 		/* Restore the saved version if this failed. */
178 		memcpy(l, &saved, sizeof(struct xlocale_ctype));
179 		free(rl);
180 	}
181 
182 	return (ret);
183 }
184 
185 int
186 __wrap_setrunelocale(const char *locale)
187 {
188 	int ret = __setrunelocale(&__xlocale_global_ctype, locale);
189 
190 	if (ret != 0) {
191 		errno = ret;
192 		return (_LDP_ERROR);
193 	}
194 	__mb_cur_max = __xlocale_global_ctype.__mb_cur_max;
195 	__mb_sb_limit = __xlocale_global_ctype.__mb_sb_limit;
196 	_CurrentRuneLocale = __xlocale_global_ctype.runes;
197 	return (_LDP_LOADED);
198 }
199 
200 void
201 __set_thread_rune_locale(locale_t loc)
202 {
203 
204 	if (loc == NULL) {
205 		_ThreadRuneLocale = &_DefaultRuneLocale;
206 	} else if (loc == LC_GLOBAL_LOCALE) {
207 		_ThreadRuneLocale = 0;
208 	} else {
209 		_ThreadRuneLocale = XLOCALE_CTYPE(loc)->runes;
210 	}
211 }
212 
213 void *
214 __ctype_load(const char *locale, locale_t unused __unused)
215 {
216 	struct xlocale_ctype *l = calloc(sizeof(struct xlocale_ctype), 1);
217 
218 	l->header.header.destructor = destruct_ctype;
219 	if (__setrunelocale(l, locale)) {
220 		free(l);
221 		return (NULL);
222 	}
223 	return (l);
224 }
225