xref: /freebsd/contrib/netbsd-tests/lib/libc/locale/t_mbrtowc.c (revision b9f654b163bce26de79705e77b872427c9f2afa1)
1 /* $NetBSD: t_mbrtowc.c,v 1.1 2011/07/15 07:35:21 jruoho Exp $ */
2 
3 /*-
4  * Copyright (c) 2011 The NetBSD Foundation, Inc.
5  * All rights reserved.
6  *
7  * This code is derived from software contributed to The NetBSD Foundation
8  * by YAMAMOTO Takashi
9  *
10  * Redistribution and use in source and binary forms, with or without
11  * modification, are permitted provided that the following conditions
12  * are met:
13  * 1. Redistributions of source code must retain the above copyright
14  *    notice, this list of conditions and the following disclaimer.
15  * 2. Redistributions in binary form must reproduce the above copyright
16  *    notice, this list of conditions and the following disclaimer in the
17  *    documentation and/or other materials provided with the distribution.
18  *
19  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29  * POSSIBILITY OF SUCH DAMAGE.
30  */
31 
32 /*-
33  * Copyright (c)2003 Citrus Project,
34  * All rights reserved.
35  *
36  * Redistribution and use in source and binary forms, with or without
37  * modification, are permitted provided that the following conditions
38  * are met:
39  * 1. Redistributions of source code must retain the above copyright
40  *    notice, this list of conditions and the following disclaimer.
41  * 2. Redistributions in binary form must reproduce the above copyright
42  *    notice, this list of conditions and the following disclaimer in the
43  *    documentation and/or other materials provided with the distribution.
44  *
45  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
46  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
47  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
48  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
49  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
50  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
51  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
52  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
53  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
54  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
55  * SUCH DAMAGE.
56  */
57 
58 #include <sys/cdefs.h>
59 __COPYRIGHT("@(#) Copyright (c) 2011\
60  The NetBSD Foundation, inc. All rights reserved.");
61 __RCSID("$NetBSD: t_mbrtowc.c,v 1.1 2011/07/15 07:35:21 jruoho Exp $");
62 
63 #include <errno.h>
64 #include <locale.h>
65 #include <stdio.h>
66 #include <stdlib.h>
67 #include <string.h>
68 #include <vis.h>
69 #include <wchar.h>
70 
71 #include <atf-c.h>
72 
73 #define SIZE 256
74 
75 static struct test {
76 	const char *locale;
77 	const char *data;
78 	const wchar_t wchars[64];
79 	const wchar_t widths[64];
80 	size_t length;
81 } tests[] = {
82 {
83 	"C",
84 	"ABCD01234_\\",
85 	{ 0x41, 0x42, 0x43, 0x44, 0x30, 0x31, 0x32, 0x33, 0x34, 0x5F, 0x5C },
86 	{ 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1 },
87 	11
88 }, {
89 	"en_US.UTF-8",
90 	"[\001\177][\302\200\337\277][\340\240\200\357\277\277][\360\220\200"
91 	"\200\364\217\277\277]",
92 	{ 0x5b, 0x01, 0x7f, 0x5d, 0x5b, 0x80, 0x7ff, 0x5d, 0x5b, 0x800, 0xffff,
93 	  0x5d, 0x5b, 0x10000, 0x10ffff, 0x5d },
94 	{ 1, 1, 1, 1, 1, 2, 2, 1, 1, 3, 3, 1, 1, 4, 4, 1 },
95 	16
96 }, {
97 	"ja_JP.ISO2022-JP2",
98 	"\033$BF|K\1348l\033(BA\033$B$\"\033(BB\033$B$$\033(B",
99 	{ 0x4200467c, 0x42004b5c, 0x4200386c, 0x41, 0x42002422, 0x42, 0x42002424 },
100 	{ 5, 2, 2, 4, 5, 4, 5 },
101 	7
102 }, {
103 	"ja_JP.SJIS",
104 	"\223\372\226{\214\352A\202\240B\202\242",
105 	{ 0x93fa, 0x967b, 0x8cea, 0x41, 0x82a0, 0x42, 0x82a2 },
106 	{ 2, 2, 2, 1, 2, 1, 2 },
107 	7
108 }, {
109 	"ja_JP.eucJP",
110 	"\306\374\313\334\270\354A\244\242B\244\244",
111 	{ 0xc6fc, 0xcbdc, 0xb8ec, 0x41, 0xa4a2, 0x42, 0xa4a4 },
112 	{ 2, 2, 2, 1, 2, 1, 2 },
113 	7
114 }, {
115 	NULL,
116 	NULL,
117 	{ },
118 	{ },
119 	0
120 }
121 };
122 
123 static void
124 h_ctype2(const struct test *t, bool use_mbstate)
125 {
126 	mbstate_t *stp;
127 	mbstate_t st;
128 	char buf[SIZE];
129 	char *str;
130 	size_t n;
131 
132 	ATF_REQUIRE_STREQ(setlocale(LC_ALL, "C"), "C");
133 #ifdef __NetBSD__
134 	ATF_REQUIRE(setlocale(LC_CTYPE, t->locale) != NULL);
135 #else
136 	if (setlocale(LC_CTYPE, t->locale) == NULL) {
137 		fprintf(stderr, "Locale %s not found.\n", t->locale);
138 		return;
139 	}
140 #endif
141 
142 	(void)strvis(buf, t->data, VIS_WHITE | VIS_OCTAL);
143 	(void)printf("Checking string: \"%s\"\n", buf);
144 
145 	ATF_REQUIRE((str = setlocale(LC_ALL, NULL)) != NULL);
146 	(void)printf("Using locale: %s\n", str);
147 
148 	(void)printf("Using mbstate: %s\n", use_mbstate ? "yes" : "no");
149 
150 	(void)memset(&st, 0, sizeof(st));
151 //	mbrtowc(0, 0, 0, &st); /* XXX for ISO2022-JP */
152 	stp = use_mbstate ? &st : 0;
153 
154 	for (n = 9; n > 0; n--) {
155 		const char *src = t->data;
156 		wchar_t dst;
157 		size_t nchar = 0;
158 		int width = 0;
159 
160 		ATF_REQUIRE(mbsinit(stp) != 0);
161 
162 		for (;;) {
163 			size_t rv = mbrtowc(&dst, src, n, stp);
164 
165 			if (rv == 0)
166 				break;
167 
168 			if (rv == (size_t)-2) {
169 				src += n;
170 				width += n;
171 
172 				continue;
173 			}
174 			if (rv == (size_t)-1) {
175 				ATF_REQUIRE_EQ(errno, EILSEQ);
176 				atf_tc_fail("Invalid sequence");
177 				/* NOTREACHED */
178 			}
179 
180 			width += rv;
181 			src += rv;
182 
183 			if (dst != t->wchars[nchar] ||
184 			    width != t->widths[nchar]) {
185 				(void)printf("At position %zd:\n", nchar);
186 				(void)printf("  expected: 0x%04X (%u)\n",
187 					t->wchars[nchar], t->widths[nchar]);
188 				(void)printf("  got     : 0x%04X (%u)\n",
189 					dst, width);
190 				atf_tc_fail("Test failed");
191 			}
192 
193 			nchar++;
194 			width = 0;
195 		}
196 
197 		ATF_REQUIRE_EQ_MSG(dst, 0, "Incorrect terminating character: "
198 			"0x%04X (expected: 0x00)", dst);
199 
200 		ATF_REQUIRE_EQ_MSG(nchar, t->length, "Incorrect length: "
201 			"%zd (expected: %zd)", nchar, t->length);
202 	}
203 
204 	{
205 		wchar_t wbuf[SIZE];
206 		size_t rv;
207 		char const *src = t->data;
208 		int i;
209 
210 		(void)memset(wbuf, 0xFF, sizeof(wbuf));
211 
212 		rv = mbsrtowcs(wbuf, &src, SIZE, stp);
213 
214 		ATF_REQUIRE_EQ_MSG(rv, t->length, "Incorrect length: %zd "
215 			"(expected: %zd)", rv, t->length);
216 		ATF_REQUIRE_EQ(src, NULL);
217 
218 		for (i = 0; wbuf[i] != 0; ++i) {
219 			if (wbuf[i] == t->wchars[i])
220 				continue;
221 
222 			(void)printf("At position %d:\n", i);
223 			(void)printf("  expected: 0x%04X\n", t->wchars[i]);
224 			(void)printf("  got     : 0x%04X\n", wbuf[i]);
225 			atf_tc_fail("Test failed");
226 		}
227 
228 		ATF_REQUIRE_EQ_MSG((size_t)i, t->length, "Incorrect length: "
229 			"%d (expected: %zd)", i, t->length);
230 	}
231 
232 	(void)printf("Ok.\n");
233 }
234 
235 ATF_TC(mbrtowc_internal);
236 ATF_TC_HEAD(mbrtowc_internal, tc)
237 {
238 	atf_tc_set_md_var(tc, "descr",
239 		"Checks mbrtowc(3) and mbsrtowcs(3) (using internal "
240 		"state) with different locales");
241 }
242 ATF_TC_BODY(mbrtowc_internal, tc)
243 {
244 	struct test *t;
245 
246 	for (t = &tests[0]; t->data != NULL; ++t)
247 		h_ctype2(t, false);
248 }
249 
250 ATF_TC(mbrtowc_object);
251 ATF_TC_HEAD(mbrtowc_object, tc)
252 {
253 	atf_tc_set_md_var(tc, "descr",
254 		"Checks mbrtowc(3) and mbsrtowcs(3) (using state "
255 		"object) with different locales");
256 }
257 ATF_TC_BODY(mbrtowc_object, tc)
258 {
259 	struct test *t;
260 
261 	for (t = &tests[0]; t->data != NULL; ++t)
262 		h_ctype2(t, true);
263 }
264 
265 ATF_TP_ADD_TCS(tp)
266 {
267 
268 	ATF_TP_ADD_TC(tp, mbrtowc_internal);
269 	ATF_TP_ADD_TC(tp, mbrtowc_object);
270 
271 	return atf_no_error();
272 }
273