xref: /freebsd/contrib/netbsd-tests/lib/libc/locale/t_mbrtowc.c (revision ca2e4ecd7395ba655ab4bebe7262a06e634216ce)
1 /* $NetBSD: t_mbrtowc.c,v 1.1 2011/07/15 07:35:21 jruoho Exp $ */
2 
3 /*-
4  * Copyright (c) 2011 The NetBSD Foundation, Inc.
5  * All rights reserved.
6  *
7  * This code is derived from software contributed to The NetBSD Foundation
8  * by YAMAMOTO Takashi
9  *
10  * Redistribution and use in source and binary forms, with or without
11  * modification, are permitted provided that the following conditions
12  * are met:
13  * 1. Redistributions of source code must retain the above copyright
14  *    notice, this list of conditions and the following disclaimer.
15  * 2. Redistributions in binary form must reproduce the above copyright
16  *    notice, this list of conditions and the following disclaimer in the
17  *    documentation and/or other materials provided with the distribution.
18  *
19  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29  * POSSIBILITY OF SUCH DAMAGE.
30  */
31 
32 /*-
33  * Copyright (c)2003 Citrus Project,
34  * All rights reserved.
35  *
36  * Redistribution and use in source and binary forms, with or without
37  * modification, are permitted provided that the following conditions
38  * are met:
39  * 1. Redistributions of source code must retain the above copyright
40  *    notice, this list of conditions and the following disclaimer.
41  * 2. Redistributions in binary form must reproduce the above copyright
42  *    notice, this list of conditions and the following disclaimer in the
43  *    documentation and/or other materials provided with the distribution.
44  *
45  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
46  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
47  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
48  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
49  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
50  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
51  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
52  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
53  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
54  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
55  * SUCH DAMAGE.
56  */
57 
58 #include <sys/cdefs.h>
59 __COPYRIGHT("@(#) Copyright (c) 2011\
60  The NetBSD Foundation, inc. All rights reserved.");
61 __RCSID("$NetBSD: t_mbrtowc.c,v 1.1 2011/07/15 07:35:21 jruoho Exp $");
62 
63 #include <errno.h>
64 #include <locale.h>
65 #include <stdio.h>
66 #include <stdlib.h>
67 #include <string.h>
68 #include <vis.h>
69 #include <wchar.h>
70 
71 #include <atf-c.h>
72 
73 #define SIZE 256
74 
75 static struct test {
76 	const char *locale;
77 	const char *data;
78 	const wchar_t wchars[64];
79 	const wchar_t widths[64];
80 	size_t length;
81 } tests[] = {
82 {
83 	"C",
84 	"ABCD01234_\\",
85 	{ 0x41, 0x42, 0x43, 0x44, 0x30, 0x31, 0x32, 0x33, 0x34, 0x5F, 0x5C },
86 	{ 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1 },
87 	11
88 }, {
89 	"en_US.UTF-8",
90 	"[\001\177][\302\200\337\277][\340\240\200\357\277\277][\360\220\200"
91 	"\200\367\277\277\277][\370\210\200\200\200\373\277\277\277\277][\374"
92 	"\204\200\200\200\200\375\277\277\277\277\277]",
93 	{ 0x5b, 0x01, 0x7f, 0x5d, 0x5b, 0x80, 0x7ff, 0x5d, 0x5b, 0x800, 0xffff,
94 	  0x5d, 0x5b, 0x10000, 0x1fffff, 0x5d, 0x5b, 0x200000, 0x3ffffff, 0x5d,
95 	  0x5b, 0x4000000, 0x7fffffff, 0x5d },
96 	{ 1, 1, 1, 1, 1, 2, 2, 1, 1, 3, 3, 1, 1, 4, 4, 1, 1, 5, 5, 1, 1, 6, 6, 1 },
97 	24
98 }, {
99 	"ja_JP.ISO2022-JP2",
100 	"\033$BF|K\1348l\033(BA\033$B$\"\033(BB\033$B$$\033(B",
101 	{ 0x4200467c, 0x42004b5c, 0x4200386c, 0x41, 0x42002422, 0x42, 0x42002424 },
102 	{ 5, 2, 2, 4, 5, 4, 5 },
103 	7
104 }, {
105 	"ja_JP.SJIS",
106 	"\223\372\226{\214\352A\202\240B\202\242",
107 	{ 0x93fa, 0x967b, 0x8cea, 0x41, 0x82a0, 0x42, 0x82a2 },
108 	{ 2, 2, 2, 1, 2, 1, 2 },
109 	7
110 }, {
111 	"ja_JP.eucJP",
112 	"\306\374\313\334\270\354A\244\242B\244\244",
113 	{ 0xc6fc, 0xcbdc, 0xb8ec, 0x41, 0xa4a2, 0x42, 0xa4a4 },
114 	{ 2, 2, 2, 1, 2, 1, 2 },
115 	7
116 }, {
117 	NULL,
118 	NULL,
119 	{ },
120 	{ },
121 	0
122 }
123 };
124 
125 static void
126 h_ctype2(const struct test *t, bool use_mbstate)
127 {
128 	mbstate_t *stp;
129 	mbstate_t st;
130 	char buf[SIZE];
131 	char *str;
132 	size_t n;
133 
134 	ATF_REQUIRE_STREQ(setlocale(LC_ALL, "C"), "C");
135 #ifdef __NetBSD__
136 	ATF_REQUIRE(setlocale(LC_CTYPE, t->locale) != NULL);
137 #else
138 	if (setlocale(LC_CTYPE, t->locale) == NULL) {
139 		fprintf(stderr, "Locale %s not found.\n", t->locale);
140 		return;
141 	}
142 #endif
143 
144 	(void)strvis(buf, t->data, VIS_WHITE | VIS_OCTAL);
145 	(void)printf("Checking string: \"%s\"\n", buf);
146 
147 	ATF_REQUIRE((str = setlocale(LC_ALL, NULL)) != NULL);
148 	(void)printf("Using locale: %s\n", str);
149 
150 	(void)printf("Using mbstate: %s\n", use_mbstate ? "yes" : "no");
151 
152 	(void)memset(&st, 0, sizeof(st));
153 //	mbrtowc(0, 0, 0, &st); /* XXX for ISO2022-JP */
154 	stp = use_mbstate ? &st : 0;
155 
156 	for (n = 9; n > 0; n--) {
157 		const char *src = t->data;
158 		wchar_t dst;
159 		size_t nchar = 0;
160 		int width = 0;
161 
162 		ATF_REQUIRE(mbsinit(stp) != 0);
163 
164 		for (;;) {
165 			size_t rv = mbrtowc(&dst, src, n, stp);
166 
167 			if (rv == 0)
168 				break;
169 
170 			if (rv == (size_t)-2) {
171 				src += n;
172 				width += n;
173 
174 				continue;
175 			}
176 			if (rv == (size_t)-1) {
177 				ATF_REQUIRE_EQ(errno, EILSEQ);
178 				atf_tc_fail("Invalid sequence");
179 				/* NOTREACHED */
180 			}
181 
182 			width += rv;
183 			src += rv;
184 
185 			if (dst != t->wchars[nchar] ||
186 			    width != t->widths[nchar]) {
187 				(void)printf("At position %zd:\n", nchar);
188 				(void)printf("  expected: 0x%04X (%u)\n",
189 					t->wchars[nchar], t->widths[nchar]);
190 				(void)printf("  got     : 0x%04X (%u)\n",
191 					dst, width);
192 				atf_tc_fail("Test failed");
193 			}
194 
195 			nchar++;
196 			width = 0;
197 		}
198 
199 		ATF_REQUIRE_EQ_MSG(dst, 0, "Incorrect terminating character: "
200 			"0x%04X (expected: 0x00)", dst);
201 
202 		ATF_REQUIRE_EQ_MSG(nchar, t->length, "Incorrect length: "
203 			"%zd (expected: %zd)", nchar, t->length);
204 	}
205 
206 	{
207 		wchar_t wbuf[SIZE];
208 		size_t rv;
209 		char const *src = t->data;
210 		int i;
211 
212 		(void)memset(wbuf, 0xFF, sizeof(wbuf));
213 
214 		rv = mbsrtowcs(wbuf, &src, SIZE, stp);
215 
216 		ATF_REQUIRE_EQ_MSG(rv, t->length, "Incorrect length: %zd "
217 			"(expected: %zd)", rv, t->length);
218 		ATF_REQUIRE_EQ(src, NULL);
219 
220 		for (i = 0; wbuf[i] != 0; ++i) {
221 			if (wbuf[i] == t->wchars[i])
222 				continue;
223 
224 			(void)printf("At position %d:\n", i);
225 			(void)printf("  expected: 0x%04X\n", t->wchars[i]);
226 			(void)printf("  got     : 0x%04X\n", wbuf[i]);
227 			atf_tc_fail("Test failed");
228 		}
229 
230 		ATF_REQUIRE_EQ_MSG((size_t)i, t->length, "Incorrect length: "
231 			"%d (expected: %zd)", i, t->length);
232 	}
233 
234 	(void)printf("Ok.\n");
235 }
236 
237 ATF_TC(mbrtowc_internal);
238 ATF_TC_HEAD(mbrtowc_internal, tc)
239 {
240 	atf_tc_set_md_var(tc, "descr",
241 		"Checks mbrtowc(3) and mbsrtowcs(3) (using internal "
242 		"state) with different locales");
243 }
244 ATF_TC_BODY(mbrtowc_internal, tc)
245 {
246 	struct test *t;
247 
248 #ifdef __FreeBSD__
249 	atf_tc_expect_fail("ja_* locale fails");
250 #endif
251 	for (t = &tests[0]; t->data != NULL; ++t)
252 		h_ctype2(t, false);
253 }
254 
255 ATF_TC(mbrtowc_object);
256 ATF_TC_HEAD(mbrtowc_object, tc)
257 {
258 	atf_tc_set_md_var(tc, "descr",
259 		"Checks mbrtowc(3) and mbsrtowcs(3) (using state "
260 		"object) with different locales");
261 }
262 ATF_TC_BODY(mbrtowc_object, tc)
263 {
264 	struct test *t;
265 
266 	for (t = &tests[0]; t->data != NULL; ++t)
267 		h_ctype2(t, true);
268 }
269 
270 ATF_TP_ADD_TCS(tp)
271 {
272 
273 	ATF_TP_ADD_TC(tp, mbrtowc_internal);
274 	ATF_TP_ADD_TC(tp, mbrtowc_object);
275 
276 	return atf_no_error();
277 }
278