xref: /freebsd/lib/libc/tests/locale/mbrtowc_test.c (revision b37f6c9805edb4b89f0a8c2b78f78a3dcfc0647b)
1 /*-
2  * Copyright (c) 2002 Tim J. Robbins
3  * All rights reserved.
4  *
5  * Redistribution and use in source and binary forms, with or without
6  * modification, are permitted provided that the following conditions
7  * are met:
8  * 1. Redistributions of source code must retain the above copyright
9  *    notice, this list of conditions and the following disclaimer.
10  * 2. Redistributions in binary form must reproduce the above copyright
11  *    notice, this list of conditions and the following disclaimer in the
12  *    documentation and/or other materials provided with the distribution.
13  *
14  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
15  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
16  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
17  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
18  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
19  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
20  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
21  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
22  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
23  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
24  * SUCH DAMAGE.
25  */
26 
27 /*
28  * Test program for mbrtowc(), as specified by IEEE Std. 1003.1-2001 and
29  * ISO/IEC 9899:1999.
30  *
31  * The function is tested with both the "C" ("POSIX") LC_CTYPE setting and
32  * "ja_JP.eucJP". Other encodings are not tested.
33  */
34 
35 #include <sys/cdefs.h>
36 __FBSDID("$FreeBSD$");
37 
38 #include <errno.h>
39 #include <limits.h>
40 #include <locale.h>
41 #include <stdio.h>
42 #include <stdlib.h>
43 #include <string.h>
44 #include <wchar.h>
45 
46 #include <atf-c.h>
47 
/*
 * mbrtowc_test: exercise mbrtowc() first in the initial "C" locale and then
 * in the "ja_JP.eucJP" locale.
 *
 * Each scenario is run against both the function's internal conversion state
 * (ps == NULL) and a caller-supplied, zero-initialised mbstate_t.  The cases
 * cover the null wide character, a single-byte character, zero-length input,
 * and -- for EUC-JP only -- a truncated two-byte character, the complete
 * two-byte character, and restarting a conversion across two calls.
 *
 * Every check uses ATF_REQUIRE, so the first failing check ends the test case.
 */
ATF_TC_WITHOUT_HEAD(mbrtowc_test);
ATF_TC_BODY(mbrtowc_test, tc)
{
	mbstate_t s;
	wchar_t wc;
	char buf[MB_LEN_MAX + 1];
	const char *locale;

	/*
	 * C/POSIX locale.
	 */

	ATF_REQUIRE(MB_CUR_MAX == 1);

	/*
	 * Null wide character, internal state.
	 * The buffer is filled with 0xcc so that only buf[0] holds the byte
	 * under test.
	 */
	memset(buf, 0xcc, sizeof(buf));
	buf[0] = 0;
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, NULL) == 0);
	ATF_REQUIRE(wc == 0);

	/* Null wide character, caller-supplied state. */
	memset(&s, 0, sizeof(s));
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, &s) == 0);
	ATF_REQUIRE(wc == 0);

	/*
	 * Latin letter A, internal state.
	 * The call with a null string pointer is expected to return 0 and
	 * leaves the internal state in its initial condition before the
	 * conversion proper.
	 */
	ATF_REQUIRE(mbrtowc(NULL, 0, 0, NULL) == 0);
	buf[0] = 'A';
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, NULL) == 1);
	ATF_REQUIRE(wc == L'A');

	/* Latin letter A, caller-supplied state. */
	memset(&s, 0, sizeof(s));
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, &s) == 1);
	ATF_REQUIRE(wc == L'A');

	/*
	 * Incomplete character sequence: with n == 0 the result must be
	 * (size_t)-2 and the sentinel stored in wc must be left untouched.
	 */
	wc = L'z';
	memset(&s, 0, sizeof(s));
	ATF_REQUIRE(mbrtowc(&wc, buf, 0, &s) == (size_t)-2);
	ATF_REQUIRE(wc == L'z');

	/*
	 * Check that mbrtowc() doesn't access the buffer when n == 0: even
	 * with a NUL byte at buf[0] the call must still report an incomplete
	 * sequence rather than a null wide character.
	 */
	wc = L'z';
	memset(&s, 0, sizeof(s));
	buf[0] = '\0';
	ATF_REQUIRE(mbrtowc(&wc, buf, 0, &s) == (size_t)-2);
	ATF_REQUIRE(wc == L'z');

	/*
	 * Japanese (EUC) locale.
	 */

	/*
	 * setlocale() returns NULL when the requested locale cannot be
	 * selected (for example, when it is not installed).  Check for that
	 * before handing the result to strcmp(), so that a missing locale is
	 * reported as a test failure instead of a null pointer dereference.
	 */
	locale = setlocale(LC_CTYPE, "ja_JP.eucJP");
	ATF_REQUIRE(locale != NULL);
	ATF_REQUIRE(strcmp(locale, "ja_JP.eucJP") == 0);
	ATF_REQUIRE(MB_CUR_MAX > 1);

	/* Null wide character, internal state. */
	ATF_REQUIRE(mbrtowc(NULL, 0, 0, NULL) == 0);
	memset(buf, 0xcc, sizeof(buf));
	buf[0] = 0;
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, NULL) == 0);
	ATF_REQUIRE(wc == 0);

	/* Null wide character, caller-supplied state. */
	memset(&s, 0, sizeof(s));
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, &s) == 0);
	ATF_REQUIRE(wc == 0);

	/* Latin letter A, internal state. */
	ATF_REQUIRE(mbrtowc(NULL, 0, 0, NULL) == 0);
	buf[0] = 'A';
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, NULL) == 1);
	ATF_REQUIRE(wc == L'A');

	/* Latin letter A, caller-supplied state. */
	memset(&s, 0, sizeof(s));
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, &s) == 1);
	ATF_REQUIRE(wc == L'A');

	/* Incomplete character sequence (zero length). */
	wc = L'z';
	memset(&s, 0, sizeof(s));
	ATF_REQUIRE(mbrtowc(&wc, buf, 0, &s) == (size_t)-2);
	ATF_REQUIRE(wc == L'z');

	/*
	 * Incomplete character sequence (truncated double-byte): only the
	 * lead byte 0xa3 is made available to the conversion.
	 */
	memset(buf, 0xcc, sizeof(buf));
	buf[0] = 0xa3;
	buf[1] = 0x00;
	memset(&s, 0, sizeof(s));
	wc = 0;
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, &s) == (size_t)-2);

	/* Same as above, but complete: both bytes are supplied at once. */
	buf[1] = 0xc1;
	memset(&s, 0, sizeof(s));
	wc = 0;
	ATF_REQUIRE(mbrtowc(&wc, buf, 2, &s) == 2);
	ATF_REQUIRE(wc == 0xa3c1);

	/*
	 * Test restarting behaviour: feed the lead byte and the trail byte in
	 * two separate calls that share the state object s.  The first call
	 * must report an incomplete sequence without storing to wc; the
	 * second must consume one byte and yield the full character.
	 */
	memset(buf, 0xcc, sizeof(buf));
	buf[0] = 0xa3;
	memset(&s, 0, sizeof(s));
	wc = 0;
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, &s) == (size_t)-2);
	ATF_REQUIRE(wc == 0);
	buf[0] = 0xc1;
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, &s) == 1);
	ATF_REQUIRE(wc == 0xa3c1);
}
158 
159 ATF_TP_ADD_TCS(tp)
160 {
161 
162 	ATF_TP_ADD_TC(tp, mbrtowc_test);
163 
164 	return (atf_no_error());
165 }
166