1 /* Test of conversion of multibyte character to wide character.
2 Copyright (C) 2008 Free Software Foundation, Inc.
4 This program is free software: you can redistribute it and/or modify
5 it under the terms of the GNU General Public License as published by
6 the Free Software Foundation; either version 3 of the License, or
7 (at your option) any later version.
9 This program is distributed in the hope that it will be useful,
10 but WITHOUT ANY WARRANTY; without even the implied warranty of
11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 GNU General Public License for more details.
14 You should have received a copy of the GNU General Public License
15 along with this program. If not, see <http://www.gnu.org/licenses/>. */
17 /* Written by Bruno Haible <bruno@clisp.org>, 2008. */
28 #define ASSERT(expr) \
33 fprintf (stderr, "%s:%d: assertion failed\n", __FILE__, __LINE__); \
41 main (int argc, char *argv[])
47 /* configure should already have checked that the locale is supported. */
48 if (setlocale (LC_ALL, "") == NULL)
51 /* Test zero-length input. */
53 memset (&state, '\0', sizeof (mbstate_t));
54 wc = (wchar_t) 0xBADFACE;
55 ret = mbrtowc (&wc, "x", 0, &state);
56 /* gnulib's implementation returns (size_t)(-2).
57 The AIX 5.1 implementation returns (size_t)(-1).
58 glibc's implementation returns 0. */
59 ASSERT (ret == (size_t)(-2) || ret == (size_t)(-1) || ret == 0);
60 ASSERT (mbsinit (&state));
63 /* Test NUL byte input. */
65 memset (&state, '\0', sizeof (mbstate_t));
66 wc = (wchar_t) 0xBADFACE;
67 ret = mbrtowc (&wc, "", 1, &state);
70 ASSERT (mbsinit (&state));
71 ret = mbrtowc (NULL, "", 1, &state);
73 ASSERT (mbsinit (&state));
76 /* Test single-byte input. */
81 memset (&state, '\0', sizeof (mbstate_t));
82 for (c = 0; c < 0x100; c++)
85 case '\t': case '\v': case '\f':
86 case ' ': case '!': case '"': case '#': case '%':
87 case '&': case '\'': case '(': case ')': case '*':
88 case '+': case ',': case '-': case '.': case '/':
89 case '0': case '1': case '2': case '3': case '4':
90 case '5': case '6': case '7': case '8': case '9':
91 case ':': case ';': case '<': case '=': case '>':
93 case 'A': case 'B': case 'C': case 'D': case 'E':
94 case 'F': case 'G': case 'H': case 'I': case 'J':
95 case 'K': case 'L': case 'M': case 'N': case 'O':
96 case 'P': case 'Q': case 'R': case 'S': case 'T':
97 case 'U': case 'V': case 'W': case 'X': case 'Y':
99 case '[': case '\\': case ']': case '^': case '_':
100 case 'a': case 'b': case 'c': case 'd': case 'e':
101 case 'f': case 'g': case 'h': case 'i': case 'j':
102 case 'k': case 'l': case 'm': case 'n': case 'o':
103 case 'p': case 'q': case 'r': case 's': case 't':
104 case 'u': case 'v': case 'w': case 'x': case 'y':
105 case 'z': case '{': case '|': case '}': case '~':
106 /* c is in the ISO C "basic character set". */
108 wc = (wchar_t) 0xBADFACE;
109 ret = mbrtowc (&wc, buf, 1, &state);
112 ASSERT (mbsinit (&state));
113 ret = mbrtowc (NULL, buf, 1, &state);
115 ASSERT (mbsinit (&state));
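120 /* Test special calling convention, passing a NULL pointer as the input string: the call is then equivalent to mbrtowc (NULL, "", 1, &state), so the wc and length arguments are ignored. */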
122 memset (&state, '\0', sizeof (mbstate_t));
123 wc = (wchar_t) 0xBADFACE;
124 ret = mbrtowc (&wc, NULL, 5, &state);
126 ASSERT (wc == (wchar_t) 0xBADFACE);
127 ASSERT (mbsinit (&state));
134 /* Locale encoding is ISO-8859-1 or ISO-8859-15. */
136 char input[] = "B\374\337er"; /* "Büßer" */
137 memset (&state, '\0', sizeof (mbstate_t));
139 wc = (wchar_t) 0xBADFACE;
140 ret = mbrtowc (&wc, input, 1, &state);
143 ASSERT (mbsinit (&state));
146 wc = (wchar_t) 0xBADFACE;
147 ret = mbrtowc (&wc, input + 1, 1, &state);
149 ASSERT (wctob (wc) == (unsigned char) '\374');
150 ASSERT (mbsinit (&state));
153 wc = (wchar_t) 0xBADFACE;
154 ret = mbrtowc (&wc, input + 2, 3, &state);
156 ASSERT (wctob (wc) == (unsigned char) '\337');
157 ASSERT (mbsinit (&state));
160 wc = (wchar_t) 0xBADFACE;
161 ret = mbrtowc (&wc, input + 3, 2, &state);
164 ASSERT (mbsinit (&state));
167 wc = (wchar_t) 0xBADFACE;
168 ret = mbrtowc (&wc, input + 4, 1, &state);
171 ASSERT (mbsinit (&state));
176 /* Locale encoding is UTF-8. */
178 char input[] = "B\303\274\303\237er"; /* "Büßer" */
179 memset (&state, '\0', sizeof (mbstate_t));
181 wc = (wchar_t) 0xBADFACE;
182 ret = mbrtowc (&wc, input, 1, &state);
185 ASSERT (mbsinit (&state));
188 wc = (wchar_t) 0xBADFACE;
189 ret = mbrtowc (&wc, input + 1, 1, &state);
190 ASSERT (ret == (size_t)(-2));
191 ASSERT (wc == (wchar_t) 0xBADFACE);
192 ASSERT (!mbsinit (&state));
195 wc = (wchar_t) 0xBADFACE;
196 ret = mbrtowc (&wc, input + 2, 5, &state);
198 ASSERT (wctob (wc) == EOF);
199 ASSERT (mbsinit (&state));
202 wc = (wchar_t) 0xBADFACE;
203 ret = mbrtowc (&wc, input + 3, 4, &state);
205 ASSERT (wctob (wc) == EOF);
206 ASSERT (mbsinit (&state));
210 wc = (wchar_t) 0xBADFACE;
211 ret = mbrtowc (&wc, input + 5, 2, &state);
214 ASSERT (mbsinit (&state));
217 wc = (wchar_t) 0xBADFACE;
218 ret = mbrtowc (&wc, input + 6, 1, &state);
221 ASSERT (mbsinit (&state));
226 /* Locale encoding is EUC-JP. */
228 char input[] = "<\306\374\313\334\270\354>"; /* "<日本語>" */
229 memset (&state, '\0', sizeof (mbstate_t));
231 wc = (wchar_t) 0xBADFACE;
232 ret = mbrtowc (&wc, input, 1, &state);
235 ASSERT (mbsinit (&state));
238 wc = (wchar_t) 0xBADFACE;
239 ret = mbrtowc (&wc, input + 1, 2, &state);
241 ASSERT (wctob (wc) == EOF);
242 ASSERT (mbsinit (&state));
246 wc = (wchar_t) 0xBADFACE;
247 ret = mbrtowc (&wc, input + 3, 1, &state);
248 ASSERT (ret == (size_t)(-2));
249 ASSERT (wc == (wchar_t) 0xBADFACE);
250 ASSERT (!mbsinit (&state));
253 wc = (wchar_t) 0xBADFACE;
254 ret = mbrtowc (&wc, input + 4, 4, &state);
256 ASSERT (wctob (wc) == EOF);
257 ASSERT (mbsinit (&state));
260 wc = (wchar_t) 0xBADFACE;
261 ret = mbrtowc (&wc, input + 5, 3, &state);
263 ASSERT (wctob (wc) == EOF);
264 ASSERT (mbsinit (&state));
268 wc = (wchar_t) 0xBADFACE;
269 ret = mbrtowc (&wc, input + 7, 1, &state);
272 ASSERT (mbsinit (&state));
277 /* Locale encoding is GB18030. */
279 char input[] = "B\250\271\201\060\211\070er"; /* "Büßer" */
280 memset (&state, '\0', sizeof (mbstate_t));
282 wc = (wchar_t) 0xBADFACE;
283 ret = mbrtowc (&wc, input, 1, &state);
286 ASSERT (mbsinit (&state));
289 wc = (wchar_t) 0xBADFACE;
290 ret = mbrtowc (&wc, input + 1, 1, &state);
291 ASSERT (ret == (size_t)(-2));
292 ASSERT (wc == (wchar_t) 0xBADFACE);
293 ASSERT (!mbsinit (&state));
296 wc = (wchar_t) 0xBADFACE;
297 ret = mbrtowc (&wc, input + 2, 7, &state);
299 ASSERT (wctob (wc) == EOF);
300 ASSERT (mbsinit (&state));
303 wc = (wchar_t) 0xBADFACE;
304 ret = mbrtowc (&wc, input + 3, 6, &state);
306 ASSERT (wctob (wc) == EOF);
307 ASSERT (mbsinit (&state));
313 wc = (wchar_t) 0xBADFACE;
314 ret = mbrtowc (&wc, input + 7, 2, &state);
317 ASSERT (mbsinit (&state));
320 wc = (wchar_t) 0xBADFACE;
321 ret = mbrtowc (&wc, input + 8, 1, &state);
324 ASSERT (mbsinit (&state));