1 /* Test of conversion of multibyte character to wide character.
2 Copyright (C) 2008 Free Software Foundation, Inc.
4 This program is free software: you can redistribute it and/or modify
5 it under the terms of the GNU General Public License as published by
6 the Free Software Foundation; either version 3 of the License, or
7 (at your option) any later version.
9 This program is distributed in the hope that it will be useful,
10 but WITHOUT ANY WARRANTY; without even the implied warranty of
11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 GNU General Public License for more details.
14 You should have received a copy of the GNU General Public License
15 along with this program. If not, see <http://www.gnu.org/licenses/>. */
17 /* Written by Bruno Haible <bruno@clisp.org>, 2008. */
28 #define ASSERT(expr) \
33 fprintf (stderr, "%s:%d: assertion failed\n", __FILE__, __LINE__); \
41 main (int argc, char *argv[])
47 /* configure should already have checked that the locale is supported. */
48 if (setlocale (LC_ALL, "") == NULL)
51 /* Test zero-length input. */
53 memset (&state, '\0', sizeof (mbstate_t));
55 ret = mbrtowc (&wc, "x", 0, &state);
56 ASSERT (ret == (size_t)(-2) || ret == 0);
57 ASSERT (mbsinit (&state));
60 /* Test NUL byte input. */
62 memset (&state, '\0', sizeof (mbstate_t));
64 ret = mbrtowc (&wc, "", 1, &state);
67 ASSERT (mbsinit (&state));
68 ret = mbrtowc (NULL, "", 1, &state);
70 ASSERT (mbsinit (&state));
73 /* Test single-byte input. */
78 memset (&state, '\0', sizeof (mbstate_t));
79 for (c = 0; c < 0x100; c++)
82 case '\t': case '\v': case '\f':
83 case ' ': case '!': case '"': case '#': case '%':
84 case '&': case '\'': case '(': case ')': case '*':
85 case '+': case ',': case '-': case '.': case '/':
86 case '0': case '1': case '2': case '3': case '4':
87 case '5': case '6': case '7': case '8': case '9':
88 case ':': case ';': case '<': case '=': case '>':
90 case 'A': case 'B': case 'C': case 'D': case 'E':
91 case 'F': case 'G': case 'H': case 'I': case 'J':
92 case 'K': case 'L': case 'M': case 'N': case 'O':
93 case 'P': case 'Q': case 'R': case 'S': case 'T':
94 case 'U': case 'V': case 'W': case 'X': case 'Y':
96 case '[': case '\\': case ']': case '^': case '_':
97 case 'a': case 'b': case 'c': case 'd': case 'e':
98 case 'f': case 'g': case 'h': case 'i': case 'j':
99 case 'k': case 'l': case 'm': case 'n': case 'o':
100 case 'p': case 'q': case 'r': case 's': case 't':
101 case 'u': case 'v': case 'w': case 'x': case 'y':
102 case 'z': case '{': case '|': case '}': case '~':
103 /* c is in the ISO C "basic character set". */
106 ret = mbrtowc (&wc, buf, 1, &state);
109 ASSERT (mbsinit (&state));
110 ret = mbrtowc (NULL, buf, 1, &state);
112 ASSERT (mbsinit (&state));
117 /* Test special calling convention, passing a NULL pointer. */
119 memset (&state, '\0', sizeof (mbstate_t));
121 ret = mbrtowc (&wc, NULL, 5, &state);
123 ASSERT (wc == (wchar_t) 0xBADFACE);
124 ASSERT (mbsinit (&state));
131 /* Locale encoding is ISO-8859-1 or ISO-8859-15. */
133 char input[] = "B\374\337er"; /* "Büßer" */
134 memset (&state, '\0', sizeof (mbstate_t));
137 ret = mbrtowc (&wc, input, 1, &state);
140 ASSERT (mbsinit (&state));
144 ret = mbrtowc (&wc, input + 1, 1, &state);
146 ASSERT (wctob (wc) == (unsigned char) '\374');
147 ASSERT (mbsinit (&state));
151 ret = mbrtowc (&wc, input + 2, 3, &state);
153 ASSERT (wctob (wc) == (unsigned char) '\337');
154 ASSERT (mbsinit (&state));
158 ret = mbrtowc (&wc, input + 3, 2, &state);
161 ASSERT (mbsinit (&state));
165 ret = mbrtowc (&wc, input + 4, 1, &state);
168 ASSERT (mbsinit (&state));
173 /* Locale encoding is UTF-8. */
175 char input[] = "B\303\274\303\237er"; /* "Büßer" */
176 memset (&state, '\0', sizeof (mbstate_t));
179 ret = mbrtowc (&wc, input, 1, &state);
182 ASSERT (mbsinit (&state));
186 ret = mbrtowc (&wc, input + 1, 1, &state);
187 ASSERT (ret == (size_t)(-2));
188 ASSERT (wc == (wchar_t) 0xBADFACE);
189 ASSERT (!mbsinit (&state));
193 ret = mbrtowc (&wc, input + 2, 5, &state);
195 ASSERT (wctob (wc) == EOF);
196 ASSERT (mbsinit (&state));
200 ret = mbrtowc (&wc, input + 3, 4, &state);
202 ASSERT (wctob (wc) == EOF);
203 ASSERT (mbsinit (&state));
208 ret = mbrtowc (&wc, input + 5, 2, &state);
211 ASSERT (mbsinit (&state));
215 ret = mbrtowc (&wc, input + 6, 1, &state);
218 ASSERT (mbsinit (&state));
223 /* Locale encoding is EUC-JP. */
225 char input[] = "B\217\253\344\217\251\316er"; /* "Büßer" */
226 memset (&state, '\0', sizeof (mbstate_t));
229 ret = mbrtowc (&wc, input, 1, &state);
232 ASSERT (mbsinit (&state));
236 ret = mbrtowc (&wc, input + 1, 1, &state);
237 ASSERT (ret == (size_t)(-2));
238 ASSERT (wc == (wchar_t) 0xBADFACE);
239 ASSERT (!mbsinit (&state));
243 ret = mbrtowc (&wc, input + 2, 7, &state);
245 ASSERT (wctob (wc) == EOF);
246 ASSERT (mbsinit (&state));
251 ret = mbrtowc (&wc, input + 4, 5, &state);
253 ASSERT (wctob (wc) == EOF);
254 ASSERT (mbsinit (&state));
260 ret = mbrtowc (&wc, input + 7, 2, &state);
263 ASSERT (mbsinit (&state));
267 ret = mbrtowc (&wc, input + 8, 1, &state);
270 ASSERT (mbsinit (&state));
275 /* Locale encoding is GB18030. */
277 char input[] = "B\250\271\201\060\211\070er"; /* "Büßer" */
278 memset (&state, '\0', sizeof (mbstate_t));
281 ret = mbrtowc (&wc, input, 1, &state);
284 ASSERT (mbsinit (&state));
288 ret = mbrtowc (&wc, input + 1, 1, &state);
289 ASSERT (ret == (size_t)(-2));
290 ASSERT (wc == (wchar_t) 0xBADFACE);
291 ASSERT (!mbsinit (&state));
295 ret = mbrtowc (&wc, input + 2, 7, &state);
297 ASSERT (wctob (wc) == EOF);
298 ASSERT (mbsinit (&state));
302 ret = mbrtowc (&wc, input + 3, 6, &state);
304 ASSERT (wctob (wc) == EOF);
305 ASSERT (mbsinit (&state));
312 ret = mbrtowc (&wc, input + 7, 2, &state);
315 ASSERT (mbsinit (&state));
319 ret = mbrtowc (&wc, input + 8, 1, &state);
322 ASSERT (mbsinit (&state));