1 /* Test of conversion of multibyte character to wide character.
2 Copyright (C) 2008 Free Software Foundation, Inc.
4 This program is free software: you can redistribute it and/or modify
5 it under the terms of the GNU General Public License as published by
6 the Free Software Foundation; either version 3 of the License, or
7 (at your option) any later version.
9 This program is distributed in the hope that it will be useful,
10 but WITHOUT ANY WARRANTY; without even the implied warranty of
11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 GNU General Public License for more details.
14 You should have received a copy of the GNU General Public License
15 along with this program. If not, see <http://www.gnu.org/licenses/>. */
17 /* Written by Bruno Haible <bruno@clisp.org>, 2008. */
28 #define ASSERT(expr) \
33 fprintf (stderr, "%s:%d: assertion failed\n", __FILE__, __LINE__); \
41 main (int argc, char *argv[])
47 /* configure should already have checked that the locale is supported. */
48 if (setlocale (LC_ALL, "") == NULL)
51 /* Test zero-length input. */
53 memset (&state, '\0', sizeof (mbstate_t));
55 ret = mbrtowc (&wc, "x", 0, &state);
56 /* gnulib's implementation returns (size_t)(-2).
57 The AIX 5.1 implementation returns (size_t)(-1).
58 glibc's implementation returns 0. */
59 ASSERT (ret == (size_t)(-2) || ret == (size_t)(-1) || ret == 0);
60 ASSERT (mbsinit (&state));
63 /* Test NUL byte input. */
65 memset (&state, '\0', sizeof (mbstate_t));
67 ret = mbrtowc (&wc, "", 1, &state);
70 ASSERT (mbsinit (&state));
71 ret = mbrtowc (NULL, "", 1, &state);
73 ASSERT (mbsinit (&state));
76 /* Test single-byte input. */
81 memset (&state, '\0', sizeof (mbstate_t));
82 for (c = 0; c < 0x100; c++)
85 case '\t': case '\v': case '\f':
86 case ' ': case '!': case '"': case '#': case '%':
87 case '&': case '\'': case '(': case ')': case '*':
88 case '+': case ',': case '-': case '.': case '/':
89 case '0': case '1': case '2': case '3': case '4':
90 case '5': case '6': case '7': case '8': case '9':
91 case ':': case ';': case '<': case '=': case '>':
93 case 'A': case 'B': case 'C': case 'D': case 'E':
94 case 'F': case 'G': case 'H': case 'I': case 'J':
95 case 'K': case 'L': case 'M': case 'N': case 'O':
96 case 'P': case 'Q': case 'R': case 'S': case 'T':
97 case 'U': case 'V': case 'W': case 'X': case 'Y':
99 case '[': case '\\': case ']': case '^': case '_':
100 case 'a': case 'b': case 'c': case 'd': case 'e':
101 case 'f': case 'g': case 'h': case 'i': case 'j':
102 case 'k': case 'l': case 'm': case 'n': case 'o':
103 case 'p': case 'q': case 'r': case 's': case 't':
104 case 'u': case 'v': case 'w': case 'x': case 'y':
105 case 'z': case '{': case '|': case '}': case '~':
106 /* c is in the ISO C "basic character set". */
109 ret = mbrtowc (&wc, buf, 1, &state);
112 ASSERT (mbsinit (&state));
113 ret = mbrtowc (NULL, buf, 1, &state);
115 ASSERT (mbsinit (&state));
120 /* Test special calling convention, passing a NULL pointer as the input string: mbrtowc must then ignore its pwc and n arguments. */
122 memset (&state, '\0', sizeof (mbstate_t));
124 ret = mbrtowc (&wc, NULL, 5, &state);
126 ASSERT (wc == (wchar_t) 0xBADFACE);
127 ASSERT (mbsinit (&state));
134 /* Locale encoding is ISO-8859-1 or ISO-8859-15. */
136 char input[] = "B\374\337er"; /* "Büßer" */
137 memset (&state, '\0', sizeof (mbstate_t));
140 ret = mbrtowc (&wc, input, 1, &state);
143 ASSERT (mbsinit (&state));
147 ret = mbrtowc (&wc, input + 1, 1, &state);
149 ASSERT (wctob (wc) == (unsigned char) '\374');
150 ASSERT (mbsinit (&state));
154 ret = mbrtowc (&wc, input + 2, 3, &state);
156 ASSERT (wctob (wc) == (unsigned char) '\337');
157 ASSERT (mbsinit (&state));
161 ret = mbrtowc (&wc, input + 3, 2, &state);
164 ASSERT (mbsinit (&state));
168 ret = mbrtowc (&wc, input + 4, 1, &state);
171 ASSERT (mbsinit (&state));
176 /* Locale encoding is UTF-8. */
178 char input[] = "B\303\274\303\237er"; /* "Büßer" */
179 memset (&state, '\0', sizeof (mbstate_t));
182 ret = mbrtowc (&wc, input, 1, &state);
185 ASSERT (mbsinit (&state));
189 ret = mbrtowc (&wc, input + 1, 1, &state);
190 ASSERT (ret == (size_t)(-2));
191 ASSERT (wc == (wchar_t) 0xBADFACE);
192 ASSERT (!mbsinit (&state));
196 ret = mbrtowc (&wc, input + 2, 5, &state);
198 ASSERT (wctob (wc) == EOF);
199 ASSERT (mbsinit (&state));
203 ret = mbrtowc (&wc, input + 3, 4, &state);
205 ASSERT (wctob (wc) == EOF);
206 ASSERT (mbsinit (&state));
211 ret = mbrtowc (&wc, input + 5, 2, &state);
214 ASSERT (mbsinit (&state));
218 ret = mbrtowc (&wc, input + 6, 1, &state);
221 ASSERT (mbsinit (&state));
226 /* Locale encoding is EUC-JP. */
228 char input[] = "B\217\253\344\217\251\316er"; /* "Büßer" */
229 memset (&state, '\0', sizeof (mbstate_t));
232 ret = mbrtowc (&wc, input, 1, &state);
235 ASSERT (mbsinit (&state));
239 ret = mbrtowc (&wc, input + 1, 1, &state);
240 ASSERT (ret == (size_t)(-2));
241 ASSERT (wc == (wchar_t) 0xBADFACE);
242 ASSERT (!mbsinit (&state));
246 ret = mbrtowc (&wc, input + 2, 7, &state);
248 ASSERT (wctob (wc) == EOF);
249 ASSERT (mbsinit (&state));
254 ret = mbrtowc (&wc, input + 4, 5, &state);
256 ASSERT (wctob (wc) == EOF);
257 ASSERT (mbsinit (&state));
263 ret = mbrtowc (&wc, input + 7, 2, &state);
266 ASSERT (mbsinit (&state));
270 ret = mbrtowc (&wc, input + 8, 1, &state);
273 ASSERT (mbsinit (&state));
278 /* Locale encoding is GB18030. */
280 char input[] = "B\250\271\201\060\211\070er"; /* "Büßer" */
281 memset (&state, '\0', sizeof (mbstate_t));
284 ret = mbrtowc (&wc, input, 1, &state);
287 ASSERT (mbsinit (&state));
291 ret = mbrtowc (&wc, input + 1, 1, &state);
292 ASSERT (ret == (size_t)(-2));
293 ASSERT (wc == (wchar_t) 0xBADFACE);
294 ASSERT (!mbsinit (&state));
298 ret = mbrtowc (&wc, input + 2, 7, &state);
300 ASSERT (wctob (wc) == EOF);
301 ASSERT (mbsinit (&state));
305 ret = mbrtowc (&wc, input + 3, 6, &state);
307 ASSERT (wctob (wc) == EOF);
308 ASSERT (mbsinit (&state));
315 ret = mbrtowc (&wc, input + 7, 2, &state);
318 ASSERT (mbsinit (&state));
322 ret = mbrtowc (&wc, input + 8, 1, &state);
325 ASSERT (mbsinit (&state));