t_c16rtomb.c revision 1.5 1 1.5 riastrad /* $NetBSD: t_c16rtomb.c,v 1.5 2024/08/19 16:21:47 riastradh Exp $ */
2 1.1 riastrad
3 1.1 riastrad /*-
4 1.1 riastrad * Copyright (c) 2002 Tim J. Robbins
5 1.1 riastrad * All rights reserved.
6 1.1 riastrad *
7 1.1 riastrad * Copyright (c) 2013 Ed Schouten <ed (at) FreeBSD.org>
8 1.1 riastrad * All rights reserved.
9 1.1 riastrad *
10 1.1 riastrad * Redistribution and use in source and binary forms, with or without
11 1.1 riastrad * modification, are permitted provided that the following conditions
12 1.1 riastrad * are met:
13 1.1 riastrad * 1. Redistributions of source code must retain the above copyright
14 1.1 riastrad * notice, this list of conditions and the following disclaimer.
15 1.1 riastrad * 2. Redistributions in binary form must reproduce the above copyright
16 1.1 riastrad * notice, this list of conditions and the following disclaimer in the
17 1.1 riastrad * documentation and/or other materials provided with the distribution.
18 1.1 riastrad *
19 1.1 riastrad * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
20 1.1 riastrad * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
21 1.1 riastrad * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
22 1.1 riastrad * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
23 1.1 riastrad * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
24 1.1 riastrad * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
25 1.1 riastrad * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
26 1.1 riastrad * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
27 1.1 riastrad * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
28 1.1 riastrad * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29 1.1 riastrad * SUCH DAMAGE.
30 1.1 riastrad */
31 1.1 riastrad /*
32 1.1 riastrad * Test program for c16rtomb() as specified by ISO/IEC 9899:2011.
33 1.1 riastrad */
34 1.1 riastrad
35 1.1 riastrad #include <sys/cdefs.h>
36 1.5 riastrad __RCSID("$NetBSD: t_c16rtomb.c,v 1.5 2024/08/19 16:21:47 riastradh Exp $");
37 1.1 riastrad
38 1.1 riastrad #include <errno.h>
39 1.1 riastrad #include <limits.h>
40 1.1 riastrad #include <locale.h>
41 1.1 riastrad #include <stdio.h>
42 1.1 riastrad #include <string.h>
43 1.1 riastrad #include <uchar.h>
44 1.1 riastrad
45 1.1 riastrad #include <atf-c.h>
46 1.1 riastrad
/*
 * require_lc_ctype(locale_name)
 *
 *	Select locale_name for the LC_CTYPE category.  The current test
 *	case is failed if setlocale() returns NULL, and the requirement
 *	check below also fails it if the name setlocale() returns is not
 *	exactly locale_name.
 */
static void
require_lc_ctype(const char *locale_name)
{
	char *const lc_ctype_set = setlocale(LC_CTYPE, locale_name);

	if (lc_ctype_set == NULL) {
		atf_tc_fail("setlocale(LC_CTYPE, \"%s\") failed; errno=%d",
		    locale_name, errno);
	}

	/* The name reported back must match the name that was requested. */
	ATF_REQUIRE_EQ_MSG(strcmp(lc_ctype_set, locale_name), 0,
	    "lc_ctype_set=%s locale_name=%s", lc_ctype_set, locale_name);
}
60 1.1 riastrad
/*
 * Conversion state and output buffer shared by all test cases.  Each
 * test clears the state and fills the buffer with 0xcc before use.
 */
static mbstate_t s;

/*
 * NOTE(review): presumably sized for the seven c16rtomb() calls made by
 * the ISO-2022-JP test, at most MB_LEN_MAX bytes each, plus one trailing
 * sentinel byte -- confirm.
 */
static char buf[(7 * MB_LEN_MAX) + 1];
63 1.1 riastrad
64 1.1 riastrad ATF_TC_WITHOUT_HEAD(c16rtomb_c_locale_test);
65 1.1 riastrad ATF_TC_BODY(c16rtomb_c_locale_test, tc)
66 1.1 riastrad {
67 1.1 riastrad size_t n;
68 1.1 riastrad
69 1.1 riastrad require_lc_ctype("C");
70 1.1 riastrad
71 1.1 riastrad /*
72 1.1 riastrad * If the buffer argument is NULL, c16 is implicitly 0,
73 1.1 riastrad * c16rtomb() resets its internal state.
74 1.1 riastrad */
75 1.1 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(NULL, L'\0', NULL)), 1, "n=%zu", n);
76 1.1 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(NULL, 0xdc00, NULL)), 1, "n=%zu", n);
77 1.1 riastrad
78 1.1 riastrad /* Null wide character. */
79 1.1 riastrad memset(&s, 0, sizeof(s));
80 1.1 riastrad memset(buf, 0xcc, sizeof(buf));
81 1.1 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0, &s)), 1, "n=%zu", n);
82 1.1 riastrad ATF_CHECK_MSG(((unsigned char)buf[0] == 0 &&
83 1.1 riastrad (unsigned char)buf[1] == 0xcc),
84 1.1 riastrad "buf=[%02x %02x]", buf[0], buf[1]);
85 1.1 riastrad
86 1.1 riastrad /* Latin letter A, internal state. */
87 1.1 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(NULL, L'\0', NULL)), 1, "n=%zu", n);
88 1.1 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(NULL, L'A', NULL)), 1, "n=%zu", n);
89 1.1 riastrad
90 1.1 riastrad /* Latin letter A. */
91 1.1 riastrad memset(&s, 0, sizeof(s));
92 1.1 riastrad memset(buf, 0xcc, sizeof(buf));
93 1.1 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, L'A', &s)), 1, "n=%zu", n);
94 1.1 riastrad ATF_CHECK_MSG(((unsigned char)buf[0] == 'A' &&
95 1.1 riastrad (unsigned char)buf[1] == 0xcc),
96 1.1 riastrad "buf=[%02x %02x]", buf[0], buf[1]);
97 1.1 riastrad
98 1.1 riastrad /* Unicode character 'Pile of poo'. */
99 1.1 riastrad memset(&s, 0, sizeof(s));
100 1.1 riastrad memset(buf, 0xcc, sizeof(buf));
101 1.1 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0xd83d, &s)), 0, "n=%zu", n);
102 1.1 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0xdca9, &s)), (size_t)-1,
103 1.1 riastrad "n=%zu", n);
104 1.1 riastrad ATF_CHECK_EQ_MSG(errno, EILSEQ, "errno=%d", errno);
105 1.1 riastrad ATF_CHECK_EQ_MSG((unsigned char)buf[0], 0xcc, "buf=[%02x]", buf[0]);
106 1.2 riastrad
107 1.2 riastrad /* Incomplete Unicode character 'Pile of poo', interrupted by NUL. */
108 1.2 riastrad memset(&s, 0, sizeof(s));
109 1.2 riastrad memset(buf, 0xcc, sizeof(buf));
110 1.2 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0xd83d, &s)), 0, "n=%zu", n);
111 1.2 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, L'\0', &s)), 1, "n=%zu", n);
112 1.2 riastrad ATF_CHECK_MSG(((unsigned char)buf[0] == '\0' &&
113 1.2 riastrad (unsigned char)buf[1] == 0xcc),
114 1.2 riastrad "buf=[%02x %02x]", buf[0], buf[1]);
115 1.1 riastrad }
116 1.1 riastrad
117 1.4 riastrad ATF_TC_WITHOUT_HEAD(c16rtomb_iso2022jp_locale_test);
118 1.4 riastrad ATF_TC_BODY(c16rtomb_iso2022jp_locale_test, tc)
119 1.4 riastrad {
120 1.4 riastrad char *p;
121 1.4 riastrad size_t n;
122 1.4 riastrad
123 1.4 riastrad require_lc_ctype("ja_JP.ISO-2022-JP");
124 1.4 riastrad
125 1.4 riastrad /*
126 1.4 riastrad * If the buffer argument is NULL, c16 is implicitly 0,
127 1.4 riastrad * c16rtomb() resets its internal state.
128 1.4 riastrad */
129 1.4 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(NULL, L'\0', NULL)), 1, "n=%zu", n);
130 1.4 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(NULL, 0xdc00, NULL)), 1, "n=%zu", n);
131 1.4 riastrad
132 1.4 riastrad /* Null wide character. */
133 1.4 riastrad memset(&s, 0, sizeof(s));
134 1.4 riastrad memset(buf, 0xcc, sizeof(buf));
135 1.4 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0, &s)), 1, "n=%zu", n);
136 1.4 riastrad ATF_CHECK_MSG(((unsigned char)buf[0] == 0 &&
137 1.4 riastrad (unsigned char)buf[1] == 0xcc),
138 1.4 riastrad "buf=[%02x %02x]", buf[0], buf[1]);
139 1.4 riastrad
140 1.4 riastrad /* Latin letter A, internal state. */
141 1.4 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(NULL, L'\0', NULL)), 1, "n=%zu", n);
142 1.4 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(NULL, L'A', NULL)), 1, "n=%zu", n);
143 1.4 riastrad
144 1.4 riastrad /*
145 1.4 riastrad * 1. U+0042 LATIN CAPITAL LETTER A
146 1.4 riastrad * 2. U+00A5 YEN SIGN
147 1.4 riastrad * 3. U+00A5 YEN SIGN (again, no shift needed)
148 1.4 riastrad * 4. U+30A2 KATAKANA LETTER A
149 1.4 riastrad * 5. U+30A2 KATAKANA LETTER A (again, no shift needed)
150 1.4 riastrad * 6. incomplete UTF-16 surrogate pair -- no output
151 1.4 riastrad * 7. U+0000 NUL (plus shift sequence to initial state)
152 1.4 riastrad */
153 1.4 riastrad memset(&s, 0, sizeof(s));
154 1.4 riastrad memset(buf, 0xcc, sizeof(buf));
155 1.4 riastrad p = buf;
156 1.4 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(p, L'A', &s)), 1, "n=%zu", n); /* 1 */
157 1.4 riastrad p += 1;
158 1.4 riastrad atf_tc_expect_fail("PR lib/58612:"
159 1.4 riastrad " c8rtomb/c16rtomb/c32rtomb yield suboptimal shift sequences");
160 1.4 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(p, 0xa5, &s)), 4, "n=%zu", n); /* 2 */
161 1.4 riastrad p += 4;
162 1.4 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(p, 0xa5, &s)), 1, "n=%zu", n); /* 3 */
163 1.4 riastrad p += 1;
164 1.4 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(p, 0x30a2, &s)), 5, "n=%zu", n); /* 4 */
165 1.4 riastrad p += 5;
166 1.4 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(p, 0x30a2, &s)), 2, "n=%zu", n); /* 5 */
167 1.4 riastrad p += 2;
168 1.4 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(p, 0xd800, &s)), 0, "n=%zu", n); /* 6 */
169 1.4 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(p, L'\0', &s)), 4, "n=%zu", n); /* 7 */
170 1.4 riastrad p += 4;
171 1.4 riastrad ATF_CHECK_MSG(((unsigned char)buf[0] == 'A' &&
172 1.4 riastrad (unsigned char)buf[1] == 0x1b && /* shift ISO/IEC 646:JP */
173 1.4 riastrad (unsigned char)buf[2] == '(' &&
174 1.4 riastrad (unsigned char)buf[3] == 'J' &&
175 1.4 riastrad (unsigned char)buf[4] == 0x5c && /* YEN SIGN */
176 1.4 riastrad (unsigned char)buf[5] == 0x5c && /* YEN SIGN */
177 1.5 riastrad (unsigned char)buf[6] == 0x1b && /* shift JIS X 0208 */
178 1.4 riastrad (unsigned char)buf[7] == '$' &&
179 1.4 riastrad (unsigned char)buf[8] == 'B' &&
180 1.4 riastrad (unsigned char)buf[9] == 0x25 && /* KATAKANA LETTER A */
181 1.4 riastrad (unsigned char)buf[10] == 0x22 &&
182 1.4 riastrad (unsigned char)buf[11] == 0x25 && /* KATAKANA LETTER A */
183 1.4 riastrad (unsigned char)buf[12] == 0x22 &&
184 1.4 riastrad (unsigned char)buf[13] == 0x1b && /* shift US-ASCII */
185 1.4 riastrad (unsigned char)buf[14] == '(' &&
186 1.4 riastrad (unsigned char)buf[15] == 'B' &&
187 1.4 riastrad (unsigned char)buf[16] == '\0' &&
188 1.4 riastrad (unsigned char)buf[17] == 0xcc),
189 1.4 riastrad "buf=[%02x %02x %02x %02x %02x %02x %02x %02x "
190 1.4 riastrad " %02x %02x %02x %02x %02x %02x %02x %02x "
191 1.4 riastrad " %02x %02x]",
192 1.4 riastrad buf[0], buf[1], buf[2], buf[3],
193 1.4 riastrad buf[4], buf[5], buf[6], buf[7],
194 1.4 riastrad buf[8], buf[9], buf[10], buf[11],
195 1.4 riastrad buf[12], buf[13], buf[14], buf[15],
196 1.4 riastrad buf[16], buf[17]);
197 1.4 riastrad }
198 1.4 riastrad
199 1.1 riastrad ATF_TC_WITHOUT_HEAD(c16rtomb_iso_8859_1_test);
200 1.1 riastrad ATF_TC_BODY(c16rtomb_iso_8859_1_test, tc)
201 1.1 riastrad {
202 1.1 riastrad size_t n;
203 1.1 riastrad
204 1.1 riastrad require_lc_ctype("en_US.ISO8859-1");
205 1.1 riastrad
206 1.1 riastrad /* Unicode character 'Euro sign'. */
207 1.1 riastrad memset(&s, 0, sizeof(s));
208 1.1 riastrad memset(buf, 0xcc, sizeof(buf));
209 1.1 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0x20ac, &s)), (size_t)-1,
210 1.1 riastrad "n=%zu", n);
211 1.1 riastrad ATF_CHECK_EQ_MSG(errno, EILSEQ, "errno=%d", errno);
212 1.1 riastrad ATF_CHECK_EQ_MSG((unsigned char)buf[0], 0xcc, "buf=[%02x]", buf[0]);
213 1.1 riastrad }
214 1.1 riastrad
215 1.1 riastrad ATF_TC_WITHOUT_HEAD(c16rtomb_iso_8859_15_test);
216 1.1 riastrad ATF_TC_BODY(c16rtomb_iso_8859_15_test, tc)
217 1.1 riastrad {
218 1.1 riastrad size_t n;
219 1.1 riastrad
220 1.1 riastrad require_lc_ctype("en_US.ISO8859-15");
221 1.1 riastrad
222 1.1 riastrad /* Unicode character 'Euro sign'. */
223 1.1 riastrad memset(&s, 0, sizeof(s));
224 1.1 riastrad memset(buf, 0xcc, sizeof(buf));
225 1.1 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0x20ac, &s)), 1, "n=%zu", n);
226 1.1 riastrad ATF_CHECK_MSG(((unsigned char)buf[0] == 0xa4 &&
227 1.1 riastrad (unsigned char)buf[1] == 0xcc),
228 1.1 riastrad "buf=[%02x %02x]", buf[0], buf[1]);
229 1.1 riastrad }
230 1.1 riastrad
231 1.1 riastrad ATF_TC_WITHOUT_HEAD(c16rtomb_utf_8_test);
232 1.1 riastrad ATF_TC_BODY(c16rtomb_utf_8_test, tc)
233 1.1 riastrad {
234 1.1 riastrad size_t n;
235 1.1 riastrad
236 1.1 riastrad require_lc_ctype("en_US.UTF-8");
237 1.1 riastrad
238 1.1 riastrad /* Unicode character 'Pile of poo'. */
239 1.1 riastrad memset(&s, 0, sizeof(s));
240 1.1 riastrad memset(buf, 0xcc, sizeof(buf));
241 1.1 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0xd83d, &s)), 0, "n=%zu", n);
242 1.1 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0xdca9, &s)), 4, "n=%zu", n);
243 1.1 riastrad ATF_CHECK_MSG(((unsigned char)buf[0] == 0xf0 &&
244 1.1 riastrad (unsigned char)buf[1] == 0x9f &&
245 1.1 riastrad (unsigned char)buf[2] == 0x92 &&
246 1.1 riastrad (unsigned char)buf[3] == 0xa9 &&
247 1.1 riastrad (unsigned char)buf[4] == 0xcc),
248 1.1 riastrad "buf=[%02x %02x %02x %02x %02x]",
249 1.1 riastrad buf[0], buf[1], buf[2], buf[3], buf[4]);
250 1.1 riastrad
251 1.1 riastrad /* Invalid code; 'Pile of poo' without the trail surrogate. */
252 1.1 riastrad memset(&s, 0, sizeof(s));
253 1.1 riastrad memset(buf, 0xcc, sizeof(buf));
254 1.1 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0xd83d, &s)), 0, "n=%zu", n);
255 1.1 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, L'A', &s)), (size_t)-1,
256 1.1 riastrad "n=%zu", n);
257 1.1 riastrad ATF_CHECK_EQ_MSG(errno, EILSEQ, "errno=%d", errno);
258 1.1 riastrad ATF_CHECK_EQ_MSG((unsigned char)buf[0], 0xcc, "buf=[%02x]", buf[0]);
259 1.1 riastrad
260 1.1 riastrad /* Invalid code; 'Pile of poo' without the lead surrogate. */
261 1.1 riastrad memset(&s, 0, sizeof(s));
262 1.1 riastrad memset(buf, 0xcc, sizeof(buf));
263 1.1 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0xdca9, &s)), (size_t)-1,
264 1.1 riastrad "n=%zu", n);
265 1.1 riastrad ATF_CHECK_EQ_MSG(errno, EILSEQ, "errno=%d", errno);
266 1.1 riastrad ATF_CHECK_EQ_MSG((unsigned char)buf[0], 0xcc, "buf=[%02x]", buf[0]);
267 1.2 riastrad
268 1.2 riastrad /* Incomplete Unicode character 'Pile of poo', interrupted by NUL. */
269 1.2 riastrad memset(&s, 0, sizeof(s));
270 1.2 riastrad memset(buf, 0xcc, sizeof(buf));
271 1.2 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0xd83d, &s)), 0, "n=%zu", n);
272 1.2 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, L'\0', &s)), 1,
273 1.2 riastrad "n=%zu", n);
274 1.2 riastrad ATF_CHECK_MSG(((unsigned char)buf[0] == '\0' &&
275 1.2 riastrad (unsigned char)buf[1] == 0xcc),
276 1.2 riastrad "buf=[%02x %02x]", buf[0], buf[1]);
277 1.1 riastrad }
278 1.1 riastrad
279 1.1 riastrad ATF_TP_ADD_TCS(tp)
280 1.1 riastrad {
281 1.1 riastrad
282 1.1 riastrad ATF_TP_ADD_TC(tp, c16rtomb_c_locale_test);
283 1.4 riastrad ATF_TP_ADD_TC(tp, c16rtomb_iso2022jp_locale_test);
284 1.1 riastrad ATF_TP_ADD_TC(tp, c16rtomb_iso_8859_1_test);
285 1.1 riastrad ATF_TP_ADD_TC(tp, c16rtomb_iso_8859_15_test);
286 1.1 riastrad ATF_TP_ADD_TC(tp, c16rtomb_utf_8_test);
287 1.1 riastrad
288 1.1 riastrad return (atf_no_error());
289 1.1 riastrad }
290