1 1.6 riastrad /* $NetBSD: t_c16rtomb.c,v 1.6 2024/08/19 16:22:10 riastradh Exp $ */ 2 1.1 riastrad 3 1.1 riastrad /*- 4 1.1 riastrad * Copyright (c) 2002 Tim J. Robbins 5 1.1 riastrad * All rights reserved. 6 1.1 riastrad * 7 1.1 riastrad * Copyright (c) 2013 Ed Schouten <ed (at) FreeBSD.org> 8 1.1 riastrad * All rights reserved. 9 1.1 riastrad * 10 1.1 riastrad * Redistribution and use in source and binary forms, with or without 11 1.1 riastrad * modification, are permitted provided that the following conditions 12 1.1 riastrad * are met: 13 1.1 riastrad * 1. Redistributions of source code must retain the above copyright 14 1.1 riastrad * notice, this list of conditions and the following disclaimer. 15 1.1 riastrad * 2. Redistributions in binary form must reproduce the above copyright 16 1.1 riastrad * notice, this list of conditions and the following disclaimer in the 17 1.1 riastrad * documentation and/or other materials provided with the distribution. 18 1.1 riastrad * 19 1.1 riastrad * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 20 1.1 riastrad * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 21 1.1 riastrad * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 22 1.1 riastrad * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 23 1.1 riastrad * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 24 1.1 riastrad * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 25 1.1 riastrad * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 26 1.1 riastrad * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 27 1.1 riastrad * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 28 1.1 riastrad * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 29 1.1 riastrad * SUCH DAMAGE. 30 1.1 riastrad */ 31 1.1 riastrad /* 32 1.1 riastrad * Test program for c16rtomb() as specified by ISO/IEC 9899:2011. 33 1.1 riastrad */ 34 1.1 riastrad 35 1.1 riastrad #include <sys/cdefs.h> 36 1.6 riastrad __RCSID("$NetBSD: t_c16rtomb.c,v 1.6 2024/08/19 16:22:10 riastradh Exp $"); 37 1.1 riastrad 38 1.1 riastrad #include <errno.h> 39 1.1 riastrad #include <limits.h> 40 1.1 riastrad #include <locale.h> 41 1.1 riastrad #include <stdio.h> 42 1.1 riastrad #include <string.h> 43 1.1 riastrad #include <uchar.h> 44 1.1 riastrad 45 1.1 riastrad #include <atf-c.h> 46 1.1 riastrad 47 1.1 riastrad static void 48 1.1 riastrad require_lc_ctype(const char *locale_name) 49 1.1 riastrad { 50 1.1 riastrad char *lc_ctype_set; 51 1.1 riastrad 52 1.1 riastrad lc_ctype_set = setlocale(LC_CTYPE, locale_name); 53 1.1 riastrad if (lc_ctype_set == NULL) 54 1.1 riastrad atf_tc_fail("setlocale(LC_CTYPE, \"%s\") failed; errno=%d", 55 1.1 riastrad locale_name, errno); 56 1.1 riastrad 57 1.1 riastrad ATF_REQUIRE_EQ_MSG(strcmp(lc_ctype_set, locale_name), 0, 58 1.1 riastrad "lc_ctype_set=%s locale_name=%s", lc_ctype_set, locale_name); 59 1.1 riastrad } 60 1.1 riastrad 61 1.1 riastrad static mbstate_t s; 62 1.4 riastrad static char buf[7*MB_LEN_MAX + 1]; 63 1.1 riastrad 64 1.1 riastrad ATF_TC_WITHOUT_HEAD(c16rtomb_c_locale_test); 65 1.1 riastrad ATF_TC_BODY(c16rtomb_c_locale_test, tc) 66 1.1 riastrad { 67 1.1 riastrad size_t n; 68 1.1 riastrad 69 1.1 riastrad require_lc_ctype("C"); 70 1.1 riastrad 71 1.1 riastrad /* 72 1.1 riastrad * If the buffer argument is NULL, c16 is implicitly 0, 73 1.1 riastrad * c16rtomb() resets its internal state. 74 1.1 riastrad */ 75 1.1 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(NULL, L'\0', NULL)), 1, "n=%zu", n); 76 1.1 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(NULL, 0xdc00, NULL)), 1, "n=%zu", n); 77 1.1 riastrad 78 1.1 riastrad /* Null wide character. */ 79 1.1 riastrad memset(&s, 0, sizeof(s)); 80 1.1 riastrad memset(buf, 0xcc, sizeof(buf)); 81 1.1 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0, &s)), 1, "n=%zu", n); 82 1.1 riastrad ATF_CHECK_MSG(((unsigned char)buf[0] == 0 && 83 1.1 riastrad (unsigned char)buf[1] == 0xcc), 84 1.1 riastrad "buf=[%02x %02x]", buf[0], buf[1]); 85 1.1 riastrad 86 1.1 riastrad /* Latin letter A, internal state. */ 87 1.1 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(NULL, L'\0', NULL)), 1, "n=%zu", n); 88 1.1 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(NULL, L'A', NULL)), 1, "n=%zu", n); 89 1.1 riastrad 90 1.1 riastrad /* Latin letter A. */ 91 1.1 riastrad memset(&s, 0, sizeof(s)); 92 1.1 riastrad memset(buf, 0xcc, sizeof(buf)); 93 1.1 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, L'A', &s)), 1, "n=%zu", n); 94 1.1 riastrad ATF_CHECK_MSG(((unsigned char)buf[0] == 'A' && 95 1.1 riastrad (unsigned char)buf[1] == 0xcc), 96 1.1 riastrad "buf=[%02x %02x]", buf[0], buf[1]); 97 1.1 riastrad 98 1.1 riastrad /* Unicode character 'Pile of poo'. */ 99 1.1 riastrad memset(&s, 0, sizeof(s)); 100 1.1 riastrad memset(buf, 0xcc, sizeof(buf)); 101 1.1 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0xd83d, &s)), 0, "n=%zu", n); 102 1.1 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0xdca9, &s)), (size_t)-1, 103 1.1 riastrad "n=%zu", n); 104 1.1 riastrad ATF_CHECK_EQ_MSG(errno, EILSEQ, "errno=%d", errno); 105 1.1 riastrad ATF_CHECK_EQ_MSG((unsigned char)buf[0], 0xcc, "buf=[%02x]", buf[0]); 106 1.2 riastrad 107 1.2 riastrad /* Incomplete Unicode character 'Pile of poo', interrupted by NUL. */ 108 1.2 riastrad memset(&s, 0, sizeof(s)); 109 1.2 riastrad memset(buf, 0xcc, sizeof(buf)); 110 1.2 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0xd83d, &s)), 0, "n=%zu", n); 111 1.2 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, L'\0', &s)), 1, "n=%zu", n); 112 1.2 riastrad ATF_CHECK_MSG(((unsigned char)buf[0] == '\0' && 113 1.2 riastrad (unsigned char)buf[1] == 0xcc), 114 1.2 riastrad "buf=[%02x %02x]", buf[0], buf[1]); 115 1.1 riastrad } 116 1.1 riastrad 117 1.4 riastrad ATF_TC_WITHOUT_HEAD(c16rtomb_iso2022jp_locale_test); 118 1.4 riastrad ATF_TC_BODY(c16rtomb_iso2022jp_locale_test, tc) 119 1.4 riastrad { 120 1.4 riastrad char *p; 121 1.4 riastrad size_t n; 122 1.4 riastrad 123 1.4 riastrad require_lc_ctype("ja_JP.ISO-2022-JP"); 124 1.4 riastrad 125 1.4 riastrad /* 126 1.4 riastrad * If the buffer argument is NULL, c16 is implicitly 0, 127 1.4 riastrad * c16rtomb() resets its internal state. 128 1.4 riastrad */ 129 1.4 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(NULL, L'\0', NULL)), 1, "n=%zu", n); 130 1.4 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(NULL, 0xdc00, NULL)), 1, "n=%zu", n); 131 1.4 riastrad 132 1.4 riastrad /* Null wide character. */ 133 1.4 riastrad memset(&s, 0, sizeof(s)); 134 1.4 riastrad memset(buf, 0xcc, sizeof(buf)); 135 1.4 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0, &s)), 1, "n=%zu", n); 136 1.4 riastrad ATF_CHECK_MSG(((unsigned char)buf[0] == 0 && 137 1.4 riastrad (unsigned char)buf[1] == 0xcc), 138 1.4 riastrad "buf=[%02x %02x]", buf[0], buf[1]); 139 1.4 riastrad 140 1.4 riastrad /* Latin letter A, internal state. */ 141 1.4 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(NULL, L'\0', NULL)), 1, "n=%zu", n); 142 1.4 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(NULL, L'A', NULL)), 1, "n=%zu", n); 143 1.4 riastrad 144 1.4 riastrad /* 145 1.4 riastrad * 1. U+0042 LATIN CAPITAL LETTER A 146 1.4 riastrad * 2. U+00A5 YEN SIGN 147 1.4 riastrad * 3. U+00A5 YEN SIGN (again, no shift needed) 148 1.4 riastrad * 4. U+30A2 KATAKANA LETTER A 149 1.4 riastrad * 5. U+30A2 KATAKANA LETTER A (again, no shift needed) 150 1.4 riastrad * 6. incomplete UTF-16 surrogate pair -- no output 151 1.4 riastrad * 7. U+0000 NUL (plus shift sequence to initial state) 152 1.4 riastrad */ 153 1.4 riastrad memset(&s, 0, sizeof(s)); 154 1.4 riastrad memset(buf, 0xcc, sizeof(buf)); 155 1.4 riastrad p = buf; 156 1.4 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(p, L'A', &s)), 1, "n=%zu", n); /* 1 */ 157 1.4 riastrad p += 1; 158 1.4 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(p, 0xa5, &s)), 4, "n=%zu", n); /* 2 */ 159 1.4 riastrad p += 4; 160 1.4 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(p, 0xa5, &s)), 1, "n=%zu", n); /* 3 */ 161 1.4 riastrad p += 1; 162 1.4 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(p, 0x30a2, &s)), 5, "n=%zu", n); /* 4 */ 163 1.4 riastrad p += 5; 164 1.4 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(p, 0x30a2, &s)), 2, "n=%zu", n); /* 5 */ 165 1.4 riastrad p += 2; 166 1.4 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(p, 0xd800, &s)), 0, "n=%zu", n); /* 6 */ 167 1.4 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(p, L'\0', &s)), 4, "n=%zu", n); /* 7 */ 168 1.4 riastrad p += 4; 169 1.4 riastrad ATF_CHECK_MSG(((unsigned char)buf[0] == 'A' && 170 1.4 riastrad (unsigned char)buf[1] == 0x1b && /* shift ISO/IEC 646:JP */ 171 1.4 riastrad (unsigned char)buf[2] == '(' && 172 1.4 riastrad (unsigned char)buf[3] == 'J' && 173 1.4 riastrad (unsigned char)buf[4] == 0x5c && /* YEN SIGN */ 174 1.4 riastrad (unsigned char)buf[5] == 0x5c && /* YEN SIGN */ 175 1.5 riastrad (unsigned char)buf[6] == 0x1b && /* shift JIS X 0208 */ 176 1.4 riastrad (unsigned char)buf[7] == '$' && 177 1.4 riastrad (unsigned char)buf[8] == 'B' && 178 1.4 riastrad (unsigned char)buf[9] == 0x25 && /* KATAKANA LETTER A */ 179 1.4 riastrad (unsigned char)buf[10] == 0x22 && 180 1.4 riastrad (unsigned char)buf[11] == 0x25 && /* KATAKANA LETTER A */ 181 1.4 riastrad (unsigned char)buf[12] == 0x22 && 182 1.4 riastrad (unsigned char)buf[13] == 0x1b && /* shift US-ASCII */ 183 1.4 riastrad (unsigned char)buf[14] == '(' && 184 1.4 riastrad (unsigned char)buf[15] == 'B' && 185 1.4 riastrad (unsigned char)buf[16] == '\0' && 186 1.4 riastrad (unsigned char)buf[17] == 0xcc), 187 1.4 riastrad "buf=[%02x %02x %02x %02x %02x %02x %02x %02x " 188 1.4 riastrad " %02x %02x %02x %02x %02x %02x %02x %02x " 189 1.4 riastrad " %02x %02x]", 190 1.4 riastrad buf[0], buf[1], buf[2], buf[3], 191 1.4 riastrad buf[4], buf[5], buf[6], buf[7], 192 1.4 riastrad buf[8], buf[9], buf[10], buf[11], 193 1.4 riastrad buf[12], buf[13], buf[14], buf[15], 194 1.4 riastrad buf[16], buf[17]); 195 1.4 riastrad } 196 1.4 riastrad 197 1.1 riastrad ATF_TC_WITHOUT_HEAD(c16rtomb_iso_8859_1_test); 198 1.1 riastrad ATF_TC_BODY(c16rtomb_iso_8859_1_test, tc) 199 1.1 riastrad { 200 1.1 riastrad size_t n; 201 1.1 riastrad 202 1.1 riastrad require_lc_ctype("en_US.ISO8859-1"); 203 1.1 riastrad 204 1.1 riastrad /* Unicode character 'Euro sign'. */ 205 1.1 riastrad memset(&s, 0, sizeof(s)); 206 1.1 riastrad memset(buf, 0xcc, sizeof(buf)); 207 1.1 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0x20ac, &s)), (size_t)-1, 208 1.1 riastrad "n=%zu", n); 209 1.1 riastrad ATF_CHECK_EQ_MSG(errno, EILSEQ, "errno=%d", errno); 210 1.1 riastrad ATF_CHECK_EQ_MSG((unsigned char)buf[0], 0xcc, "buf=[%02x]", buf[0]); 211 1.1 riastrad } 212 1.1 riastrad 213 1.1 riastrad ATF_TC_WITHOUT_HEAD(c16rtomb_iso_8859_15_test); 214 1.1 riastrad ATF_TC_BODY(c16rtomb_iso_8859_15_test, tc) 215 1.1 riastrad { 216 1.1 riastrad size_t n; 217 1.1 riastrad 218 1.1 riastrad require_lc_ctype("en_US.ISO8859-15"); 219 1.1 riastrad 220 1.1 riastrad /* Unicode character 'Euro sign'. */ 221 1.1 riastrad memset(&s, 0, sizeof(s)); 222 1.1 riastrad memset(buf, 0xcc, sizeof(buf)); 223 1.1 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0x20ac, &s)), 1, "n=%zu", n); 224 1.1 riastrad ATF_CHECK_MSG(((unsigned char)buf[0] == 0xa4 && 225 1.1 riastrad (unsigned char)buf[1] == 0xcc), 226 1.1 riastrad "buf=[%02x %02x]", buf[0], buf[1]); 227 1.1 riastrad } 228 1.1 riastrad 229 1.1 riastrad ATF_TC_WITHOUT_HEAD(c16rtomb_utf_8_test); 230 1.1 riastrad ATF_TC_BODY(c16rtomb_utf_8_test, tc) 231 1.1 riastrad { 232 1.1 riastrad size_t n; 233 1.1 riastrad 234 1.1 riastrad require_lc_ctype("en_US.UTF-8"); 235 1.1 riastrad 236 1.1 riastrad /* Unicode character 'Pile of poo'. */ 237 1.1 riastrad memset(&s, 0, sizeof(s)); 238 1.1 riastrad memset(buf, 0xcc, sizeof(buf)); 239 1.1 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0xd83d, &s)), 0, "n=%zu", n); 240 1.1 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0xdca9, &s)), 4, "n=%zu", n); 241 1.1 riastrad ATF_CHECK_MSG(((unsigned char)buf[0] == 0xf0 && 242 1.1 riastrad (unsigned char)buf[1] == 0x9f && 243 1.1 riastrad (unsigned char)buf[2] == 0x92 && 244 1.1 riastrad (unsigned char)buf[3] == 0xa9 && 245 1.1 riastrad (unsigned char)buf[4] == 0xcc), 246 1.1 riastrad "buf=[%02x %02x %02x %02x %02x]", 247 1.1 riastrad buf[0], buf[1], buf[2], buf[3], buf[4]); 248 1.1 riastrad 249 1.1 riastrad /* Invalid code; 'Pile of poo' without the trail surrogate. */ 250 1.1 riastrad memset(&s, 0, sizeof(s)); 251 1.1 riastrad memset(buf, 0xcc, sizeof(buf)); 252 1.1 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0xd83d, &s)), 0, "n=%zu", n); 253 1.1 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, L'A', &s)), (size_t)-1, 254 1.1 riastrad "n=%zu", n); 255 1.1 riastrad ATF_CHECK_EQ_MSG(errno, EILSEQ, "errno=%d", errno); 256 1.1 riastrad ATF_CHECK_EQ_MSG((unsigned char)buf[0], 0xcc, "buf=[%02x]", buf[0]); 257 1.1 riastrad 258 1.1 riastrad /* Invalid code; 'Pile of poo' without the lead surrogate. */ 259 1.1 riastrad memset(&s, 0, sizeof(s)); 260 1.1 riastrad memset(buf, 0xcc, sizeof(buf)); 261 1.1 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0xdca9, &s)), (size_t)-1, 262 1.1 riastrad "n=%zu", n); 263 1.1 riastrad ATF_CHECK_EQ_MSG(errno, EILSEQ, "errno=%d", errno); 264 1.1 riastrad ATF_CHECK_EQ_MSG((unsigned char)buf[0], 0xcc, "buf=[%02x]", buf[0]); 265 1.2 riastrad 266 1.2 riastrad /* Incomplete Unicode character 'Pile of poo', interrupted by NUL. */ 267 1.2 riastrad memset(&s, 0, sizeof(s)); 268 1.2 riastrad memset(buf, 0xcc, sizeof(buf)); 269 1.2 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0xd83d, &s)), 0, "n=%zu", n); 270 1.2 riastrad ATF_CHECK_EQ_MSG((n = c16rtomb(buf, L'\0', &s)), 1, 271 1.2 riastrad "n=%zu", n); 272 1.2 riastrad ATF_CHECK_MSG(((unsigned char)buf[0] == '\0' && 273 1.2 riastrad (unsigned char)buf[1] == 0xcc), 274 1.2 riastrad "buf=[%02x %02x]", buf[0], buf[1]); 275 1.1 riastrad } 276 1.1 riastrad 277 1.1 riastrad ATF_TP_ADD_TCS(tp) 278 1.1 riastrad { 279 1.1 riastrad 280 1.1 riastrad ATF_TP_ADD_TC(tp, c16rtomb_c_locale_test); 281 1.4 riastrad ATF_TP_ADD_TC(tp, c16rtomb_iso2022jp_locale_test); 282 1.1 riastrad ATF_TP_ADD_TC(tp, c16rtomb_iso_8859_1_test); 283 1.1 riastrad ATF_TP_ADD_TC(tp, c16rtomb_iso_8859_15_test); 284 1.1 riastrad ATF_TP_ADD_TC(tp, c16rtomb_utf_8_test); 285 1.1 riastrad 286 1.1 riastrad return (atf_no_error()); 287 1.1 riastrad } 288