Home | History | Annotate | Line # | Download | only in locale
      1  1.6  riastrad /*	$NetBSD: t_c16rtomb.c,v 1.6 2024/08/19 16:22:10 riastradh Exp $	*/
      2  1.1  riastrad 
      3  1.1  riastrad /*-
      4  1.1  riastrad  * Copyright (c) 2002 Tim J. Robbins
      5  1.1  riastrad  * All rights reserved.
      6  1.1  riastrad  *
      7  1.1  riastrad  * Copyright (c) 2013 Ed Schouten <ed (at) FreeBSD.org>
      8  1.1  riastrad  * All rights reserved.
      9  1.1  riastrad  *
     10  1.1  riastrad  * Redistribution and use in source and binary forms, with or without
     11  1.1  riastrad  * modification, are permitted provided that the following conditions
     12  1.1  riastrad  * are met:
     13  1.1  riastrad  * 1. Redistributions of source code must retain the above copyright
     14  1.1  riastrad  *    notice, this list of conditions and the following disclaimer.
     15  1.1  riastrad  * 2. Redistributions in binary form must reproduce the above copyright
     16  1.1  riastrad  *    notice, this list of conditions and the following disclaimer in the
     17  1.1  riastrad  *    documentation and/or other materials provided with the distribution.
     18  1.1  riastrad  *
     19  1.1  riastrad  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
     20  1.1  riastrad  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     21  1.1  riastrad  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     22  1.1  riastrad  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
     23  1.1  riastrad  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     24  1.1  riastrad  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     25  1.1  riastrad  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     26  1.1  riastrad  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     27  1.1  riastrad  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     28  1.1  riastrad  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     29  1.1  riastrad  * SUCH DAMAGE.
     30  1.1  riastrad  */
     31  1.1  riastrad /*
     32  1.1  riastrad  * Test program for c16rtomb() as specified by ISO/IEC 9899:2011.
     33  1.1  riastrad  */
     34  1.1  riastrad 
     35  1.1  riastrad #include <sys/cdefs.h>
     36  1.6  riastrad __RCSID("$NetBSD: t_c16rtomb.c,v 1.6 2024/08/19 16:22:10 riastradh Exp $");
     37  1.1  riastrad 
     38  1.1  riastrad #include <errno.h>
     39  1.1  riastrad #include <limits.h>
     40  1.1  riastrad #include <locale.h>
     41  1.1  riastrad #include <stdio.h>
     42  1.1  riastrad #include <string.h>
     43  1.1  riastrad #include <uchar.h>
     44  1.1  riastrad 
     45  1.1  riastrad #include <atf-c.h>
     46  1.1  riastrad 
/*
 * require_lc_ctype(locale_name)
 *
 *	Select locale_name for the LC_CTYPE category.  The test case is
 *	failed if setlocale() returns NULL, or if the name it returns is
 *	not exactly the name that was requested.
 */
static void
require_lc_ctype(const char *locale_name)
{
	char *const lc_ctype_set = setlocale(LC_CTYPE, locale_name);

	if (lc_ctype_set == NULL) {
		atf_tc_fail("setlocale(LC_CTYPE, \"%s\") failed; errno=%d",
		    locale_name, errno);
	}

	/* The locale was accepted; insist that it is the one we asked for. */
	ATF_REQUIRE_EQ_MSG(strcmp(lc_ctype_set, locale_name), 0,
	    "lc_ctype_set=%s locale_name=%s", lc_ctype_set, locale_name);
}
     60  1.1  riastrad 
/* Conversion state shared by the test cases; each zeroes it before use. */
static mbstate_t s;

/*
 * Output buffer shared by the test cases.  Sized for seven conversions
 * of at most MB_LEN_MAX bytes each (the ISO-2022-JP test performs seven
 * steps), plus one extra byte -- presumably room for the 0xcc sentinel
 * the tests look for just past the converted output.
 */
static char buf[(7 * MB_LEN_MAX) + 1];
     63  1.1  riastrad 
     64  1.1  riastrad ATF_TC_WITHOUT_HEAD(c16rtomb_c_locale_test);
     65  1.1  riastrad ATF_TC_BODY(c16rtomb_c_locale_test, tc)
     66  1.1  riastrad {
     67  1.1  riastrad 	size_t n;
     68  1.1  riastrad 
     69  1.1  riastrad 	require_lc_ctype("C");
     70  1.1  riastrad 
     71  1.1  riastrad 	/*
     72  1.1  riastrad 	 * If the buffer argument is NULL, c16 is implicitly 0,
     73  1.1  riastrad 	 * c16rtomb() resets its internal state.
     74  1.1  riastrad 	 */
     75  1.1  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(NULL, L'\0', NULL)), 1, "n=%zu", n);
     76  1.1  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(NULL, 0xdc00, NULL)), 1, "n=%zu", n);
     77  1.1  riastrad 
     78  1.1  riastrad 	/* Null wide character. */
     79  1.1  riastrad 	memset(&s, 0, sizeof(s));
     80  1.1  riastrad 	memset(buf, 0xcc, sizeof(buf));
     81  1.1  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0, &s)), 1, "n=%zu", n);
     82  1.1  riastrad 	ATF_CHECK_MSG(((unsigned char)buf[0] == 0 &&
     83  1.1  riastrad 		(unsigned char)buf[1] == 0xcc),
     84  1.1  riastrad 	    "buf=[%02x %02x]", buf[0], buf[1]);
     85  1.1  riastrad 
     86  1.1  riastrad 	/* Latin letter A, internal state. */
     87  1.1  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(NULL, L'\0', NULL)), 1, "n=%zu", n);
     88  1.1  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(NULL, L'A', NULL)), 1, "n=%zu", n);
     89  1.1  riastrad 
     90  1.1  riastrad 	/* Latin letter A. */
     91  1.1  riastrad 	memset(&s, 0, sizeof(s));
     92  1.1  riastrad 	memset(buf, 0xcc, sizeof(buf));
     93  1.1  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(buf, L'A', &s)), 1, "n=%zu", n);
     94  1.1  riastrad 	ATF_CHECK_MSG(((unsigned char)buf[0] == 'A' &&
     95  1.1  riastrad 		(unsigned char)buf[1] == 0xcc),
     96  1.1  riastrad 	    "buf=[%02x %02x]", buf[0], buf[1]);
     97  1.1  riastrad 
     98  1.1  riastrad 	/* Unicode character 'Pile of poo'. */
     99  1.1  riastrad 	memset(&s, 0, sizeof(s));
    100  1.1  riastrad 	memset(buf, 0xcc, sizeof(buf));
    101  1.1  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0xd83d, &s)), 0, "n=%zu", n);
    102  1.1  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0xdca9, &s)), (size_t)-1,
    103  1.1  riastrad 	    "n=%zu", n);
    104  1.1  riastrad 	ATF_CHECK_EQ_MSG(errno, EILSEQ, "errno=%d", errno);
    105  1.1  riastrad 	ATF_CHECK_EQ_MSG((unsigned char)buf[0], 0xcc, "buf=[%02x]", buf[0]);
    106  1.2  riastrad 
    107  1.2  riastrad 	/* Incomplete Unicode character 'Pile of poo', interrupted by NUL. */
    108  1.2  riastrad 	memset(&s, 0, sizeof(s));
    109  1.2  riastrad 	memset(buf, 0xcc, sizeof(buf));
    110  1.2  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0xd83d, &s)), 0, "n=%zu", n);
    111  1.2  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(buf, L'\0', &s)), 1, "n=%zu", n);
    112  1.2  riastrad 	ATF_CHECK_MSG(((unsigned char)buf[0] == '\0' &&
    113  1.2  riastrad 		(unsigned char)buf[1] == 0xcc),
    114  1.2  riastrad 	    "buf=[%02x %02x]", buf[0], buf[1]);
    115  1.1  riastrad }
    116  1.1  riastrad 
    117  1.4  riastrad ATF_TC_WITHOUT_HEAD(c16rtomb_iso2022jp_locale_test);
    118  1.4  riastrad ATF_TC_BODY(c16rtomb_iso2022jp_locale_test, tc)
    119  1.4  riastrad {
    120  1.4  riastrad 	char *p;
    121  1.4  riastrad 	size_t n;
    122  1.4  riastrad 
    123  1.4  riastrad 	require_lc_ctype("ja_JP.ISO-2022-JP");
    124  1.4  riastrad 
    125  1.4  riastrad 	/*
    126  1.4  riastrad 	 * If the buffer argument is NULL, c16 is implicitly 0,
    127  1.4  riastrad 	 * c16rtomb() resets its internal state.
    128  1.4  riastrad 	 */
    129  1.4  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(NULL, L'\0', NULL)), 1, "n=%zu", n);
    130  1.4  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(NULL, 0xdc00, NULL)), 1, "n=%zu", n);
    131  1.4  riastrad 
    132  1.4  riastrad 	/* Null wide character. */
    133  1.4  riastrad 	memset(&s, 0, sizeof(s));
    134  1.4  riastrad 	memset(buf, 0xcc, sizeof(buf));
    135  1.4  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0, &s)), 1, "n=%zu", n);
    136  1.4  riastrad 	ATF_CHECK_MSG(((unsigned char)buf[0] == 0 &&
    137  1.4  riastrad 		(unsigned char)buf[1] == 0xcc),
    138  1.4  riastrad 	    "buf=[%02x %02x]", buf[0], buf[1]);
    139  1.4  riastrad 
    140  1.4  riastrad 	/* Latin letter A, internal state. */
    141  1.4  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(NULL, L'\0', NULL)), 1, "n=%zu", n);
    142  1.4  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(NULL, L'A', NULL)), 1, "n=%zu", n);
    143  1.4  riastrad 
    144  1.4  riastrad 	/*
    145  1.4  riastrad 	 * 1. U+0042 LATIN CAPITAL LETTER A
    146  1.4  riastrad 	 * 2. U+00A5 YEN SIGN
    147  1.4  riastrad 	 * 3. U+00A5 YEN SIGN (again, no shift needed)
    148  1.4  riastrad 	 * 4. U+30A2 KATAKANA LETTER A
    149  1.4  riastrad 	 * 5. U+30A2 KATAKANA LETTER A (again, no shift needed)
    150  1.4  riastrad 	 * 6. incomplete UTF-16 surrogate pair -- no output
    151  1.4  riastrad 	 * 7. U+0000 NUL (plus shift sequence to initial state)
    152  1.4  riastrad 	 */
    153  1.4  riastrad 	memset(&s, 0, sizeof(s));
    154  1.4  riastrad 	memset(buf, 0xcc, sizeof(buf));
    155  1.4  riastrad 	p = buf;
    156  1.4  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(p, L'A', &s)), 1, "n=%zu", n); /* 1 */
    157  1.4  riastrad 	p += 1;
    158  1.4  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(p, 0xa5, &s)), 4, "n=%zu", n); /* 2 */
    159  1.4  riastrad 	p += 4;
    160  1.4  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(p, 0xa5, &s)), 1, "n=%zu", n); /* 3 */
    161  1.4  riastrad 	p += 1;
    162  1.4  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(p, 0x30a2, &s)), 5, "n=%zu", n); /* 4 */
    163  1.4  riastrad 	p += 5;
    164  1.4  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(p, 0x30a2, &s)), 2, "n=%zu", n); /* 5 */
    165  1.4  riastrad 	p += 2;
    166  1.4  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(p, 0xd800, &s)), 0, "n=%zu", n); /* 6 */
    167  1.4  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(p, L'\0', &s)), 4, "n=%zu", n); /* 7 */
    168  1.4  riastrad 	p += 4;
    169  1.4  riastrad 	ATF_CHECK_MSG(((unsigned char)buf[0] == 'A' &&
    170  1.4  riastrad 		(unsigned char)buf[1] == 0x1b && /* shift ISO/IEC 646:JP */
    171  1.4  riastrad 		(unsigned char)buf[2] == '(' &&
    172  1.4  riastrad 		(unsigned char)buf[3] == 'J' &&
    173  1.4  riastrad 		(unsigned char)buf[4] == 0x5c && /* YEN SIGN */
    174  1.4  riastrad 		(unsigned char)buf[5] == 0x5c && /* YEN SIGN */
    175  1.5  riastrad 		(unsigned char)buf[6] == 0x1b && /* shift JIS X 0208 */
    176  1.4  riastrad 		(unsigned char)buf[7] == '$' &&
    177  1.4  riastrad 		(unsigned char)buf[8] == 'B' &&
    178  1.4  riastrad 		(unsigned char)buf[9] == 0x25 && /* KATAKANA LETTER A */
    179  1.4  riastrad 		(unsigned char)buf[10] == 0x22 &&
    180  1.4  riastrad 		(unsigned char)buf[11] == 0x25 && /* KATAKANA LETTER A */
    181  1.4  riastrad 		(unsigned char)buf[12] == 0x22 &&
    182  1.4  riastrad 		(unsigned char)buf[13] == 0x1b && /* shift US-ASCII */
    183  1.4  riastrad 		(unsigned char)buf[14] == '(' &&
    184  1.4  riastrad 		(unsigned char)buf[15] == 'B' &&
    185  1.4  riastrad 		(unsigned char)buf[16] == '\0' &&
    186  1.4  riastrad 		(unsigned char)buf[17] == 0xcc),
    187  1.4  riastrad 	    "buf=[%02x %02x %02x %02x  %02x %02x %02x %02x "
    188  1.4  riastrad 	    " %02x %02x %02x %02x  %02x %02x %02x %02x "
    189  1.4  riastrad 	    " %02x %02x]",
    190  1.4  riastrad 	    buf[0], buf[1], buf[2], buf[3],
    191  1.4  riastrad 	    buf[4], buf[5], buf[6], buf[7],
    192  1.4  riastrad 	    buf[8], buf[9], buf[10], buf[11],
    193  1.4  riastrad 	    buf[12], buf[13], buf[14], buf[15],
    194  1.4  riastrad 	    buf[16], buf[17]);
    195  1.4  riastrad }
    196  1.4  riastrad 
    197  1.1  riastrad ATF_TC_WITHOUT_HEAD(c16rtomb_iso_8859_1_test);
    198  1.1  riastrad ATF_TC_BODY(c16rtomb_iso_8859_1_test, tc)
    199  1.1  riastrad {
    200  1.1  riastrad 	size_t n;
    201  1.1  riastrad 
    202  1.1  riastrad 	require_lc_ctype("en_US.ISO8859-1");
    203  1.1  riastrad 
    204  1.1  riastrad 	/* Unicode character 'Euro sign'. */
    205  1.1  riastrad 	memset(&s, 0, sizeof(s));
    206  1.1  riastrad 	memset(buf, 0xcc, sizeof(buf));
    207  1.1  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0x20ac, &s)), (size_t)-1,
    208  1.1  riastrad 	    "n=%zu", n);
    209  1.1  riastrad 	ATF_CHECK_EQ_MSG(errno, EILSEQ, "errno=%d", errno);
    210  1.1  riastrad 	ATF_CHECK_EQ_MSG((unsigned char)buf[0], 0xcc, "buf=[%02x]", buf[0]);
    211  1.1  riastrad }
    212  1.1  riastrad 
    213  1.1  riastrad ATF_TC_WITHOUT_HEAD(c16rtomb_iso_8859_15_test);
    214  1.1  riastrad ATF_TC_BODY(c16rtomb_iso_8859_15_test, tc)
    215  1.1  riastrad {
    216  1.1  riastrad 	size_t n;
    217  1.1  riastrad 
    218  1.1  riastrad 	require_lc_ctype("en_US.ISO8859-15");
    219  1.1  riastrad 
    220  1.1  riastrad 	/* Unicode character 'Euro sign'. */
    221  1.1  riastrad 	memset(&s, 0, sizeof(s));
    222  1.1  riastrad 	memset(buf, 0xcc, sizeof(buf));
    223  1.1  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0x20ac, &s)), 1, "n=%zu", n);
    224  1.1  riastrad 	ATF_CHECK_MSG(((unsigned char)buf[0] == 0xa4 &&
    225  1.1  riastrad 		(unsigned char)buf[1] == 0xcc),
    226  1.1  riastrad 	    "buf=[%02x %02x]", buf[0], buf[1]);
    227  1.1  riastrad }
    228  1.1  riastrad 
    229  1.1  riastrad ATF_TC_WITHOUT_HEAD(c16rtomb_utf_8_test);
    230  1.1  riastrad ATF_TC_BODY(c16rtomb_utf_8_test, tc)
    231  1.1  riastrad {
    232  1.1  riastrad 	size_t n;
    233  1.1  riastrad 
    234  1.1  riastrad 	require_lc_ctype("en_US.UTF-8");
    235  1.1  riastrad 
    236  1.1  riastrad 	/* Unicode character 'Pile of poo'. */
    237  1.1  riastrad 	memset(&s, 0, sizeof(s));
    238  1.1  riastrad 	memset(buf, 0xcc, sizeof(buf));
    239  1.1  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0xd83d, &s)), 0, "n=%zu", n);
    240  1.1  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0xdca9, &s)), 4, "n=%zu", n);
    241  1.1  riastrad 	ATF_CHECK_MSG(((unsigned char)buf[0] == 0xf0 &&
    242  1.1  riastrad 		(unsigned char)buf[1] == 0x9f &&
    243  1.1  riastrad 		(unsigned char)buf[2] == 0x92 &&
    244  1.1  riastrad 		(unsigned char)buf[3] == 0xa9 &&
    245  1.1  riastrad 		(unsigned char)buf[4] == 0xcc),
    246  1.1  riastrad 	    "buf=[%02x %02x %02x %02x %02x]",
    247  1.1  riastrad 	    buf[0], buf[1], buf[2], buf[3], buf[4]);
    248  1.1  riastrad 
    249  1.1  riastrad 	/* Invalid code; 'Pile of poo' without the trail surrogate. */
    250  1.1  riastrad 	memset(&s, 0, sizeof(s));
    251  1.1  riastrad 	memset(buf, 0xcc, sizeof(buf));
    252  1.1  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0xd83d, &s)), 0, "n=%zu", n);
    253  1.1  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(buf, L'A', &s)), (size_t)-1,
    254  1.1  riastrad 	    "n=%zu", n);
    255  1.1  riastrad 	ATF_CHECK_EQ_MSG(errno, EILSEQ, "errno=%d", errno);
    256  1.1  riastrad 	ATF_CHECK_EQ_MSG((unsigned char)buf[0], 0xcc, "buf=[%02x]", buf[0]);
    257  1.1  riastrad 
    258  1.1  riastrad 	/* Invalid code; 'Pile of poo' without the lead surrogate. */
    259  1.1  riastrad 	memset(&s, 0, sizeof(s));
    260  1.1  riastrad 	memset(buf, 0xcc, sizeof(buf));
    261  1.1  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0xdca9, &s)), (size_t)-1,
    262  1.1  riastrad 	    "n=%zu", n);
    263  1.1  riastrad 	ATF_CHECK_EQ_MSG(errno, EILSEQ, "errno=%d", errno);
    264  1.1  riastrad 	ATF_CHECK_EQ_MSG((unsigned char)buf[0], 0xcc, "buf=[%02x]", buf[0]);
    265  1.2  riastrad 
    266  1.2  riastrad 	/* Incomplete Unicode character 'Pile of poo', interrupted by NUL. */
    267  1.2  riastrad 	memset(&s, 0, sizeof(s));
    268  1.2  riastrad 	memset(buf, 0xcc, sizeof(buf));
    269  1.2  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(buf, 0xd83d, &s)), 0, "n=%zu", n);
    270  1.2  riastrad 	ATF_CHECK_EQ_MSG((n = c16rtomb(buf, L'\0', &s)), 1,
    271  1.2  riastrad 	    "n=%zu", n);
    272  1.2  riastrad 	ATF_CHECK_MSG(((unsigned char)buf[0] == '\0' &&
    273  1.2  riastrad 		(unsigned char)buf[1] == 0xcc),
    274  1.2  riastrad 	    "buf=[%02x %02x]", buf[0], buf[1]);
    275  1.1  riastrad }
    276  1.1  riastrad 
    277  1.1  riastrad ATF_TP_ADD_TCS(tp)
    278  1.1  riastrad {
    279  1.1  riastrad 
    280  1.1  riastrad 	ATF_TP_ADD_TC(tp, c16rtomb_c_locale_test);
    281  1.4  riastrad 	ATF_TP_ADD_TC(tp, c16rtomb_iso2022jp_locale_test);
    282  1.1  riastrad 	ATF_TP_ADD_TC(tp, c16rtomb_iso_8859_1_test);
    283  1.1  riastrad 	ATF_TP_ADD_TC(tp, c16rtomb_iso_8859_15_test);
    284  1.1  riastrad 	ATF_TP_ADD_TC(tp, c16rtomb_utf_8_test);
    285  1.1  riastrad 
    286  1.1  riastrad 	return (atf_no_error());
    287  1.1  riastrad }
    288