1 1.13 rillig /* $NetBSD: citrus_utf1632.c,v 1.13 2022/04/19 20:32:14 rillig Exp $ */ 2 1.1 tshiozak 3 1.1 tshiozak /*- 4 1.1 tshiozak * Copyright (c)2003 Citrus Project, 5 1.1 tshiozak * All rights reserved. 6 1.1 tshiozak * 7 1.1 tshiozak * Redistribution and use in source and binary forms, with or without 8 1.1 tshiozak * modification, are permitted provided that the following conditions 9 1.1 tshiozak * are met: 10 1.1 tshiozak * 1. Redistributions of source code must retain the above copyright 11 1.1 tshiozak * notice, this list of conditions and the following disclaimer. 12 1.1 tshiozak * 2. Redistributions in binary form must reproduce the above copyright 13 1.1 tshiozak * notice, this list of conditions and the following disclaimer in the 14 1.1 tshiozak * documentation and/or other materials provided with the distribution. 15 1.1 tshiozak * 16 1.1 tshiozak * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 17 1.1 tshiozak * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 18 1.1 tshiozak * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 19 1.1 tshiozak * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 20 1.1 tshiozak * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 21 1.1 tshiozak * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 22 1.1 tshiozak * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 23 1.1 tshiozak * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 24 1.1 tshiozak * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 25 1.1 tshiozak * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 26 1.1 tshiozak * SUCH DAMAGE. 27 1.1 tshiozak */ 28 1.1 tshiozak 29 1.1 tshiozak #include <sys/cdefs.h> 30 1.1 tshiozak #if defined(LIBC_SCCS) && !defined(lint) 31 1.13 rillig __RCSID("$NetBSD: citrus_utf1632.c,v 1.13 2022/04/19 20:32:14 rillig Exp $"); 32 1.1 tshiozak #endif /* LIBC_SCCS and not lint */ 33 1.1 tshiozak 34 1.1 tshiozak #include <assert.h> 35 1.1 tshiozak #include <errno.h> 36 1.1 tshiozak #include <string.h> 37 1.1 tshiozak #include <stdio.h> 38 1.1 tshiozak #include <stdlib.h> 39 1.1 tshiozak #include <stddef.h> 40 1.1 tshiozak #include <limits.h> 41 1.1 tshiozak #include <wchar.h> 42 1.1 tshiozak #include <sys/types.h> 43 1.5 dogcow #include <machine/endian.h> 44 1.1 tshiozak 45 1.1 tshiozak #include "citrus_namespace.h" 46 1.1 tshiozak #include "citrus_types.h" 47 1.1 tshiozak #include "citrus_module.h" 48 1.1 tshiozak #include "citrus_stdenc.h" 49 1.1 tshiozak #include "citrus_bcs.h" 50 1.1 tshiozak 51 1.1 tshiozak #include "citrus_utf1632.h" 52 1.1 tshiozak 53 1.1 tshiozak 54 1.1 tshiozak /* ---------------------------------------------------------------------- 55 1.1 tshiozak * private stuffs used by templates 56 1.1 tshiozak */ 57 1.1 tshiozak 58 1.1 tshiozak typedef struct { 59 1.1 tshiozak u_int8_t ch[4]; 60 1.1 tshiozak int chlen; 61 1.1 tshiozak int current_endian; 62 1.1 tshiozak } _UTF1632State; 63 1.1 tshiozak 64 1.1 tshiozak typedef struct { 65 1.1 tshiozak int preffered_endian; 66 1.1 tshiozak unsigned int cur_max; 67 1.1 tshiozak #define _ENDIAN_UNKNOWN 0 68 1.1 tshiozak #define _ENDIAN_BIG 1 69 1.1 tshiozak #define _ENDIAN_LITTLE 2 70 1.1 tshiozak u_int32_t mode; 71 1.1 tshiozak #define _MODE_UTF32 0x00000001U 72 1.1 tshiozak #define _MODE_FORCE_ENDIAN 0x00000002U 73 1.1 tshiozak } _UTF1632EncodingInfo; 74 1.1 tshiozak 75 1.1 tshiozak #define _FUNCNAME(m) _citrus_UTF1632_##m 76 1.1 tshiozak #define _ENCODING_INFO _UTF1632EncodingInfo 77 1.1 tshiozak #define _ENCODING_STATE _UTF1632State 78 1.1 tshiozak #define _ENCODING_MB_CUR_MAX(_ei_) ((_ei_)->cur_max) 79 1.1 tshiozak #define _ENCODING_IS_STATE_DEPENDENT 0 80 1.1 tshiozak #define _STATE_NEEDS_EXPLICIT_INIT(_ps_) 0 81 1.1 tshiozak 82 1.1 tshiozak 83 1.1 tshiozak static __inline void 84 1.1 tshiozak /*ARGSUSED*/ 85 1.1 tshiozak _citrus_UTF1632_init_state(_UTF1632EncodingInfo *ei, _UTF1632State *s) 86 1.1 tshiozak { 87 1.1 tshiozak memset(s, 0, sizeof(*s)); 88 1.1 tshiozak } 89 1.1 tshiozak 90 1.1 tshiozak static int 91 1.1 tshiozak _citrus_UTF1632_mbrtowc_priv(_UTF1632EncodingInfo *ei, wchar_t *pwc, 92 1.1 tshiozak const char **s, size_t n, _UTF1632State *psenc, 93 1.1 tshiozak size_t *nresult) 94 1.1 tshiozak { 95 1.1 tshiozak int chlenbak, endian, needlen; 96 1.1 tshiozak wchar_t wc; 97 1.1 tshiozak size_t result; 98 1.1 tshiozak const char *s0; 99 1.1 tshiozak 100 1.1 tshiozak _DIAGASSERT(nresult != 0); 101 1.1 tshiozak _DIAGASSERT(ei != NULL); 102 1.1 tshiozak _DIAGASSERT(s != NULL); 103 1.1 tshiozak _DIAGASSERT(psenc != NULL); 104 1.1 tshiozak 105 1.1 tshiozak s0 = *s; 106 1.1 tshiozak 107 1.1 tshiozak if (s0 == NULL) { 108 1.1 tshiozak _citrus_UTF1632_init_state(ei, psenc); 109 1.1 tshiozak *nresult = 0; /* state independent */ 110 1.1 tshiozak return (0); 111 1.1 tshiozak } 112 1.1 tshiozak 113 1.1 tshiozak result = 0; 114 1.1 tshiozak chlenbak = psenc->chlen; 115 1.1 tshiozak 116 1.1 tshiozak refetch: 117 1.1 tshiozak if ((ei->mode & _MODE_UTF32) != 0 || chlenbak>=2) 118 1.1 tshiozak needlen = 4; 119 1.1 tshiozak else 120 1.1 tshiozak needlen = 2; 121 1.1 tshiozak 122 1.1 tshiozak while (chlenbak < needlen) { 123 1.1 tshiozak if (n==0) 124 1.1 tshiozak goto restart; 125 1.1 tshiozak psenc->ch[chlenbak++] = *s0++; 126 1.1 tshiozak n--; 127 1.1 tshiozak result++; 128 1.1 tshiozak } 129 1.1 tshiozak 130 1.10 tnozaki if (psenc->current_endian == _ENDIAN_UNKNOWN) { 131 1.10 tnozaki if ((ei->mode & _MODE_FORCE_ENDIAN) == 0) { 132 1.10 tnozaki /* judge endian marker */ 133 1.10 tnozaki if ((ei->mode & _MODE_UTF32) == 0) { 134 1.10 tnozaki /* UTF16 */ 135 1.10 tnozaki if (psenc->ch[0]==0xFE && psenc->ch[1]==0xFF) { 136 1.10 tnozaki psenc->current_endian = _ENDIAN_BIG; 137 1.10 tnozaki chlenbak = 0; 138 1.10 tnozaki goto refetch; 139 1.10 tnozaki } else if (psenc->ch[0]==0xFF && psenc->ch[1]==0xFE) { 140 1.10 tnozaki psenc->current_endian = _ENDIAN_LITTLE; 141 1.10 tnozaki chlenbak = 0; 142 1.10 tnozaki goto refetch; 143 1.10 tnozaki } 144 1.10 tnozaki } else { 145 1.10 tnozaki /* UTF32 */ 146 1.10 tnozaki if (psenc->ch[0]==0x00 && psenc->ch[1]==0x00 && 147 1.10 tnozaki psenc->ch[2]==0xFE && psenc->ch[3]==0xFF) { 148 1.10 tnozaki psenc->current_endian = _ENDIAN_BIG; 149 1.10 tnozaki chlenbak = 0; 150 1.10 tnozaki goto refetch; 151 1.10 tnozaki } else if (psenc->ch[0]==0xFF && psenc->ch[1]==0xFE && 152 1.10 tnozaki psenc->ch[2]==0x00 && psenc->ch[3]==0x00) { 153 1.10 tnozaki psenc->current_endian = _ENDIAN_LITTLE; 154 1.10 tnozaki chlenbak = 0; 155 1.10 tnozaki goto refetch; 156 1.10 tnozaki } 157 1.10 tnozaki } 158 1.1 tshiozak } 159 1.11 tnozaki psenc->current_endian = ei->preffered_endian; 160 1.1 tshiozak } 161 1.10 tnozaki endian = psenc->current_endian; 162 1.1 tshiozak 163 1.1 tshiozak /* get wc */ 164 1.1 tshiozak if ((ei->mode & _MODE_UTF32) == 0) { 165 1.1 tshiozak /* UTF16 */ 166 1.1 tshiozak if (needlen==2) { 167 1.1 tshiozak switch (endian) { 168 1.1 tshiozak case _ENDIAN_LITTLE: 169 1.1 tshiozak wc = (psenc->ch[0] | 170 1.1 tshiozak ((wchar_t)psenc->ch[1] << 8)); 171 1.1 tshiozak break; 172 1.1 tshiozak case _ENDIAN_BIG: 173 1.1 tshiozak wc = (psenc->ch[1] | 174 1.1 tshiozak ((wchar_t)psenc->ch[0] << 8)); 175 1.1 tshiozak break; 176 1.6 christos default: 177 1.6 christos goto ilseq; 178 1.1 tshiozak } 179 1.1 tshiozak if (wc >= 0xD800 && wc <= 0xDBFF) { 180 1.1 tshiozak /* surrogate high */ 181 1.1 tshiozak needlen=4; 182 1.1 tshiozak goto refetch; 183 1.1 tshiozak } 184 1.1 tshiozak } else { 185 1.1 tshiozak /* surrogate low */ 186 1.1 tshiozak wc -= 0xD800; /* wc : surrogate high (see above) */ 187 1.1 tshiozak wc <<= 10; 188 1.1 tshiozak switch (endian) { 189 1.1 tshiozak case _ENDIAN_LITTLE: 190 1.10 tnozaki if (psenc->ch[3]<0xDC || psenc->ch[3]>0xDF) 191 1.1 tshiozak goto ilseq; 192 1.1 tshiozak wc |= psenc->ch[2]; 193 1.1 tshiozak wc |= (wchar_t)(psenc->ch[3] & 3) << 8; 194 1.1 tshiozak break; 195 1.1 tshiozak case _ENDIAN_BIG: 196 1.10 tnozaki if (psenc->ch[2]<0xDC || psenc->ch[2]>0xDF) 197 1.1 tshiozak goto ilseq; 198 1.1 tshiozak wc |= psenc->ch[3]; 199 1.1 tshiozak wc |= (wchar_t)(psenc->ch[2] & 3) << 8; 200 1.1 tshiozak break; 201 1.6 christos default: 202 1.6 christos goto ilseq; 203 1.1 tshiozak } 204 1.1 tshiozak wc += 0x10000; 205 1.1 tshiozak } 206 1.1 tshiozak } else { 207 1.1 tshiozak /* UTF32 */ 208 1.1 tshiozak switch (endian) { 209 1.1 tshiozak case _ENDIAN_LITTLE: 210 1.1 tshiozak wc = (psenc->ch[0] | 211 1.1 tshiozak ((wchar_t)psenc->ch[1] << 8) | 212 1.1 tshiozak ((wchar_t)psenc->ch[2] << 16) | 213 1.1 tshiozak ((wchar_t)psenc->ch[3] << 24)); 214 1.1 tshiozak break; 215 1.1 tshiozak case _ENDIAN_BIG: 216 1.1 tshiozak wc = (psenc->ch[3] | 217 1.1 tshiozak ((wchar_t)psenc->ch[2] << 8) | 218 1.1 tshiozak ((wchar_t)psenc->ch[1] << 16) | 219 1.1 tshiozak ((wchar_t)psenc->ch[0] << 24)); 220 1.1 tshiozak break; 221 1.6 christos default: 222 1.6 christos goto ilseq; 223 1.1 tshiozak } 224 1.7 tnozaki if (wc >= 0xD800 && wc <= 0xDFFF) 225 1.7 tnozaki goto ilseq; 226 1.1 tshiozak } 227 1.1 tshiozak 228 1.1 tshiozak 229 1.1 tshiozak *pwc = wc; 230 1.1 tshiozak psenc->chlen = 0; 231 1.1 tshiozak *nresult = result; 232 1.1 tshiozak *s = s0; 233 1.1 tshiozak 234 1.1 tshiozak return (0); 235 1.1 tshiozak 236 1.1 tshiozak ilseq: 237 1.1 tshiozak *nresult = (size_t)-1; 238 1.1 tshiozak psenc->chlen = 0; 239 1.1 tshiozak return (EILSEQ); 240 1.1 tshiozak 241 1.1 tshiozak restart: 242 1.1 tshiozak *nresult = (size_t)-2; 243 1.1 tshiozak psenc->chlen = chlenbak; 244 1.1 tshiozak *s = s0; 245 1.1 tshiozak return (0); 246 1.1 tshiozak } 247 1.1 tshiozak 248 1.1 tshiozak static int 249 1.1 tshiozak _citrus_UTF1632_wcrtomb_priv(_UTF1632EncodingInfo *ei, char *s, size_t n, 250 1.1 tshiozak wchar_t wc, _UTF1632State *psenc, 251 1.1 tshiozak size_t *nresult) 252 1.1 tshiozak { 253 1.1 tshiozak wchar_t wc2; 254 1.8 tnozaki static const char _bom[4] = { 255 1.8 tnozaki #if BYTE_ORDER == BIG_ENDIAN 256 1.8 tnozaki 0x00, 0x00, 0xFE, 0xFF, 257 1.8 tnozaki #else 258 1.8 tnozaki 0xFF, 0xFE, 0x00, 0x00, 259 1.8 tnozaki #endif 260 1.8 tnozaki }; 261 1.8 tnozaki const char *bom = &_bom[0]; 262 1.8 tnozaki size_t cnt; 263 1.1 tshiozak 264 1.1 tshiozak _DIAGASSERT(ei != NULL); 265 1.1 tshiozak _DIAGASSERT(nresult != 0); 266 1.1 tshiozak _DIAGASSERT(s != NULL); 267 1.1 tshiozak 268 1.8 tnozaki cnt = (size_t)0; 269 1.8 tnozaki if (psenc->current_endian == _ENDIAN_UNKNOWN) { 270 1.8 tnozaki if ((ei->mode & _MODE_FORCE_ENDIAN) == 0) { 271 1.8 tnozaki if (ei->mode & _MODE_UTF32) { 272 1.8 tnozaki cnt = 4; 273 1.8 tnozaki } else { 274 1.8 tnozaki cnt = 2; 275 1.8 tnozaki #if BYTE_ORDER == BIG_ENDIAN 276 1.8 tnozaki bom += 2; 277 1.8 tnozaki #endif 278 1.8 tnozaki } 279 1.8 tnozaki if (n < cnt) 280 1.8 tnozaki goto e2big; 281 1.8 tnozaki memcpy(s, bom, cnt); 282 1.8 tnozaki s += cnt, n -= cnt; 283 1.8 tnozaki } 284 1.8 tnozaki psenc->current_endian = ei->preffered_endian; 285 1.8 tnozaki } 286 1.8 tnozaki 287 1.1 tshiozak wc2 = 0; 288 1.1 tshiozak if ((ei->mode & _MODE_UTF32)==0) { 289 1.1 tshiozak /* UTF16 */ 290 1.1 tshiozak if (wc>0xFFFF) { 291 1.1 tshiozak /* surrogate */ 292 1.8 tnozaki if (wc>0x10FFFF) 293 1.8 tnozaki goto ilseq; 294 1.8 tnozaki if (n < 4) 295 1.8 tnozaki goto e2big; 296 1.8 tnozaki cnt += 4; 297 1.1 tshiozak wc -= 0x10000; 298 1.1 tshiozak wc2 = (wc & 0x3FF) | 0xDC00; 299 1.1 tshiozak wc = (wc>>10) | 0xD800; 300 1.1 tshiozak } else { 301 1.8 tnozaki if (n < 2) 302 1.8 tnozaki goto e2big; 303 1.8 tnozaki cnt += 2; 304 1.1 tshiozak } 305 1.1 tshiozak 306 1.1 tshiozak surrogate: 307 1.8 tnozaki switch (psenc->current_endian) { 308 1.1 tshiozak case _ENDIAN_BIG: 309 1.1 tshiozak s[1] = wc; 310 1.1 tshiozak s[0] = (wc >>= 8); 311 1.1 tshiozak break; 312 1.1 tshiozak case _ENDIAN_LITTLE: 313 1.1 tshiozak s[0] = wc; 314 1.1 tshiozak s[1] = (wc >>= 8); 315 1.1 tshiozak break; 316 1.1 tshiozak } 317 1.1 tshiozak if (wc2!=0) { 318 1.1 tshiozak wc = wc2; 319 1.1 tshiozak wc2 = 0; 320 1.1 tshiozak s += 2; 321 1.1 tshiozak goto surrogate; 322 1.1 tshiozak } 323 1.1 tshiozak } else { 324 1.1 tshiozak /* UTF32 */ 325 1.7 tnozaki if (wc >= 0xD800 && wc <= 0xDFFF) 326 1.8 tnozaki goto ilseq; 327 1.8 tnozaki if (n < 4) 328 1.8 tnozaki goto e2big; 329 1.8 tnozaki cnt += 4; 330 1.8 tnozaki switch (psenc->current_endian) { 331 1.1 tshiozak case _ENDIAN_BIG: 332 1.1 tshiozak s[3] = wc; 333 1.1 tshiozak s[2] = (wc >>= 8); 334 1.1 tshiozak s[1] = (wc >>= 8); 335 1.1 tshiozak s[0] = (wc >>= 8); 336 1.1 tshiozak break; 337 1.1 tshiozak case _ENDIAN_LITTLE: 338 1.1 tshiozak s[0] = wc; 339 1.1 tshiozak s[1] = (wc >>= 8); 340 1.1 tshiozak s[2] = (wc >>= 8); 341 1.1 tshiozak s[3] = (wc >>= 8); 342 1.1 tshiozak break; 343 1.1 tshiozak } 344 1.1 tshiozak } 345 1.8 tnozaki *nresult = cnt; 346 1.1 tshiozak 347 1.1 tshiozak return 0; 348 1.1 tshiozak 349 1.8 tnozaki ilseq: 350 1.8 tnozaki *nresult = (size_t)-1; 351 1.8 tnozaki return EILSEQ; 352 1.8 tnozaki e2big: 353 1.1 tshiozak *nresult = (size_t)-1; 354 1.8 tnozaki return E2BIG; 355 1.1 tshiozak } 356 1.1 tshiozak 357 1.1 tshiozak static void 358 1.1 tshiozak parse_variable(_UTF1632EncodingInfo * __restrict ei, 359 1.1 tshiozak const void * __restrict var, size_t lenvar) 360 1.1 tshiozak { 361 1.1 tshiozak #define MATCH(x, act) \ 362 1.1 tshiozak do { \ 363 1.1 tshiozak if (lenvar >= (sizeof(#x)-1) && \ 364 1.1 tshiozak _bcs_strncasecmp(p, #x, sizeof(#x)-1) == 0) { \ 365 1.1 tshiozak act; \ 366 1.1 tshiozak lenvar -= sizeof(#x)-1; \ 367 1.1 tshiozak p += sizeof(#x)-1; \ 368 1.1 tshiozak } \ 369 1.13 rillig } while (0) 370 1.1 tshiozak const char *p; 371 1.1 tshiozak p = var; 372 1.1 tshiozak while (lenvar>0) { 373 1.1 tshiozak switch (*p) { 374 1.1 tshiozak case 'B': 375 1.1 tshiozak case 'b': 376 1.1 tshiozak MATCH(big, ei->preffered_endian = _ENDIAN_BIG); 377 1.1 tshiozak break; 378 1.1 tshiozak case 'L': 379 1.1 tshiozak case 'l': 380 1.1 tshiozak MATCH(little, ei->preffered_endian = _ENDIAN_LITTLE); 381 1.1 tshiozak break; 382 1.1 tshiozak case 'F': 383 1.1 tshiozak case 'f': 384 1.1 tshiozak MATCH(force, ei->mode |= _MODE_FORCE_ENDIAN); 385 1.1 tshiozak break; 386 1.1 tshiozak case 'U': 387 1.1 tshiozak case 'u': 388 1.1 tshiozak MATCH(utf32, ei->mode |= _MODE_UTF32); 389 1.1 tshiozak break; 390 1.1 tshiozak } 391 1.1 tshiozak p++; 392 1.1 tshiozak lenvar--; 393 1.1 tshiozak } 394 1.1 tshiozak } 395 1.1 tshiozak 396 1.1 tshiozak static int 397 1.1 tshiozak /*ARGSUSED*/ 398 1.1 tshiozak _citrus_UTF1632_encoding_module_init(_UTF1632EncodingInfo * __restrict ei, 399 1.1 tshiozak const void * __restrict var, 400 1.1 tshiozak size_t lenvar) 401 1.1 tshiozak { 402 1.1 tshiozak _DIAGASSERT(ei != NULL); 403 1.1 tshiozak 404 1.1 tshiozak memset((void *)ei, 0, sizeof(*ei)); 405 1.1 tshiozak 406 1.1 tshiozak parse_variable(ei, var, lenvar); 407 1.1 tshiozak 408 1.1 tshiozak if ((ei->mode&_MODE_UTF32)==0) 409 1.1 tshiozak ei->cur_max = 6; /* endian + surrogate */ 410 1.1 tshiozak else 411 1.1 tshiozak ei->cur_max = 8; /* endian + normal */ 412 1.1 tshiozak 413 1.1 tshiozak if (ei->preffered_endian == _ENDIAN_UNKNOWN) { 414 1.1 tshiozak #if BYTE_ORDER == BIG_ENDIAN 415 1.1 tshiozak ei->preffered_endian = _ENDIAN_BIG; 416 1.1 tshiozak #else 417 1.1 tshiozak ei->preffered_endian = _ENDIAN_LITTLE; 418 1.1 tshiozak #endif 419 1.1 tshiozak } 420 1.1 tshiozak 421 1.1 tshiozak return (0); 422 1.1 tshiozak } 423 1.1 tshiozak 424 1.1 tshiozak static void 425 1.1 tshiozak /*ARGSUSED*/ 426 1.1 tshiozak _citrus_UTF1632_encoding_module_uninit(_UTF1632EncodingInfo *ei) 427 1.1 tshiozak { 428 1.1 tshiozak } 429 1.1 tshiozak 430 1.1 tshiozak static __inline int 431 1.1 tshiozak /*ARGSUSED*/ 432 1.1 tshiozak _citrus_UTF1632_stdenc_wctocs(_UTF1632EncodingInfo * __restrict ei, 433 1.1 tshiozak _csid_t * __restrict csid, 434 1.1 tshiozak _index_t * __restrict idx, 435 1.1 tshiozak _wc_t wc) 436 1.1 tshiozak { 437 1.1 tshiozak 438 1.1 tshiozak _DIAGASSERT(csid != NULL && idx != NULL); 439 1.1 tshiozak 440 1.1 tshiozak *csid = 0; 441 1.1 tshiozak *idx = (_index_t)wc; 442 1.1 tshiozak 443 1.1 tshiozak return (0); 444 1.1 tshiozak } 445 1.1 tshiozak 446 1.1 tshiozak static __inline int 447 1.1 tshiozak /*ARGSUSED*/ 448 1.1 tshiozak _citrus_UTF1632_stdenc_cstowc(_UTF1632EncodingInfo * __restrict ei, 449 1.1 tshiozak _wc_t * __restrict wc, 450 1.1 tshiozak _csid_t csid, _index_t idx) 451 1.1 tshiozak { 452 1.1 tshiozak 453 1.1 tshiozak _DIAGASSERT(wc != NULL); 454 1.1 tshiozak 455 1.1 tshiozak if (csid != 0) 456 1.1 tshiozak return (EILSEQ); 457 1.1 tshiozak 458 1.1 tshiozak *wc = (_wc_t)idx; 459 1.1 tshiozak 460 1.1 tshiozak return (0); 461 1.1 tshiozak } 462 1.1 tshiozak 463 1.4 tshiozak static __inline int 464 1.4 tshiozak /*ARGSUSED*/ 465 1.4 tshiozak _citrus_UTF1632_stdenc_get_state_desc_generic(_UTF1632EncodingInfo * __restrict ei, 466 1.4 tshiozak _UTF1632State * __restrict psenc, 467 1.4 tshiozak int * __restrict rstate) 468 1.4 tshiozak { 469 1.4 tshiozak 470 1.4 tshiozak if (psenc->chlen == 0) 471 1.4 tshiozak *rstate = _STDENC_SDGEN_INITIAL; 472 1.4 tshiozak else 473 1.4 tshiozak *rstate = _STDENC_SDGEN_INCOMPLETE_CHAR; 474 1.4 tshiozak 475 1.4 tshiozak return 0; 476 1.4 tshiozak } 477 1.1 tshiozak 478 1.1 tshiozak /* ---------------------------------------------------------------------- 479 1.1 tshiozak * public interface for stdenc 480 1.1 tshiozak */ 481 1.1 tshiozak 482 1.1 tshiozak _CITRUS_STDENC_DECLS(UTF1632); 483 1.1 tshiozak _CITRUS_STDENC_DEF_OPS(UTF1632); 484 1.1 tshiozak 485 1.1 tshiozak #include "citrus_stdenc_template.h" 486