Home | History | Annotate | Line # | Download | only in modules
citrus_utf1632.c revision 1.9.4.1
      1  1.9.4.1       riz /*	$NetBSD: citrus_utf1632.c,v 1.9.4.1 2010/11/19 23:25:01 riz Exp $	*/
      2      1.1  tshiozak 
      3      1.1  tshiozak /*-
      4      1.1  tshiozak  * Copyright (c)2003 Citrus Project,
      5      1.1  tshiozak  * All rights reserved.
      6      1.1  tshiozak  *
      7      1.1  tshiozak  * Redistribution and use in source and binary forms, with or without
      8      1.1  tshiozak  * modification, are permitted provided that the following conditions
      9      1.1  tshiozak  * are met:
     10      1.1  tshiozak  * 1. Redistributions of source code must retain the above copyright
     11      1.1  tshiozak  *    notice, this list of conditions and the following disclaimer.
     12      1.1  tshiozak  * 2. Redistributions in binary form must reproduce the above copyright
     13      1.1  tshiozak  *    notice, this list of conditions and the following disclaimer in the
     14      1.1  tshiozak  *    documentation and/or other materials provided with the distribution.
     15      1.1  tshiozak  *
     16      1.1  tshiozak  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
     17      1.1  tshiozak  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     18      1.1  tshiozak  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     19      1.1  tshiozak  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
     20      1.1  tshiozak  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     21      1.1  tshiozak  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     22      1.1  tshiozak  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     23      1.1  tshiozak  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     24      1.1  tshiozak  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     25      1.1  tshiozak  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     26      1.1  tshiozak  * SUCH DAMAGE.
     27      1.1  tshiozak  */
     28      1.1  tshiozak 
     29      1.1  tshiozak #include <sys/cdefs.h>
     30      1.1  tshiozak #if defined(LIBC_SCCS) && !defined(lint)
     31  1.9.4.1       riz __RCSID("$NetBSD: citrus_utf1632.c,v 1.9.4.1 2010/11/19 23:25:01 riz Exp $");
     32      1.1  tshiozak #endif /* LIBC_SCCS and not lint */
     33      1.1  tshiozak 
     34      1.1  tshiozak #include <assert.h>
     35      1.1  tshiozak #include <errno.h>
     36      1.1  tshiozak #include <string.h>
     37      1.1  tshiozak #include <stdio.h>
     38      1.1  tshiozak #include <stdlib.h>
     39      1.1  tshiozak #include <stddef.h>
     40      1.1  tshiozak #include <limits.h>
     41      1.1  tshiozak #include <wchar.h>
     42      1.1  tshiozak #include <sys/types.h>
     43      1.5    dogcow #include <machine/endian.h>
     44      1.1  tshiozak 
     45      1.1  tshiozak #include "citrus_namespace.h"
     46      1.1  tshiozak #include "citrus_types.h"
     47      1.1  tshiozak #include "citrus_module.h"
     48      1.1  tshiozak #include "citrus_stdenc.h"
     49      1.1  tshiozak #include "citrus_bcs.h"
     50      1.1  tshiozak 
     51      1.1  tshiozak #include "citrus_utf1632.h"
     52      1.1  tshiozak 
     53      1.1  tshiozak 
     54      1.1  tshiozak /* ----------------------------------------------------------------------
     55      1.1  tshiozak  * private stuffs used by templates
     56      1.1  tshiozak  */
     57      1.1  tshiozak 
     58      1.1  tshiozak typedef struct {
     59      1.1  tshiozak 	u_int8_t		ch[4];
     60      1.1  tshiozak 	int			chlen;
     61      1.1  tshiozak 	int			current_endian;
     62      1.1  tshiozak } _UTF1632State;
     63      1.1  tshiozak 
     64      1.1  tshiozak typedef struct {
     65      1.1  tshiozak 	int		preffered_endian;
     66      1.1  tshiozak 	unsigned int	cur_max;
     67      1.1  tshiozak #define _ENDIAN_UNKNOWN	0
     68      1.1  tshiozak #define _ENDIAN_BIG	1
     69      1.1  tshiozak #define _ENDIAN_LITTLE	2
     70      1.1  tshiozak 	u_int32_t	mode;
     71      1.1  tshiozak #define _MODE_UTF32		0x00000001U
     72      1.1  tshiozak #define _MODE_FORCE_ENDIAN	0x00000002U
     73      1.1  tshiozak } _UTF1632EncodingInfo;
     74      1.1  tshiozak 
     75      1.1  tshiozak #define _FUNCNAME(m)			_citrus_UTF1632_##m
     76      1.1  tshiozak #define _ENCODING_INFO			_UTF1632EncodingInfo
     77      1.1  tshiozak #define _ENCODING_STATE			_UTF1632State
     78      1.1  tshiozak #define _ENCODING_MB_CUR_MAX(_ei_)	((_ei_)->cur_max)
     79      1.1  tshiozak #define _ENCODING_IS_STATE_DEPENDENT	0
     80      1.1  tshiozak #define _STATE_NEEDS_EXPLICIT_INIT(_ps_)	0
     81      1.1  tshiozak 
     82      1.1  tshiozak 
     83      1.1  tshiozak static __inline void
     84      1.1  tshiozak /*ARGSUSED*/
     85      1.1  tshiozak _citrus_UTF1632_init_state(_UTF1632EncodingInfo *ei, _UTF1632State *s)
     86      1.1  tshiozak {
     87      1.1  tshiozak 	memset(s, 0, sizeof(*s));
     88      1.1  tshiozak }
     89      1.1  tshiozak 
     90      1.1  tshiozak static int
     91      1.1  tshiozak _citrus_UTF1632_mbrtowc_priv(_UTF1632EncodingInfo *ei, wchar_t *pwc,
     92      1.1  tshiozak 			     const char **s, size_t n, _UTF1632State *psenc,
     93      1.1  tshiozak 			     size_t *nresult)
     94      1.1  tshiozak {
     95      1.1  tshiozak 	int chlenbak, endian, needlen;
     96      1.1  tshiozak 	wchar_t wc;
     97      1.1  tshiozak 	size_t result;
     98      1.1  tshiozak 	const char *s0;
     99      1.1  tshiozak 
    100      1.1  tshiozak 	_DIAGASSERT(nresult != 0);
    101      1.1  tshiozak 	_DIAGASSERT(ei != NULL);
    102      1.1  tshiozak 	_DIAGASSERT(s != NULL);
    103      1.1  tshiozak 	_DIAGASSERT(psenc != NULL);
    104      1.1  tshiozak 
    105      1.1  tshiozak 	s0 = *s;
    106      1.1  tshiozak 
    107      1.1  tshiozak 	if (s0 == NULL) {
    108      1.1  tshiozak 		_citrus_UTF1632_init_state(ei, psenc);
    109      1.1  tshiozak 		*nresult = 0; /* state independent */
    110      1.1  tshiozak 		return (0);
    111      1.1  tshiozak 	}
    112      1.1  tshiozak 
    113      1.1  tshiozak 	result = 0;
    114      1.1  tshiozak 	chlenbak = psenc->chlen;
    115      1.1  tshiozak 
    116      1.1  tshiozak refetch:
    117      1.1  tshiozak 	if ((ei->mode & _MODE_UTF32) != 0 || chlenbak>=2)
    118      1.1  tshiozak 		needlen = 4;
    119      1.1  tshiozak 	else
    120      1.1  tshiozak 		needlen = 2;
    121      1.1  tshiozak 
    122      1.1  tshiozak 	while (chlenbak < needlen) {
    123      1.1  tshiozak 		if (n==0)
    124      1.1  tshiozak 			goto restart;
    125      1.1  tshiozak 		psenc->ch[chlenbak++] = *s0++;
    126      1.1  tshiozak 		n--;
    127      1.1  tshiozak 		result++;
    128      1.1  tshiozak 	}
    129      1.1  tshiozak 
    130  1.9.4.1       riz 	if (psenc->current_endian == _ENDIAN_UNKNOWN) {
    131  1.9.4.1       riz 		if ((ei->mode & _MODE_FORCE_ENDIAN) == 0) {
    132  1.9.4.1       riz 			/* judge endian marker */
    133  1.9.4.1       riz 			if ((ei->mode & _MODE_UTF32) == 0) {
    134  1.9.4.1       riz 				/* UTF16 */
    135  1.9.4.1       riz 				if (psenc->ch[0]==0xFE && psenc->ch[1]==0xFF) {
    136  1.9.4.1       riz 					psenc->current_endian = _ENDIAN_BIG;
    137  1.9.4.1       riz 					chlenbak = 0;
    138  1.9.4.1       riz 					goto refetch;
    139  1.9.4.1       riz 				} else if (psenc->ch[0]==0xFF && psenc->ch[1]==0xFE) {
    140  1.9.4.1       riz 					psenc->current_endian = _ENDIAN_LITTLE;
    141  1.9.4.1       riz 					chlenbak = 0;
    142  1.9.4.1       riz 					goto refetch;
    143  1.9.4.1       riz 				}
    144  1.9.4.1       riz 			} else {
    145  1.9.4.1       riz 				/* UTF32 */
    146  1.9.4.1       riz 				if (psenc->ch[0]==0x00 && psenc->ch[1]==0x00 &&
    147  1.9.4.1       riz 				    psenc->ch[2]==0xFE && psenc->ch[3]==0xFF) {
    148  1.9.4.1       riz 					psenc->current_endian = _ENDIAN_BIG;
    149  1.9.4.1       riz 					chlenbak = 0;
    150  1.9.4.1       riz 					goto refetch;
    151  1.9.4.1       riz 				} else if (psenc->ch[0]==0xFF && psenc->ch[1]==0xFE &&
    152  1.9.4.1       riz 					   psenc->ch[2]==0x00 && psenc->ch[3]==0x00) {
    153  1.9.4.1       riz 					psenc->current_endian = _ENDIAN_LITTLE;
    154  1.9.4.1       riz 					chlenbak = 0;
    155  1.9.4.1       riz 					goto refetch;
    156  1.9.4.1       riz 				}
    157  1.9.4.1       riz 			}
    158      1.1  tshiozak 		}
    159  1.9.4.1       riz 		psenc->current_endian = ei->preffered_endian;
    160      1.1  tshiozak 	}
    161  1.9.4.1       riz 	endian = psenc->current_endian;
    162      1.1  tshiozak 
    163      1.1  tshiozak 	/* get wc */
    164      1.1  tshiozak 	if ((ei->mode & _MODE_UTF32) == 0) {
    165      1.1  tshiozak 		/* UTF16 */
    166      1.1  tshiozak 		if (needlen==2) {
    167      1.1  tshiozak 			switch (endian) {
    168      1.1  tshiozak 			case _ENDIAN_LITTLE:
    169      1.1  tshiozak 				wc = (psenc->ch[0] |
    170      1.1  tshiozak 				      ((wchar_t)psenc->ch[1] << 8));
    171      1.1  tshiozak 				break;
    172      1.1  tshiozak 			case _ENDIAN_BIG:
    173      1.1  tshiozak 				wc = (psenc->ch[1] |
    174      1.1  tshiozak 				      ((wchar_t)psenc->ch[0] << 8));
    175      1.1  tshiozak 				break;
    176      1.6  christos 			default:
    177      1.6  christos 				goto ilseq;
    178      1.1  tshiozak 			}
    179      1.1  tshiozak 			if (wc >= 0xD800 && wc <= 0xDBFF) {
    180      1.1  tshiozak 				/* surrogate high */
    181      1.1  tshiozak 				needlen=4;
    182      1.1  tshiozak 				goto refetch;
    183      1.1  tshiozak 			}
    184      1.1  tshiozak 		} else {
    185      1.1  tshiozak 			/* surrogate low */
    186      1.1  tshiozak 			wc -= 0xD800; /* wc : surrogate high (see above) */
    187      1.1  tshiozak 			wc <<= 10;
    188      1.1  tshiozak 			switch (endian) {
    189      1.1  tshiozak 			case _ENDIAN_LITTLE:
    190  1.9.4.1       riz 				if (psenc->ch[3]<0xDC || psenc->ch[3]>0xDF)
    191      1.1  tshiozak 					goto ilseq;
    192      1.1  tshiozak 				wc |= psenc->ch[2];
    193      1.1  tshiozak 				wc |= (wchar_t)(psenc->ch[3] & 3) << 8;
    194      1.1  tshiozak 				break;
    195      1.1  tshiozak 			case _ENDIAN_BIG:
    196  1.9.4.1       riz 				if (psenc->ch[2]<0xDC || psenc->ch[2]>0xDF)
    197      1.1  tshiozak 					goto ilseq;
    198      1.1  tshiozak 				wc |= psenc->ch[3];
    199      1.1  tshiozak 				wc |= (wchar_t)(psenc->ch[2] & 3) << 8;
    200      1.1  tshiozak 				break;
    201      1.6  christos 			default:
    202      1.6  christos 				goto ilseq;
    203      1.1  tshiozak 			}
    204      1.1  tshiozak 			wc += 0x10000;
    205      1.1  tshiozak 		}
    206      1.1  tshiozak 	} else {
    207      1.1  tshiozak 		/* UTF32 */
    208      1.1  tshiozak 		switch (endian) {
    209      1.1  tshiozak 		case _ENDIAN_LITTLE:
    210      1.1  tshiozak 			wc = (psenc->ch[0] |
    211      1.1  tshiozak 			      ((wchar_t)psenc->ch[1] << 8) |
    212      1.1  tshiozak 			      ((wchar_t)psenc->ch[2] << 16) |
    213      1.1  tshiozak 			      ((wchar_t)psenc->ch[3] << 24));
    214      1.1  tshiozak 			break;
    215      1.1  tshiozak 		case _ENDIAN_BIG:
    216      1.1  tshiozak 			wc = (psenc->ch[3] |
    217      1.1  tshiozak 			      ((wchar_t)psenc->ch[2] << 8) |
    218      1.1  tshiozak 			      ((wchar_t)psenc->ch[1] << 16) |
    219      1.1  tshiozak 			      ((wchar_t)psenc->ch[0] << 24));
    220      1.1  tshiozak 			break;
    221      1.6  christos 		default:
    222      1.6  christos 			goto ilseq;
    223      1.1  tshiozak 		}
    224      1.7   tnozaki 		if (wc >= 0xD800 && wc <= 0xDFFF)
    225      1.7   tnozaki 			goto ilseq;
    226      1.1  tshiozak 	}
    227      1.1  tshiozak 
    228      1.1  tshiozak 
    229      1.1  tshiozak 	*pwc = wc;
    230      1.1  tshiozak 	psenc->chlen = 0;
    231      1.1  tshiozak 	*nresult = result;
    232      1.1  tshiozak 	*s = s0;
    233      1.1  tshiozak 
    234      1.1  tshiozak 	return (0);
    235      1.1  tshiozak 
    236      1.1  tshiozak ilseq:
    237      1.1  tshiozak 	*nresult = (size_t)-1;
    238      1.1  tshiozak 	psenc->chlen = 0;
    239      1.1  tshiozak 	return (EILSEQ);
    240      1.1  tshiozak 
    241      1.1  tshiozak restart:
    242      1.1  tshiozak 	*nresult = (size_t)-2;
    243      1.1  tshiozak 	psenc->chlen = chlenbak;
    244      1.1  tshiozak 	*s = s0;
    245      1.1  tshiozak 	return (0);
    246      1.1  tshiozak }
    247      1.1  tshiozak 
    248      1.1  tshiozak static int
    249      1.1  tshiozak _citrus_UTF1632_wcrtomb_priv(_UTF1632EncodingInfo *ei, char *s, size_t n,
    250      1.1  tshiozak 			     wchar_t wc, _UTF1632State *psenc,
    251      1.1  tshiozak 			     size_t *nresult)
    252      1.1  tshiozak {
    253      1.1  tshiozak 	int ret;
    254      1.1  tshiozak 	wchar_t wc2;
    255      1.8   tnozaki 	static const char _bom[4] = {
    256      1.8   tnozaki #if BYTE_ORDER == BIG_ENDIAN
    257      1.8   tnozaki 	    0x00, 0x00, 0xFE, 0xFF,
    258      1.8   tnozaki #else
    259      1.8   tnozaki 	    0xFF, 0xFE, 0x00, 0x00,
    260      1.8   tnozaki #endif
    261      1.8   tnozaki 	};
    262      1.8   tnozaki 	const char *bom = &_bom[0];
    263      1.8   tnozaki 	size_t cnt;
    264      1.1  tshiozak 
    265      1.1  tshiozak 	_DIAGASSERT(ei != NULL);
    266      1.1  tshiozak 	_DIAGASSERT(nresult != 0);
    267      1.1  tshiozak 	_DIAGASSERT(s != NULL);
    268      1.1  tshiozak 
    269      1.8   tnozaki 	cnt = (size_t)0;
    270      1.8   tnozaki 	if (psenc->current_endian == _ENDIAN_UNKNOWN) {
    271      1.8   tnozaki 		if ((ei->mode & _MODE_FORCE_ENDIAN) == 0) {
    272      1.8   tnozaki 			if (ei->mode & _MODE_UTF32) {
    273      1.8   tnozaki 				cnt = 4;
    274      1.8   tnozaki 			} else {
    275      1.8   tnozaki 				cnt = 2;
    276      1.8   tnozaki #if BYTE_ORDER == BIG_ENDIAN
    277      1.8   tnozaki 				bom += 2;
    278      1.8   tnozaki #endif
    279      1.8   tnozaki 			}
    280      1.8   tnozaki 			if (n < cnt)
    281      1.8   tnozaki 				goto e2big;
    282      1.8   tnozaki 			memcpy(s, bom, cnt);
    283      1.8   tnozaki 			s += cnt, n -= cnt;
    284      1.8   tnozaki 		}
    285      1.8   tnozaki 		psenc->current_endian = ei->preffered_endian;
    286      1.8   tnozaki 	}
    287      1.8   tnozaki 
    288      1.1  tshiozak 	wc2 = 0;
    289      1.1  tshiozak 	if ((ei->mode & _MODE_UTF32)==0) {
    290      1.1  tshiozak 		/* UTF16 */
    291      1.1  tshiozak 		if (wc>0xFFFF) {
    292      1.1  tshiozak 			/* surrogate */
    293      1.8   tnozaki 			if (wc>0x10FFFF)
    294      1.8   tnozaki 				goto ilseq;
    295      1.8   tnozaki 			if (n < 4)
    296      1.8   tnozaki 				goto e2big;
    297      1.8   tnozaki 			cnt += 4;
    298      1.1  tshiozak 			wc -= 0x10000;
    299      1.1  tshiozak 			wc2 = (wc & 0x3FF) | 0xDC00;
    300      1.1  tshiozak 			wc = (wc>>10) | 0xD800;
    301      1.1  tshiozak 		} else {
    302      1.8   tnozaki 			if (n < 2)
    303      1.8   tnozaki 				goto e2big;
    304      1.8   tnozaki 			cnt += 2;
    305      1.1  tshiozak 		}
    306      1.1  tshiozak 
    307      1.1  tshiozak surrogate:
    308      1.8   tnozaki 		switch (psenc->current_endian) {
    309      1.1  tshiozak 		case _ENDIAN_BIG:
    310      1.1  tshiozak 			s[1] = wc;
    311      1.1  tshiozak 			s[0] = (wc >>= 8);
    312      1.1  tshiozak 			break;
    313      1.1  tshiozak 		case _ENDIAN_LITTLE:
    314      1.1  tshiozak 			s[0] = wc;
    315      1.1  tshiozak 			s[1] = (wc >>= 8);
    316      1.1  tshiozak 			break;
    317      1.1  tshiozak 		}
    318      1.1  tshiozak 		if (wc2!=0) {
    319      1.1  tshiozak 			wc = wc2;
    320      1.1  tshiozak 			wc2 = 0;
    321      1.1  tshiozak 			s += 2;
    322      1.1  tshiozak 			goto surrogate;
    323      1.1  tshiozak 		}
    324      1.1  tshiozak 	} else {
    325      1.1  tshiozak 		/* UTF32 */
    326      1.7   tnozaki 		if (wc >= 0xD800 && wc <= 0xDFFF)
    327      1.8   tnozaki 			goto ilseq;
    328      1.8   tnozaki 		if (n < 4)
    329      1.8   tnozaki 			goto e2big;
    330      1.8   tnozaki 		cnt += 4;
    331      1.8   tnozaki 		switch (psenc->current_endian) {
    332      1.1  tshiozak 		case _ENDIAN_BIG:
    333      1.1  tshiozak 			s[3] = wc;
    334      1.1  tshiozak 			s[2] = (wc >>= 8);
    335      1.1  tshiozak 			s[1] = (wc >>= 8);
    336      1.1  tshiozak 			s[0] = (wc >>= 8);
    337      1.1  tshiozak 			break;
    338      1.1  tshiozak 		case _ENDIAN_LITTLE:
    339      1.1  tshiozak 			s[0] = wc;
    340      1.1  tshiozak 			s[1] = (wc >>= 8);
    341      1.1  tshiozak 			s[2] = (wc >>= 8);
    342      1.1  tshiozak 			s[3] = (wc >>= 8);
    343      1.1  tshiozak 			break;
    344      1.1  tshiozak 		}
    345      1.1  tshiozak 	}
    346      1.8   tnozaki 	*nresult = cnt;
    347      1.1  tshiozak 
    348      1.1  tshiozak 	return 0;
    349      1.1  tshiozak 
    350      1.8   tnozaki ilseq:
    351      1.8   tnozaki 	*nresult = (size_t)-1;
    352      1.8   tnozaki 	return EILSEQ;
    353      1.8   tnozaki e2big:
    354      1.1  tshiozak 	*nresult = (size_t)-1;
    355      1.8   tnozaki 	return E2BIG;
    356      1.1  tshiozak }
    357      1.1  tshiozak 
    358      1.1  tshiozak static void
    359      1.1  tshiozak parse_variable(_UTF1632EncodingInfo * __restrict ei,
    360      1.1  tshiozak 	       const void * __restrict var, size_t lenvar)
    361      1.1  tshiozak {
    362      1.1  tshiozak #define MATCH(x, act)						\
    363      1.1  tshiozak do {								\
    364      1.1  tshiozak 	if (lenvar >= (sizeof(#x)-1) &&				\
    365      1.1  tshiozak 	    _bcs_strncasecmp(p, #x, sizeof(#x)-1) == 0) {	\
    366      1.1  tshiozak 		act;						\
    367      1.1  tshiozak 		lenvar -= sizeof(#x)-1;				\
    368      1.1  tshiozak 		p += sizeof(#x)-1;				\
    369      1.1  tshiozak 	}							\
    370      1.1  tshiozak } while (/*CONSTCOND*/0)
    371      1.1  tshiozak 	const char *p;
    372      1.1  tshiozak 	p = var;
    373      1.1  tshiozak 	while (lenvar>0) {
    374      1.1  tshiozak 		switch (*p) {
    375      1.1  tshiozak 		case 'B':
    376      1.1  tshiozak 		case 'b':
    377      1.1  tshiozak 			MATCH(big, ei->preffered_endian = _ENDIAN_BIG);
    378      1.1  tshiozak 			break;
    379      1.1  tshiozak 		case 'L':
    380      1.1  tshiozak 		case 'l':
    381      1.1  tshiozak 			MATCH(little, ei->preffered_endian = _ENDIAN_LITTLE);
    382      1.1  tshiozak 			break;
    383      1.1  tshiozak 		case 'F':
    384      1.1  tshiozak 		case 'f':
    385      1.1  tshiozak 			MATCH(force, ei->mode |= _MODE_FORCE_ENDIAN);
    386      1.1  tshiozak 			break;
    387      1.1  tshiozak 		case 'U':
    388      1.1  tshiozak 		case 'u':
    389      1.1  tshiozak 			MATCH(utf32, ei->mode |= _MODE_UTF32);
    390      1.1  tshiozak 			break;
    391      1.1  tshiozak 		}
    392      1.1  tshiozak 		p++;
    393      1.1  tshiozak 		lenvar--;
    394      1.1  tshiozak 	}
    395      1.1  tshiozak }
    396      1.1  tshiozak 
    397      1.1  tshiozak static int
    398      1.1  tshiozak /*ARGSUSED*/
    399      1.1  tshiozak _citrus_UTF1632_encoding_module_init(_UTF1632EncodingInfo * __restrict ei,
    400      1.1  tshiozak 				     const void * __restrict var,
    401      1.1  tshiozak 				     size_t lenvar)
    402      1.1  tshiozak {
    403      1.1  tshiozak 	_DIAGASSERT(ei != NULL);
    404      1.1  tshiozak 
    405      1.1  tshiozak 	memset((void *)ei, 0, sizeof(*ei));
    406      1.1  tshiozak 
    407      1.1  tshiozak 	parse_variable(ei, var, lenvar);
    408      1.1  tshiozak 
    409      1.1  tshiozak 	if ((ei->mode&_MODE_UTF32)==0)
    410      1.1  tshiozak 		ei->cur_max = 6; /* endian + surrogate */
    411      1.1  tshiozak 	else
    412      1.1  tshiozak 		ei->cur_max = 8; /* endian + normal */
    413      1.1  tshiozak 
    414      1.1  tshiozak 	if (ei->preffered_endian == _ENDIAN_UNKNOWN) {
    415      1.1  tshiozak #if BYTE_ORDER == BIG_ENDIAN
    416      1.1  tshiozak 		ei->preffered_endian = _ENDIAN_BIG;
    417      1.1  tshiozak #else
    418      1.1  tshiozak 		ei->preffered_endian = _ENDIAN_LITTLE;
    419      1.1  tshiozak #endif
    420      1.1  tshiozak 	}
    421      1.1  tshiozak 
    422      1.1  tshiozak 	return (0);
    423      1.1  tshiozak }
    424      1.1  tshiozak 
    425      1.1  tshiozak static void
    426      1.1  tshiozak /*ARGSUSED*/
    427      1.1  tshiozak _citrus_UTF1632_encoding_module_uninit(_UTF1632EncodingInfo *ei)
    428      1.1  tshiozak {
    429      1.1  tshiozak }
    430      1.1  tshiozak 
    431      1.1  tshiozak static __inline int
    432      1.1  tshiozak /*ARGSUSED*/
    433      1.1  tshiozak _citrus_UTF1632_stdenc_wctocs(_UTF1632EncodingInfo * __restrict ei,
    434      1.1  tshiozak 			      _csid_t * __restrict csid,
    435      1.1  tshiozak 			      _index_t * __restrict idx,
    436      1.1  tshiozak 			      _wc_t wc)
    437      1.1  tshiozak {
    438      1.1  tshiozak 
    439      1.1  tshiozak 	_DIAGASSERT(csid != NULL && idx != NULL);
    440      1.1  tshiozak 
    441      1.1  tshiozak 	*csid = 0;
    442      1.1  tshiozak 	*idx = (_index_t)wc;
    443      1.1  tshiozak 
    444      1.1  tshiozak 	return (0);
    445      1.1  tshiozak }
    446      1.1  tshiozak 
    447      1.1  tshiozak static __inline int
    448      1.1  tshiozak /*ARGSUSED*/
    449      1.1  tshiozak _citrus_UTF1632_stdenc_cstowc(_UTF1632EncodingInfo * __restrict ei,
    450      1.1  tshiozak 			      _wc_t * __restrict wc,
    451      1.1  tshiozak 			      _csid_t csid, _index_t idx)
    452      1.1  tshiozak {
    453      1.1  tshiozak 
    454      1.1  tshiozak 	_DIAGASSERT(wc != NULL);
    455      1.1  tshiozak 
    456      1.1  tshiozak 	if (csid != 0)
    457      1.1  tshiozak 		return (EILSEQ);
    458      1.1  tshiozak 
    459      1.1  tshiozak 	*wc = (_wc_t)idx;
    460      1.1  tshiozak 
    461      1.1  tshiozak 	return (0);
    462      1.1  tshiozak }
    463      1.1  tshiozak 
    464      1.4  tshiozak static __inline int
    465      1.4  tshiozak /*ARGSUSED*/
    466      1.4  tshiozak _citrus_UTF1632_stdenc_get_state_desc_generic(_UTF1632EncodingInfo * __restrict ei,
    467      1.4  tshiozak 					      _UTF1632State * __restrict psenc,
    468      1.4  tshiozak 					      int * __restrict rstate)
    469      1.4  tshiozak {
    470      1.4  tshiozak 
    471      1.4  tshiozak 	if (psenc->chlen == 0)
    472      1.4  tshiozak 		*rstate = _STDENC_SDGEN_INITIAL;
    473      1.4  tshiozak 	else
    474      1.4  tshiozak 		*rstate = _STDENC_SDGEN_INCOMPLETE_CHAR;
    475      1.4  tshiozak 
    476      1.4  tshiozak 	return 0;
    477      1.4  tshiozak }
    478      1.1  tshiozak 
    479      1.1  tshiozak /* ----------------------------------------------------------------------
    480      1.1  tshiozak  * public interface for stdenc
    481      1.1  tshiozak  */
    482      1.1  tshiozak 
    483      1.1  tshiozak _CITRUS_STDENC_DECLS(UTF1632);
    484      1.1  tshiozak _CITRUS_STDENC_DEF_OPS(UTF1632);
    485      1.1  tshiozak 
    486      1.1  tshiozak #include "citrus_stdenc_template.h"
    487