Home | History | Annotate | Line # | Download | only in modules
citrus_utf1632.c revision 1.10
      1  1.10   tnozaki /*	$NetBSD: citrus_utf1632.c,v 1.10 2010/03/15 15:00:58 tnozaki Exp $	*/
      2   1.1  tshiozak 
      3   1.1  tshiozak /*-
      4   1.1  tshiozak  * Copyright (c)2003 Citrus Project,
      5   1.1  tshiozak  * All rights reserved.
      6   1.1  tshiozak  *
      7   1.1  tshiozak  * Redistribution and use in source and binary forms, with or without
      8   1.1  tshiozak  * modification, are permitted provided that the following conditions
      9   1.1  tshiozak  * are met:
     10   1.1  tshiozak  * 1. Redistributions of source code must retain the above copyright
     11   1.1  tshiozak  *    notice, this list of conditions and the following disclaimer.
     12   1.1  tshiozak  * 2. Redistributions in binary form must reproduce the above copyright
     13   1.1  tshiozak  *    notice, this list of conditions and the following disclaimer in the
     14   1.1  tshiozak  *    documentation and/or other materials provided with the distribution.
     15   1.1  tshiozak  *
     16   1.1  tshiozak  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
     17   1.1  tshiozak  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     18   1.1  tshiozak  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     19   1.1  tshiozak  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
     20   1.1  tshiozak  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     21   1.1  tshiozak  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     22   1.1  tshiozak  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     23   1.1  tshiozak  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     24   1.1  tshiozak  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     25   1.1  tshiozak  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     26   1.1  tshiozak  * SUCH DAMAGE.
     27   1.1  tshiozak  */
     28   1.1  tshiozak 
     29   1.1  tshiozak #include <sys/cdefs.h>
     30   1.1  tshiozak #if defined(LIBC_SCCS) && !defined(lint)
     31  1.10   tnozaki __RCSID("$NetBSD: citrus_utf1632.c,v 1.10 2010/03/15 15:00:58 tnozaki Exp $");
     32   1.1  tshiozak #endif /* LIBC_SCCS and not lint */
     33   1.1  tshiozak 
     34   1.1  tshiozak #include <assert.h>
     35   1.1  tshiozak #include <errno.h>
     36   1.1  tshiozak #include <string.h>
     37   1.1  tshiozak #include <stdio.h>
     38   1.1  tshiozak #include <stdlib.h>
     39   1.1  tshiozak #include <stddef.h>
     40   1.1  tshiozak #include <limits.h>
     41   1.1  tshiozak #include <wchar.h>
     42   1.1  tshiozak #include <sys/types.h>
     43   1.5    dogcow #include <machine/endian.h>
     44   1.1  tshiozak 
     45   1.1  tshiozak #include "citrus_namespace.h"
     46   1.1  tshiozak #include "citrus_types.h"
     47   1.1  tshiozak #include "citrus_module.h"
     48   1.1  tshiozak #include "citrus_stdenc.h"
     49   1.1  tshiozak #include "citrus_bcs.h"
     50   1.1  tshiozak 
     51   1.1  tshiozak #include "citrus_utf1632.h"
     52   1.1  tshiozak 
     53   1.1  tshiozak 
     54   1.1  tshiozak /* ----------------------------------------------------------------------
     55   1.1  tshiozak  * private stuffs used by templates
     56   1.1  tshiozak  */
     57   1.1  tshiozak 
     58   1.1  tshiozak typedef struct {
     59   1.1  tshiozak 	u_int8_t		ch[4];
     60   1.1  tshiozak 	int			chlen;
     61   1.1  tshiozak 	int			current_endian;
     62   1.1  tshiozak } _UTF1632State;
     63   1.1  tshiozak 
     64   1.1  tshiozak typedef struct {
     65   1.1  tshiozak 	int		preffered_endian;
     66   1.1  tshiozak 	unsigned int	cur_max;
     67   1.1  tshiozak #define _ENDIAN_UNKNOWN	0
     68   1.1  tshiozak #define _ENDIAN_BIG	1
     69   1.1  tshiozak #define _ENDIAN_LITTLE	2
     70   1.1  tshiozak 	u_int32_t	mode;
     71   1.1  tshiozak #define _MODE_UTF32		0x00000001U
     72   1.1  tshiozak #define _MODE_FORCE_ENDIAN	0x00000002U
     73   1.1  tshiozak } _UTF1632EncodingInfo;
     74   1.1  tshiozak 
     75   1.1  tshiozak #define _FUNCNAME(m)			_citrus_UTF1632_##m
     76   1.1  tshiozak #define _ENCODING_INFO			_UTF1632EncodingInfo
     77   1.1  tshiozak #define _ENCODING_STATE			_UTF1632State
     78   1.1  tshiozak #define _ENCODING_MB_CUR_MAX(_ei_)	((_ei_)->cur_max)
     79   1.1  tshiozak #define _ENCODING_IS_STATE_DEPENDENT	0
     80   1.1  tshiozak #define _STATE_NEEDS_EXPLICIT_INIT(_ps_)	0
     81   1.1  tshiozak 
     82   1.1  tshiozak 
     83   1.1  tshiozak static __inline void
     84   1.1  tshiozak /*ARGSUSED*/
     85   1.1  tshiozak _citrus_UTF1632_init_state(_UTF1632EncodingInfo *ei, _UTF1632State *s)
     86   1.1  tshiozak {
     87   1.1  tshiozak 	memset(s, 0, sizeof(*s));
     88   1.1  tshiozak }
     89   1.1  tshiozak 
     90   1.1  tshiozak static int
     91   1.1  tshiozak _citrus_UTF1632_mbrtowc_priv(_UTF1632EncodingInfo *ei, wchar_t *pwc,
     92   1.1  tshiozak 			     const char **s, size_t n, _UTF1632State *psenc,
     93   1.1  tshiozak 			     size_t *nresult)
     94   1.1  tshiozak {
     95   1.1  tshiozak 	int chlenbak, endian, needlen;
     96   1.1  tshiozak 	wchar_t wc;
     97   1.1  tshiozak 	size_t result;
     98   1.1  tshiozak 	const char *s0;
     99   1.1  tshiozak 
    100   1.1  tshiozak 	_DIAGASSERT(nresult != 0);
    101   1.1  tshiozak 	_DIAGASSERT(ei != NULL);
    102   1.1  tshiozak 	_DIAGASSERT(s != NULL);
    103   1.1  tshiozak 	_DIAGASSERT(psenc != NULL);
    104   1.1  tshiozak 
    105   1.1  tshiozak 	s0 = *s;
    106   1.1  tshiozak 
    107   1.1  tshiozak 	if (s0 == NULL) {
    108   1.1  tshiozak 		_citrus_UTF1632_init_state(ei, psenc);
    109   1.1  tshiozak 		*nresult = 0; /* state independent */
    110   1.1  tshiozak 		return (0);
    111   1.1  tshiozak 	}
    112   1.1  tshiozak 
    113   1.1  tshiozak 	result = 0;
    114   1.1  tshiozak 	chlenbak = psenc->chlen;
    115   1.1  tshiozak 
    116   1.1  tshiozak refetch:
    117   1.1  tshiozak 	if ((ei->mode & _MODE_UTF32) != 0 || chlenbak>=2)
    118   1.1  tshiozak 		needlen = 4;
    119   1.1  tshiozak 	else
    120   1.1  tshiozak 		needlen = 2;
    121   1.1  tshiozak 
    122   1.1  tshiozak 	while (chlenbak < needlen) {
    123   1.1  tshiozak 		if (n==0)
    124   1.1  tshiozak 			goto restart;
    125   1.1  tshiozak 		psenc->ch[chlenbak++] = *s0++;
    126   1.1  tshiozak 		n--;
    127   1.1  tshiozak 		result++;
    128   1.1  tshiozak 	}
    129   1.1  tshiozak 
    130  1.10   tnozaki 	if (psenc->current_endian == _ENDIAN_UNKNOWN) {
    131  1.10   tnozaki 		if ((ei->mode & _MODE_FORCE_ENDIAN) == 0) {
    132  1.10   tnozaki 			/* judge endian marker */
    133  1.10   tnozaki 			if ((ei->mode & _MODE_UTF32) == 0) {
    134  1.10   tnozaki 				/* UTF16 */
    135  1.10   tnozaki 				if (psenc->ch[0]==0xFE && psenc->ch[1]==0xFF) {
    136  1.10   tnozaki 					psenc->current_endian = _ENDIAN_BIG;
    137  1.10   tnozaki 					chlenbak = 0;
    138  1.10   tnozaki 					goto refetch;
    139  1.10   tnozaki 				} else if (psenc->ch[0]==0xFF && psenc->ch[1]==0xFE) {
    140  1.10   tnozaki 					psenc->current_endian = _ENDIAN_LITTLE;
    141  1.10   tnozaki 					chlenbak = 0;
    142  1.10   tnozaki 					goto refetch;
    143  1.10   tnozaki 				}
    144  1.10   tnozaki 			} else {
    145  1.10   tnozaki 				/* UTF32 */
    146  1.10   tnozaki 				if (psenc->ch[0]==0x00 && psenc->ch[1]==0x00 &&
    147  1.10   tnozaki 				    psenc->ch[2]==0xFE && psenc->ch[3]==0xFF) {
    148  1.10   tnozaki 					psenc->current_endian = _ENDIAN_BIG;
    149  1.10   tnozaki 					chlenbak = 0;
    150  1.10   tnozaki 					goto refetch;
    151  1.10   tnozaki 				} else if (psenc->ch[0]==0xFF && psenc->ch[1]==0xFE &&
    152  1.10   tnozaki 					   psenc->ch[2]==0x00 && psenc->ch[3]==0x00) {
    153  1.10   tnozaki 					psenc->current_endian = _ENDIAN_LITTLE;
    154  1.10   tnozaki 					chlenbak = 0;
    155  1.10   tnozaki 					goto refetch;
    156  1.10   tnozaki 				}
    157  1.10   tnozaki 			}
    158  1.10   tnozaki 		} else {
    159  1.10   tnozaki 			psenc->current_endian = ei->preffered_endian;
    160   1.1  tshiozak 		}
    161   1.1  tshiozak 	}
    162  1.10   tnozaki 	endian = psenc->current_endian;
    163   1.1  tshiozak 
    164   1.1  tshiozak 	/* get wc */
    165   1.1  tshiozak 	if ((ei->mode & _MODE_UTF32) == 0) {
    166   1.1  tshiozak 		/* UTF16 */
    167   1.1  tshiozak 		if (needlen==2) {
    168   1.1  tshiozak 			switch (endian) {
    169   1.1  tshiozak 			case _ENDIAN_LITTLE:
    170   1.1  tshiozak 				wc = (psenc->ch[0] |
    171   1.1  tshiozak 				      ((wchar_t)psenc->ch[1] << 8));
    172   1.1  tshiozak 				break;
    173   1.1  tshiozak 			case _ENDIAN_BIG:
    174   1.1  tshiozak 				wc = (psenc->ch[1] |
    175   1.1  tshiozak 				      ((wchar_t)psenc->ch[0] << 8));
    176   1.1  tshiozak 				break;
    177   1.6  christos 			default:
    178   1.6  christos 				goto ilseq;
    179   1.1  tshiozak 			}
    180   1.1  tshiozak 			if (wc >= 0xD800 && wc <= 0xDBFF) {
    181   1.1  tshiozak 				/* surrogate high */
    182   1.1  tshiozak 				needlen=4;
    183   1.1  tshiozak 				goto refetch;
    184   1.1  tshiozak 			}
    185   1.1  tshiozak 		} else {
    186   1.1  tshiozak 			/* surrogate low */
    187   1.1  tshiozak 			wc -= 0xD800; /* wc : surrogate high (see above) */
    188   1.1  tshiozak 			wc <<= 10;
    189   1.1  tshiozak 			switch (endian) {
    190   1.1  tshiozak 			case _ENDIAN_LITTLE:
    191  1.10   tnozaki 				if (psenc->ch[3]<0xDC || psenc->ch[3]>0xDF)
    192   1.1  tshiozak 					goto ilseq;
    193   1.1  tshiozak 				wc |= psenc->ch[2];
    194   1.1  tshiozak 				wc |= (wchar_t)(psenc->ch[3] & 3) << 8;
    195   1.1  tshiozak 				break;
    196   1.1  tshiozak 			case _ENDIAN_BIG:
    197  1.10   tnozaki 				if (psenc->ch[2]<0xDC || psenc->ch[2]>0xDF)
    198   1.1  tshiozak 					goto ilseq;
    199   1.1  tshiozak 				wc |= psenc->ch[3];
    200   1.1  tshiozak 				wc |= (wchar_t)(psenc->ch[2] & 3) << 8;
    201   1.1  tshiozak 				break;
    202   1.6  christos 			default:
    203   1.6  christos 				goto ilseq;
    204   1.1  tshiozak 			}
    205   1.1  tshiozak 			wc += 0x10000;
    206   1.1  tshiozak 		}
    207   1.1  tshiozak 	} else {
    208   1.1  tshiozak 		/* UTF32 */
    209   1.1  tshiozak 		switch (endian) {
    210   1.1  tshiozak 		case _ENDIAN_LITTLE:
    211   1.1  tshiozak 			wc = (psenc->ch[0] |
    212   1.1  tshiozak 			      ((wchar_t)psenc->ch[1] << 8) |
    213   1.1  tshiozak 			      ((wchar_t)psenc->ch[2] << 16) |
    214   1.1  tshiozak 			      ((wchar_t)psenc->ch[3] << 24));
    215   1.1  tshiozak 			break;
    216   1.1  tshiozak 		case _ENDIAN_BIG:
    217   1.1  tshiozak 			wc = (psenc->ch[3] |
    218   1.1  tshiozak 			      ((wchar_t)psenc->ch[2] << 8) |
    219   1.1  tshiozak 			      ((wchar_t)psenc->ch[1] << 16) |
    220   1.1  tshiozak 			      ((wchar_t)psenc->ch[0] << 24));
    221   1.1  tshiozak 			break;
    222   1.6  christos 		default:
    223   1.6  christos 			goto ilseq;
    224   1.1  tshiozak 		}
    225   1.7   tnozaki 		if (wc >= 0xD800 && wc <= 0xDFFF)
    226   1.7   tnozaki 			goto ilseq;
    227   1.1  tshiozak 	}
    228   1.1  tshiozak 
    229   1.1  tshiozak 
    230   1.1  tshiozak 	*pwc = wc;
    231   1.1  tshiozak 	psenc->chlen = 0;
    232   1.1  tshiozak 	*nresult = result;
    233   1.1  tshiozak 	*s = s0;
    234   1.1  tshiozak 
    235   1.1  tshiozak 	return (0);
    236   1.1  tshiozak 
    237   1.1  tshiozak ilseq:
    238   1.1  tshiozak 	*nresult = (size_t)-1;
    239   1.1  tshiozak 	psenc->chlen = 0;
    240   1.1  tshiozak 	return (EILSEQ);
    241   1.1  tshiozak 
    242   1.1  tshiozak restart:
    243   1.1  tshiozak 	*nresult = (size_t)-2;
    244   1.1  tshiozak 	psenc->chlen = chlenbak;
    245   1.1  tshiozak 	*s = s0;
    246   1.1  tshiozak 	return (0);
    247   1.1  tshiozak }
    248   1.1  tshiozak 
    249   1.1  tshiozak static int
    250   1.1  tshiozak _citrus_UTF1632_wcrtomb_priv(_UTF1632EncodingInfo *ei, char *s, size_t n,
    251   1.1  tshiozak 			     wchar_t wc, _UTF1632State *psenc,
    252   1.1  tshiozak 			     size_t *nresult)
    253   1.1  tshiozak {
    254   1.1  tshiozak 	int ret;
    255   1.1  tshiozak 	wchar_t wc2;
    256   1.8   tnozaki 	static const char _bom[4] = {
    257   1.8   tnozaki #if BYTE_ORDER == BIG_ENDIAN
    258   1.8   tnozaki 	    0x00, 0x00, 0xFE, 0xFF,
    259   1.8   tnozaki #else
    260   1.8   tnozaki 	    0xFF, 0xFE, 0x00, 0x00,
    261   1.8   tnozaki #endif
    262   1.8   tnozaki 	};
    263   1.8   tnozaki 	const char *bom = &_bom[0];
    264   1.8   tnozaki 	size_t cnt;
    265   1.1  tshiozak 
    266   1.1  tshiozak 	_DIAGASSERT(ei != NULL);
    267   1.1  tshiozak 	_DIAGASSERT(nresult != 0);
    268   1.1  tshiozak 	_DIAGASSERT(s != NULL);
    269   1.1  tshiozak 
    270   1.8   tnozaki 	cnt = (size_t)0;
    271   1.8   tnozaki 	if (psenc->current_endian == _ENDIAN_UNKNOWN) {
    272   1.8   tnozaki 		if ((ei->mode & _MODE_FORCE_ENDIAN) == 0) {
    273   1.8   tnozaki 			if (ei->mode & _MODE_UTF32) {
    274   1.8   tnozaki 				cnt = 4;
    275   1.8   tnozaki 			} else {
    276   1.8   tnozaki 				cnt = 2;
    277   1.8   tnozaki #if BYTE_ORDER == BIG_ENDIAN
    278   1.8   tnozaki 				bom += 2;
    279   1.8   tnozaki #endif
    280   1.8   tnozaki 			}
    281   1.8   tnozaki 			if (n < cnt)
    282   1.8   tnozaki 				goto e2big;
    283   1.8   tnozaki 			memcpy(s, bom, cnt);
    284   1.8   tnozaki 			s += cnt, n -= cnt;
    285   1.8   tnozaki 		}
    286   1.8   tnozaki 		psenc->current_endian = ei->preffered_endian;
    287   1.8   tnozaki 	}
    288   1.8   tnozaki 
    289   1.1  tshiozak 	wc2 = 0;
    290   1.1  tshiozak 	if ((ei->mode & _MODE_UTF32)==0) {
    291   1.1  tshiozak 		/* UTF16 */
    292   1.1  tshiozak 		if (wc>0xFFFF) {
    293   1.1  tshiozak 			/* surrogate */
    294   1.8   tnozaki 			if (wc>0x10FFFF)
    295   1.8   tnozaki 				goto ilseq;
    296   1.8   tnozaki 			if (n < 4)
    297   1.8   tnozaki 				goto e2big;
    298   1.8   tnozaki 			cnt += 4;
    299   1.1  tshiozak 			wc -= 0x10000;
    300   1.1  tshiozak 			wc2 = (wc & 0x3FF) | 0xDC00;
    301   1.1  tshiozak 			wc = (wc>>10) | 0xD800;
    302   1.1  tshiozak 		} else {
    303   1.8   tnozaki 			if (n < 2)
    304   1.8   tnozaki 				goto e2big;
    305   1.8   tnozaki 			cnt += 2;
    306   1.1  tshiozak 		}
    307   1.1  tshiozak 
    308   1.1  tshiozak surrogate:
    309   1.8   tnozaki 		switch (psenc->current_endian) {
    310   1.1  tshiozak 		case _ENDIAN_BIG:
    311   1.1  tshiozak 			s[1] = wc;
    312   1.1  tshiozak 			s[0] = (wc >>= 8);
    313   1.1  tshiozak 			break;
    314   1.1  tshiozak 		case _ENDIAN_LITTLE:
    315   1.1  tshiozak 			s[0] = wc;
    316   1.1  tshiozak 			s[1] = (wc >>= 8);
    317   1.1  tshiozak 			break;
    318   1.1  tshiozak 		}
    319   1.1  tshiozak 		if (wc2!=0) {
    320   1.1  tshiozak 			wc = wc2;
    321   1.1  tshiozak 			wc2 = 0;
    322   1.1  tshiozak 			s += 2;
    323   1.1  tshiozak 			goto surrogate;
    324   1.1  tshiozak 		}
    325   1.1  tshiozak 	} else {
    326   1.1  tshiozak 		/* UTF32 */
    327   1.7   tnozaki 		if (wc >= 0xD800 && wc <= 0xDFFF)
    328   1.8   tnozaki 			goto ilseq;
    329   1.8   tnozaki 		if (n < 4)
    330   1.8   tnozaki 			goto e2big;
    331   1.8   tnozaki 		cnt += 4;
    332   1.8   tnozaki 		switch (psenc->current_endian) {
    333   1.1  tshiozak 		case _ENDIAN_BIG:
    334   1.1  tshiozak 			s[3] = wc;
    335   1.1  tshiozak 			s[2] = (wc >>= 8);
    336   1.1  tshiozak 			s[1] = (wc >>= 8);
    337   1.1  tshiozak 			s[0] = (wc >>= 8);
    338   1.1  tshiozak 			break;
    339   1.1  tshiozak 		case _ENDIAN_LITTLE:
    340   1.1  tshiozak 			s[0] = wc;
    341   1.1  tshiozak 			s[1] = (wc >>= 8);
    342   1.1  tshiozak 			s[2] = (wc >>= 8);
    343   1.1  tshiozak 			s[3] = (wc >>= 8);
    344   1.1  tshiozak 			break;
    345   1.1  tshiozak 		}
    346   1.1  tshiozak 	}
    347   1.8   tnozaki 	*nresult = cnt;
    348   1.1  tshiozak 
    349   1.1  tshiozak 	return 0;
    350   1.1  tshiozak 
    351   1.8   tnozaki ilseq:
    352   1.8   tnozaki 	*nresult = (size_t)-1;
    353   1.8   tnozaki 	return EILSEQ;
    354   1.8   tnozaki e2big:
    355   1.1  tshiozak 	*nresult = (size_t)-1;
    356   1.8   tnozaki 	return E2BIG;
    357   1.1  tshiozak }
    358   1.1  tshiozak 
    359   1.1  tshiozak static void
    360   1.1  tshiozak parse_variable(_UTF1632EncodingInfo * __restrict ei,
    361   1.1  tshiozak 	       const void * __restrict var, size_t lenvar)
    362   1.1  tshiozak {
    363   1.1  tshiozak #define MATCH(x, act)						\
    364   1.1  tshiozak do {								\
    365   1.1  tshiozak 	if (lenvar >= (sizeof(#x)-1) &&				\
    366   1.1  tshiozak 	    _bcs_strncasecmp(p, #x, sizeof(#x)-1) == 0) {	\
    367   1.1  tshiozak 		act;						\
    368   1.1  tshiozak 		lenvar -= sizeof(#x)-1;				\
    369   1.1  tshiozak 		p += sizeof(#x)-1;				\
    370   1.1  tshiozak 	}							\
    371   1.1  tshiozak } while (/*CONSTCOND*/0)
    372   1.1  tshiozak 	const char *p;
    373   1.1  tshiozak 	p = var;
    374   1.1  tshiozak 	while (lenvar>0) {
    375   1.1  tshiozak 		switch (*p) {
    376   1.1  tshiozak 		case 'B':
    377   1.1  tshiozak 		case 'b':
    378   1.1  tshiozak 			MATCH(big, ei->preffered_endian = _ENDIAN_BIG);
    379   1.1  tshiozak 			break;
    380   1.1  tshiozak 		case 'L':
    381   1.1  tshiozak 		case 'l':
    382   1.1  tshiozak 			MATCH(little, ei->preffered_endian = _ENDIAN_LITTLE);
    383   1.1  tshiozak 			break;
    384   1.1  tshiozak 		case 'F':
    385   1.1  tshiozak 		case 'f':
    386   1.1  tshiozak 			MATCH(force, ei->mode |= _MODE_FORCE_ENDIAN);
    387   1.1  tshiozak 			break;
    388   1.1  tshiozak 		case 'U':
    389   1.1  tshiozak 		case 'u':
    390   1.1  tshiozak 			MATCH(utf32, ei->mode |= _MODE_UTF32);
    391   1.1  tshiozak 			break;
    392   1.1  tshiozak 		}
    393   1.1  tshiozak 		p++;
    394   1.1  tshiozak 		lenvar--;
    395   1.1  tshiozak 	}
    396   1.1  tshiozak }
    397   1.1  tshiozak 
    398   1.1  tshiozak static int
    399   1.1  tshiozak /*ARGSUSED*/
    400   1.1  tshiozak _citrus_UTF1632_encoding_module_init(_UTF1632EncodingInfo * __restrict ei,
    401   1.1  tshiozak 				     const void * __restrict var,
    402   1.1  tshiozak 				     size_t lenvar)
    403   1.1  tshiozak {
    404   1.1  tshiozak 	_DIAGASSERT(ei != NULL);
    405   1.1  tshiozak 
    406   1.1  tshiozak 	memset((void *)ei, 0, sizeof(*ei));
    407   1.1  tshiozak 
    408   1.1  tshiozak 	parse_variable(ei, var, lenvar);
    409   1.1  tshiozak 
    410   1.1  tshiozak 	if ((ei->mode&_MODE_UTF32)==0)
    411   1.1  tshiozak 		ei->cur_max = 6; /* endian + surrogate */
    412   1.1  tshiozak 	else
    413   1.1  tshiozak 		ei->cur_max = 8; /* endian + normal */
    414   1.1  tshiozak 
    415   1.1  tshiozak 	if (ei->preffered_endian == _ENDIAN_UNKNOWN) {
    416   1.1  tshiozak #if BYTE_ORDER == BIG_ENDIAN
    417   1.1  tshiozak 		ei->preffered_endian = _ENDIAN_BIG;
    418   1.1  tshiozak #else
    419   1.1  tshiozak 		ei->preffered_endian = _ENDIAN_LITTLE;
    420   1.1  tshiozak #endif
    421   1.1  tshiozak 	}
    422   1.1  tshiozak 
    423   1.1  tshiozak 	return (0);
    424   1.1  tshiozak }
    425   1.1  tshiozak 
    426   1.1  tshiozak static void
    427   1.1  tshiozak /*ARGSUSED*/
    428   1.1  tshiozak _citrus_UTF1632_encoding_module_uninit(_UTF1632EncodingInfo *ei)
    429   1.1  tshiozak {
    430   1.1  tshiozak }
    431   1.1  tshiozak 
    432   1.1  tshiozak static __inline int
    433   1.1  tshiozak /*ARGSUSED*/
    434   1.1  tshiozak _citrus_UTF1632_stdenc_wctocs(_UTF1632EncodingInfo * __restrict ei,
    435   1.1  tshiozak 			      _csid_t * __restrict csid,
    436   1.1  tshiozak 			      _index_t * __restrict idx,
    437   1.1  tshiozak 			      _wc_t wc)
    438   1.1  tshiozak {
    439   1.1  tshiozak 
    440   1.1  tshiozak 	_DIAGASSERT(csid != NULL && idx != NULL);
    441   1.1  tshiozak 
    442   1.1  tshiozak 	*csid = 0;
    443   1.1  tshiozak 	*idx = (_index_t)wc;
    444   1.1  tshiozak 
    445   1.1  tshiozak 	return (0);
    446   1.1  tshiozak }
    447   1.1  tshiozak 
    448   1.1  tshiozak static __inline int
    449   1.1  tshiozak /*ARGSUSED*/
    450   1.1  tshiozak _citrus_UTF1632_stdenc_cstowc(_UTF1632EncodingInfo * __restrict ei,
    451   1.1  tshiozak 			      _wc_t * __restrict wc,
    452   1.1  tshiozak 			      _csid_t csid, _index_t idx)
    453   1.1  tshiozak {
    454   1.1  tshiozak 
    455   1.1  tshiozak 	_DIAGASSERT(wc != NULL);
    456   1.1  tshiozak 
    457   1.1  tshiozak 	if (csid != 0)
    458   1.1  tshiozak 		return (EILSEQ);
    459   1.1  tshiozak 
    460   1.1  tshiozak 	*wc = (_wc_t)idx;
    461   1.1  tshiozak 
    462   1.1  tshiozak 	return (0);
    463   1.1  tshiozak }
    464   1.1  tshiozak 
    465   1.4  tshiozak static __inline int
    466   1.4  tshiozak /*ARGSUSED*/
    467   1.4  tshiozak _citrus_UTF1632_stdenc_get_state_desc_generic(_UTF1632EncodingInfo * __restrict ei,
    468   1.4  tshiozak 					      _UTF1632State * __restrict psenc,
    469   1.4  tshiozak 					      int * __restrict rstate)
    470   1.4  tshiozak {
    471   1.4  tshiozak 
    472   1.4  tshiozak 	if (psenc->chlen == 0)
    473   1.4  tshiozak 		*rstate = _STDENC_SDGEN_INITIAL;
    474   1.4  tshiozak 	else
    475   1.4  tshiozak 		*rstate = _STDENC_SDGEN_INCOMPLETE_CHAR;
    476   1.4  tshiozak 
    477   1.4  tshiozak 	return 0;
    478   1.4  tshiozak }
    479   1.1  tshiozak 
    480   1.1  tshiozak /* ----------------------------------------------------------------------
    481   1.1  tshiozak  * public interface for stdenc
    482   1.1  tshiozak  */
    483   1.1  tshiozak 
    484   1.1  tshiozak _CITRUS_STDENC_DECLS(UTF1632);
    485   1.1  tshiozak _CITRUS_STDENC_DEF_OPS(UTF1632);
    486   1.1  tshiozak 
    487   1.1  tshiozak #include "citrus_stdenc_template.h"
    488