citrus_big5.c revision 1.10 1 1.10 tnozaki /* $NetBSD: citrus_big5.c,v 1.10 2006/06/19 17:28:24 tnozaki Exp $ */
2 1.1 tshiozak
3 1.1 tshiozak /*-
4 1.10 tnozaki * Copyright (c)2002, 2006 Citrus Project,
5 1.1 tshiozak * All rights reserved.
6 1.1 tshiozak *
7 1.1 tshiozak * Redistribution and use in source and binary forms, with or without
8 1.1 tshiozak * modification, are permitted provided that the following conditions
9 1.1 tshiozak * are met:
10 1.1 tshiozak * 1. Redistributions of source code must retain the above copyright
11 1.1 tshiozak * notice, this list of conditions and the following disclaimer.
12 1.1 tshiozak * 2. Redistributions in binary form must reproduce the above copyright
13 1.1 tshiozak * notice, this list of conditions and the following disclaimer in the
14 1.1 tshiozak * documentation and/or other materials provided with the distribution.
15 1.1 tshiozak *
16 1.1 tshiozak * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
17 1.1 tshiozak * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
18 1.1 tshiozak * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
19 1.1 tshiozak * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
20 1.1 tshiozak * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
21 1.1 tshiozak * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
22 1.1 tshiozak * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
23 1.1 tshiozak * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
24 1.1 tshiozak * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
25 1.1 tshiozak * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
26 1.1 tshiozak * SUCH DAMAGE.
27 1.1 tshiozak */
28 1.1 tshiozak
29 1.1 tshiozak /*-
30 1.1 tshiozak * Copyright (c) 1993
31 1.1 tshiozak * The Regents of the University of California. All rights reserved.
32 1.1 tshiozak *
33 1.1 tshiozak * This code is derived from software contributed to Berkeley by
34 1.1 tshiozak * Paul Borman at Krystal Technologies.
35 1.1 tshiozak *
36 1.1 tshiozak * Redistribution and use in source and binary forms, with or without
37 1.1 tshiozak * modification, are permitted provided that the following conditions
38 1.1 tshiozak * are met:
39 1.1 tshiozak * 1. Redistributions of source code must retain the above copyright
40 1.1 tshiozak * notice, this list of conditions and the following disclaimer.
41 1.1 tshiozak * 2. Redistributions in binary form must reproduce the above copyright
42 1.1 tshiozak * notice, this list of conditions and the following disclaimer in the
43 1.1 tshiozak * documentation and/or other materials provided with the distribution.
44 1.8 agc * 3. Neither the name of the University nor the names of its contributors
45 1.1 tshiozak * may be used to endorse or promote products derived from this software
46 1.1 tshiozak * without specific prior written permission.
47 1.1 tshiozak *
48 1.1 tshiozak * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
49 1.1 tshiozak * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
50 1.1 tshiozak * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
51 1.1 tshiozak * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
52 1.1 tshiozak * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
53 1.1 tshiozak * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
54 1.1 tshiozak * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
55 1.1 tshiozak * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
56 1.1 tshiozak * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
57 1.1 tshiozak * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
58 1.1 tshiozak * SUCH DAMAGE.
59 1.1 tshiozak */
60 1.1 tshiozak
61 1.1 tshiozak #include <sys/cdefs.h>
62 1.1 tshiozak #if defined(LIBC_SCCS) && !defined(lint)
63 1.10 tnozaki __RCSID("$NetBSD: citrus_big5.c,v 1.10 2006/06/19 17:28:24 tnozaki Exp $");
64 1.1 tshiozak #endif /* LIBC_SCCS and not lint */
65 1.1 tshiozak
66 1.10 tnozaki #include <sys/queue.h>
67 1.10 tnozaki #include <sys/types.h>
68 1.1 tshiozak #include <assert.h>
69 1.1 tshiozak #include <errno.h>
70 1.1 tshiozak #include <string.h>
71 1.10 tnozaki #include <stdint.h>
72 1.1 tshiozak #include <stdio.h>
73 1.1 tshiozak #include <stdlib.h>
74 1.1 tshiozak #include <stddef.h>
75 1.1 tshiozak #include <locale.h>
76 1.1 tshiozak #include <wchar.h>
77 1.1 tshiozak #include <limits.h>
78 1.6 tshiozak
79 1.6 tshiozak #include "citrus_namespace.h"
80 1.6 tshiozak #include "citrus_types.h"
81 1.10 tnozaki #include "citrus_bcs.h"
82 1.1 tshiozak #include "citrus_module.h"
83 1.1 tshiozak #include "citrus_ctype.h"
84 1.6 tshiozak #include "citrus_stdenc.h"
85 1.1 tshiozak #include "citrus_big5.h"
86 1.1 tshiozak
/* ----------------------------------------------------------------------
 * private stuff used by templates
 */
90 1.1 tshiozak
/*
 * Conversion state for a BIG5 character that has only been partly read:
 * the bytes collected so far and how many of them are valid.
 */
typedef struct {
	char	ch[2];		/* pending bytes of the current character */
	int	chlen;		/* number of bytes currently held in ch[] */
} _BIG5State;
95 1.1 tshiozak
/*
 * One inclusive range [start, end] of wide-character values that the
 * encoding rejects.  Ranges are linked together on a tail queue.
 */
struct _BIG5Exclude {
	TAILQ_ENTRY(_BIG5Exclude) entry;	/* queue linkage */
	wint_t start;				/* first excluded value */
	wint_t end;				/* last excluded value */
};
typedef struct _BIG5Exclude _BIG5Exclude;

/* Head of the queue of excluded ranges. */
TAILQ_HEAD(_BIG5ExcludeList, _BIG5Exclude);
typedef struct _BIG5ExcludeList _BIG5ExcludeList;
102 1.10 tnozaki
103 1.1 tshiozak typedef struct {
104 1.10 tnozaki int cell[0x100];
105 1.10 tnozaki _BIG5ExcludeList excludes;
106 1.1 tshiozak } _BIG5EncodingInfo;
107 1.1 tshiozak
108 1.1 tshiozak typedef struct {
109 1.1 tshiozak _BIG5EncodingInfo ei;
110 1.1 tshiozak struct {
111 1.1 tshiozak /* for future multi-locale facility */
112 1.1 tshiozak _BIG5State s_mblen;
113 1.1 tshiozak _BIG5State s_mbrlen;
114 1.1 tshiozak _BIG5State s_mbrtowc;
115 1.1 tshiozak _BIG5State s_mbtowc;
116 1.1 tshiozak _BIG5State s_mbsrtowcs;
117 1.1 tshiozak _BIG5State s_wcrtomb;
118 1.1 tshiozak _BIG5State s_wcsrtombs;
119 1.1 tshiozak _BIG5State s_wctomb;
120 1.1 tshiozak } states;
121 1.1 tshiozak } _BIG5CTypeInfo;
122 1.1 tshiozak
/* Reach the encoding info / a named per-function state inside a ctype info. */
#define _CEI_TO_EI(_cei_)		(&(_cei_)->ei)
#define _CEI_TO_STATE(_cei_, _func_)	(_cei_)->states.s_##_func_

/* Names and properties describing this encoding to the template headers. */
#define _FUNCNAME(m)			_citrus_BIG5_##m
#define _ENCODING_INFO			_BIG5EncodingInfo
#define _CTYPE_INFO			_BIG5CTypeInfo
#define _ENCODING_STATE			_BIG5State
#define _ENCODING_MB_CUR_MAX(_ei_)	2	/* a character is 1 or 2 bytes */
#define _ENCODING_IS_STATE_DEPENDENT	0
#define _STATE_NEEDS_EXPLICIT_INIT(_ps_)	0
133 1.1 tshiozak
134 1.1 tshiozak
135 1.1 tshiozak static __inline void
136 1.1 tshiozak /*ARGSUSED*/
137 1.1 tshiozak _citrus_BIG5_init_state(_BIG5EncodingInfo * __restrict ei,
138 1.1 tshiozak _BIG5State * __restrict s)
139 1.1 tshiozak {
140 1.1 tshiozak memset(s, 0, sizeof(*s));
141 1.1 tshiozak }
142 1.1 tshiozak
143 1.1 tshiozak static __inline void
144 1.1 tshiozak /*ARGSUSED*/
145 1.1 tshiozak _citrus_BIG5_pack_state(_BIG5EncodingInfo * __restrict ei,
146 1.1 tshiozak void * __restrict pspriv,
147 1.1 tshiozak const _BIG5State * __restrict s)
148 1.1 tshiozak {
149 1.1 tshiozak memcpy(pspriv, (const void *)s, sizeof(*s));
150 1.1 tshiozak }
151 1.1 tshiozak
152 1.1 tshiozak static __inline void
153 1.1 tshiozak /*ARGSUSED*/
154 1.1 tshiozak _citrus_BIG5_unpack_state(_BIG5EncodingInfo * __restrict ei,
155 1.1 tshiozak _BIG5State * __restrict s,
156 1.1 tshiozak const void * __restrict pspriv)
157 1.1 tshiozak {
158 1.1 tshiozak memcpy((void *)s, pspriv, sizeof(*s));
159 1.1 tshiozak }
160 1.1 tshiozak
161 1.1 tshiozak static __inline int
162 1.10 tnozaki _citrus_BIG5_check(_BIG5EncodingInfo *ei, u_int c)
163 1.1 tshiozak {
164 1.10 tnozaki _DIAGASSERT(ei != NULL);
165 1.10 tnozaki
166 1.10 tnozaki return (ei->cell[c & 0xFF] & 0x1) ? 2 : 1;
167 1.1 tshiozak }
168 1.1 tshiozak
169 1.1 tshiozak static __inline int
170 1.10 tnozaki _citrus_BIG5_check2(_BIG5EncodingInfo *ei, u_int c)
171 1.10 tnozaki {
172 1.10 tnozaki _DIAGASSERT(ei != NULL);
173 1.10 tnozaki
174 1.10 tnozaki return (ei->cell[c & 0xFF] & 0x2) ? 1 : 0;
175 1.10 tnozaki }
176 1.10 tnozaki
177 1.10 tnozaki static __inline int
178 1.10 tnozaki _citrus_BIG5_check_excludes(_BIG5EncodingInfo *ei, wint_t c)
179 1.10 tnozaki {
180 1.10 tnozaki _BIG5Exclude *exclude;
181 1.10 tnozaki
182 1.10 tnozaki _DIAGASSERT(ei != NULL);
183 1.10 tnozaki
184 1.10 tnozaki TAILQ_FOREACH(exclude, &ei->excludes, entry) {
185 1.10 tnozaki if (c >= exclude->start && c <= exclude->end)
186 1.10 tnozaki return EILSEQ;
187 1.10 tnozaki }
188 1.10 tnozaki return 0;
189 1.10 tnozaki }
190 1.10 tnozaki
/*
 * _STRTOL_LEN(func, type, limit)
 *	Generates _prop_<func>_len(), a wrapper that applies the strtol-family
 *	function <func> to text that is bounded by a length instead of a NUL.
 *
 *	Leading whitespace is skipped with _bcs_skip_ws_len(), then at most
 *	<limit> bytes are copied into a NUL-terminated scratch buffer and
 *	converted there.  On success *result holds the value, *endptr (if not
 *	NULL) points just past the consumed text and *n is reduced by the
 *	number of bytes converted; the return value is 0.  If the conversion
 *	sets errno, that value is returned and errno itself is left as the
 *	caller had it.  If nothing remains after the whitespace, *result is 0,
 *	*endptr is s and 0 is returned.
 */
#define _STRTOL_LEN(_func_, _type_, _limit_)				\
static int								\
_prop_##_func_##_len(const char *s, size_t *n,				\
    char **endptr, int base, _type_ *result)				\
{									\
	char buf[(_limit_) + 1], *tail;					\
	const char *ptr;						\
	size_t siz;							\
	int save_errno, err;						\
									\
	_DIAGASSERT(s != NULL);						\
	_DIAGASSERT(n != NULL);						\
	/* endptr may be null */					\
	_DIAGASSERT(result != NULL);					\
									\
	ptr = _bcs_skip_ws_len(s, n);					\
	if (*n < 1) {							\
		*result = 0;						\
		if (endptr != NULL)					\
			*endptr = __UNCONST(s);				\
		return 0;						\
	}								\
									\
	/* copy no more than the scratch buffer can hold */		\
	siz = *n;							\
	if (siz > (_limit_))						\
		siz = (_limit_);					\
	memcpy(buf, ptr, siz);						\
	buf[siz] = '\0';						\
									\
	/* convert without disturbing the caller's errno */		\
	save_errno = errno;						\
	errno = 0;							\
	*result = _func_(buf, &tail, base);				\
	err = errno;							\
	errno = save_errno;						\
	if (err != 0)							\
		return (err);						\
									\
	siz = (size_t)(tail - buf);					\
	if (endptr != NULL)						\
		*endptr = __UNCONST(ptr + siz);				\
	*n -= siz;							\
	return 0;							\
}
_STRTOL_LEN(strtoul, unsigned long, 13)
231 1.10 tnozaki
/*
 * _PROP_READ_UINT(func, type, max)
 *	Generates _prop_read_<func>(), which reads one unsigned number from
 *	the length-bounded text (*s, *n) into *result.
 *
 *	Returns 0 and advances *s / *n past the number on success, EINVAL if
 *	the conversion fails or no digits are present, and ERANGE if the
 *	value exceeds <max>.  *s and *n are left untouched on error.
 *
 *	Whitespace is skipped here before the start pointer is recorded.
 *	_prop_strtoul_len() skips whitespace itself and reports an end
 *	pointer relative to the first non-blank byte, so comparing against
 *	the unskipped pointer would fail to detect "no digits" whenever the
 *	text begins with blanks (e.g. "row = ;").
 */
#define _PROP_READ_UINT(_func_, _type_, _max_)				\
static int								\
_prop_read_##_func_(const char **s, size_t *n, _type_ *result)		\
{									\
	const char *s0;							\
	char *t;							\
	size_t n0;							\
	unsigned long l;						\
									\
	_DIAGASSERT(s != NULL);						\
	_DIAGASSERT(n != NULL);						\
	_DIAGASSERT(result != NULL);					\
									\
	n0 = *n;							\
	s0 = _bcs_skip_ws_len(*s, &n0);					\
	if (_prop_strtoul_len(s0, &n0, &t, 0, &l) != 0 ||		\
	    s0 == t)							\
		return EINVAL;						\
	if (l > (_max_))						\
		return ERANGE;						\
	*result = (_type_)l;						\
	*s = (const char *)t;						\
	*n = n0;							\
									\
	return 0;							\
}
_PROP_READ_UINT( u8,  uint8_t,  UINT8_MAX)
_PROP_READ_UINT(u16, uint16_t, UINT16_MAX)
260 1.10 tnozaki
/*
 * _PROP_HANDLE_TYPE_T(func, type)
 *	Declares _prop_handle_<func>_t: a callback that receives a context
 *	pointer, the key name and an inclusive (start, end) pair of <type>.
 */
#define _PROP_HANDLE_TYPE_T(_func_, _type_)				\
typedef int (*_prop_handle_##_func_##_t)				\
    (void *, const char *, _type_, _type_);
_PROP_HANDLE_TYPE_T( u8,  uint8_t)
_PROP_HANDLE_TYPE_T(u16, uint16_t)

typedef struct _prop_key_t _prop_key_t;

/* Declares one union member, named after the value type it handles. */
#define _PROP_HANDLE_TYPE_OPS(_func_)					\
	_prop_handle_##_func_##_t _func_

/* A callback for one key; the member in use is chosen by the key's type. */
typedef union {
	_PROP_HANDLE_TYPE_OPS( u8);
	_PROP_HANDLE_TYPE_OPS(u16);
} _prop_handler_t;

/* Value type accepted by a key. */
typedef enum {
	_PROP_U8,
	_PROP_U16,
} _prop_type_t;

/* One entry of a key table; a NULL name ends the table. */
struct _prop_key_t {
	const char	*name;		/* key as written in the variable */
	_prop_type_t	 type;		/* selects the handler member */
	_prop_handler_t	 handler;	/* called for every value or range */
};
286 1.10 tnozaki
287 1.10 tnozaki static int
288 1.10 tnozaki _prop_parse_variable(void *ctx, const char **s, size_t *n,
289 1.10 tnozaki const _prop_key_t *keys)
290 1.1 tshiozak {
291 1.10 tnozaki const char *s0, *s1;
292 1.10 tnozaki size_t n0, n1, nlen;
293 1.10 tnozaki const _prop_key_t *key;
294 1.10 tnozaki const _prop_handler_t *ptr;
295 1.10 tnozaki int ch0, ret;
296 1.10 tnozaki
297 1.10 tnozaki s0 = *s;
298 1.10 tnozaki n0 = *n;
299 1.10 tnozaki
300 1.10 tnozaki #define PARSE(_func_, _type_) \
301 1.10 tnozaki do { \
302 1.10 tnozaki _type_ x, y; \
303 1.10 tnozaki if (ptr->_func_ == NULL) \
304 1.10 tnozaki return EINVAL; \
305 1.10 tnozaki for (ch0 = 0; ch0 != ';';) { \
306 1.10 tnozaki ret = _prop_read_##_func_(&s0, &n0, &x); \
307 1.10 tnozaki if (ret != 0) \
308 1.10 tnozaki return ret; \
309 1.10 tnozaki s0 = _bcs_skip_ws_len(s0, &n0); \
310 1.10 tnozaki if (n0 < 1 || (ch0 = (int)*s0) == '\0') \
311 1.10 tnozaki return EINVAL; \
312 1.10 tnozaki if(ch0 == '-') { \
313 1.10 tnozaki ++s0, --n0; \
314 1.10 tnozaki ret = _prop_read_##_func_(&s0, &n0, &y);\
315 1.10 tnozaki if (ret != 0) \
316 1.10 tnozaki return ret; \
317 1.10 tnozaki if (x >= y) \
318 1.10 tnozaki return EINVAL; \
319 1.10 tnozaki } else \
320 1.10 tnozaki y = x; \
321 1.10 tnozaki s0 = _bcs_skip_ws_len(s0, &n0); \
322 1.10 tnozaki if (n0 < 1) \
323 1.10 tnozaki return EINVAL; \
324 1.10 tnozaki ch0 = (int)*s0; \
325 1.10 tnozaki if (ch0 != ',' && ch0 != ';') \
326 1.10 tnozaki return EINVAL; \
327 1.10 tnozaki ++s0, --n0; \
328 1.10 tnozaki _DIAGASSERT(ctx != NULL); \
329 1.10 tnozaki ret = (*ptr->_func_)(ctx, key->name, x, y); \
330 1.10 tnozaki if (ret != 0) \
331 1.10 tnozaki return ret; \
332 1.10 tnozaki } \
333 1.10 tnozaki } while (/*CONSTCOND*/0)
334 1.10 tnozaki
335 1.10 tnozaki for (;;) {
336 1.10 tnozaki s0 = _bcs_skip_ws_len(s0, &n0);
337 1.10 tnozaki if (n0 < 1 || *s0 == '\0')
338 1.10 tnozaki break;
339 1.10 tnozaki for (key = keys; key->name != NULL; ++key) {
340 1.10 tnozaki s1 = s0, n1 = n0;
341 1.10 tnozaki nlen = strlen(key->name);
342 1.10 tnozaki if (n1 <= nlen || strncmp(s1, key->name, nlen) != 0)
343 1.10 tnozaki continue;
344 1.10 tnozaki s1 += nlen, n1 -= nlen;
345 1.10 tnozaki s1 = _bcs_skip_ws_len(s1, &n1);
346 1.10 tnozaki if (n1 < 1)
347 1.10 tnozaki continue;
348 1.10 tnozaki ptr = (const _prop_handler_t *)&key->handler;
349 1.10 tnozaki if (*s1 == '=') {
350 1.10 tnozaki s0 = ++s1, n0 = --n1;
351 1.10 tnozaki switch (key->type) {
352 1.10 tnozaki case _PROP_U8:
353 1.10 tnozaki PARSE( u8, uint8_t);
354 1.10 tnozaki break;
355 1.10 tnozaki case _PROP_U16:
356 1.10 tnozaki PARSE(u16, uint16_t);
357 1.10 tnozaki break;
358 1.10 tnozaki default:
359 1.10 tnozaki goto invalid;
360 1.10 tnozaki }
361 1.10 tnozaki break;
362 1.10 tnozaki }
363 1.10 tnozaki }
364 1.10 tnozaki if (key->name == NULL)
365 1.10 tnozaki goto invalid;
366 1.10 tnozaki }
367 1.10 tnozaki *s = s0;
368 1.10 tnozaki *n = n0;
369 1.10 tnozaki
370 1.10 tnozaki return 0;
371 1.10 tnozaki
372 1.10 tnozaki invalid:
373 1.10 tnozaki return EINVAL;
374 1.10 tnozaki }
375 1.10 tnozaki
376 1.10 tnozaki static int
377 1.10 tnozaki _citrus_BIG5_fill_rowcol(void * __restrict ctx, const char * __restrict s,
378 1.10 tnozaki uint8_t start, uint8_t end)
379 1.10 tnozaki {
380 1.10 tnozaki _BIG5EncodingInfo *ei;
381 1.10 tnozaki int i;
382 1.10 tnozaki uint8_t n;
383 1.10 tnozaki
384 1.10 tnozaki _DIAGASSERT(ctx != NULL);
385 1.10 tnozaki
386 1.10 tnozaki ei = (_BIG5EncodingInfo *)ctx;
387 1.10 tnozaki i = strcmp("row", s) ? 1 : 0;
388 1.10 tnozaki i = 1 << i;
389 1.10 tnozaki for (n = start; n <= end; ++n)
390 1.10 tnozaki ei->cell[n & 0xFF] |= i;
391 1.10 tnozaki return 0;
392 1.1 tshiozak }
393 1.1 tshiozak
394 1.1 tshiozak static int
395 1.1 tshiozak /*ARGSUSED*/
396 1.10 tnozaki _citrus_BIG5_fill_excludes(void * __restrict ctx, const char * __restrict s,
397 1.10 tnozaki uint16_t start, uint16_t end)
398 1.1 tshiozak {
399 1.10 tnozaki _BIG5EncodingInfo *ei;
400 1.10 tnozaki _BIG5Exclude *exclude;
401 1.10 tnozaki
402 1.10 tnozaki _DIAGASSERT(ctx != NULL);
403 1.1 tshiozak
404 1.10 tnozaki ei = (_BIG5EncodingInfo *)ctx;
405 1.10 tnozaki exclude = TAILQ_LAST(&ei->excludes, _BIG5ExcludeList);
406 1.10 tnozaki if (exclude != NULL && (wint_t)start <= exclude->end)
407 1.10 tnozaki return EINVAL;
408 1.10 tnozaki exclude = (void *)malloc(sizeof(*exclude));
409 1.10 tnozaki if (exclude == NULL)
410 1.10 tnozaki return ENOMEM;
411 1.10 tnozaki exclude->start = (wint_t)start;
412 1.10 tnozaki exclude->end = (wint_t)end;
413 1.10 tnozaki TAILQ_INSERT_TAIL(&ei->excludes, exclude, entry);
414 1.1 tshiozak
415 1.10 tnozaki return 0;
416 1.1 tshiozak }
417 1.1 tshiozak
418 1.10 tnozaki static const _prop_key_t rootkeys[] = {
419 1.10 tnozaki { "row", _PROP_U8, { u8: &_citrus_BIG5_fill_rowcol } },
420 1.10 tnozaki { "col", _PROP_U8, { u8: &_citrus_BIG5_fill_rowcol } },
421 1.10 tnozaki { "excludes", _PROP_U16, { u16: &_citrus_BIG5_fill_excludes } },
422 1.10 tnozaki { NULL },
423 1.10 tnozaki };
424 1.10 tnozaki
425 1.1 tshiozak static void
426 1.1 tshiozak /*ARGSUSED*/
427 1.6 tshiozak _citrus_BIG5_encoding_module_uninit(_BIG5EncodingInfo *ei)
428 1.1 tshiozak {
429 1.10 tnozaki _BIG5Exclude *exclude;
430 1.10 tnozaki
431 1.10 tnozaki _DIAGASSERT(ei != NULL);
432 1.10 tnozaki
433 1.10 tnozaki while ((exclude = TAILQ_FIRST(&ei->excludes)) != NULL) {
434 1.10 tnozaki TAILQ_REMOVE(&ei->excludes, exclude, entry);
435 1.10 tnozaki free(exclude);
436 1.10 tnozaki }
437 1.10 tnozaki }
438 1.10 tnozaki
439 1.10 tnozaki static int
440 1.10 tnozaki /*ARGSUSED*/
441 1.10 tnozaki _citrus_BIG5_encoding_module_init(_BIG5EncodingInfo * __restrict ei,
442 1.10 tnozaki const void * __restrict var, size_t lenvar)
443 1.10 tnozaki {
444 1.10 tnozaki int err;
445 1.10 tnozaki const char *s;
446 1.10 tnozaki
447 1.10 tnozaki _DIAGASSERT(ei != NULL);
448 1.10 tnozaki
449 1.10 tnozaki memset((void *)ei, 0, sizeof(*ei));
450 1.10 tnozaki TAILQ_INIT(&ei->excludes);
451 1.10 tnozaki
452 1.10 tnozaki if (lenvar > 0 && var != NULL) {
453 1.10 tnozaki s = _bcs_skip_ws_len((const char *)var, &lenvar);
454 1.10 tnozaki if (lenvar > 0 && *s != '\0') {
455 1.10 tnozaki err = _prop_parse_variable(ei, &s, &lenvar, rootkeys);
456 1.10 tnozaki if (err == 0)
457 1.10 tnozaki return 0;
458 1.10 tnozaki
459 1.10 tnozaki _citrus_BIG5_encoding_module_uninit(ei);
460 1.10 tnozaki memset((void *)ei, 0, sizeof(*ei));
461 1.10 tnozaki TAILQ_INIT(&ei->excludes);
462 1.10 tnozaki }
463 1.10 tnozaki }
464 1.10 tnozaki
465 1.10 tnozaki /* fallback Big5-1984, for backward compatibility. */
466 1.10 tnozaki _citrus_BIG5_fill_rowcol(ei, "row", 0xA1, 0xFE);
467 1.10 tnozaki _citrus_BIG5_fill_rowcol(ei, "col", 0x40, 0x7E);
468 1.10 tnozaki _citrus_BIG5_fill_rowcol(ei, "col", 0xA1, 0xFE);
469 1.10 tnozaki
470 1.10 tnozaki return 0;
471 1.1 tshiozak }
472 1.1 tshiozak
473 1.1 tshiozak static int
474 1.1 tshiozak /*ARGSUSED*/
475 1.1 tshiozak _citrus_BIG5_mbrtowc_priv(_BIG5EncodingInfo * __restrict ei,
476 1.1 tshiozak wchar_t * __restrict pwc,
477 1.1 tshiozak const char ** __restrict s, size_t n,
478 1.1 tshiozak _BIG5State * __restrict psenc,
479 1.1 tshiozak size_t * __restrict nresult)
480 1.1 tshiozak {
481 1.1 tshiozak wchar_t wchar;
482 1.1 tshiozak int c;
483 1.1 tshiozak int chlenbak;
484 1.1 tshiozak const char *s0;
485 1.1 tshiozak
486 1.1 tshiozak _DIAGASSERT(nresult != 0);
487 1.1 tshiozak _DIAGASSERT(ei != NULL);
488 1.1 tshiozak _DIAGASSERT(psenc != NULL);
489 1.1 tshiozak _DIAGASSERT(s != NULL && *s != NULL);
490 1.1 tshiozak
491 1.1 tshiozak s0 = *s;
492 1.1 tshiozak
493 1.1 tshiozak if (s0 == NULL) {
494 1.1 tshiozak _citrus_BIG5_init_state(ei, psenc);
495 1.1 tshiozak *nresult = 0;
496 1.1 tshiozak return (0);
497 1.1 tshiozak }
498 1.1 tshiozak
499 1.1 tshiozak chlenbak = psenc->chlen;
500 1.1 tshiozak
501 1.1 tshiozak /* make sure we have the first byte in the buffer */
502 1.1 tshiozak switch (psenc->chlen) {
503 1.1 tshiozak case 0:
504 1.1 tshiozak if (n < 1)
505 1.1 tshiozak goto restart;
506 1.1 tshiozak psenc->ch[0] = *s0++;
507 1.1 tshiozak psenc->chlen = 1;
508 1.1 tshiozak n--;
509 1.1 tshiozak break;
510 1.1 tshiozak case 1:
511 1.1 tshiozak break;
512 1.1 tshiozak default:
513 1.1 tshiozak /* illegal state */
514 1.1 tshiozak goto ilseq;
515 1.1 tshiozak }
516 1.1 tshiozak
517 1.10 tnozaki c = _citrus_BIG5_check(ei, psenc->ch[0] & 0xff);
518 1.1 tshiozak if (c == 0)
519 1.1 tshiozak goto ilseq;
520 1.1 tshiozak while (psenc->chlen < c) {
521 1.1 tshiozak if (n < 1) {
522 1.1 tshiozak goto restart;
523 1.1 tshiozak }
524 1.1 tshiozak psenc->ch[psenc->chlen] = *s0++;
525 1.1 tshiozak psenc->chlen++;
526 1.1 tshiozak n--;
527 1.1 tshiozak }
528 1.1 tshiozak
529 1.1 tshiozak switch (c) {
530 1.1 tshiozak case 1:
531 1.1 tshiozak wchar = psenc->ch[0] & 0xff;
532 1.1 tshiozak break;
533 1.1 tshiozak case 2:
534 1.10 tnozaki if (!_citrus_BIG5_check2(ei, psenc->ch[1] & 0xff))
535 1.1 tshiozak goto ilseq;
536 1.1 tshiozak wchar = ((psenc->ch[0] & 0xff) << 8) | (psenc->ch[1] & 0xff);
537 1.1 tshiozak break;
538 1.1 tshiozak default:
539 1.1 tshiozak /* illegal state */
540 1.1 tshiozak goto ilseq;
541 1.1 tshiozak }
542 1.1 tshiozak
543 1.10 tnozaki if (_citrus_BIG5_check_excludes(ei, (wint_t)wchar) != 0)
544 1.10 tnozaki goto ilseq;
545 1.10 tnozaki
546 1.1 tshiozak *s = s0;
547 1.1 tshiozak psenc->chlen = 0;
548 1.1 tshiozak if (pwc)
549 1.1 tshiozak *pwc = wchar;
550 1.1 tshiozak if (!wchar)
551 1.1 tshiozak *nresult = 0;
552 1.1 tshiozak else
553 1.1 tshiozak *nresult = c - chlenbak;
554 1.1 tshiozak
555 1.1 tshiozak return (0);
556 1.1 tshiozak
557 1.1 tshiozak ilseq:
558 1.1 tshiozak psenc->chlen = 0;
559 1.1 tshiozak *nresult = (size_t)-1;
560 1.1 tshiozak return (EILSEQ);
561 1.1 tshiozak
562 1.1 tshiozak restart:
563 1.1 tshiozak *s = s0;
564 1.1 tshiozak *nresult = (size_t)-2;
565 1.1 tshiozak return (0);
566 1.1 tshiozak }
567 1.1 tshiozak
568 1.1 tshiozak static int
569 1.1 tshiozak /*ARGSUSED*/
570 1.1 tshiozak _citrus_BIG5_wcrtomb_priv(_BIG5EncodingInfo * __restrict ei,
571 1.1 tshiozak char * __restrict s,
572 1.1 tshiozak size_t n, wchar_t wc, _BIG5State * __restrict psenc,
573 1.1 tshiozak size_t * __restrict nresult)
574 1.1 tshiozak {
575 1.6 tshiozak int l, ret;
576 1.1 tshiozak
577 1.1 tshiozak _DIAGASSERT(ei != NULL);
578 1.1 tshiozak _DIAGASSERT(nresult != 0);
579 1.1 tshiozak _DIAGASSERT(s != NULL);
580 1.6 tshiozak
581 1.1 tshiozak /* check invalid sequence */
582 1.10 tnozaki if (wc & ~0xffff ||
583 1.10 tnozaki _citrus_BIG5_check_excludes(ei, (wint_t)wc) != 0) {
584 1.6 tshiozak ret = EILSEQ;
585 1.6 tshiozak goto err;
586 1.6 tshiozak }
587 1.1 tshiozak
588 1.1 tshiozak if (wc & 0x8000) {
589 1.10 tnozaki if (_citrus_BIG5_check(ei, (wc >> 8) & 0xff) != 2 ||
590 1.10 tnozaki !_citrus_BIG5_check2(ei, wc & 0xff)) {
591 1.6 tshiozak ret = EILSEQ;
592 1.6 tshiozak goto err;
593 1.6 tshiozak }
594 1.1 tshiozak l = 2;
595 1.1 tshiozak } else {
596 1.10 tnozaki if (wc & ~0xff || !_citrus_BIG5_check(ei, wc & 0xff)) {
597 1.6 tshiozak ret = EILSEQ;
598 1.6 tshiozak goto err;
599 1.6 tshiozak }
600 1.1 tshiozak l = 1;
601 1.1 tshiozak }
602 1.1 tshiozak
603 1.1 tshiozak if (n < l) {
604 1.1 tshiozak /* bound check failure */
605 1.6 tshiozak ret = E2BIG;
606 1.6 tshiozak goto err;
607 1.1 tshiozak }
608 1.1 tshiozak
609 1.1 tshiozak if (l == 2) {
610 1.1 tshiozak s[0] = (wc >> 8) & 0xff;
611 1.1 tshiozak s[1] = wc & 0xff;
612 1.1 tshiozak } else
613 1.1 tshiozak s[0] = wc & 0xff;
614 1.1 tshiozak
615 1.1 tshiozak *nresult = l;
616 1.1 tshiozak
617 1.6 tshiozak return 0;
618 1.1 tshiozak
619 1.6 tshiozak err:
620 1.1 tshiozak *nresult = (size_t)-1;
621 1.6 tshiozak return ret;
622 1.6 tshiozak }
623 1.6 tshiozak
624 1.6 tshiozak static __inline int
625 1.6 tshiozak /*ARGSUSED*/
626 1.6 tshiozak _citrus_BIG5_stdenc_wctocs(_BIG5EncodingInfo * __restrict ei,
627 1.6 tshiozak _csid_t * __restrict csid,
628 1.6 tshiozak _index_t * __restrict idx, wchar_t wc)
629 1.6 tshiozak {
630 1.6 tshiozak
631 1.6 tshiozak _DIAGASSERT(csid != NULL && idx != NULL);
632 1.6 tshiozak
633 1.10 tnozaki *csid = (wc < 0x100) ? 0 : 1;
634 1.6 tshiozak *idx = (_index_t)wc;
635 1.9 tshiozak
636 1.6 tshiozak return 0;
637 1.1 tshiozak }
638 1.1 tshiozak
639 1.6 tshiozak static __inline int
640 1.6 tshiozak /*ARGSUSED*/
641 1.6 tshiozak _citrus_BIG5_stdenc_cstowc(_BIG5EncodingInfo * __restrict ei,
642 1.6 tshiozak wchar_t * __restrict wc,
643 1.6 tshiozak _csid_t csid, _index_t idx)
644 1.6 tshiozak {
645 1.6 tshiozak _DIAGASSERT(wc != NULL);
646 1.6 tshiozak
647 1.6 tshiozak switch (csid) {
648 1.6 tshiozak case 0:
649 1.6 tshiozak case 1:
650 1.6 tshiozak *wc = (wchar_t)idx;
651 1.6 tshiozak break;
652 1.6 tshiozak default:
653 1.6 tshiozak return EILSEQ;
654 1.6 tshiozak }
655 1.6 tshiozak
656 1.6 tshiozak return 0;
657 1.6 tshiozak }
658 1.1 tshiozak
659 1.9 tshiozak static __inline int
660 1.9 tshiozak /*ARGSUSED*/
661 1.9 tshiozak _citrus_BIG5_stdenc_get_state_desc_generic(_BIG5EncodingInfo * __restrict ei,
662 1.9 tshiozak _BIG5State * __restrict psenc,
663 1.9 tshiozak int * __restrict rstate)
664 1.9 tshiozak {
665 1.9 tshiozak
666 1.9 tshiozak if (psenc->chlen == 0)
667 1.9 tshiozak *rstate = _STDENC_SDGEN_INITIAL;
668 1.9 tshiozak else
669 1.9 tshiozak *rstate = _STDENC_SDGEN_INCOMPLETE_CHAR;
670 1.9 tshiozak
671 1.9 tshiozak return 0;
672 1.9 tshiozak }
673 1.9 tshiozak
674 1.1 tshiozak /* ----------------------------------------------------------------------
675 1.1 tshiozak * public interface for ctype
676 1.1 tshiozak */
677 1.1 tshiozak
678 1.1 tshiozak _CITRUS_CTYPE_DECLS(BIG5);
679 1.1 tshiozak _CITRUS_CTYPE_DEF_OPS(BIG5);
680 1.1 tshiozak
681 1.1 tshiozak #include "citrus_ctype_template.h"
682 1.6 tshiozak
683 1.6 tshiozak
684 1.6 tshiozak /* ----------------------------------------------------------------------
685 1.6 tshiozak * public interface for stdenc
686 1.6 tshiozak */
687 1.6 tshiozak
688 1.6 tshiozak _CITRUS_STDENC_DECLS(BIG5);
689 1.6 tshiozak _CITRUS_STDENC_DEF_OPS(BIG5);
690 1.6 tshiozak
691 1.6 tshiozak #include "citrus_stdenc_template.h"
692