citrus_utf7.c revision 1.6 1 1.6 joerg /* $NetBSD: citrus_utf7.c,v 1.6 2013/05/28 16:57:56 joerg Exp $ */
2 1.1 tnozaki
3 1.1 tnozaki /*-
4 1.1 tnozaki * Copyright (c)2004, 2005 Citrus Project,
5 1.1 tnozaki * All rights reserved.
6 1.1 tnozaki *
7 1.1 tnozaki * Redistribution and use in source and binary forms, with or without
8 1.1 tnozaki * modification, are permitted provided that the following conditions
9 1.1 tnozaki * are met:
10 1.1 tnozaki * 1. Redistributions of source code must retain the above copyright
11 1.1 tnozaki * notice, this list of conditions and the following disclaimer.
12 1.1 tnozaki * 2. Redistributions in binary form must reproduce the above copyright
13 1.1 tnozaki * notice, this list of conditions and the following disclaimer in the
14 1.1 tnozaki * documentation and/or other materials provided with the distribution.
15 1.1 tnozaki *
16 1.1 tnozaki * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
17 1.1 tnozaki * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
18 1.1 tnozaki * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
19 1.1 tnozaki * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
20 1.1 tnozaki * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
21 1.1 tnozaki * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
22 1.1 tnozaki * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
23 1.1 tnozaki * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
24 1.1 tnozaki * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
25 1.1 tnozaki * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
26 1.1 tnozaki * SUCH DAMAGE.
27 1.1 tnozaki *
28 1.1 tnozaki */
29 1.1 tnozaki
30 1.1 tnozaki #include <sys/cdefs.h>
31 1.1 tnozaki #if defined(LIB_SCCS) && !defined(lint)
32 1.6 joerg __RCSID("$NetBSD: citrus_utf7.c,v 1.6 2013/05/28 16:57:56 joerg Exp $");
33 1.1 tnozaki #endif /* LIB_SCCS and not lint */
34 1.1 tnozaki
35 1.1 tnozaki #include <assert.h>
36 1.1 tnozaki #include <errno.h>
37 1.1 tnozaki #include <string.h>
38 1.1 tnozaki #include <stdio.h>
39 1.1 tnozaki #include <stdint.h>
40 1.1 tnozaki #include <stdlib.h>
41 1.1 tnozaki #include <limits.h>
42 1.1 tnozaki #include <wchar.h>
43 1.1 tnozaki
44 1.1 tnozaki #include "citrus_namespace.h"
45 1.1 tnozaki #include "citrus_types.h"
46 1.1 tnozaki #include "citrus_module.h"
47 1.1 tnozaki #include "citrus_ctype.h"
48 1.1 tnozaki #include "citrus_stdenc.h"
49 1.1 tnozaki #include "citrus_utf7.h"
50 1.1 tnozaki
51 1.1 tnozaki /* ----------------------------------------------------------------------
52 1.1 tnozaki * private stuffs used by templates
53 1.1 tnozaki */
54 1.1 tnozaki
/*
 * Bit layout of one _UTF7EncodingInfo cell.
 *
 * EI_MASK selects the low byte, which stores the character's position in
 * the base64 alphabet plus one (zero means "not a base64 character").
 * The remaining flags record which character table listed the character.
 */
#define EI_MASK		UINT16_C(0xff)
#define EI_DIRECT	UINT16_C(0x100)
#define EI_OPTION	UINT16_C(0x200)
#define EI_SPACE	UINT16_C(0x400)

/* Classification table indexed by a 7-bit character code. */
typedef struct {
	uint16_t	cell[0x80];
} _UTF7EncodingInfo;
62 1.1 tnozaki
/*
 * Conversion state shared by the decoder and the encoder.
 *
 * The four bit-fields are declared in the same order and with the same
 * widths as before, so the object layout is unchanged.
 */
typedef struct {
	unsigned int	mode: 1;	/* non-zero while inside a base64 run */
	unsigned int	bits: 4;	/* pending bit count, 0 - 15 */
	unsigned int	cache: 22;	/* 22 = BASE64_BIT + UTF16_BIT */
	unsigned int	surrogate: 1;	/* a high surrogate is pending */
	int		chlen;		/* number of bytes held in ch[] */
	/*
	 * Room for BASE64_IN plus three base64 characters: 3 * 6 = 18 is
	 * the smallest multiple of BASE64_BIT that covers UTF16_BIT.
	 */
	char		ch[4];
} _UTF7State;
72 1.1 tnozaki
73 1.1 tnozaki typedef struct {
74 1.1 tnozaki _UTF7EncodingInfo ei;
75 1.1 tnozaki struct {
76 1.1 tnozaki /* for future multi-locale facility */
77 1.1 tnozaki _UTF7State s_mblen;
78 1.1 tnozaki _UTF7State s_mbrlen;
79 1.1 tnozaki _UTF7State s_mbrtowc;
80 1.1 tnozaki _UTF7State s_mbtowc;
81 1.1 tnozaki _UTF7State s_mbsrtowcs;
82 1.6 joerg _UTF7State s_mbsnrtowcs;
83 1.1 tnozaki _UTF7State s_wcrtomb;
84 1.1 tnozaki _UTF7State s_wcsrtombs;
85 1.6 joerg _UTF7State s_wcsnrtombs;
86 1.1 tnozaki _UTF7State s_wctomb;
87 1.1 tnozaki } states;
88 1.1 tnozaki } _UTF7CTypeInfo;
89 1.1 tnozaki
/* Accessors from the ctype info to its encoding table and its states. */
#define _CEI_TO_EI(_cei_)		(&(_cei_)->ei)
#define _CEI_TO_STATE(_cei_, _func_)	(_cei_)->states.s_##_func_

/* Names and properties consumed by the template headers included below. */
#define _FUNCNAME(m)			_citrus_UTF7_##m
#define _ENCODING_INFO			_UTF7EncodingInfo
#define _CTYPE_INFO			_UTF7CTypeInfo
#define _ENCODING_STATE			_UTF7State
/*
 * NOTE(review): the encoder in this file can emit BASE64_IN followed by
 * five base64 characters for one character outside the BMP, i.e. more
 * than 4 bytes -- confirm that 4 is the intended value here.
 */
#define _ENCODING_MB_CUR_MAX(_ei_)	4
#define _ENCODING_IS_STATE_DEPENDENT	1
#define _STATE_NEEDS_EXPLICIT_INIT(_ps_)	0
100 1.1 tnozaki
101 1.1 tnozaki static __inline void
102 1.1 tnozaki /*ARGSUSED*/
103 1.1 tnozaki _citrus_UTF7_init_state(_UTF7EncodingInfo * __restrict ei,
104 1.1 tnozaki _UTF7State * __restrict s)
105 1.1 tnozaki {
106 1.1 tnozaki /* ei appears to be unused */
107 1.1 tnozaki _DIAGASSERT(s != NULL);
108 1.1 tnozaki
109 1.1 tnozaki memset((void *)s, 0, sizeof(*s));
110 1.1 tnozaki }
111 1.1 tnozaki
112 1.1 tnozaki static __inline void
113 1.1 tnozaki /*ARGSUSED*/
114 1.1 tnozaki _citrus_UTF7_pack_state(_UTF7EncodingInfo * __restrict ei,
115 1.1 tnozaki void *__restrict pspriv, const _UTF7State * __restrict s)
116 1.1 tnozaki {
117 1.1 tnozaki /* ei seem to be unused */
118 1.1 tnozaki _DIAGASSERT(pspriv != NULL);
119 1.1 tnozaki _DIAGASSERT(s != NULL);
120 1.1 tnozaki
121 1.1 tnozaki memcpy(pspriv, (const void *)s, sizeof(*s));
122 1.1 tnozaki }
123 1.1 tnozaki
124 1.1 tnozaki static __inline void
125 1.1 tnozaki /*ARGSUSED*/
126 1.1 tnozaki _citrus_UTF7_unpack_state(_UTF7EncodingInfo * __restrict ei,
127 1.1 tnozaki _UTF7State * __restrict s, const void * __restrict pspriv)
128 1.1 tnozaki {
129 1.1 tnozaki /* ei seem to be unused */
130 1.1 tnozaki _DIAGASSERT(s != NULL);
131 1.1 tnozaki _DIAGASSERT(pspriv != NULL);
132 1.1 tnozaki
133 1.1 tnozaki memcpy((void *)s, pspriv, sizeof(*s));
134 1.1 tnozaki }
135 1.1 tnozaki
/* The 64-character alphabet used inside base64 runs, in value order. */
static const char base64[] =
    "ABCDEFGHIJKLMNOPQRSTUVWXYZ"
    "abcdefghijklmnopqrstuvwxyz"
    "0123456789+/";

/*
 * Characters flagged EI_DIRECT: accepted as themselves by the decoder
 * and written as themselves by the encoder.
 */
static const char direct[] =
    "ABCDEFGHIJKLMNOPQRSTUVWXYZ"
    "abcdefghijklmnopqrstuvwxyz"
    "0123456789(),-./:?";

/*
 * Characters flagged EI_OPTION: accepted as themselves by the decoder,
 * but the encoder still writes them in base64.
 *
 * '*' is one of the RFC 2152 "optional direct" characters; it used to be
 * missing from every table, so a literal '*' in the input was rejected
 * as an illegal sequence.  The apostrophe stays in this table so encoder
 * output does not change.
 */
static const char option[] = "!\"#$%&'*;<=>@[]^_`{|}";

/* Characters flagged EI_SPACE: handled like the direct characters. */
static const char spaces[] = " \t\r\n";
148 1.1 tnozaki
/* Widths, in bits, of one base64 character and of one UTF-16 unit. */
#define BASE64_BIT	6
#define UTF16_BIT	16

/* Largest values of a base64 digit, a UTF-16 unit and a code point. */
#define BASE64_MAX	0x3f
#define UTF16_MAX	UINT16_C(0xffff)
#define UTF32_MAX	UINT32_C(0x10ffff)

/* Characters that open and close a base64 run. */
#define BASE64_IN	'+'
#define BASE64_OUT	'-'

/* Non-zero when c does not fit in seven bits. */
#define SHIFT7BIT(c)	((c) >> 7)
/* NUL and the shift-in character are always treated as direct. */
#define ISSPECIAL(c)	((c) == '\0' || (c) == BASE64_IN)

/* Value of base64 character c (0 - 63), or -1 if c is not one. */
#define FINDLEN(ei, c) \
	(SHIFT7BIT((c)) ? -1 : (((ei)->cell[(c)] & EI_MASK) - 1))

/*
 * Decoder test: may c appear as itself outside a base64 run?
 * Both arguments are fully parenthesised so that any expression can be
 * passed for ei, matching FINDLEN above.
 */
#define ISDIRECT(ei, c)	(!SHIFT7BIT((c)) && (ISSPECIAL((c)) || \
	((ei)->cell[(c)] & (EI_DIRECT | EI_OPTION | EI_SPACE))))

/*
 * Encoder test: may c be written as itself?  Unlike ISDIRECT this
 * excludes the EI_OPTION characters.
 */
#define ISSAFE(ei, c)	(!SHIFT7BIT((c)) && (ISSPECIAL((c)) || \
	((c) < 0x80 && ((ei)->cell[(c)] & (EI_DIRECT | EI_SPACE)))))

/* surrogate pair */
#define SRG_BASE	UINT32_C(0x10000)
#define HISRG_MIN	UINT16_C(0xd800)
#define HISRG_MAX	UINT16_C(0xdbff)
#define LOSRG_MIN	UINT16_C(0xdc00)
#define LOSRG_MAX	UINT16_C(0xdfff)
177 1.1 tnozaki
178 1.1 tnozaki static int
179 1.5 tnozaki _citrus_UTF7_mbtoutf16(_UTF7EncodingInfo * __restrict ei,
180 1.1 tnozaki uint16_t * __restrict u16, const char ** __restrict s, size_t n,
181 1.1 tnozaki _UTF7State * __restrict psenc, size_t * __restrict nresult)
182 1.1 tnozaki {
183 1.2 tnozaki _UTF7State sv;
184 1.1 tnozaki const char *s0;
185 1.1 tnozaki int i, done, len;
186 1.1 tnozaki
187 1.1 tnozaki _DIAGASSERT(ei != NULL);
188 1.1 tnozaki _DIAGASSERT(s != NULL && *s != NULL);
189 1.1 tnozaki _DIAGASSERT(psenc != NULL);
190 1.1 tnozaki
191 1.1 tnozaki s0 = *s;
192 1.2 tnozaki sv = *psenc;
193 1.1 tnozaki
194 1.1 tnozaki for (i = 0, done = 0; done == 0; i++) {
195 1.2 tnozaki _DIAGASSERT(i <= psenc->chlen);
196 1.2 tnozaki if (i == psenc->chlen) {
197 1.1 tnozaki if (n-- < 1) {
198 1.1 tnozaki *nresult = (size_t)-2;
199 1.1 tnozaki *s = s0;
200 1.2 tnozaki sv.chlen = psenc->chlen;
201 1.2 tnozaki *psenc = sv;
202 1.5 tnozaki return 0;
203 1.1 tnozaki }
204 1.2 tnozaki psenc->ch[psenc->chlen++] = *s0++;
205 1.1 tnozaki }
206 1.1 tnozaki if (SHIFT7BIT((int)psenc->ch[i]))
207 1.1 tnozaki goto ilseq;
208 1.2 tnozaki if (!psenc->mode) {
209 1.2 tnozaki if (psenc->bits > 0 || psenc->cache > 0)
210 1.5 tnozaki return EINVAL;
211 1.1 tnozaki if (psenc->ch[i] == BASE64_IN) {
212 1.2 tnozaki psenc->mode = 1;
213 1.1 tnozaki } else {
214 1.1 tnozaki if (!ISDIRECT(ei, (int)psenc->ch[i]))
215 1.1 tnozaki goto ilseq;
216 1.1 tnozaki *u16 = (uint16_t)psenc->ch[i];
217 1.1 tnozaki done = 1;
218 1.1 tnozaki continue;
219 1.1 tnozaki }
220 1.1 tnozaki } else {
221 1.2 tnozaki if (psenc->ch[i] == BASE64_OUT && psenc->cache == 0) {
222 1.2 tnozaki psenc->mode = 0;
223 1.1 tnozaki *u16 = (uint16_t)BASE64_IN;
224 1.1 tnozaki done = 1;
225 1.1 tnozaki continue;
226 1.1 tnozaki }
227 1.1 tnozaki len = FINDLEN(ei, (int)psenc->ch[i]);
228 1.1 tnozaki if (len < 0) {
229 1.2 tnozaki if (psenc->bits >= BASE64_BIT)
230 1.5 tnozaki return EINVAL;
231 1.2 tnozaki psenc->mode = 0;
232 1.2 tnozaki psenc->bits = psenc->cache = 0;
233 1.1 tnozaki if (psenc->ch[i] != BASE64_OUT) {
234 1.1 tnozaki if (!ISDIRECT(ei, (int)psenc->ch[i]))
235 1.1 tnozaki goto ilseq;
236 1.1 tnozaki *u16 = (uint16_t)psenc->ch[i];
237 1.1 tnozaki done = 1;
238 1.1 tnozaki }
239 1.1 tnozaki } else {
240 1.5 tnozaki psenc->cache =
241 1.5 tnozaki (psenc->cache << BASE64_BIT) | len;
242 1.2 tnozaki switch (psenc->bits) {
243 1.1 tnozaki case 0: case 2: case 4: case 6: case 8:
244 1.2 tnozaki psenc->bits += BASE64_BIT;
245 1.1 tnozaki break;
246 1.1 tnozaki case 10: case 12: case 14:
247 1.2 tnozaki psenc->bits -= (UTF16_BIT - BASE64_BIT);
248 1.2 tnozaki *u16 = (psenc->cache >> psenc->bits)
249 1.1 tnozaki & UTF16_MAX;
250 1.1 tnozaki done = 1;
251 1.1 tnozaki break;
252 1.1 tnozaki default:
253 1.5 tnozaki return EINVAL;
254 1.1 tnozaki }
255 1.1 tnozaki }
256 1.1 tnozaki }
257 1.1 tnozaki }
258 1.1 tnozaki
259 1.2 tnozaki if (psenc->chlen > i)
260 1.5 tnozaki return EINVAL;
261 1.2 tnozaki psenc->chlen = 0;
262 1.1 tnozaki *nresult = (size_t)((*u16 == 0) ? 0 : s0 - *s);
263 1.1 tnozaki *s = s0;
264 1.1 tnozaki
265 1.5 tnozaki return 0;
266 1.1 tnozaki
267 1.1 tnozaki ilseq:
268 1.1 tnozaki *nresult = (size_t)-1;
269 1.5 tnozaki return EILSEQ;
270 1.1 tnozaki }
271 1.1 tnozaki
272 1.1 tnozaki static int
273 1.1 tnozaki _citrus_UTF7_mbrtowc_priv(_UTF7EncodingInfo * __restrict ei,
274 1.1 tnozaki wchar_t * __restrict pwc, const char ** __restrict s, size_t n,
275 1.1 tnozaki _UTF7State * __restrict psenc, size_t * __restrict nresult)
276 1.1 tnozaki {
277 1.5 tnozaki const char *s0;
278 1.1 tnozaki uint32_t u32;
279 1.1 tnozaki uint16_t hi, lo;
280 1.5 tnozaki size_t siz, nr;
281 1.1 tnozaki int err;
282 1.1 tnozaki
283 1.1 tnozaki _DIAGASSERT(ei != NULL);
284 1.1 tnozaki /* pwc may be null */
285 1.1 tnozaki _DIAGASSERT(s != NULL);
286 1.1 tnozaki _DIAGASSERT(psenc != NULL);
287 1.1 tnozaki
288 1.1 tnozaki if (*s == NULL) {
289 1.1 tnozaki _citrus_UTF7_init_state(ei, psenc);
290 1.1 tnozaki *nresult = (size_t)_ENCODING_IS_STATE_DEPENDENT;
291 1.5 tnozaki return 0;
292 1.1 tnozaki }
293 1.5 tnozaki s0 = *s;
294 1.2 tnozaki if (psenc->surrogate) {
295 1.2 tnozaki hi = (psenc->cache >> 2) & UTF16_MAX;
296 1.5 tnozaki if (hi < HISRG_MIN || hi > HISRG_MAX)
297 1.5 tnozaki return EINVAL;
298 1.1 tnozaki siz = 0;
299 1.1 tnozaki } else {
300 1.5 tnozaki err = _citrus_UTF7_mbtoutf16(ei, &hi, &s0, n, psenc, &nr);
301 1.5 tnozaki if (nr == (size_t)-1 || nr == (size_t)-2) {
302 1.5 tnozaki *nresult = nr;
303 1.5 tnozaki return err;
304 1.5 tnozaki }
305 1.5 tnozaki if (err != 0)
306 1.5 tnozaki return err;
307 1.5 tnozaki n -= nr;
308 1.5 tnozaki siz = nr;
309 1.5 tnozaki if (hi < HISRG_MIN || hi > HISRG_MAX) {
310 1.5 tnozaki u32 = (uint32_t)hi;
311 1.5 tnozaki goto done;
312 1.5 tnozaki }
313 1.5 tnozaki psenc->surrogate = 1;
314 1.1 tnozaki }
315 1.5 tnozaki err = _citrus_UTF7_mbtoutf16(ei, &lo, &s0, n, psenc, &nr);
316 1.5 tnozaki if (nr == (size_t)-1 || nr == (size_t)-2) {
317 1.5 tnozaki *nresult = nr;
318 1.5 tnozaki return err;
319 1.1 tnozaki }
320 1.5 tnozaki if (err != 0)
321 1.5 tnozaki return err;
322 1.5 tnozaki hi -= HISRG_MIN;
323 1.5 tnozaki lo -= LOSRG_MIN;
324 1.5 tnozaki u32 = (hi << 10 | lo) + SRG_BASE;
325 1.5 tnozaki siz += nr;
326 1.5 tnozaki done:
327 1.5 tnozaki *s = s0;
328 1.1 tnozaki if (pwc != NULL)
329 1.1 tnozaki *pwc = (wchar_t)u32;
330 1.5 tnozaki if (u32 == (uint32_t)0) {
331 1.5 tnozaki *nresult = (size_t)0;
332 1.5 tnozaki _citrus_UTF7_init_state(ei, psenc);
333 1.5 tnozaki } else {
334 1.5 tnozaki *nresult = siz;
335 1.5 tnozaki psenc->surrogate = 0;
336 1.5 tnozaki }
337 1.5 tnozaki return err;
338 1.1 tnozaki }
339 1.1 tnozaki
340 1.5 tnozaki static int
341 1.5 tnozaki _citrus_UTF7_utf16tomb(_UTF7EncodingInfo * __restrict ei,
342 1.5 tnozaki char * __restrict s, size_t n, uint16_t u16,
343 1.5 tnozaki _UTF7State * __restrict psenc, size_t * __restrict nresult)
344 1.1 tnozaki {
345 1.1 tnozaki int bits, i;
346 1.1 tnozaki
347 1.1 tnozaki _DIAGASSERT(ei != NULL);
348 1.1 tnozaki _DIAGASSERT(psenc != NULL);
349 1.1 tnozaki
350 1.2 tnozaki if (psenc->chlen != 0 || psenc->bits > BASE64_BIT)
351 1.5 tnozaki return EINVAL;
352 1.1 tnozaki
353 1.1 tnozaki if (ISSAFE(ei, u16)) {
354 1.2 tnozaki if (psenc->mode) {
355 1.2 tnozaki if (psenc->bits > 0) {
356 1.2 tnozaki bits = BASE64_BIT - psenc->bits;
357 1.2 tnozaki i = (psenc->cache << bits) & BASE64_MAX;
358 1.2 tnozaki psenc->ch[psenc->chlen++] = base64[i];
359 1.2 tnozaki psenc->bits = psenc->cache = 0;
360 1.1 tnozaki }
361 1.1 tnozaki if (u16 == BASE64_OUT || FINDLEN(ei, u16) >= 0)
362 1.2 tnozaki psenc->ch[psenc->chlen++] = BASE64_OUT;
363 1.2 tnozaki psenc->mode = 0;
364 1.1 tnozaki }
365 1.2 tnozaki if (psenc->bits != 0)
366 1.5 tnozaki return EINVAL;
367 1.2 tnozaki psenc->ch[psenc->chlen++] = (char)u16;
368 1.1 tnozaki if (u16 == BASE64_IN)
369 1.2 tnozaki psenc->ch[psenc->chlen++] = BASE64_OUT;
370 1.1 tnozaki } else {
371 1.2 tnozaki if (!psenc->mode) {
372 1.2 tnozaki if (psenc->bits > 0)
373 1.5 tnozaki return EINVAL;
374 1.2 tnozaki psenc->ch[psenc->chlen++] = BASE64_IN;
375 1.2 tnozaki psenc->mode = 1;
376 1.1 tnozaki }
377 1.2 tnozaki psenc->cache = (psenc->cache << UTF16_BIT) | u16;
378 1.2 tnozaki bits = UTF16_BIT + psenc->bits;
379 1.2 tnozaki psenc->bits = bits % BASE64_BIT;
380 1.1 tnozaki while ((bits -= BASE64_BIT) >= 0) {
381 1.2 tnozaki i = (psenc->cache >> bits) & BASE64_MAX;
382 1.2 tnozaki psenc->ch[psenc->chlen++] = base64[i];
383 1.1 tnozaki }
384 1.1 tnozaki }
385 1.5 tnozaki memcpy(s, psenc->ch, psenc->chlen);
386 1.5 tnozaki *nresult = psenc->chlen;
387 1.5 tnozaki psenc->chlen = 0;
388 1.1 tnozaki
389 1.5 tnozaki return 0;
390 1.1 tnozaki }
391 1.1 tnozaki
392 1.1 tnozaki static int
393 1.1 tnozaki _citrus_UTF7_wcrtomb_priv(_UTF7EncodingInfo * __restrict ei,
394 1.1 tnozaki char * __restrict s, size_t n, wchar_t wchar,
395 1.1 tnozaki _UTF7State * __restrict psenc, size_t * __restrict nresult)
396 1.1 tnozaki {
397 1.1 tnozaki uint32_t u32;
398 1.1 tnozaki uint16_t u16[2];
399 1.1 tnozaki int err, len, i;
400 1.5 tnozaki size_t siz, nr;
401 1.1 tnozaki
402 1.1 tnozaki _DIAGASSERT(ei != NULL);
403 1.1 tnozaki _DIAGASSERT(s != NULL);
404 1.1 tnozaki _DIAGASSERT(psenc != NULL);
405 1.5 tnozaki _DIAGASSERT(nresult != NULL);
406 1.1 tnozaki
407 1.1 tnozaki u32 = (uint32_t)wchar;
408 1.1 tnozaki if (u32 <= UTF16_MAX) {
409 1.1 tnozaki u16[0] = (uint16_t)u32;
410 1.1 tnozaki len = 1;
411 1.1 tnozaki } else if (u32 <= UTF32_MAX) {
412 1.1 tnozaki u32 -= SRG_BASE;
413 1.1 tnozaki u16[0] = (u32 >> 10) + HISRG_MIN;
414 1.1 tnozaki u16[1] = ((uint16_t)(u32 & UINT32_C(0x3ff))) + LOSRG_MIN;
415 1.1 tnozaki len = 2;
416 1.1 tnozaki } else {
417 1.1 tnozaki *nresult = (size_t)-1;
418 1.5 tnozaki return EILSEQ;
419 1.1 tnozaki }
420 1.5 tnozaki siz = 0;
421 1.5 tnozaki for (i = 0; i < len; ++i) {
422 1.5 tnozaki err = _citrus_UTF7_utf16tomb(ei, s, n, u16[i], psenc, &nr);
423 1.5 tnozaki if (err != 0)
424 1.5 tnozaki return err; /* XXX: state has been modified */
425 1.5 tnozaki s += nr;
426 1.5 tnozaki n -= nr;
427 1.5 tnozaki siz += nr;
428 1.1 tnozaki }
429 1.5 tnozaki *nresult = siz;
430 1.1 tnozaki
431 1.5 tnozaki return 0;
432 1.1 tnozaki }
433 1.1 tnozaki
434 1.1 tnozaki static int
435 1.1 tnozaki /* ARGSUSED */
436 1.1 tnozaki _citrus_UTF7_put_state_reset(_UTF7EncodingInfo * __restrict ei,
437 1.1 tnozaki char * __restrict s, size_t n, _UTF7State * __restrict psenc,
438 1.1 tnozaki size_t * __restrict nresult)
439 1.1 tnozaki {
440 1.1 tnozaki int bits, pos;
441 1.1 tnozaki
442 1.1 tnozaki _DIAGASSERT(ei != NULL);
443 1.1 tnozaki _DIAGASSERT(s != NULL);
444 1.1 tnozaki _DIAGASSERT(psenc != NULL);
445 1.1 tnozaki _DIAGASSERT(nresult != NULL);
446 1.1 tnozaki
447 1.2 tnozaki if (psenc->chlen != 0 || psenc->bits > BASE64_BIT || psenc->surrogate)
448 1.5 tnozaki return EINVAL;
449 1.1 tnozaki
450 1.2 tnozaki if (psenc->mode) {
451 1.2 tnozaki if (psenc->bits > 0) {
452 1.1 tnozaki if (n-- < 1)
453 1.5 tnozaki return E2BIG;
454 1.2 tnozaki bits = BASE64_BIT - psenc->bits;
455 1.2 tnozaki pos = (psenc->cache << bits) & BASE64_MAX;
456 1.2 tnozaki psenc->ch[psenc->chlen++] = base64[pos];
457 1.2 tnozaki psenc->ch[psenc->chlen++] = BASE64_OUT;
458 1.2 tnozaki psenc->bits = psenc->cache = 0;
459 1.1 tnozaki }
460 1.2 tnozaki psenc->mode = 0;
461 1.1 tnozaki }
462 1.2 tnozaki if (psenc->bits != 0)
463 1.5 tnozaki return EINVAL;
464 1.1 tnozaki if (n-- < 1)
465 1.5 tnozaki return E2BIG;
466 1.1 tnozaki
467 1.2 tnozaki _DIAGASSERT(n >= psenc->chlen);
468 1.2 tnozaki *nresult = (size_t)psenc->chlen;
469 1.2 tnozaki if (psenc->chlen > 0) {
470 1.2 tnozaki memcpy(s, psenc->ch, psenc->chlen);
471 1.2 tnozaki psenc->chlen = 0;
472 1.1 tnozaki }
473 1.1 tnozaki
474 1.5 tnozaki return 0;
475 1.1 tnozaki }
476 1.1 tnozaki
477 1.1 tnozaki static __inline int
478 1.1 tnozaki /*ARGSUSED*/
479 1.1 tnozaki _citrus_UTF7_stdenc_wctocs(_UTF7EncodingInfo * __restrict ei,
480 1.1 tnozaki _csid_t * __restrict csid,
481 1.1 tnozaki _index_t * __restrict idx, wchar_t wc)
482 1.1 tnozaki {
483 1.1 tnozaki /* ei seem to be unused */
484 1.1 tnozaki _DIAGASSERT(csid != NULL);
485 1.1 tnozaki _DIAGASSERT(idx != NULL);
486 1.1 tnozaki
487 1.1 tnozaki *csid = 0;
488 1.1 tnozaki *idx = (_index_t)wc;
489 1.1 tnozaki
490 1.5 tnozaki return 0;
491 1.1 tnozaki }
492 1.1 tnozaki
493 1.1 tnozaki static __inline int
494 1.1 tnozaki /*ARGSUSED*/
495 1.1 tnozaki _citrus_UTF7_stdenc_cstowc(_UTF7EncodingInfo * __restrict ei,
496 1.1 tnozaki wchar_t * __restrict wc,
497 1.1 tnozaki _csid_t csid, _index_t idx)
498 1.1 tnozaki {
499 1.1 tnozaki /* ei seem to be unused */
500 1.1 tnozaki _DIAGASSERT(wc != NULL);
501 1.1 tnozaki
502 1.1 tnozaki if (csid != 0)
503 1.5 tnozaki return EILSEQ;
504 1.1 tnozaki *wc = (wchar_t)idx;
505 1.1 tnozaki
506 1.5 tnozaki return 0;
507 1.1 tnozaki }
508 1.1 tnozaki
509 1.3 tshiozak static __inline int
510 1.3 tshiozak /*ARGSUSED*/
511 1.3 tshiozak _citrus_UTF7_stdenc_get_state_desc_generic(_UTF7EncodingInfo * __restrict ei,
512 1.3 tshiozak _UTF7State * __restrict psenc,
513 1.3 tshiozak int * __restrict rstate)
514 1.3 tshiozak {
515 1.3 tshiozak
516 1.3 tshiozak if (psenc->chlen == 0)
517 1.3 tshiozak *rstate = _STDENC_SDGEN_INITIAL;
518 1.3 tshiozak else
519 1.3 tshiozak *rstate = _STDENC_SDGEN_INCOMPLETE_CHAR;
520 1.3 tshiozak
521 1.3 tshiozak return 0;
522 1.3 tshiozak }
523 1.3 tshiozak
524 1.1 tnozaki static void
525 1.1 tnozaki /*ARGSUSED*/
526 1.1 tnozaki _citrus_UTF7_encoding_module_uninit(_UTF7EncodingInfo *ei)
527 1.1 tnozaki {
528 1.1 tnozaki /* ei seems to be unused */
529 1.1 tnozaki }
530 1.1 tnozaki
531 1.1 tnozaki static int
532 1.1 tnozaki /*ARGSUSED*/
533 1.1 tnozaki _citrus_UTF7_encoding_module_init(_UTF7EncodingInfo * __restrict ei,
534 1.1 tnozaki const void * __restrict var, size_t lenvar)
535 1.1 tnozaki {
536 1.1 tnozaki const char *s;
537 1.1 tnozaki
538 1.3 tshiozak _DIAGASSERT(ei != NULL);
539 1.1 tnozaki /* var may be null */
540 1.1 tnozaki
541 1.1 tnozaki memset(ei, 0, sizeof(*ei));
542 1.1 tnozaki
543 1.1 tnozaki #define FILL(str, flag) \
544 1.1 tnozaki do { \
545 1.1 tnozaki for (s = str; *s != '\0'; s++) \
546 1.1 tnozaki ei->cell[*s & 0x7f] |= flag; \
547 1.1 tnozaki } while (/*CONSTCOND*/0)
548 1.1 tnozaki
549 1.1 tnozaki FILL(base64, (s - base64) + 1);
550 1.1 tnozaki FILL(direct, EI_DIRECT);
551 1.1 tnozaki FILL(option, EI_OPTION);
552 1.1 tnozaki FILL(spaces, EI_SPACE);
553 1.1 tnozaki
554 1.5 tnozaki return 0;
555 1.1 tnozaki }
556 1.1 tnozaki
557 1.1 tnozaki /* ----------------------------------------------------------------------
558 1.1 tnozaki * public interface for ctype
559 1.1 tnozaki */
560 1.1 tnozaki
561 1.1 tnozaki _CITRUS_CTYPE_DECLS(UTF7);
562 1.1 tnozaki _CITRUS_CTYPE_DEF_OPS(UTF7);
563 1.1 tnozaki
564 1.1 tnozaki #include "citrus_ctype_template.h"
565 1.1 tnozaki
566 1.1 tnozaki /* ----------------------------------------------------------------------
567 1.1 tnozaki * public interface for stdenc
568 1.1 tnozaki */
569 1.1 tnozaki
570 1.1 tnozaki _CITRUS_STDENC_DECLS(UTF7);
571 1.1 tnozaki _CITRUS_STDENC_DEF_OPS(UTF7);
572 1.1 tnozaki
573 1.1 tnozaki #include "citrus_stdenc_template.h"
574