mime_codecs.c revision 1.11 1 1.11 christos /* $NetBSD: mime_codecs.c,v 1.11 2013/02/14 18:23:45 christos Exp $ */
2 1.1 christos
3 1.1 christos /*-
4 1.1 christos * Copyright (c) 2006 The NetBSD Foundation, Inc.
5 1.1 christos * All rights reserved.
6 1.1 christos *
7 1.1 christos * This code is derived from software contributed to The NetBSD Foundation
8 1.1 christos * by Anon Ymous.
9 1.1 christos *
10 1.1 christos * Redistribution and use in source and binary forms, with or without
11 1.1 christos * modification, are permitted provided that the following conditions
12 1.1 christos * are met:
13 1.1 christos * 1. Redistributions of source code must retain the above copyright
14 1.1 christos * notice, this list of conditions and the following disclaimer.
15 1.1 christos * 2. Redistributions in binary form must reproduce the above copyright
16 1.1 christos * notice, this list of conditions and the following disclaimer in the
17 1.1 christos * documentation and/or other materials provided with the distribution.
18 1.1 christos *
19 1.1 christos * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20 1.1 christos * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21 1.1 christos * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 1.1 christos * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23 1.1 christos * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 1.1 christos * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 1.1 christos * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 1.1 christos * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 1.1 christos * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 1.1 christos * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 1.1 christos * POSSIBILITY OF SUCH DAMAGE.
30 1.1 christos */
31 1.1 christos
32 1.1 christos /*
33 1.1 christos * This module contains all mime related codecs. Typically there are
34 1.1 christos * two versions: one operating on buffers and one operating on files.
35 1.1 christos * All exported routines have a "mime_" prefix. The file oriented
36 1.1 christos * routines have a "mime_f" prefix replacing the "mime_" prefix of the
37 1.1 christos * equivalent buffer based version.
38 1.1 christos *
39 1.1 christos * The file based API should be:
40 1.1 christos *
41 1.1 christos * mime_f<name>_{encode,decode}(FILE *in, FILE *out, void *cookie)
42 1.1 christos *
 * XXX - currently this naming convention has not been adhered to.
44 1.1 christos *
45 1.1 christos * where the cookie is a generic way to pass arguments to the routine.
46 1.1 christos * This way these routines can be run by run_function() in mime.c.
47 1.1 christos *
48 1.1 christos * The buffer based API is not as rigid.
49 1.1 christos */
50 1.1 christos
51 1.1 christos #ifdef MIME_SUPPORT
52 1.1 christos
53 1.1 christos #include <sys/cdefs.h>
54 1.1 christos #ifndef __lint__
55 1.11 christos __RCSID("$NetBSD: mime_codecs.c,v 1.11 2013/02/14 18:23:45 christos Exp $");
56 1.1 christos #endif /* not __lint__ */
57 1.1 christos
58 1.1 christos #include <assert.h>
59 1.1 christos #include <iconv.h>
60 1.1 christos #include <stdio.h>
61 1.1 christos #include <stdlib.h>
62 1.1 christos #include <util.h>
63 1.1 christos
64 1.1 christos #include "def.h"
65 1.1 christos #include "extern.h"
66 1.1 christos #include "mime_codecs.h"
67 1.1 christos
68 1.1 christos
69 1.1 christos #ifdef CHARSET_SUPPORT
70 1.1 christos /************************************************************************
71 1.1 christos * Core character set conversion routines.
72 1.1 christos *
73 1.1 christos */
74 1.1 christos
75 1.1 christos /*
76 1.1 christos * Fault-tolerant iconv() function.
77 1.1 christos *
78 1.1 christos * This routine was borrowed from nail-11.25/mime.c and modified. It
79 1.1 christos * tries to handle errno == EILSEQ by restarting at the next input
80 1.1 christos * byte (is this a good idea?). All other errors are handled by the
81 1.1 christos * caller.
82 1.1 christos */
83 1.1 christos PUBLIC size_t
84 1.1 christos mime_iconv(iconv_t cd, const char **inb, size_t *inbleft, char **outb, size_t *outbleft)
85 1.1 christos {
86 1.1 christos size_t sz = 0;
87 1.1 christos
88 1.1 christos while ((sz = iconv(cd, inb, inbleft, outb, outbleft)) == (size_t)-1
89 1.1 christos && errno == EILSEQ) {
90 1.1 christos if (*outbleft > 0) {
91 1.1 christos *(*outb)++ = '?';
92 1.1 christos (*outbleft)--;
93 1.1 christos } else {
94 1.1 christos **outb = '\0';
95 1.1 christos return E2BIG;
96 1.1 christos }
97 1.1 christos if (*inbleft > 0) {
98 1.1 christos (*inb)++;
99 1.1 christos (*inbleft)--;
100 1.1 christos } else {
101 1.1 christos **outb = '\0';
102 1.1 christos break;
103 1.1 christos }
104 1.1 christos }
105 1.1 christos return sz;
106 1.1 christos }
107 1.1 christos
108 1.1 christos /*
109 1.1 christos * This routine was mostly borrowed from src/usr.bin/iconv/iconv.c.
110 1.1 christos * We don't care about the invalid character count, so don't bother
111 1.1 christos * with __iconv(). We do care about robustness, so call iconv_ft()
112 1.1 christos * above to try to recover from errors.
113 1.1 christos */
114 1.1 christos #define INBUFSIZE 1024
115 1.1 christos #define OUTBUFSIZE (INBUFSIZE * 2)
116 1.1 christos
117 1.1 christos PUBLIC void
118 1.1 christos mime_ficonv(FILE *fi, FILE *fo, void *cookie)
119 1.1 christos {
120 1.1 christos char inbuf[INBUFSIZE], outbuf[OUTBUFSIZE], *out;
121 1.1 christos const char *in;
122 1.1 christos size_t inbytes, outbytes, ret;
123 1.1 christos iconv_t cd;
124 1.1 christos
125 1.1 christos /*
126 1.1 christos * NOTE: iconv_t is actually a pointer typedef, so this
127 1.1 christos * conversion is not what it appears to be!
128 1.1 christos */
129 1.1 christos cd = (iconv_t)cookie;
130 1.1 christos
131 1.1 christos while ((inbytes = fread(inbuf, 1, INBUFSIZE, fi)) > 0) {
132 1.1 christos in = inbuf;
133 1.1 christos while (inbytes > 0) {
134 1.1 christos out = outbuf;
135 1.1 christos outbytes = OUTBUFSIZE;
136 1.1 christos ret = mime_iconv(cd, &in, &inbytes, &out, &outbytes);
137 1.1 christos if (ret == (size_t)-1 && errno != E2BIG) {
138 1.1 christos if (errno != EINVAL || in == inbuf) {
139 1.1 christos /* XXX - what is proper here?
140 1.1 christos * Just copy out the remains? */
141 1.1 christos (void)fprintf(fo,
142 1.1 christos "\n\t[ iconv truncated message: %s ]\n\n",
143 1.1 christos strerror(errno));
144 1.1 christos return;
145 1.1 christos }
146 1.1 christos /*
147 1.1 christos * If here: errno == EINVAL && in != inbuf
148 1.1 christos */
149 1.1 christos /* incomplete input character */
150 1.1 christos (void)memmove(inbuf, in, inbytes);
151 1.1 christos ret = fread(inbuf + inbytes, 1,
152 1.1 christos INBUFSIZE - inbytes, fi);
153 1.1 christos if (ret == 0) {
154 1.1 christos if (feof(fi)) {
155 1.1 christos (void)fprintf(fo,
156 1.1 christos "\n\t[ unexpected end of file; "
157 1.1 christos "the last character is "
158 1.1 christos "incomplete. ]\n\n");
159 1.1 christos return;
160 1.1 christos }
161 1.1 christos (void)fprintf(fo,
162 1.1 christos "\n\t[ fread(): %s ]\n\n",
163 1.1 christos strerror(errno));
164 1.1 christos return;
165 1.1 christos }
166 1.1 christos in = inbuf;
167 1.1 christos inbytes += ret;
168 1.1 christos
169 1.1 christos }
170 1.1 christos if (outbytes < OUTBUFSIZE)
171 1.1 christos (void)fwrite(outbuf, 1, OUTBUFSIZE - outbytes, fo);
172 1.1 christos }
173 1.1 christos }
174 1.1 christos /* reset the shift state of the output buffer */
175 1.1 christos outbytes = OUTBUFSIZE;
176 1.1 christos out = outbuf;
177 1.1 christos ret = iconv(cd, NULL, NULL, &out, &outbytes);
178 1.1 christos if (ret == (size_t)-1) {
179 1.1 christos (void)fprintf(fo, "\n\t[ iconv(): %s ]\n\n",
180 1.1 christos strerror(errno));
181 1.1 christos return;
182 1.1 christos }
183 1.1 christos if (outbytes < OUTBUFSIZE)
184 1.1 christos (void)fwrite(outbuf, 1, OUTBUFSIZE - outbytes, fo);
185 1.1 christos }
186 1.1 christos
187 1.1 christos #endif /* CHARSET_SUPPORT */
188 1.1 christos
189 1.1 christos
190 1.1 christos
191 1.1 christos /************************************************************************
192 1.1 christos * Core base64 routines
193 1.1 christos *
194 1.1 christos * Defined in sec 6.8 of RFC 2045.
195 1.1 christos */
196 1.1 christos
/*
 * Decode a base64 buffer.
 *
 * bin: buffer to hold the decoded (binary) result (see note 1).
 * b64: buffer holding the encoded (base64) source.
 * cnt: number of bytes in the b64 buffer to decode (see note 2).
 *
 * Return: the number of bytes written to the 'bin' buffer or -1 on
 *         error.
 * NOTES:
 * 1) It is the callers responsibility to ensure that bin is large
 *    enough to hold the result (at most 3 bytes per 4 input bytes).
 * 2) The b64 buffer should always contain a multiple of 4 bytes of
 *    data!  A truncated trailing group is rejected with -1; bytes
 *    beyond 'cnt' are never examined.
 * 3) Decoding stops after the first group that contains '=' padding;
 *    anything following that group is ignored.
 */
PUBLIC ssize_t
mime_b64tobin(char *bin, const char *b64, size_t cnt)
{
	static const signed char b64index[] = {
		-1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1,
		-1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1,
		-1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,62, -1,-1,-1,63,
		52,53,54,55, 56,57,58,59, 60,61,-1,-1, -1,-2,-1,-1,
		-1, 0, 1, 2,  3, 4, 5, 6,  7, 8, 9,10, 11,12,13,14,
		15,16,17,18, 19,20,21,22, 23,24,25,-1, -1,-1,-1,-1,
		-1,26,27,28, 29,30,31,32, 33,34,35,36, 37,38,39,40,
		41,42,43,44, 45,46,47,48, 49,50,51,-1, -1,-1,-1,-1
	};
	unsigned char *p;
	const unsigned char *q, *end;

#define EQU	(unsigned)-2	/* table value of the '=' pad character */
#define BAD	(unsigned)-1	/* table value of a non-base64 character */
#define uchar64(c)  ((c) >= sizeof(b64index) ? BAD : (unsigned)b64index[(c)])

	p = (unsigned char *)bin;
	q = (const unsigned char *)b64;
	for (end = q + cnt; q < end; q += 4) {
		unsigned a, b, c, d;

		/* a partial group would force a read beyond the input */
		if (end - q < 4)
			return -1;

		a = uchar64(q[0]);
		b = uchar64(q[1]);
		c = uchar64(q[2]);
		d = uchar64(q[3]);

		/* padding is only legal in the last two positions */
		if (a == BAD || a == EQU || b == BAD || b == EQU ||
		    c == BAD || d == BAD)
			return -1;

		*p++ = (unsigned char)((a << 2) | ((b & 0x30) >> 4));
		if (c == EQU) {	/* got '=' */
			if (d != EQU)
				return -1;
			break;
		}
		*p++ = (unsigned char)(((b & 0x0f) << 4) | ((c & 0x3c) >> 2));
		if (d == EQU) {	/* got '=' */
			break;
		}
		*p++ = (unsigned char)(((c & 0x03) << 6) | d);
	}

#undef uchar64
#undef EQU
#undef BAD

	return p - (unsigned char *)bin;
}
263 1.1 christos
/*
 * Encode a buffer as a base64 result.
 *
 * b64: buffer to hold the encoded (base64) result (see note).
 * bin: buffer holding the binary source.
 * cnt: number of bytes in the bin buffer to encode.
 *
 * NOTE: it is the callers responsibility to ensure that 'b64' is
 * large enough to hold the result: 4 bytes for every (possibly
 * partial) group of 3 input bytes.  The result is padded with '='
 * and is not NUL terminated.  Only the 'cnt' bytes of 'bin' are read.
 */
PUBLIC void
mime_bintob64(char *b64, const char *bin, size_t cnt)
{
	static const char b64table[] =
	    "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/";
	const unsigned char *p = (const unsigned char *)bin;

	while (cnt > 0) {
		/* number of input bytes available for this group */
		size_t n = cnt < 3 ? cnt : 3;
		unsigned a = p[0];
		/* missing bytes count as zero bits; never read beyond cnt */
		unsigned b = n > 1 ? p[1] : 0;
		unsigned c = n > 2 ? p[2] : 0;

		b64[0] = b64table[a >> 2];
		b64[1] = b64table[((a & 0x3) << 4) | ((b & 0xf0) >> 4)];
		b64[2] = n > 1 ?
		    b64table[((b & 0xf) << 2) | ((c & 0xc0) >> 6)] : '=';
		b64[3] = n > 2 ? b64table[c & 0x3f] : '=';

		p += n;
		b64 += 4;
		cnt -= n;
	}
}
309 1.1 christos
310 1.1 christos
311 1.1 christos #define MIME_BASE64_LINE_MAX (4 * 19) /* max line length is 76: see RFC2045 sec 6.8 */
312 1.1 christos
313 1.1 christos static void
314 1.1 christos mime_fB64_encode(FILE *fi, FILE *fo, void *cookie __unused)
315 1.1 christos {
316 1.1 christos static char b64[MIME_BASE64_LINE_MAX];
317 1.1 christos static char mem[3 * (MIME_BASE64_LINE_MAX / 4)];
318 1.9 christos size_t cnt;
319 1.1 christos char *cp;
320 1.1 christos size_t limit;
321 1.1 christos #ifdef __lint__
322 1.1 christos cookie = cookie;
323 1.1 christos #endif
324 1.1 christos limit = 0;
325 1.1 christos if ((cp = value(ENAME_MIME_B64_LINE_MAX)) != NULL)
326 1.1 christos limit = (size_t)atoi(cp);
327 1.1 christos if (limit == 0 || limit > sizeof(b64))
328 1.1 christos limit = sizeof(b64);
329 1.1 christos
330 1.1 christos limit = 3 * roundup(limit, 4) / 4;
331 1.1 christos if (limit < 3)
332 1.1 christos limit = 3;
333 1.1 christos
334 1.1 christos while ((cnt = fread(mem, sizeof(*mem), limit, fi)) > 0) {
335 1.1 christos mime_bintob64(b64, mem, (size_t)cnt);
336 1.1 christos (void)fwrite(b64, sizeof(*b64), (size_t)4 * roundup(cnt, 3) / 3, fo);
337 1.1 christos (void)putc('\n', fo);
338 1.1 christos }
339 1.1 christos }
340 1.1 christos
341 1.1 christos static void
342 1.4 christos mime_fB64_decode(FILE *fi, FILE *fo, void *add_lf)
343 1.1 christos {
344 1.1 christos char *line;
345 1.1 christos size_t len;
346 1.1 christos char *buf;
347 1.1 christos size_t buflen;
348 1.1 christos
349 1.1 christos buflen = 3 * (MIME_BASE64_LINE_MAX / 4);
350 1.1 christos buf = emalloc(buflen);
351 1.1 christos
352 1.1 christos while ((line = fgetln(fi, &len)) != NULL) {
353 1.1 christos ssize_t binlen;
354 1.1 christos if (line[len-1] == '\n') /* forget the trailing newline */
355 1.1 christos len--;
356 1.1 christos
357 1.1 christos /* trash trailing white space */
358 1.6 christos for (/*EMPTY*/; len > 0 && is_WSP(line[len-1]); len--)
359 1.1 christos continue;
360 1.1 christos
361 1.1 christos /* skip leading white space */
362 1.6 christos for (/*EMPTY*/; len > 0 && is_WSP(line[0]); len--, line++)
363 1.1 christos continue;
364 1.1 christos
365 1.1 christos if (len == 0)
366 1.1 christos break;
367 1.1 christos
368 1.1 christos if (3 * len > 4 * buflen) {
369 1.1 christos buflen *= 2;
370 1.1 christos buf = erealloc(buf, buflen);
371 1.1 christos }
372 1.1 christos
373 1.1 christos binlen = mime_b64tobin(buf, line, len);
374 1.1 christos
375 1.1 christos if (binlen <= 0) {
376 1.1 christos (void)fprintf(fo, "WARN: invalid base64 encoding\n");
377 1.1 christos break;
378 1.1 christos }
379 1.1 christos (void)fwrite(buf, 1, (size_t)binlen, fo);
380 1.1 christos }
381 1.1 christos
382 1.1 christos free(buf);
383 1.1 christos
384 1.4 christos if (add_lf)
385 1.1 christos (void)fputc('\n', fo);
386 1.1 christos }
387 1.1 christos
388 1.1 christos
389 1.1 christos /************************************************************************
390 1.1 christos * Core quoted-printable routines.
391 1.1 christos *
392 1.11 christos * Defined in sec 6.7 of RFC 2045.
393 1.1 christos */
394 1.1 christos
/*
 * Convert the two hexadecimal digits at 'hex' into the byte value
 * they denote; like strtol(3), but inline and with easy error
 * indication.
 *
 * Return: the value (0 - 255), or -1 if either character is not a
 * hexadecimal digit.  The second character is not examined when the
 * first one is already out of the table's range.
 */
static inline int
_qp_cfromhex(char const *hex)
{
	/*
	 * Digit values indexed by (character - '0'); 0xFF marks an
	 * invalid character.  Be robust, allow lowercase hexadecimal
	 * letters, too.
	 */
	static unsigned char const nibble[] = {
		0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, /* 0x30-0x37 */
		0x08, 0x09, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, /* 0x38-0x3F */
		0xFF, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF, /* 0x40-0x47 */
		0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, /* 0x48-0x4f */
		0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, /* 0x50-0x57 */
		0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, /* 0x58-0x5f */
		0xFF, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0xFF  /* 0x60-0x67 */
	};
	size_t const span = sizeof(nibble) / sizeof(nibble[0]);
	unsigned char hi, lo;

	/* characters below '0' wrap around to large values and fail too */
	hi = (unsigned char)((unsigned char)hex[0] - '0');
	if (hi >= span)
		return -1;
	lo = (unsigned char)((unsigned char)hex[1] - '0');
	if (lo >= span)
		return -1;

	hi = nibble[hi];
	lo = nibble[lo];
	if (((hi | lo) & 0xF0) != 0)	/* at least one 0xFF marker */
		return -1;

	return (hi << 4) + lo;
}
430 1.11 christos
/*
 * Header specific "quoted-printable" decode!
 * Differences with body QP decoding (see rfc 2047, sec 4.2):
 * 1) '=' occurs _only_ when followed by two hex digits (FWS is not allowed).
 * 2) Spaces can be encoded as '_' in headers for readability.
 *
 * outbuf/outlen: buffer receiving the decoded bytes and its size.
 * inbuf/inlen:   the encoded text and its length.
 *
 * Return: the number of bytes stored in 'outbuf', or -1 if the output
 * buffer is too small or a '=' is not followed by two hex digits.
 * The result is not NUL terminated.
 */
static ssize_t
mime_QPh_decode(char *outbuf, size_t outlen, const char *inbuf, size_t inlen)
{
	const char *src = inbuf;
	const char *const inend = inbuf + inlen;
	char *dst = outbuf;
	char *const outend = outbuf + outlen;
	int ch;

	while (src < inend) {
		if (dst >= outend)
			return -1;

		switch (*src) {
		case '=':
			/* need the '=' itself plus two hex digits */
			if (inend - src < 3)
				return -1;
			ch = _qp_cfromhex(src + 1);
			if (ch < 0)
				return -1;
			*dst++ = (char)ch;
			src += 3;
			break;
		case '_':	/* header's may encode ' ' as '_' */
			*dst++ = ' ';
			src++;
			break;
		default:
			*dst++ = *src++;
			break;
		}
	}
	return dst - outbuf;
}
468 1.11 christos
469 1.11 christos
/*
 * Decide whether the character at 'p' must be written in its quoted
 * ("=XX") form by the quoted-printable encoder.
 *
 * p:   the character to examine.
 * end: one past the last character of the input line.
 * l:   length of the current output line (0 at the start of a line).
 *
 * Return: non-zero if the character must be quoted, 0 otherwise.
 */
static int
mustquote(unsigned char *p, unsigned char *end, size_t l)
{
	/*
	 * Character classes.  They are block scoped enumerators, so
	 * none of these short names is visible outside this function.
	 */
	enum {
		N  = 0,		/* do not quote */
		Q  = 1,		/* must quote */
		SP = 2,		/* white space */
		XF = 3,		/* special character 'F' - maybe quoted */
		XD = 4,		/* special character '.' - maybe quoted */
		EQ = Q,		/* '=' must be quoted */
		TB = SP,	/* treat '\t' as a space */
		NL = N,		/* don't quote '\n' (NL) - XXX - quoting here
				 * breaks the line length algorithm */
		CR = Q		/* always quote a '\r' (CR) - it occurs only
				 * in a CRLF combo */
	};
	static const signed char quotetab[] = {
		 Q, Q, Q, Q,  Q, Q, Q, Q,  Q,TB,NL, Q,  Q,CR, Q, Q,
		 Q, Q, Q, Q,  Q, Q, Q, Q,  Q, Q, Q, Q,  Q, Q, Q, Q,
		SP, N, N, N,  N, N, N, N,  N, N, N, N,  N, N,XD, N,
		 N, N, N, N,  N, N, N, N,  N, N, N, N,  N,EQ, N, N,

		 N, N, N, N,  N, N,XF, N,  N, N, N, N,  N, N, N, N,
		 N, N, N, N,  N, N, N, N,  N, N, N, N,  N, N, N, N,
		 N, N, N, N,  N, N, N, N,  N, N, N, N,  N, N, N, N,
		 N, N, N, N,  N, N, N, N,  N, N, N, N,  N, N, N, Q,
	};
	/* everything outside of 7-bit ASCII is always quoted */
	int flag = *p > 0x7f ? Q : quotetab[*p];

	if (flag == N)
		return 0;
	if (flag == Q)
		return 1;
	if (flag == SP)
		return p + 1 < end && p[1] == '\n'; /* trailing white space */

	/* The remainder are special start-of-line cases. */
	if (l != 0)
		return 0;

	if (flag == XF)	/* line may start with "From" */
		return p + 4 < end && p[1] == 'r' && p[2] == 'o' && p[3] == 'm';

	if (flag == XD)	/* line may consist of a single dot */
		return p + 1 < end && p[1] == '\n';

	errx(EXIT_FAILURE,
	    "mustquote: invalid logic: *p=0x%x (%d) flag=%d, l=%zu\n",
	    *p, *p, flag, l);
	/* NOT REACHED */
	return 0;	/* appease GCC */
}
528 1.1 christos
529 1.1 christos
#define MIME_QUOTED_LINE_MAX	76  /* QP max length: see RFC2045 sec 6.7 */

/*
 * Write one input line to 'fo' in quoted-printable form.
 *
 * fo:    the output stream.
 * line:  the input line (need not be NUL terminated).
 * len:   number of bytes in 'line'.
 * limit: maximum output line length; when an output line would grow
 *        beyond it, a soft line break ("=\n") is inserted.
 */
static void
fput_quoted_line(FILE *fo, char *line, size_t len, size_t limit)
{
	unsigned char *const first = (unsigned char *)line;
	unsigned char *const last = first + len;
	unsigned char *cur;
	size_t col;	/* length of current output line */

	assert(limit <= MIME_QUOTED_LINE_MAX);

	col = 0;
	for (cur = first; cur < last; cur++) {
		if (mustquote(cur, last, col)) {
			/* "=XX" plus room for a soft line break */
			if (col + 4 > limit) {
				(void)fputs("=\n", fo);
				col = 0;
			}
			(void)fprintf(fo, "=%02X", *cur);
			col += 3;
			continue;
		}

		if (*cur != '\n') {
			if (col + 2 > limit) {
				(void)fputs("=\n", fo);
				col = 0;
			}
			(void)putc(*cur, fo);
			col++;
			continue;
		}

		/*
		 * A newline.  If it follows a '\r', emit it in quoted
		 * form followed by a soft line break, so that the real
		 * newline written below is not part of the data.
		 */
		if (cur > first && cur[-1] == '\r') {
			if (col + 4 > limit)
				(void)fputs("=\n", fo);
			(void)fputs("=0A=", fo);
		}
		(void)putc('\n', fo);
		col = 0;	/* a fresh output line starts here */
	}
	/*
	 * Lines ending in a blank must escape the newline.
	 */
	if (len != 0 && is_WSP(last[-1]))
		(void)fputs("=\n", fo);
}
577 1.1 christos
578 1.1 christos static void
579 1.1 christos mime_fQP_encode(FILE *fi, FILE *fo, void *cookie __unused)
580 1.1 christos {
581 1.1 christos char *line;
582 1.1 christos size_t len;
583 1.1 christos char *cp;
584 1.1 christos size_t limit;
585 1.1 christos
586 1.1 christos #ifdef __lint__
587 1.1 christos cookie = cookie;
588 1.1 christos #endif
589 1.1 christos limit = 0;
590 1.1 christos if ((cp = value(ENAME_MIME_QP_LINE_MAX)) != NULL)
591 1.1 christos limit = (size_t)atoi(cp);
592 1.1 christos if (limit == 0 || limit > MIME_QUOTED_LINE_MAX)
593 1.1 christos limit = MIME_QUOTED_LINE_MAX;
594 1.1 christos if (limit < 4)
595 1.1 christos limit = 4;
596 1.1 christos
597 1.1 christos while ((line = fgetln(fi, &len)) != NULL)
598 1.1 christos fput_quoted_line(fo, line, len, limit);
599 1.1 christos }
600 1.1 christos
601 1.1 christos static void
602 1.1 christos mime_fQP_decode(FILE *fi, FILE *fo, void *cookie __unused)
603 1.1 christos {
604 1.1 christos char *line;
605 1.1 christos size_t len;
606 1.1 christos
607 1.1 christos #ifdef __lint__
608 1.1 christos cookie = cookie;
609 1.1 christos #endif
610 1.1 christos while ((line = fgetln(fi, &len)) != NULL) {
611 1.1 christos char *p;
612 1.1 christos char *end;
613 1.9 christos
614 1.1 christos end = line + len;
615 1.1 christos for (p = line; p < end; p++) {
616 1.1 christos if (*p == '=') {
617 1.1 christos p++;
618 1.6 christos while (p < end && is_WSP(*p))
619 1.1 christos p++;
620 1.1 christos if (*p != '\n' && p + 1 < end) {
621 1.11 christos int c = _qp_cfromhex(p++);
622 1.11 christos if (c >= 0)
623 1.11 christos (void)fputc(c, fo);
624 1.11 christos else
625 1.11 christos (void)fputs("[?]", fo);
626 1.1 christos }
627 1.1 christos }
628 1.1 christos else
629 1.1 christos (void)fputc(*p, fo);
630 1.1 christos }
631 1.1 christos }
632 1.1 christos }
633 1.1 christos
634 1.1 christos
635 1.1 christos /************************************************************************
636 1.1 christos * Routines to select the codec by name.
637 1.1 christos */
638 1.1 christos
639 1.1 christos PUBLIC void
640 1.1 christos mime_fio_copy(FILE *fi, FILE *fo, void *cookie __unused)
641 1.1 christos {
642 1.1 christos int c;
643 1.1 christos
644 1.1 christos #ifdef __lint__
645 1.1 christos cookie = cookie;
646 1.1 christos #endif
647 1.1 christos while ((c = getc(fi)) != EOF)
648 1.1 christos (void)putc(c, fo);
649 1.1 christos
650 1.1 christos (void)fflush(fo);
651 1.1 christos if (ferror(fi)) {
652 1.1 christos warn("read");
653 1.1 christos rewind(fi);
654 1.1 christos return;
655 1.1 christos }
656 1.1 christos if (ferror(fo)) {
657 1.1 christos warn("write");
658 1.1 christos (void)Fclose(fo);
659 1.1 christos rewind(fi);
660 1.1 christos return;
661 1.1 christos }
662 1.1 christos }
663 1.1 christos
664 1.1 christos
665 1.1 christos static const struct transfer_encoding_s {
666 1.1 christos const char *name;
667 1.1 christos mime_codec_t enc;
668 1.1 christos mime_codec_t dec;
669 1.1 christos } transfer_encoding_tbl[] = {
670 1.1 christos { MIME_TRANSFER_7BIT, mime_fio_copy, mime_fio_copy },
671 1.1 christos { MIME_TRANSFER_8BIT, mime_fio_copy, mime_fio_copy },
672 1.1 christos { MIME_TRANSFER_BINARY, mime_fio_copy, mime_fio_copy },
673 1.1 christos { MIME_TRANSFER_QUOTED, mime_fQP_encode, mime_fQP_decode },
674 1.1 christos { MIME_TRANSFER_BASE64, mime_fB64_encode, mime_fB64_decode },
675 1.1 christos { NULL, NULL, NULL },
676 1.1 christos };
677 1.1 christos
678 1.1 christos
679 1.1 christos PUBLIC mime_codec_t
680 1.1 christos mime_fio_encoder(const char *ename)
681 1.1 christos {
682 1.1 christos const struct transfer_encoding_s *tep = NULL;
683 1.1 christos
684 1.1 christos if (ename == NULL)
685 1.1 christos return NULL;
686 1.1 christos
687 1.1 christos for (tep = transfer_encoding_tbl; tep->name; tep++)
688 1.1 christos if (strcasecmp(tep->name, ename) == 0)
689 1.1 christos break;
690 1.1 christos return tep->enc;
691 1.1 christos }
692 1.1 christos
693 1.1 christos PUBLIC mime_codec_t
694 1.1 christos mime_fio_decoder(const char *ename)
695 1.1 christos {
696 1.1 christos const struct transfer_encoding_s *tep = NULL;
697 1.1 christos
698 1.1 christos if (ename == NULL)
699 1.1 christos return NULL;
700 1.1 christos
701 1.1 christos for (tep = transfer_encoding_tbl; tep->name; tep++)
702 1.1 christos if (strcasecmp(tep->name, ename) == 0)
703 1.1 christos break;
704 1.1 christos return tep->dec;
705 1.1 christos }
706 1.1 christos
707 1.1 christos /*
708 1.11 christos * Decode a RFC 2047 extended message header *encoded-word*.
709 1.11 christos * *encoding* is the corresponding character of the *encoded-word*.
710 1.11 christos */
711 1.11 christos PUBLIC ssize_t
712 1.11 christos mime_rfc2047_decode(char encoding, char *outbuf, size_t outlen,
713 1.11 christos const char *inbuf, size_t inlen)
714 1.11 christos {
715 1.11 christos ssize_t declen = -1;
716 1.11 christos
717 1.11 christos if (encoding == 'B' || encoding == 'b') {
718 1.11 christos if (outlen >= 3 * roundup(inlen, 4) / 4)
719 1.11 christos declen = mime_b64tobin(outbuf, inbuf, inlen);
720 1.11 christos } else if (encoding == 'Q' || encoding == 'q')
721 1.11 christos declen = mime_QPh_decode(outbuf, outlen, inbuf, inlen);
722 1.11 christos return declen;
723 1.11 christos }
724 1.11 christos
725 1.11 christos /*
726 1.1 christos * This is for use in complete.c and mime.c to get the list of
727 1.1 christos * encoding names without exposing the transfer_encoding_tbl[]. The
728 1.1 christos * first name is returned if called with a pointer to a NULL pointer.
729 1.1 christos * Subsequent calls with the same cookie give successive names. A
730 1.1 christos * NULL return indicates the end of the list.
731 1.1 christos */
732 1.1 christos PUBLIC const char *
733 1.1 christos mime_next_encoding_name(const void **cookie)
734 1.1 christos {
735 1.1 christos const struct transfer_encoding_s *tep;
736 1.1 christos
737 1.1 christos tep = *cookie;
738 1.1 christos if (tep == NULL)
739 1.1 christos tep = transfer_encoding_tbl;
740 1.1 christos
741 1.1 christos *cookie = tep->name ? &tep[1] : NULL;
742 1.1 christos
743 1.1 christos return tep->name;
744 1.1 christos }
745 1.1 christos
746 1.1 christos #endif /* MIME_SUPPORT */
747