/*	$NetBSD: vis.c,v 1.44 2011/03/12 19:52:48 christos Exp $	*/
2
3 /*-
4 * Copyright (c) 1989, 1993
5 * The Regents of the University of California. All rights reserved.
6 *
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following conditions
9 * are met:
10 * 1. Redistributions of source code must retain the above copyright
11 * notice, this list of conditions and the following disclaimer.
12 * 2. Redistributions in binary form must reproduce the above copyright
13 * notice, this list of conditions and the following disclaimer in the
14 * documentation and/or other materials provided with the distribution.
15 * 3. Neither the name of the University nor the names of its contributors
16 * may be used to endorse or promote products derived from this software
17 * without specific prior written permission.
18 *
19 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
20 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
21 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
22 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
23 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
24 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
25 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
26 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
27 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
28 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29 * SUCH DAMAGE.
30 */
31
32 /*-
33 * Copyright (c) 1999, 2005 The NetBSD Foundation, Inc.
34 * All rights reserved.
35 *
36 * Redistribution and use in source and binary forms, with or without
37 * modification, are permitted provided that the following conditions
38 * are met:
39 * 1. Redistributions of source code must retain the above copyright
40 * notice, this list of conditions and the following disclaimer.
41 * 2. Redistributions in binary form must reproduce the above copyright
42 * notice, this list of conditions and the following disclaimer in the
43 * documentation and/or other materials provided with the distribution.
44 *
45 * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
46 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
47 * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
48 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
49 * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
50 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
51 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
52 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
53 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
54 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
55 * POSSIBILITY OF SUCH DAMAGE.
56 */
57
58 #include <sys/cdefs.h>
59 #if defined(LIBC_SCCS) && !defined(lint)
60 __RCSID("$NetBSD: vis.c,v 1.44 2011/03/12 19:52:48 christos Exp $");
61 #endif /* LIBC_SCCS and not lint */
62
63 #include "namespace.h"
64 #include <sys/types.h>
65
66 #include <assert.h>
67 #include <vis.h>
68 #include <errno.h>
69 #include <stdlib.h>
70
71 #ifdef __weak_alias
72 __weak_alias(strvisx,_strvisx)
73 #endif
74
75 #if !HAVE_VIS || !HAVE_SVIS
76 #include <ctype.h>
77 #include <limits.h>
78 #include <stdio.h>
79 #include <string.h>
80
/* Forward declaration: do_hvis() and do_mvis() fall back on do_svis(). */
static char *do_svis(char *, size_t *, int, int, int, const char *);

#undef BELL
#define BELL '\a'

/*
 * Character classification and hex-digit helpers.
 *
 * Every use of the argument is parenthesised so that an expression
 * argument (for example a conditional expression) is classified as a
 * whole.  iswhite() and issafe() still evaluate their argument more
 * than once, so do not pass expressions with side effects.
 */
#define isoctal(c)	(((u_char)(c)) >= '0' && ((u_char)(c)) <= '7')
#define iswhite(c)	((c) == ' ' || (c) == '\t' || (c) == '\n')
#define issafe(c)	((c) == '\b' || (c) == BELL || (c) == '\r')
#define xtoa(c)		("0123456789abcdef"[(c)])
#define XTOA(c)		("0123456789ABCDEF"[(c)])

/* Upper bound on the characters MAKEEXTRALIST may append to the list. */
#define MAXEXTRAS	5

/*
 * MAKEEXTRALIST(flag, extra, orig_str)
 *
 * Store in `extra' a freshly malloc'ed copy of the NUL-terminated string
 * `orig_str', followed by the characters selected by `flag':
 *	VIS_SP  -> ' ',  VIS_TAB -> '\t',  VIS_NL -> '\n',
 *	and '\\' unless VIS_NOSLASH is set.
 * If malloc() fails `extra' is left NULL.  On success the caller owns
 * the buffer and must free() it.
 */
#define MAKEEXTRALIST(flag, extra, orig_str)				      \
do {									      \
	const char *mel_src = (orig_str);				      \
	size_t mel_len = strlen(mel_src);				      \
	char *mel_end;							      \
	(extra) = malloc(mel_len + 1 + MAXEXTRAS);			      \
	if (!(extra))							      \
		break;							      \
	memcpy((extra), mel_src, mel_len);				      \
	mel_end = (extra) + mel_len;					      \
	if ((flag) & VIS_SP)						      \
		*mel_end++ = ' ';					      \
	if ((flag) & VIS_TAB)						      \
		*mel_end++ = '\t';					      \
	if ((flag) & VIS_NL)						      \
		*mel_end++ = '\n';					      \
	if (((flag) & VIS_NOSLASH) == 0)				      \
		*mel_end++ = '\\';					      \
	*mel_end = '\0';						      \
} while (/*CONSTCOND*/0)
112
/*
 * do_hvis - HTTP style (RFC 1808) encoder for a single character.
 *
 * ASCII alphanumerics and the punctuation listed below are handed to
 * do_svis(); every other character becomes "%xx" with lower-case hex
 * digits.
 *
 * dst:   where to write the encoding
 * dlen:  remaining space in dst, or NULL for no limit; reduced by the
 *        number of bytes written
 * Returns the position just past the last byte written, or NULL if
 * fewer than three bytes remain for a "%xx" sequence.
 */
static char *
do_hvis(char *dst, size_t *dlen, int c, int flag, int nextc, const char *extra)
{
	int passthrough;

	switch (c) {
	/* safe */
	case '$': case '-': case '_': case '.': case '+':
	/* extra */
	case '!': case '*': case '\'': case '(': case ')':
	case ',':
		passthrough = 1;
		break;
	default:
		passthrough = isascii(c) && isalnum(c);
		break;
	}

	if (passthrough)
		return do_svis(dst, dlen, c, flag, nextc, extra);

	if (dlen != NULL) {
		if (*dlen < 3)
			return NULL;
		*dlen -= 3;
	}
	dst[0] = '%';
	dst[1] = xtoa(((unsigned int)c >> 4) & 0xf);
	dst[2] = xtoa((unsigned int)c & 0xf);
	return dst + 3;
}
140
/*
 * do_mvis - Quoted-Printable MIME (RFC 2045) encoder for one character.
 * NB: No handling of long lines or CRLF.
 *
 * A character other than '\n' is written as "=XX" (upper-case hex) when
 * it is whitespace directly followed by '\r' or '\n', when it is a
 * non-whitespace character outside 33..126 or the '=' sign itself, or
 * when it is one of "#$@[\]^`{|}~".  Everything else goes to do_svis().
 *
 * Returns the position just past the last byte written, or NULL if
 * fewer than three bytes remain for an "=XX" sequence.
 */
static char *
do_mvis(char *dst, size_t *dlen, int c, int flag, int nextc, const char *extra)
{
	int quote = 0;

	if (c != '\n') {
		if (isspace(c)) {
			/* Space at the end of the line */
			quote = (nextc == '\r' || nextc == '\n');
		} else {
			/* Out of range; 61 is the code of '=' */
			quote = (c < 33 || c == 61 || c > 126);
		}
		/* Specific char to be escaped */
		if (!quote)
			quote = strchr("#$@[\\]^`{|}~", c) != NULL;
	}

	if (!quote)
		return do_svis(dst, dlen, c, flag, nextc, extra);

	if (dlen != NULL) {
		if (*dlen < 3)
			return NULL;
		*dlen -= 3;
	}
	dst[0] = '=';
	dst[1] = XTOA(((unsigned int)c >> 4) & 0xf);
	dst[2] = XTOA((unsigned int)c & 0xf);
	return dst + 3;
}
168
169 /*
170 * This is do_vis, the central code of vis.
171 * dst: Pointer to the destination buffer
172 * c: Character to encode
173 * flag: Flag word
174 * nextc: The character following 'c'
175 * extra: Pointer to the list of extra characters to be
176 * backslash-protected.
177 */
178 static char *
179 do_svis(char *dst, size_t *dlen, int c, int flag, int nextc, const char *extra)
180 {
181 int isextra;
182 size_t odlen = dlen ? *dlen : 0;
183
184 isextra = strchr(extra, c) != NULL;
185 #define HAVE(x) \
186 do { \
187 if (dlen) { \
188 if (*dlen < (x)) \
189 goto out; \
190 *dlen -= (x); \
191 } \
192 } while (/*CONSTCOND*/0)
193 if (!isextra && isascii(c) && (isgraph(c) || iswhite(c) ||
194 ((flag & VIS_SAFE) && issafe(c)))) {
195 HAVE(1);
196 *dst++ = c;
197 return dst;
198 }
199 if (flag & VIS_CSTYLE) {
200 HAVE(2);
201 switch (c) {
202 case '\n':
203 *dst++ = '\\'; *dst++ = 'n';
204 return dst;
205 case '\r':
206 *dst++ = '\\'; *dst++ = 'r';
207 return dst;
208 case '\b':
209 *dst++ = '\\'; *dst++ = 'b';
210 return dst;
211 case BELL:
212 *dst++ = '\\'; *dst++ = 'a';
213 return dst;
214 case '\v':
215 *dst++ = '\\'; *dst++ = 'v';
216 return dst;
217 case '\t':
218 *dst++ = '\\'; *dst++ = 't';
219 return dst;
220 case '\f':
221 *dst++ = '\\'; *dst++ = 'f';
222 return dst;
223 case ' ':
224 *dst++ = '\\'; *dst++ = 's';
225 return dst;
226 case '\0':
227 *dst++ = '\\'; *dst++ = '0';
228 if (isoctal(nextc)) {
229 HAVE(2);
230 *dst++ = '0';
231 *dst++ = '0';
232 }
233 return dst;
234 default:
235 if (isgraph(c)) {
236 *dst++ = '\\'; *dst++ = c;
237 return dst;
238 }
239 if (dlen)
240 *dlen = odlen;
241 }
242 }
243 if (isextra || ((c & 0177) == ' ') || (flag & VIS_OCTAL)) {
244 HAVE(4);
245 *dst++ = '\\';
246 *dst++ = (u_char)(((u_int32_t)(u_char)c >> 6) & 03) + '0';
247 *dst++ = (u_char)(((u_int32_t)(u_char)c >> 3) & 07) + '0';
248 *dst++ = (c & 07) + '0';
249 } else {
250 if ((flag & VIS_NOSLASH) == 0) {
251 HAVE(1);
252 *dst++ = '\\';
253 }
254
255 if (c & 0200) {
256 HAVE(1);
257 c &= 0177; *dst++ = 'M';
258 }
259
260 if (iscntrl(c)) {
261 HAVE(2);
262 *dst++ = '^';
263 if (c == 0177)
264 *dst++ = '?';
265 else
266 *dst++ = c + '@';
267 } else {
268 HAVE(2);
269 *dst++ = '-'; *dst++ = c;
270 }
271 }
272 return dst;
273 out:
274 *dlen = odlen;
275 return NULL;
276 }
277
278 typedef char *(*visfun_t)(char *, size_t *, int, int, int, const char *);
279
280 /*
281 * Return the appropriate encoding function depending on the flags given.
282 */
283 static visfun_t
284 getvisfun(int flag)
285 {
286 if (flag & VIS_HTTPSTYLE)
287 return do_hvis;
288 if (flag & VIS_MIMESTYLE)
289 return do_mvis;
290 return do_svis;
291 }
292
293 /*
294 * isnvis - visually encode characters, also encoding the characters
295 * pointed to by `extra'
296 */
297 static char *
298 isnvis(char *dst, size_t *dlen, int c, int flag, int nextc, const char *extra)
299 {
300 char *nextra = NULL;
301 visfun_t f;
302
303 _DIAGASSERT(dst != NULL);
304 _DIAGASSERT(extra != NULL);
305 MAKEEXTRALIST(flag, nextra, extra);
306 if (!nextra) {
307 if (dlen && *dlen == 0) {
308 errno = ENOSPC;
309 return NULL;
310 }
311 *dst = '\0'; /* can't create nextra, return "" */
312 return dst;
313 }
314 f = getvisfun(flag);
315 dst = (*f)(dst, dlen, c, flag, nextc, nextra);
316 free(nextra);
317 if (dst == NULL || (dlen && *dlen == 0)) {
318 errno = ENOSPC;
319 return NULL;
320 }
321 *dst = '\0';
322 return dst;
323 }
324
/*
 * svis - encode the single character `c' into dst without an output
 * size limit, additionally encoding the characters listed in `extra'.
 * Returns whatever isnvis() returns.
 */
char *
svis(char *dst, int c, int flag, int nextc, const char *extra)
{
	char *end;

	end = isnvis(dst, NULL, c, flag, nextc, extra);
	return end;
}
330
/*
 * snvis - like svis(), but writes at most `dlen' bytes to dst.
 * Returns whatever isnvis() returns.
 */
char *
snvis(char *dst, size_t dlen, int c, int flag, int nextc, const char *extra)
{
	size_t room = dlen;
	char *end;

	end = isnvis(dst, &room, c, flag, nextc, extra);
	return end;
}
336
337
338 /*
339 * strsvis, strsvisx - visually encode characters from src into dst
340 *
341 * Extra is a pointer to a \0-terminated list of characters to
342 * be encoded, too. These functions are useful e. g. to
343 * encode strings in such a way so that they are not interpreted
344 * by a shell.
345 *
346 * Dst must be 4 times the size of src to account for possible
347 * expansion. The length of dst, not including the trailing NULL,
348 * is returned.
349 *
350 * Strsvisx encodes exactly len bytes from src into dst.
351 * This is useful for encoding a block of data.
352 */
353 static int
354 istrsnvis(char *dst, size_t *dlen, const char *csrc, int flag, const char *extra)
355 {
356 int c;
357 char *start;
358 char *nextra = NULL;
359 const unsigned char *src = (const unsigned char *)csrc;
360 visfun_t f;
361
362 _DIAGASSERT(dst != NULL);
363 _DIAGASSERT(src != NULL);
364 _DIAGASSERT(extra != NULL);
365 MAKEEXTRALIST(flag, nextra, extra);
366 if (!nextra) {
367 *dst = '\0'; /* can't create nextra, return "" */
368 return 0;
369 }
370 f = getvisfun(flag);
371 for (start = dst; (c = *src++) != '\0'; /* empty */) {
372 dst = (*f)(dst, dlen, c, flag, *src, nextra);
373 if (dst == NULL) {
374 errno = ENOSPC;
375 return -1;
376 }
377 }
378 free(nextra);
379 if (dlen && *dlen == 0) {
380 errno = ENOSPC;
381 return -1;
382 }
383 *dst = '\0';
384 return (int)(dst - start);
385 }
386
/*
 * strsvis - encode the NUL-terminated string csrc into dst without an
 * output size limit.  Returns whatever istrsnvis() returns.
 */
int
strsvis(char *dst, const char *csrc, int flag, const char *extra)
{
	int written;

	written = istrsnvis(dst, NULL, csrc, flag, extra);
	return written;
}
392
/*
 * strsnvis - like strsvis(), but writes at most `dlen' bytes to dst.
 * Returns whatever istrsnvis() returns.
 */
int
strsnvis(char *dst, size_t dlen, const char *csrc, int flag, const char *extra)
{
	size_t room = dlen;
	int written;

	written = istrsnvis(dst, &room, csrc, flag, extra);
	return written;
}
398
399 static int
400 istrsnvisx(char *dst, size_t *dlen, const char *csrc, size_t len, int flag,
401 const char *extra)
402 {
403 unsigned char c;
404 char *start;
405 char *nextra = NULL;
406 const unsigned char *src = (const unsigned char *)csrc;
407 visfun_t f;
408
409 _DIAGASSERT(dst != NULL);
410 _DIAGASSERT(src != NULL);
411 _DIAGASSERT(extra != NULL);
412 MAKEEXTRALIST(flag, nextra, extra);
413 if (! nextra) {
414 if (dlen && *dlen == 0) {
415 errno = ENOSPC;
416 return -1;
417 }
418 *dst = '\0'; /* can't create nextra, return "" */
419 return 0;
420 }
421
422 f = getvisfun(flag);
423 for (start = dst; len > 0; len--) {
424 c = *src++;
425 dst = (*f)(dst, dlen, c, flag, len > 1 ? *src : '\0', nextra);
426 if (dst == NULL) {
427 errno = ENOSPC;
428 return -1;
429 }
430 }
431 free(nextra);
432 if (dlen && *dlen == 0) {
433 errno = ENOSPC;
434 return -1;
435 }
436 *dst = '\0';
437 return (int)(dst - start);
438 }
439
/*
 * strsvisx - encode exactly `len' bytes of csrc into dst without an
 * output size limit.  Returns whatever istrsnvisx() returns.
 */
int
strsvisx(char *dst, const char *csrc, size_t len, int flag, const char *extra)
{
	int written;

	written = istrsnvisx(dst, NULL, csrc, len, flag, extra);
	return written;
}
445
/*
 * strsnvisx - like strsvisx(), but writes at most `dlen' bytes to dst.
 * Returns whatever istrsnvisx() returns.
 */
int
strsnvisx(char *dst, size_t dlen, const char *csrc, size_t len, int flag,
    const char *extra)
{
	size_t room = dlen;
	int written;

	written = istrsnvisx(dst, &room, csrc, len, flag, extra);
	return written;
}
452 #endif
453
454 #if !HAVE_VIS
455 /*
456 * vis - visually encode characters
457 */
458 static char *
459 invis(char *dst, size_t *dlen, int c, int flag, int nextc)
460 {
461 char *extra = NULL;
462 unsigned char uc = (unsigned char)c;
463 visfun_t f;
464
465 _DIAGASSERT(dst != NULL);
466
467 MAKEEXTRALIST(flag, extra, "");
468 if (! extra) {
469 if (dlen && *dlen == 0) {
470 errno = ENOSPC;
471 return NULL;
472 }
473 *dst = '\0'; /* can't create extra, return "" */
474 return dst;
475 }
476 f = getvisfun(flag);
477 dst = (*f)(dst, dlen, uc, flag, nextc, extra);
478 free(extra);
479 if (dst == NULL || (dlen && *dlen == 0)) {
480 errno = ENOSPC;
481 return NULL;
482 }
483 *dst = '\0';
484 return dst;
485 }
486
/*
 * vis - encode the single character `c' into dst without an output
 * size limit.  Returns whatever invis() returns.
 */
char *
vis(char *dst, int c, int flag, int nextc)
{
	char *end;

	end = invis(dst, NULL, c, flag, nextc);
	return end;
}
492
/*
 * nvis - like vis(), but writes at most `dlen' bytes to dst.
 * Returns whatever invis() returns.
 */
char *
nvis(char *dst, size_t dlen, int c, int flag, int nextc)
{
	size_t room = dlen;
	char *end;

	end = invis(dst, &room, c, flag, nextc);
	return end;
}
498
499
/*
 * strvis, strvisx - visually encode characters from src into dst
 *
 *	Dst must be 4 times the size of src, plus one byte for the
 *	terminating NUL, to account for possible expansion. The length
 *	of dst, not including the trailing NUL, is returned.
 *
 *	Strvisx encodes exactly len bytes from src into dst.
 *	This is useful for encoding a block of data.
 *
 * istrnvis is the common worker for strvis and strnvis.  It builds the
 * list of protected characters from `flag' alone and hands the work to
 * istrsnvis().  dlen points at the space available in dst, or is NULL
 * for no limit.  If the list cannot be allocated, an empty string is
 * produced and 0 is returned, or -1 with errno set to ENOSPC when no
 * space is left for the NUL.
 */
static int
istrnvis(char *dst, size_t *dlen, const char *src, int flag)
{
	char *protect = NULL;
	int written;

	MAKEEXTRALIST(flag, protect, "");
	if (protect != NULL) {
		written = istrsnvis(dst, dlen, src, flag, protect);
		free(protect);
		return written;
	}

	/* Allocation failed: return "" if there is room for the NUL. */
	if (dlen != NULL && *dlen == 0) {
		errno = ENOSPC;
		return -1;
	}
	*dst = '\0';
	return 0;
}
529
/*
 * strvis - encode the NUL-terminated string src into dst without an
 * output size limit.  Returns whatever istrnvis() returns.
 */
int
strvis(char *dst, const char *src, int flag)
{
	int written;

	written = istrnvis(dst, NULL, src, flag);
	return written;
}
535
/*
 * strnvis - like strvis(), but writes at most `dlen' bytes to dst.
 * Returns whatever istrnvis() returns.
 */
int
strnvis(char *dst, size_t dlen, const char *src, int flag)
{
	size_t room = dlen;
	int written;

	written = istrnvis(dst, &room, src, flag);
	return written;
}
541
/*
 * istrnvisx - common worker for strvisx and strnvisx.
 *
 * Builds the list of protected characters from `flag' alone and hands
 * the encoding of exactly `len' bytes of src to istrsnvisx().  dlen
 * points at the space available in dst, or is NULL for no limit.  If
 * the list cannot be allocated, an empty string is produced and 0 is
 * returned, or -1 with errno set to ENOSPC when no space is left for
 * the NUL.
 */
static int
istrnvisx(char *dst, size_t *dlen, const char *src, size_t len, int flag)
{
	char *protect = NULL;
	int written;

	MAKEEXTRALIST(flag, protect, "");
	if (protect != NULL) {
		written = istrsnvisx(dst, dlen, src, len, flag, protect);
		free(protect);
		return written;
	}

	/* Allocation failed: return "" if there is room for the NUL. */
	if (dlen != NULL && *dlen == 0) {
		errno = ENOSPC;
		return -1;
	}
	*dst = '\0';
	return 0;
}
561
/*
 * strvisx - encode exactly `len' bytes of src into dst without an
 * output size limit.  Returns whatever istrnvisx() returns.
 */
int
strvisx(char *dst, const char *src, size_t len, int flag)
{
	int written;

	written = istrnvisx(dst, NULL, src, len, flag);
	return written;
}
567
/*
 * strnvisx - like strvisx(), but writes at most `dlen' bytes to dst.
 * Returns whatever istrnvisx() returns.
 */
int
strnvisx(char *dst, size_t dlen, const char *src, size_t len, int flag)
{
	size_t room = dlen;
	int written;

	written = istrnvisx(dst, &room, src, len, flag);
	return written;
}
573
574 #endif
575