vis.c revision 1.45 1 /* $NetBSD: vis.c,v 1.45 2012/12/14 21:38:18 christos Exp $ */
2
3 /*-
4 * Copyright (c) 1989, 1993
5 * The Regents of the University of California. All rights reserved.
6 *
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following conditions
9 * are met:
10 * 1. Redistributions of source code must retain the above copyright
11 * notice, this list of conditions and the following disclaimer.
12 * 2. Redistributions in binary form must reproduce the above copyright
13 * notice, this list of conditions and the following disclaimer in the
14 * documentation and/or other materials provided with the distribution.
15 * 3. Neither the name of the University nor the names of its contributors
16 * may be used to endorse or promote products derived from this software
17 * without specific prior written permission.
18 *
19 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
20 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
21 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
22 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
23 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
24 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
25 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
26 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
27 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
28 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29 * SUCH DAMAGE.
30 */
31
32 /*-
33 * Copyright (c) 1999, 2005 The NetBSD Foundation, Inc.
34 * All rights reserved.
35 *
36 * Redistribution and use in source and binary forms, with or without
37 * modification, are permitted provided that the following conditions
38 * are met:
39 * 1. Redistributions of source code must retain the above copyright
40 * notice, this list of conditions and the following disclaimer.
41 * 2. Redistributions in binary form must reproduce the above copyright
42 * notice, this list of conditions and the following disclaimer in the
43 * documentation and/or other materials provided with the distribution.
44 *
45 * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
46 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
47 * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
48 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
49 * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
50 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
51 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
52 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
53 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
54 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
55 * POSSIBILITY OF SUCH DAMAGE.
56 */
57
58 #include <sys/cdefs.h>
59 #if defined(LIBC_SCCS) && !defined(lint)
60 __RCSID("$NetBSD: vis.c,v 1.45 2012/12/14 21:38:18 christos Exp $");
61 #endif /* LIBC_SCCS and not lint */
62
63 #include "namespace.h"
64 #include <sys/types.h>
65
66 #include <assert.h>
67 #include <vis.h>
68 #include <errno.h>
69 #include <stdlib.h>
70
71 #ifdef __weak_alias
72 __weak_alias(strvisx,_strvisx)
73 #endif
74
75 #if !HAVE_VIS || !HAVE_SVIS
76 #include <ctype.h>
77 #include <limits.h>
78 #include <stdio.h>
79 #include <string.h>
80
/*
 * Forward declaration: do_hvis() and do_mvis() hand characters they do not
 * encode themselves to do_svis(), which is defined after them.
 */
static char *do_svis(char *dst, size_t *dlen, int c, int flag, int nextc,
    const char *extra);

/* Use the C alert escape for BELL regardless of any earlier definition. */
#undef BELL
#define BELL '\a'

/*
 * Character-class helpers.  Each use of the argument is parenthesized so
 * that an expression argument (for example a ?: or | expression) is
 * classified as a whole instead of being split by operator precedence.
 * The argument is evaluated more than once, so it must be free of side
 * effects.
 */
#define isoctal(c)	(((unsigned char)(c)) >= '0' && ((unsigned char)(c)) <= '7')
#define iswhite(c)	((c) == ' ' || (c) == '\t' || (c) == '\n')
#define issafe(c)	((c) == '\b' || (c) == BELL || (c) == '\r')

/* Map a value in the range 0..15 to its lower-/upper-case hex digit. */
#define xtoa(c)		("0123456789abcdef"[(c)])
#define XTOA(c)		("0123456789ABCDEF"[(c)])
91
/*
 * Slack added to the allocation made by MAKEEXTRALIST; it covers the at
 * most eight characters the macro appends.
 */
#define MAXEXTRAS	9

/*
 * MAKEEXTRALIST(flag, extra, orig_str)
 *
 * Store in `extra' a freshly malloc()ed, NUL-terminated list consisting of
 * the characters of `orig_str' followed by the characters selected by
 * `flag':
 *	VIS_GLOB		'*', '?', '[' and '#'
 *	VIS_SP			' '
 *	VIS_TAB			'\t'
 *	VIS_NL			'\n'
 *	VIS_NOSLASH not set	'\\'
 * If the allocation fails `extra' is set to NULL and nothing else is done.
 * The caller owns the list and releases it with free().
 *
 * `flag' and `orig_str' are evaluated exactly once and every parameter is
 * parenthesized, so arbitrary expressions may be passed.  The temporaries
 * carry a mel_ prefix and trailing underscore so that caller arguments
 * named orig, o or e are not captured by the expansion.
 */
#define MAKEEXTRALIST(flag, extra, orig_str)				\
do {									\
	const int mel_flag_ = (flag);					\
	const char *const mel_orig_ = (orig_str);			\
	const char *mel_src_ = mel_orig_;				\
	char *mel_dst_;							\
	while (*mel_src_++)						\
		continue;						\
	(extra) = malloc((size_t)((mel_src_ - mel_orig_) + MAXEXTRAS));	\
	if (!(extra))							\
		break;							\
	for (mel_src_ = mel_orig_, mel_dst_ = (extra);			\
	    (*mel_dst_++ = *mel_src_++) != '\0';)			\
		continue;						\
	mel_dst_--;							\
	if (mel_flag_ & VIS_GLOB) {					\
		*mel_dst_++ = '*';					\
		*mel_dst_++ = '?';					\
		*mel_dst_++ = '[';					\
		*mel_dst_++ = '#';					\
	}								\
	if (mel_flag_ & VIS_SP)						\
		*mel_dst_++ = ' ';					\
	if (mel_flag_ & VIS_TAB)					\
		*mel_dst_++ = '\t';					\
	if (mel_flag_ & VIS_NL)						\
		*mel_dst_++ = '\n';					\
	if ((mel_flag_ & VIS_NOSLASH) == 0)				\
		*mel_dst_++ = '\\';					\
	*mel_dst_ = '\0';						\
} while (/*CONSTCOND*/0)
118
/*
 * do_hvis - encode one character HTTP style (RFC 1808).
 *
 * ASCII letters and digits and the characters $ - _ . + ! * ' ( ) , are
 * delegated to do_svis().  Any other character is written as '%' followed
 * by two lower-case hexadecimal digits built from the low eight bits of c.
 *
 * If dlen is non-NULL it holds the room left at dst: three bytes are
 * claimed for an escape, and NULL is returned when fewer are available.
 * Otherwise the position following the last byte written is returned.
 */
static char *
do_hvis(char *dst, size_t *dlen, int c, int flag, int nextc, const char *extra)
{
	int delegate;

	switch (c) {
	/* safe */
	case '$': case '-': case '_': case '.': case '+':
	/* extra */
	case '!': case '*': case '\'': case '(': case ')': case ',':
		delegate = 1;
		break;
	default:
		delegate = isascii(c) && isalnum(c);
		break;
	}
	if (delegate)
		return do_svis(dst, dlen, c, flag, nextc, extra);

	if (dlen != NULL) {
		if (*dlen < 3)
			return NULL;
		*dlen -= 3;
	}
	dst[0] = '%';
	dst[1] = xtoa(((unsigned int)c >> 4) & 0xf);
	dst[2] = xtoa((unsigned int)c & 0xf);
	return dst + 3;
}
146
/*
 * do_mvis - encode one character as Quoted-Printable MIME (RFC 2045).
 * NB: long lines and CRLF receive no special handling.
 *
 * A character other than '\n' is written as '=' followed by two upper-case
 * hexadecimal digits when it is
 *   - white space directly followed by '\r' or '\n',
 *   - not white space and below 33, equal to 61 ('=') or above 126, or
 *   - one of # $ @ [ \ ] ^ ` { | } ~
 * Everything else is delegated to do_svis().
 *
 * If dlen is non-NULL it holds the room left at dst: three bytes are
 * claimed for an escape, and NULL is returned when fewer are available.
 */
static char *
do_mvis(char *dst, size_t *dlen, int c, int flag, int nextc, const char *extra)
{
	int quote = 0;

	if (c != '\n') {
		if (isspace(c)) {
			/* Space at the end of the line */
			quote = (nextc == '\r' || nextc == '\n');
		} else {
			/* Out of range */
			quote = (c < 33 || c == 61 || c > 126);
		}
		/* Specific char to be escaped */
		if (!quote)
			quote = strchr("#$@[\\]^`{|}~", c) != NULL;
	}

	if (!quote)
		return do_svis(dst, dlen, c, flag, nextc, extra);

	if (dlen != NULL) {
		if (*dlen < 3)
			return NULL;
		*dlen -= 3;
	}
	dst[0] = '=';
	dst[1] = XTOA(((unsigned int)c >> 4) & 0xf);
	dst[2] = XTOA((unsigned int)c & 0xf);
	return dst + 3;
}
174
175 /*
176 * This is do_vis, the central code of vis.
177 * dst: Pointer to the destination buffer
178 * c: Character to encode
179 * flag: Flag word
180 * nextc: The character following 'c'
181 * extra: Pointer to the list of extra characters to be
182 * backslash-protected.
183 */
184 static char *
185 do_svis(char *dst, size_t *dlen, int c, int flag, int nextc, const char *extra)
186 {
187 int isextra;
188 size_t odlen = dlen ? *dlen : 0;
189
190 isextra = strchr(extra, c) != NULL;
191 #define HAVE(x) \
192 do { \
193 if (dlen) { \
194 if (*dlen < (x)) \
195 goto out; \
196 *dlen -= (x); \
197 } \
198 } while (/*CONSTCOND*/0)
199 if (!isextra && isascii(c) && (isgraph(c) || iswhite(c) ||
200 ((flag & VIS_SAFE) && issafe(c)))) {
201 HAVE(1);
202 *dst++ = c;
203 return dst;
204 }
205 if (flag & VIS_CSTYLE) {
206 HAVE(2);
207 switch (c) {
208 case '\n':
209 *dst++ = '\\'; *dst++ = 'n';
210 return dst;
211 case '\r':
212 *dst++ = '\\'; *dst++ = 'r';
213 return dst;
214 case '\b':
215 *dst++ = '\\'; *dst++ = 'b';
216 return dst;
217 case BELL:
218 *dst++ = '\\'; *dst++ = 'a';
219 return dst;
220 case '\v':
221 *dst++ = '\\'; *dst++ = 'v';
222 return dst;
223 case '\t':
224 *dst++ = '\\'; *dst++ = 't';
225 return dst;
226 case '\f':
227 *dst++ = '\\'; *dst++ = 'f';
228 return dst;
229 case ' ':
230 *dst++ = '\\'; *dst++ = 's';
231 return dst;
232 case '\0':
233 *dst++ = '\\'; *dst++ = '0';
234 if (isoctal(nextc)) {
235 HAVE(2);
236 *dst++ = '0';
237 *dst++ = '0';
238 }
239 return dst;
240 default:
241 if (isgraph(c)) {
242 *dst++ = '\\'; *dst++ = c;
243 return dst;
244 }
245 if (dlen)
246 *dlen = odlen;
247 }
248 }
249 if (isextra || ((c & 0177) == ' ') || (flag & VIS_OCTAL)) {
250 HAVE(4);
251 *dst++ = '\\';
252 *dst++ = (u_char)(((u_int32_t)(u_char)c >> 6) & 03) + '0';
253 *dst++ = (u_char)(((u_int32_t)(u_char)c >> 3) & 07) + '0';
254 *dst++ = (c & 07) + '0';
255 } else {
256 if ((flag & VIS_NOSLASH) == 0) {
257 HAVE(1);
258 *dst++ = '\\';
259 }
260
261 if (c & 0200) {
262 HAVE(1);
263 c &= 0177; *dst++ = 'M';
264 }
265
266 if (iscntrl(c)) {
267 HAVE(2);
268 *dst++ = '^';
269 if (c == 0177)
270 *dst++ = '?';
271 else
272 *dst++ = c + '@';
273 } else {
274 HAVE(2);
275 *dst++ = '-'; *dst++ = c;
276 }
277 }
278 return dst;
279 out:
280 *dlen = odlen;
281 return NULL;
282 }
283
284 typedef char *(*visfun_t)(char *, size_t *, int, int, int, const char *);
285
286 /*
287 * Return the appropriate encoding function depending on the flags given.
288 */
289 static visfun_t
290 getvisfun(int flag)
291 {
292 if (flag & VIS_HTTPSTYLE)
293 return do_hvis;
294 if (flag & VIS_MIMESTYLE)
295 return do_mvis;
296 return do_svis;
297 }
298
299 /*
300 * isnvis - visually encode characters, also encoding the characters
301 * pointed to by `extra'
302 */
303 static char *
304 isnvis(char *dst, size_t *dlen, int c, int flag, int nextc, const char *extra)
305 {
306 char *nextra = NULL;
307 visfun_t f;
308
309 _DIAGASSERT(dst != NULL);
310 _DIAGASSERT(extra != NULL);
311 MAKEEXTRALIST(flag, nextra, extra);
312 if (!nextra) {
313 if (dlen && *dlen == 0) {
314 errno = ENOSPC;
315 return NULL;
316 }
317 *dst = '\0'; /* can't create nextra, return "" */
318 return dst;
319 }
320 f = getvisfun(flag);
321 dst = (*f)(dst, dlen, c, flag, nextc, nextra);
322 free(nextra);
323 if (dst == NULL || (dlen && *dlen == 0)) {
324 errno = ENOSPC;
325 return NULL;
326 }
327 *dst = '\0';
328 return dst;
329 }
330
/*
 * svis - encode the single character c into dst without bounds checking,
 * also encoding the characters listed in `extra'.  Returns what isnvis()
 * returns.
 */
char *
svis(char *dst, int c, int flag, int nextc, const char *extra)
{
	/* A NULL length pointer switches the space accounting off. */
	size_t *const unbounded = NULL;

	return isnvis(dst, unbounded, c, flag, nextc, extra);
}
336
/*
 * snvis - like svis(), but dst offers only dlen bytes.  Returns what
 * isnvis() returns.
 */
char *
snvis(char *dst, size_t dlen, int c, int flag, int nextc, const char *extra)
{
	size_t room = dlen;

	return isnvis(dst, &room, c, flag, nextc, extra);
}
342
343
344 /*
345 * strsvis, strsvisx - visually encode characters from src into dst
346 *
347 * Extra is a pointer to a \0-terminated list of characters to
348 * be encoded, too. These functions are useful e. g. to
349 * encode strings in such a way so that they are not interpreted
350 * by a shell.
351 *
352 * Dst must be 4 times the size of src to account for possible
353 * expansion. The length of dst, not including the trailing NULL,
354 * is returned.
355 *
356 * Strsvisx encodes exactly len bytes from src into dst.
357 * This is useful for encoding a block of data.
358 */
359 static int
360 istrsnvis(char *dst, size_t *dlen, const char *csrc, int flag, const char *extra)
361 {
362 int c;
363 char *start;
364 char *nextra = NULL;
365 const unsigned char *src = (const unsigned char *)csrc;
366 visfun_t f;
367
368 _DIAGASSERT(dst != NULL);
369 _DIAGASSERT(src != NULL);
370 _DIAGASSERT(extra != NULL);
371 MAKEEXTRALIST(flag, nextra, extra);
372 if (!nextra) {
373 *dst = '\0'; /* can't create nextra, return "" */
374 return 0;
375 }
376 f = getvisfun(flag);
377 for (start = dst; (c = *src++) != '\0'; /* empty */) {
378 dst = (*f)(dst, dlen, c, flag, *src, nextra);
379 if (dst == NULL) {
380 errno = ENOSPC;
381 return -1;
382 }
383 }
384 free(nextra);
385 if (dlen && *dlen == 0) {
386 errno = ENOSPC;
387 return -1;
388 }
389 *dst = '\0';
390 return (int)(dst - start);
391 }
392
/*
 * strsvis - encode the NUL-terminated string csrc into dst without bounds
 * checking, also encoding the characters listed in `extra'.  Returns what
 * istrsnvis() returns.
 */
int
strsvis(char *dst, const char *csrc, int flag, const char *extra)
{
	/* A NULL length pointer switches the space accounting off. */
	size_t *const unbounded = NULL;

	return istrsnvis(dst, unbounded, csrc, flag, extra);
}
398
/*
 * strsnvis - like strsvis(), but dst offers only dlen bytes.  Returns what
 * istrsnvis() returns.
 */
int
strsnvis(char *dst, size_t dlen, const char *csrc, int flag, const char *extra)
{
	size_t room = dlen;

	return istrsnvis(dst, &room, csrc, flag, extra);
}
404
405 static int
406 istrsnvisx(char *dst, size_t *dlen, const char *csrc, size_t len, int flag,
407 const char *extra)
408 {
409 unsigned char c;
410 char *start;
411 char *nextra = NULL;
412 const unsigned char *src = (const unsigned char *)csrc;
413 visfun_t f;
414
415 _DIAGASSERT(dst != NULL);
416 _DIAGASSERT(src != NULL);
417 _DIAGASSERT(extra != NULL);
418 MAKEEXTRALIST(flag, nextra, extra);
419 if (! nextra) {
420 if (dlen && *dlen == 0) {
421 errno = ENOSPC;
422 return -1;
423 }
424 *dst = '\0'; /* can't create nextra, return "" */
425 return 0;
426 }
427
428 f = getvisfun(flag);
429 for (start = dst; len > 0; len--) {
430 c = *src++;
431 dst = (*f)(dst, dlen, c, flag, len > 1 ? *src : '\0', nextra);
432 if (dst == NULL) {
433 errno = ENOSPC;
434 return -1;
435 }
436 }
437 free(nextra);
438 if (dlen && *dlen == 0) {
439 errno = ENOSPC;
440 return -1;
441 }
442 *dst = '\0';
443 return (int)(dst - start);
444 }
445
/*
 * strsvisx - encode exactly len bytes of csrc into dst without bounds
 * checking, also encoding the characters listed in `extra'.  Returns what
 * istrsnvisx() returns.
 */
int
strsvisx(char *dst, const char *csrc, size_t len, int flag, const char *extra)
{
	/* A NULL length pointer switches the space accounting off. */
	size_t *const unbounded = NULL;

	return istrsnvisx(dst, unbounded, csrc, len, flag, extra);
}
451
/*
 * strsnvisx - like strsvisx(), but dst offers only dlen bytes.  Returns
 * what istrsnvisx() returns.
 */
int
strsnvisx(char *dst, size_t dlen, const char *csrc, size_t len, int flag,
    const char *extra)
{
	size_t room = dlen;

	return istrsnvisx(dst, &room, csrc, len, flag, extra);
}
458 #endif
459
460 #if !HAVE_VIS
461 /*
462 * vis - visually encode characters
463 */
464 static char *
465 invis(char *dst, size_t *dlen, int c, int flag, int nextc)
466 {
467 char *extra = NULL;
468 unsigned char uc = (unsigned char)c;
469 visfun_t f;
470
471 _DIAGASSERT(dst != NULL);
472
473 MAKEEXTRALIST(flag, extra, "");
474 if (! extra) {
475 if (dlen && *dlen == 0) {
476 errno = ENOSPC;
477 return NULL;
478 }
479 *dst = '\0'; /* can't create extra, return "" */
480 return dst;
481 }
482 f = getvisfun(flag);
483 dst = (*f)(dst, dlen, uc, flag, nextc, extra);
484 free(extra);
485 if (dst == NULL || (dlen && *dlen == 0)) {
486 errno = ENOSPC;
487 return NULL;
488 }
489 *dst = '\0';
490 return dst;
491 }
492
/*
 * vis - encode the single character c into dst without bounds checking.
 * Returns what invis() returns.
 */
char *
vis(char *dst, int c, int flag, int nextc)
{
	/* A NULL length pointer switches the space accounting off. */
	size_t *const unbounded = NULL;

	return invis(dst, unbounded, c, flag, nextc);
}
498
/*
 * nvis - like vis(), but dst offers only dlen bytes.  Returns what invis()
 * returns.
 */
char *
nvis(char *dst, size_t dlen, int c, int flag, int nextc)
{
	size_t room = dlen;

	return invis(dst, &room, c, flag, nextc);
}
504
505
/*
 * strvis, strvisx - visually encode characters from src into dst
 *
 *	Each source character expands to at most four bytes, so dst
 *	must hold four times the length of src plus one byte for the
 *	terminating NUL.  The length of dst, not including the
 *	trailing NUL, is returned.
 *
 *	Strvisx encodes exactly len bytes from src into dst.
 *	This is useful for encoding a block of data.
 *
 * istrnvis is the common back end of strvis() and strnvis().  It builds
 * the list of characters implied by `flag' and passes it to istrsnvis()
 * as the extra list.  If that list cannot be allocated, an empty string is
 * stored and 0 is returned, or -1 with errno set to ENOSPC when *dlen is 0.
 */
static int
istrnvis(char *dst, size_t *dlen, const char *src, int flag)
{
	char *flagchars = NULL;
	int length;

	MAKEEXTRALIST(flag, flagchars, "");
	if (flagchars != NULL) {
		length = istrsnvis(dst, dlen, src, flag, flagchars);
		free(flagchars);
		return length;
	}

	/* can't create the list: return "" if there is room for it */
	if (dlen != NULL && *dlen == 0) {
		errno = ENOSPC;
		return -1;
	}
	*dst = '\0';
	return 0;
}
535
/*
 * strvis - encode the NUL-terminated string src into dst without bounds
 * checking.  Returns what istrnvis() returns.
 */
int
strvis(char *dst, const char *src, int flag)
{
	/* A NULL length pointer switches the space accounting off. */
	size_t *const unbounded = NULL;

	return istrnvis(dst, unbounded, src, flag);
}
541
/*
 * strnvis - like strvis(), but dst offers only dlen bytes.  Returns what
 * istrnvis() returns.
 */
int
strnvis(char *dst, size_t dlen, const char *src, int flag)
{
	size_t room = dlen;

	return istrnvis(dst, &room, src, flag);
}
547
/*
 * istrnvisx - common back end of strvisx() and strnvisx().
 *
 * Builds the list of characters implied by `flag' and passes it to
 * istrsnvisx() as the extra list, encoding exactly len bytes of src.  If
 * that list cannot be allocated, an empty string is stored and 0 is
 * returned, or -1 with errno set to ENOSPC when *dlen is 0.
 */
static int
istrnvisx(char *dst, size_t *dlen, const char *src, size_t len, int flag)
{
	char *flagchars = NULL;
	int length;

	MAKEEXTRALIST(flag, flagchars, "");
	if (flagchars != NULL) {
		length = istrsnvisx(dst, dlen, src, len, flag, flagchars);
		free(flagchars);
		return length;
	}

	/* can't create the list: return "" if there is room for it */
	if (dlen != NULL && *dlen == 0) {
		errno = ENOSPC;
		return -1;
	}
	*dst = '\0';
	return 0;
}
567
/*
 * strvisx - encode exactly len bytes of src into dst without bounds
 * checking.  Returns what istrnvisx() returns.
 */
int
strvisx(char *dst, const char *src, size_t len, int flag)
{
	/* A NULL length pointer switches the space accounting off. */
	size_t *const unbounded = NULL;

	return istrnvisx(dst, unbounded, src, len, flag);
}
573
/*
 * strnvisx - like strvisx(), but dst offers only dlen bytes.  Returns what
 * istrnvisx() returns.
 */
int
strnvisx(char *dst, size_t dlen, const char *src, size_t len, int flag)
{
	size_t room = dlen;

	return istrnvisx(dst, &room, src, len, flag);
}
579
580 #endif
581