base64.c revision 1.11.6.2 1 1.11.6.2 christos /* $NetBSD: base64.c,v 1.11.6.2 2008/06/21 20:41:49 christos Exp $ */
2 1.11.6.2 christos
3 1.11.6.2 christos /*
4 1.11.6.2 christos * Copyright (c) 2004 by Internet Systems Consortium, Inc. ("ISC")
5 1.11.6.2 christos * Copyright (c) 1996-1999 by Internet Software Consortium.
6 1.11.6.2 christos *
7 1.11.6.2 christos * Permission to use, copy, modify, and distribute this software for any
8 1.11.6.2 christos * purpose with or without fee is hereby granted, provided that the above
9 1.11.6.2 christos * copyright notice and this permission notice appear in all copies.
10 1.11.6.2 christos *
11 1.11.6.2 christos * THE SOFTWARE IS PROVIDED "AS IS" AND ISC DISCLAIMS ALL WARRANTIES
12 1.11.6.2 christos * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
13 1.11.6.2 christos * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL ISC BE LIABLE FOR
14 1.11.6.2 christos * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
15 1.11.6.2 christos * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
16 1.11.6.2 christos * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT
17 1.11.6.2 christos * OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
18 1.11.6.2 christos */
19 1.11.6.2 christos
20 1.11.6.2 christos /*
21 1.11.6.2 christos * Portions Copyright (c) 1995 by International Business Machines, Inc.
22 1.11.6.2 christos *
23 1.11.6.2 christos * International Business Machines, Inc. (hereinafter called IBM) grants
24 1.11.6.2 christos * permission under its copyrights to use, copy, modify, and distribute this
25 1.11.6.2 christos * Software with or without fee, provided that the above copyright notice and
26 1.11.6.2 christos * all paragraphs of this notice appear in all copies, and that the name of IBM
27 1.11.6.2 christos * not be used in connection with the marketing of any product incorporating
28 1.11.6.2 christos * the Software or modifications thereof, without specific, written prior
29 1.11.6.2 christos * permission.
30 1.11.6.2 christos *
31 1.11.6.2 christos * To the extent it has a right to do so, IBM grants an immunity from suit
32 1.11.6.2 christos * under its patents, if any, for the use, sale or manufacture of products to
33 1.11.6.2 christos * the extent that such products are used for performing Domain Name System
34 1.11.6.2 christos * dynamic updates in TCP/IP networks by means of the Software. No immunity is
35 1.11.6.2 christos * granted for any product per se or for any other function of any product.
36 1.11.6.2 christos *
37 1.11.6.2 christos * THE SOFTWARE IS PROVIDED "AS IS", AND IBM DISCLAIMS ALL WARRANTIES,
38 1.11.6.2 christos * INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A
39 1.11.6.2 christos * PARTICULAR PURPOSE. IN NO EVENT SHALL IBM BE LIABLE FOR ANY SPECIAL,
40 1.11.6.2 christos * DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES WHATSOEVER ARISING
41 1.11.6.2 christos * OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE, EVEN
42 1.11.6.2 christos * IF IBM IS APPRISED OF THE POSSIBILITY OF SUCH DAMAGES.
43 1.11.6.2 christos */
44 1.11.6.2 christos
45 1.11.6.2 christos #include <sys/cdefs.h>
46 1.11.6.2 christos #if defined(LIBC_SCCS) && !defined(lint)
47 1.11.6.2 christos #if 0
48 1.11.6.2 christos static const char rcsid[] = "Id: base64.c,v 1.4 2005/04/27 04:56:34 sra Exp";
49 1.11.6.2 christos #else
50 1.11.6.2 christos __RCSID("$NetBSD: base64.c,v 1.11.6.2 2008/06/21 20:41:49 christos Exp $");
51 1.11.6.2 christos #endif
52 1.11.6.2 christos #endif /* LIBC_SCCS and not lint */
53 1.11.6.2 christos
54 1.11.6.2 christos #include "port_before.h"
55 1.11.6.2 christos
56 1.11.6.2 christos #include <sys/types.h>
57 1.11.6.2 christos #include <sys/param.h>
58 1.11.6.2 christos #include <sys/socket.h>
59 1.11.6.2 christos
60 1.11.6.2 christos #include <netinet/in.h>
61 1.11.6.2 christos #include <arpa/inet.h>
62 1.11.6.2 christos #include <arpa/nameser.h>
63 1.11.6.2 christos
64 1.11.6.2 christos #include <assert.h>
65 1.11.6.2 christos #include <ctype.h>
66 1.11.6.2 christos #include <resolv.h>
67 1.11.6.2 christos #include <stdio.h>
68 1.11.6.2 christos #include <stdlib.h>
69 1.11.6.2 christos #include <string.h>
70 1.11.6.2 christos
71 1.11.6.2 christos #include "port_after.h"
72 1.11.6.2 christos
/*
 * Abort the process when Cond evaluates to false.
 *
 * The expansion is wrapped in do { } while (0) so that it behaves as a
 * single statement: a bare "if" expansion would capture an "else" that
 * follows an unbraced use such as
 *	if (x) Assert(y); else ...
 */
#define Assert(Cond) do { if (!(Cond)) abort(); } while (0)
74 1.11.6.2 christos
/*
 * The 64-character encoding alphabet, indexed by 6-bit value:
 * 0-25 upper case, 26-51 lower case, 52-61 digits, then '+' and '/'.
 */
static const char Base64[] =
	"ABCDEFGHIJKLMNOPQRSTUVWXYZ"
	"abcdefghijklmnopqrstuvwxyz"
	"0123456789"
	"+/";

/* Character used to pad a short final group out to four characters. */
static const char Pad64 = '=';
78 1.11.6.2 christos
79 1.11.6.2 christos /* (From RFC1521 and draft-ietf-dnssec-secext-03.txt)
80 1.11.6.2 christos The following encoding technique is taken from RFC1521 by Borenstein
81 1.11.6.2 christos and Freed. It is reproduced here in a slightly edited form for
82 1.11.6.2 christos convenience.
83 1.11.6.2 christos
84 1.11.6.2 christos A 65-character subset of US-ASCII is used, enabling 6 bits to be
85 1.11.6.2 christos represented per printable character. (The extra 65th character, "=",
86 1.11.6.2 christos is used to signify a special processing function.)
87 1.11.6.2 christos
88 1.11.6.2 christos The encoding process represents 24-bit groups of input bits as output
89 1.11.6.2 christos strings of 4 encoded characters. Proceeding from left to right, a
90 1.11.6.2 christos 24-bit input group is formed by concatenating 3 8-bit input groups.
91 1.11.6.2 christos These 24 bits are then treated as 4 concatenated 6-bit groups, each
92 1.11.6.2 christos of which is translated into a single digit in the base64 alphabet.
93 1.11.6.2 christos
94 1.11.6.2 christos Each 6-bit group is used as an index into an array of 64 printable
95 1.11.6.2 christos characters. The character referenced by the index is placed in the
96 1.11.6.2 christos output string.
97 1.11.6.2 christos
                    Table 1: The Base64 Alphabet

      Value Encoding  Value Encoding  Value Encoding  Value Encoding
          0 A            17 R            34 i            51 z
          1 B            18 S            35 j            52 0
          2 C            19 T            36 k            53 1
          3 D            20 U            37 l            54 2
          4 E            21 V            38 m            55 3
          5 F            22 W            39 n            56 4
          6 G            23 X            40 o            57 5
          7 H            24 Y            41 p            58 6
          8 I            25 Z            42 q            59 7
          9 J            26 a            43 r            60 8
         10 K            27 b            44 s            61 9
         11 L            28 c            45 t            62 +
         12 M            29 d            46 u            63 /
         13 N            30 e            47 v
         14 O            31 f            48 w         (pad) =
         15 P            32 g            49 x
         16 Q            33 h            50 y
118 1.11.6.2 christos
119 1.11.6.2 christos Special processing is performed if fewer than 24 bits are available
120 1.11.6.2 christos at the end of the data being encoded. A full encoding quantum is
121 1.11.6.2 christos always completed at the end of a quantity. When fewer than 24 input
122 1.11.6.2 christos bits are available in an input group, zero bits are added (on the
123 1.11.6.2 christos right) to form an integral number of 6-bit groups. Padding at the
124 1.11.6.2 christos end of the data is performed using the '=' character.
125 1.11.6.2 christos
   Since all base64 input is an integral number of octets, only the
         -------------------------------------------------
   following cases can arise:
129 1.11.6.2 christos
130 1.11.6.2 christos (1) the final quantum of encoding input is an integral
131 1.11.6.2 christos multiple of 24 bits; here, the final unit of encoded
132 1.11.6.2 christos output will be an integral multiple of 4 characters
133 1.11.6.2 christos with no "=" padding,
134 1.11.6.2 christos (2) the final quantum of encoding input is exactly 8 bits;
135 1.11.6.2 christos here, the final unit of encoded output will be two
136 1.11.6.2 christos characters followed by two "=" padding characters, or
137 1.11.6.2 christos (3) the final quantum of encoding input is exactly 16 bits;
138 1.11.6.2 christos here, the final unit of encoded output will be three
139 1.11.6.2 christos characters followed by one "=" padding character.
140 1.11.6.2 christos */
141 1.11.6.2 christos
142 1.11.6.2 christos int
143 1.11.6.2 christos b64_ntop(u_char const *src, size_t srclength, char *target, size_t targsize) {
144 1.11.6.2 christos size_t datalength = 0;
145 1.11.6.2 christos u_char input[3];
146 1.11.6.2 christos u_char output[4];
147 1.11.6.2 christos size_t i;
148 1.11.6.2 christos
149 1.11.6.2 christos _DIAGASSERT(src != NULL);
150 1.11.6.2 christos _DIAGASSERT(target != NULL);
151 1.11.6.2 christos
152 1.11.6.2 christos while (2U < srclength) {
153 1.11.6.2 christos input[0] = *src++;
154 1.11.6.2 christos input[1] = *src++;
155 1.11.6.2 christos input[2] = *src++;
156 1.11.6.2 christos srclength -= 3;
157 1.11.6.2 christos
158 1.11.6.2 christos output[0] = (u_int32_t)input[0] >> 2;
159 1.11.6.2 christos output[1] = ((u_int32_t)(input[0] & 0x03) << 4) +
160 1.11.6.2 christos ((u_int32_t)input[1] >> 4);
161 1.11.6.2 christos output[2] = ((u_int32_t)(input[1] & 0x0f) << 2) +
162 1.11.6.2 christos ((u_int32_t)input[2] >> 6);
163 1.11.6.2 christos output[3] = input[2] & 0x3f;
164 1.11.6.2 christos Assert(output[0] < 64);
165 1.11.6.2 christos Assert(output[1] < 64);
166 1.11.6.2 christos Assert(output[2] < 64);
167 1.11.6.2 christos Assert(output[3] < 64);
168 1.11.6.2 christos
169 1.11.6.2 christos if (datalength + 4 > targsize)
170 1.11.6.2 christos return (-1);
171 1.11.6.2 christos target[datalength++] = Base64[output[0]];
172 1.11.6.2 christos target[datalength++] = Base64[output[1]];
173 1.11.6.2 christos target[datalength++] = Base64[output[2]];
174 1.11.6.2 christos target[datalength++] = Base64[output[3]];
175 1.11.6.2 christos }
176 1.11.6.2 christos
177 1.11.6.2 christos /* Now we worry about padding. */
178 1.11.6.2 christos if (0U != srclength) {
179 1.11.6.2 christos /* Get what's left. */
180 1.11.6.2 christos input[0] = input[1] = input[2] = '\0';
181 1.11.6.2 christos for (i = 0; i < srclength; i++)
182 1.11.6.2 christos input[i] = *src++;
183 1.11.6.2 christos
184 1.11.6.2 christos output[0] = (u_int32_t)input[0] >> 2;
185 1.11.6.2 christos output[1] = ((u_int32_t)(input[0] & 0x03) << 4) +
186 1.11.6.2 christos ((u_int32_t)input[1] >> 4);
187 1.11.6.2 christos output[2] = ((u_int32_t)(input[1] & 0x0f) << 2) +
188 1.11.6.2 christos ((u_int32_t)input[2] >> 6);
189 1.11.6.2 christos Assert(output[0] < 64);
190 1.11.6.2 christos Assert(output[1] < 64);
191 1.11.6.2 christos Assert(output[2] < 64);
192 1.11.6.2 christos
193 1.11.6.2 christos if (datalength + 4 > targsize)
194 1.11.6.2 christos return (-1);
195 1.11.6.2 christos target[datalength++] = Base64[output[0]];
196 1.11.6.2 christos target[datalength++] = Base64[output[1]];
197 1.11.6.2 christos if (srclength == 1U)
198 1.11.6.2 christos target[datalength++] = Pad64;
199 1.11.6.2 christos else
200 1.11.6.2 christos target[datalength++] = Base64[output[2]];
201 1.11.6.2 christos target[datalength++] = Pad64;
202 1.11.6.2 christos }
203 1.11.6.2 christos if (datalength >= targsize)
204 1.11.6.2 christos return (-1);
205 1.11.6.2 christos target[datalength] = '\0'; /*%< Returned value doesn't count \\0. */
206 1.11.6.2 christos return (datalength);
207 1.11.6.2 christos }
208 1.11.6.2 christos
209 1.11.6.2 christos /* skips all whitespace anywhere.
210 1.11.6.2 christos converts characters, four at a time, starting at (or after)
211 1.11.6.2 christos src from base - 64 numbers into three 8 bit bytes in the target area.
212 1.11.6.2 christos it returns the number of data bytes stored at the target, or -1 on error.
213 1.11.6.2 christos */
214 1.11.6.2 christos
215 1.11.6.2 christos int
216 1.11.6.2 christos b64_pton(src, target, targsize)
217 1.11.6.2 christos char const *src;
218 1.11.6.2 christos u_char *target;
219 1.11.6.2 christos size_t targsize;
220 1.11.6.2 christos {
221 1.11.6.2 christos size_t tarindex;
222 1.11.6.2 christos int state, ch;
223 1.11.6.2 christos char *pos;
224 1.11.6.2 christos
225 1.11.6.2 christos _DIAGASSERT(src != NULL);
226 1.11.6.2 christos _DIAGASSERT(target != NULL);
227 1.11.6.2 christos
228 1.11.6.2 christos state = 0;
229 1.11.6.2 christos tarindex = 0;
230 1.11.6.2 christos
231 1.11.6.2 christos while ((ch = (u_char) *src++) != '\0') {
232 1.11.6.2 christos if (isspace(ch)) /*%< Skip whitespace anywhere. */
233 1.11.6.2 christos continue;
234 1.11.6.2 christos
235 1.11.6.2 christos if (ch == Pad64)
236 1.11.6.2 christos break;
237 1.11.6.2 christos
238 1.11.6.2 christos pos = strchr(Base64, ch);
239 1.11.6.2 christos if (pos == 0) /*%< A non-base64 character. */
240 1.11.6.2 christos return (-1);
241 1.11.6.2 christos
242 1.11.6.2 christos switch (state) {
243 1.11.6.2 christos case 0:
244 1.11.6.2 christos if (target) {
245 1.11.6.2 christos if ((size_t)tarindex >= targsize)
246 1.11.6.2 christos return (-1);
247 1.11.6.2 christos target[tarindex] = (pos - Base64) << 2;
248 1.11.6.2 christos }
249 1.11.6.2 christos state = 1;
250 1.11.6.2 christos break;
251 1.11.6.2 christos case 1:
252 1.11.6.2 christos if (target) {
253 1.11.6.2 christos if ((size_t)tarindex + 1 >= targsize)
254 1.11.6.2 christos return (-1);
255 1.11.6.2 christos target[tarindex] |=
256 1.11.6.2 christos (u_int32_t)(pos - Base64) >> 4;
257 1.11.6.2 christos target[tarindex+1] = ((pos - Base64) & 0x0f)
258 1.11.6.2 christos << 4 ;
259 1.11.6.2 christos }
260 1.11.6.2 christos tarindex++;
261 1.11.6.2 christos state = 2;
262 1.11.6.2 christos break;
263 1.11.6.2 christos case 2:
264 1.11.6.2 christos if (target) {
265 1.11.6.2 christos if ((size_t)tarindex + 1 >= targsize)
266 1.11.6.2 christos return (-1);
267 1.11.6.2 christos target[tarindex] |=
268 1.11.6.2 christos (u_int32_t)(pos - Base64) >> 2;
269 1.11.6.2 christos target[tarindex+1] = ((pos - Base64) & 0x03)
270 1.11.6.2 christos << 6;
271 1.11.6.2 christos }
272 1.11.6.2 christos tarindex++;
273 1.11.6.2 christos state = 3;
274 1.11.6.2 christos break;
275 1.11.6.2 christos case 3:
276 1.11.6.2 christos if (target) {
277 1.11.6.2 christos if ((size_t)tarindex >= targsize)
278 1.11.6.2 christos return (-1);
279 1.11.6.2 christos target[tarindex] |= (pos - Base64);
280 1.11.6.2 christos }
281 1.11.6.2 christos tarindex++;
282 1.11.6.2 christos state = 0;
283 1.11.6.2 christos break;
284 1.11.6.2 christos default:
285 1.11.6.2 christos abort();
286 1.11.6.2 christos }
287 1.11.6.2 christos }
288 1.11.6.2 christos
289 1.11.6.2 christos /*
290 1.11.6.2 christos * We are done decoding Base-64 chars. Let's see if we ended
291 1.11.6.2 christos * on a byte boundary, and/or with erroneous trailing characters.
292 1.11.6.2 christos */
293 1.11.6.2 christos
294 1.11.6.2 christos if (ch == Pad64) { /*%< We got a pad char. */
295 1.11.6.2 christos ch = *src++; /*%< Skip it, get next. */
296 1.11.6.2 christos switch (state) {
297 1.11.6.2 christos case 0: /*%< Invalid = in first position */
298 1.11.6.2 christos case 1: /*%< Invalid = in second position */
299 1.11.6.2 christos return (-1);
300 1.11.6.2 christos
301 1.11.6.2 christos case 2: /*%< Valid, means one byte of info */
302 1.11.6.2 christos /* Skip any number of spaces. */
303 1.11.6.2 christos for (; ch != '\0'; ch = (u_char) *src++)
304 1.11.6.2 christos if (!isspace(ch))
305 1.11.6.2 christos break;
306 1.11.6.2 christos /* Make sure there is another trailing = sign. */
307 1.11.6.2 christos if (ch != Pad64)
308 1.11.6.2 christos return (-1);
309 1.11.6.2 christos ch = *src++; /*%< Skip the = */
310 1.11.6.2 christos /* Fall through to "single trailing =" case. */
311 1.11.6.2 christos /* FALLTHROUGH */
312 1.11.6.2 christos
313 1.11.6.2 christos case 3: /*%< Valid, means two bytes of info */
314 1.11.6.2 christos /*
315 1.11.6.2 christos * We know this char is an =. Is there anything but
316 1.11.6.2 christos * whitespace after it?
317 1.11.6.2 christos */
318 1.11.6.2 christos for (; ch != '\0'; ch = (u_char) *src++)
319 1.11.6.2 christos if (!isspace(ch))
320 1.11.6.2 christos return (-1);
321 1.11.6.2 christos
322 1.11.6.2 christos /*
323 1.11.6.2 christos * Now make sure for cases 2 and 3 that the "extra"
324 1.11.6.2 christos * bits that slopped past the last full byte were
325 1.11.6.2 christos * zeros. If we don't check them, they become a
326 1.11.6.2 christos * subliminal channel.
327 1.11.6.2 christos */
328 1.11.6.2 christos if (target && target[tarindex] != 0)
329 1.11.6.2 christos return (-1);
330 1.11.6.2 christos }
331 1.11.6.2 christos } else {
332 1.11.6.2 christos /*
333 1.11.6.2 christos * We ended by seeing the end of the string. Make sure we
334 1.11.6.2 christos * have no partial bytes lying around.
335 1.11.6.2 christos */
336 1.11.6.2 christos if (state != 0)
337 1.11.6.2 christos return (-1);
338 1.11.6.2 christos }
339 1.11.6.2 christos
340 1.11.6.2 christos return (tarindex);
341 1.11.6.2 christos }
342 1.11.6.2 christos
343 1.11.6.2 christos /*! \file */
344