base64.c revision 1.1 1 1.1 mrg /*
2 1.1 mrg * Copyright (c) 1996 by Internet Software Consortium.
3 1.1 mrg *
4 1.1 mrg * Permission to use, copy, modify, and distribute this software for any
5 1.1 mrg * purpose with or without fee is hereby granted, provided that the above
6 1.1 mrg * copyright notice and this permission notice appear in all copies.
7 1.1 mrg *
8 1.1 mrg * THE SOFTWARE IS PROVIDED "AS IS" AND INTERNET SOFTWARE CONSORTIUM DISCLAIMS
9 1.1 mrg * ALL WARRANTIES WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES
10 1.1 mrg * OF MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL INTERNET SOFTWARE
11 1.1 mrg * CONSORTIUM BE LIABLE FOR ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL
12 1.1 mrg * DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR
13 1.1 mrg * PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS
14 1.1 mrg * ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS
15 1.1 mrg * SOFTWARE.
16 1.1 mrg */
17 1.1 mrg
18 1.1 mrg /*
19 1.1 mrg * Portions Copyright (c) 1995 by International Business Machines, Inc.
20 1.1 mrg *
21 1.1 mrg * International Business Machines, Inc. (hereinafter called IBM) grants
22 1.1 mrg * permission under its copyrights to use, copy, modify, and distribute this
23 1.1 mrg * Software with or without fee, provided that the above copyright notice and
24 1.1 mrg * all paragraphs of this notice appear in all copies, and that the name of IBM
25 1.1 mrg * not be used in connection with the marketing of any product incorporating
26 1.1 mrg * the Software or modifications thereof, without specific, written prior
27 1.1 mrg * permission.
28 1.1 mrg *
29 1.1 mrg * To the extent it has a right to do so, IBM grants an immunity from suit
30 1.1 mrg * under its patents, if any, for the use, sale or manufacture of products to
31 1.1 mrg * the extent that such products are used for performing Domain Name System
32 1.1 mrg * dynamic updates in TCP/IP networks by means of the Software. No immunity is
33 1.1 mrg * granted for any product per se or for any other function of any product.
34 1.1 mrg *
35 1.1 mrg * THE SOFTWARE IS PROVIDED "AS IS", AND IBM DISCLAIMS ALL WARRANTIES,
36 1.1 mrg * INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A
37 1.1 mrg * PARTICULAR PURPOSE. IN NO EVENT SHALL IBM BE LIABLE FOR ANY SPECIAL,
38 1.1 mrg * DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES WHATSOEVER ARISING
39 1.1 mrg * OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE, EVEN
40 1.1 mrg * IF IBM IS APPRISED OF THE POSSIBILITY OF SUCH DAMAGES.
41 1.1 mrg */
42 1.1 mrg
43 1.1 mrg #include <sys/types.h>
44 1.1 mrg #include <sys/param.h>
45 1.1 mrg #include <sys/socket.h>
46 1.1 mrg #include <netinet/in.h>
47 1.1 mrg #include <arpa/inet.h>
48 1.1 mrg #include <arpa/nameser.h>
49 1.1 mrg
50 1.1 mrg #include <ctype.h>
51 1.1 mrg #include <resolv.h>
52 1.1 mrg #include <stdio.h>
53 1.1 mrg
54 1.1 mrg #if defined(BSD) && (BSD >= 199103) && defined(AF_INET6)
55 1.1 mrg # include <stdlib.h>
56 1.1 mrg # include <string.h>
57 1.1 mrg #else
58 1.1 mrg # include "../conf/portability.h"
59 1.1 mrg #endif
60 1.1 mrg
61 1.1 mrg #define Assert(Cond) if (!(Cond)) abort()
62 1.1 mrg
63 1.1 mrg static const char Base64[] =
64 1.1 mrg "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/";
65 1.1 mrg static const char Pad64 = '=';
66 1.1 mrg
67 1.1 mrg /* (From RFC1521 and draft-ietf-dnssec-secext-03.txt)
68 1.1 mrg The following encoding technique is taken from RFC 1521 by Borenstein
69 1.1 mrg and Freed. It is reproduced here in a slightly edited form for
70 1.1 mrg convenience.
71 1.1 mrg
72 1.1 mrg A 65-character subset of US-ASCII is used, enabling 6 bits to be
73 1.1 mrg represented per printable character. (The extra 65th character, "=",
74 1.1 mrg is used to signify a special processing function.)
75 1.1 mrg
76 1.1 mrg The encoding process represents 24-bit groups of input bits as output
77 1.1 mrg strings of 4 encoded characters. Proceeding from left to right, a
78 1.1 mrg 24-bit input group is formed by concatenating 3 8-bit input groups.
79 1.1 mrg These 24 bits are then treated as 4 concatenated 6-bit groups, each
80 1.1 mrg of which is translated into a single digit in the base64 alphabet.
81 1.1 mrg
82 1.1 mrg Each 6-bit group is used as an index into an array of 64 printable
83 1.1 mrg characters. The character referenced by the index is placed in the
84 1.1 mrg output string.
85 1.1 mrg
86 1.1 mrg Table 1: The Base64 Alphabet
87 1.1 mrg
88 1.1 mrg Value Encoding Value Encoding Value Encoding Value Encoding
89 1.1 mrg 0 A 17 R 34 i 51 z
90 1.1 mrg 1 B 18 S 35 j 52 0
91 1.1 mrg 2 C 19 T 36 k 53 1
92 1.1 mrg 3 D 20 U 37 l 54 2
93 1.1 mrg 4 E 21 V 38 m 55 3
94 1.1 mrg 5 F 22 W 39 n 56 4
95 1.1 mrg 6 G 23 X 40 o 57 5
96 1.1 mrg 7 H 24 Y 41 p 58 6
97 1.1 mrg 8 I 25 Z 42 q 59 7
98 1.1 mrg 9 J 26 a 43 r 60 8
99 1.1 mrg 10 K 27 b 44 s 61 9
100 1.1 mrg 11 L 28 c 45 t 62 +
101 1.1 mrg 12 M 29 d 46 u 63 /
102 1.1 mrg 13 N 30 e 47 v
103 1.1 mrg 14 O 31 f 48 w (pad) =
104 1.1 mrg 15 P 32 g 49 x
105 1.1 mrg 16 Q 33 h 50 y
106 1.1 mrg
107 1.1 mrg Special processing is performed if fewer than 24 bits are available
108 1.1 mrg at the end of the data being encoded. A full encoding quantum is
109 1.1 mrg always completed at the end of a quantity. When fewer than 24 input
110 1.1 mrg bits are available in an input group, zero bits are added (on the
111 1.1 mrg right) to form an integral number of 6-bit groups. Padding at the
112 1.1 mrg end of the data is performed using the '=' character.
113 1.1 mrg
114 1.1 mrg Since all base64 input is an integral number of octets, only the
115 1.1 mrg -------------------------------------------------
116 1.1 mrg following cases can arise:
117 1.1 mrg
118 1.1 mrg (1) the final quantum of encoding input is an integral
119 1.1 mrg multiple of 24 bits; here, the final unit of encoded
120 1.1 mrg output will be an integral multiple of 4 characters
121 1.1 mrg with no "=" padding,
122 1.1 mrg (2) the final quantum of encoding input is exactly 8 bits;
123 1.1 mrg here, the final unit of encoded output will be two
124 1.1 mrg characters followed by two "=" padding characters, or
125 1.1 mrg (3) the final quantum of encoding input is exactly 16 bits;
126 1.1 mrg here, the final unit of encoded output will be three
127 1.1 mrg characters followed by one "=" padding character.
128 1.1 mrg */
129 1.1 mrg
130 1.1 mrg int
131 1.1 mrg b64_ntop(src, srclength, target, targsize)
132 1.1 mrg u_char const *src;
133 1.1 mrg size_t srclength;
134 1.1 mrg char *target;
135 1.1 mrg size_t targsize;
136 1.1 mrg {
137 1.1 mrg size_t datalength = 0;
138 1.1 mrg u_char input[3];
139 1.1 mrg u_char output[4];
140 1.1 mrg int i;
141 1.1 mrg
142 1.1 mrg while (2 < srclength) {
143 1.1 mrg input[0] = *src++;
144 1.1 mrg input[1] = *src++;
145 1.1 mrg input[2] = *src++;
146 1.1 mrg srclength -= 3;
147 1.1 mrg
148 1.1 mrg output[0] = input[0] >> 2;
149 1.1 mrg output[1] = ((input[0] & 0x03) << 4) + (input[1] >> 4);
150 1.1 mrg output[2] = ((input[1] & 0x0f) << 2) + (input[2] >> 6);
151 1.1 mrg output[3] = input[2] & 0x3f;
152 1.1 mrg Assert(output[0] < 64);
153 1.1 mrg Assert(output[1] < 64);
154 1.1 mrg Assert(output[2] < 64);
155 1.1 mrg Assert(output[3] < 64);
156 1.1 mrg
157 1.1 mrg if (datalength + 4 > targsize)
158 1.1 mrg return (-1);
159 1.1 mrg target[datalength++] = Base64[output[0]];
160 1.1 mrg target[datalength++] = Base64[output[1]];
161 1.1 mrg target[datalength++] = Base64[output[2]];
162 1.1 mrg target[datalength++] = Base64[output[3]];
163 1.1 mrg }
164 1.1 mrg
165 1.1 mrg /* Now we worry about padding. */
166 1.1 mrg if (0 != srclength) {
167 1.1 mrg /* Get what's left. */
168 1.1 mrg input[0] = input[1] = input[2] = '\0';
169 1.1 mrg for (i = 0; i < srclength; i++)
170 1.1 mrg input[i] = *src++;
171 1.1 mrg
172 1.1 mrg output[0] = input[0] >> 2;
173 1.1 mrg output[1] = ((input[0] & 0x03) << 4) + (input[1] >> 4);
174 1.1 mrg output[2] = ((input[1] & 0x0f) << 2) + (input[2] >> 6);
175 1.1 mrg Assert(output[0] < 64);
176 1.1 mrg Assert(output[1] < 64);
177 1.1 mrg Assert(output[2] < 64);
178 1.1 mrg
179 1.1 mrg if (datalength + 4 > targsize)
180 1.1 mrg return (-1);
181 1.1 mrg target[datalength++] = Base64[output[0]];
182 1.1 mrg target[datalength++] = Base64[output[1]];
183 1.1 mrg if (srclength == 1)
184 1.1 mrg target[datalength++] = Pad64;
185 1.1 mrg else
186 1.1 mrg target[datalength++] = Base64[output[2]];
187 1.1 mrg target[datalength++] = Pad64;
188 1.1 mrg }
189 1.1 mrg if (datalength >= targsize)
190 1.1 mrg return (-1);
191 1.1 mrg target[datalength] = '\0'; /* Returned value doesn't count \0. */
192 1.1 mrg return (datalength);
193 1.1 mrg }
194 1.1 mrg
195 1.1 mrg /* skips all whitespace anywhere.
196 1.1 mrg converts characters, four at a time, starting at (or after)
197 1.1 mrg src from base - 64 numbers into three 8 bit bytes in the target area.
198 1.1 mrg it returns the number of data bytes stored at the target, or -1 on error.
199 1.1 mrg */
200 1.1 mrg
201 1.1 mrg int
202 1.1 mrg b64_pton(src, target, targsize)
203 1.1 mrg char const *src;
204 1.1 mrg u_char *target;
205 1.1 mrg size_t targsize;
206 1.1 mrg {
207 1.1 mrg int tarindex, state, ch;
208 1.1 mrg char *pos;
209 1.1 mrg
210 1.1 mrg state = 0;
211 1.1 mrg tarindex = 0;
212 1.1 mrg
213 1.1 mrg while ((ch = *src++) != '\0') {
214 1.1 mrg if (isspace(ch)) /* Skip whitespace anywhere. */
215 1.1 mrg continue;
216 1.1 mrg
217 1.1 mrg if (ch == Pad64)
218 1.1 mrg break;
219 1.1 mrg
220 1.1 mrg pos = strchr(Base64, ch);
221 1.1 mrg if (pos == 0) /* A non-base64 character. */
222 1.1 mrg return (-1);
223 1.1 mrg
224 1.1 mrg switch (state) {
225 1.1 mrg case 0:
226 1.1 mrg if (target) {
227 1.1 mrg if (tarindex >= targsize)
228 1.1 mrg return (-1);
229 1.1 mrg target[tarindex] = (pos - Base64) << 2;
230 1.1 mrg }
231 1.1 mrg state = 1;
232 1.1 mrg break;
233 1.1 mrg case 1:
234 1.1 mrg if (target) {
235 1.1 mrg if (tarindex + 1 >= targsize)
236 1.1 mrg return (-1);
237 1.1 mrg target[tarindex] |= (pos - Base64) >> 4;
238 1.1 mrg target[tarindex+1] = ((pos - Base64) & 0x0f)
239 1.1 mrg << 4 ;
240 1.1 mrg }
241 1.1 mrg tarindex++;
242 1.1 mrg state = 2;
243 1.1 mrg break;
244 1.1 mrg case 2:
245 1.1 mrg if (target) {
246 1.1 mrg if (tarindex + 1 >= targsize)
247 1.1 mrg return (-1);
248 1.1 mrg target[tarindex] |= (pos - Base64) >> 2;
249 1.1 mrg target[tarindex+1] = ((pos - Base64) & 0x03)
250 1.1 mrg << 6;
251 1.1 mrg }
252 1.1 mrg tarindex++;
253 1.1 mrg state = 3;
254 1.1 mrg break;
255 1.1 mrg case 3:
256 1.1 mrg if (target) {
257 1.1 mrg if (tarindex >= targsize)
258 1.1 mrg return (-1);
259 1.1 mrg target[tarindex] |= (pos - Base64);
260 1.1 mrg }
261 1.1 mrg tarindex++;
262 1.1 mrg state = 0;
263 1.1 mrg break;
264 1.1 mrg default:
265 1.1 mrg abort();
266 1.1 mrg }
267 1.1 mrg }
268 1.1 mrg
269 1.1 mrg /*
270 1.1 mrg * We are done decoding Base-64 chars. Let's see if we ended
271 1.1 mrg * on a byte boundary, and/or with erroneous trailing characters.
272 1.1 mrg */
273 1.1 mrg
274 1.1 mrg if (ch == Pad64) { /* We got a pad char. */
275 1.1 mrg ch = *src++; /* Skip it, get next. */
276 1.1 mrg switch (state) {
277 1.1 mrg case 0: /* Invalid = in first position */
278 1.1 mrg case 1: /* Invalid = in second position */
279 1.1 mrg return (-1);
280 1.1 mrg
281 1.1 mrg case 2: /* Valid, means one byte of info */
282 1.1 mrg /* Skip any number of spaces. */
283 1.1 mrg for (NULL; ch != '\0'; ch = *src++)
284 1.1 mrg if (!isspace(ch))
285 1.1 mrg break;
286 1.1 mrg /* Make sure there is another trailing = sign. */
287 1.1 mrg if (ch != Pad64)
288 1.1 mrg return (-1);
289 1.1 mrg ch = *src++; /* Skip the = */
290 1.1 mrg /* Fall through to "single trailing =" case. */
291 1.1 mrg /* FALLTHROUGH */
292 1.1 mrg
293 1.1 mrg case 3: /* Valid, means two bytes of info */
294 1.1 mrg /*
295 1.1 mrg * We know this char is an =. Is there anything but
296 1.1 mrg * whitespace after it?
297 1.1 mrg */
298 1.1 mrg for (NULL; ch != '\0'; ch = *src++)
299 1.1 mrg if (!isspace(ch))
300 1.1 mrg return (-1);
301 1.1 mrg
302 1.1 mrg /*
303 1.1 mrg * Now make sure for cases 2 and 3 that the "extra"
304 1.1 mrg * bits that slopped past the last full byte were
305 1.1 mrg * zeros. If we don't check them, they become a
306 1.1 mrg * subliminal channel.
307 1.1 mrg */
308 1.1 mrg if (target && target[tarindex] != 0)
309 1.1 mrg return (-1);
310 1.1 mrg }
311 1.1 mrg } else {
312 1.1 mrg /*
313 1.1 mrg * We ended by seeing the end of the string. Make sure we
314 1.1 mrg * have no partial bytes lying around.
315 1.1 mrg */
316 1.1 mrg if (state != 0)
317 1.1 mrg return (-1);
318 1.1 mrg }
319 1.1 mrg
320 1.1 mrg return (tarindex);
321 1.1 mrg }
322