Home | History | Annotate | Line # | Download | only in net
base64.c revision 1.8
      1  1.8   thorpej /*	$NetBSD: base64.c,v 1.8 2002/11/11 01:15:17 thorpej Exp $	*/
      2  1.2       mrg 
      3  1.1       mrg /*
      4  1.1       mrg  * Copyright (c) 1996 by Internet Software Consortium.
      5  1.1       mrg  *
      6  1.1       mrg  * Permission to use, copy, modify, and distribute this software for any
      7  1.1       mrg  * purpose with or without fee is hereby granted, provided that the above
      8  1.1       mrg  * copyright notice and this permission notice appear in all copies.
      9  1.1       mrg  *
     10  1.1       mrg  * THE SOFTWARE IS PROVIDED "AS IS" AND INTERNET SOFTWARE CONSORTIUM DISCLAIMS
     11  1.1       mrg  * ALL WARRANTIES WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES
     12  1.1       mrg  * OF MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL INTERNET SOFTWARE
     13  1.1       mrg  * CONSORTIUM BE LIABLE FOR ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL
     14  1.1       mrg  * DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR
     15  1.1       mrg  * PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS
     16  1.1       mrg  * ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS
     17  1.1       mrg  * SOFTWARE.
     18  1.1       mrg  */
     19  1.1       mrg 
     20  1.1       mrg /*
     21  1.1       mrg  * Portions Copyright (c) 1995 by International Business Machines, Inc.
     22  1.1       mrg  *
     23  1.1       mrg  * International Business Machines, Inc. (hereinafter called IBM) grants
     24  1.1       mrg  * permission under its copyrights to use, copy, modify, and distribute this
     25  1.1       mrg  * Software with or without fee, provided that the above copyright notice and
     26  1.1       mrg  * all paragraphs of this notice appear in all copies, and that the name of IBM
     27  1.1       mrg  * not be used in connection with the marketing of any product incorporating
     28  1.1       mrg  * the Software or modifications thereof, without specific, written prior
     29  1.1       mrg  * permission.
     30  1.1       mrg  *
     31  1.1       mrg  * To the extent it has a right to do so, IBM grants an immunity from suit
     32  1.1       mrg  * under its patents, if any, for the use, sale or manufacture of products to
     33  1.1       mrg  * the extent that such products are used for performing Domain Name System
     34  1.1       mrg  * dynamic updates in TCP/IP networks by means of the Software.  No immunity is
     35  1.1       mrg  * granted for any product per se or for any other function of any product.
     36  1.1       mrg  *
     37  1.1       mrg  * THE SOFTWARE IS PROVIDED "AS IS", AND IBM DISCLAIMS ALL WARRANTIES,
     38  1.1       mrg  * INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A
     39  1.1       mrg  * PARTICULAR PURPOSE.  IN NO EVENT SHALL IBM BE LIABLE FOR ANY SPECIAL,
     40  1.1       mrg  * DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES WHATSOEVER ARISING
     41  1.1       mrg  * OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE, EVEN
     42  1.1       mrg  * IF IBM IS APPRISED OF THE POSSIBILITY OF SUCH DAMAGES.
     43  1.1       mrg  */
     44  1.2       mrg 
     45  1.3  christos #include <sys/cdefs.h>
     46  1.2       mrg #if defined(LIBC_SCCS) && !defined(lint)
     47  1.8   thorpej __RCSID("$NetBSD: base64.c,v 1.8 2002/11/11 01:15:17 thorpej Exp $");
     48  1.2       mrg #endif /* LIBC_SCCS and not lint */
     49  1.2       mrg 
     50  1.1       mrg #include <sys/types.h>
     51  1.1       mrg #include <sys/param.h>
     52  1.1       mrg #include <sys/socket.h>
     53  1.1       mrg #include <netinet/in.h>
     54  1.1       mrg #include <arpa/inet.h>
     55  1.1       mrg #include <arpa/nameser.h>
     56  1.1       mrg 
     57  1.5     lukem #include <assert.h>
     58  1.1       mrg #include <ctype.h>
     59  1.1       mrg #include <resolv.h>
     60  1.1       mrg #include <stdio.h>
     61  1.1       mrg 
     62  1.1       mrg #if defined(BSD) && (BSD >= 199103) && defined(AF_INET6)
     63  1.1       mrg # include <stdlib.h>
     64  1.1       mrg # include <string.h>
     65  1.1       mrg #else
     66  1.1       mrg # include "../conf/portability.h"
     67  1.1       mrg #endif
     68  1.1       mrg 
     69  1.1       mrg #define Assert(Cond) if (!(Cond)) abort()
     70  1.1       mrg 
     71  1.1       mrg static const char Base64[] =
     72  1.1       mrg 	"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/";
     73  1.1       mrg static const char Pad64 = '=';
     74  1.1       mrg 
     75  1.1       mrg /* (From RFC1521 and draft-ietf-dnssec-secext-03.txt)
     76  1.1       mrg    The following encoding technique is taken from RFC 1521 by Borenstein
     77  1.1       mrg    and Freed.  It is reproduced here in a slightly edited form for
     78  1.1       mrg    convenience.
     79  1.1       mrg 
     80  1.1       mrg    A 65-character subset of US-ASCII is used, enabling 6 bits to be
     81  1.1       mrg    represented per printable character. (The extra 65th character, "=",
     82  1.1       mrg    is used to signify a special processing function.)
     83  1.1       mrg 
     84  1.1       mrg    The encoding process represents 24-bit groups of input bits as output
     85  1.1       mrg    strings of 4 encoded characters. Proceeding from left to right, a
     86  1.1       mrg    24-bit input group is formed by concatenating 3 8-bit input groups.
     87  1.1       mrg    These 24 bits are then treated as 4 concatenated 6-bit groups, each
     88  1.1       mrg    of which is translated into a single digit in the base64 alphabet.
     89  1.1       mrg 
     90  1.1       mrg    Each 6-bit group is used as an index into an array of 64 printable
     91  1.1       mrg    characters. The character referenced by the index is placed in the
     92  1.1       mrg    output string.
     93  1.1       mrg 
     94  1.1       mrg                          Table 1: The Base64 Alphabet
     95  1.1       mrg 
     96  1.1       mrg       Value Encoding  Value Encoding  Value Encoding  Value Encoding
     97  1.1       mrg           0 A            17 R            34 i            51 z
     98  1.1       mrg           1 B            18 S            35 j            52 0
     99  1.1       mrg           2 C            19 T            36 k            53 1
    100  1.1       mrg           3 D            20 U            37 l            54 2
    101  1.1       mrg           4 E            21 V            38 m            55 3
    102  1.1       mrg           5 F            22 W            39 n            56 4
    103  1.1       mrg           6 G            23 X            40 o            57 5
    104  1.1       mrg           7 H            24 Y            41 p            58 6
    105  1.1       mrg           8 I            25 Z            42 q            59 7
    106  1.1       mrg           9 J            26 a            43 r            60 8
    107  1.1       mrg          10 K            27 b            44 s            61 9
    108  1.1       mrg          11 L            28 c            45 t            62 +
    109  1.1       mrg          12 M            29 d            46 u            63 /
    110  1.1       mrg          13 N            30 e            47 v
    111  1.1       mrg          14 O            31 f            48 w         (pad) =
    112  1.1       mrg          15 P            32 g            49 x
    113  1.1       mrg          16 Q            33 h            50 y
    114  1.1       mrg 
    115  1.1       mrg    Special processing is performed if fewer than 24 bits are available
    116  1.1       mrg    at the end of the data being encoded.  A full encoding quantum is
    117  1.1       mrg    always completed at the end of a quantity.  When fewer than 24 input
    118  1.1       mrg    bits are available in an input group, zero bits are added (on the
    119  1.1       mrg    right) to form an integral number of 6-bit groups.  Padding at the
    120  1.1       mrg    end of the data is performed using the '=' character.
    121  1.1       mrg 
    122  1.1       mrg    Since all base64 input is an integral number of octets, only the
    123  1.1       mrg          -------------------------------------------------
    124  1.1       mrg    following cases can arise:
    125  1.1       mrg 
    126  1.1       mrg        (1) the final quantum of encoding input is an integral
    127  1.1       mrg            multiple of 24 bits; here, the final unit of encoded
    128  1.1       mrg 	   output will be an integral multiple of 4 characters
    129  1.1       mrg 	   with no "=" padding,
    130  1.1       mrg        (2) the final quantum of encoding input is exactly 8 bits;
    131  1.1       mrg            here, the final unit of encoded output will be two
    132  1.1       mrg 	   characters followed by two "=" padding characters, or
    133  1.1       mrg        (3) the final quantum of encoding input is exactly 16 bits;
    134  1.1       mrg            here, the final unit of encoded output will be three
    135  1.1       mrg 	   characters followed by one "=" padding character.
    136  1.1       mrg    */
    137  1.1       mrg 
    138  1.1       mrg int
    139  1.1       mrg b64_ntop(src, srclength, target, targsize)
    140  1.1       mrg 	u_char const *src;
    141  1.1       mrg 	size_t srclength;
    142  1.1       mrg 	char *target;
    143  1.1       mrg 	size_t targsize;
    144  1.1       mrg {
    145  1.1       mrg 	size_t datalength = 0;
    146  1.1       mrg 	u_char input[3];
    147  1.1       mrg 	u_char output[4];
    148  1.8   thorpej 	size_t i;
    149  1.1       mrg 
    150  1.5     lukem 	_DIAGASSERT(src != NULL);
    151  1.5     lukem 	_DIAGASSERT(target != NULL);
    152  1.5     lukem 
    153  1.1       mrg 	while (2 < srclength) {
    154  1.1       mrg 		input[0] = *src++;
    155  1.1       mrg 		input[1] = *src++;
    156  1.1       mrg 		input[2] = *src++;
    157  1.1       mrg 		srclength -= 3;
    158  1.1       mrg 
    159  1.4  christos 		output[0] = (u_int32_t)input[0] >> 2;
    160  1.4  christos 		output[1] = ((u_int32_t)(input[0] & 0x03) << 4) +
    161  1.4  christos 		    ((u_int32_t)input[1] >> 4);
    162  1.4  christos 		output[2] = ((u_int32_t)(input[1] & 0x0f) << 2) +
    163  1.4  christos 		    ((u_int32_t)input[2] >> 6);
    164  1.1       mrg 		output[3] = input[2] & 0x3f;
    165  1.1       mrg 		Assert(output[0] < 64);
    166  1.1       mrg 		Assert(output[1] < 64);
    167  1.1       mrg 		Assert(output[2] < 64);
    168  1.1       mrg 		Assert(output[3] < 64);
    169  1.1       mrg 
    170  1.1       mrg 		if (datalength + 4 > targsize)
    171  1.1       mrg 			return (-1);
    172  1.1       mrg 		target[datalength++] = Base64[output[0]];
    173  1.1       mrg 		target[datalength++] = Base64[output[1]];
    174  1.1       mrg 		target[datalength++] = Base64[output[2]];
    175  1.1       mrg 		target[datalength++] = Base64[output[3]];
    176  1.1       mrg 	}
    177  1.1       mrg 
    178  1.1       mrg 	/* Now we worry about padding. */
    179  1.1       mrg 	if (0 != srclength) {
    180  1.1       mrg 		/* Get what's left. */
    181  1.1       mrg 		input[0] = input[1] = input[2] = '\0';
    182  1.1       mrg 		for (i = 0; i < srclength; i++)
    183  1.1       mrg 			input[i] = *src++;
    184  1.1       mrg 
    185  1.4  christos 		output[0] = (u_int32_t)input[0] >> 2;
    186  1.4  christos 		output[1] = ((u_int32_t)(input[0] & 0x03) << 4) +
    187  1.4  christos 		    ((u_int32_t)input[1] >> 4);
    188  1.4  christos 		output[2] = ((u_int32_t)(input[1] & 0x0f) << 2) +
    189  1.4  christos 		    ((u_int32_t)input[2] >> 6);
    190  1.1       mrg 		Assert(output[0] < 64);
    191  1.1       mrg 		Assert(output[1] < 64);
    192  1.1       mrg 		Assert(output[2] < 64);
    193  1.1       mrg 
    194  1.1       mrg 		if (datalength + 4 > targsize)
    195  1.1       mrg 			return (-1);
    196  1.1       mrg 		target[datalength++] = Base64[output[0]];
    197  1.1       mrg 		target[datalength++] = Base64[output[1]];
    198  1.1       mrg 		if (srclength == 1)
    199  1.1       mrg 			target[datalength++] = Pad64;
    200  1.1       mrg 		else
    201  1.1       mrg 			target[datalength++] = Base64[output[2]];
    202  1.1       mrg 		target[datalength++] = Pad64;
    203  1.1       mrg 	}
    204  1.1       mrg 	if (datalength >= targsize)
    205  1.1       mrg 		return (-1);
    206  1.1       mrg 	target[datalength] = '\0';	/* Returned value doesn't count \0. */
    207  1.1       mrg 	return (datalength);
    208  1.1       mrg }
    209  1.1       mrg 
    210  1.1       mrg /* skips all whitespace anywhere.
    211  1.1       mrg    converts characters, four at a time, starting at (or after)
    212  1.1       mrg    src from base - 64 numbers into three 8 bit bytes in the target area.
    213  1.1       mrg    it returns the number of data bytes stored at the target, or -1 on error.
    214  1.1       mrg  */
    215  1.1       mrg 
    216  1.1       mrg int
    217  1.1       mrg b64_pton(src, target, targsize)
    218  1.1       mrg 	char const *src;
    219  1.1       mrg 	u_char *target;
    220  1.1       mrg 	size_t targsize;
    221  1.1       mrg {
    222  1.8   thorpej 	size_t tarindex;
    223  1.8   thorpej 	int state, ch;
    224  1.1       mrg 	char *pos;
    225  1.5     lukem 
    226  1.5     lukem 	_DIAGASSERT(src != NULL);
    227  1.5     lukem 	_DIAGASSERT(target != NULL);
    228  1.1       mrg 
    229  1.1       mrg 	state = 0;
    230  1.1       mrg 	tarindex = 0;
    231  1.1       mrg 
    232  1.7     itohy 	while ((ch = (u_char) *src++) != '\0') {
    233  1.1       mrg 		if (isspace(ch))	/* Skip whitespace anywhere. */
    234  1.1       mrg 			continue;
    235  1.1       mrg 
    236  1.1       mrg 		if (ch == Pad64)
    237  1.1       mrg 			break;
    238  1.1       mrg 
    239  1.1       mrg 		pos = strchr(Base64, ch);
    240  1.1       mrg 		if (pos == 0) 		/* A non-base64 character. */
    241  1.1       mrg 			return (-1);
    242  1.1       mrg 
    243  1.1       mrg 		switch (state) {
    244  1.1       mrg 		case 0:
    245  1.1       mrg 			if (target) {
    246  1.1       mrg 				if (tarindex >= targsize)
    247  1.1       mrg 					return (-1);
    248  1.1       mrg 				target[tarindex] = (pos - Base64) << 2;
    249  1.1       mrg 			}
    250  1.1       mrg 			state = 1;
    251  1.1       mrg 			break;
    252  1.1       mrg 		case 1:
    253  1.1       mrg 			if (target) {
    254  1.1       mrg 				if (tarindex + 1 >= targsize)
    255  1.1       mrg 					return (-1);
    256  1.4  christos 				target[tarindex] |=
    257  1.4  christos 				    (u_int32_t)(pos - Base64) >> 4;
    258  1.1       mrg 				target[tarindex+1]  = ((pos - Base64) & 0x0f)
    259  1.1       mrg 							<< 4 ;
    260  1.1       mrg 			}
    261  1.1       mrg 			tarindex++;
    262  1.1       mrg 			state = 2;
    263  1.1       mrg 			break;
    264  1.1       mrg 		case 2:
    265  1.1       mrg 			if (target) {
    266  1.1       mrg 				if (tarindex + 1 >= targsize)
    267  1.1       mrg 					return (-1);
    268  1.4  christos 				target[tarindex] |=
    269  1.4  christos 					(u_int32_t)(pos - Base64) >> 2;
    270  1.4  christos 				target[tarindex+1] = ((pos - Base64) & 0x03)
    271  1.1       mrg 							<< 6;
    272  1.1       mrg 			}
    273  1.1       mrg 			tarindex++;
    274  1.1       mrg 			state = 3;
    275  1.1       mrg 			break;
    276  1.1       mrg 		case 3:
    277  1.1       mrg 			if (target) {
    278  1.1       mrg 				if (tarindex >= targsize)
    279  1.1       mrg 					return (-1);
    280  1.1       mrg 				target[tarindex] |= (pos - Base64);
    281  1.1       mrg 			}
    282  1.1       mrg 			tarindex++;
    283  1.1       mrg 			state = 0;
    284  1.1       mrg 			break;
    285  1.1       mrg 		default:
    286  1.1       mrg 			abort();
    287  1.1       mrg 		}
    288  1.1       mrg 	}
    289  1.1       mrg 
    290  1.1       mrg 	/*
    291  1.1       mrg 	 * We are done decoding Base-64 chars.  Let's see if we ended
    292  1.1       mrg 	 * on a byte boundary, and/or with erroneous trailing characters.
    293  1.1       mrg 	 */
    294  1.1       mrg 
    295  1.1       mrg 	if (ch == Pad64) {		/* We got a pad char. */
    296  1.1       mrg 		ch = *src++;		/* Skip it, get next. */
    297  1.1       mrg 		switch (state) {
    298  1.1       mrg 		case 0:		/* Invalid = in first position */
    299  1.1       mrg 		case 1:		/* Invalid = in second position */
    300  1.1       mrg 			return (-1);
    301  1.1       mrg 
    302  1.1       mrg 		case 2:		/* Valid, means one byte of info */
    303  1.1       mrg 			/* Skip any number of spaces. */
    304  1.7     itohy 			for (; ch != '\0'; ch = (u_char) *src++)
    305  1.1       mrg 				if (!isspace(ch))
    306  1.1       mrg 					break;
    307  1.1       mrg 			/* Make sure there is another trailing = sign. */
    308  1.1       mrg 			if (ch != Pad64)
    309  1.1       mrg 				return (-1);
    310  1.1       mrg 			ch = *src++;		/* Skip the = */
    311  1.1       mrg 			/* Fall through to "single trailing =" case. */
    312  1.1       mrg 			/* FALLTHROUGH */
    313  1.1       mrg 
    314  1.1       mrg 		case 3:		/* Valid, means two bytes of info */
    315  1.1       mrg 			/*
    316  1.1       mrg 			 * We know this char is an =.  Is there anything but
    317  1.1       mrg 			 * whitespace after it?
    318  1.1       mrg 			 */
    319  1.7     itohy 			for (; ch != '\0'; ch = (u_char) *src++)
    320  1.1       mrg 				if (!isspace(ch))
    321  1.1       mrg 					return (-1);
    322  1.1       mrg 
    323  1.1       mrg 			/*
    324  1.1       mrg 			 * Now make sure for cases 2 and 3 that the "extra"
    325  1.1       mrg 			 * bits that slopped past the last full byte were
    326  1.1       mrg 			 * zeros.  If we don't check them, they become a
    327  1.1       mrg 			 * subliminal channel.
    328  1.1       mrg 			 */
    329  1.1       mrg 			if (target && target[tarindex] != 0)
    330  1.1       mrg 				return (-1);
    331  1.1       mrg 		}
    332  1.1       mrg 	} else {
    333  1.1       mrg 		/*
    334  1.1       mrg 		 * We ended by seeing the end of the string.  Make sure we
    335  1.1       mrg 		 * have no partial bytes lying around.
    336  1.1       mrg 		 */
    337  1.1       mrg 		if (state != 0)
    338  1.1       mrg 			return (-1);
    339  1.1       mrg 	}
    340  1.1       mrg 
    341  1.1       mrg 	return (tarindex);
    342  1.1       mrg }
    343