Home | History | Annotate | Line # | Download | only in net
base64.c revision 1.1
      1  1.1  mrg /*
      2  1.1  mrg  * Copyright (c) 1996 by Internet Software Consortium.
      3  1.1  mrg  *
      4  1.1  mrg  * Permission to use, copy, modify, and distribute this software for any
      5  1.1  mrg  * purpose with or without fee is hereby granted, provided that the above
      6  1.1  mrg  * copyright notice and this permission notice appear in all copies.
      7  1.1  mrg  *
      8  1.1  mrg  * THE SOFTWARE IS PROVIDED "AS IS" AND INTERNET SOFTWARE CONSORTIUM DISCLAIMS
      9  1.1  mrg  * ALL WARRANTIES WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES
     10  1.1  mrg  * OF MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL INTERNET SOFTWARE
     11  1.1  mrg  * CONSORTIUM BE LIABLE FOR ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL
     12  1.1  mrg  * DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR
     13  1.1  mrg  * PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS
     14  1.1  mrg  * ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS
     15  1.1  mrg  * SOFTWARE.
     16  1.1  mrg  */
     17  1.1  mrg 
     18  1.1  mrg /*
     19  1.1  mrg  * Portions Copyright (c) 1995 by International Business Machines, Inc.
     20  1.1  mrg  *
     21  1.1  mrg  * International Business Machines, Inc. (hereinafter called IBM) grants
     22  1.1  mrg  * permission under its copyrights to use, copy, modify, and distribute this
     23  1.1  mrg  * Software with or without fee, provided that the above copyright notice and
     24  1.1  mrg  * all paragraphs of this notice appear in all copies, and that the name of IBM
     25  1.1  mrg  * not be used in connection with the marketing of any product incorporating
     26  1.1  mrg  * the Software or modifications thereof, without specific, written prior
     27  1.1  mrg  * permission.
     28  1.1  mrg  *
     29  1.1  mrg  * To the extent it has a right to do so, IBM grants an immunity from suit
     30  1.1  mrg  * under its patents, if any, for the use, sale or manufacture of products to
     31  1.1  mrg  * the extent that such products are used for performing Domain Name System
     32  1.1  mrg  * dynamic updates in TCP/IP networks by means of the Software.  No immunity is
     33  1.1  mrg  * granted for any product per se or for any other function of any product.
     34  1.1  mrg  *
     35  1.1  mrg  * THE SOFTWARE IS PROVIDED "AS IS", AND IBM DISCLAIMS ALL WARRANTIES,
     36  1.1  mrg  * INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A
     37  1.1  mrg  * PARTICULAR PURPOSE.  IN NO EVENT SHALL IBM BE LIABLE FOR ANY SPECIAL,
     38  1.1  mrg  * DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES WHATSOEVER ARISING
     39  1.1  mrg  * OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE, EVEN
     40  1.1  mrg  * IF IBM IS APPRISED OF THE POSSIBILITY OF SUCH DAMAGES.
     41  1.1  mrg  */
     42  1.1  mrg 
     43  1.1  mrg #include <sys/types.h>
     44  1.1  mrg #include <sys/param.h>
     45  1.1  mrg #include <sys/socket.h>
     46  1.1  mrg #include <netinet/in.h>
     47  1.1  mrg #include <arpa/inet.h>
     48  1.1  mrg #include <arpa/nameser.h>
     49  1.1  mrg 
     50  1.1  mrg #include <ctype.h>
     51  1.1  mrg #include <resolv.h>
     52  1.1  mrg #include <stdio.h>
     53  1.1  mrg 
     54  1.1  mrg #if defined(BSD) && (BSD >= 199103) && defined(AF_INET6)
     55  1.1  mrg # include <stdlib.h>
     56  1.1  mrg # include <string.h>
     57  1.1  mrg #else
     58  1.1  mrg # include "../conf/portability.h"
     59  1.1  mrg #endif
     60  1.1  mrg 
     61  1.1  mrg #define Assert(Cond) if (!(Cond)) abort()
     62  1.1  mrg 
     63  1.1  mrg static const char Base64[] =
     64  1.1  mrg 	"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/";
     65  1.1  mrg static const char Pad64 = '=';
     66  1.1  mrg 
     67  1.1  mrg /* (From RFC1521 and draft-ietf-dnssec-secext-03.txt)
     68  1.1  mrg    The following encoding technique is taken from RFC 1521 by Borenstein
     69  1.1  mrg    and Freed.  It is reproduced here in a slightly edited form for
     70  1.1  mrg    convenience.
     71  1.1  mrg 
     72  1.1  mrg    A 65-character subset of US-ASCII is used, enabling 6 bits to be
     73  1.1  mrg    represented per printable character. (The extra 65th character, "=",
     74  1.1  mrg    is used to signify a special processing function.)
     75  1.1  mrg 
     76  1.1  mrg    The encoding process represents 24-bit groups of input bits as output
     77  1.1  mrg    strings of 4 encoded characters. Proceeding from left to right, a
     78  1.1  mrg    24-bit input group is formed by concatenating 3 8-bit input groups.
     79  1.1  mrg    These 24 bits are then treated as 4 concatenated 6-bit groups, each
     80  1.1  mrg    of which is translated into a single digit in the base64 alphabet.
     81  1.1  mrg 
     82  1.1  mrg    Each 6-bit group is used as an index into an array of 64 printable
     83  1.1  mrg    characters. The character referenced by the index is placed in the
     84  1.1  mrg    output string.
     85  1.1  mrg 
     86  1.1  mrg                          Table 1: The Base64 Alphabet
     87  1.1  mrg 
     88  1.1  mrg       Value Encoding  Value Encoding  Value Encoding  Value Encoding
     89  1.1  mrg           0 A            17 R            34 i            51 z
     90  1.1  mrg           1 B            18 S            35 j            52 0
     91  1.1  mrg           2 C            19 T            36 k            53 1
     92  1.1  mrg           3 D            20 U            37 l            54 2
     93  1.1  mrg           4 E            21 V            38 m            55 3
     94  1.1  mrg           5 F            22 W            39 n            56 4
     95  1.1  mrg           6 G            23 X            40 o            57 5
     96  1.1  mrg           7 H            24 Y            41 p            58 6
     97  1.1  mrg           8 I            25 Z            42 q            59 7
     98  1.1  mrg           9 J            26 a            43 r            60 8
     99  1.1  mrg          10 K            27 b            44 s            61 9
    100  1.1  mrg          11 L            28 c            45 t            62 +
    101  1.1  mrg          12 M            29 d            46 u            63 /
    102  1.1  mrg          13 N            30 e            47 v
    103  1.1  mrg          14 O            31 f            48 w         (pad) =
    104  1.1  mrg          15 P            32 g            49 x
    105  1.1  mrg          16 Q            33 h            50 y
    106  1.1  mrg 
    107  1.1  mrg    Special processing is performed if fewer than 24 bits are available
    108  1.1  mrg    at the end of the data being encoded.  A full encoding quantum is
    109  1.1  mrg    always completed at the end of a quantity.  When fewer than 24 input
    110  1.1  mrg    bits are available in an input group, zero bits are added (on the
    111  1.1  mrg    right) to form an integral number of 6-bit groups.  Padding at the
    112  1.1  mrg    end of the data is performed using the '=' character.
    113  1.1  mrg 
    114  1.1  mrg    Since all base64 input is an integral number of octets, only the
    115  1.1  mrg          -------------------------------------------------
    116  1.1  mrg    following cases can arise:
    117  1.1  mrg 
    118  1.1  mrg        (1) the final quantum of encoding input is an integral
    119  1.1  mrg            multiple of 24 bits; here, the final unit of encoded
    120  1.1  mrg 	   output will be an integral multiple of 4 characters
    121  1.1  mrg 	   with no "=" padding,
    122  1.1  mrg        (2) the final quantum of encoding input is exactly 8 bits;
    123  1.1  mrg            here, the final unit of encoded output will be two
    124  1.1  mrg 	   characters followed by two "=" padding characters, or
    125  1.1  mrg        (3) the final quantum of encoding input is exactly 16 bits;
    126  1.1  mrg            here, the final unit of encoded output will be three
    127  1.1  mrg 	   characters followed by one "=" padding character.
    128  1.1  mrg    */
    129  1.1  mrg 
    130  1.1  mrg int
    131  1.1  mrg b64_ntop(src, srclength, target, targsize)
    132  1.1  mrg 	u_char const *src;
    133  1.1  mrg 	size_t srclength;
    134  1.1  mrg 	char *target;
    135  1.1  mrg 	size_t targsize;
    136  1.1  mrg {
    137  1.1  mrg 	size_t datalength = 0;
    138  1.1  mrg 	u_char input[3];
    139  1.1  mrg 	u_char output[4];
    140  1.1  mrg 	int i;
    141  1.1  mrg 
    142  1.1  mrg 	while (2 < srclength) {
    143  1.1  mrg 		input[0] = *src++;
    144  1.1  mrg 		input[1] = *src++;
    145  1.1  mrg 		input[2] = *src++;
    146  1.1  mrg 		srclength -= 3;
    147  1.1  mrg 
    148  1.1  mrg 		output[0] = input[0] >> 2;
    149  1.1  mrg 		output[1] = ((input[0] & 0x03) << 4) + (input[1] >> 4);
    150  1.1  mrg 		output[2] = ((input[1] & 0x0f) << 2) + (input[2] >> 6);
    151  1.1  mrg 		output[3] = input[2] & 0x3f;
    152  1.1  mrg 		Assert(output[0] < 64);
    153  1.1  mrg 		Assert(output[1] < 64);
    154  1.1  mrg 		Assert(output[2] < 64);
    155  1.1  mrg 		Assert(output[3] < 64);
    156  1.1  mrg 
    157  1.1  mrg 		if (datalength + 4 > targsize)
    158  1.1  mrg 			return (-1);
    159  1.1  mrg 		target[datalength++] = Base64[output[0]];
    160  1.1  mrg 		target[datalength++] = Base64[output[1]];
    161  1.1  mrg 		target[datalength++] = Base64[output[2]];
    162  1.1  mrg 		target[datalength++] = Base64[output[3]];
    163  1.1  mrg 	}
    164  1.1  mrg 
    165  1.1  mrg 	/* Now we worry about padding. */
    166  1.1  mrg 	if (0 != srclength) {
    167  1.1  mrg 		/* Get what's left. */
    168  1.1  mrg 		input[0] = input[1] = input[2] = '\0';
    169  1.1  mrg 		for (i = 0; i < srclength; i++)
    170  1.1  mrg 			input[i] = *src++;
    171  1.1  mrg 
    172  1.1  mrg 		output[0] = input[0] >> 2;
    173  1.1  mrg 		output[1] = ((input[0] & 0x03) << 4) + (input[1] >> 4);
    174  1.1  mrg 		output[2] = ((input[1] & 0x0f) << 2) + (input[2] >> 6);
    175  1.1  mrg 		Assert(output[0] < 64);
    176  1.1  mrg 		Assert(output[1] < 64);
    177  1.1  mrg 		Assert(output[2] < 64);
    178  1.1  mrg 
    179  1.1  mrg 		if (datalength + 4 > targsize)
    180  1.1  mrg 			return (-1);
    181  1.1  mrg 		target[datalength++] = Base64[output[0]];
    182  1.1  mrg 		target[datalength++] = Base64[output[1]];
    183  1.1  mrg 		if (srclength == 1)
    184  1.1  mrg 			target[datalength++] = Pad64;
    185  1.1  mrg 		else
    186  1.1  mrg 			target[datalength++] = Base64[output[2]];
    187  1.1  mrg 		target[datalength++] = Pad64;
    188  1.1  mrg 	}
    189  1.1  mrg 	if (datalength >= targsize)
    190  1.1  mrg 		return (-1);
    191  1.1  mrg 	target[datalength] = '\0';	/* Returned value doesn't count \0. */
    192  1.1  mrg 	return (datalength);
    193  1.1  mrg }
    194  1.1  mrg 
    195  1.1  mrg /* skips all whitespace anywhere.
    196  1.1  mrg    converts characters, four at a time, starting at (or after)
    197  1.1  mrg    src from base - 64 numbers into three 8 bit bytes in the target area.
    198  1.1  mrg    it returns the number of data bytes stored at the target, or -1 on error.
    199  1.1  mrg  */
    200  1.1  mrg 
    201  1.1  mrg int
    202  1.1  mrg b64_pton(src, target, targsize)
    203  1.1  mrg 	char const *src;
    204  1.1  mrg 	u_char *target;
    205  1.1  mrg 	size_t targsize;
    206  1.1  mrg {
    207  1.1  mrg 	int tarindex, state, ch;
    208  1.1  mrg 	char *pos;
    209  1.1  mrg 
    210  1.1  mrg 	state = 0;
    211  1.1  mrg 	tarindex = 0;
    212  1.1  mrg 
    213  1.1  mrg 	while ((ch = *src++) != '\0') {
    214  1.1  mrg 		if (isspace(ch))	/* Skip whitespace anywhere. */
    215  1.1  mrg 			continue;
    216  1.1  mrg 
    217  1.1  mrg 		if (ch == Pad64)
    218  1.1  mrg 			break;
    219  1.1  mrg 
    220  1.1  mrg 		pos = strchr(Base64, ch);
    221  1.1  mrg 		if (pos == 0) 		/* A non-base64 character. */
    222  1.1  mrg 			return (-1);
    223  1.1  mrg 
    224  1.1  mrg 		switch (state) {
    225  1.1  mrg 		case 0:
    226  1.1  mrg 			if (target) {
    227  1.1  mrg 				if (tarindex >= targsize)
    228  1.1  mrg 					return (-1);
    229  1.1  mrg 				target[tarindex] = (pos - Base64) << 2;
    230  1.1  mrg 			}
    231  1.1  mrg 			state = 1;
    232  1.1  mrg 			break;
    233  1.1  mrg 		case 1:
    234  1.1  mrg 			if (target) {
    235  1.1  mrg 				if (tarindex + 1 >= targsize)
    236  1.1  mrg 					return (-1);
    237  1.1  mrg 				target[tarindex]   |=  (pos - Base64) >> 4;
    238  1.1  mrg 				target[tarindex+1]  = ((pos - Base64) & 0x0f)
    239  1.1  mrg 							<< 4 ;
    240  1.1  mrg 			}
    241  1.1  mrg 			tarindex++;
    242  1.1  mrg 			state = 2;
    243  1.1  mrg 			break;
    244  1.1  mrg 		case 2:
    245  1.1  mrg 			if (target) {
    246  1.1  mrg 				if (tarindex + 1 >= targsize)
    247  1.1  mrg 					return (-1);
    248  1.1  mrg 				target[tarindex]   |=  (pos - Base64) >> 2;
    249  1.1  mrg 				target[tarindex+1]  = ((pos - Base64) & 0x03)
    250  1.1  mrg 							<< 6;
    251  1.1  mrg 			}
    252  1.1  mrg 			tarindex++;
    253  1.1  mrg 			state = 3;
    254  1.1  mrg 			break;
    255  1.1  mrg 		case 3:
    256  1.1  mrg 			if (target) {
    257  1.1  mrg 				if (tarindex >= targsize)
    258  1.1  mrg 					return (-1);
    259  1.1  mrg 				target[tarindex] |= (pos - Base64);
    260  1.1  mrg 			}
    261  1.1  mrg 			tarindex++;
    262  1.1  mrg 			state = 0;
    263  1.1  mrg 			break;
    264  1.1  mrg 		default:
    265  1.1  mrg 			abort();
    266  1.1  mrg 		}
    267  1.1  mrg 	}
    268  1.1  mrg 
    269  1.1  mrg 	/*
    270  1.1  mrg 	 * We are done decoding Base-64 chars.  Let's see if we ended
    271  1.1  mrg 	 * on a byte boundary, and/or with erroneous trailing characters.
    272  1.1  mrg 	 */
    273  1.1  mrg 
    274  1.1  mrg 	if (ch == Pad64) {		/* We got a pad char. */
    275  1.1  mrg 		ch = *src++;		/* Skip it, get next. */
    276  1.1  mrg 		switch (state) {
    277  1.1  mrg 		case 0:		/* Invalid = in first position */
    278  1.1  mrg 		case 1:		/* Invalid = in second position */
    279  1.1  mrg 			return (-1);
    280  1.1  mrg 
    281  1.1  mrg 		case 2:		/* Valid, means one byte of info */
    282  1.1  mrg 			/* Skip any number of spaces. */
    283  1.1  mrg 			for (NULL; ch != '\0'; ch = *src++)
    284  1.1  mrg 				if (!isspace(ch))
    285  1.1  mrg 					break;
    286  1.1  mrg 			/* Make sure there is another trailing = sign. */
    287  1.1  mrg 			if (ch != Pad64)
    288  1.1  mrg 				return (-1);
    289  1.1  mrg 			ch = *src++;		/* Skip the = */
    290  1.1  mrg 			/* Fall through to "single trailing =" case. */
    291  1.1  mrg 			/* FALLTHROUGH */
    292  1.1  mrg 
    293  1.1  mrg 		case 3:		/* Valid, means two bytes of info */
    294  1.1  mrg 			/*
    295  1.1  mrg 			 * We know this char is an =.  Is there anything but
    296  1.1  mrg 			 * whitespace after it?
    297  1.1  mrg 			 */
    298  1.1  mrg 			for (NULL; ch != '\0'; ch = *src++)
    299  1.1  mrg 				if (!isspace(ch))
    300  1.1  mrg 					return (-1);
    301  1.1  mrg 
    302  1.1  mrg 			/*
    303  1.1  mrg 			 * Now make sure for cases 2 and 3 that the "extra"
    304  1.1  mrg 			 * bits that slopped past the last full byte were
    305  1.1  mrg 			 * zeros.  If we don't check them, they become a
    306  1.1  mrg 			 * subliminal channel.
    307  1.1  mrg 			 */
    308  1.1  mrg 			if (target && target[tarindex] != 0)
    309  1.1  mrg 				return (-1);
    310  1.1  mrg 		}
    311  1.1  mrg 	} else {
    312  1.1  mrg 		/*
    313  1.1  mrg 		 * We ended by seeing the end of the string.  Make sure we
    314  1.1  mrg 		 * have no partial bytes lying around.
    315  1.1  mrg 		 */
    316  1.1  mrg 		if (state != 0)
    317  1.1  mrg 			return (-1);
    318  1.1  mrg 	}
    319  1.1  mrg 
    320  1.1  mrg 	return (tarindex);
    321  1.1  mrg }
    322