Home | History | Annotate | Line # | Download | only in net
base64.c revision 1.11.6.2
      1  1.11.6.2  christos /*	$NetBSD: base64.c,v 1.11.6.2 2008/06/21 20:41:49 christos Exp $	*/
      2  1.11.6.2  christos 
      3  1.11.6.2  christos /*
      4  1.11.6.2  christos  * Copyright (c) 2004 by Internet Systems Consortium, Inc. ("ISC")
      5  1.11.6.2  christos  * Copyright (c) 1996-1999 by Internet Software Consortium.
      6  1.11.6.2  christos  *
      7  1.11.6.2  christos  * Permission to use, copy, modify, and distribute this software for any
      8  1.11.6.2  christos  * purpose with or without fee is hereby granted, provided that the above
      9  1.11.6.2  christos  * copyright notice and this permission notice appear in all copies.
     10  1.11.6.2  christos  *
     11  1.11.6.2  christos  * THE SOFTWARE IS PROVIDED "AS IS" AND ISC DISCLAIMS ALL WARRANTIES
     12  1.11.6.2  christos  * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
     13  1.11.6.2  christos  * MERCHANTABILITY AND FITNESS.  IN NO EVENT SHALL ISC BE LIABLE FOR
     14  1.11.6.2  christos  * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
     15  1.11.6.2  christos  * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
     16  1.11.6.2  christos  * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT
     17  1.11.6.2  christos  * OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
     18  1.11.6.2  christos  */
     19  1.11.6.2  christos 
     20  1.11.6.2  christos /*
     21  1.11.6.2  christos  * Portions Copyright (c) 1995 by International Business Machines, Inc.
     22  1.11.6.2  christos  *
     23  1.11.6.2  christos  * International Business Machines, Inc. (hereinafter called IBM) grants
     24  1.11.6.2  christos  * permission under its copyrights to use, copy, modify, and distribute this
     25  1.11.6.2  christos  * Software with or without fee, provided that the above copyright notice and
     26  1.11.6.2  christos  * all paragraphs of this notice appear in all copies, and that the name of IBM
     27  1.11.6.2  christos  * not be used in connection with the marketing of any product incorporating
     28  1.11.6.2  christos  * the Software or modifications thereof, without specific, written prior
     29  1.11.6.2  christos  * permission.
     30  1.11.6.2  christos  *
     31  1.11.6.2  christos  * To the extent it has a right to do so, IBM grants an immunity from suit
     32  1.11.6.2  christos  * under its patents, if any, for the use, sale or manufacture of products to
     33  1.11.6.2  christos  * the extent that such products are used for performing Domain Name System
     34  1.11.6.2  christos  * dynamic updates in TCP/IP networks by means of the Software.  No immunity is
     35  1.11.6.2  christos  * granted for any product per se or for any other function of any product.
     36  1.11.6.2  christos  *
     37  1.11.6.2  christos  * THE SOFTWARE IS PROVIDED "AS IS", AND IBM DISCLAIMS ALL WARRANTIES,
     38  1.11.6.2  christos  * INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A
     39  1.11.6.2  christos  * PARTICULAR PURPOSE.  IN NO EVENT SHALL IBM BE LIABLE FOR ANY SPECIAL,
     40  1.11.6.2  christos  * DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES WHATSOEVER ARISING
     41  1.11.6.2  christos  * OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE, EVEN
     42  1.11.6.2  christos  * IF IBM IS APPRISED OF THE POSSIBILITY OF SUCH DAMAGES.
     43  1.11.6.2  christos  */
     44  1.11.6.2  christos 
     45  1.11.6.2  christos #include <sys/cdefs.h>
     46  1.11.6.2  christos #if defined(LIBC_SCCS) && !defined(lint)
     47  1.11.6.2  christos #if 0
     48  1.11.6.2  christos static const char rcsid[] = "Id: base64.c,v 1.4 2005/04/27 04:56:34 sra Exp";
     49  1.11.6.2  christos #else
     50  1.11.6.2  christos __RCSID("$NetBSD: base64.c,v 1.11.6.2 2008/06/21 20:41:49 christos Exp $");
     51  1.11.6.2  christos #endif
     52  1.11.6.2  christos #endif /* LIBC_SCCS and not lint */
     53  1.11.6.2  christos 
     54  1.11.6.2  christos #include "port_before.h"
     55  1.11.6.2  christos 
     56  1.11.6.2  christos #include <sys/types.h>
     57  1.11.6.2  christos #include <sys/param.h>
     58  1.11.6.2  christos #include <sys/socket.h>
     59  1.11.6.2  christos 
     60  1.11.6.2  christos #include <netinet/in.h>
     61  1.11.6.2  christos #include <arpa/inet.h>
     62  1.11.6.2  christos #include <arpa/nameser.h>
     63  1.11.6.2  christos 
     64  1.11.6.2  christos #include <assert.h>
     65  1.11.6.2  christos #include <ctype.h>
     66  1.11.6.2  christos #include <resolv.h>
     67  1.11.6.2  christos #include <stdio.h>
     68  1.11.6.2  christos #include <stdlib.h>
     69  1.11.6.2  christos #include <string.h>
     70  1.11.6.2  christos 
     71  1.11.6.2  christos #include "port_after.h"
     72  1.11.6.2  christos 
/*
 * Abort the process when Cond is false.
 *
 * The body is wrapped in do { } while (0) so the macro expands to exactly
 * one statement: a bare `if' would swallow an `else' that follows the
 * macro call inside an unbraced if/else at the call site.
 */
#define Assert(Cond) do { if (!(Cond)) abort(); } while (0)

/* Base64 alphabet, indexed by 6-bit value (0..63). */
static const char Base64[] =
	"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/";
/* Character used to pad the final group of encoded output. */
static const char Pad64 = '=';
     78  1.11.6.2  christos 
     79  1.11.6.2  christos /* (From RFC1521 and draft-ietf-dnssec-secext-03.txt)
     80  1.11.6.2  christos    The following encoding technique is taken from RFC1521 by Borenstein
     81  1.11.6.2  christos    and Freed.  It is reproduced here in a slightly edited form for
     82  1.11.6.2  christos    convenience.
     83  1.11.6.2  christos 
     84  1.11.6.2  christos    A 65-character subset of US-ASCII is used, enabling 6 bits to be
     85  1.11.6.2  christos    represented per printable character. (The extra 65th character, "=",
     86  1.11.6.2  christos    is used to signify a special processing function.)
     87  1.11.6.2  christos 
     88  1.11.6.2  christos    The encoding process represents 24-bit groups of input bits as output
     89  1.11.6.2  christos    strings of 4 encoded characters. Proceeding from left to right, a
     90  1.11.6.2  christos    24-bit input group is formed by concatenating 3 8-bit input groups.
     91  1.11.6.2  christos    These 24 bits are then treated as 4 concatenated 6-bit groups, each
     92  1.11.6.2  christos    of which is translated into a single digit in the base64 alphabet.
     93  1.11.6.2  christos 
     94  1.11.6.2  christos    Each 6-bit group is used as an index into an array of 64 printable
     95  1.11.6.2  christos    characters. The character referenced by the index is placed in the
     96  1.11.6.2  christos    output string.
     97  1.11.6.2  christos 
     98  1.11.6.2  christos                          Table 1: The Base64 Alphabet
     99  1.11.6.2  christos 
    100  1.11.6.2  christos       Value Encoding  Value Encoding  Value Encoding  Value Encoding
    101  1.11.6.2  christos           0 A            17 R            34 i            51 z
    102  1.11.6.2  christos           1 B            18 S            35 j            52 0
    103  1.11.6.2  christos           2 C            19 T            36 k            53 1
    104  1.11.6.2  christos           3 D            20 U            37 l            54 2
    105  1.11.6.2  christos           4 E            21 V            38 m            55 3
    106  1.11.6.2  christos           5 F            22 W            39 n            56 4
    107  1.11.6.2  christos           6 G            23 X            40 o            57 5
    108  1.11.6.2  christos           7 H            24 Y            41 p            58 6
    109  1.11.6.2  christos           8 I            25 Z            42 q            59 7
    110  1.11.6.2  christos           9 J            26 a            43 r            60 8
    111  1.11.6.2  christos          10 K            27 b            44 s            61 9
    112  1.11.6.2  christos          11 L            28 c            45 t            62 +
    113  1.11.6.2  christos          12 M            29 d            46 u            63 /
    114  1.11.6.2  christos          13 N            30 e            47 v
    115  1.11.6.2  christos          14 O            31 f            48 w         (pad) =
    116  1.11.6.2  christos          15 P            32 g            49 x
    117  1.11.6.2  christos          16 Q            33 h            50 y
    118  1.11.6.2  christos 
    119  1.11.6.2  christos    Special processing is performed if fewer than 24 bits are available
    120  1.11.6.2  christos    at the end of the data being encoded.  A full encoding quantum is
    121  1.11.6.2  christos    always completed at the end of a quantity.  When fewer than 24 input
    122  1.11.6.2  christos    bits are available in an input group, zero bits are added (on the
    123  1.11.6.2  christos    right) to form an integral number of 6-bit groups.  Padding at the
    124  1.11.6.2  christos    end of the data is performed using the '=' character.
    125  1.11.6.2  christos 
    126  1.11.6.2  christos    Since all base64 input is an integral number of octets, only the
    127  1.11.6.2  christos          -------------------------------------------------
    128  1.11.6.2  christos    following cases can arise:
    129  1.11.6.2  christos 
    130  1.11.6.2  christos        (1) the final quantum of encoding input is an integral
    131  1.11.6.2  christos            multiple of 24 bits; here, the final unit of encoded
    132  1.11.6.2  christos 	   output will be an integral multiple of 4 characters
    133  1.11.6.2  christos 	   with no "=" padding,
    134  1.11.6.2  christos        (2) the final quantum of encoding input is exactly 8 bits;
    135  1.11.6.2  christos            here, the final unit of encoded output will be two
    136  1.11.6.2  christos 	   characters followed by two "=" padding characters, or
    137  1.11.6.2  christos        (3) the final quantum of encoding input is exactly 16 bits;
    138  1.11.6.2  christos            here, the final unit of encoded output will be three
    139  1.11.6.2  christos 	   characters followed by one "=" padding character.
    140  1.11.6.2  christos    */
    141  1.11.6.2  christos 
    142  1.11.6.2  christos int
    143  1.11.6.2  christos b64_ntop(u_char const *src, size_t srclength, char *target, size_t targsize) {
    144  1.11.6.2  christos 	size_t datalength = 0;
    145  1.11.6.2  christos 	u_char input[3];
    146  1.11.6.2  christos 	u_char output[4];
    147  1.11.6.2  christos 	size_t i;
    148  1.11.6.2  christos 
    149  1.11.6.2  christos 	_DIAGASSERT(src != NULL);
    150  1.11.6.2  christos 	_DIAGASSERT(target != NULL);
    151  1.11.6.2  christos 
    152  1.11.6.2  christos 	while (2U < srclength) {
    153  1.11.6.2  christos 		input[0] = *src++;
    154  1.11.6.2  christos 		input[1] = *src++;
    155  1.11.6.2  christos 		input[2] = *src++;
    156  1.11.6.2  christos 		srclength -= 3;
    157  1.11.6.2  christos 
    158  1.11.6.2  christos 		output[0] = (u_int32_t)input[0] >> 2;
    159  1.11.6.2  christos 		output[1] = ((u_int32_t)(input[0] & 0x03) << 4) +
    160  1.11.6.2  christos 		    ((u_int32_t)input[1] >> 4);
    161  1.11.6.2  christos 		output[2] = ((u_int32_t)(input[1] & 0x0f) << 2) +
    162  1.11.6.2  christos 		    ((u_int32_t)input[2] >> 6);
    163  1.11.6.2  christos 		output[3] = input[2] & 0x3f;
    164  1.11.6.2  christos 		Assert(output[0] < 64);
    165  1.11.6.2  christos 		Assert(output[1] < 64);
    166  1.11.6.2  christos 		Assert(output[2] < 64);
    167  1.11.6.2  christos 		Assert(output[3] < 64);
    168  1.11.6.2  christos 
    169  1.11.6.2  christos 		if (datalength + 4 > targsize)
    170  1.11.6.2  christos 			return (-1);
    171  1.11.6.2  christos 		target[datalength++] = Base64[output[0]];
    172  1.11.6.2  christos 		target[datalength++] = Base64[output[1]];
    173  1.11.6.2  christos 		target[datalength++] = Base64[output[2]];
    174  1.11.6.2  christos 		target[datalength++] = Base64[output[3]];
    175  1.11.6.2  christos 	}
    176  1.11.6.2  christos 
    177  1.11.6.2  christos 	/* Now we worry about padding. */
    178  1.11.6.2  christos 	if (0U != srclength) {
    179  1.11.6.2  christos 		/* Get what's left. */
    180  1.11.6.2  christos 		input[0] = input[1] = input[2] = '\0';
    181  1.11.6.2  christos 		for (i = 0; i < srclength; i++)
    182  1.11.6.2  christos 			input[i] = *src++;
    183  1.11.6.2  christos 
    184  1.11.6.2  christos 		output[0] = (u_int32_t)input[0] >> 2;
    185  1.11.6.2  christos 		output[1] = ((u_int32_t)(input[0] & 0x03) << 4) +
    186  1.11.6.2  christos 		    ((u_int32_t)input[1] >> 4);
    187  1.11.6.2  christos 		output[2] = ((u_int32_t)(input[1] & 0x0f) << 2) +
    188  1.11.6.2  christos 		    ((u_int32_t)input[2] >> 6);
    189  1.11.6.2  christos 		Assert(output[0] < 64);
    190  1.11.6.2  christos 		Assert(output[1] < 64);
    191  1.11.6.2  christos 		Assert(output[2] < 64);
    192  1.11.6.2  christos 
    193  1.11.6.2  christos 		if (datalength + 4 > targsize)
    194  1.11.6.2  christos 			return (-1);
    195  1.11.6.2  christos 		target[datalength++] = Base64[output[0]];
    196  1.11.6.2  christos 		target[datalength++] = Base64[output[1]];
    197  1.11.6.2  christos 		if (srclength == 1U)
    198  1.11.6.2  christos 			target[datalength++] = Pad64;
    199  1.11.6.2  christos 		else
    200  1.11.6.2  christos 			target[datalength++] = Base64[output[2]];
    201  1.11.6.2  christos 		target[datalength++] = Pad64;
    202  1.11.6.2  christos 	}
    203  1.11.6.2  christos 	if (datalength >= targsize)
    204  1.11.6.2  christos 		return (-1);
    205  1.11.6.2  christos 	target[datalength] = '\0';	/*%< Returned value doesn't count \\0. */
    206  1.11.6.2  christos 	return (datalength);
    207  1.11.6.2  christos }
    208  1.11.6.2  christos 
    209  1.11.6.2  christos /* skips all whitespace anywhere.
    210  1.11.6.2  christos    converts characters, four at a time, starting at (or after)
    211  1.11.6.2  christos    src from base - 64 numbers into three 8 bit bytes in the target area.
    212  1.11.6.2  christos    it returns the number of data bytes stored at the target, or -1 on error.
    213  1.11.6.2  christos  */
    214  1.11.6.2  christos 
    215  1.11.6.2  christos int
    216  1.11.6.2  christos b64_pton(src, target, targsize)
    217  1.11.6.2  christos 	char const *src;
    218  1.11.6.2  christos 	u_char *target;
    219  1.11.6.2  christos 	size_t targsize;
    220  1.11.6.2  christos {
    221  1.11.6.2  christos 	size_t tarindex;
    222  1.11.6.2  christos 	int state, ch;
    223  1.11.6.2  christos 	char *pos;
    224  1.11.6.2  christos 
    225  1.11.6.2  christos 	_DIAGASSERT(src != NULL);
    226  1.11.6.2  christos 	_DIAGASSERT(target != NULL);
    227  1.11.6.2  christos 
    228  1.11.6.2  christos 	state = 0;
    229  1.11.6.2  christos 	tarindex = 0;
    230  1.11.6.2  christos 
    231  1.11.6.2  christos 	while ((ch = (u_char) *src++) != '\0') {
    232  1.11.6.2  christos 		if (isspace(ch))	/*%< Skip whitespace anywhere. */
    233  1.11.6.2  christos 			continue;
    234  1.11.6.2  christos 
    235  1.11.6.2  christos 		if (ch == Pad64)
    236  1.11.6.2  christos 			break;
    237  1.11.6.2  christos 
    238  1.11.6.2  christos 		pos = strchr(Base64, ch);
    239  1.11.6.2  christos 		if (pos == 0) 		/*%< A non-base64 character. */
    240  1.11.6.2  christos 			return (-1);
    241  1.11.6.2  christos 
    242  1.11.6.2  christos 		switch (state) {
    243  1.11.6.2  christos 		case 0:
    244  1.11.6.2  christos 			if (target) {
    245  1.11.6.2  christos 				if ((size_t)tarindex >= targsize)
    246  1.11.6.2  christos 					return (-1);
    247  1.11.6.2  christos 				target[tarindex] = (pos - Base64) << 2;
    248  1.11.6.2  christos 			}
    249  1.11.6.2  christos 			state = 1;
    250  1.11.6.2  christos 			break;
    251  1.11.6.2  christos 		case 1:
    252  1.11.6.2  christos 			if (target) {
    253  1.11.6.2  christos 				if ((size_t)tarindex + 1 >= targsize)
    254  1.11.6.2  christos 					return (-1);
    255  1.11.6.2  christos 				target[tarindex] |=
    256  1.11.6.2  christos 				    (u_int32_t)(pos - Base64) >> 4;
    257  1.11.6.2  christos 				target[tarindex+1]  = ((pos - Base64) & 0x0f)
    258  1.11.6.2  christos 							<< 4 ;
    259  1.11.6.2  christos 			}
    260  1.11.6.2  christos 			tarindex++;
    261  1.11.6.2  christos 			state = 2;
    262  1.11.6.2  christos 			break;
    263  1.11.6.2  christos 		case 2:
    264  1.11.6.2  christos 			if (target) {
    265  1.11.6.2  christos 				if ((size_t)tarindex + 1 >= targsize)
    266  1.11.6.2  christos 					return (-1);
    267  1.11.6.2  christos 				target[tarindex] |=
    268  1.11.6.2  christos 					(u_int32_t)(pos - Base64) >> 2;
    269  1.11.6.2  christos 				target[tarindex+1] = ((pos - Base64) & 0x03)
    270  1.11.6.2  christos 							<< 6;
    271  1.11.6.2  christos 			}
    272  1.11.6.2  christos 			tarindex++;
    273  1.11.6.2  christos 			state = 3;
    274  1.11.6.2  christos 			break;
    275  1.11.6.2  christos 		case 3:
    276  1.11.6.2  christos 			if (target) {
    277  1.11.6.2  christos 				if ((size_t)tarindex >= targsize)
    278  1.11.6.2  christos 					return (-1);
    279  1.11.6.2  christos 				target[tarindex] |= (pos - Base64);
    280  1.11.6.2  christos 			}
    281  1.11.6.2  christos 			tarindex++;
    282  1.11.6.2  christos 			state = 0;
    283  1.11.6.2  christos 			break;
    284  1.11.6.2  christos 		default:
    285  1.11.6.2  christos 			abort();
    286  1.11.6.2  christos 		}
    287  1.11.6.2  christos 	}
    288  1.11.6.2  christos 
    289  1.11.6.2  christos 	/*
    290  1.11.6.2  christos 	 * We are done decoding Base-64 chars.  Let's see if we ended
    291  1.11.6.2  christos 	 * on a byte boundary, and/or with erroneous trailing characters.
    292  1.11.6.2  christos 	 */
    293  1.11.6.2  christos 
    294  1.11.6.2  christos 	if (ch == Pad64) {		/*%< We got a pad char. */
    295  1.11.6.2  christos 		ch = *src++;		/*%< Skip it, get next. */
    296  1.11.6.2  christos 		switch (state) {
    297  1.11.6.2  christos 		case 0:		/*%< Invalid = in first position */
    298  1.11.6.2  christos 		case 1:		/*%< Invalid = in second position */
    299  1.11.6.2  christos 			return (-1);
    300  1.11.6.2  christos 
    301  1.11.6.2  christos 		case 2:		/*%< Valid, means one byte of info */
    302  1.11.6.2  christos 			/* Skip any number of spaces. */
    303  1.11.6.2  christos 			for (; ch != '\0'; ch = (u_char) *src++)
    304  1.11.6.2  christos 				if (!isspace(ch))
    305  1.11.6.2  christos 					break;
    306  1.11.6.2  christos 			/* Make sure there is another trailing = sign. */
    307  1.11.6.2  christos 			if (ch != Pad64)
    308  1.11.6.2  christos 				return (-1);
    309  1.11.6.2  christos 			ch = *src++;		/*%< Skip the = */
    310  1.11.6.2  christos 			/* Fall through to "single trailing =" case. */
    311  1.11.6.2  christos 			/* FALLTHROUGH */
    312  1.11.6.2  christos 
    313  1.11.6.2  christos 		case 3:		/*%< Valid, means two bytes of info */
    314  1.11.6.2  christos 			/*
    315  1.11.6.2  christos 			 * We know this char is an =.  Is there anything but
    316  1.11.6.2  christos 			 * whitespace after it?
    317  1.11.6.2  christos 			 */
    318  1.11.6.2  christos 			for (; ch != '\0'; ch = (u_char) *src++)
    319  1.11.6.2  christos 				if (!isspace(ch))
    320  1.11.6.2  christos 					return (-1);
    321  1.11.6.2  christos 
    322  1.11.6.2  christos 			/*
    323  1.11.6.2  christos 			 * Now make sure for cases 2 and 3 that the "extra"
    324  1.11.6.2  christos 			 * bits that slopped past the last full byte were
    325  1.11.6.2  christos 			 * zeros.  If we don't check them, they become a
    326  1.11.6.2  christos 			 * subliminal channel.
    327  1.11.6.2  christos 			 */
    328  1.11.6.2  christos 			if (target && target[tarindex] != 0)
    329  1.11.6.2  christos 				return (-1);
    330  1.11.6.2  christos 		}
    331  1.11.6.2  christos 	} else {
    332  1.11.6.2  christos 		/*
    333  1.11.6.2  christos 		 * We ended by seeing the end of the string.  Make sure we
    334  1.11.6.2  christos 		 * have no partial bytes lying around.
    335  1.11.6.2  christos 		 */
    336  1.11.6.2  christos 		if (state != 0)
    337  1.11.6.2  christos 			return (-1);
    338  1.11.6.2  christos 	}
    339  1.11.6.2  christos 
    340  1.11.6.2  christos 	return (tarindex);
    341  1.11.6.2  christos }
    342  1.11.6.2  christos 
    343  1.11.6.2  christos /*! \file */
    344