Home | History | Annotate | Line # | Download | only in net
      1  1.17  christos /*	$NetBSD: base64.c,v 1.17 2024/01/20 14:52:48 christos Exp $	*/
      2   1.2       mrg 
      3   1.1       mrg /*
      4   1.9  christos  * Copyright (c) 2004 by Internet Systems Consortium, Inc. ("ISC")
      5   1.9  christos  * Copyright (c) 1996-1999 by Internet Software Consortium.
      6   1.1       mrg  *
      7   1.1       mrg  * Permission to use, copy, modify, and distribute this software for any
      8   1.1       mrg  * purpose with or without fee is hereby granted, provided that the above
      9   1.1       mrg  * copyright notice and this permission notice appear in all copies.
     10   1.1       mrg  *
     11   1.9  christos  * THE SOFTWARE IS PROVIDED "AS IS" AND ISC DISCLAIMS ALL WARRANTIES
     12   1.9  christos  * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
     13   1.9  christos  * MERCHANTABILITY AND FITNESS.  IN NO EVENT SHALL ISC BE LIABLE FOR
     14   1.9  christos  * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
     15   1.9  christos  * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
     16   1.9  christos  * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT
     17   1.9  christos  * OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
     18   1.1       mrg  */
     19   1.1       mrg 
     20   1.1       mrg /*
     21   1.1       mrg  * Portions Copyright (c) 1995 by International Business Machines, Inc.
     22   1.1       mrg  *
     23   1.1       mrg  * International Business Machines, Inc. (hereinafter called IBM) grants
     24   1.1       mrg  * permission under its copyrights to use, copy, modify, and distribute this
     25   1.1       mrg  * Software with or without fee, provided that the above copyright notice and
     26   1.1       mrg  * all paragraphs of this notice appear in all copies, and that the name of IBM
     27   1.1       mrg  * not be used in connection with the marketing of any product incorporating
     28   1.1       mrg  * the Software or modifications thereof, without specific, written prior
     29   1.1       mrg  * permission.
     30   1.1       mrg  *
     31   1.1       mrg  * To the extent it has a right to do so, IBM grants an immunity from suit
     32   1.1       mrg  * under its patents, if any, for the use, sale or manufacture of products to
     33   1.1       mrg  * the extent that such products are used for performing Domain Name System
     34   1.1       mrg  * dynamic updates in TCP/IP networks by means of the Software.  No immunity is
     35   1.1       mrg  * granted for any product per se or for any other function of any product.
     36   1.1       mrg  *
     37   1.1       mrg  * THE SOFTWARE IS PROVIDED "AS IS", AND IBM DISCLAIMS ALL WARRANTIES,
     38   1.1       mrg  * INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A
     39   1.1       mrg  * PARTICULAR PURPOSE.  IN NO EVENT SHALL IBM BE LIABLE FOR ANY SPECIAL,
     40   1.1       mrg  * DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES WHATSOEVER ARISING
     41   1.1       mrg  * OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE, EVEN
     42   1.1       mrg  * IF IBM IS APPRISED OF THE POSSIBILITY OF SUCH DAMAGES.
     43   1.1       mrg  */
     44   1.2       mrg 
     45   1.3  christos #include <sys/cdefs.h>
     46   1.2       mrg #if defined(LIBC_SCCS) && !defined(lint)
     47   1.9  christos #if 0
     48  1.11  christos static const char rcsid[] = "Id: base64.c,v 1.4 2005/04/27 04:56:34 sra Exp";
     49   1.9  christos #else
     50  1.17  christos __RCSID("$NetBSD: base64.c,v 1.17 2024/01/20 14:52:48 christos Exp $");
     51   1.9  christos #endif
     52   1.2       mrg #endif /* LIBC_SCCS and not lint */
     53   1.2       mrg 
     54   1.9  christos #include "port_before.h"
     55   1.9  christos 
     56   1.1       mrg #include <sys/types.h>
     57   1.1       mrg #include <sys/param.h>
     58   1.1       mrg #include <sys/socket.h>
     59   1.9  christos 
     60   1.1       mrg #include <netinet/in.h>
     61   1.1       mrg #include <arpa/inet.h>
     62   1.1       mrg #include <arpa/nameser.h>
     63   1.1       mrg 
     64   1.5     lukem #include <assert.h>
     65   1.1       mrg #include <ctype.h>
     66   1.1       mrg #include <resolv.h>
     67   1.1       mrg #include <stdio.h>
     68   1.9  christos #include <stdlib.h>
     69   1.9  christos #include <string.h>
     70   1.1       mrg 
     71   1.9  christos #include "port_after.h"
     72   1.1       mrg 
/*
 * Abort the process when Cond is false.  The check is unconditional (it
 * does not depend on NDEBUG).  The do/while(0) wrapper makes the expansion
 * a single statement, so "if (x) Assert(y); else ..." binds the else to the
 * caller's if rather than to the if hidden inside the macro.
 */
#define Assert(Cond) do { if (!(Cond)) abort(); } while (0)
     74   1.1       mrg 
/*
 * The base64 alphabet: the character at index v encodes the 6-bit value v.
 * Written as three adjacent literals (upper case, lower case, digits plus
 * the two symbols) which the compiler concatenates into one string.
 */
static const char Base64[] =
	"ABCDEFGHIJKLMNOPQRSTUVWXYZ"
	"abcdefghijklmnopqrstuvwxyz"
	"0123456789+/";

/* Character used to pad the final group of encoded output. */
static const char Pad64 = '=';
     78   1.1       mrg 
     79   1.1       mrg /* (From RFC1521 and draft-ietf-dnssec-secext-03.txt)
     80   1.9  christos    The following encoding technique is taken from RFC1521 by Borenstein
     81   1.1       mrg    and Freed.  It is reproduced here in a slightly edited form for
     82   1.1       mrg    convenience.
     83   1.1       mrg 
     84   1.1       mrg    A 65-character subset of US-ASCII is used, enabling 6 bits to be
     85   1.1       mrg    represented per printable character. (The extra 65th character, "=",
     86   1.1       mrg    is used to signify a special processing function.)
     87   1.1       mrg 
     88   1.1       mrg    The encoding process represents 24-bit groups of input bits as output
     89   1.1       mrg    strings of 4 encoded characters. Proceeding from left to right, a
     90   1.1       mrg    24-bit input group is formed by concatenating 3 8-bit input groups.
     91   1.1       mrg    These 24 bits are then treated as 4 concatenated 6-bit groups, each
     92   1.1       mrg    of which is translated into a single digit in the base64 alphabet.
     93   1.1       mrg 
     94   1.1       mrg    Each 6-bit group is used as an index into an array of 64 printable
     95   1.1       mrg    characters. The character referenced by the index is placed in the
     96   1.1       mrg    output string.
     97   1.1       mrg 
     98   1.1       mrg                          Table 1: The Base64 Alphabet
     99   1.1       mrg 
    100   1.1       mrg       Value Encoding  Value Encoding  Value Encoding  Value Encoding
    101   1.1       mrg           0 A            17 R            34 i            51 z
    102   1.1       mrg           1 B            18 S            35 j            52 0
    103   1.1       mrg           2 C            19 T            36 k            53 1
    104   1.1       mrg           3 D            20 U            37 l            54 2
    105   1.1       mrg           4 E            21 V            38 m            55 3
    106   1.1       mrg           5 F            22 W            39 n            56 4
    107   1.1       mrg           6 G            23 X            40 o            57 5
    108   1.1       mrg           7 H            24 Y            41 p            58 6
    109   1.1       mrg           8 I            25 Z            42 q            59 7
    110   1.1       mrg           9 J            26 a            43 r            60 8
    111   1.1       mrg          10 K            27 b            44 s            61 9
    112   1.1       mrg          11 L            28 c            45 t            62 +
    113   1.1       mrg          12 M            29 d            46 u            63 /
    114   1.1       mrg          13 N            30 e            47 v
    115   1.1       mrg          14 O            31 f            48 w         (pad) =
    116   1.1       mrg          15 P            32 g            49 x
    117   1.1       mrg          16 Q            33 h            50 y
    118   1.1       mrg 
    119   1.1       mrg    Special processing is performed if fewer than 24 bits are available
    120   1.1       mrg    at the end of the data being encoded.  A full encoding quantum is
    121   1.1       mrg    always completed at the end of a quantity.  When fewer than 24 input
    122   1.1       mrg    bits are available in an input group, zero bits are added (on the
    123   1.1       mrg    right) to form an integral number of 6-bit groups.  Padding at the
    124   1.1       mrg    end of the data is performed using the '=' character.
    125   1.1       mrg 
    126   1.1       mrg    Since all base64 input is an integral number of octets, only the
    127   1.1       mrg          -------------------------------------------------
    128   1.1       mrg    following cases can arise:
    129   1.1       mrg 
    130   1.1       mrg        (1) the final quantum of encoding input is an integral
    131   1.1       mrg            multiple of 24 bits; here, the final unit of encoded
    132   1.1       mrg 	   output will be an integral multiple of 4 characters
    133   1.1       mrg 	   with no "=" padding,
    134   1.1       mrg        (2) the final quantum of encoding input is exactly 8 bits;
    135   1.1       mrg            here, the final unit of encoded output will be two
    136   1.1       mrg 	   characters followed by two "=" padding characters, or
    137   1.1       mrg        (3) the final quantum of encoding input is exactly 16 bits;
    138   1.1       mrg            here, the final unit of encoded output will be three
    139   1.1       mrg 	   characters followed by one "=" padding character.
    140   1.1       mrg    */
    141   1.1       mrg 
    142   1.1       mrg int
    143   1.9  christos b64_ntop(u_char const *src, size_t srclength, char *target, size_t targsize) {
    144   1.1       mrg 	size_t datalength = 0;
    145   1.1       mrg 	u_char input[3];
    146   1.1       mrg 	u_char output[4];
    147   1.8   thorpej 	size_t i;
    148   1.1       mrg 
    149   1.5     lukem 	_DIAGASSERT(src != NULL);
    150   1.5     lukem 	_DIAGASSERT(target != NULL);
    151   1.5     lukem 
    152   1.9  christos 	while (2U < srclength) {
    153   1.1       mrg 		input[0] = *src++;
    154   1.1       mrg 		input[1] = *src++;
    155   1.1       mrg 		input[2] = *src++;
    156   1.1       mrg 		srclength -= 3;
    157   1.1       mrg 
    158  1.16  christos 		output[0] = (uint32_t)input[0] >> 2;
    159  1.16  christos 		output[1] = ((uint32_t)(input[0] & 0x03) << 4) +
    160  1.16  christos 		    ((uint32_t)input[1] >> 4);
    161  1.16  christos 		output[2] = ((uint32_t)(input[1] & 0x0f) << 2) +
    162  1.16  christos 		    ((uint32_t)input[2] >> 6);
    163   1.1       mrg 		output[3] = input[2] & 0x3f;
    164   1.1       mrg 		Assert(output[0] < 64);
    165   1.1       mrg 		Assert(output[1] < 64);
    166   1.1       mrg 		Assert(output[2] < 64);
    167   1.1       mrg 		Assert(output[3] < 64);
    168   1.1       mrg 
    169   1.1       mrg 		if (datalength + 4 > targsize)
    170  1.16  christos 			return -1;
    171   1.1       mrg 		target[datalength++] = Base64[output[0]];
    172   1.1       mrg 		target[datalength++] = Base64[output[1]];
    173   1.1       mrg 		target[datalength++] = Base64[output[2]];
    174   1.1       mrg 		target[datalength++] = Base64[output[3]];
    175   1.1       mrg 	}
    176   1.1       mrg 
    177   1.1       mrg 	/* Now we worry about padding. */
    178   1.9  christos 	if (0U != srclength) {
    179   1.1       mrg 		/* Get what's left. */
    180   1.1       mrg 		input[0] = input[1] = input[2] = '\0';
    181   1.1       mrg 		for (i = 0; i < srclength; i++)
    182   1.1       mrg 			input[i] = *src++;
    183   1.1       mrg 
    184  1.16  christos 		output[0] = (uint32_t)input[0] >> 2;
    185  1.16  christos 		output[1] = ((uint32_t)(input[0] & 0x03) << 4) +
    186  1.16  christos 		    ((uint32_t)input[1] >> 4);
    187  1.16  christos 		output[2] = ((uint32_t)(input[1] & 0x0f) << 2) +
    188  1.16  christos 		    ((uint32_t)input[2] >> 6);
    189   1.1       mrg 		Assert(output[0] < 64);
    190   1.1       mrg 		Assert(output[1] < 64);
    191   1.1       mrg 		Assert(output[2] < 64);
    192   1.1       mrg 
    193   1.1       mrg 		if (datalength + 4 > targsize)
    194  1.16  christos 			return -1;
    195   1.1       mrg 		target[datalength++] = Base64[output[0]];
    196   1.1       mrg 		target[datalength++] = Base64[output[1]];
    197   1.9  christos 		if (srclength == 1U)
    198   1.1       mrg 			target[datalength++] = Pad64;
    199   1.1       mrg 		else
    200   1.1       mrg 			target[datalength++] = Base64[output[2]];
    201   1.1       mrg 		target[datalength++] = Pad64;
    202   1.1       mrg 	}
    203   1.1       mrg 	if (datalength >= targsize)
    204  1.16  christos 		return -1;
    205   1.9  christos 	target[datalength] = '\0';	/*%< Returned value doesn't count \\0. */
    206  1.13  christos 	_DIAGASSERT(__type_fit(int, datalength));
    207  1.13  christos 	return (int)datalength;
    208   1.1       mrg }
    209   1.1       mrg 
    210   1.1       mrg /* skips all whitespace anywhere.
    211   1.1       mrg    converts characters, four at a time, starting at (or after)
    212   1.1       mrg    src from base - 64 numbers into three 8 bit bytes in the target area.
    213   1.1       mrg    it returns the number of data bytes stored at the target, or -1 on error.
    214   1.1       mrg  */
    215   1.1       mrg 
    216   1.1       mrg int
    217  1.14       abs b64_pton(char const *src, u_char *target, size_t targsize)
    218   1.1       mrg {
    219   1.8   thorpej 	size_t tarindex;
    220   1.8   thorpej 	int state, ch;
    221  1.15  christos 	u_char nextbyte;
    222  1.17  christos 	const char *pos;
    223   1.5     lukem 
    224   1.5     lukem 	_DIAGASSERT(src != NULL);
    225   1.5     lukem 	_DIAGASSERT(target != NULL);
    226   1.1       mrg 
    227   1.1       mrg 	state = 0;
    228   1.1       mrg 	tarindex = 0;
    229   1.1       mrg 
    230   1.7     itohy 	while ((ch = (u_char) *src++) != '\0') {
    231   1.9  christos 		if (isspace(ch))	/*%< Skip whitespace anywhere. */
    232   1.1       mrg 			continue;
    233   1.1       mrg 
    234   1.1       mrg 		if (ch == Pad64)
    235   1.1       mrg 			break;
    236   1.1       mrg 
    237   1.1       mrg 		pos = strchr(Base64, ch);
    238  1.16  christos 		if (pos == NULL) 	/*%< A non-base64 character. */
    239  1.16  christos 			return -1;
    240   1.1       mrg 
    241   1.1       mrg 		switch (state) {
    242   1.1       mrg 		case 0:
    243   1.1       mrg 			if (target) {
    244  1.16  christos 				if (tarindex >= targsize)
    245  1.16  christos 					return -1;
    246  1.15  christos 				target[tarindex] = (u_char)(pos - Base64) << 2;
    247   1.1       mrg 			}
    248   1.1       mrg 			state = 1;
    249   1.1       mrg 			break;
    250   1.1       mrg 		case 1:
    251   1.1       mrg 			if (target) {
    252  1.16  christos 				if (tarindex >= targsize)
    253  1.16  christos 					return -1;
    254   1.4  christos 				target[tarindex] |=
    255  1.16  christos 				    (uint32_t)(pos - Base64) >> 4;
    256  1.15  christos 				nextbyte = (u_char)((pos - Base64) & 0x0f) << 4;
    257  1.15  christos 				if (tarindex + 1 < targsize)
    258  1.15  christos 					target[tarindex + 1] = nextbyte;
    259  1.15  christos 				else if (nextbyte)
    260  1.16  christos 					return -1;
    261   1.1       mrg 			}
    262   1.1       mrg 			tarindex++;
    263   1.1       mrg 			state = 2;
    264   1.1       mrg 			break;
    265   1.1       mrg 		case 2:
    266   1.1       mrg 			if (target) {
    267  1.16  christos 				if (tarindex >= targsize)
    268  1.16  christos 					return -1;
    269   1.4  christos 				target[tarindex] |=
    270  1.16  christos 					(uint32_t)(pos - Base64) >> 2;
    271  1.15  christos 				nextbyte = (u_char)((pos - Base64) & 0x03) << 6;
    272  1.15  christos 				if (tarindex + 1 < targsize)
    273  1.15  christos 					target[tarindex + 1] = nextbyte;
    274  1.15  christos 				else if (nextbyte)
    275  1.16  christos 					return -1;
    276   1.1       mrg 			}
    277   1.1       mrg 			tarindex++;
    278   1.1       mrg 			state = 3;
    279   1.1       mrg 			break;
    280   1.1       mrg 		case 3:
    281   1.1       mrg 			if (target) {
    282   1.9  christos 				if ((size_t)tarindex >= targsize)
    283  1.16  christos 					return -1;
    284  1.16  christos 				target[tarindex] |= (u_char)(pos - Base64);
    285   1.1       mrg 			}
    286   1.1       mrg 			tarindex++;
    287   1.1       mrg 			state = 0;
    288   1.1       mrg 			break;
    289   1.1       mrg 		default:
    290   1.1       mrg 			abort();
    291   1.1       mrg 		}
    292   1.1       mrg 	}
    293   1.1       mrg 
    294   1.1       mrg 	/*
    295   1.1       mrg 	 * We are done decoding Base-64 chars.  Let's see if we ended
    296   1.1       mrg 	 * on a byte boundary, and/or with erroneous trailing characters.
    297   1.1       mrg 	 */
    298   1.1       mrg 
    299   1.9  christos 	if (ch == Pad64) {		/*%< We got a pad char. */
    300   1.9  christos 		ch = *src++;		/*%< Skip it, get next. */
    301   1.1       mrg 		switch (state) {
    302   1.9  christos 		case 0:		/*%< Invalid = in first position */
    303   1.9  christos 		case 1:		/*%< Invalid = in second position */
    304  1.16  christos 			return -1;
    305   1.1       mrg 
    306   1.9  christos 		case 2:		/*%< Valid, means one byte of info */
    307   1.1       mrg 			/* Skip any number of spaces. */
    308   1.7     itohy 			for (; ch != '\0'; ch = (u_char) *src++)
    309   1.1       mrg 				if (!isspace(ch))
    310   1.1       mrg 					break;
    311   1.1       mrg 			/* Make sure there is another trailing = sign. */
    312   1.1       mrg 			if (ch != Pad64)
    313  1.16  christos 				return -1;
    314   1.9  christos 			ch = *src++;		/*%< Skip the = */
    315   1.1       mrg 			/* Fall through to "single trailing =" case. */
    316   1.1       mrg 			/* FALLTHROUGH */
    317   1.1       mrg 
    318   1.9  christos 		case 3:		/*%< Valid, means two bytes of info */
    319   1.1       mrg 			/*
    320   1.1       mrg 			 * We know this char is an =.  Is there anything but
    321   1.1       mrg 			 * whitespace after it?
    322   1.1       mrg 			 */
    323   1.7     itohy 			for (; ch != '\0'; ch = (u_char) *src++)
    324   1.1       mrg 				if (!isspace(ch))
    325  1.16  christos 					return -1;
    326   1.1       mrg 
    327   1.1       mrg 			/*
    328   1.1       mrg 			 * Now make sure for cases 2 and 3 that the "extra"
    329   1.1       mrg 			 * bits that slopped past the last full byte were
    330   1.1       mrg 			 * zeros.  If we don't check them, they become a
    331   1.1       mrg 			 * subliminal channel.
    332   1.1       mrg 			 */
    333  1.15  christos 			if (target && tarindex < targsize &&
    334  1.15  christos 			    target[tarindex] != 0)
    335  1.16  christos 				return -1;
    336   1.1       mrg 		}
    337   1.1       mrg 	} else {
    338   1.1       mrg 		/*
    339   1.1       mrg 		 * We ended by seeing the end of the string.  Make sure we
    340   1.1       mrg 		 * have no partial bytes lying around.
    341   1.1       mrg 		 */
    342   1.1       mrg 		if (state != 0)
    343  1.16  christos 			return -1;
    344   1.1       mrg 	}
    345   1.1       mrg 
    346  1.13  christos 	_DIAGASSERT(__type_fit(int, tarindex));
    347  1.13  christos 	return (int)tarindex;
    348   1.1       mrg }
    349   1.9  christos 
    350   1.9  christos /*! \file */
    351