cast128.c revision 1.10 1 1.10 pgoyette /* $NetBSD: cast128.c,v 1.10 2014/01/01 15:18:57 pgoyette Exp $ */
2 1.6 thorpej /* $OpenBSD: cast.c,v 1.2 2000/06/06 06:49:47 deraadt Exp $ */
3 1.1 thorpej
4 1.1 thorpej /*
5 1.6 thorpej * CAST-128 in C
6 1.6 thorpej * Written by Steve Reid <sreid (at) sea-to-sky.net>
7 1.6 thorpej * 100% Public Domain - no warranty
8 1.6 thorpej * Released 1997.10.11
9 1.1 thorpej */
10 1.4 lukem
11 1.4 lukem #include <sys/cdefs.h>
12 1.10 pgoyette __KERNEL_RCSID(0, "$NetBSD: cast128.c,v 1.10 2014/01/01 15:18:57 pgoyette Exp $");
13 1.1 thorpej
14 1.6 thorpej #include <sys/types.h>
15 1.10 pgoyette #include <sys/errno.h>
16 1.10 pgoyette #include <sys/module.h>
17 1.10 pgoyette
18 1.1 thorpej #include <crypto/cast128/cast128.h>
19 1.6 thorpej #include <crypto/cast128/cast128sb.h>
20 1.1 thorpej
21 1.6 thorpej /* Macros to access 8-bit bytes out of a 32-bit word */
22 1.6 thorpej #define U_INT8_Ta(x) ( (u_int8_t) (x>>24) )
23 1.6 thorpej #define U_INT8_Tb(x) ( (u_int8_t) ((x>>16)&255) )
24 1.6 thorpej #define U_INT8_Tc(x) ( (u_int8_t) ((x>>8)&255) )
25 1.6 thorpej #define U_INT8_Td(x) ( (u_int8_t) ((x)&255) )
26 1.6 thorpej
27 1.6 thorpej /* Circular left shift */
28 1.6 thorpej #define ROL(x, n) ( ((x)<<(n)) | ((x)>>(32-(n))) )
29 1.6 thorpej
30 1.6 thorpej /* CAST-128 uses three different round functions */
31 1.6 thorpej #define F1(l, r, i) \
32 1.6 thorpej t = ROL(key->xkey[i] + r, key->xkey[i+16]); \
33 1.6 thorpej l ^= ((cast_sbox1[U_INT8_Ta(t)] ^ cast_sbox2[U_INT8_Tb(t)]) - \
34 1.6 thorpej cast_sbox3[U_INT8_Tc(t)]) + cast_sbox4[U_INT8_Td(t)];
35 1.6 thorpej #define F2(l, r, i) \
36 1.6 thorpej t = ROL(key->xkey[i] ^ r, key->xkey[i+16]); \
37 1.6 thorpej l ^= ((cast_sbox1[U_INT8_Ta(t)] - cast_sbox2[U_INT8_Tb(t)]) + \
38 1.6 thorpej cast_sbox3[U_INT8_Tc(t)]) ^ cast_sbox4[U_INT8_Td(t)];
39 1.6 thorpej #define F3(l, r, i) \
40 1.6 thorpej t = ROL(key->xkey[i] - r, key->xkey[i+16]); \
41 1.6 thorpej l ^= ((cast_sbox1[U_INT8_Ta(t)] + cast_sbox2[U_INT8_Tb(t)]) ^ \
42 1.6 thorpej cast_sbox3[U_INT8_Tc(t)]) - cast_sbox4[U_INT8_Td(t)];
43 1.1 thorpej
44 1.1 thorpej
45 1.6 thorpej /***** Encryption Function *****/
46 1.1 thorpej
47 1.7 thorpej void cast128_encrypt(const cast128_key* key, const u_int8_t* inblock,
48 1.7 thorpej u_int8_t* outblock)
49 1.1 thorpej {
50 1.6 thorpej u_int32_t t, l, r;
51 1.1 thorpej
52 1.6 thorpej /* Get inblock into l,r */
53 1.6 thorpej l = ((u_int32_t)inblock[0] << 24) | ((u_int32_t)inblock[1] << 16) |
54 1.6 thorpej ((u_int32_t)inblock[2] << 8) | (u_int32_t)inblock[3];
55 1.6 thorpej r = ((u_int32_t)inblock[4] << 24) | ((u_int32_t)inblock[5] << 16) |
56 1.6 thorpej ((u_int32_t)inblock[6] << 8) | (u_int32_t)inblock[7];
57 1.6 thorpej /* Do the work */
58 1.6 thorpej F1(l, r, 0);
59 1.6 thorpej F2(r, l, 1);
60 1.6 thorpej F3(l, r, 2);
61 1.6 thorpej F1(r, l, 3);
62 1.6 thorpej F2(l, r, 4);
63 1.6 thorpej F3(r, l, 5);
64 1.6 thorpej F1(l, r, 6);
65 1.6 thorpej F2(r, l, 7);
66 1.6 thorpej F3(l, r, 8);
67 1.6 thorpej F1(r, l, 9);
68 1.6 thorpej F2(l, r, 10);
69 1.6 thorpej F3(r, l, 11);
70 1.6 thorpej /* Only do full 16 rounds if key length > 80 bits */
71 1.6 thorpej if (key->rounds > 12) {
72 1.6 thorpej F1(l, r, 12);
73 1.6 thorpej F2(r, l, 13);
74 1.6 thorpej F3(l, r, 14);
75 1.6 thorpej F1(r, l, 15);
76 1.6 thorpej }
77 1.6 thorpej /* Put l,r into outblock */
78 1.6 thorpej outblock[0] = U_INT8_Ta(r);
79 1.6 thorpej outblock[1] = U_INT8_Tb(r);
80 1.6 thorpej outblock[2] = U_INT8_Tc(r);
81 1.6 thorpej outblock[3] = U_INT8_Td(r);
82 1.6 thorpej outblock[4] = U_INT8_Ta(l);
83 1.6 thorpej outblock[5] = U_INT8_Tb(l);
84 1.6 thorpej outblock[6] = U_INT8_Tc(l);
85 1.6 thorpej outblock[7] = U_INT8_Td(l);
86 1.6 thorpej /* Wipe clean */
87 1.6 thorpej t = l = r = 0;
88 1.1 thorpej }
89 1.1 thorpej
90 1.1 thorpej
91 1.6 thorpej /***** Decryption Function *****/
92 1.1 thorpej
93 1.7 thorpej void cast128_decrypt(const cast128_key* key, const u_int8_t* inblock,
94 1.7 thorpej u_int8_t* outblock)
95 1.6 thorpej {
96 1.6 thorpej u_int32_t t, l, r;
97 1.1 thorpej
98 1.6 thorpej /* Get inblock into l,r */
99 1.6 thorpej r = ((u_int32_t)inblock[0] << 24) | ((u_int32_t)inblock[1] << 16) |
100 1.6 thorpej ((u_int32_t)inblock[2] << 8) | (u_int32_t)inblock[3];
101 1.6 thorpej l = ((u_int32_t)inblock[4] << 24) | ((u_int32_t)inblock[5] << 16) |
102 1.6 thorpej ((u_int32_t)inblock[6] << 8) | (u_int32_t)inblock[7];
103 1.6 thorpej /* Do the work */
104 1.6 thorpej /* Only do full 16 rounds if key length > 80 bits */
105 1.6 thorpej if (key->rounds > 12) {
106 1.6 thorpej F1(r, l, 15);
107 1.6 thorpej F3(l, r, 14);
108 1.6 thorpej F2(r, l, 13);
109 1.6 thorpej F1(l, r, 12);
110 1.6 thorpej }
111 1.6 thorpej F3(r, l, 11);
112 1.6 thorpej F2(l, r, 10);
113 1.6 thorpej F1(r, l, 9);
114 1.6 thorpej F3(l, r, 8);
115 1.6 thorpej F2(r, l, 7);
116 1.6 thorpej F1(l, r, 6);
117 1.6 thorpej F3(r, l, 5);
118 1.6 thorpej F2(l, r, 4);
119 1.6 thorpej F1(r, l, 3);
120 1.6 thorpej F3(l, r, 2);
121 1.6 thorpej F2(r, l, 1);
122 1.6 thorpej F1(l, r, 0);
123 1.6 thorpej /* Put l,r into outblock */
124 1.6 thorpej outblock[0] = U_INT8_Ta(l);
125 1.6 thorpej outblock[1] = U_INT8_Tb(l);
126 1.6 thorpej outblock[2] = U_INT8_Tc(l);
127 1.6 thorpej outblock[3] = U_INT8_Td(l);
128 1.6 thorpej outblock[4] = U_INT8_Ta(r);
129 1.6 thorpej outblock[5] = U_INT8_Tb(r);
130 1.6 thorpej outblock[6] = U_INT8_Tc(r);
131 1.6 thorpej outblock[7] = U_INT8_Td(r);
132 1.6 thorpej /* Wipe clean */
133 1.6 thorpej t = l = r = 0;
134 1.1 thorpej }
135 1.1 thorpej
136 1.1 thorpej
137 1.6 thorpej /***** Key Schedual *****/
138 1.1 thorpej
139 1.7 thorpej void cast128_setkey(cast128_key* key, const u_int8_t* rawkey, int keybytes)
140 1.1 thorpej {
141 1.9 mrg u_int32_t t[4], z[4], x[4];
142 1.9 mrg int i;
143 1.1 thorpej
144 1.6 thorpej /* Set number of rounds to 12 or 16, depending on key length */
145 1.6 thorpej key->rounds = (keybytes <= 10 ? 12 : 16);
146 1.1 thorpej
147 1.6 thorpej /* Copy key to workspace x */
148 1.6 thorpej for (i = 0; i < 4; i++) {
149 1.6 thorpej x[i] = 0;
150 1.9 mrg t[i] = z[i] = 0; /* XXX gcc */
151 1.6 thorpej if ((i*4+0) < keybytes) x[i] = (u_int32_t)rawkey[i*4+0] << 24;
152 1.6 thorpej if ((i*4+1) < keybytes) x[i] |= (u_int32_t)rawkey[i*4+1] << 16;
153 1.6 thorpej if ((i*4+2) < keybytes) x[i] |= (u_int32_t)rawkey[i*4+2] << 8;
154 1.6 thorpej if ((i*4+3) < keybytes) x[i] |= (u_int32_t)rawkey[i*4+3];
155 1.6 thorpej }
156 1.6 thorpej /* Generate 32 subkeys, four at a time */
157 1.6 thorpej for (i = 0; i < 32; i+=4) {
158 1.6 thorpej switch (i & 4) {
159 1.6 thorpej case 0:
160 1.6 thorpej t[0] = z[0] = x[0] ^ cast_sbox5[U_INT8_Tb(x[3])] ^
161 1.6 thorpej cast_sbox6[U_INT8_Td(x[3])] ^ cast_sbox7[U_INT8_Ta(x[3])] ^
162 1.6 thorpej cast_sbox8[U_INT8_Tc(x[3])] ^ cast_sbox7[U_INT8_Ta(x[2])];
163 1.6 thorpej t[1] = z[1] = x[2] ^ cast_sbox5[U_INT8_Ta(z[0])] ^
164 1.6 thorpej cast_sbox6[U_INT8_Tc(z[0])] ^ cast_sbox7[U_INT8_Tb(z[0])] ^
165 1.6 thorpej cast_sbox8[U_INT8_Td(z[0])] ^ cast_sbox8[U_INT8_Tc(x[2])];
166 1.6 thorpej t[2] = z[2] = x[3] ^ cast_sbox5[U_INT8_Td(z[1])] ^
167 1.6 thorpej cast_sbox6[U_INT8_Tc(z[1])] ^ cast_sbox7[U_INT8_Tb(z[1])] ^
168 1.6 thorpej cast_sbox8[U_INT8_Ta(z[1])] ^ cast_sbox5[U_INT8_Tb(x[2])];
169 1.6 thorpej t[3] = z[3] = x[1] ^ cast_sbox5[U_INT8_Tc(z[2])] ^
170 1.6 thorpej cast_sbox6[U_INT8_Tb(z[2])] ^ cast_sbox7[U_INT8_Td(z[2])] ^
171 1.6 thorpej cast_sbox8[U_INT8_Ta(z[2])] ^ cast_sbox6[U_INT8_Td(x[2])];
172 1.6 thorpej break;
173 1.6 thorpej case 4:
174 1.6 thorpej t[0] = x[0] = z[2] ^ cast_sbox5[U_INT8_Tb(z[1])] ^
175 1.6 thorpej cast_sbox6[U_INT8_Td(z[1])] ^ cast_sbox7[U_INT8_Ta(z[1])] ^
176 1.6 thorpej cast_sbox8[U_INT8_Tc(z[1])] ^ cast_sbox7[U_INT8_Ta(z[0])];
177 1.6 thorpej t[1] = x[1] = z[0] ^ cast_sbox5[U_INT8_Ta(x[0])] ^
178 1.6 thorpej cast_sbox6[U_INT8_Tc(x[0])] ^ cast_sbox7[U_INT8_Tb(x[0])] ^
179 1.6 thorpej cast_sbox8[U_INT8_Td(x[0])] ^ cast_sbox8[U_INT8_Tc(z[0])];
180 1.6 thorpej t[2] = x[2] = z[1] ^ cast_sbox5[U_INT8_Td(x[1])] ^
181 1.6 thorpej cast_sbox6[U_INT8_Tc(x[1])] ^ cast_sbox7[U_INT8_Tb(x[1])] ^
182 1.6 thorpej cast_sbox8[U_INT8_Ta(x[1])] ^ cast_sbox5[U_INT8_Tb(z[0])];
183 1.6 thorpej t[3] = x[3] = z[3] ^ cast_sbox5[U_INT8_Tc(x[2])] ^
184 1.6 thorpej cast_sbox6[U_INT8_Tb(x[2])] ^ cast_sbox7[U_INT8_Td(x[2])] ^
185 1.6 thorpej cast_sbox8[U_INT8_Ta(x[2])] ^ cast_sbox6[U_INT8_Td(z[0])];
186 1.6 thorpej break;
187 1.6 thorpej }
188 1.6 thorpej switch (i & 12) {
189 1.6 thorpej case 0:
190 1.6 thorpej case 12:
191 1.6 thorpej key->xkey[i+0] = cast_sbox5[U_INT8_Ta(t[2])] ^ cast_sbox6[U_INT8_Tb(t[2])] ^
192 1.6 thorpej cast_sbox7[U_INT8_Td(t[1])] ^ cast_sbox8[U_INT8_Tc(t[1])];
193 1.6 thorpej key->xkey[i+1] = cast_sbox5[U_INT8_Tc(t[2])] ^ cast_sbox6[U_INT8_Td(t[2])] ^
194 1.6 thorpej cast_sbox7[U_INT8_Tb(t[1])] ^ cast_sbox8[U_INT8_Ta(t[1])];
195 1.6 thorpej key->xkey[i+2] = cast_sbox5[U_INT8_Ta(t[3])] ^ cast_sbox6[U_INT8_Tb(t[3])] ^
196 1.6 thorpej cast_sbox7[U_INT8_Td(t[0])] ^ cast_sbox8[U_INT8_Tc(t[0])];
197 1.6 thorpej key->xkey[i+3] = cast_sbox5[U_INT8_Tc(t[3])] ^ cast_sbox6[U_INT8_Td(t[3])] ^
198 1.6 thorpej cast_sbox7[U_INT8_Tb(t[0])] ^ cast_sbox8[U_INT8_Ta(t[0])];
199 1.6 thorpej break;
200 1.6 thorpej case 4:
201 1.6 thorpej case 8:
202 1.6 thorpej key->xkey[i+0] = cast_sbox5[U_INT8_Td(t[0])] ^ cast_sbox6[U_INT8_Tc(t[0])] ^
203 1.6 thorpej cast_sbox7[U_INT8_Ta(t[3])] ^ cast_sbox8[U_INT8_Tb(t[3])];
204 1.6 thorpej key->xkey[i+1] = cast_sbox5[U_INT8_Tb(t[0])] ^ cast_sbox6[U_INT8_Ta(t[0])] ^
205 1.6 thorpej cast_sbox7[U_INT8_Tc(t[3])] ^ cast_sbox8[U_INT8_Td(t[3])];
206 1.6 thorpej key->xkey[i+2] = cast_sbox5[U_INT8_Td(t[1])] ^ cast_sbox6[U_INT8_Tc(t[1])] ^
207 1.6 thorpej cast_sbox7[U_INT8_Ta(t[2])] ^ cast_sbox8[U_INT8_Tb(t[2])];
208 1.6 thorpej key->xkey[i+3] = cast_sbox5[U_INT8_Tb(t[1])] ^ cast_sbox6[U_INT8_Ta(t[1])] ^
209 1.6 thorpej cast_sbox7[U_INT8_Tc(t[2])] ^ cast_sbox8[U_INT8_Td(t[2])];
210 1.6 thorpej break;
211 1.6 thorpej }
212 1.6 thorpej switch (i & 12) {
213 1.6 thorpej case 0:
214 1.6 thorpej key->xkey[i+0] ^= cast_sbox5[U_INT8_Tc(z[0])];
215 1.6 thorpej key->xkey[i+1] ^= cast_sbox6[U_INT8_Tc(z[1])];
216 1.6 thorpej key->xkey[i+2] ^= cast_sbox7[U_INT8_Tb(z[2])];
217 1.6 thorpej key->xkey[i+3] ^= cast_sbox8[U_INT8_Ta(z[3])];
218 1.6 thorpej break;
219 1.6 thorpej case 4:
220 1.6 thorpej key->xkey[i+0] ^= cast_sbox5[U_INT8_Ta(x[2])];
221 1.6 thorpej key->xkey[i+1] ^= cast_sbox6[U_INT8_Tb(x[3])];
222 1.6 thorpej key->xkey[i+2] ^= cast_sbox7[U_INT8_Td(x[0])];
223 1.6 thorpej key->xkey[i+3] ^= cast_sbox8[U_INT8_Td(x[1])];
224 1.6 thorpej break;
225 1.6 thorpej case 8:
226 1.6 thorpej key->xkey[i+0] ^= cast_sbox5[U_INT8_Tb(z[2])];
227 1.6 thorpej key->xkey[i+1] ^= cast_sbox6[U_INT8_Ta(z[3])];
228 1.6 thorpej key->xkey[i+2] ^= cast_sbox7[U_INT8_Tc(z[0])];
229 1.6 thorpej key->xkey[i+3] ^= cast_sbox8[U_INT8_Tc(z[1])];
230 1.6 thorpej break;
231 1.6 thorpej case 12:
232 1.6 thorpej key->xkey[i+0] ^= cast_sbox5[U_INT8_Td(x[0])];
233 1.6 thorpej key->xkey[i+1] ^= cast_sbox6[U_INT8_Td(x[1])];
234 1.6 thorpej key->xkey[i+2] ^= cast_sbox7[U_INT8_Ta(x[2])];
235 1.6 thorpej key->xkey[i+3] ^= cast_sbox8[U_INT8_Tb(x[3])];
236 1.6 thorpej break;
237 1.6 thorpej }
238 1.6 thorpej if (i >= 16) {
239 1.6 thorpej key->xkey[i+0] &= 31;
240 1.6 thorpej key->xkey[i+1] &= 31;
241 1.6 thorpej key->xkey[i+2] &= 31;
242 1.6 thorpej key->xkey[i+3] &= 31;
243 1.6 thorpej }
244 1.6 thorpej }
245 1.6 thorpej /* Wipe clean */
246 1.6 thorpej for (i = 0; i < 4; i++) {
247 1.6 thorpej t[i] = x[i] = z[i] = 0;
248 1.6 thorpej }
249 1.1 thorpej }
250 1.1 thorpej
251 1.6 thorpej /* Made in Canada */
252 1.10 pgoyette
253 1.10 pgoyette #if defined(_KERNEL)
254 1.10 pgoyette
255 1.10 pgoyette MODULE(MODULE_CLASS_MISC, cast128, NULL);
256 1.10 pgoyette
257 1.10 pgoyette static int
258 1.10 pgoyette cast128_modcmd(modcmd_t cmd, void *opaque)
259 1.10 pgoyette {
260 1.10 pgoyette
261 1.10 pgoyette switch (cmd) {
262 1.10 pgoyette case MODULE_CMD_INIT:
263 1.10 pgoyette return 0;
264 1.10 pgoyette case MODULE_CMD_FINI:
265 1.10 pgoyette return 0;
266 1.10 pgoyette default:
267 1.10 pgoyette return ENOTTY;
268 1.10 pgoyette }
269 1.10 pgoyette }
270 1.10 pgoyette
271 1.10 pgoyette #endif /* defined(KERNEL) */
272