cast128.c revision 1.5.16.2 1 1.5.16.1 skrll /* $NetBSD: cast128.c,v 1.5.16.2 2004/09/18 14:44:26 skrll Exp $ */
2 1.5.16.1 skrll /* $OpenBSD: cast.c,v 1.2 2000/06/06 06:49:47 deraadt Exp $ */
3 1.1 thorpej
4 1.1 thorpej /*
5 1.5.16.1 skrll * CAST-128 in C
6 1.5.16.1 skrll * Written by Steve Reid <sreid (at) sea-to-sky.net>
7 1.5.16.1 skrll * 100% Public Domain - no warranty
8 1.5.16.1 skrll * Released 1997.10.11
9 1.1 thorpej */
10 1.4 lukem
11 1.4 lukem #include <sys/cdefs.h>
12 1.5.16.1 skrll __KERNEL_RCSID(0, "$NetBSD: cast128.c,v 1.5.16.2 2004/09/18 14:44:26 skrll Exp $");
13 1.1 thorpej
14 1.5.16.1 skrll #include <sys/types.h>
15 1.1 thorpej #include <crypto/cast128/cast128.h>
16 1.5.16.1 skrll #include <crypto/cast128/cast128sb.h>
17 1.1 thorpej
/*
 * Macros to access 8-bit bytes out of a 32-bit word.
 * U_INT8_Ta yields bits 31..24, U_INT8_Tb bits 23..16, U_INT8_Tc bits 15..8
 * and U_INT8_Td bits 7..0.  The argument is fully parenthesized so that a
 * compound expression (e.g. "p | q") is shifted as a whole.
 */
#define U_INT8_Ta(x) ( (u_int8_t) ((x)>>24) )
#define U_INT8_Tb(x) ( (u_int8_t) (((x)>>16)&255) )
#define U_INT8_Tc(x) ( (u_int8_t) (((x)>>8)&255) )
#define U_INT8_Td(x) ( (u_int8_t) ((x)&255) )
23 1.5.16.1 skrll
/*
 * Circular left shift of a 32-bit unsigned value x by n bits, 0 <= n <= 31.
 * The right-shift count is reduced modulo 32 so that n == 0 does not shift
 * by the full width of the type (undefined behaviour in C); a rotation
 * count of 0 is possible because the key schedule only masks the counts
 * to the range 0..31.
 */
#define ROL(x, n) ( ((x)<<(n)) | ((x)>>((32-(n))&31)) )
26 1.5.16.1 skrll
/*
 * CAST-128 uses three different round functions.
 *
 * Each macro combines r with subkey word key->xkey[i], rotates the result
 * left by key->xkey[i+16], splits it into four bytes that index
 * cast_sbox1..cast_sbox4, and XORs the combined S-box output into l.
 * The three variants differ only in which of +, - and ^ is used at each
 * step.
 *
 * The caller must have a `key` pointer and a u_int32_t scratch variable
 * `t` in scope; `t` is overwritten.  The bodies are wrapped in
 * do { } while (0) so each use behaves as a single statement.
 */
#define F1(l, r, i) \
	do { \
		t = ROL(key->xkey[(i)] + (r), key->xkey[(i)+16]); \
		(l) ^= ((cast_sbox1[U_INT8_Ta(t)] ^ cast_sbox2[U_INT8_Tb(t)]) - \
		    cast_sbox3[U_INT8_Tc(t)]) + cast_sbox4[U_INT8_Td(t)]; \
	} while (0)
#define F2(l, r, i) \
	do { \
		t = ROL(key->xkey[(i)] ^ (r), key->xkey[(i)+16]); \
		(l) ^= ((cast_sbox1[U_INT8_Ta(t)] - cast_sbox2[U_INT8_Tb(t)]) + \
		    cast_sbox3[U_INT8_Tc(t)]) ^ cast_sbox4[U_INT8_Td(t)]; \
	} while (0)
#define F3(l, r, i) \
	do { \
		t = ROL(key->xkey[(i)] - (r), key->xkey[(i)+16]); \
		(l) ^= ((cast_sbox1[U_INT8_Ta(t)] + cast_sbox2[U_INT8_Tb(t)]) ^ \
		    cast_sbox3[U_INT8_Tc(t)]) - cast_sbox4[U_INT8_Td(t)]; \
	} while (0)
40 1.1 thorpej
41 1.1 thorpej
42 1.5.16.1 skrll /***** Encryption Function *****/
43 1.1 thorpej
44 1.5.16.1 skrll void cast128_encrypt(const cast128_key* key, const u_int8_t* inblock,
45 1.5.16.1 skrll u_int8_t* outblock)
46 1.1 thorpej {
47 1.5.16.1 skrll u_int32_t t, l, r;
48 1.1 thorpej
49 1.5.16.1 skrll /* Get inblock into l,r */
50 1.5.16.1 skrll l = ((u_int32_t)inblock[0] << 24) | ((u_int32_t)inblock[1] << 16) |
51 1.5.16.1 skrll ((u_int32_t)inblock[2] << 8) | (u_int32_t)inblock[3];
52 1.5.16.1 skrll r = ((u_int32_t)inblock[4] << 24) | ((u_int32_t)inblock[5] << 16) |
53 1.5.16.1 skrll ((u_int32_t)inblock[6] << 8) | (u_int32_t)inblock[7];
54 1.5.16.1 skrll /* Do the work */
55 1.5.16.1 skrll F1(l, r, 0);
56 1.5.16.1 skrll F2(r, l, 1);
57 1.5.16.1 skrll F3(l, r, 2);
58 1.5.16.1 skrll F1(r, l, 3);
59 1.5.16.1 skrll F2(l, r, 4);
60 1.5.16.1 skrll F3(r, l, 5);
61 1.5.16.1 skrll F1(l, r, 6);
62 1.5.16.1 skrll F2(r, l, 7);
63 1.5.16.1 skrll F3(l, r, 8);
64 1.5.16.1 skrll F1(r, l, 9);
65 1.5.16.1 skrll F2(l, r, 10);
66 1.5.16.1 skrll F3(r, l, 11);
67 1.5.16.1 skrll /* Only do full 16 rounds if key length > 80 bits */
68 1.5.16.1 skrll if (key->rounds > 12) {
69 1.5.16.1 skrll F1(l, r, 12);
70 1.5.16.1 skrll F2(r, l, 13);
71 1.5.16.1 skrll F3(l, r, 14);
72 1.5.16.1 skrll F1(r, l, 15);
73 1.5.16.1 skrll }
74 1.5.16.1 skrll /* Put l,r into outblock */
75 1.5.16.1 skrll outblock[0] = U_INT8_Ta(r);
76 1.5.16.1 skrll outblock[1] = U_INT8_Tb(r);
77 1.5.16.1 skrll outblock[2] = U_INT8_Tc(r);
78 1.5.16.1 skrll outblock[3] = U_INT8_Td(r);
79 1.5.16.1 skrll outblock[4] = U_INT8_Ta(l);
80 1.5.16.1 skrll outblock[5] = U_INT8_Tb(l);
81 1.5.16.1 skrll outblock[6] = U_INT8_Tc(l);
82 1.5.16.1 skrll outblock[7] = U_INT8_Td(l);
83 1.5.16.1 skrll /* Wipe clean */
84 1.5.16.1 skrll t = l = r = 0;
85 1.1 thorpej }
86 1.1 thorpej
87 1.1 thorpej
88 1.5.16.1 skrll /***** Decryption Function *****/
89 1.1 thorpej
90 1.5.16.1 skrll void cast128_decrypt(const cast128_key* key, const u_int8_t* inblock,
91 1.5.16.1 skrll u_int8_t* outblock)
92 1.1 thorpej {
93 1.5.16.1 skrll u_int32_t t, l, r;
94 1.1 thorpej
95 1.5.16.1 skrll /* Get inblock into l,r */
96 1.5.16.1 skrll r = ((u_int32_t)inblock[0] << 24) | ((u_int32_t)inblock[1] << 16) |
97 1.5.16.1 skrll ((u_int32_t)inblock[2] << 8) | (u_int32_t)inblock[3];
98 1.5.16.1 skrll l = ((u_int32_t)inblock[4] << 24) | ((u_int32_t)inblock[5] << 16) |
99 1.5.16.1 skrll ((u_int32_t)inblock[6] << 8) | (u_int32_t)inblock[7];
100 1.5.16.1 skrll /* Do the work */
101 1.5.16.1 skrll /* Only do full 16 rounds if key length > 80 bits */
102 1.5.16.1 skrll if (key->rounds > 12) {
103 1.5.16.1 skrll F1(r, l, 15);
104 1.5.16.1 skrll F3(l, r, 14);
105 1.5.16.1 skrll F2(r, l, 13);
106 1.5.16.1 skrll F1(l, r, 12);
107 1.5.16.1 skrll }
108 1.5.16.1 skrll F3(r, l, 11);
109 1.5.16.1 skrll F2(l, r, 10);
110 1.5.16.1 skrll F1(r, l, 9);
111 1.5.16.1 skrll F3(l, r, 8);
112 1.5.16.1 skrll F2(r, l, 7);
113 1.5.16.1 skrll F1(l, r, 6);
114 1.5.16.1 skrll F3(r, l, 5);
115 1.5.16.1 skrll F2(l, r, 4);
116 1.5.16.1 skrll F1(r, l, 3);
117 1.5.16.1 skrll F3(l, r, 2);
118 1.5.16.1 skrll F2(r, l, 1);
119 1.5.16.1 skrll F1(l, r, 0);
120 1.5.16.1 skrll /* Put l,r into outblock */
121 1.5.16.1 skrll outblock[0] = U_INT8_Ta(l);
122 1.5.16.1 skrll outblock[1] = U_INT8_Tb(l);
123 1.5.16.1 skrll outblock[2] = U_INT8_Tc(l);
124 1.5.16.1 skrll outblock[3] = U_INT8_Td(l);
125 1.5.16.1 skrll outblock[4] = U_INT8_Ta(r);
126 1.5.16.1 skrll outblock[5] = U_INT8_Tb(r);
127 1.5.16.1 skrll outblock[6] = U_INT8_Tc(r);
128 1.5.16.1 skrll outblock[7] = U_INT8_Td(r);
129 1.5.16.1 skrll /* Wipe clean */
130 1.5.16.1 skrll t = l = r = 0;
131 1.1 thorpej }
132 1.1 thorpej
133 1.1 thorpej
134 1.5.16.1 skrll /***** Key Schedule *****/
135 1.1 thorpej
136 1.5.16.1 skrll void cast128_setkey(cast128_key* key, const u_int8_t* rawkey, int keybytes)
137 1.1 thorpej {
138 1.5.16.1 skrll u_int32_t t[4], z[4], x[4];
139 1.5.16.1 skrll int i;
140 1.1 thorpej
141 1.5.16.1 skrll /* Set number of rounds to 12 or 16, depending on key length */
142 1.5.16.1 skrll key->rounds = (keybytes <= 10 ? 12 : 16);
143 1.1 thorpej
144 1.5.16.1 skrll /* Copy key to workspace x */
145 1.5.16.1 skrll for (i = 0; i < 4; i++) {
146 1.5.16.1 skrll x[i] = 0;
147 1.5.16.1 skrll if ((i*4+0) < keybytes) x[i] = (u_int32_t)rawkey[i*4+0] << 24;
148 1.5.16.1 skrll if ((i*4+1) < keybytes) x[i] |= (u_int32_t)rawkey[i*4+1] << 16;
149 1.5.16.1 skrll if ((i*4+2) < keybytes) x[i] |= (u_int32_t)rawkey[i*4+2] << 8;
150 1.5.16.1 skrll if ((i*4+3) < keybytes) x[i] |= (u_int32_t)rawkey[i*4+3];
151 1.5.16.1 skrll }
152 1.5.16.1 skrll /* Generate 32 subkeys, four at a time */
153 1.5.16.1 skrll for (i = 0; i < 32; i+=4) {
154 1.5.16.1 skrll switch (i & 4) {
155 1.5.16.1 skrll case 0:
156 1.5.16.1 skrll t[0] = z[0] = x[0] ^ cast_sbox5[U_INT8_Tb(x[3])] ^
157 1.5.16.1 skrll cast_sbox6[U_INT8_Td(x[3])] ^ cast_sbox7[U_INT8_Ta(x[3])] ^
158 1.5.16.1 skrll cast_sbox8[U_INT8_Tc(x[3])] ^ cast_sbox7[U_INT8_Ta(x[2])];
159 1.5.16.1 skrll t[1] = z[1] = x[2] ^ cast_sbox5[U_INT8_Ta(z[0])] ^
160 1.5.16.1 skrll cast_sbox6[U_INT8_Tc(z[0])] ^ cast_sbox7[U_INT8_Tb(z[0])] ^
161 1.5.16.1 skrll cast_sbox8[U_INT8_Td(z[0])] ^ cast_sbox8[U_INT8_Tc(x[2])];
162 1.5.16.1 skrll t[2] = z[2] = x[3] ^ cast_sbox5[U_INT8_Td(z[1])] ^
163 1.5.16.1 skrll cast_sbox6[U_INT8_Tc(z[1])] ^ cast_sbox7[U_INT8_Tb(z[1])] ^
164 1.5.16.1 skrll cast_sbox8[U_INT8_Ta(z[1])] ^ cast_sbox5[U_INT8_Tb(x[2])];
165 1.5.16.1 skrll t[3] = z[3] = x[1] ^ cast_sbox5[U_INT8_Tc(z[2])] ^
166 1.5.16.1 skrll cast_sbox6[U_INT8_Tb(z[2])] ^ cast_sbox7[U_INT8_Td(z[2])] ^
167 1.5.16.1 skrll cast_sbox8[U_INT8_Ta(z[2])] ^ cast_sbox6[U_INT8_Td(x[2])];
168 1.5.16.1 skrll break;
169 1.5.16.1 skrll case 4:
170 1.5.16.1 skrll t[0] = x[0] = z[2] ^ cast_sbox5[U_INT8_Tb(z[1])] ^
171 1.5.16.1 skrll cast_sbox6[U_INT8_Td(z[1])] ^ cast_sbox7[U_INT8_Ta(z[1])] ^
172 1.5.16.1 skrll cast_sbox8[U_INT8_Tc(z[1])] ^ cast_sbox7[U_INT8_Ta(z[0])];
173 1.5.16.1 skrll t[1] = x[1] = z[0] ^ cast_sbox5[U_INT8_Ta(x[0])] ^
174 1.5.16.1 skrll cast_sbox6[U_INT8_Tc(x[0])] ^ cast_sbox7[U_INT8_Tb(x[0])] ^
175 1.5.16.1 skrll cast_sbox8[U_INT8_Td(x[0])] ^ cast_sbox8[U_INT8_Tc(z[0])];
176 1.5.16.1 skrll t[2] = x[2] = z[1] ^ cast_sbox5[U_INT8_Td(x[1])] ^
177 1.5.16.1 skrll cast_sbox6[U_INT8_Tc(x[1])] ^ cast_sbox7[U_INT8_Tb(x[1])] ^
178 1.5.16.1 skrll cast_sbox8[U_INT8_Ta(x[1])] ^ cast_sbox5[U_INT8_Tb(z[0])];
179 1.5.16.1 skrll t[3] = x[3] = z[3] ^ cast_sbox5[U_INT8_Tc(x[2])] ^
180 1.5.16.1 skrll cast_sbox6[U_INT8_Tb(x[2])] ^ cast_sbox7[U_INT8_Td(x[2])] ^
181 1.5.16.1 skrll cast_sbox8[U_INT8_Ta(x[2])] ^ cast_sbox6[U_INT8_Td(z[0])];
182 1.5.16.1 skrll break;
183 1.5.16.1 skrll }
184 1.5.16.1 skrll switch (i & 12) {
185 1.5.16.1 skrll case 0:
186 1.5.16.1 skrll case 12:
187 1.5.16.1 skrll key->xkey[i+0] = cast_sbox5[U_INT8_Ta(t[2])] ^ cast_sbox6[U_INT8_Tb(t[2])] ^
188 1.5.16.1 skrll cast_sbox7[U_INT8_Td(t[1])] ^ cast_sbox8[U_INT8_Tc(t[1])];
189 1.5.16.1 skrll key->xkey[i+1] = cast_sbox5[U_INT8_Tc(t[2])] ^ cast_sbox6[U_INT8_Td(t[2])] ^
190 1.5.16.1 skrll cast_sbox7[U_INT8_Tb(t[1])] ^ cast_sbox8[U_INT8_Ta(t[1])];
191 1.5.16.1 skrll key->xkey[i+2] = cast_sbox5[U_INT8_Ta(t[3])] ^ cast_sbox6[U_INT8_Tb(t[3])] ^
192 1.5.16.1 skrll cast_sbox7[U_INT8_Td(t[0])] ^ cast_sbox8[U_INT8_Tc(t[0])];
193 1.5.16.1 skrll key->xkey[i+3] = cast_sbox5[U_INT8_Tc(t[3])] ^ cast_sbox6[U_INT8_Td(t[3])] ^
194 1.5.16.1 skrll cast_sbox7[U_INT8_Tb(t[0])] ^ cast_sbox8[U_INT8_Ta(t[0])];
195 1.5.16.1 skrll break;
196 1.5.16.1 skrll case 4:
197 1.5.16.1 skrll case 8:
198 1.5.16.1 skrll key->xkey[i+0] = cast_sbox5[U_INT8_Td(t[0])] ^ cast_sbox6[U_INT8_Tc(t[0])] ^
199 1.5.16.1 skrll cast_sbox7[U_INT8_Ta(t[3])] ^ cast_sbox8[U_INT8_Tb(t[3])];
200 1.5.16.1 skrll key->xkey[i+1] = cast_sbox5[U_INT8_Tb(t[0])] ^ cast_sbox6[U_INT8_Ta(t[0])] ^
201 1.5.16.1 skrll cast_sbox7[U_INT8_Tc(t[3])] ^ cast_sbox8[U_INT8_Td(t[3])];
202 1.5.16.1 skrll key->xkey[i+2] = cast_sbox5[U_INT8_Td(t[1])] ^ cast_sbox6[U_INT8_Tc(t[1])] ^
203 1.5.16.1 skrll cast_sbox7[U_INT8_Ta(t[2])] ^ cast_sbox8[U_INT8_Tb(t[2])];
204 1.5.16.1 skrll key->xkey[i+3] = cast_sbox5[U_INT8_Tb(t[1])] ^ cast_sbox6[U_INT8_Ta(t[1])] ^
205 1.5.16.1 skrll cast_sbox7[U_INT8_Tc(t[2])] ^ cast_sbox8[U_INT8_Td(t[2])];
206 1.5.16.1 skrll break;
207 1.5.16.1 skrll }
208 1.5.16.1 skrll switch (i & 12) {
209 1.5.16.1 skrll case 0:
210 1.5.16.1 skrll key->xkey[i+0] ^= cast_sbox5[U_INT8_Tc(z[0])];
211 1.5.16.1 skrll key->xkey[i+1] ^= cast_sbox6[U_INT8_Tc(z[1])];
212 1.5.16.1 skrll key->xkey[i+2] ^= cast_sbox7[U_INT8_Tb(z[2])];
213 1.5.16.1 skrll key->xkey[i+3] ^= cast_sbox8[U_INT8_Ta(z[3])];
214 1.5.16.1 skrll break;
215 1.5.16.1 skrll case 4:
216 1.5.16.1 skrll key->xkey[i+0] ^= cast_sbox5[U_INT8_Ta(x[2])];
217 1.5.16.1 skrll key->xkey[i+1] ^= cast_sbox6[U_INT8_Tb(x[3])];
218 1.5.16.1 skrll key->xkey[i+2] ^= cast_sbox7[U_INT8_Td(x[0])];
219 1.5.16.1 skrll key->xkey[i+3] ^= cast_sbox8[U_INT8_Td(x[1])];
220 1.5.16.1 skrll break;
221 1.5.16.1 skrll case 8:
222 1.5.16.1 skrll key->xkey[i+0] ^= cast_sbox5[U_INT8_Tb(z[2])];
223 1.5.16.1 skrll key->xkey[i+1] ^= cast_sbox6[U_INT8_Ta(z[3])];
224 1.5.16.1 skrll key->xkey[i+2] ^= cast_sbox7[U_INT8_Tc(z[0])];
225 1.5.16.1 skrll key->xkey[i+3] ^= cast_sbox8[U_INT8_Tc(z[1])];
226 1.5.16.1 skrll break;
227 1.5.16.1 skrll case 12:
228 1.5.16.1 skrll key->xkey[i+0] ^= cast_sbox5[U_INT8_Td(x[0])];
229 1.5.16.1 skrll key->xkey[i+1] ^= cast_sbox6[U_INT8_Td(x[1])];
230 1.5.16.1 skrll key->xkey[i+2] ^= cast_sbox7[U_INT8_Ta(x[2])];
231 1.5.16.1 skrll key->xkey[i+3] ^= cast_sbox8[U_INT8_Tb(x[3])];
232 1.5.16.1 skrll break;
233 1.5.16.1 skrll }
234 1.5.16.1 skrll if (i >= 16) {
235 1.5.16.1 skrll key->xkey[i+0] &= 31;
236 1.5.16.1 skrll key->xkey[i+1] &= 31;
237 1.5.16.1 skrll key->xkey[i+2] &= 31;
238 1.5.16.1 skrll key->xkey[i+3] &= 31;
239 1.5.16.1 skrll }
240 1.5.16.1 skrll }
241 1.5.16.1 skrll /* Wipe clean */
242 1.5.16.1 skrll for (i = 0; i < 4; i++) {
243 1.5.16.1 skrll t[i] = x[i] = z[i] = 0;
244 1.5.16.1 skrll }
245 1.5.16.1 skrll }
246 1.1 thorpej
247 1.5.16.1 skrll /* Made in Canada */
248