aes_ct_dec.c revision 1.2 1 1.2 riastrad /* $NetBSD: aes_ct_dec.c,v 1.2 2020/06/29 23:36:59 riastradh Exp $ */
2 1.1 riastrad
3 1.1 riastrad /*
4 1.1 riastrad * Copyright (c) 2016 Thomas Pornin <pornin (at) bolet.org>
5 1.1 riastrad *
6 1.1 riastrad * Permission is hereby granted, free of charge, to any person obtaining
7 1.1 riastrad * a copy of this software and associated documentation files (the
8 1.1 riastrad * "Software"), to deal in the Software without restriction, including
9 1.1 riastrad * without limitation the rights to use, copy, modify, merge, publish,
10 1.1 riastrad * distribute, sublicense, and/or sell copies of the Software, and to
11 1.1 riastrad * permit persons to whom the Software is furnished to do so, subject to
12 1.1 riastrad * the following conditions:
13 1.1 riastrad *
14 1.1 riastrad * The above copyright notice and this permission notice shall be
15 1.1 riastrad * included in all copies or substantial portions of the Software.
16 1.1 riastrad *
17 1.1 riastrad * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
18 1.1 riastrad * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
19 1.1 riastrad * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
20 1.1 riastrad * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
21 1.1 riastrad * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
22 1.1 riastrad * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
23 1.1 riastrad * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
24 1.1 riastrad * SOFTWARE.
25 1.1 riastrad */
26 1.1 riastrad
27 1.1 riastrad #include <sys/cdefs.h>
28 1.2 riastrad __KERNEL_RCSID(1, "$NetBSD: aes_ct_dec.c,v 1.2 2020/06/29 23:36:59 riastradh Exp $");
29 1.1 riastrad
30 1.1 riastrad #include <sys/types.h>
31 1.1 riastrad
32 1.1 riastrad #include <crypto/aes/aes_bear.h>
33 1.1 riastrad
/*
 * One linear layer of the inverse S-box, x -> B(x ^ 0x63), applied in
 * place to the eight bitsliced words q[0..7].
 *
 * Word q[i] carries bit i of every byte, so XORing each byte with 0x63
 * (bits 0, 1, 5 and 6 set) amounts to complementing q[0], q[1], q[5]
 * and q[6].  B() then produces output word i as the XOR of the
 * (possibly complemented) input words i+2, i+5 and i+7, indices taken
 * modulo 8.
 */
static void
invsbox_affine_layer(uint32_t *q)
{
	uint32_t t[8];
	int i;

	t[0] = ~q[0];
	t[1] = ~q[1];
	t[2] = q[2];
	t[3] = q[3];
	t[4] = q[4];
	t[5] = ~q[5];
	t[6] = ~q[6];
	t[7] = q[7];

	/*
	 * All inputs were copied into t[] above, so q[] may be
	 * overwritten in any order without disturbing later outputs.
	 */
	for (i = 0; i < 8; i++) {
		q[i] = t[(i + 2) & 7] ^ t[(i + 5) & 7] ^ t[(i + 7) & 7];
	}
}

/* see inner.h */
void
br_aes_ct_bitslice_invSbox(uint32_t *q)
{
	/*
	 * The AES S-box is
	 *	S(x) = A(I(x)) ^ 0x63
	 * with I() the inversion in GF(256) (0 being formally its own
	 * inverse) and A() a linear transform.  Inversion is an
	 * involution, so with B() the inverse of A() the inverse S-box
	 * can be built on top of the forward one:
	 *	iS(x) = B(S(B(x ^ 0x63)) ^ 0x63)
	 * Indeed, for any y in GF(256):
	 *	iS(S(y)) = B(A(I(B(A(I(y)) ^ 0x63 ^ 0x63))) ^ 0x63 ^ 0x63) = y
	 *
	 * The forward S-box implementation is reused rather than
	 * duplicated, to keep total code size down.  Folding the B()
	 * transforms into the S-box circuit would make CBC decryption
	 * faster, but it is already considerably faster than CBC
	 * encryption because two blocks can be processed in parallel.
	 *
	 * Both the step before and the step after the forward S-box are
	 * the same operation, x -> B(x ^ 0x63).
	 */
	invsbox_affine_layer(q);
	br_aes_ct_bitslice_Sbox(q);
	invsbox_affine_layer(q);
}
94 1.1 riastrad
/*
 * XOR the eight words at sk[0..7] into the eight words at q[0..7],
 * in place.  Only q[] is modified.
 */
static void
add_round_key(uint32_t *q, const uint32_t *sk)
{
	uint32_t *const end = q + 8;

	while (q != end) {
		*q++ ^= *sk++;
	}
}
104 1.1 riastrad
/*
 * Apply the inverse ShiftRows bit permutation to each of the eight
 * words q[0..7], in place.
 *
 * Within every word, each of the four bytes is rotated left inside
 * itself: byte 0 (least significant) is left alone, byte 1 is rotated
 * by 2 bits, byte 2 by 4 bits and byte 3 by 6 bits.
 * NOTE(review): presumably each byte holds one row of the AES state in
 * the bitsliced layout -- confirm against the ortho/interleave code.
 */
static void
inv_shift_rows(uint32_t *q)
{
	uint32_t *p;

	for (p = q; p != q + 8; p++) {
		const uint32_t w = *p;
		const uint32_t b0 = w & 0x000000FF;
		const uint32_t b1 = ((w & 0x00003F00) << 2)
		    | ((w & 0x0000C000) >> 6);
		const uint32_t b2 = ((w & 0x000F0000) << 4)
		    | ((w & 0x00F00000) >> 4);
		const uint32_t b3 = ((w & 0x03000000) << 6)
		    | ((w & 0xFC000000) >> 2);

		*p = b0 | b1 | b2 | b3;
	}
}
120 1.1 riastrad
/*
 * Rotate a 32-bit word by 16 bits, i.e. exchange its upper and lower
 * 16-bit halves.
 */
static inline uint32_t
rotr16(uint32_t x)
{
	const uint32_t upper_moved_down = x >> 16;
	const uint32_t lower_moved_up = x << 16;

	return lower_moved_up | upper_moved_down;
}
126 1.1 riastrad
/*
 * Apply the inverse MixColumns linear transform to the eight bitsliced
 * words q[0..7], in place.
 *
 * Each output word is a fixed XOR combination of the input words, of
 * the input words rotated right by 8 bits, and of a second such
 * combination rotated by 16 bits.  Every output is therefore written
 * as
 *	q[i] = keep ^ rotr16(swap)
 * where "keep" gathers the terms used as they are and "swap" gathers
 * the terms whose 16-bit halves are exchanged.
 */
static void
inv_mix_columns(uint32_t *q)
{
	uint32_t x[8];	/* input words, saved before q[] is overwritten */
	uint32_t y[8];	/* the same words rotated right by 8 bits */
	uint32_t keep, swap;
	int i;

	for (i = 0; i < 8; i++) {
		x[i] = q[i];
		y[i] = (x[i] >> 8) | (x[i] << 24);
	}

	keep = x[5] ^ x[6] ^ x[7] ^ y[0] ^ y[5] ^ y[7];
	swap = x[0] ^ x[5] ^ x[6] ^ y[0] ^ y[5];
	q[0] = keep ^ rotr16(swap);

	keep = x[0] ^ x[5] ^ y[0] ^ y[1] ^ y[5] ^ y[6] ^ y[7];
	swap = x[1] ^ x[5] ^ x[7] ^ y[1] ^ y[5] ^ y[6];
	q[1] = keep ^ rotr16(swap);

	keep = x[0] ^ x[1] ^ x[6] ^ y[1] ^ y[2] ^ y[6] ^ y[7];
	swap = x[0] ^ x[2] ^ x[6] ^ y[2] ^ y[6] ^ y[7];
	q[2] = keep ^ rotr16(swap);

	keep = x[0] ^ x[1] ^ x[2] ^ x[5] ^ x[6]
	    ^ y[0] ^ y[2] ^ y[3] ^ y[5];
	swap = x[0] ^ x[1] ^ x[3] ^ x[5] ^ x[6] ^ x[7]
	    ^ y[0] ^ y[3] ^ y[5] ^ y[7];
	q[3] = keep ^ rotr16(swap);

	keep = x[1] ^ x[2] ^ x[3] ^ x[5]
	    ^ y[1] ^ y[3] ^ y[4] ^ y[5] ^ y[6] ^ y[7];
	swap = x[1] ^ x[2] ^ x[4] ^ x[5] ^ x[7]
	    ^ y[1] ^ y[4] ^ y[5] ^ y[6];
	q[4] = keep ^ rotr16(swap);

	keep = x[2] ^ x[3] ^ x[4] ^ x[6]
	    ^ y[2] ^ y[4] ^ y[5] ^ y[6] ^ y[7];
	swap = x[2] ^ x[3] ^ x[5] ^ x[6]
	    ^ y[2] ^ y[5] ^ y[6] ^ y[7];
	q[5] = keep ^ rotr16(swap);

	keep = x[3] ^ x[4] ^ x[5] ^ x[7] ^ y[3] ^ y[5] ^ y[6] ^ y[7];
	swap = x[3] ^ x[4] ^ x[6] ^ x[7] ^ y[3] ^ y[6] ^ y[7];
	q[6] = keep ^ rotr16(swap);

	keep = x[4] ^ x[5] ^ x[6] ^ y[4] ^ y[6] ^ y[7];
	swap = x[4] ^ x[5] ^ x[7] ^ y[4] ^ y[7];
	q[7] = keep ^ rotr16(swap);
}
159 1.1 riastrad
/*
 * see inner.h
 *
 * Decrypt the bitsliced state q[0..7] in place.
 *
 * skey is read as consecutive groups of eight words, one group per
 * round key, group num_rounds being applied first and group 0 last.
 * Groups num_rounds-1 down to 1 are each followed by the inverse
 * MixColumns step; group 0 is not.
 */
void
br_aes_ct_bitslice_decrypt(unsigned num_rounds,
	const uint32_t *skey, uint32_t *q)
{
	unsigned round = num_rounds;

	/* Undo the final AddRoundKey of encryption. */
	add_round_key(q, &skey[round << 3]);

	/* Middle rounds, counting down from num_rounds - 1 to 1. */
	while (--round > 0) {
		inv_shift_rows(q);
		br_aes_ct_bitslice_invSbox(q);
		add_round_key(q, &skey[round << 3]);
		inv_mix_columns(q);
	}

	/* Last round: same steps, key group 0, no inverse MixColumns. */
	inv_shift_rows(q);
	br_aes_ct_bitslice_invSbox(q);
	add_round_key(q, &skey[0]);
}
178 1.2 riastrad
/*
 * NetBSD addition, for generating compatible decryption keys.
 *
 * Externally visible entry point for the file-local inv_mix_columns():
 * transforms the eight words q[0..7] in place.
 */
void
br_aes_ct_inv_mix_columns(uint32_t *q)
{

	inv_mix_columns(q);
}
186