1 /* $FreeBSD: src/sys/crypto/rijndael/rijndael-alg-fst.c,v 1.3.2.1 2001/07/03 11:01:35 ume Exp $ */
2 /* $DragonFly: src/sys/crypto/rijndael/rijndael-alg-fst.c,v 1.2 2003/06/17 04:28:20 dillon Exp $ */
3 /* $KAME: rijndael-alg-fst.c,v 1.7 2001/05/27 00:23:23 itojun Exp $ */
6 * rijndael-alg-fst.c v2.3 April '2000
8 * Optimised ANSI C code
10 * authors: v1.0: Antoon Bosselaers
11 * v2.0: Vincent Rijmen
14 * This code is placed in the public domain.
17 #include <sys/cdefs.h>
18 #include <sys/types.h>
20 #include <sys/systm.h>
24 #include <crypto/rijndael/rijndael-alg-fst.h>
25 #include <crypto/rijndael/rijndael_local.h>
27 #include <crypto/rijndael/boxes-fst.dat>
29 int rijndaelKeySched(word8 k
[MAXKC
][4], word8 W
[MAXROUNDS
+1][4][4], int ROUNDS
) {
30 /* Calculate the necessary round keys
31 * The number of calculations depends on keyBits and blockBits
33 int j
, r
, t
, rconpointer
= 0;
41 for (j
= KC
-1; j
>= 0; j
--) {
42 *((word32
*)tk
[j
]) = *((word32
*)k
[j
]);
46 /* copy values into round key array */
47 for (j
= 0; (j
< KC
) && (r
< ROUNDS
+ 1); ) {
48 for (; (j
< KC
) && (t
< 4); j
++, t
++) {
49 *((word32
*)W
[r
][t
]) = *((word32
*)tk
[j
]);
57 while (r
< ROUNDS
+ 1) { /* while not enough round key material calculated */
58 /* calculate new values */
59 tk
[0][0] ^= S
[tk
[KC
-1][1]];
60 tk
[0][1] ^= S
[tk
[KC
-1][2]];
61 tk
[0][2] ^= S
[tk
[KC
-1][3]];
62 tk
[0][3] ^= S
[tk
[KC
-1][0]];
63 tk
[0][0] ^= rcon
[rconpointer
++];
66 for (j
= 1; j
< KC
; j
++) {
67 *((word32
*)tk
[j
]) ^= *((word32
*)tk
[j
-1]);
70 for (j
= 1; j
< KC
/2; j
++) {
71 *((word32
*)tk
[j
]) ^= *((word32
*)tk
[j
-1]);
73 tk
[KC
/2][0] ^= S
[tk
[KC
/2 - 1][0]];
74 tk
[KC
/2][1] ^= S
[tk
[KC
/2 - 1][1]];
75 tk
[KC
/2][2] ^= S
[tk
[KC
/2 - 1][2]];
76 tk
[KC
/2][3] ^= S
[tk
[KC
/2 - 1][3]];
77 for (j
= KC
/2 + 1; j
< KC
; j
++) {
78 *((word32
*)tk
[j
]) ^= *((word32
*)tk
[j
-1]);
81 /* copy values into round key array */
82 for (j
= 0; (j
< KC
) && (r
< ROUNDS
+ 1); ) {
83 for (; (j
< KC
) && (t
< 4); j
++, t
++) {
84 *((word32
*)W
[r
][t
]) = *((word32
*)tk
[j
]);
96 int rijndaelKeyEncToDec(word8 W
[MAXROUNDS
+1][4][4], int ROUNDS
) {
100 for (r
= 1; r
< ROUNDS
; r
++) {
103 *((const word32
*)U1
[w
[0]])
104 ^ *((const word32
*)U2
[w
[1]])
105 ^ *((const word32
*)U3
[w
[2]])
106 ^ *((const word32
*)U4
[w
[3]]);
110 *((const word32
*)U1
[w
[0]])
111 ^ *((const word32
*)U2
[w
[1]])
112 ^ *((const word32
*)U3
[w
[2]])
113 ^ *((const word32
*)U4
[w
[3]]);
117 *((const word32
*)U1
[w
[0]])
118 ^ *((const word32
*)U2
[w
[1]])
119 ^ *((const word32
*)U3
[w
[2]])
120 ^ *((const word32
*)U4
[w
[3]]);
124 *((const word32
*)U1
[w
[0]])
125 ^ *((const word32
*)U2
[w
[1]])
126 ^ *((const word32
*)U3
[w
[2]])
127 ^ *((const word32
*)U4
[w
[3]]);
133 * Encrypt a single block.
135 int rijndaelEncrypt(word8 in
[16], word8 out
[16], word8 rk
[MAXROUNDS
+1][4][4], int ROUNDS
) {
147 #define temp xtemp.x8
149 memcpy(a
, in
, sizeof a
);
151 *((word32
*)temp
[0]) = *((word32
*)(a
)) ^ *((word32
*)rk
[0][0]);
152 *((word32
*)temp
[1]) = *((word32
*)(a
+ 4)) ^ *((word32
*)rk
[0][1]);
153 *((word32
*)temp
[2]) = *((word32
*)(a
+ 8)) ^ *((word32
*)rk
[0][2]);
154 *((word32
*)temp
[3]) = *((word32
*)(a
+12)) ^ *((word32
*)rk
[0][3]);
155 *((word32
*)(b
)) = *((const word32
*)T1
[temp
[0][0]])
156 ^ *((const word32
*)T2
[temp
[1][1]])
157 ^ *((const word32
*)T3
[temp
[2][2]])
158 ^ *((const word32
*)T4
[temp
[3][3]]);
159 *((word32
*)(b
+ 4)) = *((const word32
*)T1
[temp
[1][0]])
160 ^ *((const word32
*)T2
[temp
[2][1]])
161 ^ *((const word32
*)T3
[temp
[3][2]])
162 ^ *((const word32
*)T4
[temp
[0][3]]);
163 *((word32
*)(b
+ 8)) = *((const word32
*)T1
[temp
[2][0]])
164 ^ *((const word32
*)T2
[temp
[3][1]])
165 ^ *((const word32
*)T3
[temp
[0][2]])
166 ^ *((const word32
*)T4
[temp
[1][3]]);
167 *((word32
*)(b
+12)) = *((const word32
*)T1
[temp
[3][0]])
168 ^ *((const word32
*)T2
[temp
[0][1]])
169 ^ *((const word32
*)T3
[temp
[1][2]])
170 ^ *((const word32
*)T4
[temp
[2][3]]);
171 for (r
= 1; r
< ROUNDS
-1; r
++) {
172 *((word32
*)temp
[0]) = *((word32
*)(b
)) ^ *((word32
*)rk
[r
][0]);
173 *((word32
*)temp
[1]) = *((word32
*)(b
+ 4)) ^ *((word32
*)rk
[r
][1]);
174 *((word32
*)temp
[2]) = *((word32
*)(b
+ 8)) ^ *((word32
*)rk
[r
][2]);
175 *((word32
*)temp
[3]) = *((word32
*)(b
+12)) ^ *((word32
*)rk
[r
][3]);
177 *((word32
*)(b
)) = *((const word32
*)T1
[temp
[0][0]])
178 ^ *((const word32
*)T2
[temp
[1][1]])
179 ^ *((const word32
*)T3
[temp
[2][2]])
180 ^ *((const word32
*)T4
[temp
[3][3]]);
181 *((word32
*)(b
+ 4)) = *((const word32
*)T1
[temp
[1][0]])
182 ^ *((const word32
*)T2
[temp
[2][1]])
183 ^ *((const word32
*)T3
[temp
[3][2]])
184 ^ *((const word32
*)T4
[temp
[0][3]]);
185 *((word32
*)(b
+ 8)) = *((const word32
*)T1
[temp
[2][0]])
186 ^ *((const word32
*)T2
[temp
[3][1]])
187 ^ *((const word32
*)T3
[temp
[0][2]])
188 ^ *((const word32
*)T4
[temp
[1][3]]);
189 *((word32
*)(b
+12)) = *((const word32
*)T1
[temp
[3][0]])
190 ^ *((const word32
*)T2
[temp
[0][1]])
191 ^ *((const word32
*)T3
[temp
[1][2]])
192 ^ *((const word32
*)T4
[temp
[2][3]]);
194 /* last round is special */
195 *((word32
*)temp
[0]) = *((word32
*)(b
)) ^ *((word32
*)rk
[ROUNDS
-1][0]);
196 *((word32
*)temp
[1]) = *((word32
*)(b
+ 4)) ^ *((word32
*)rk
[ROUNDS
-1][1]);
197 *((word32
*)temp
[2]) = *((word32
*)(b
+ 8)) ^ *((word32
*)rk
[ROUNDS
-1][2]);
198 *((word32
*)temp
[3]) = *((word32
*)(b
+12)) ^ *((word32
*)rk
[ROUNDS
-1][3]);
199 b
[ 0] = T1
[temp
[0][0]][1];
200 b
[ 1] = T1
[temp
[1][1]][1];
201 b
[ 2] = T1
[temp
[2][2]][1];
202 b
[ 3] = T1
[temp
[3][3]][1];
203 b
[ 4] = T1
[temp
[1][0]][1];
204 b
[ 5] = T1
[temp
[2][1]][1];
205 b
[ 6] = T1
[temp
[3][2]][1];
206 b
[ 7] = T1
[temp
[0][3]][1];
207 b
[ 8] = T1
[temp
[2][0]][1];
208 b
[ 9] = T1
[temp
[3][1]][1];
209 b
[10] = T1
[temp
[0][2]][1];
210 b
[11] = T1
[temp
[1][3]][1];
211 b
[12] = T1
[temp
[3][0]][1];
212 b
[13] = T1
[temp
[0][1]][1];
213 b
[14] = T1
[temp
[1][2]][1];
214 b
[15] = T1
[temp
[2][3]][1];
215 *((word32
*)(b
)) ^= *((word32
*)rk
[ROUNDS
][0]);
216 *((word32
*)(b
+ 4)) ^= *((word32
*)rk
[ROUNDS
][1]);
217 *((word32
*)(b
+ 8)) ^= *((word32
*)rk
[ROUNDS
][2]);
218 *((word32
*)(b
+12)) ^= *((word32
*)rk
[ROUNDS
][3]);
220 memcpy(out
, b
, sizeof b
/* XXX out */);
228 #ifdef INTERMEDIATE_VALUE_KAT
230 * Encrypt only a certain number of rounds.
231 * Only used in the Intermediate Value Known Answer Test.
233 int rijndaelEncryptRound(word8 a
[4][4], word8 rk
[MAXROUNDS
+1][4][4], int ROUNDS
, int rounds
) {
237 /* make number of rounds sane */
238 if (rounds
> ROUNDS
) {
242 *((word32
*)a
[0]) = *((word32
*)a
[0]) ^ *((word32
*)rk
[0][0]);
243 *((word32
*)a
[1]) = *((word32
*)a
[1]) ^ *((word32
*)rk
[0][1]);
244 *((word32
*)a
[2]) = *((word32
*)a
[2]) ^ *((word32
*)rk
[0][2]);
245 *((word32
*)a
[3]) = *((word32
*)a
[3]) ^ *((word32
*)rk
[0][3]);
247 for (r
= 1; (r
<= rounds
) && (r
< ROUNDS
); r
++) {
248 *((word32
*)temp
[0]) = *((word32
*)T1
[a
[0][0]])
249 ^ *((word32
*)T2
[a
[1][1]])
250 ^ *((word32
*)T3
[a
[2][2]])
251 ^ *((word32
*)T4
[a
[3][3]]);
252 *((word32
*)temp
[1]) = *((word32
*)T1
[a
[1][0]])
253 ^ *((word32
*)T2
[a
[2][1]])
254 ^ *((word32
*)T3
[a
[3][2]])
255 ^ *((word32
*)T4
[a
[0][3]]);
256 *((word32
*)temp
[2]) = *((word32
*)T1
[a
[2][0]])
257 ^ *((word32
*)T2
[a
[3][1]])
258 ^ *((word32
*)T3
[a
[0][2]])
259 ^ *((word32
*)T4
[a
[1][3]]);
260 *((word32
*)temp
[3]) = *((word32
*)T1
[a
[3][0]])
261 ^ *((word32
*)T2
[a
[0][1]])
262 ^ *((word32
*)T3
[a
[1][2]])
263 ^ *((word32
*)T4
[a
[2][3]]);
264 *((word32
*)a
[0]) = *((word32
*)temp
[0]) ^ *((word32
*)rk
[r
][0]);
265 *((word32
*)a
[1]) = *((word32
*)temp
[1]) ^ *((word32
*)rk
[r
][1]);
266 *((word32
*)a
[2]) = *((word32
*)temp
[2]) ^ *((word32
*)rk
[r
][2]);
267 *((word32
*)a
[3]) = *((word32
*)temp
[3]) ^ *((word32
*)rk
[r
][3]);
269 if (rounds
== ROUNDS
) {
270 /* last round is special */
271 temp
[0][0] = T1
[a
[0][0]][1];
272 temp
[0][1] = T1
[a
[1][1]][1];
273 temp
[0][2] = T1
[a
[2][2]][1];
274 temp
[0][3] = T1
[a
[3][3]][1];
275 temp
[1][0] = T1
[a
[1][0]][1];
276 temp
[1][1] = T1
[a
[2][1]][1];
277 temp
[1][2] = T1
[a
[3][2]][1];
278 temp
[1][3] = T1
[a
[0][3]][1];
279 temp
[2][0] = T1
[a
[2][0]][1];
280 temp
[2][1] = T1
[a
[3][1]][1];
281 temp
[2][2] = T1
[a
[0][2]][1];
282 temp
[2][3] = T1
[a
[1][3]][1];
283 temp
[3][0] = T1
[a
[3][0]][1];
284 temp
[3][1] = T1
[a
[0][1]][1];
285 temp
[3][2] = T1
[a
[1][2]][1];
286 temp
[3][3] = T1
[a
[2][3]][1];
287 *((word32
*)a
[0]) = *((word32
*)temp
[0]) ^ *((word32
*)rk
[ROUNDS
][0]);
288 *((word32
*)a
[1]) = *((word32
*)temp
[1]) ^ *((word32
*)rk
[ROUNDS
][1]);
289 *((word32
*)a
[2]) = *((word32
*)temp
[2]) ^ *((word32
*)rk
[ROUNDS
][2]);
290 *((word32
*)a
[3]) = *((word32
*)temp
[3]) ^ *((word32
*)rk
[ROUNDS
][3]);
295 #endif /* INTERMEDIATE_VALUE_KAT */
298 * Decrypt a single block.
300 int rijndaelDecrypt(word8 in
[16], word8 out
[16], word8 rk
[MAXROUNDS
+1][4][4], int ROUNDS
) {
312 #define temp xtemp.x8
314 memcpy(a
, in
, sizeof a
);
316 *((word32
*)temp
[0]) = *((word32
*)(a
)) ^ *((word32
*)rk
[ROUNDS
][0]);
317 *((word32
*)temp
[1]) = *((word32
*)(a
+ 4)) ^ *((word32
*)rk
[ROUNDS
][1]);
318 *((word32
*)temp
[2]) = *((word32
*)(a
+ 8)) ^ *((word32
*)rk
[ROUNDS
][2]);
319 *((word32
*)temp
[3]) = *((word32
*)(a
+12)) ^ *((word32
*)rk
[ROUNDS
][3]);
321 *((word32
*)(b
)) = *((const word32
*)T5
[temp
[0][0]])
322 ^ *((const word32
*)T6
[temp
[3][1]])
323 ^ *((const word32
*)T7
[temp
[2][2]])
324 ^ *((const word32
*)T8
[temp
[1][3]]);
325 *((word32
*)(b
+ 4)) = *((const word32
*)T5
[temp
[1][0]])
326 ^ *((const word32
*)T6
[temp
[0][1]])
327 ^ *((const word32
*)T7
[temp
[3][2]])
328 ^ *((const word32
*)T8
[temp
[2][3]]);
329 *((word32
*)(b
+ 8)) = *((const word32
*)T5
[temp
[2][0]])
330 ^ *((const word32
*)T6
[temp
[1][1]])
331 ^ *((const word32
*)T7
[temp
[0][2]])
332 ^ *((const word32
*)T8
[temp
[3][3]]);
333 *((word32
*)(b
+12)) = *((const word32
*)T5
[temp
[3][0]])
334 ^ *((const word32
*)T6
[temp
[2][1]])
335 ^ *((const word32
*)T7
[temp
[1][2]])
336 ^ *((const word32
*)T8
[temp
[0][3]]);
337 for (r
= ROUNDS
-1; r
> 1; r
--) {
338 *((word32
*)temp
[0]) = *((word32
*)(b
)) ^ *((word32
*)rk
[r
][0]);
339 *((word32
*)temp
[1]) = *((word32
*)(b
+ 4)) ^ *((word32
*)rk
[r
][1]);
340 *((word32
*)temp
[2]) = *((word32
*)(b
+ 8)) ^ *((word32
*)rk
[r
][2]);
341 *((word32
*)temp
[3]) = *((word32
*)(b
+12)) ^ *((word32
*)rk
[r
][3]);
342 *((word32
*)(b
)) = *((const word32
*)T5
[temp
[0][0]])
343 ^ *((const word32
*)T6
[temp
[3][1]])
344 ^ *((const word32
*)T7
[temp
[2][2]])
345 ^ *((const word32
*)T8
[temp
[1][3]]);
346 *((word32
*)(b
+ 4)) = *((const word32
*)T5
[temp
[1][0]])
347 ^ *((const word32
*)T6
[temp
[0][1]])
348 ^ *((const word32
*)T7
[temp
[3][2]])
349 ^ *((const word32
*)T8
[temp
[2][3]]);
350 *((word32
*)(b
+ 8)) = *((const word32
*)T5
[temp
[2][0]])
351 ^ *((const word32
*)T6
[temp
[1][1]])
352 ^ *((const word32
*)T7
[temp
[0][2]])
353 ^ *((const word32
*)T8
[temp
[3][3]]);
354 *((word32
*)(b
+12)) = *((const word32
*)T5
[temp
[3][0]])
355 ^ *((const word32
*)T6
[temp
[2][1]])
356 ^ *((const word32
*)T7
[temp
[1][2]])
357 ^ *((const word32
*)T8
[temp
[0][3]]);
359 /* last round is special */
360 *((word32
*)temp
[0]) = *((word32
*)(b
)) ^ *((word32
*)rk
[1][0]);
361 *((word32
*)temp
[1]) = *((word32
*)(b
+ 4)) ^ *((word32
*)rk
[1][1]);
362 *((word32
*)temp
[2]) = *((word32
*)(b
+ 8)) ^ *((word32
*)rk
[1][2]);
363 *((word32
*)temp
[3]) = *((word32
*)(b
+12)) ^ *((word32
*)rk
[1][3]);
364 b
[ 0] = S5
[temp
[0][0]];
365 b
[ 1] = S5
[temp
[3][1]];
366 b
[ 2] = S5
[temp
[2][2]];
367 b
[ 3] = S5
[temp
[1][3]];
368 b
[ 4] = S5
[temp
[1][0]];
369 b
[ 5] = S5
[temp
[0][1]];
370 b
[ 6] = S5
[temp
[3][2]];
371 b
[ 7] = S5
[temp
[2][3]];
372 b
[ 8] = S5
[temp
[2][0]];
373 b
[ 9] = S5
[temp
[1][1]];
374 b
[10] = S5
[temp
[0][2]];
375 b
[11] = S5
[temp
[3][3]];
376 b
[12] = S5
[temp
[3][0]];
377 b
[13] = S5
[temp
[2][1]];
378 b
[14] = S5
[temp
[1][2]];
379 b
[15] = S5
[temp
[0][3]];
380 *((word32
*)(b
)) ^= *((word32
*)rk
[0][0]);
381 *((word32
*)(b
+ 4)) ^= *((word32
*)rk
[0][1]);
382 *((word32
*)(b
+ 8)) ^= *((word32
*)rk
[0][2]);
383 *((word32
*)(b
+12)) ^= *((word32
*)rk
[0][3]);
385 memcpy(out
, b
, sizeof b
/* XXX out */);
394 #ifdef INTERMEDIATE_VALUE_KAT
396 * Decrypt only a certain number of rounds.
397 * Only used in the Intermediate Value Known Answer Test.
398 * Operations rearranged such that the intermediate values
399 * of decryption correspond with the intermediate values
402 int rijndaelDecryptRound(word8 a
[4][4], word8 rk
[MAXROUNDS
+1][4][4], int ROUNDS
, int rounds
) {
404 word8 temp
[4], shift
;
406 /* make number of rounds sane */
407 if (rounds
> ROUNDS
) {
410 /* first round is special: */
411 *(word32
*)a
[0] ^= *(word32
*)rk
[ROUNDS
][0];
412 *(word32
*)a
[1] ^= *(word32
*)rk
[ROUNDS
][1];
413 *(word32
*)a
[2] ^= *(word32
*)rk
[ROUNDS
][2];
414 *(word32
*)a
[3] ^= *(word32
*)rk
[ROUNDS
][3];
415 for (i
= 0; i
< 4; i
++) {
416 a
[i
][0] = Si
[a
[i
][0]];
417 a
[i
][1] = Si
[a
[i
][1]];
418 a
[i
][2] = Si
[a
[i
][2]];
419 a
[i
][3] = Si
[a
[i
][3]];
421 for (i
= 1; i
< 4; i
++) {
423 temp
[0] = a
[(0 + shift
) & 3][i
];
424 temp
[1] = a
[(1 + shift
) & 3][i
];
425 temp
[2] = a
[(2 + shift
) & 3][i
];
426 temp
[3] = a
[(3 + shift
) & 3][i
];
432 /* ROUNDS-1 ordinary rounds */
433 for (r
= ROUNDS
-1; r
> rounds
; r
--) {
434 *(word32
*)a
[0] ^= *(word32
*)rk
[r
][0];
435 *(word32
*)a
[1] ^= *(word32
*)rk
[r
][1];
436 *(word32
*)a
[2] ^= *(word32
*)rk
[r
][2];
437 *(word32
*)a
[3] ^= *(word32
*)rk
[r
][3];
440 *((word32
*)U1
[a
[0][0]])
441 ^ *((word32
*)U2
[a
[0][1]])
442 ^ *((word32
*)U3
[a
[0][2]])
443 ^ *((word32
*)U4
[a
[0][3]]);
446 *((word32
*)U1
[a
[1][0]])
447 ^ *((word32
*)U2
[a
[1][1]])
448 ^ *((word32
*)U3
[a
[1][2]])
449 ^ *((word32
*)U4
[a
[1][3]]);
452 *((word32
*)U1
[a
[2][0]])
453 ^ *((word32
*)U2
[a
[2][1]])
454 ^ *((word32
*)U3
[a
[2][2]])
455 ^ *((word32
*)U4
[a
[2][3]]);
458 *((word32
*)U1
[a
[3][0]])
459 ^ *((word32
*)U2
[a
[3][1]])
460 ^ *((word32
*)U3
[a
[3][2]])
461 ^ *((word32
*)U4
[a
[3][3]]);
462 for (i
= 0; i
< 4; i
++) {
463 a
[i
][0] = Si
[a
[i
][0]];
464 a
[i
][1] = Si
[a
[i
][1]];
465 a
[i
][2] = Si
[a
[i
][2]];
466 a
[i
][3] = Si
[a
[i
][3]];
468 for (i
= 1; i
< 4; i
++) {
470 temp
[0] = a
[(0 + shift
) & 3][i
];
471 temp
[1] = a
[(1 + shift
) & 3][i
];
472 temp
[2] = a
[(2 + shift
) & 3][i
];
473 temp
[3] = a
[(3 + shift
) & 3][i
];
481 /* End with the extra key addition */
482 *(word32
*)a
[0] ^= *(word32
*)rk
[0][0];
483 *(word32
*)a
[1] ^= *(word32
*)rk
[0][1];
484 *(word32
*)a
[2] ^= *(word32
*)rk
[0][2];
485 *(word32
*)a
[3] ^= *(word32
*)rk
[0][3];
489 #endif /* INTERMEDIATE_VALUE_KAT */