// SPDX-License-Identifier: GPL-2.0-only
/*
 * Bit sliced AES using NEON instructions
 *
 * Copyright (C) 2017 Linaro Ltd <ard.biesheuvel@linaro.org>
 */

#include <asm/neon.h>
#include <asm/simd.h>
#include <crypto/aes.h>
#include <crypto/ctr.h>
#include <crypto/internal/simd.h>
#include <crypto/internal/skcipher.h>
#include <crypto/scatterwalk.h>
#include <crypto/xts.h>
#include <linux/module.h>

MODULE_AUTHOR("Ard Biesheuvel <ard.biesheuvel@linaro.org>");
MODULE_LICENSE("GPL v2");

MODULE_ALIAS_CRYPTO("ecb(aes)");
MODULE_ALIAS_CRYPTO("cbc(aes)-all");
MODULE_ALIAS_CRYPTO("ctr(aes)");
MODULE_ALIAS_CRYPTO("xts(aes)");
asmlinkage void aesbs_convert_key(u8 out[], u32 const rk[], int rounds);

asmlinkage void aesbs_ecb_encrypt(u8 out[], u8 const in[], u8 const rk[],
				  int rounds, int blocks);
asmlinkage void aesbs_ecb_decrypt(u8 out[], u8 const in[], u8 const rk[],
				  int rounds, int blocks);

asmlinkage void aesbs_cbc_decrypt(u8 out[], u8 const in[], u8 const rk[],
				  int rounds, int blocks, u8 iv[]);

asmlinkage void aesbs_ctr_encrypt(u8 out[], u8 const in[], u8 const rk[],
				  int rounds, int blocks, u8 ctr[], u8 final[]);

asmlinkage void aesbs_xts_encrypt(u8 out[], u8 const in[], u8 const rk[],
				  int rounds, int blocks, u8 iv[], int);
asmlinkage void aesbs_xts_decrypt(u8 out[], u8 const in[], u8 const rk[],
				  int rounds, int blocks, u8 iv[], int);
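
/*
 * The routines above are implemented in the accompanying NEON assembly.
 * The bit-sliced representation operates on up to eight AES blocks in
 * parallel, which is why the glue code below uses a walksize of
 * 8 * AES_BLOCK_SIZE and rounds intermediate chunks down to that stride.
 */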

struct aesbs_ctx {
	int	rounds;
	u8	rk[13 * (8 * AES_BLOCK_SIZE) + 32] __aligned(AES_BLOCK_SIZE);
};

struct aesbs_cbc_ctx {
	struct aesbs_ctx	key;
	struct crypto_skcipher	*enc_tfm;
};

struct aesbs_xts_ctx {
	struct aesbs_ctx	key;
	struct crypto_cipher	*cts_tfm;
	struct crypto_cipher	*tweak_tfm;
};

struct aesbs_ctr_ctx {
	struct aesbs_ctx	key;		/* must be first member */
	struct crypto_aes_ctx	fallback;
};
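
/*
 * Each mode-specific context embeds the bit-sliced key schedule. The CBC
 * context additionally holds a fallback "cbc(aes)" skcipher used for
 * encryption, the XTS context holds two plain AES cipher handles for tweak
 * generation and ciphertext stealing, and the CTR context keeps the regular
 * AES key schedule around for use when NEON is not available.
 */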

static int aesbs_setkey(struct crypto_skcipher *tfm, const u8 *in_key,
			unsigned int key_len)
{
	struct aesbs_ctx *ctx = crypto_skcipher_ctx(tfm);
	struct crypto_aes_ctx rk;
	int err;

	err = aes_expandkey(&rk, in_key, key_len);
	if (err)
		return err;

	ctx->rounds = 6 + key_len / 4;

	kernel_neon_begin();
	aesbs_convert_key(ctx->rk, rk.key_enc, ctx->rounds);
	kernel_neon_end();

	return 0;
}

static int __ecb_crypt(struct skcipher_request *req,
		       void (*fn)(u8 out[], u8 const in[], u8 const rk[],
				  int rounds, int blocks))
{
	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
	struct aesbs_ctx *ctx = crypto_skcipher_ctx(tfm);
	struct skcipher_walk walk;
	int err;

	err = skcipher_walk_virt(&walk, req, false);

	while (walk.nbytes >= AES_BLOCK_SIZE) {
		unsigned int blocks = walk.nbytes / AES_BLOCK_SIZE;

		if (walk.nbytes < walk.total)
			blocks = round_down(blocks,
					    walk.stride / AES_BLOCK_SIZE);

		kernel_neon_begin();
		fn(walk.dst.virt.addr, walk.src.virt.addr, ctx->rk,
		   ctx->rounds, blocks);
		kernel_neon_end();
		err = skcipher_walk_done(&walk,
					 walk.nbytes - blocks * AES_BLOCK_SIZE);
	}

	return err;
}
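
/*
 * Note: in __ecb_crypt() above (and in the CBC/CTR/XTS handlers below), any
 * chunk that is not the final one is rounded down to a multiple of the walk
 * stride, so the NEON code always sees a multiple of eight blocks; the
 * remainder is handed back to the walk and processed in the next iteration.
 */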

static int ecb_encrypt(struct skcipher_request *req)
{
	return __ecb_crypt(req, aesbs_ecb_encrypt);
}

static int ecb_decrypt(struct skcipher_request *req)
{
	return __ecb_crypt(req, aesbs_ecb_decrypt);
}

static int aesbs_cbc_setkey(struct crypto_skcipher *tfm, const u8 *in_key,
			    unsigned int key_len)
{
	struct aesbs_cbc_ctx *ctx = crypto_skcipher_ctx(tfm);
	struct crypto_aes_ctx rk;
	int err;

	err = aes_expandkey(&rk, in_key, key_len);
	if (err)
		return err;

	ctx->key.rounds = 6 + key_len / 4;

	kernel_neon_begin();
	aesbs_convert_key(ctx->key.rk, rk.key_enc, ctx->key.rounds);
	kernel_neon_end();
	memzero_explicit(&rk, sizeof(rk));

	return crypto_skcipher_setkey(ctx->enc_tfm, in_key, key_len);
}

static int cbc_encrypt(struct skcipher_request *req)
{
	struct skcipher_request *subreq = skcipher_request_ctx(req);
	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
	struct aesbs_cbc_ctx *ctx = crypto_skcipher_ctx(tfm);

	skcipher_request_set_tfm(subreq, ctx->enc_tfm);
	skcipher_request_set_callback(subreq,
				      skcipher_request_flags(req),
				      NULL, NULL);
	skcipher_request_set_crypt(subreq, req->src, req->dst,
				   req->cryptlen, req->iv);

	return crypto_skcipher_encrypt(subreq);
}
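
/*
 * CBC encryption is inherently serial (each block depends on the previous
 * ciphertext block), so it cannot benefit from the eight-way bit-sliced
 * code. Encryption is therefore delegated to the separately allocated
 * "cbc(aes)" fallback transform, while decryption below is parallelized.
 */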

static int cbc_decrypt(struct skcipher_request *req)
{
	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
	struct aesbs_cbc_ctx *ctx = crypto_skcipher_ctx(tfm);
	struct skcipher_walk walk;
	int err;

	err = skcipher_walk_virt(&walk, req, false);

	while (walk.nbytes >= AES_BLOCK_SIZE) {
		unsigned int blocks = walk.nbytes / AES_BLOCK_SIZE;

		if (walk.nbytes < walk.total)
			blocks = round_down(blocks,
					    walk.stride / AES_BLOCK_SIZE);

		kernel_neon_begin();
		aesbs_cbc_decrypt(walk.dst.virt.addr, walk.src.virt.addr,
				  ctx->key.rk, ctx->key.rounds, blocks,
				  walk.iv);
		kernel_neon_end();
		err = skcipher_walk_done(&walk,
					 walk.nbytes - blocks * AES_BLOCK_SIZE);
	}

	return err;
}

static int cbc_init(struct crypto_skcipher *tfm)
{
	struct aesbs_cbc_ctx *ctx = crypto_skcipher_ctx(tfm);
	unsigned int reqsize;

	ctx->enc_tfm = crypto_alloc_skcipher("cbc(aes)", 0, CRYPTO_ALG_ASYNC |
					     CRYPTO_ALG_NEED_FALLBACK);
	if (IS_ERR(ctx->enc_tfm))
		return PTR_ERR(ctx->enc_tfm);

	reqsize = sizeof(struct skcipher_request);
	reqsize += crypto_skcipher_reqsize(ctx->enc_tfm);
	crypto_skcipher_set_reqsize(tfm, reqsize);

	return 0;
}

static void cbc_exit(struct crypto_skcipher *tfm)
{
	struct aesbs_cbc_ctx *ctx = crypto_skcipher_ctx(tfm);

	crypto_free_skcipher(ctx->enc_tfm);
}

static int aesbs_ctr_setkey_sync(struct crypto_skcipher *tfm, const u8 *in_key,
				 unsigned int key_len)
{
	struct aesbs_ctr_ctx *ctx = crypto_skcipher_ctx(tfm);
	int err;

	err = aes_expandkey(&ctx->fallback, in_key, key_len);
	if (err)
		return err;

	ctx->key.rounds = 6 + key_len / 4;

	kernel_neon_begin();
	aesbs_convert_key(ctx->key.rk, ctx->fallback.key_enc, ctx->key.rounds);
	kernel_neon_end();

	return 0;
}
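
/*
 * The synchronous CTR variant keeps the expanded key in both forms: the
 * bit-sliced schedule for the NEON fast path and the regular schedule in
 * ctx->fallback, so single blocks can still be handled with the generic
 * aes_encrypt() when NEON cannot be used (see ctr_encrypt_one() below).
 */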

static int ctr_encrypt(struct skcipher_request *req)
{
	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
	struct aesbs_ctx *ctx = crypto_skcipher_ctx(tfm);
	struct skcipher_walk walk;
	u8 buf[AES_BLOCK_SIZE];
	int err;

	err = skcipher_walk_virt(&walk, req, false);

	while (walk.nbytes > 0) {
		unsigned int blocks = walk.nbytes / AES_BLOCK_SIZE;
		u8 *final = (walk.total % AES_BLOCK_SIZE) ? buf : NULL;

		if (walk.nbytes < walk.total) {
			blocks = round_down(blocks,
					    walk.stride / AES_BLOCK_SIZE);
			final = NULL;
		}

		kernel_neon_begin();
		aesbs_ctr_encrypt(walk.dst.virt.addr, walk.src.virt.addr,
				  ctx->rk, ctx->rounds, blocks, walk.iv, final);
		kernel_neon_end();

		if (final) {
			u8 *dst = walk.dst.virt.addr + blocks * AES_BLOCK_SIZE;
			u8 *src = walk.src.virt.addr + blocks * AES_BLOCK_SIZE;

			crypto_xor_cpy(dst, src, final,
				       walk.total % AES_BLOCK_SIZE);

			err = skcipher_walk_done(&walk, 0);
			break;
		}
		err = skcipher_walk_done(&walk,
					 walk.nbytes - blocks * AES_BLOCK_SIZE);
	}

	return err;
}
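
/*
 * When the request length is not a multiple of the block size, a spare
 * buffer ("final") is passed to the assembly on the last chunk of the walk
 * only; the assembly leaves keystream for the trailing partial block there,
 * and crypto_xor_cpy() applies just the needed tail bytes.
 */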

static void ctr_encrypt_one(struct crypto_skcipher *tfm, const u8 *src, u8 *dst)
{
	struct aesbs_ctr_ctx *ctx = crypto_skcipher_ctx(tfm);
	unsigned long flags;

	/*
	 * Temporarily disable interrupts to avoid races where cachelines are
	 * evicted when the CPU is interrupted to do something else.
	 */
	local_irq_save(flags);
	aes_encrypt(&ctx->fallback, dst, src);
	local_irq_restore(flags);
}

static int ctr_encrypt_sync(struct skcipher_request *req)
{
	if (!crypto_simd_usable())
		return crypto_ctr_encrypt_walk(req, ctr_encrypt_one);

	return ctr_encrypt(req);
}

static int aesbs_xts_setkey(struct crypto_skcipher *tfm, const u8 *in_key,
			    unsigned int key_len)
{
	struct aesbs_xts_ctx *ctx = crypto_skcipher_ctx(tfm);
	int err;

	err = xts_verify_key(tfm, in_key, key_len);
	if (err)
		return err;

	key_len /= 2;
	err = crypto_cipher_setkey(ctx->cts_tfm, in_key, key_len);
	if (err)
		return err;
	err = crypto_cipher_setkey(ctx->tweak_tfm, in_key + key_len, key_len);
	if (err)
		return err;

	return aesbs_setkey(tfm, in_key, key_len);
}
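
/*
 * An XTS key is two AES keys concatenated: the first half keys the data
 * cipher (the bit-sliced schedule plus cts_tfm, used for ciphertext
 * stealing), the second half keys tweak_tfm, which encrypts the IV to
 * produce the initial tweak.
 */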

static int xts_init(struct crypto_skcipher *tfm)
{
	struct aesbs_xts_ctx *ctx = crypto_skcipher_ctx(tfm);

	ctx->cts_tfm = crypto_alloc_cipher("aes", 0, 0);
	if (IS_ERR(ctx->cts_tfm))
		return PTR_ERR(ctx->cts_tfm);

	ctx->tweak_tfm = crypto_alloc_cipher("aes", 0, 0);
	if (IS_ERR(ctx->tweak_tfm))
		crypto_free_cipher(ctx->cts_tfm);

	return PTR_ERR_OR_ZERO(ctx->tweak_tfm);
}

static void xts_exit(struct crypto_skcipher *tfm)
{
	struct aesbs_xts_ctx *ctx = crypto_skcipher_ctx(tfm);

	crypto_free_cipher(ctx->tweak_tfm);
	crypto_free_cipher(ctx->cts_tfm);
}

static int __xts_crypt(struct skcipher_request *req, bool encrypt,
		       void (*fn)(u8 out[], u8 const in[], u8 const rk[],
				  int rounds, int blocks, u8 iv[], int))
{
	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
	struct aesbs_xts_ctx *ctx = crypto_skcipher_ctx(tfm);
	int tail = req->cryptlen % AES_BLOCK_SIZE;
	struct skcipher_request subreq;
	u8 buf[2 * AES_BLOCK_SIZE];
	struct skcipher_walk walk;
	int err;

	if (req->cryptlen < AES_BLOCK_SIZE)
		return -EINVAL;

	if (unlikely(tail)) {
		skcipher_request_set_tfm(&subreq, tfm);
		skcipher_request_set_callback(&subreq,
					      skcipher_request_flags(req),
					      NULL, NULL);
		skcipher_request_set_crypt(&subreq, req->src, req->dst,
					   req->cryptlen - tail, req->iv);
		req = &subreq;
	}

	err = skcipher_walk_virt(&walk, req, true);
	if (err)
		return err;

	crypto_cipher_encrypt_one(ctx->tweak_tfm, walk.iv, walk.iv);

	while (walk.nbytes >= AES_BLOCK_SIZE) {
		unsigned int blocks = walk.nbytes / AES_BLOCK_SIZE;
		int reorder_last_tweak = !encrypt && tail > 0;

		if (walk.nbytes < walk.total) {
			blocks = round_down(blocks,
					    walk.stride / AES_BLOCK_SIZE);
			reorder_last_tweak = 0;
		}

		kernel_neon_begin();
		fn(walk.dst.virt.addr, walk.src.virt.addr, ctx->key.rk,
		   ctx->key.rounds, blocks, walk.iv, reorder_last_tweak);
		kernel_neon_end();
		err = skcipher_walk_done(&walk,
					 walk.nbytes - blocks * AES_BLOCK_SIZE);
	}

	if (err || likely(!tail))
		return err;

	/* handle ciphertext stealing */
	scatterwalk_map_and_copy(buf, req->dst, req->cryptlen - AES_BLOCK_SIZE,
				 AES_BLOCK_SIZE, 0);
	memcpy(buf + AES_BLOCK_SIZE, buf, tail);
	scatterwalk_map_and_copy(buf, req->src, req->cryptlen, tail, 0);

	crypto_xor(buf, req->iv, AES_BLOCK_SIZE);

	if (encrypt)
		crypto_cipher_encrypt_one(ctx->cts_tfm, buf, buf);
	else
		crypto_cipher_decrypt_one(ctx->cts_tfm, buf, buf);

	crypto_xor(buf, req->iv, AES_BLOCK_SIZE);

	scatterwalk_map_and_copy(buf, req->dst, req->cryptlen - AES_BLOCK_SIZE,
				 AES_BLOCK_SIZE + tail, 1);

	return 0;
}
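
/*
 * Ciphertext stealing, roughly: when the request is not block-aligned, the
 * walk above covers only the complete blocks. The last full ciphertext
 * block is then read back, its leading bytes are "stolen" to become the
 * short final block, and the remaining plaintext tail is folded in and
 * processed with cts_tfm using the tweak left behind in req->iv.
 */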

static int xts_encrypt(struct skcipher_request *req)
{
	return __xts_crypt(req, true, aesbs_xts_encrypt);
}

static int xts_decrypt(struct skcipher_request *req)
{
	return __xts_crypt(req, false, aesbs_xts_decrypt);
}

static struct skcipher_alg aes_algs[] = { {
	.base.cra_name		= "__ecb(aes)",
	.base.cra_driver_name	= "__ecb-aes-neonbs",
	.base.cra_priority	= 250,
	.base.cra_blocksize	= AES_BLOCK_SIZE,
	.base.cra_ctxsize	= sizeof(struct aesbs_ctx),
	.base.cra_module	= THIS_MODULE,
	.base.cra_flags		= CRYPTO_ALG_INTERNAL,

	.min_keysize		= AES_MIN_KEY_SIZE,
	.max_keysize		= AES_MAX_KEY_SIZE,
	.walksize		= 8 * AES_BLOCK_SIZE,
	.setkey			= aesbs_setkey,
	.encrypt		= ecb_encrypt,
	.decrypt		= ecb_decrypt,
}, {
	.base.cra_name		= "__cbc(aes)",
	.base.cra_driver_name	= "__cbc-aes-neonbs",
	.base.cra_priority	= 250,
	.base.cra_blocksize	= AES_BLOCK_SIZE,
	.base.cra_ctxsize	= sizeof(struct aesbs_cbc_ctx),
	.base.cra_module	= THIS_MODULE,
	.base.cra_flags		= CRYPTO_ALG_INTERNAL |
				  CRYPTO_ALG_NEED_FALLBACK,

	.min_keysize		= AES_MIN_KEY_SIZE,
	.max_keysize		= AES_MAX_KEY_SIZE,
	.walksize		= 8 * AES_BLOCK_SIZE,
	.ivsize			= AES_BLOCK_SIZE,
	.setkey			= aesbs_cbc_setkey,
	.encrypt		= cbc_encrypt,
	.decrypt		= cbc_decrypt,
	.init			= cbc_init,
	.exit			= cbc_exit,
}, {
	.base.cra_name		= "__ctr(aes)",
	.base.cra_driver_name	= "__ctr-aes-neonbs",
	.base.cra_priority	= 250,
	.base.cra_blocksize	= 1,
	.base.cra_ctxsize	= sizeof(struct aesbs_ctx),
	.base.cra_module	= THIS_MODULE,
	.base.cra_flags		= CRYPTO_ALG_INTERNAL,

	.min_keysize		= AES_MIN_KEY_SIZE,
	.max_keysize		= AES_MAX_KEY_SIZE,
	.chunksize		= AES_BLOCK_SIZE,
	.walksize		= 8 * AES_BLOCK_SIZE,
	.ivsize			= AES_BLOCK_SIZE,
	.setkey			= aesbs_setkey,
	.encrypt		= ctr_encrypt,
	.decrypt		= ctr_encrypt,
}, {
	.base.cra_name		= "ctr(aes)",
	.base.cra_driver_name	= "ctr-aes-neonbs-sync",
	.base.cra_priority	= 250 - 1,
	.base.cra_blocksize	= 1,
	.base.cra_ctxsize	= sizeof(struct aesbs_ctr_ctx),
	.base.cra_module	= THIS_MODULE,

	.min_keysize		= AES_MIN_KEY_SIZE,
	.max_keysize		= AES_MAX_KEY_SIZE,
	.chunksize		= AES_BLOCK_SIZE,
	.walksize		= 8 * AES_BLOCK_SIZE,
	.ivsize			= AES_BLOCK_SIZE,
	.setkey			= aesbs_ctr_setkey_sync,
	.encrypt		= ctr_encrypt_sync,
	.decrypt		= ctr_encrypt_sync,
}, {
	.base.cra_name		= "__xts(aes)",
	.base.cra_driver_name	= "__xts-aes-neonbs",
	.base.cra_priority	= 250,
	.base.cra_blocksize	= AES_BLOCK_SIZE,
	.base.cra_ctxsize	= sizeof(struct aesbs_xts_ctx),
	.base.cra_module	= THIS_MODULE,
	.base.cra_flags		= CRYPTO_ALG_INTERNAL,

	.min_keysize		= 2 * AES_MIN_KEY_SIZE,
	.max_keysize		= 2 * AES_MAX_KEY_SIZE,
	.walksize		= 8 * AES_BLOCK_SIZE,
	.ivsize			= AES_BLOCK_SIZE,
	.setkey			= aesbs_xts_setkey,
	.encrypt		= xts_encrypt,
	.decrypt		= xts_decrypt,
	.init			= xts_init,
	.exit			= xts_exit,
} };

static struct simd_skcipher_alg *aes_simd_algs[ARRAY_SIZE(aes_algs)];

static void aes_exit(void)
{
	int i;

	for (i = 0; i < ARRAY_SIZE(aes_simd_algs); i++)
		if (aes_simd_algs[i])
			simd_skcipher_free(aes_simd_algs[i]);

	crypto_unregister_skciphers(aes_algs, ARRAY_SIZE(aes_algs));
}

static int __init aes_init(void)
{
	struct simd_skcipher_alg *simd;
	const char *basename;
	const char *algname;
	const char *drvname;
	int err;
	int i;

	if (!(elf_hwcap & HWCAP_NEON))
		return -ENODEV;

	err = crypto_register_skciphers(aes_algs, ARRAY_SIZE(aes_algs));
	if (err)
		return err;

	for (i = 0; i < ARRAY_SIZE(aes_algs); i++) {
		if (!(aes_algs[i].base.cra_flags & CRYPTO_ALG_INTERNAL))
			continue;

		algname = aes_algs[i].base.cra_name + 2;
		drvname = aes_algs[i].base.cra_driver_name + 2;
		basename = aes_algs[i].base.cra_driver_name;
		simd = simd_skcipher_create_compat(algname, drvname, basename);
		err = PTR_ERR(simd);
		if (IS_ERR(simd))
			goto unregister_simds;

		aes_simd_algs[i] = simd;
	}
	return 0;

unregister_simds:
	aes_exit();
	return err;
}

late_initcall(aes_init);
module_exit(aes_exit);
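
/*
 * Note on registration: the "__"-prefixed algorithms are marked
 * CRYPTO_ALG_INTERNAL and are only reachable through the simd wrappers
 * created in aes_init(), which defer requests when NEON is unusable in the
 * calling context. Only "ctr-aes-neonbs-sync" is registered directly, since
 * it carries its own scalar fallback. A user simply requests the generic
 * name, e.g. crypto_alloc_skcipher("ctr(aes)", 0, 0), and may be routed to
 * one of these implementations depending on priority.
 */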