1 // SPDX-License-Identifier: GPL-2.0-only
3 * Bit sliced AES using NEON instructions
5 * Copyright (C) 2017 Linaro Ltd <ard.biesheuvel@linaro.org>
10 #include <crypto/aes.h>
11 #include <crypto/cbc.h>
12 #include <crypto/ctr.h>
13 #include <crypto/internal/simd.h>
14 #include <crypto/internal/skcipher.h>
15 #include <crypto/scatterwalk.h>
16 #include <crypto/xts.h>
17 #include <linux/module.h>
19 MODULE_AUTHOR("Ard Biesheuvel <ard.biesheuvel@linaro.org>");
20 MODULE_LICENSE("GPL v2");
22 MODULE_ALIAS_CRYPTO("ecb(aes)");
23 MODULE_ALIAS_CRYPTO("cbc(aes)");
24 MODULE_ALIAS_CRYPTO("ctr(aes)");
25 MODULE_ALIAS_CRYPTO("xts(aes)");
27 asmlinkage
void aesbs_convert_key(u8 out
[], u32
const rk
[], int rounds
);
29 asmlinkage
void aesbs_ecb_encrypt(u8 out
[], u8
const in
[], u8
const rk
[],
30 int rounds
, int blocks
);
31 asmlinkage
void aesbs_ecb_decrypt(u8 out
[], u8
const in
[], u8
const rk
[],
32 int rounds
, int blocks
);
34 asmlinkage
void aesbs_cbc_decrypt(u8 out
[], u8
const in
[], u8
const rk
[],
35 int rounds
, int blocks
, u8 iv
[]);
37 asmlinkage
void aesbs_ctr_encrypt(u8 out
[], u8
const in
[], u8
const rk
[],
38 int rounds
, int blocks
, u8 ctr
[], u8 final
[]);
40 asmlinkage
void aesbs_xts_encrypt(u8 out
[], u8
const in
[], u8
const rk
[],
41 int rounds
, int blocks
, u8 iv
[], int);
42 asmlinkage
void aesbs_xts_decrypt(u8 out
[], u8
const in
[], u8
const rk
[],
43 int rounds
, int blocks
, u8 iv
[], int);
47 u8 rk
[13 * (8 * AES_BLOCK_SIZE
) + 32] __aligned(AES_BLOCK_SIZE
);
50 struct aesbs_cbc_ctx
{
52 struct crypto_cipher
*enc_tfm
;
55 struct aesbs_xts_ctx
{
57 struct crypto_cipher
*cts_tfm
;
58 struct crypto_cipher
*tweak_tfm
;
61 struct aesbs_ctr_ctx
{
62 struct aesbs_ctx key
; /* must be first member */
63 struct crypto_aes_ctx fallback
;
66 static int aesbs_setkey(struct crypto_skcipher
*tfm
, const u8
*in_key
,
69 struct aesbs_ctx
*ctx
= crypto_skcipher_ctx(tfm
);
70 struct crypto_aes_ctx rk
;
73 err
= aes_expandkey(&rk
, in_key
, key_len
);
77 ctx
->rounds
= 6 + key_len
/ 4;
80 aesbs_convert_key(ctx
->rk
, rk
.key_enc
, ctx
->rounds
);
86 static int __ecb_crypt(struct skcipher_request
*req
,
87 void (*fn
)(u8 out
[], u8
const in
[], u8
const rk
[],
88 int rounds
, int blocks
))
90 struct crypto_skcipher
*tfm
= crypto_skcipher_reqtfm(req
);
91 struct aesbs_ctx
*ctx
= crypto_skcipher_ctx(tfm
);
92 struct skcipher_walk walk
;
95 err
= skcipher_walk_virt(&walk
, req
, false);
97 while (walk
.nbytes
>= AES_BLOCK_SIZE
) {
98 unsigned int blocks
= walk
.nbytes
/ AES_BLOCK_SIZE
;
100 if (walk
.nbytes
< walk
.total
)
101 blocks
= round_down(blocks
,
102 walk
.stride
/ AES_BLOCK_SIZE
);
105 fn(walk
.dst
.virt
.addr
, walk
.src
.virt
.addr
, ctx
->rk
,
106 ctx
->rounds
, blocks
);
108 err
= skcipher_walk_done(&walk
,
109 walk
.nbytes
- blocks
* AES_BLOCK_SIZE
);
115 static int ecb_encrypt(struct skcipher_request
*req
)
117 return __ecb_crypt(req
, aesbs_ecb_encrypt
);
120 static int ecb_decrypt(struct skcipher_request
*req
)
122 return __ecb_crypt(req
, aesbs_ecb_decrypt
);
125 static int aesbs_cbc_setkey(struct crypto_skcipher
*tfm
, const u8
*in_key
,
126 unsigned int key_len
)
128 struct aesbs_cbc_ctx
*ctx
= crypto_skcipher_ctx(tfm
);
129 struct crypto_aes_ctx rk
;
132 err
= aes_expandkey(&rk
, in_key
, key_len
);
136 ctx
->key
.rounds
= 6 + key_len
/ 4;
139 aesbs_convert_key(ctx
->key
.rk
, rk
.key_enc
, ctx
->key
.rounds
);
141 memzero_explicit(&rk
, sizeof(rk
));
143 return crypto_cipher_setkey(ctx
->enc_tfm
, in_key
, key_len
);
146 static void cbc_encrypt_one(struct crypto_skcipher
*tfm
, const u8
*src
, u8
*dst
)
148 struct aesbs_cbc_ctx
*ctx
= crypto_skcipher_ctx(tfm
);
150 crypto_cipher_encrypt_one(ctx
->enc_tfm
, dst
, src
);
153 static int cbc_encrypt(struct skcipher_request
*req
)
155 return crypto_cbc_encrypt_walk(req
, cbc_encrypt_one
);
158 static int cbc_decrypt(struct skcipher_request
*req
)
160 struct crypto_skcipher
*tfm
= crypto_skcipher_reqtfm(req
);
161 struct aesbs_cbc_ctx
*ctx
= crypto_skcipher_ctx(tfm
);
162 struct skcipher_walk walk
;
165 err
= skcipher_walk_virt(&walk
, req
, false);
167 while (walk
.nbytes
>= AES_BLOCK_SIZE
) {
168 unsigned int blocks
= walk
.nbytes
/ AES_BLOCK_SIZE
;
170 if (walk
.nbytes
< walk
.total
)
171 blocks
= round_down(blocks
,
172 walk
.stride
/ AES_BLOCK_SIZE
);
175 aesbs_cbc_decrypt(walk
.dst
.virt
.addr
, walk
.src
.virt
.addr
,
176 ctx
->key
.rk
, ctx
->key
.rounds
, blocks
,
179 err
= skcipher_walk_done(&walk
,
180 walk
.nbytes
- blocks
* AES_BLOCK_SIZE
);
186 static int cbc_init(struct crypto_tfm
*tfm
)
188 struct aesbs_cbc_ctx
*ctx
= crypto_tfm_ctx(tfm
);
190 ctx
->enc_tfm
= crypto_alloc_cipher("aes", 0, 0);
192 return PTR_ERR_OR_ZERO(ctx
->enc_tfm
);
195 static void cbc_exit(struct crypto_tfm
*tfm
)
197 struct aesbs_cbc_ctx
*ctx
= crypto_tfm_ctx(tfm
);
199 crypto_free_cipher(ctx
->enc_tfm
);
202 static int aesbs_ctr_setkey_sync(struct crypto_skcipher
*tfm
, const u8
*in_key
,
203 unsigned int key_len
)
205 struct aesbs_ctr_ctx
*ctx
= crypto_skcipher_ctx(tfm
);
208 err
= aes_expandkey(&ctx
->fallback
, in_key
, key_len
);
212 ctx
->key
.rounds
= 6 + key_len
/ 4;
215 aesbs_convert_key(ctx
->key
.rk
, ctx
->fallback
.key_enc
, ctx
->key
.rounds
);
221 static int ctr_encrypt(struct skcipher_request
*req
)
223 struct crypto_skcipher
*tfm
= crypto_skcipher_reqtfm(req
);
224 struct aesbs_ctx
*ctx
= crypto_skcipher_ctx(tfm
);
225 struct skcipher_walk walk
;
226 u8 buf
[AES_BLOCK_SIZE
];
229 err
= skcipher_walk_virt(&walk
, req
, false);
231 while (walk
.nbytes
> 0) {
232 unsigned int blocks
= walk
.nbytes
/ AES_BLOCK_SIZE
;
233 u8
*final
= (walk
.total
% AES_BLOCK_SIZE
) ? buf
: NULL
;
235 if (walk
.nbytes
< walk
.total
) {
236 blocks
= round_down(blocks
,
237 walk
.stride
/ AES_BLOCK_SIZE
);
242 aesbs_ctr_encrypt(walk
.dst
.virt
.addr
, walk
.src
.virt
.addr
,
243 ctx
->rk
, ctx
->rounds
, blocks
, walk
.iv
, final
);
247 u8
*dst
= walk
.dst
.virt
.addr
+ blocks
* AES_BLOCK_SIZE
;
248 u8
*src
= walk
.src
.virt
.addr
+ blocks
* AES_BLOCK_SIZE
;
250 crypto_xor_cpy(dst
, src
, final
,
251 walk
.total
% AES_BLOCK_SIZE
);
253 err
= skcipher_walk_done(&walk
, 0);
256 err
= skcipher_walk_done(&walk
,
257 walk
.nbytes
- blocks
* AES_BLOCK_SIZE
);
263 static void ctr_encrypt_one(struct crypto_skcipher
*tfm
, const u8
*src
, u8
*dst
)
265 struct aesbs_ctr_ctx
*ctx
= crypto_skcipher_ctx(tfm
);
269 * Temporarily disable interrupts to avoid races where
270 * cachelines are evicted when the CPU is interrupted
271 * to do something else.
273 local_irq_save(flags
);
274 aes_encrypt(&ctx
->fallback
, dst
, src
);
275 local_irq_restore(flags
);
278 static int ctr_encrypt_sync(struct skcipher_request
*req
)
280 if (!crypto_simd_usable())
281 return crypto_ctr_encrypt_walk(req
, ctr_encrypt_one
);
283 return ctr_encrypt(req
);
286 static int aesbs_xts_setkey(struct crypto_skcipher
*tfm
, const u8
*in_key
,
287 unsigned int key_len
)
289 struct aesbs_xts_ctx
*ctx
= crypto_skcipher_ctx(tfm
);
292 err
= xts_verify_key(tfm
, in_key
, key_len
);
297 err
= crypto_cipher_setkey(ctx
->cts_tfm
, in_key
, key_len
);
300 err
= crypto_cipher_setkey(ctx
->tweak_tfm
, in_key
+ key_len
, key_len
);
304 return aesbs_setkey(tfm
, in_key
, key_len
);
307 static int xts_init(struct crypto_tfm
*tfm
)
309 struct aesbs_xts_ctx
*ctx
= crypto_tfm_ctx(tfm
);
311 ctx
->cts_tfm
= crypto_alloc_cipher("aes", 0, 0);
312 if (IS_ERR(ctx
->cts_tfm
))
313 return PTR_ERR(ctx
->cts_tfm
);
315 ctx
->tweak_tfm
= crypto_alloc_cipher("aes", 0, 0);
316 if (IS_ERR(ctx
->tweak_tfm
))
317 crypto_free_cipher(ctx
->cts_tfm
);
319 return PTR_ERR_OR_ZERO(ctx
->tweak_tfm
);
322 static void xts_exit(struct crypto_tfm
*tfm
)
324 struct aesbs_xts_ctx
*ctx
= crypto_tfm_ctx(tfm
);
326 crypto_free_cipher(ctx
->tweak_tfm
);
327 crypto_free_cipher(ctx
->cts_tfm
);
330 static int __xts_crypt(struct skcipher_request
*req
, bool encrypt
,
331 void (*fn
)(u8 out
[], u8
const in
[], u8
const rk
[],
332 int rounds
, int blocks
, u8 iv
[], int))
334 struct crypto_skcipher
*tfm
= crypto_skcipher_reqtfm(req
);
335 struct aesbs_xts_ctx
*ctx
= crypto_skcipher_ctx(tfm
);
336 int tail
= req
->cryptlen
% AES_BLOCK_SIZE
;
337 struct skcipher_request subreq
;
338 u8 buf
[2 * AES_BLOCK_SIZE
];
339 struct skcipher_walk walk
;
342 if (req
->cryptlen
< AES_BLOCK_SIZE
)
345 if (unlikely(tail
)) {
346 skcipher_request_set_tfm(&subreq
, tfm
);
347 skcipher_request_set_callback(&subreq
,
348 skcipher_request_flags(req
),
350 skcipher_request_set_crypt(&subreq
, req
->src
, req
->dst
,
351 req
->cryptlen
- tail
, req
->iv
);
355 err
= skcipher_walk_virt(&walk
, req
, true);
359 crypto_cipher_encrypt_one(ctx
->tweak_tfm
, walk
.iv
, walk
.iv
);
361 while (walk
.nbytes
>= AES_BLOCK_SIZE
) {
362 unsigned int blocks
= walk
.nbytes
/ AES_BLOCK_SIZE
;
363 int reorder_last_tweak
= !encrypt
&& tail
> 0;
365 if (walk
.nbytes
< walk
.total
) {
366 blocks
= round_down(blocks
,
367 walk
.stride
/ AES_BLOCK_SIZE
);
368 reorder_last_tweak
= 0;
372 fn(walk
.dst
.virt
.addr
, walk
.src
.virt
.addr
, ctx
->key
.rk
,
373 ctx
->key
.rounds
, blocks
, walk
.iv
, reorder_last_tweak
);
375 err
= skcipher_walk_done(&walk
,
376 walk
.nbytes
- blocks
* AES_BLOCK_SIZE
);
379 if (err
|| likely(!tail
))
382 /* handle ciphertext stealing */
383 scatterwalk_map_and_copy(buf
, req
->dst
, req
->cryptlen
- AES_BLOCK_SIZE
,
385 memcpy(buf
+ AES_BLOCK_SIZE
, buf
, tail
);
386 scatterwalk_map_and_copy(buf
, req
->src
, req
->cryptlen
, tail
, 0);
388 crypto_xor(buf
, req
->iv
, AES_BLOCK_SIZE
);
391 crypto_cipher_encrypt_one(ctx
->cts_tfm
, buf
, buf
);
393 crypto_cipher_decrypt_one(ctx
->cts_tfm
, buf
, buf
);
395 crypto_xor(buf
, req
->iv
, AES_BLOCK_SIZE
);
397 scatterwalk_map_and_copy(buf
, req
->dst
, req
->cryptlen
- AES_BLOCK_SIZE
,
398 AES_BLOCK_SIZE
+ tail
, 1);
402 static int xts_encrypt(struct skcipher_request
*req
)
404 return __xts_crypt(req
, true, aesbs_xts_encrypt
);
407 static int xts_decrypt(struct skcipher_request
*req
)
409 return __xts_crypt(req
, false, aesbs_xts_decrypt
);
412 static struct skcipher_alg aes_algs
[] = { {
413 .base
.cra_name
= "__ecb(aes)",
414 .base
.cra_driver_name
= "__ecb-aes-neonbs",
415 .base
.cra_priority
= 250,
416 .base
.cra_blocksize
= AES_BLOCK_SIZE
,
417 .base
.cra_ctxsize
= sizeof(struct aesbs_ctx
),
418 .base
.cra_module
= THIS_MODULE
,
419 .base
.cra_flags
= CRYPTO_ALG_INTERNAL
,
421 .min_keysize
= AES_MIN_KEY_SIZE
,
422 .max_keysize
= AES_MAX_KEY_SIZE
,
423 .walksize
= 8 * AES_BLOCK_SIZE
,
424 .setkey
= aesbs_setkey
,
425 .encrypt
= ecb_encrypt
,
426 .decrypt
= ecb_decrypt
,
428 .base
.cra_name
= "__cbc(aes)",
429 .base
.cra_driver_name
= "__cbc-aes-neonbs",
430 .base
.cra_priority
= 250,
431 .base
.cra_blocksize
= AES_BLOCK_SIZE
,
432 .base
.cra_ctxsize
= sizeof(struct aesbs_cbc_ctx
),
433 .base
.cra_module
= THIS_MODULE
,
434 .base
.cra_flags
= CRYPTO_ALG_INTERNAL
,
435 .base
.cra_init
= cbc_init
,
436 .base
.cra_exit
= cbc_exit
,
438 .min_keysize
= AES_MIN_KEY_SIZE
,
439 .max_keysize
= AES_MAX_KEY_SIZE
,
440 .walksize
= 8 * AES_BLOCK_SIZE
,
441 .ivsize
= AES_BLOCK_SIZE
,
442 .setkey
= aesbs_cbc_setkey
,
443 .encrypt
= cbc_encrypt
,
444 .decrypt
= cbc_decrypt
,
446 .base
.cra_name
= "__ctr(aes)",
447 .base
.cra_driver_name
= "__ctr-aes-neonbs",
448 .base
.cra_priority
= 250,
449 .base
.cra_blocksize
= 1,
450 .base
.cra_ctxsize
= sizeof(struct aesbs_ctx
),
451 .base
.cra_module
= THIS_MODULE
,
452 .base
.cra_flags
= CRYPTO_ALG_INTERNAL
,
454 .min_keysize
= AES_MIN_KEY_SIZE
,
455 .max_keysize
= AES_MAX_KEY_SIZE
,
456 .chunksize
= AES_BLOCK_SIZE
,
457 .walksize
= 8 * AES_BLOCK_SIZE
,
458 .ivsize
= AES_BLOCK_SIZE
,
459 .setkey
= aesbs_setkey
,
460 .encrypt
= ctr_encrypt
,
461 .decrypt
= ctr_encrypt
,
463 .base
.cra_name
= "ctr(aes)",
464 .base
.cra_driver_name
= "ctr-aes-neonbs-sync",
465 .base
.cra_priority
= 250 - 1,
466 .base
.cra_blocksize
= 1,
467 .base
.cra_ctxsize
= sizeof(struct aesbs_ctr_ctx
),
468 .base
.cra_module
= THIS_MODULE
,
470 .min_keysize
= AES_MIN_KEY_SIZE
,
471 .max_keysize
= AES_MAX_KEY_SIZE
,
472 .chunksize
= AES_BLOCK_SIZE
,
473 .walksize
= 8 * AES_BLOCK_SIZE
,
474 .ivsize
= AES_BLOCK_SIZE
,
475 .setkey
= aesbs_ctr_setkey_sync
,
476 .encrypt
= ctr_encrypt_sync
,
477 .decrypt
= ctr_encrypt_sync
,
479 .base
.cra_name
= "__xts(aes)",
480 .base
.cra_driver_name
= "__xts-aes-neonbs",
481 .base
.cra_priority
= 250,
482 .base
.cra_blocksize
= AES_BLOCK_SIZE
,
483 .base
.cra_ctxsize
= sizeof(struct aesbs_xts_ctx
),
484 .base
.cra_module
= THIS_MODULE
,
485 .base
.cra_flags
= CRYPTO_ALG_INTERNAL
,
486 .base
.cra_init
= xts_init
,
487 .base
.cra_exit
= xts_exit
,
489 .min_keysize
= 2 * AES_MIN_KEY_SIZE
,
490 .max_keysize
= 2 * AES_MAX_KEY_SIZE
,
491 .walksize
= 8 * AES_BLOCK_SIZE
,
492 .ivsize
= AES_BLOCK_SIZE
,
493 .setkey
= aesbs_xts_setkey
,
494 .encrypt
= xts_encrypt
,
495 .decrypt
= xts_decrypt
,
498 static struct simd_skcipher_alg
*aes_simd_algs
[ARRAY_SIZE(aes_algs
)];
500 static void aes_exit(void)
504 for (i
= 0; i
< ARRAY_SIZE(aes_simd_algs
); i
++)
505 if (aes_simd_algs
[i
])
506 simd_skcipher_free(aes_simd_algs
[i
]);
508 crypto_unregister_skciphers(aes_algs
, ARRAY_SIZE(aes_algs
));
511 static int __init
aes_init(void)
513 struct simd_skcipher_alg
*simd
;
514 const char *basename
;
520 if (!(elf_hwcap
& HWCAP_NEON
))
523 err
= crypto_register_skciphers(aes_algs
, ARRAY_SIZE(aes_algs
));
527 for (i
= 0; i
< ARRAY_SIZE(aes_algs
); i
++) {
528 if (!(aes_algs
[i
].base
.cra_flags
& CRYPTO_ALG_INTERNAL
))
531 algname
= aes_algs
[i
].base
.cra_name
+ 2;
532 drvname
= aes_algs
[i
].base
.cra_driver_name
+ 2;
533 basename
= aes_algs
[i
].base
.cra_driver_name
;
534 simd
= simd_skcipher_create_compat(algname
, drvname
, basename
);
537 goto unregister_simds
;
539 aes_simd_algs
[i
] = simd
;
548 late_initcall(aes_init
);
549 module_exit(aes_exit
);