2 * Glue Code for x86_64/AVX/AES-NI assembler optimized version of Camellia
4 * Copyright © 2012-2013 Jussi Kivilinna <jussi.kivilinna@iki.fi>
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License as published by
8 * the Free Software Foundation; either version 2 of the License, or
9 * (at your option) any later version.
13 #include <linux/module.h>
14 #include <linux/types.h>
15 #include <linux/crypto.h>
16 #include <linux/err.h>
17 #include <crypto/ablk_helper.h>
18 #include <crypto/algapi.h>
19 #include <crypto/ctr.h>
20 #include <crypto/lrw.h>
21 #include <crypto/xts.h>
23 #include <asm/xsave.h>
24 #include <asm/crypto/camellia.h>
25 #include <asm/crypto/glue_helper.h>
27 #define CAMELLIA_AESNI_PARALLEL_BLOCKS 16
29 /* 16-way parallel cipher functions (avx/aes-ni) */
30 asmlinkage
void camellia_ecb_enc_16way(struct camellia_ctx
*ctx
, u8
*dst
,
32 EXPORT_SYMBOL_GPL(camellia_ecb_enc_16way
);
34 asmlinkage
void camellia_ecb_dec_16way(struct camellia_ctx
*ctx
, u8
*dst
,
36 EXPORT_SYMBOL_GPL(camellia_ecb_dec_16way
);
38 asmlinkage
void camellia_cbc_dec_16way(struct camellia_ctx
*ctx
, u8
*dst
,
40 EXPORT_SYMBOL_GPL(camellia_cbc_dec_16way
);
42 asmlinkage
void camellia_ctr_16way(struct camellia_ctx
*ctx
, u8
*dst
,
43 const u8
*src
, le128
*iv
);
44 EXPORT_SYMBOL_GPL(camellia_ctr_16way
);
46 asmlinkage
void camellia_xts_enc_16way(struct camellia_ctx
*ctx
, u8
*dst
,
47 const u8
*src
, le128
*iv
);
48 EXPORT_SYMBOL_GPL(camellia_xts_enc_16way
);
50 asmlinkage
void camellia_xts_dec_16way(struct camellia_ctx
*ctx
, u8
*dst
,
51 const u8
*src
, le128
*iv
);
52 EXPORT_SYMBOL_GPL(camellia_xts_dec_16way
);
54 void camellia_xts_enc(void *ctx
, u128
*dst
, const u128
*src
, le128
*iv
)
56 glue_xts_crypt_128bit_one(ctx
, dst
, src
, iv
,
57 GLUE_FUNC_CAST(camellia_enc_blk
));
59 EXPORT_SYMBOL_GPL(camellia_xts_enc
);
61 void camellia_xts_dec(void *ctx
, u128
*dst
, const u128
*src
, le128
*iv
)
63 glue_xts_crypt_128bit_one(ctx
, dst
, src
, iv
,
64 GLUE_FUNC_CAST(camellia_dec_blk
));
66 EXPORT_SYMBOL_GPL(camellia_xts_dec
);
68 static const struct common_glue_ctx camellia_enc
= {
70 .fpu_blocks_limit
= CAMELLIA_AESNI_PARALLEL_BLOCKS
,
73 .num_blocks
= CAMELLIA_AESNI_PARALLEL_BLOCKS
,
74 .fn_u
= { .ecb
= GLUE_FUNC_CAST(camellia_ecb_enc_16way
) }
77 .fn_u
= { .ecb
= GLUE_FUNC_CAST(camellia_enc_blk_2way
) }
80 .fn_u
= { .ecb
= GLUE_FUNC_CAST(camellia_enc_blk
) }
84 static const struct common_glue_ctx camellia_ctr
= {
86 .fpu_blocks_limit
= CAMELLIA_AESNI_PARALLEL_BLOCKS
,
89 .num_blocks
= CAMELLIA_AESNI_PARALLEL_BLOCKS
,
90 .fn_u
= { .ctr
= GLUE_CTR_FUNC_CAST(camellia_ctr_16way
) }
93 .fn_u
= { .ctr
= GLUE_CTR_FUNC_CAST(camellia_crypt_ctr_2way
) }
96 .fn_u
= { .ctr
= GLUE_CTR_FUNC_CAST(camellia_crypt_ctr
) }
100 static const struct common_glue_ctx camellia_enc_xts
= {
102 .fpu_blocks_limit
= CAMELLIA_AESNI_PARALLEL_BLOCKS
,
105 .num_blocks
= CAMELLIA_AESNI_PARALLEL_BLOCKS
,
106 .fn_u
= { .xts
= GLUE_XTS_FUNC_CAST(camellia_xts_enc_16way
) }
109 .fn_u
= { .xts
= GLUE_XTS_FUNC_CAST(camellia_xts_enc
) }
113 static const struct common_glue_ctx camellia_dec
= {
115 .fpu_blocks_limit
= CAMELLIA_AESNI_PARALLEL_BLOCKS
,
118 .num_blocks
= CAMELLIA_AESNI_PARALLEL_BLOCKS
,
119 .fn_u
= { .ecb
= GLUE_FUNC_CAST(camellia_ecb_dec_16way
) }
122 .fn_u
= { .ecb
= GLUE_FUNC_CAST(camellia_dec_blk_2way
) }
125 .fn_u
= { .ecb
= GLUE_FUNC_CAST(camellia_dec_blk
) }
129 static const struct common_glue_ctx camellia_dec_cbc
= {
131 .fpu_blocks_limit
= CAMELLIA_AESNI_PARALLEL_BLOCKS
,
134 .num_blocks
= CAMELLIA_AESNI_PARALLEL_BLOCKS
,
135 .fn_u
= { .cbc
= GLUE_CBC_FUNC_CAST(camellia_cbc_dec_16way
) }
138 .fn_u
= { .cbc
= GLUE_CBC_FUNC_CAST(camellia_decrypt_cbc_2way
) }
141 .fn_u
= { .cbc
= GLUE_CBC_FUNC_CAST(camellia_dec_blk
) }
145 static const struct common_glue_ctx camellia_dec_xts
= {
147 .fpu_blocks_limit
= CAMELLIA_AESNI_PARALLEL_BLOCKS
,
150 .num_blocks
= CAMELLIA_AESNI_PARALLEL_BLOCKS
,
151 .fn_u
= { .xts
= GLUE_XTS_FUNC_CAST(camellia_xts_dec_16way
) }
154 .fn_u
= { .xts
= GLUE_XTS_FUNC_CAST(camellia_xts_dec
) }
158 static int ecb_encrypt(struct blkcipher_desc
*desc
, struct scatterlist
*dst
,
159 struct scatterlist
*src
, unsigned int nbytes
)
161 return glue_ecb_crypt_128bit(&camellia_enc
, desc
, dst
, src
, nbytes
);
164 static int ecb_decrypt(struct blkcipher_desc
*desc
, struct scatterlist
*dst
,
165 struct scatterlist
*src
, unsigned int nbytes
)
167 return glue_ecb_crypt_128bit(&camellia_dec
, desc
, dst
, src
, nbytes
);
170 static int cbc_encrypt(struct blkcipher_desc
*desc
, struct scatterlist
*dst
,
171 struct scatterlist
*src
, unsigned int nbytes
)
173 return glue_cbc_encrypt_128bit(GLUE_FUNC_CAST(camellia_enc_blk
), desc
,
177 static int cbc_decrypt(struct blkcipher_desc
*desc
, struct scatterlist
*dst
,
178 struct scatterlist
*src
, unsigned int nbytes
)
180 return glue_cbc_decrypt_128bit(&camellia_dec_cbc
, desc
, dst
, src
,
184 static int ctr_crypt(struct blkcipher_desc
*desc
, struct scatterlist
*dst
,
185 struct scatterlist
*src
, unsigned int nbytes
)
187 return glue_ctr_crypt_128bit(&camellia_ctr
, desc
, dst
, src
, nbytes
);
190 static inline bool camellia_fpu_begin(bool fpu_enabled
, unsigned int nbytes
)
192 return glue_fpu_begin(CAMELLIA_BLOCK_SIZE
,
193 CAMELLIA_AESNI_PARALLEL_BLOCKS
, NULL
, fpu_enabled
,
197 static inline void camellia_fpu_end(bool fpu_enabled
)
199 glue_fpu_end(fpu_enabled
);
202 static int camellia_setkey(struct crypto_tfm
*tfm
, const u8
*in_key
,
203 unsigned int key_len
)
205 return __camellia_setkey(crypto_tfm_ctx(tfm
), in_key
, key_len
,
210 struct camellia_ctx
*ctx
;
214 static void encrypt_callback(void *priv
, u8
*srcdst
, unsigned int nbytes
)
216 const unsigned int bsize
= CAMELLIA_BLOCK_SIZE
;
217 struct crypt_priv
*ctx
= priv
;
220 ctx
->fpu_enabled
= camellia_fpu_begin(ctx
->fpu_enabled
, nbytes
);
222 if (nbytes
>= CAMELLIA_AESNI_PARALLEL_BLOCKS
* bsize
) {
223 camellia_ecb_enc_16way(ctx
->ctx
, srcdst
, srcdst
);
224 srcdst
+= bsize
* CAMELLIA_AESNI_PARALLEL_BLOCKS
;
225 nbytes
-= bsize
* CAMELLIA_AESNI_PARALLEL_BLOCKS
;
228 while (nbytes
>= CAMELLIA_PARALLEL_BLOCKS
* bsize
) {
229 camellia_enc_blk_2way(ctx
->ctx
, srcdst
, srcdst
);
230 srcdst
+= bsize
* CAMELLIA_PARALLEL_BLOCKS
;
231 nbytes
-= bsize
* CAMELLIA_PARALLEL_BLOCKS
;
234 for (i
= 0; i
< nbytes
/ bsize
; i
++, srcdst
+= bsize
)
235 camellia_enc_blk(ctx
->ctx
, srcdst
, srcdst
);
238 static void decrypt_callback(void *priv
, u8
*srcdst
, unsigned int nbytes
)
240 const unsigned int bsize
= CAMELLIA_BLOCK_SIZE
;
241 struct crypt_priv
*ctx
= priv
;
244 ctx
->fpu_enabled
= camellia_fpu_begin(ctx
->fpu_enabled
, nbytes
);
246 if (nbytes
>= CAMELLIA_AESNI_PARALLEL_BLOCKS
* bsize
) {
247 camellia_ecb_dec_16way(ctx
->ctx
, srcdst
, srcdst
);
248 srcdst
+= bsize
* CAMELLIA_AESNI_PARALLEL_BLOCKS
;
249 nbytes
-= bsize
* CAMELLIA_AESNI_PARALLEL_BLOCKS
;
252 while (nbytes
>= CAMELLIA_PARALLEL_BLOCKS
* bsize
) {
253 camellia_dec_blk_2way(ctx
->ctx
, srcdst
, srcdst
);
254 srcdst
+= bsize
* CAMELLIA_PARALLEL_BLOCKS
;
255 nbytes
-= bsize
* CAMELLIA_PARALLEL_BLOCKS
;
258 for (i
= 0; i
< nbytes
/ bsize
; i
++, srcdst
+= bsize
)
259 camellia_dec_blk(ctx
->ctx
, srcdst
, srcdst
);
262 static int lrw_encrypt(struct blkcipher_desc
*desc
, struct scatterlist
*dst
,
263 struct scatterlist
*src
, unsigned int nbytes
)
265 struct camellia_lrw_ctx
*ctx
= crypto_blkcipher_ctx(desc
->tfm
);
266 be128 buf
[CAMELLIA_AESNI_PARALLEL_BLOCKS
];
267 struct crypt_priv crypt_ctx
= {
268 .ctx
= &ctx
->camellia_ctx
,
269 .fpu_enabled
= false,
271 struct lrw_crypt_req req
= {
273 .tbuflen
= sizeof(buf
),
275 .table_ctx
= &ctx
->lrw_table
,
276 .crypt_ctx
= &crypt_ctx
,
277 .crypt_fn
= encrypt_callback
,
281 desc
->flags
&= ~CRYPTO_TFM_REQ_MAY_SLEEP
;
282 ret
= lrw_crypt(desc
, dst
, src
, nbytes
, &req
);
283 camellia_fpu_end(crypt_ctx
.fpu_enabled
);
288 static int lrw_decrypt(struct blkcipher_desc
*desc
, struct scatterlist
*dst
,
289 struct scatterlist
*src
, unsigned int nbytes
)
291 struct camellia_lrw_ctx
*ctx
= crypto_blkcipher_ctx(desc
->tfm
);
292 be128 buf
[CAMELLIA_AESNI_PARALLEL_BLOCKS
];
293 struct crypt_priv crypt_ctx
= {
294 .ctx
= &ctx
->camellia_ctx
,
295 .fpu_enabled
= false,
297 struct lrw_crypt_req req
= {
299 .tbuflen
= sizeof(buf
),
301 .table_ctx
= &ctx
->lrw_table
,
302 .crypt_ctx
= &crypt_ctx
,
303 .crypt_fn
= decrypt_callback
,
307 desc
->flags
&= ~CRYPTO_TFM_REQ_MAY_SLEEP
;
308 ret
= lrw_crypt(desc
, dst
, src
, nbytes
, &req
);
309 camellia_fpu_end(crypt_ctx
.fpu_enabled
);
314 static int xts_encrypt(struct blkcipher_desc
*desc
, struct scatterlist
*dst
,
315 struct scatterlist
*src
, unsigned int nbytes
)
317 struct camellia_xts_ctx
*ctx
= crypto_blkcipher_ctx(desc
->tfm
);
319 return glue_xts_crypt_128bit(&camellia_enc_xts
, desc
, dst
, src
, nbytes
,
320 XTS_TWEAK_CAST(camellia_enc_blk
),
321 &ctx
->tweak_ctx
, &ctx
->crypt_ctx
);
324 static int xts_decrypt(struct blkcipher_desc
*desc
, struct scatterlist
*dst
,
325 struct scatterlist
*src
, unsigned int nbytes
)
327 struct camellia_xts_ctx
*ctx
= crypto_blkcipher_ctx(desc
->tfm
);
329 return glue_xts_crypt_128bit(&camellia_dec_xts
, desc
, dst
, src
, nbytes
,
330 XTS_TWEAK_CAST(camellia_enc_blk
),
331 &ctx
->tweak_ctx
, &ctx
->crypt_ctx
);
334 static struct crypto_alg cmll_algs
[10] = { {
335 .cra_name
= "__ecb-camellia-aesni",
336 .cra_driver_name
= "__driver-ecb-camellia-aesni",
338 .cra_flags
= CRYPTO_ALG_TYPE_BLKCIPHER
|
340 .cra_blocksize
= CAMELLIA_BLOCK_SIZE
,
341 .cra_ctxsize
= sizeof(struct camellia_ctx
),
343 .cra_type
= &crypto_blkcipher_type
,
344 .cra_module
= THIS_MODULE
,
347 .min_keysize
= CAMELLIA_MIN_KEY_SIZE
,
348 .max_keysize
= CAMELLIA_MAX_KEY_SIZE
,
349 .setkey
= camellia_setkey
,
350 .encrypt
= ecb_encrypt
,
351 .decrypt
= ecb_decrypt
,
355 .cra_name
= "__cbc-camellia-aesni",
356 .cra_driver_name
= "__driver-cbc-camellia-aesni",
358 .cra_flags
= CRYPTO_ALG_TYPE_BLKCIPHER
|
360 .cra_blocksize
= CAMELLIA_BLOCK_SIZE
,
361 .cra_ctxsize
= sizeof(struct camellia_ctx
),
363 .cra_type
= &crypto_blkcipher_type
,
364 .cra_module
= THIS_MODULE
,
367 .min_keysize
= CAMELLIA_MIN_KEY_SIZE
,
368 .max_keysize
= CAMELLIA_MAX_KEY_SIZE
,
369 .setkey
= camellia_setkey
,
370 .encrypt
= cbc_encrypt
,
371 .decrypt
= cbc_decrypt
,
375 .cra_name
= "__ctr-camellia-aesni",
376 .cra_driver_name
= "__driver-ctr-camellia-aesni",
378 .cra_flags
= CRYPTO_ALG_TYPE_BLKCIPHER
|
381 .cra_ctxsize
= sizeof(struct camellia_ctx
),
383 .cra_type
= &crypto_blkcipher_type
,
384 .cra_module
= THIS_MODULE
,
387 .min_keysize
= CAMELLIA_MIN_KEY_SIZE
,
388 .max_keysize
= CAMELLIA_MAX_KEY_SIZE
,
389 .ivsize
= CAMELLIA_BLOCK_SIZE
,
390 .setkey
= camellia_setkey
,
391 .encrypt
= ctr_crypt
,
392 .decrypt
= ctr_crypt
,
396 .cra_name
= "__lrw-camellia-aesni",
397 .cra_driver_name
= "__driver-lrw-camellia-aesni",
399 .cra_flags
= CRYPTO_ALG_TYPE_BLKCIPHER
|
401 .cra_blocksize
= CAMELLIA_BLOCK_SIZE
,
402 .cra_ctxsize
= sizeof(struct camellia_lrw_ctx
),
404 .cra_type
= &crypto_blkcipher_type
,
405 .cra_module
= THIS_MODULE
,
406 .cra_exit
= lrw_camellia_exit_tfm
,
409 .min_keysize
= CAMELLIA_MIN_KEY_SIZE
+
411 .max_keysize
= CAMELLIA_MAX_KEY_SIZE
+
413 .ivsize
= CAMELLIA_BLOCK_SIZE
,
414 .setkey
= lrw_camellia_setkey
,
415 .encrypt
= lrw_encrypt
,
416 .decrypt
= lrw_decrypt
,
420 .cra_name
= "__xts-camellia-aesni",
421 .cra_driver_name
= "__driver-xts-camellia-aesni",
423 .cra_flags
= CRYPTO_ALG_TYPE_BLKCIPHER
|
425 .cra_blocksize
= CAMELLIA_BLOCK_SIZE
,
426 .cra_ctxsize
= sizeof(struct camellia_xts_ctx
),
428 .cra_type
= &crypto_blkcipher_type
,
429 .cra_module
= THIS_MODULE
,
432 .min_keysize
= CAMELLIA_MIN_KEY_SIZE
* 2,
433 .max_keysize
= CAMELLIA_MAX_KEY_SIZE
* 2,
434 .ivsize
= CAMELLIA_BLOCK_SIZE
,
435 .setkey
= xts_camellia_setkey
,
436 .encrypt
= xts_encrypt
,
437 .decrypt
= xts_decrypt
,
441 .cra_name
= "ecb(camellia)",
442 .cra_driver_name
= "ecb-camellia-aesni",
444 .cra_flags
= CRYPTO_ALG_TYPE_ABLKCIPHER
| CRYPTO_ALG_ASYNC
,
445 .cra_blocksize
= CAMELLIA_BLOCK_SIZE
,
446 .cra_ctxsize
= sizeof(struct async_helper_ctx
),
448 .cra_type
= &crypto_ablkcipher_type
,
449 .cra_module
= THIS_MODULE
,
450 .cra_init
= ablk_init
,
451 .cra_exit
= ablk_exit
,
454 .min_keysize
= CAMELLIA_MIN_KEY_SIZE
,
455 .max_keysize
= CAMELLIA_MAX_KEY_SIZE
,
456 .setkey
= ablk_set_key
,
457 .encrypt
= ablk_encrypt
,
458 .decrypt
= ablk_decrypt
,
462 .cra_name
= "cbc(camellia)",
463 .cra_driver_name
= "cbc-camellia-aesni",
465 .cra_flags
= CRYPTO_ALG_TYPE_ABLKCIPHER
| CRYPTO_ALG_ASYNC
,
466 .cra_blocksize
= CAMELLIA_BLOCK_SIZE
,
467 .cra_ctxsize
= sizeof(struct async_helper_ctx
),
469 .cra_type
= &crypto_ablkcipher_type
,
470 .cra_module
= THIS_MODULE
,
471 .cra_init
= ablk_init
,
472 .cra_exit
= ablk_exit
,
475 .min_keysize
= CAMELLIA_MIN_KEY_SIZE
,
476 .max_keysize
= CAMELLIA_MAX_KEY_SIZE
,
477 .ivsize
= CAMELLIA_BLOCK_SIZE
,
478 .setkey
= ablk_set_key
,
479 .encrypt
= __ablk_encrypt
,
480 .decrypt
= ablk_decrypt
,
484 .cra_name
= "ctr(camellia)",
485 .cra_driver_name
= "ctr-camellia-aesni",
487 .cra_flags
= CRYPTO_ALG_TYPE_ABLKCIPHER
| CRYPTO_ALG_ASYNC
,
489 .cra_ctxsize
= sizeof(struct async_helper_ctx
),
491 .cra_type
= &crypto_ablkcipher_type
,
492 .cra_module
= THIS_MODULE
,
493 .cra_init
= ablk_init
,
494 .cra_exit
= ablk_exit
,
497 .min_keysize
= CAMELLIA_MIN_KEY_SIZE
,
498 .max_keysize
= CAMELLIA_MAX_KEY_SIZE
,
499 .ivsize
= CAMELLIA_BLOCK_SIZE
,
500 .setkey
= ablk_set_key
,
501 .encrypt
= ablk_encrypt
,
502 .decrypt
= ablk_encrypt
,
507 .cra_name
= "lrw(camellia)",
508 .cra_driver_name
= "lrw-camellia-aesni",
510 .cra_flags
= CRYPTO_ALG_TYPE_ABLKCIPHER
| CRYPTO_ALG_ASYNC
,
511 .cra_blocksize
= CAMELLIA_BLOCK_SIZE
,
512 .cra_ctxsize
= sizeof(struct async_helper_ctx
),
514 .cra_type
= &crypto_ablkcipher_type
,
515 .cra_module
= THIS_MODULE
,
516 .cra_init
= ablk_init
,
517 .cra_exit
= ablk_exit
,
520 .min_keysize
= CAMELLIA_MIN_KEY_SIZE
+
522 .max_keysize
= CAMELLIA_MAX_KEY_SIZE
+
524 .ivsize
= CAMELLIA_BLOCK_SIZE
,
525 .setkey
= ablk_set_key
,
526 .encrypt
= ablk_encrypt
,
527 .decrypt
= ablk_decrypt
,
531 .cra_name
= "xts(camellia)",
532 .cra_driver_name
= "xts-camellia-aesni",
534 .cra_flags
= CRYPTO_ALG_TYPE_ABLKCIPHER
| CRYPTO_ALG_ASYNC
,
535 .cra_blocksize
= CAMELLIA_BLOCK_SIZE
,
536 .cra_ctxsize
= sizeof(struct async_helper_ctx
),
538 .cra_type
= &crypto_ablkcipher_type
,
539 .cra_module
= THIS_MODULE
,
540 .cra_init
= ablk_init
,
541 .cra_exit
= ablk_exit
,
544 .min_keysize
= CAMELLIA_MIN_KEY_SIZE
* 2,
545 .max_keysize
= CAMELLIA_MAX_KEY_SIZE
* 2,
546 .ivsize
= CAMELLIA_BLOCK_SIZE
,
547 .setkey
= ablk_set_key
,
548 .encrypt
= ablk_encrypt
,
549 .decrypt
= ablk_decrypt
,
554 static int __init
camellia_aesni_init(void)
558 if (!cpu_has_avx
|| !cpu_has_aes
|| !cpu_has_osxsave
) {
559 pr_info("AVX or AES-NI instructions are not detected.\n");
563 xcr0
= xgetbv(XCR_XFEATURE_ENABLED_MASK
);
564 if ((xcr0
& (XSTATE_SSE
| XSTATE_YMM
)) != (XSTATE_SSE
| XSTATE_YMM
)) {
565 pr_info("AVX detected but unusable.\n");
569 return crypto_register_algs(cmll_algs
, ARRAY_SIZE(cmll_algs
));
572 static void __exit
camellia_aesni_fini(void)
574 crypto_unregister_algs(cmll_algs
, ARRAY_SIZE(cmll_algs
));
577 module_init(camellia_aesni_init
);
578 module_exit(camellia_aesni_fini
);
580 MODULE_LICENSE("GPL");
581 MODULE_DESCRIPTION("Camellia Cipher Algorithm, AES-NI/AVX optimized");
582 MODULE_ALIAS_CRYPTO("camellia");
583 MODULE_ALIAS_CRYPTO("camellia-asm");