/*
 * Accelerated GHASH implementation with Intel PCLMULQDQ-NI
 * instructions. This file contains glue code.
 *
 * Copyright (c) 2009 Intel Corp.
 *   Author: Huang Ying <ying.huang@intel.com>
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 as published
 * by the Free Software Foundation.
 */
#include <linux/err.h>
#include <linux/module.h>
#include <linux/init.h>
#include <linux/kernel.h>
#include <linux/crypto.h>
#include <crypto/algapi.h>
#include <crypto/cryptd.h>
#include <crypto/gf128mul.h>
#include <crypto/internal/hash.h>
#include <asm/fpu/api.h>
#include <asm/cpu_device_id.h>

#define GHASH_BLOCK_SIZE	16
#define GHASH_DIGEST_SIZE	16
void clmul_ghash_mul(char *dst, const u128 *shash);

void clmul_ghash_update(char *dst, const char *src, unsigned int srclen,
			const u128 *shash);
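/*
 * The two routines above are the PCLMULQDQ primitives this glue code
 * builds on; in the kernel tree they are implemented in the companion
 * assembly file (ghash-clmulni-intel_asm.S).  clmul_ghash_mul()
 * multiplies the 16-byte block at 'dst' by the hashed key in place, and
 * clmul_ghash_update() folds all full 16-byte blocks of 'src' into 'dst'.
 * Both use XMM registers, so callers must hold the FPU via
 * kernel_fpu_begin()/kernel_fpu_end().
 */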
struct ghash_async_ctx {
	struct cryptd_ahash *cryptd_tfm;
};

struct ghash_ctx {
	u128 shash;
};

struct ghash_desc_ctx {
	u8 buffer[GHASH_BLOCK_SIZE];
	u32 bytes;	/* bytes still missing from a partial block */
};
static int ghash_init(struct shash_desc *desc)
{
	struct ghash_desc_ctx *dctx = shash_desc_ctx(desc);

	memset(dctx, 0, sizeof(*dctx));

	return 0;
}
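/*
 * Key setup below stores the hash key H premultiplied by x in GF(2^128),
 * the form expected by the PCLMULQDQ routines.  The shift-by-one performs
 * that multiplication; when the bit shifted out of the top is set, the
 * 0xc2 byte, which encodes the GHASH reduction polynomial
 * x^128 + x^7 + x^2 + x + 1 in the bit-reflected convention, is folded
 * back in.
 */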
static int ghash_setkey(struct crypto_shash *tfm,
			const u8 *key, unsigned int keylen)
{
	struct ghash_ctx *ctx = crypto_shash_ctx(tfm);
	be128 *x = (be128 *)key;
	u64 a, b;

	if (keylen != GHASH_BLOCK_SIZE) {
		crypto_shash_set_flags(tfm, CRYPTO_TFM_RES_BAD_KEY_LEN);
		return -EINVAL;
	}

	/* perform multiplication by 'x' in GF(2^128) */
	a = be64_to_cpu(x->a);
	b = be64_to_cpu(x->b);

	ctx->shash.a = (b << 1) | (a >> 63);
	ctx->shash.b = (a << 1) | (b >> 63);

	if (a >> 63)
		ctx->shash.b ^= ((u64)0xc2) << 56;

	return 0;
}
static int ghash_update(struct shash_desc *desc,
			const u8 *src, unsigned int srclen)
{
	struct ghash_desc_ctx *dctx = shash_desc_ctx(desc);
	struct ghash_ctx *ctx = crypto_shash_ctx(desc->tfm);
	u8 *dst = dctx->buffer;

	kernel_fpu_begin();
	if (dctx->bytes) {
		/* complete the partial block left over from the last call */
		int n = min(srclen, dctx->bytes);
		u8 *pos = dst + (GHASH_BLOCK_SIZE - dctx->bytes);

		dctx->bytes -= n;
		srclen -= n;

		while (n--)
			*pos++ ^= *src++;

		if (!dctx->bytes)
			clmul_ghash_mul(dst, &ctx->shash);
	}

	clmul_ghash_update(dst, src, srclen, &ctx->shash);
	kernel_fpu_end();

	if (srclen & 0xf) {
		/* buffer the trailing partial block for the next call */
		src += srclen - (srclen & 0xf);
		srclen &= 0xf;
		dctx->bytes = GHASH_BLOCK_SIZE - srclen;
		memcpy(dst, src, srclen);
	}

	return 0;
}
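/*
 * ghash_flush() treats the missing bytes of a buffered partial block as
 * zeroes (the XOR with 0 below is that padding) and folds the block into
 * the digest so that ghash_final() can copy out a complete result.
 */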
static void ghash_flush(struct ghash_ctx *ctx, struct ghash_desc_ctx *dctx)
{
	u8 *dst = dctx->buffer;

	if (dctx->bytes) {
		u8 *tmp = dst + (GHASH_BLOCK_SIZE - dctx->bytes);

		while (dctx->bytes--)
			*tmp++ ^= 0;

		kernel_fpu_begin();
		clmul_ghash_mul(dst, &ctx->shash);
		kernel_fpu_end();
	}

	dctx->bytes = 0;
}
static int ghash_final(struct shash_desc *desc, u8 *dst)
{
	struct ghash_desc_ctx *dctx = shash_desc_ctx(desc);
	struct ghash_ctx *ctx = crypto_shash_ctx(desc->tfm);
	u8 *buf = dctx->buffer;

	ghash_flush(ctx, dctx);
	memcpy(dst, buf, GHASH_BLOCK_SIZE);

	return 0;
}
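/*
 * The synchronous shash below is marked CRYPTO_ALG_INTERNAL: it uses the
 * FPU unconditionally, so it is only reachable through the cryptd-based
 * async wrapper registered further down, never directly by normal users.
 */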
static struct shash_alg ghash_alg = {
	.digestsize	= GHASH_DIGEST_SIZE,
	.init		= ghash_init,
	.update		= ghash_update,
	.final		= ghash_final,
	.setkey		= ghash_setkey,
	.descsize	= sizeof(struct ghash_desc_ctx),
	.base		= {
		.cra_name		= "__ghash",
		.cra_driver_name	= "__ghash-pclmulqdqni",
		.cra_flags		= CRYPTO_ALG_INTERNAL,
		.cra_blocksize		= GHASH_BLOCK_SIZE,
		.cra_ctxsize		= sizeof(struct ghash_ctx),
		.cra_module		= THIS_MODULE,
	},
};
static int ghash_async_init(struct ahash_request *req)
{
	struct crypto_ahash *tfm = crypto_ahash_reqtfm(req);
	struct ghash_async_ctx *ctx = crypto_ahash_ctx(tfm);
	struct ahash_request *cryptd_req = ahash_request_ctx(req);
	struct cryptd_ahash *cryptd_tfm = ctx->cryptd_tfm;
	struct shash_desc *desc = cryptd_shash_desc(cryptd_req);
	struct crypto_shash *child = cryptd_ahash_child(cryptd_tfm);

	desc->tfm = child;
	desc->flags = req->base.flags;
	return crypto_shash_init(desc);
}
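/*
 * The update/final/digest handlers below share one pattern: when the FPU
 * is usable in the current context, the internal PCLMULQDQ shash runs
 * synchronously; otherwise (or when cryptd already has requests queued
 * while we are atomic, so ordering must be preserved) the request is
 * handed off to cryptd and processed later in process context.
 */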
static int ghash_async_update(struct ahash_request *req)
{
	struct ahash_request *cryptd_req = ahash_request_ctx(req);
	struct crypto_ahash *tfm = crypto_ahash_reqtfm(req);
	struct ghash_async_ctx *ctx = crypto_ahash_ctx(tfm);
	struct cryptd_ahash *cryptd_tfm = ctx->cryptd_tfm;

	if (!irq_fpu_usable() ||
	    (in_atomic() && cryptd_ahash_queued(cryptd_tfm))) {
		memcpy(cryptd_req, req, sizeof(*req));
		ahash_request_set_tfm(cryptd_req, &cryptd_tfm->base);
		return crypto_ahash_update(cryptd_req);
	} else {
		struct shash_desc *desc = cryptd_shash_desc(cryptd_req);
		return shash_ahash_update(req, desc);
	}
}
static int ghash_async_final(struct ahash_request *req)
{
	struct ahash_request *cryptd_req = ahash_request_ctx(req);
	struct crypto_ahash *tfm = crypto_ahash_reqtfm(req);
	struct ghash_async_ctx *ctx = crypto_ahash_ctx(tfm);
	struct cryptd_ahash *cryptd_tfm = ctx->cryptd_tfm;

	if (!irq_fpu_usable() ||
	    (in_atomic() && cryptd_ahash_queued(cryptd_tfm))) {
		memcpy(cryptd_req, req, sizeof(*req));
		ahash_request_set_tfm(cryptd_req, &cryptd_tfm->base);
		return crypto_ahash_final(cryptd_req);
	} else {
		struct shash_desc *desc = cryptd_shash_desc(cryptd_req);
		return crypto_shash_final(desc, req->result);
	}
}
static int ghash_async_import(struct ahash_request *req, const void *in)
{
	struct ahash_request *cryptd_req = ahash_request_ctx(req);
	struct shash_desc *desc = cryptd_shash_desc(cryptd_req);
	struct ghash_desc_ctx *dctx = shash_desc_ctx(desc);

	ghash_async_init(req);
	memcpy(dctx, in, sizeof(*dctx));

	return 0;
}
static int ghash_async_export(struct ahash_request *req, void *out)
{
	struct ahash_request *cryptd_req = ahash_request_ctx(req);
	struct shash_desc *desc = cryptd_shash_desc(cryptd_req);
	struct ghash_desc_ctx *dctx = shash_desc_ctx(desc);

	memcpy(out, dctx, sizeof(*dctx));

	return 0;
}
static int ghash_async_digest(struct ahash_request *req)
{
	struct crypto_ahash *tfm = crypto_ahash_reqtfm(req);
	struct ghash_async_ctx *ctx = crypto_ahash_ctx(tfm);
	struct ahash_request *cryptd_req = ahash_request_ctx(req);
	struct cryptd_ahash *cryptd_tfm = ctx->cryptd_tfm;

	if (!irq_fpu_usable() ||
	    (in_atomic() && cryptd_ahash_queued(cryptd_tfm))) {
		memcpy(cryptd_req, req, sizeof(*req));
		ahash_request_set_tfm(cryptd_req, &cryptd_tfm->base);
		return crypto_ahash_digest(cryptd_req);
	} else {
		struct shash_desc *desc = cryptd_shash_desc(cryptd_req);
		struct crypto_shash *child = cryptd_ahash_child(cryptd_tfm);

		desc->tfm = child;
		desc->flags = req->base.flags;
		return shash_ahash_digest(req, desc);
	}
}
static int ghash_async_setkey(struct crypto_ahash *tfm, const u8 *key,
			      unsigned int keylen)
{
	struct ghash_async_ctx *ctx = crypto_ahash_ctx(tfm);
	struct crypto_ahash *child = &ctx->cryptd_tfm->base;
	int err;

	crypto_ahash_clear_flags(child, CRYPTO_TFM_REQ_MASK);
	crypto_ahash_set_flags(child, crypto_ahash_get_flags(tfm)
			       & CRYPTO_TFM_REQ_MASK);
	err = crypto_ahash_setkey(child, key, keylen);
	crypto_ahash_set_flags(tfm, crypto_ahash_get_flags(child)
			       & CRYPTO_TFM_RES_MASK);

	return err;
}
static int ghash_async_init_tfm(struct crypto_tfm *tfm)
{
	struct cryptd_ahash *cryptd_tfm;
	struct ghash_async_ctx *ctx = crypto_tfm_ctx(tfm);

	cryptd_tfm = cryptd_alloc_ahash("__ghash-pclmulqdqni",
					CRYPTO_ALG_INTERNAL,
					CRYPTO_ALG_INTERNAL);
	if (IS_ERR(cryptd_tfm))
		return PTR_ERR(cryptd_tfm);
	ctx->cryptd_tfm = cryptd_tfm;
	crypto_ahash_set_reqsize(__crypto_ahash_cast(tfm),
				 sizeof(struct ahash_request) +
				 crypto_ahash_reqsize(&cryptd_tfm->base));

	return 0;
}
static void ghash_async_exit_tfm(struct crypto_tfm *tfm)
{
	struct ghash_async_ctx *ctx = crypto_tfm_ctx(tfm);

	cryptd_free_ahash(ctx->cryptd_tfm);
}
static struct ahash_alg ghash_async_alg = {
	.init		= ghash_async_init,
	.update		= ghash_async_update,
	.final		= ghash_async_final,
	.setkey		= ghash_async_setkey,
	.digest		= ghash_async_digest,
	.export		= ghash_async_export,
	.import		= ghash_async_import,
	.halg = {
		.digestsize	= GHASH_DIGEST_SIZE,
		.statesize	= sizeof(struct ghash_desc_ctx),
		.base = {
			.cra_name		= "ghash",
			.cra_driver_name	= "ghash-clmulni",
			.cra_priority		= 400,
			.cra_ctxsize		= sizeof(struct ghash_async_ctx),
			.cra_flags		= CRYPTO_ALG_ASYNC,
			.cra_blocksize		= GHASH_BLOCK_SIZE,
			.cra_module		= THIS_MODULE,
			.cra_init		= ghash_async_init_tfm,
			.cra_exit		= ghash_async_exit_tfm,
		},
	},
};
static const struct x86_cpu_id pcmul_cpu_id[] = {
	X86_FEATURE_MATCH(X86_FEATURE_PCLMULQDQ), /* Pickle-Mickle-Duck */
	{}
};
MODULE_DEVICE_TABLE(x86cpu, pcmul_cpu_id);
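/*
 * Exposing the CPU feature match via MODULE_DEVICE_TABLE() lets
 * udev/modprobe load this module automatically on CPUs that advertise
 * PCLMULQDQ.
 */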
static int __init ghash_pclmulqdqni_mod_init(void)
{
	int err;

	if (!x86_match_cpu(pcmul_cpu_id))
		return -ENODEV;

	err = crypto_register_shash(&ghash_alg);
	if (err)
		return err;

	err = crypto_register_ahash(&ghash_async_alg);
	if (err)
		crypto_unregister_shash(&ghash_alg);

	return err;
}
static void __exit ghash_pclmulqdqni_mod_exit(void)
{
	crypto_unregister_ahash(&ghash_async_alg);
	crypto_unregister_shash(&ghash_alg);
}

module_init(ghash_pclmulqdqni_mod_init);
module_exit(ghash_pclmulqdqni_mod_exit);

MODULE_LICENSE("GPL");
MODULE_DESCRIPTION("GHASH Message Digest Algorithm, "
		   "accelerated by PCLMULQDQ-NI");
MODULE_ALIAS_CRYPTO("ghash");