/*
 * Support for VIA PadLock hardware crypto engine.
 *
 * Copyright (c) 2006 Michal Ludvig <michal@logix.cz>
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 */
15 #include <crypto/internal/hash.h>
16 #include <crypto/padlock.h>
17 #include <crypto/sha.h>
18 #include <linux/err.h>
19 #include <linux/module.h>
20 #include <linux/init.h>
21 #include <linux/errno.h>
22 #include <linux/interrupt.h>
23 #include <linux/kernel.h>
24 #include <linux/scatterlist.h>
25 #include <asm/cpu_device_id.h>
26 #include <asm/fpu/api.h>
28 struct padlock_sha_desc
{
29 struct shash_desc fallback
;
/*
 * Transform context of the fallback-backed algorithms.  The fallback is
 * allocated in padlock_cra_init() and released in padlock_cra_exit().
 */
struct padlock_sha_ctx {
	struct crypto_shash *fallback;	/* software hash doing the bulk work */
};
36 static int padlock_sha_init(struct shash_desc
*desc
)
38 struct padlock_sha_desc
*dctx
= shash_desc_ctx(desc
);
39 struct padlock_sha_ctx
*ctx
= crypto_shash_ctx(desc
->tfm
);
41 dctx
->fallback
.tfm
= ctx
->fallback
;
42 dctx
->fallback
.flags
= desc
->flags
& CRYPTO_TFM_REQ_MAY_SLEEP
;
43 return crypto_shash_init(&dctx
->fallback
);
46 static int padlock_sha_update(struct shash_desc
*desc
,
47 const u8
*data
, unsigned int length
)
49 struct padlock_sha_desc
*dctx
= shash_desc_ctx(desc
);
51 dctx
->fallback
.flags
= desc
->flags
& CRYPTO_TFM_REQ_MAY_SLEEP
;
52 return crypto_shash_update(&dctx
->fallback
, data
, length
);
55 static int padlock_sha_export(struct shash_desc
*desc
, void *out
)
57 struct padlock_sha_desc
*dctx
= shash_desc_ctx(desc
);
59 return crypto_shash_export(&dctx
->fallback
, out
);
62 static int padlock_sha_import(struct shash_desc
*desc
, const void *in
)
64 struct padlock_sha_desc
*dctx
= shash_desc_ctx(desc
);
65 struct padlock_sha_ctx
*ctx
= crypto_shash_ctx(desc
->tfm
);
67 dctx
->fallback
.tfm
= ctx
->fallback
;
68 dctx
->fallback
.flags
= desc
->flags
& CRYPTO_TFM_REQ_MAY_SLEEP
;
69 return crypto_shash_import(&dctx
->fallback
, in
);
/*
 * Copy @count 32-bit words from @src to @dst, byte-swapping every word with
 * swab32() on the way.
 *
 * @src:   words to convert (only read).
 * @dst:   destination for the converted words.
 * @count: number of 32-bit words to convert.
 *
 * NOTE(review): callers pass a cast u8 pointer as @dst, and the comments in
 * the finup functions say that buffer may be unaligned - confirm unaligned
 * 32-bit stores are acceptable on every CPU this driver runs on.
 */
static inline void padlock_output_block(const uint32_t *src,
					uint32_t *dst, size_t count)
{
	size_t i;

	for (i = 0; i < count; i++)
		dst[i] = swab32(src[i]);
}
79 static int padlock_sha1_finup(struct shash_desc
*desc
, const u8
*in
,
80 unsigned int count
, u8
*out
)
82 /* We can't store directly to *out as it may be unaligned. */
83 /* BTW Don't reduce the buffer size below 128 Bytes!
84 * PadLock microcode needs it that big. */
85 char buf
[128 + PADLOCK_ALIGNMENT
- STACK_ALIGN
] __attribute__
86 ((aligned(STACK_ALIGN
)));
87 char *result
= PTR_ALIGN(&buf
[0], PADLOCK_ALIGNMENT
);
88 struct padlock_sha_desc
*dctx
= shash_desc_ctx(desc
);
89 struct sha1_state state
;
91 unsigned int leftover
;
94 dctx
->fallback
.flags
= desc
->flags
& CRYPTO_TFM_REQ_MAY_SLEEP
;
95 err
= crypto_shash_export(&dctx
->fallback
, &state
);
99 if (state
.count
+ count
> ULONG_MAX
)
100 return crypto_shash_finup(&dctx
->fallback
, in
, count
, out
);
102 leftover
= ((state
.count
- 1) & (SHA1_BLOCK_SIZE
- 1)) + 1;
103 space
= SHA1_BLOCK_SIZE
- leftover
;
106 err
= crypto_shash_update(&dctx
->fallback
, in
, space
) ?:
107 crypto_shash_export(&dctx
->fallback
, &state
);
113 memcpy(state
.buffer
+ leftover
, in
, count
);
116 state
.count
&= ~(SHA1_BLOCK_SIZE
- 1);
120 memcpy(result
, &state
.state
, SHA1_DIGEST_SIZE
);
122 asm volatile (".byte 0xf3,0x0f,0xa6,0xc8" /* rep xsha1 */
124 : "c"((unsigned long)state
.count
+ count
), \
125 "a"((unsigned long)state
.count
), \
126 "S"(in
), "D"(result
));
128 padlock_output_block((uint32_t *)result
, (uint32_t *)out
, 5);
134 static int padlock_sha1_final(struct shash_desc
*desc
, u8
*out
)
138 return padlock_sha1_finup(desc
, buf
, 0, out
);
141 static int padlock_sha256_finup(struct shash_desc
*desc
, const u8
*in
,
142 unsigned int count
, u8
*out
)
144 /* We can't store directly to *out as it may be unaligned. */
145 /* BTW Don't reduce the buffer size below 128 Bytes!
146 * PadLock microcode needs it that big. */
147 char buf
[128 + PADLOCK_ALIGNMENT
- STACK_ALIGN
] __attribute__
148 ((aligned(STACK_ALIGN
)));
149 char *result
= PTR_ALIGN(&buf
[0], PADLOCK_ALIGNMENT
);
150 struct padlock_sha_desc
*dctx
= shash_desc_ctx(desc
);
151 struct sha256_state state
;
153 unsigned int leftover
;
156 dctx
->fallback
.flags
= desc
->flags
& CRYPTO_TFM_REQ_MAY_SLEEP
;
157 err
= crypto_shash_export(&dctx
->fallback
, &state
);
161 if (state
.count
+ count
> ULONG_MAX
)
162 return crypto_shash_finup(&dctx
->fallback
, in
, count
, out
);
164 leftover
= ((state
.count
- 1) & (SHA256_BLOCK_SIZE
- 1)) + 1;
165 space
= SHA256_BLOCK_SIZE
- leftover
;
168 err
= crypto_shash_update(&dctx
->fallback
, in
, space
) ?:
169 crypto_shash_export(&dctx
->fallback
, &state
);
175 memcpy(state
.buf
+ leftover
, in
, count
);
178 state
.count
&= ~(SHA1_BLOCK_SIZE
- 1);
182 memcpy(result
, &state
.state
, SHA256_DIGEST_SIZE
);
184 asm volatile (".byte 0xf3,0x0f,0xa6,0xd0" /* rep xsha256 */
186 : "c"((unsigned long)state
.count
+ count
), \
187 "a"((unsigned long)state
.count
), \
188 "S"(in
), "D"(result
));
190 padlock_output_block((uint32_t *)result
, (uint32_t *)out
, 8);
196 static int padlock_sha256_final(struct shash_desc
*desc
, u8
*out
)
200 return padlock_sha256_finup(desc
, buf
, 0, out
);
203 static int padlock_cra_init(struct crypto_tfm
*tfm
)
205 struct crypto_shash
*hash
= __crypto_shash_cast(tfm
);
206 const char *fallback_driver_name
= crypto_tfm_alg_name(tfm
);
207 struct padlock_sha_ctx
*ctx
= crypto_tfm_ctx(tfm
);
208 struct crypto_shash
*fallback_tfm
;
211 /* Allocate a fallback and abort if it failed. */
212 fallback_tfm
= crypto_alloc_shash(fallback_driver_name
, 0,
213 CRYPTO_ALG_NEED_FALLBACK
);
214 if (IS_ERR(fallback_tfm
)) {
215 printk(KERN_WARNING PFX
"Fallback driver '%s' could not be loaded!\n",
216 fallback_driver_name
);
217 err
= PTR_ERR(fallback_tfm
);
221 ctx
->fallback
= fallback_tfm
;
222 hash
->descsize
+= crypto_shash_descsize(fallback_tfm
);
229 static void padlock_cra_exit(struct crypto_tfm
*tfm
)
231 struct padlock_sha_ctx
*ctx
= crypto_tfm_ctx(tfm
);
233 crypto_free_shash(ctx
->fallback
);
236 static struct shash_alg sha1_alg
= {
237 .digestsize
= SHA1_DIGEST_SIZE
,
238 .init
= padlock_sha_init
,
239 .update
= padlock_sha_update
,
240 .finup
= padlock_sha1_finup
,
241 .final
= padlock_sha1_final
,
242 .export
= padlock_sha_export
,
243 .import
= padlock_sha_import
,
244 .descsize
= sizeof(struct padlock_sha_desc
),
245 .statesize
= sizeof(struct sha1_state
),
248 .cra_driver_name
= "sha1-padlock",
249 .cra_priority
= PADLOCK_CRA_PRIORITY
,
250 .cra_flags
= CRYPTO_ALG_NEED_FALLBACK
,
251 .cra_blocksize
= SHA1_BLOCK_SIZE
,
252 .cra_ctxsize
= sizeof(struct padlock_sha_ctx
),
253 .cra_module
= THIS_MODULE
,
254 .cra_init
= padlock_cra_init
,
255 .cra_exit
= padlock_cra_exit
,
259 static struct shash_alg sha256_alg
= {
260 .digestsize
= SHA256_DIGEST_SIZE
,
261 .init
= padlock_sha_init
,
262 .update
= padlock_sha_update
,
263 .finup
= padlock_sha256_finup
,
264 .final
= padlock_sha256_final
,
265 .export
= padlock_sha_export
,
266 .import
= padlock_sha_import
,
267 .descsize
= sizeof(struct padlock_sha_desc
),
268 .statesize
= sizeof(struct sha256_state
),
270 .cra_name
= "sha256",
271 .cra_driver_name
= "sha256-padlock",
272 .cra_priority
= PADLOCK_CRA_PRIORITY
,
273 .cra_flags
= CRYPTO_ALG_NEED_FALLBACK
,
274 .cra_blocksize
= SHA256_BLOCK_SIZE
,
275 .cra_ctxsize
= sizeof(struct padlock_sha_ctx
),
276 .cra_module
= THIS_MODULE
,
277 .cra_init
= padlock_cra_init
,
278 .cra_exit
= padlock_cra_exit
,
/*
 * Two additional shash_alg instances for the hardware-implemented
 * multi-part hashing supported by the VIA Nano processor.
 */
284 static int padlock_sha1_init_nano(struct shash_desc
*desc
)
286 struct sha1_state
*sctx
= shash_desc_ctx(desc
);
288 *sctx
= (struct sha1_state
){
289 .state
= { SHA1_H0
, SHA1_H1
, SHA1_H2
, SHA1_H3
, SHA1_H4
},
295 static int padlock_sha1_update_nano(struct shash_desc
*desc
,
296 const u8
*data
, unsigned int len
)
298 struct sha1_state
*sctx
= shash_desc_ctx(desc
);
299 unsigned int partial
, done
;
301 /*The PHE require the out buffer must 128 bytes and 16-bytes aligned*/
302 u8 buf
[128 + PADLOCK_ALIGNMENT
- STACK_ALIGN
] __attribute__
303 ((aligned(STACK_ALIGN
)));
304 u8
*dst
= PTR_ALIGN(&buf
[0], PADLOCK_ALIGNMENT
);
306 partial
= sctx
->count
& 0x3f;
310 memcpy(dst
, (u8
*)(sctx
->state
), SHA1_DIGEST_SIZE
);
312 if ((partial
+ len
) >= SHA1_BLOCK_SIZE
) {
314 /* Append the bytes in state's buffer to a block to handle */
317 memcpy(sctx
->buffer
+ partial
, data
,
318 done
+ SHA1_BLOCK_SIZE
);
320 asm volatile (".byte 0xf3,0x0f,0xa6,0xc8"
321 : "+S"(src
), "+D"(dst
) \
322 : "a"((long)-1), "c"((unsigned long)1));
323 done
+= SHA1_BLOCK_SIZE
;
327 /* Process the left bytes from the input data */
328 if (len
- done
>= SHA1_BLOCK_SIZE
) {
329 asm volatile (".byte 0xf3,0x0f,0xa6,0xc8"
330 : "+S"(src
), "+D"(dst
)
332 "c"((unsigned long)((len
- done
) / SHA1_BLOCK_SIZE
)));
333 done
+= ((len
- done
) - (len
- done
) % SHA1_BLOCK_SIZE
);
338 memcpy((u8
*)(sctx
->state
), dst
, SHA1_DIGEST_SIZE
);
339 memcpy(sctx
->buffer
+ partial
, src
, len
- done
);
344 static int padlock_sha1_final_nano(struct shash_desc
*desc
, u8
*out
)
346 struct sha1_state
*state
= (struct sha1_state
*)shash_desc_ctx(desc
);
347 unsigned int partial
, padlen
;
349 static const u8 padding
[64] = { 0x80, };
351 bits
= cpu_to_be64(state
->count
<< 3);
353 /* Pad out to 56 mod 64 */
354 partial
= state
->count
& 0x3f;
355 padlen
= (partial
< 56) ? (56 - partial
) : ((64+56) - partial
);
356 padlock_sha1_update_nano(desc
, padding
, padlen
);
358 /* Append length field bytes */
359 padlock_sha1_update_nano(desc
, (const u8
*)&bits
, sizeof(bits
));
362 padlock_output_block((uint32_t *)(state
->state
), (uint32_t *)out
, 5);
367 static int padlock_sha256_init_nano(struct shash_desc
*desc
)
369 struct sha256_state
*sctx
= shash_desc_ctx(desc
);
371 *sctx
= (struct sha256_state
){
372 .state
= { SHA256_H0
, SHA256_H1
, SHA256_H2
, SHA256_H3
, \
373 SHA256_H4
, SHA256_H5
, SHA256_H6
, SHA256_H7
},
379 static int padlock_sha256_update_nano(struct shash_desc
*desc
, const u8
*data
,
382 struct sha256_state
*sctx
= shash_desc_ctx(desc
);
383 unsigned int partial
, done
;
385 /*The PHE require the out buffer must 128 bytes and 16-bytes aligned*/
386 u8 buf
[128 + PADLOCK_ALIGNMENT
- STACK_ALIGN
] __attribute__
387 ((aligned(STACK_ALIGN
)));
388 u8
*dst
= PTR_ALIGN(&buf
[0], PADLOCK_ALIGNMENT
);
390 partial
= sctx
->count
& 0x3f;
394 memcpy(dst
, (u8
*)(sctx
->state
), SHA256_DIGEST_SIZE
);
396 if ((partial
+ len
) >= SHA256_BLOCK_SIZE
) {
398 /* Append the bytes in state's buffer to a block to handle */
401 memcpy(sctx
->buf
+ partial
, data
,
402 done
+ SHA256_BLOCK_SIZE
);
404 asm volatile (".byte 0xf3,0x0f,0xa6,0xd0"
405 : "+S"(src
), "+D"(dst
)
406 : "a"((long)-1), "c"((unsigned long)1));
407 done
+= SHA256_BLOCK_SIZE
;
411 /* Process the left bytes from input data*/
412 if (len
- done
>= SHA256_BLOCK_SIZE
) {
413 asm volatile (".byte 0xf3,0x0f,0xa6,0xd0"
414 : "+S"(src
), "+D"(dst
)
416 "c"((unsigned long)((len
- done
) / 64)));
417 done
+= ((len
- done
) - (len
- done
) % 64);
422 memcpy((u8
*)(sctx
->state
), dst
, SHA256_DIGEST_SIZE
);
423 memcpy(sctx
->buf
+ partial
, src
, len
- done
);
428 static int padlock_sha256_final_nano(struct shash_desc
*desc
, u8
*out
)
430 struct sha256_state
*state
=
431 (struct sha256_state
*)shash_desc_ctx(desc
);
432 unsigned int partial
, padlen
;
434 static const u8 padding
[64] = { 0x80, };
436 bits
= cpu_to_be64(state
->count
<< 3);
438 /* Pad out to 56 mod 64 */
439 partial
= state
->count
& 0x3f;
440 padlen
= (partial
< 56) ? (56 - partial
) : ((64+56) - partial
);
441 padlock_sha256_update_nano(desc
, padding
, padlen
);
443 /* Append length field bytes */
444 padlock_sha256_update_nano(desc
, (const u8
*)&bits
, sizeof(bits
));
447 padlock_output_block((uint32_t *)(state
->state
), (uint32_t *)out
, 8);
452 static int padlock_sha_export_nano(struct shash_desc
*desc
,
455 int statesize
= crypto_shash_statesize(desc
->tfm
);
456 void *sctx
= shash_desc_ctx(desc
);
458 memcpy(out
, sctx
, statesize
);
462 static int padlock_sha_import_nano(struct shash_desc
*desc
,
465 int statesize
= crypto_shash_statesize(desc
->tfm
);
466 void *sctx
= shash_desc_ctx(desc
);
468 memcpy(sctx
, in
, statesize
);
472 static struct shash_alg sha1_alg_nano
= {
473 .digestsize
= SHA1_DIGEST_SIZE
,
474 .init
= padlock_sha1_init_nano
,
475 .update
= padlock_sha1_update_nano
,
476 .final
= padlock_sha1_final_nano
,
477 .export
= padlock_sha_export_nano
,
478 .import
= padlock_sha_import_nano
,
479 .descsize
= sizeof(struct sha1_state
),
480 .statesize
= sizeof(struct sha1_state
),
483 .cra_driver_name
= "sha1-padlock-nano",
484 .cra_priority
= PADLOCK_CRA_PRIORITY
,
485 .cra_blocksize
= SHA1_BLOCK_SIZE
,
486 .cra_module
= THIS_MODULE
,
490 static struct shash_alg sha256_alg_nano
= {
491 .digestsize
= SHA256_DIGEST_SIZE
,
492 .init
= padlock_sha256_init_nano
,
493 .update
= padlock_sha256_update_nano
,
494 .final
= padlock_sha256_final_nano
,
495 .export
= padlock_sha_export_nano
,
496 .import
= padlock_sha_import_nano
,
497 .descsize
= sizeof(struct sha256_state
),
498 .statesize
= sizeof(struct sha256_state
),
500 .cra_name
= "sha256",
501 .cra_driver_name
= "sha256-padlock-nano",
502 .cra_priority
= PADLOCK_CRA_PRIORITY
,
503 .cra_blocksize
= SHA256_BLOCK_SIZE
,
504 .cra_module
= THIS_MODULE
,
508 static const struct x86_cpu_id padlock_sha_ids
[] = {
509 X86_FEATURE_MATCH(X86_FEATURE_PHE
),
512 MODULE_DEVICE_TABLE(x86cpu
, padlock_sha_ids
);
514 static int __init
padlock_init(void)
517 struct cpuinfo_x86
*c
= &cpu_data(0);
518 struct shash_alg
*sha1
;
519 struct shash_alg
*sha256
;
521 if (!x86_match_cpu(padlock_sha_ids
) || !boot_cpu_has(X86_FEATURE_PHE_EN
))
524 /* Register the newly added algorithm module if on *
525 * VIA Nano processor, or else just do as before */
526 if (c
->x86_model
< 0x0f) {
528 sha256
= &sha256_alg
;
530 sha1
= &sha1_alg_nano
;
531 sha256
= &sha256_alg_nano
;
534 rc
= crypto_register_shash(sha1
);
538 rc
= crypto_register_shash(sha256
);
542 printk(KERN_NOTICE PFX
"Using VIA PadLock ACE for SHA1/SHA256 algorithms.\n");
547 crypto_unregister_shash(sha1
);
550 printk(KERN_ERR PFX
"VIA PadLock SHA1/SHA256 initialization failed.\n");
554 static void __exit
padlock_fini(void)
556 struct cpuinfo_x86
*c
= &cpu_data(0);
558 if (c
->x86_model
>= 0x0f) {
559 crypto_unregister_shash(&sha1_alg_nano
);
560 crypto_unregister_shash(&sha256_alg_nano
);
562 crypto_unregister_shash(&sha1_alg
);
563 crypto_unregister_shash(&sha256_alg
);
567 module_init(padlock_init
);
568 module_exit(padlock_fini
);
570 MODULE_DESCRIPTION("VIA PadLock SHA1/SHA256 algorithms support.");
571 MODULE_LICENSE("GPL");
572 MODULE_AUTHOR("Michal Ludvig");
574 MODULE_ALIAS_CRYPTO("sha1-all");
575 MODULE_ALIAS_CRYPTO("sha256-all");
576 MODULE_ALIAS_CRYPTO("sha1-padlock");
577 MODULE_ALIAS_CRYPTO("sha256-padlock");