/*
 * Support for VIA PadLock hardware crypto engine.
 *
 * Copyright (c) 2006 Michal Ludvig <michal@logix.cz>
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 */

#include <crypto/internal/hash.h>
#include <crypto/padlock.h>
#include <crypto/sha.h>
#include <linux/err.h>
#include <linux/module.h>
#include <linux/init.h>
#include <linux/errno.h>
#include <linux/interrupt.h>
#include <linux/kernel.h>
#include <linux/scatterlist.h>
#include <asm/i387.h>	/* irq_ts_save()/irq_ts_restore() */
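
/*
 * Two flavours of hardware SHA-1/SHA-256 support live in this file.  On
 * the original PadLock Hash Engine the XSHA instructions only produce a
 * finalised digest, so multi-part hashing is carried by a software
 * fallback shash and the hardware is used from finup()/final().  The
 * *_nano routines further down drive the engine on VIA Nano processors,
 * which can hash data block by block without finalising.
 */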

struct padlock_sha_desc {
	struct shash_desc fallback;
};

struct padlock_sha_ctx {
	struct crypto_shash *fallback;
};

static int padlock_sha_init(struct shash_desc *desc)
{
	struct padlock_sha_desc *dctx = shash_desc_ctx(desc);
	struct padlock_sha_ctx *ctx = crypto_shash_ctx(desc->tfm);

	dctx->fallback.tfm = ctx->fallback;
	dctx->fallback.flags = desc->flags & CRYPTO_TFM_REQ_MAY_SLEEP;
	return crypto_shash_init(&dctx->fallback);
}

static int padlock_sha_update(struct shash_desc *desc,
			      const u8 *data, unsigned int length)
{
	struct padlock_sha_desc *dctx = shash_desc_ctx(desc);

	dctx->fallback.flags = desc->flags & CRYPTO_TFM_REQ_MAY_SLEEP;
	return crypto_shash_update(&dctx->fallback, data, length);
}

static int padlock_sha_export(struct shash_desc *desc, void *out)
{
	struct padlock_sha_desc *dctx = shash_desc_ctx(desc);

	return crypto_shash_export(&dctx->fallback, out);
}

static int padlock_sha_import(struct shash_desc *desc, const void *in)
{
	struct padlock_sha_desc *dctx = shash_desc_ctx(desc);
	struct padlock_sha_ctx *ctx = crypto_shash_ctx(desc->tfm);

	dctx->fallback.tfm = ctx->fallback;
	dctx->fallback.flags = desc->flags & CRYPTO_TFM_REQ_MAY_SLEEP;
	return crypto_shash_import(&dctx->fallback, in);
}
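
/*
 * The state words are kept in native (little-endian) order; the digest
 * handed back to the caller must be big-endian, hence the byte swap of
 * each 32-bit word.
 */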
static inline void padlock_output_block(uint32_t *src,
			uint32_t *dst, size_t count)
{
	while (count--)
		*dst++ = swab32(*src++);
}

static int padlock_sha1_finup(struct shash_desc *desc, const u8 *in,
			      unsigned int count, u8 *out)
{
	/* We can't store directly to *out as it may be unaligned. */
	/* BTW Don't reduce the buffer size below 128 Bytes!
	 *     PadLock microcode needs it that big. */
	char buf[128 + PADLOCK_ALIGNMENT - STACK_ALIGN] __attribute__
		((aligned(STACK_ALIGN)));
	char *result = PTR_ALIGN(&buf[0], PADLOCK_ALIGNMENT);
	struct padlock_sha_desc *dctx = shash_desc_ctx(desc);
	struct sha1_state state;
	unsigned int space;
	unsigned int leftover;
	int ts_state;
	int err;

	dctx->fallback.flags = desc->flags & CRYPTO_TFM_REQ_MAY_SLEEP;
	err = crypto_shash_export(&dctx->fallback, &state);
	if (err)
		goto out;

	if (state.count + count > ULONG_MAX)
		return crypto_shash_finup(&dctx->fallback, in, count, out);

	leftover = ((state.count - 1) & (SHA1_BLOCK_SIZE - 1)) + 1;
	space = SHA1_BLOCK_SIZE - leftover;
	if (space) {
		if (count > space) {
			/* Complete the partial block via the fallback,
			 * then re-export the updated state. */
			err = crypto_shash_update(&dctx->fallback, in, space) ?:
			      crypto_shash_export(&dctx->fallback, &state);
			if (err)
				goto out;
			count -= space;
			in += space;
		} else {
			/* The remaining input fits in the exported block
			 * buffer; hash it from there. */
			memcpy(state.buffer + leftover, in, count);
			in = state.buffer;
			count += leftover;
			state.count &= ~(SHA1_BLOCK_SIZE - 1);
		}
	}

	memcpy(result, &state.state, SHA1_DIGEST_SIZE);

	/* prevent taking the spurious DNA fault with padlock. */
	ts_state = irq_ts_save();
	asm volatile (".byte 0xf3,0x0f,0xa6,0xc8" /* rep xsha1 */
		      : \
		      : "c"((unsigned long)state.count + count), \
			"a"((unsigned long)state.count), \
			"S"(in), "D"(result));
	irq_ts_restore(ts_state);

	padlock_output_block((uint32_t *)result, (uint32_t *)out, 5);

out:
	return err;
}

static int padlock_sha1_final(struct shash_desc *desc, u8 *out)
{
	u8 buf[4];

	return padlock_sha1_finup(desc, buf, 0, out);
}

static int padlock_sha256_finup(struct shash_desc *desc, const u8 *in,
				unsigned int count, u8 *out)
{
	/* We can't store directly to *out as it may be unaligned. */
	/* BTW Don't reduce the buffer size below 128 Bytes!
	 *     PadLock microcode needs it that big. */
	char buf[128 + PADLOCK_ALIGNMENT - STACK_ALIGN] __attribute__
		((aligned(STACK_ALIGN)));
	char *result = PTR_ALIGN(&buf[0], PADLOCK_ALIGNMENT);
	struct padlock_sha_desc *dctx = shash_desc_ctx(desc);
	struct sha256_state state;
	unsigned int space;
	unsigned int leftover;
	int ts_state;
	int err;

	dctx->fallback.flags = desc->flags & CRYPTO_TFM_REQ_MAY_SLEEP;
	err = crypto_shash_export(&dctx->fallback, &state);
	if (err)
		goto out;

	if (state.count + count > ULONG_MAX)
		return crypto_shash_finup(&dctx->fallback, in, count, out);

	leftover = ((state.count - 1) & (SHA256_BLOCK_SIZE - 1)) + 1;
	space = SHA256_BLOCK_SIZE - leftover;
	if (space) {
		if (count > space) {
			/* Complete the partial block via the fallback,
			 * then re-export the updated state. */
			err = crypto_shash_update(&dctx->fallback, in, space) ?:
			      crypto_shash_export(&dctx->fallback, &state);
			if (err)
				goto out;
			count -= space;
			in += space;
		} else {
			/* The remaining input fits in the exported block
			 * buffer; hash it from there. */
			memcpy(state.buf + leftover, in, count);
			in = state.buf;
			count += leftover;
			state.count &= ~(SHA256_BLOCK_SIZE - 1);
		}
	}

	memcpy(result, &state.state, SHA256_DIGEST_SIZE);

	/* prevent taking the spurious DNA fault with padlock. */
	ts_state = irq_ts_save();
	asm volatile (".byte 0xf3,0x0f,0xa6,0xd0" /* rep xsha256 */
		      : \
		      : "c"((unsigned long)state.count + count), \
			"a"((unsigned long)state.count), \
			"S"(in), "D"(result));
	irq_ts_restore(ts_state);

	padlock_output_block((uint32_t *)result, (uint32_t *)out, 8);

out:
	return err;
}

static int padlock_sha256_final(struct shash_desc *desc, u8 *out)
{
	u8 buf[4];

	return padlock_sha256_finup(desc, buf, 0, out);
}

static int padlock_cra_init(struct crypto_tfm *tfm)
{
	struct crypto_shash *hash = __crypto_shash_cast(tfm);
	const char *fallback_driver_name = tfm->__crt_alg->cra_name;
	struct padlock_sha_ctx *ctx = crypto_tfm_ctx(tfm);
	struct crypto_shash *fallback_tfm;
	int err = -ENOMEM;

	/* Allocate a fallback and abort if it failed. */
	fallback_tfm = crypto_alloc_shash(fallback_driver_name, 0,
					  CRYPTO_ALG_NEED_FALLBACK);
	if (IS_ERR(fallback_tfm)) {
		printk(KERN_WARNING PFX
		       "Fallback driver '%s' could not be loaded!\n",
		       fallback_driver_name);
		err = PTR_ERR(fallback_tfm);
		goto out;
	}

	ctx->fallback = fallback_tfm;
	/* The fallback's descriptor is embedded in ours. */
	hash->descsize += crypto_shash_descsize(fallback_tfm);
	return 0;

out:
	return err;
}

static void padlock_cra_exit(struct crypto_tfm *tfm)
{
	struct padlock_sha_ctx *ctx = crypto_tfm_ctx(tfm);

	crypto_free_shash(ctx->fallback);
}
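
/*
 * Algorithm descriptors for the original PadLock Hash Engine.
 * CRYPTO_ALG_NEED_FALLBACK marks these algorithms as depending on another
 * "sha1"/"sha256" implementation, which padlock_cra_init() allocates as
 * the software fallback used by the multi-part code paths above.
 */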
static struct shash_alg sha1_alg = {
	.digestsize	=	SHA1_DIGEST_SIZE,
	.init		=	padlock_sha_init,
	.update		=	padlock_sha_update,
	.finup		=	padlock_sha1_finup,
	.final		=	padlock_sha1_final,
	.export		=	padlock_sha_export,
	.import		=	padlock_sha_import,
	.descsize	=	sizeof(struct padlock_sha_desc),
	.statesize	=	sizeof(struct sha1_state),
	.base		=	{
		.cra_name		=	"sha1",
		.cra_driver_name	=	"sha1-padlock",
		.cra_priority		=	PADLOCK_CRA_PRIORITY,
		.cra_flags		=	CRYPTO_ALG_TYPE_SHASH |
						CRYPTO_ALG_NEED_FALLBACK,
		.cra_blocksize		=	SHA1_BLOCK_SIZE,
		.cra_ctxsize		=	sizeof(struct padlock_sha_ctx),
		.cra_module		=	THIS_MODULE,
		.cra_init		=	padlock_cra_init,
		.cra_exit		=	padlock_cra_exit,
	}
};

static struct shash_alg sha256_alg = {
	.digestsize	=	SHA256_DIGEST_SIZE,
	.init		=	padlock_sha_init,
	.update		=	padlock_sha_update,
	.finup		=	padlock_sha256_finup,
	.final		=	padlock_sha256_final,
	.export		=	padlock_sha_export,
	.import		=	padlock_sha_import,
	.descsize	=	sizeof(struct padlock_sha_desc),
	.statesize	=	sizeof(struct sha256_state),
	.base		=	{
		.cra_name		=	"sha256",
		.cra_driver_name	=	"sha256-padlock",
		.cra_priority		=	PADLOCK_CRA_PRIORITY,
		.cra_flags		=	CRYPTO_ALG_TYPE_SHASH |
						CRYPTO_ALG_NEED_FALLBACK,
		.cra_blocksize		=	SHA256_BLOCK_SIZE,
		.cra_ctxsize		=	sizeof(struct padlock_sha_ctx),
		.cra_module		=	THIS_MODULE,
		.cra_init		=	padlock_cra_init,
		.cra_exit		=	padlock_cra_exit,
	}
};

/*
 * Two more shash_alg instances for the hardware-implemented multi-part
 * hashing supported by the VIA Nano processor.
 */
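
/*
 * Unlike the original engine, the Nano hash unit can be fed one or more
 * 64-byte blocks at a time without finalising, so these routines buffer
 * partial blocks themselves and need no software fallback.
 */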

static int padlock_sha1_init_nano(struct shash_desc *desc)
{
	struct sha1_state *sctx = shash_desc_ctx(desc);

	*sctx = (struct sha1_state){
		.state = { SHA1_H0, SHA1_H1, SHA1_H2, SHA1_H3, SHA1_H4 },
	};

	return 0;
}

static int padlock_sha1_update_nano(struct shash_desc *desc,
			const u8 *data, unsigned int len)
{
	struct sha1_state *sctx = shash_desc_ctx(desc);
	unsigned int partial, done;
	const u8 *src;
	/* The PHE requires the output buffer to be 128 bytes and 16-byte aligned */
	u8 buf[128 + PADLOCK_ALIGNMENT - STACK_ALIGN] __attribute__
		((aligned(STACK_ALIGN)));
	u8 *dst = PTR_ALIGN(&buf[0], PADLOCK_ALIGNMENT);
	int ts_state;

	partial = sctx->count & 0x3f;
	sctx->count += len;
	done = 0;
	src = data;
	memcpy(dst, (u8 *)(sctx->state), SHA1_DIGEST_SIZE);

	if ((partial + len) >= SHA1_BLOCK_SIZE) {

		/* Append the bytes in state's buffer to a block to handle */
		if (partial) {
			done = -partial;
			memcpy(sctx->buffer + partial, data,
				done + SHA1_BLOCK_SIZE);
			src = sctx->buffer;
			ts_state = irq_ts_save();
			asm volatile (".byte 0xf3,0x0f,0xa6,0xc8"
			: "+S"(src), "+D"(dst) \
			: "a"((long)-1), "c"((unsigned long)1));
			irq_ts_restore(ts_state);
			done += SHA1_BLOCK_SIZE;
			src = data + done;
		}

		/* Process the remaining bytes from the input data */
		if (len - done >= SHA1_BLOCK_SIZE) {
			ts_state = irq_ts_save();
			asm volatile (".byte 0xf3,0x0f,0xa6,0xc8"
			: "+S"(src), "+D"(dst)
			: "a"((long)-1),
			"c"((unsigned long)((len - done) / SHA1_BLOCK_SIZE)));
			irq_ts_restore(ts_state);
			done += ((len - done) - (len - done) % SHA1_BLOCK_SIZE);
			src = data + done;
		}
		partial = 0;
	}
	memcpy((u8 *)(sctx->state), dst, SHA1_DIGEST_SIZE);
	memcpy(sctx->buffer + partial, src, len - done);

	return 0;
}

static int padlock_sha1_final_nano(struct shash_desc *desc, u8 *out)
{
	struct sha1_state *state = (struct sha1_state *)shash_desc_ctx(desc);
	unsigned int partial, padlen;
	__be64 bits;
	static const u8 padding[64] = { 0x80, };

	bits = cpu_to_be64(state->count << 3);

	/* Pad out to 56 mod 64 */
	partial = state->count & 0x3f;
	padlen = (partial < 56) ? (56 - partial) : ((64 + 56) - partial);
	padlock_sha1_update_nano(desc, padding, padlen);

	/* Append length field bytes */
	padlock_sha1_update_nano(desc, (const u8 *)&bits, sizeof(bits));

	/* Swap to output */
	padlock_output_block((uint32_t *)(state->state), (uint32_t *)out, 5);

	return 0;
}

static int padlock_sha256_init_nano(struct shash_desc *desc)
{
	struct sha256_state *sctx = shash_desc_ctx(desc);

	*sctx = (struct sha256_state){
		.state = { SHA256_H0, SHA256_H1, SHA256_H2, SHA256_H3,
			   SHA256_H4, SHA256_H5, SHA256_H6, SHA256_H7 },
	};

	return 0;
}

static int padlock_sha256_update_nano(struct shash_desc *desc, const u8 *data,
			  unsigned int len)
{
	struct sha256_state *sctx = shash_desc_ctx(desc);
	unsigned int partial, done;
	const u8 *src;
	/* The PHE requires the output buffer to be 128 bytes and 16-byte aligned */
	u8 buf[128 + PADLOCK_ALIGNMENT - STACK_ALIGN] __attribute__
		((aligned(STACK_ALIGN)));
	u8 *dst = PTR_ALIGN(&buf[0], PADLOCK_ALIGNMENT);
	int ts_state;

	partial = sctx->count & 0x3f;
	sctx->count += len;
	done = 0;
	src = data;
	memcpy(dst, (u8 *)(sctx->state), SHA256_DIGEST_SIZE);

	if ((partial + len) >= SHA256_BLOCK_SIZE) {

		/* Append the bytes in state's buffer to a block to handle */
		if (partial) {
			done = -partial;
			memcpy(sctx->buf + partial, data,
				done + SHA256_BLOCK_SIZE);
			src = sctx->buf;
			ts_state = irq_ts_save();
			asm volatile (".byte 0xf3,0x0f,0xa6,0xd0"
			: "+S"(src), "+D"(dst)
			: "a"((long)-1), "c"((unsigned long)1));
			irq_ts_restore(ts_state);
			done += SHA256_BLOCK_SIZE;
			src = data + done;
		}

		/* Process the remaining bytes from the input data */
		if (len - done >= SHA256_BLOCK_SIZE) {
			ts_state = irq_ts_save();
			asm volatile (".byte 0xf3,0x0f,0xa6,0xd0"
			: "+S"(src), "+D"(dst)
			: "a"((long)-1),
			"c"((unsigned long)((len - done) / 64)));
			irq_ts_restore(ts_state);
			done += ((len - done) - (len - done) % 64);
			src = data + done;
		}
		partial = 0;
	}
	memcpy((u8 *)(sctx->state), dst, SHA256_DIGEST_SIZE);
	memcpy(sctx->buf + partial, src, len - done);

	return 0;
}

static int padlock_sha256_final_nano(struct shash_desc *desc, u8 *out)
{
	struct sha256_state *state =
		(struct sha256_state *)shash_desc_ctx(desc);
	unsigned int partial, padlen;
	__be64 bits;
	static const u8 padding[64] = { 0x80, };

	bits = cpu_to_be64(state->count << 3);

	/* Pad out to 56 mod 64 */
	partial = state->count & 0x3f;
	padlen = (partial < 56) ? (56 - partial) : ((64 + 56) - partial);
	padlock_sha256_update_nano(desc, padding, padlen);

	/* Append length field bytes */
	padlock_sha256_update_nano(desc, (const u8 *)&bits, sizeof(bits));

	/* Swap to output */
	padlock_output_block((uint32_t *)(state->state), (uint32_t *)out, 8);

	return 0;
}

static int padlock_sha_export_nano(struct shash_desc *desc,
				void *out)
{
	int statesize = crypto_shash_statesize(desc->tfm);
	void *sctx = shash_desc_ctx(desc);

	memcpy(out, sctx, statesize);
	return 0;
}

static int padlock_sha_import_nano(struct shash_desc *desc,
				const void *in)
{
	int statesize = crypto_shash_statesize(desc->tfm);
	void *sctx = shash_desc_ctx(desc);

	memcpy(sctx, in, statesize);
	return 0;
}

static struct shash_alg sha1_alg_nano = {
	.digestsize	=	SHA1_DIGEST_SIZE,
	.init		=	padlock_sha1_init_nano,
	.update		=	padlock_sha1_update_nano,
	.final		=	padlock_sha1_final_nano,
	.export		=	padlock_sha_export_nano,
	.import		=	padlock_sha_import_nano,
	.descsize	=	sizeof(struct sha1_state),
	.statesize	=	sizeof(struct sha1_state),
	.base		=	{
		.cra_name		=	"sha1",
		.cra_driver_name	=	"sha1-padlock-nano",
		.cra_priority		=	PADLOCK_CRA_PRIORITY,
		.cra_flags		=	CRYPTO_ALG_TYPE_SHASH,
		.cra_blocksize		=	SHA1_BLOCK_SIZE,
		.cra_module		=	THIS_MODULE,
	}
};

static struct shash_alg sha256_alg_nano = {
	.digestsize	=	SHA256_DIGEST_SIZE,
	.init		=	padlock_sha256_init_nano,
	.update		=	padlock_sha256_update_nano,
	.final		=	padlock_sha256_final_nano,
	.export		=	padlock_sha_export_nano,
	.import		=	padlock_sha_import_nano,
	.descsize	=	sizeof(struct sha256_state),
	.statesize	=	sizeof(struct sha256_state),
	.base		=	{
		.cra_name		=	"sha256",
		.cra_driver_name	=	"sha256-padlock-nano",
		.cra_priority		=	PADLOCK_CRA_PRIORITY,
		.cra_flags		=	CRYPTO_ALG_TYPE_SHASH,
		.cra_blocksize		=	SHA256_BLOCK_SIZE,
		.cra_module		=	THIS_MODULE,
	}
};
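
/*
 * The driver treats x86_model >= 0x0f as a VIA Nano core and registers
 * the multi-part capable algorithms for it; earlier PadLock-capable CPUs
 * (such as the C7) get the fallback-based ones.
 */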
static int __init padlock_init(void)
{
	int rc = -ENODEV;
	struct cpuinfo_x86 *c = &cpu_data(0);
	struct shash_alg *sha1;
	struct shash_alg *sha256;

	if (!cpu_has_phe) {
		printk(KERN_NOTICE PFX "VIA PadLock Hash Engine not detected.\n");
		return -ENODEV;
	}

	if (!cpu_has_phe_enabled) {
		printk(KERN_NOTICE PFX "VIA PadLock detected, but not enabled. Hmm, strange...\n");
		return -ENODEV;
	}

	/* Register the newly added algorithms if on a VIA Nano processor,
	 * or else just do as before. */
	if (c->x86_model < 0x0f) {
		sha1 = &sha1_alg;
		sha256 = &sha256_alg;
	} else {
		sha1 = &sha1_alg_nano;
		sha256 = &sha256_alg_nano;
	}

	rc = crypto_register_shash(sha1);
	if (rc)
		goto out;

	rc = crypto_register_shash(sha256);
	if (rc)
		goto out_unreg1;

	printk(KERN_NOTICE PFX "Using VIA PadLock ACE for SHA1/SHA256 algorithms.\n");

	return 0;

out_unreg1:
	crypto_unregister_shash(sha1);
out:
	printk(KERN_ERR PFX "VIA PadLock SHA1/SHA256 initialization failed.\n");
	return rc;
}

static void __exit padlock_fini(void)
{
	struct cpuinfo_x86 *c = &cpu_data(0);

	if (c->x86_model >= 0x0f) {
		crypto_unregister_shash(&sha1_alg_nano);
		crypto_unregister_shash(&sha256_alg_nano);
	} else {
		crypto_unregister_shash(&sha1_alg);
		crypto_unregister_shash(&sha256_alg);
	}
}

module_init(padlock_init);
module_exit(padlock_fini);

MODULE_DESCRIPTION("VIA PadLock SHA1/SHA256 algorithms support.");
MODULE_LICENSE("GPL");
MODULE_AUTHOR("Michal Ludvig");

MODULE_ALIAS("sha1-all");
MODULE_ALIAS("sha256-all");
MODULE_ALIAS("sha1-padlock");
MODULE_ALIAS("sha256-padlock");