2 * Glue Code for AVX assembler version of Twofish Cipher
4 * Copyright (C) 2012 Johannes Goetzfried
5 * <Johannes.Goetzfried@informatik.stud.uni-erlangen.de>
7 * Copyright © 2013 Jussi Kivilinna <jussi.kivilinna@iki.fi>
9 * This program is free software; you can redistribute it and/or modify
10 * it under the terms of the GNU General Public License as published by
11 * the Free Software Foundation; either version 2 of the License, or
12 * (at your option) any later version.
14 * This program is distributed in the hope that it will be useful,
15 * but WITHOUT ANY WARRANTY; without even the implied warranty of
16 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
17 * GNU General Public License for more details.
19 * You should have received a copy of the GNU General Public License
20 * along with this program; if not, write to the Free Software
21 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307
26 #include <linux/module.h>
27 #include <linux/hardirq.h>
28 #include <linux/types.h>
29 #include <linux/crypto.h>
30 #include <linux/err.h>
31 #include <crypto/ablk_helper.h>
32 #include <crypto/algapi.h>
33 #include <crypto/twofish.h>
34 #include <crypto/cryptd.h>
35 #include <crypto/b128ops.h>
36 #include <crypto/ctr.h>
37 #include <crypto/lrw.h>
38 #include <crypto/xts.h>
39 #include <asm/fpu/api.h>
40 #include <asm/crypto/twofish.h>
41 #include <asm/crypto/glue_helper.h>
42 #include <crypto/scatterwalk.h>
43 #include <linux/workqueue.h>
44 #include <linux/spinlock.h>
46 #define TWOFISH_PARALLEL_BLOCKS 8
48 /* 8-way parallel cipher functions */
49 asmlinkage
void twofish_ecb_enc_8way(struct twofish_ctx
*ctx
, u8
*dst
,
51 asmlinkage
void twofish_ecb_dec_8way(struct twofish_ctx
*ctx
, u8
*dst
,
54 asmlinkage
void twofish_cbc_dec_8way(struct twofish_ctx
*ctx
, u8
*dst
,
56 asmlinkage
void twofish_ctr_8way(struct twofish_ctx
*ctx
, u8
*dst
,
57 const u8
*src
, le128
*iv
);
59 asmlinkage
void twofish_xts_enc_8way(struct twofish_ctx
*ctx
, u8
*dst
,
60 const u8
*src
, le128
*iv
);
61 asmlinkage
void twofish_xts_dec_8way(struct twofish_ctx
*ctx
, u8
*dst
,
62 const u8
*src
, le128
*iv
);
64 static inline void twofish_enc_blk_3way(struct twofish_ctx
*ctx
, u8
*dst
,
67 __twofish_enc_blk_3way(ctx
, dst
, src
, false);
70 static void twofish_xts_enc(void *ctx
, u128
*dst
, const u128
*src
, le128
*iv
)
72 glue_xts_crypt_128bit_one(ctx
, dst
, src
, iv
,
73 GLUE_FUNC_CAST(twofish_enc_blk
));
76 static void twofish_xts_dec(void *ctx
, u128
*dst
, const u128
*src
, le128
*iv
)
78 glue_xts_crypt_128bit_one(ctx
, dst
, src
, iv
,
79 GLUE_FUNC_CAST(twofish_dec_blk
));
83 static const struct common_glue_ctx twofish_enc
= {
85 .fpu_blocks_limit
= TWOFISH_PARALLEL_BLOCKS
,
88 .num_blocks
= TWOFISH_PARALLEL_BLOCKS
,
89 .fn_u
= { .ecb
= GLUE_FUNC_CAST(twofish_ecb_enc_8way
) }
92 .fn_u
= { .ecb
= GLUE_FUNC_CAST(twofish_enc_blk_3way
) }
95 .fn_u
= { .ecb
= GLUE_FUNC_CAST(twofish_enc_blk
) }
99 static const struct common_glue_ctx twofish_ctr
= {
101 .fpu_blocks_limit
= TWOFISH_PARALLEL_BLOCKS
,
104 .num_blocks
= TWOFISH_PARALLEL_BLOCKS
,
105 .fn_u
= { .ctr
= GLUE_CTR_FUNC_CAST(twofish_ctr_8way
) }
108 .fn_u
= { .ctr
= GLUE_CTR_FUNC_CAST(twofish_enc_blk_ctr_3way
) }
111 .fn_u
= { .ctr
= GLUE_CTR_FUNC_CAST(twofish_enc_blk_ctr
) }
115 static const struct common_glue_ctx twofish_enc_xts
= {
117 .fpu_blocks_limit
= TWOFISH_PARALLEL_BLOCKS
,
120 .num_blocks
= TWOFISH_PARALLEL_BLOCKS
,
121 .fn_u
= { .xts
= GLUE_XTS_FUNC_CAST(twofish_xts_enc_8way
) }
124 .fn_u
= { .xts
= GLUE_XTS_FUNC_CAST(twofish_xts_enc
) }
128 static const struct common_glue_ctx twofish_dec
= {
130 .fpu_blocks_limit
= TWOFISH_PARALLEL_BLOCKS
,
133 .num_blocks
= TWOFISH_PARALLEL_BLOCKS
,
134 .fn_u
= { .ecb
= GLUE_FUNC_CAST(twofish_ecb_dec_8way
) }
137 .fn_u
= { .ecb
= GLUE_FUNC_CAST(twofish_dec_blk_3way
) }
140 .fn_u
= { .ecb
= GLUE_FUNC_CAST(twofish_dec_blk
) }
144 static const struct common_glue_ctx twofish_dec_cbc
= {
146 .fpu_blocks_limit
= TWOFISH_PARALLEL_BLOCKS
,
149 .num_blocks
= TWOFISH_PARALLEL_BLOCKS
,
150 .fn_u
= { .cbc
= GLUE_CBC_FUNC_CAST(twofish_cbc_dec_8way
) }
153 .fn_u
= { .cbc
= GLUE_CBC_FUNC_CAST(twofish_dec_blk_cbc_3way
) }
156 .fn_u
= { .cbc
= GLUE_CBC_FUNC_CAST(twofish_dec_blk
) }
160 static const struct common_glue_ctx twofish_dec_xts
= {
162 .fpu_blocks_limit
= TWOFISH_PARALLEL_BLOCKS
,
165 .num_blocks
= TWOFISH_PARALLEL_BLOCKS
,
166 .fn_u
= { .xts
= GLUE_XTS_FUNC_CAST(twofish_xts_dec_8way
) }
169 .fn_u
= { .xts
= GLUE_XTS_FUNC_CAST(twofish_xts_dec
) }
173 static int ecb_encrypt(struct blkcipher_desc
*desc
, struct scatterlist
*dst
,
174 struct scatterlist
*src
, unsigned int nbytes
)
176 return glue_ecb_crypt_128bit(&twofish_enc
, desc
, dst
, src
, nbytes
);
179 static int ecb_decrypt(struct blkcipher_desc
*desc
, struct scatterlist
*dst
,
180 struct scatterlist
*src
, unsigned int nbytes
)
182 return glue_ecb_crypt_128bit(&twofish_dec
, desc
, dst
, src
, nbytes
);
185 static int cbc_encrypt(struct blkcipher_desc
*desc
, struct scatterlist
*dst
,
186 struct scatterlist
*src
, unsigned int nbytes
)
188 return glue_cbc_encrypt_128bit(GLUE_FUNC_CAST(twofish_enc_blk
), desc
,
192 static int cbc_decrypt(struct blkcipher_desc
*desc
, struct scatterlist
*dst
,
193 struct scatterlist
*src
, unsigned int nbytes
)
195 return glue_cbc_decrypt_128bit(&twofish_dec_cbc
, desc
, dst
, src
,
199 static int ctr_crypt(struct blkcipher_desc
*desc
, struct scatterlist
*dst
,
200 struct scatterlist
*src
, unsigned int nbytes
)
202 return glue_ctr_crypt_128bit(&twofish_ctr
, desc
, dst
, src
, nbytes
);
205 static inline bool twofish_fpu_begin(bool fpu_enabled
, unsigned int nbytes
)
207 return glue_fpu_begin(TF_BLOCK_SIZE
, TWOFISH_PARALLEL_BLOCKS
, NULL
,
208 fpu_enabled
, nbytes
);
211 static inline void twofish_fpu_end(bool fpu_enabled
)
213 glue_fpu_end(fpu_enabled
);
217 struct twofish_ctx
*ctx
;
221 static void encrypt_callback(void *priv
, u8
*srcdst
, unsigned int nbytes
)
223 const unsigned int bsize
= TF_BLOCK_SIZE
;
224 struct crypt_priv
*ctx
= priv
;
227 ctx
->fpu_enabled
= twofish_fpu_begin(ctx
->fpu_enabled
, nbytes
);
229 if (nbytes
== bsize
* TWOFISH_PARALLEL_BLOCKS
) {
230 twofish_ecb_enc_8way(ctx
->ctx
, srcdst
, srcdst
);
234 for (i
= 0; i
< nbytes
/ (bsize
* 3); i
++, srcdst
+= bsize
* 3)
235 twofish_enc_blk_3way(ctx
->ctx
, srcdst
, srcdst
);
239 for (i
= 0; i
< nbytes
/ bsize
; i
++, srcdst
+= bsize
)
240 twofish_enc_blk(ctx
->ctx
, srcdst
, srcdst
);
243 static void decrypt_callback(void *priv
, u8
*srcdst
, unsigned int nbytes
)
245 const unsigned int bsize
= TF_BLOCK_SIZE
;
246 struct crypt_priv
*ctx
= priv
;
249 ctx
->fpu_enabled
= twofish_fpu_begin(ctx
->fpu_enabled
, nbytes
);
251 if (nbytes
== bsize
* TWOFISH_PARALLEL_BLOCKS
) {
252 twofish_ecb_dec_8way(ctx
->ctx
, srcdst
, srcdst
);
256 for (i
= 0; i
< nbytes
/ (bsize
* 3); i
++, srcdst
+= bsize
* 3)
257 twofish_dec_blk_3way(ctx
->ctx
, srcdst
, srcdst
);
261 for (i
= 0; i
< nbytes
/ bsize
; i
++, srcdst
+= bsize
)
262 twofish_dec_blk(ctx
->ctx
, srcdst
, srcdst
);
265 static int lrw_encrypt(struct blkcipher_desc
*desc
, struct scatterlist
*dst
,
266 struct scatterlist
*src
, unsigned int nbytes
)
268 struct twofish_lrw_ctx
*ctx
= crypto_blkcipher_ctx(desc
->tfm
);
269 be128 buf
[TWOFISH_PARALLEL_BLOCKS
];
270 struct crypt_priv crypt_ctx
= {
271 .ctx
= &ctx
->twofish_ctx
,
272 .fpu_enabled
= false,
274 struct lrw_crypt_req req
= {
276 .tbuflen
= sizeof(buf
),
278 .table_ctx
= &ctx
->lrw_table
,
279 .crypt_ctx
= &crypt_ctx
,
280 .crypt_fn
= encrypt_callback
,
284 desc
->flags
&= ~CRYPTO_TFM_REQ_MAY_SLEEP
;
285 ret
= lrw_crypt(desc
, dst
, src
, nbytes
, &req
);
286 twofish_fpu_end(crypt_ctx
.fpu_enabled
);
291 static int lrw_decrypt(struct blkcipher_desc
*desc
, struct scatterlist
*dst
,
292 struct scatterlist
*src
, unsigned int nbytes
)
294 struct twofish_lrw_ctx
*ctx
= crypto_blkcipher_ctx(desc
->tfm
);
295 be128 buf
[TWOFISH_PARALLEL_BLOCKS
];
296 struct crypt_priv crypt_ctx
= {
297 .ctx
= &ctx
->twofish_ctx
,
298 .fpu_enabled
= false,
300 struct lrw_crypt_req req
= {
302 .tbuflen
= sizeof(buf
),
304 .table_ctx
= &ctx
->lrw_table
,
305 .crypt_ctx
= &crypt_ctx
,
306 .crypt_fn
= decrypt_callback
,
310 desc
->flags
&= ~CRYPTO_TFM_REQ_MAY_SLEEP
;
311 ret
= lrw_crypt(desc
, dst
, src
, nbytes
, &req
);
312 twofish_fpu_end(crypt_ctx
.fpu_enabled
);
317 static int xts_encrypt(struct blkcipher_desc
*desc
, struct scatterlist
*dst
,
318 struct scatterlist
*src
, unsigned int nbytes
)
320 struct twofish_xts_ctx
*ctx
= crypto_blkcipher_ctx(desc
->tfm
);
322 return glue_xts_crypt_128bit(&twofish_enc_xts
, desc
, dst
, src
, nbytes
,
323 XTS_TWEAK_CAST(twofish_enc_blk
),
324 &ctx
->tweak_ctx
, &ctx
->crypt_ctx
);
327 static int xts_decrypt(struct blkcipher_desc
*desc
, struct scatterlist
*dst
,
328 struct scatterlist
*src
, unsigned int nbytes
)
330 struct twofish_xts_ctx
*ctx
= crypto_blkcipher_ctx(desc
->tfm
);
332 return glue_xts_crypt_128bit(&twofish_dec_xts
, desc
, dst
, src
, nbytes
,
333 XTS_TWEAK_CAST(twofish_enc_blk
),
334 &ctx
->tweak_ctx
, &ctx
->crypt_ctx
);
337 static struct crypto_alg twofish_algs
[10] = { {
338 .cra_name
= "__ecb-twofish-avx",
339 .cra_driver_name
= "__driver-ecb-twofish-avx",
341 .cra_flags
= CRYPTO_ALG_TYPE_BLKCIPHER
|
343 .cra_blocksize
= TF_BLOCK_SIZE
,
344 .cra_ctxsize
= sizeof(struct twofish_ctx
),
346 .cra_type
= &crypto_blkcipher_type
,
347 .cra_module
= THIS_MODULE
,
350 .min_keysize
= TF_MIN_KEY_SIZE
,
351 .max_keysize
= TF_MAX_KEY_SIZE
,
352 .setkey
= twofish_setkey
,
353 .encrypt
= ecb_encrypt
,
354 .decrypt
= ecb_decrypt
,
358 .cra_name
= "__cbc-twofish-avx",
359 .cra_driver_name
= "__driver-cbc-twofish-avx",
361 .cra_flags
= CRYPTO_ALG_TYPE_BLKCIPHER
|
363 .cra_blocksize
= TF_BLOCK_SIZE
,
364 .cra_ctxsize
= sizeof(struct twofish_ctx
),
366 .cra_type
= &crypto_blkcipher_type
,
367 .cra_module
= THIS_MODULE
,
370 .min_keysize
= TF_MIN_KEY_SIZE
,
371 .max_keysize
= TF_MAX_KEY_SIZE
,
372 .setkey
= twofish_setkey
,
373 .encrypt
= cbc_encrypt
,
374 .decrypt
= cbc_decrypt
,
378 .cra_name
= "__ctr-twofish-avx",
379 .cra_driver_name
= "__driver-ctr-twofish-avx",
381 .cra_flags
= CRYPTO_ALG_TYPE_BLKCIPHER
|
384 .cra_ctxsize
= sizeof(struct twofish_ctx
),
386 .cra_type
= &crypto_blkcipher_type
,
387 .cra_module
= THIS_MODULE
,
390 .min_keysize
= TF_MIN_KEY_SIZE
,
391 .max_keysize
= TF_MAX_KEY_SIZE
,
392 .ivsize
= TF_BLOCK_SIZE
,
393 .setkey
= twofish_setkey
,
394 .encrypt
= ctr_crypt
,
395 .decrypt
= ctr_crypt
,
399 .cra_name
= "__lrw-twofish-avx",
400 .cra_driver_name
= "__driver-lrw-twofish-avx",
402 .cra_flags
= CRYPTO_ALG_TYPE_BLKCIPHER
|
404 .cra_blocksize
= TF_BLOCK_SIZE
,
405 .cra_ctxsize
= sizeof(struct twofish_lrw_ctx
),
407 .cra_type
= &crypto_blkcipher_type
,
408 .cra_module
= THIS_MODULE
,
409 .cra_exit
= lrw_twofish_exit_tfm
,
412 .min_keysize
= TF_MIN_KEY_SIZE
+
414 .max_keysize
= TF_MAX_KEY_SIZE
+
416 .ivsize
= TF_BLOCK_SIZE
,
417 .setkey
= lrw_twofish_setkey
,
418 .encrypt
= lrw_encrypt
,
419 .decrypt
= lrw_decrypt
,
423 .cra_name
= "__xts-twofish-avx",
424 .cra_driver_name
= "__driver-xts-twofish-avx",
426 .cra_flags
= CRYPTO_ALG_TYPE_BLKCIPHER
|
428 .cra_blocksize
= TF_BLOCK_SIZE
,
429 .cra_ctxsize
= sizeof(struct twofish_xts_ctx
),
431 .cra_type
= &crypto_blkcipher_type
,
432 .cra_module
= THIS_MODULE
,
435 .min_keysize
= TF_MIN_KEY_SIZE
* 2,
436 .max_keysize
= TF_MAX_KEY_SIZE
* 2,
437 .ivsize
= TF_BLOCK_SIZE
,
438 .setkey
= xts_twofish_setkey
,
439 .encrypt
= xts_encrypt
,
440 .decrypt
= xts_decrypt
,
444 .cra_name
= "ecb(twofish)",
445 .cra_driver_name
= "ecb-twofish-avx",
447 .cra_flags
= CRYPTO_ALG_TYPE_ABLKCIPHER
| CRYPTO_ALG_ASYNC
,
448 .cra_blocksize
= TF_BLOCK_SIZE
,
449 .cra_ctxsize
= sizeof(struct async_helper_ctx
),
451 .cra_type
= &crypto_ablkcipher_type
,
452 .cra_module
= THIS_MODULE
,
453 .cra_init
= ablk_init
,
454 .cra_exit
= ablk_exit
,
457 .min_keysize
= TF_MIN_KEY_SIZE
,
458 .max_keysize
= TF_MAX_KEY_SIZE
,
459 .setkey
= ablk_set_key
,
460 .encrypt
= ablk_encrypt
,
461 .decrypt
= ablk_decrypt
,
465 .cra_name
= "cbc(twofish)",
466 .cra_driver_name
= "cbc-twofish-avx",
468 .cra_flags
= CRYPTO_ALG_TYPE_ABLKCIPHER
| CRYPTO_ALG_ASYNC
,
469 .cra_blocksize
= TF_BLOCK_SIZE
,
470 .cra_ctxsize
= sizeof(struct async_helper_ctx
),
472 .cra_type
= &crypto_ablkcipher_type
,
473 .cra_module
= THIS_MODULE
,
474 .cra_init
= ablk_init
,
475 .cra_exit
= ablk_exit
,
478 .min_keysize
= TF_MIN_KEY_SIZE
,
479 .max_keysize
= TF_MAX_KEY_SIZE
,
480 .ivsize
= TF_BLOCK_SIZE
,
481 .setkey
= ablk_set_key
,
482 .encrypt
= __ablk_encrypt
,
483 .decrypt
= ablk_decrypt
,
487 .cra_name
= "ctr(twofish)",
488 .cra_driver_name
= "ctr-twofish-avx",
490 .cra_flags
= CRYPTO_ALG_TYPE_ABLKCIPHER
| CRYPTO_ALG_ASYNC
,
492 .cra_ctxsize
= sizeof(struct async_helper_ctx
),
494 .cra_type
= &crypto_ablkcipher_type
,
495 .cra_module
= THIS_MODULE
,
496 .cra_init
= ablk_init
,
497 .cra_exit
= ablk_exit
,
500 .min_keysize
= TF_MIN_KEY_SIZE
,
501 .max_keysize
= TF_MAX_KEY_SIZE
,
502 .ivsize
= TF_BLOCK_SIZE
,
503 .setkey
= ablk_set_key
,
504 .encrypt
= ablk_encrypt
,
505 .decrypt
= ablk_encrypt
,
510 .cra_name
= "lrw(twofish)",
511 .cra_driver_name
= "lrw-twofish-avx",
513 .cra_flags
= CRYPTO_ALG_TYPE_ABLKCIPHER
| CRYPTO_ALG_ASYNC
,
514 .cra_blocksize
= TF_BLOCK_SIZE
,
515 .cra_ctxsize
= sizeof(struct async_helper_ctx
),
517 .cra_type
= &crypto_ablkcipher_type
,
518 .cra_module
= THIS_MODULE
,
519 .cra_init
= ablk_init
,
520 .cra_exit
= ablk_exit
,
523 .min_keysize
= TF_MIN_KEY_SIZE
+
525 .max_keysize
= TF_MAX_KEY_SIZE
+
527 .ivsize
= TF_BLOCK_SIZE
,
528 .setkey
= ablk_set_key
,
529 .encrypt
= ablk_encrypt
,
530 .decrypt
= ablk_decrypt
,
534 .cra_name
= "xts(twofish)",
535 .cra_driver_name
= "xts-twofish-avx",
537 .cra_flags
= CRYPTO_ALG_TYPE_ABLKCIPHER
| CRYPTO_ALG_ASYNC
,
538 .cra_blocksize
= TF_BLOCK_SIZE
,
539 .cra_ctxsize
= sizeof(struct async_helper_ctx
),
541 .cra_type
= &crypto_ablkcipher_type
,
542 .cra_module
= THIS_MODULE
,
543 .cra_init
= ablk_init
,
544 .cra_exit
= ablk_exit
,
547 .min_keysize
= TF_MIN_KEY_SIZE
* 2,
548 .max_keysize
= TF_MAX_KEY_SIZE
* 2,
549 .ivsize
= TF_BLOCK_SIZE
,
550 .setkey
= ablk_set_key
,
551 .encrypt
= ablk_encrypt
,
552 .decrypt
= ablk_decrypt
,
557 static int __init
twofish_init(void)
559 const char *feature_name
;
561 if (!cpu_has_xfeatures(XFEATURE_MASK_SSE
| XFEATURE_MASK_YMM
, &feature_name
)) {
562 pr_info("CPU feature '%s' is not supported.\n", feature_name
);
566 return crypto_register_algs(twofish_algs
, ARRAY_SIZE(twofish_algs
));
569 static void __exit
twofish_exit(void)
571 crypto_unregister_algs(twofish_algs
, ARRAY_SIZE(twofish_algs
));
574 module_init(twofish_init
);
575 module_exit(twofish_exit
);
577 MODULE_DESCRIPTION("Twofish Cipher Algorithm, AVX optimized");
578 MODULE_LICENSE("GPL");
579 MODULE_ALIAS_CRYPTO("twofish");