// SPDX-License-Identifier: GPL-2.0-or-later
/*
 * Glue Code for x86_64/AVX2/AES-NI assembler optimized version of Camellia
 *
 * Copyright © 2013 Jussi Kivilinna <jussi.kivilinna@mbnet.fi>
 */

844893bc2SEric Biggers #include <crypto/algapi.h>
944893bc2SEric Biggers #include <crypto/internal/simd.h>
1044893bc2SEric Biggers #include <linux/crypto.h>
1144893bc2SEric Biggers #include <linux/err.h>
1244893bc2SEric Biggers #include <linux/module.h>
1344893bc2SEric Biggers #include <linux/types.h>
14f3f935a7SJussi Kivilinna 
15*a04ea6f7SArd Biesheuvel #include "camellia.h"
16407d409aSArd Biesheuvel #include "ecb_cbc_helpers.h"
17407d409aSArd Biesheuvel 
/*
 * Block counts paired with the wide routines in this file: the *_16way
 * functions are invoked with CAMELLIA_AESNI_PARALLEL_BLOCKS and the *_32way
 * functions with CAMELLIA_AESNI_AVX2_PARALLEL_BLOCKS.
 */
#define CAMELLIA_AESNI_PARALLEL_BLOCKS 16
#define CAMELLIA_AESNI_AVX2_PARALLEL_BLOCKS 32

21f3f935a7SJussi Kivilinna /* 32-way AVX2/AES-NI parallel cipher functions */
229c1e8836SKees Cook asmlinkage void camellia_ecb_enc_32way(const void *ctx, u8 *dst, const u8 *src);
239c1e8836SKees Cook asmlinkage void camellia_ecb_dec_32way(const void *ctx, u8 *dst, const u8 *src);
24f3f935a7SJussi Kivilinna 
259c1e8836SKees Cook asmlinkage void camellia_cbc_dec_32way(const void *ctx, u8 *dst, const u8 *src);
26f3f935a7SJussi Kivilinna 
/*
 * ->setkey() handler shared by both algorithms in camellia_algs[].
 *
 * Forwards @key/@keylen to __camellia_setkey() together with the transform's
 * context (crypto_skcipher_ctx(tfm)) and returns its result unchanged.
 */
static int camellia_setkey(struct crypto_skcipher *tfm, const u8 *key,
			   unsigned int keylen)
{
	return __camellia_setkey(crypto_skcipher_ctx(tfm), key, keylen);
}

ecb_encrypt(struct skcipher_request * req)3344893bc2SEric Biggers static int ecb_encrypt(struct skcipher_request *req)
34f3f935a7SJussi Kivilinna {
35407d409aSArd Biesheuvel 	ECB_WALK_START(req, CAMELLIA_BLOCK_SIZE, CAMELLIA_AESNI_PARALLEL_BLOCKS);
36407d409aSArd Biesheuvel 	ECB_BLOCK(CAMELLIA_AESNI_AVX2_PARALLEL_BLOCKS, camellia_ecb_enc_32way);
37407d409aSArd Biesheuvel 	ECB_BLOCK(CAMELLIA_AESNI_PARALLEL_BLOCKS, camellia_ecb_enc_16way);
38407d409aSArd Biesheuvel 	ECB_BLOCK(2, camellia_enc_blk_2way);
39407d409aSArd Biesheuvel 	ECB_BLOCK(1, camellia_enc_blk);
40407d409aSArd Biesheuvel 	ECB_WALK_END();
41f3f935a7SJussi Kivilinna }
42f3f935a7SJussi Kivilinna 
ecb_decrypt(struct skcipher_request * req)4344893bc2SEric Biggers static int ecb_decrypt(struct skcipher_request *req)
44f3f935a7SJussi Kivilinna {
45407d409aSArd Biesheuvel 	ECB_WALK_START(req, CAMELLIA_BLOCK_SIZE, CAMELLIA_AESNI_PARALLEL_BLOCKS);
46407d409aSArd Biesheuvel 	ECB_BLOCK(CAMELLIA_AESNI_AVX2_PARALLEL_BLOCKS, camellia_ecb_dec_32way);
47407d409aSArd Biesheuvel 	ECB_BLOCK(CAMELLIA_AESNI_PARALLEL_BLOCKS, camellia_ecb_dec_16way);
48407d409aSArd Biesheuvel 	ECB_BLOCK(2, camellia_dec_blk_2way);
49407d409aSArd Biesheuvel 	ECB_BLOCK(1, camellia_dec_blk);
50407d409aSArd Biesheuvel 	ECB_WALK_END();
51f3f935a7SJussi Kivilinna }
52f3f935a7SJussi Kivilinna 
cbc_encrypt(struct skcipher_request * req)5344893bc2SEric Biggers static int cbc_encrypt(struct skcipher_request *req)
54f3f935a7SJussi Kivilinna {
55407d409aSArd Biesheuvel 	CBC_WALK_START(req, CAMELLIA_BLOCK_SIZE, -1);
56407d409aSArd Biesheuvel 	CBC_ENC_BLOCK(camellia_enc_blk);
57407d409aSArd Biesheuvel 	CBC_WALK_END();
58f3f935a7SJussi Kivilinna }
59f3f935a7SJussi Kivilinna 
cbc_decrypt(struct skcipher_request * req)6044893bc2SEric Biggers static int cbc_decrypt(struct skcipher_request *req)
61f3f935a7SJussi Kivilinna {
62407d409aSArd Biesheuvel 	CBC_WALK_START(req, CAMELLIA_BLOCK_SIZE, CAMELLIA_AESNI_PARALLEL_BLOCKS);
63407d409aSArd Biesheuvel 	CBC_DEC_BLOCK(CAMELLIA_AESNI_AVX2_PARALLEL_BLOCKS, camellia_cbc_dec_32way);
64407d409aSArd Biesheuvel 	CBC_DEC_BLOCK(CAMELLIA_AESNI_PARALLEL_BLOCKS, camellia_cbc_dec_16way);
65407d409aSArd Biesheuvel 	CBC_DEC_BLOCK(2, camellia_decrypt_cbc_2way);
66407d409aSArd Biesheuvel 	CBC_DEC_BLOCK(1, camellia_dec_blk);
67407d409aSArd Biesheuvel 	CBC_WALK_END();
68f3f935a7SJussi Kivilinna }
69f3f935a7SJussi Kivilinna 
7044893bc2SEric Biggers static struct skcipher_alg camellia_algs[] = {
7144893bc2SEric Biggers 	{
7244893bc2SEric Biggers 		.base.cra_name		= "__ecb(camellia)",
7344893bc2SEric Biggers 		.base.cra_driver_name	= "__ecb-camellia-aesni-avx2",
7444893bc2SEric Biggers 		.base.cra_priority	= 500,
7544893bc2SEric Biggers 		.base.cra_flags		= CRYPTO_ALG_INTERNAL,
7644893bc2SEric Biggers 		.base.cra_blocksize	= CAMELLIA_BLOCK_SIZE,
7744893bc2SEric Biggers 		.base.cra_ctxsize	= sizeof(struct camellia_ctx),
7844893bc2SEric Biggers 		.base.cra_module	= THIS_MODULE,
79f3f935a7SJussi Kivilinna 		.min_keysize		= CAMELLIA_MIN_KEY_SIZE,
80f3f935a7SJussi Kivilinna 		.max_keysize		= CAMELLIA_MAX_KEY_SIZE,
81f3f935a7SJussi Kivilinna 		.setkey			= camellia_setkey,
82f3f935a7SJussi Kivilinna 		.encrypt		= ecb_encrypt,
83f3f935a7SJussi Kivilinna 		.decrypt		= ecb_decrypt,
84f3f935a7SJussi Kivilinna 	}, {
8544893bc2SEric Biggers 		.base.cra_name		= "__cbc(camellia)",
8644893bc2SEric Biggers 		.base.cra_driver_name	= "__cbc-camellia-aesni-avx2",
8744893bc2SEric Biggers 		.base.cra_priority	= 500,
8844893bc2SEric Biggers 		.base.cra_flags		= CRYPTO_ALG_INTERNAL,
8944893bc2SEric Biggers 		.base.cra_blocksize	= CAMELLIA_BLOCK_SIZE,
9044893bc2SEric Biggers 		.base.cra_ctxsize	= sizeof(struct camellia_ctx),
9144893bc2SEric Biggers 		.base.cra_module	= THIS_MODULE,
92f3f935a7SJussi Kivilinna 		.min_keysize		= CAMELLIA_MIN_KEY_SIZE,
93f3f935a7SJussi Kivilinna 		.max_keysize		= CAMELLIA_MAX_KEY_SIZE,
94f3f935a7SJussi Kivilinna 		.ivsize			= CAMELLIA_BLOCK_SIZE,
95f3f935a7SJussi Kivilinna 		.setkey			= camellia_setkey,
9644893bc2SEric Biggers 		.encrypt		= cbc_encrypt,
9744893bc2SEric Biggers 		.decrypt		= cbc_decrypt,
98f3f935a7SJussi Kivilinna 	},
9944893bc2SEric Biggers };
10044893bc2SEric Biggers 
10144893bc2SEric Biggers static struct simd_skcipher_alg *camellia_simd_algs[ARRAY_SIZE(camellia_algs)];
102f3f935a7SJussi Kivilinna 
camellia_aesni_init(void)103f3f935a7SJussi Kivilinna static int __init camellia_aesni_init(void)
104f3f935a7SJussi Kivilinna {
1057bc371faSIngo Molnar 	const char *feature_name;
106f3f935a7SJussi Kivilinna 
107da154e82SBorislav Petkov 	if (!boot_cpu_has(X86_FEATURE_AVX) ||
108da154e82SBorislav Petkov 	    !boot_cpu_has(X86_FEATURE_AVX2) ||
1091f4dd793SBorislav Petkov 	    !boot_cpu_has(X86_FEATURE_AES) ||
110ab4a56faSBorislav Petkov 	    !boot_cpu_has(X86_FEATURE_OSXSAVE)) {
111b54b4bbbSIngo Molnar 		pr_info("AVX2 or AES-NI instructions are not detected.\n");
112b54b4bbbSIngo Molnar 		return -ENODEV;
113b54b4bbbSIngo Molnar 	}
114b54b4bbbSIngo Molnar 
115d91cab78SDave Hansen 	if (!cpu_has_xfeatures(XFEATURE_MASK_SSE | XFEATURE_MASK_YMM,
116d91cab78SDave Hansen 				&feature_name)) {
1177bc371faSIngo Molnar 		pr_info("CPU feature '%s' is not supported.\n", feature_name);
118f3f935a7SJussi Kivilinna 		return -ENODEV;
119f3f935a7SJussi Kivilinna 	}
120f3f935a7SJussi Kivilinna 
12144893bc2SEric Biggers 	return simd_register_skciphers_compat(camellia_algs,
12244893bc2SEric Biggers 					      ARRAY_SIZE(camellia_algs),
12344893bc2SEric Biggers 					      camellia_simd_algs);
124f3f935a7SJussi Kivilinna }
125f3f935a7SJussi Kivilinna 
camellia_aesni_fini(void)126f3f935a7SJussi Kivilinna static void __exit camellia_aesni_fini(void)
127f3f935a7SJussi Kivilinna {
12844893bc2SEric Biggers 	simd_unregister_skciphers(camellia_algs, ARRAY_SIZE(camellia_algs),
12944893bc2SEric Biggers 				  camellia_simd_algs);
130f3f935a7SJussi Kivilinna }
131f3f935a7SJussi Kivilinna 
132f3f935a7SJussi Kivilinna module_init(camellia_aesni_init);
133f3f935a7SJussi Kivilinna module_exit(camellia_aesni_fini);
134f3f935a7SJussi Kivilinna 
135f3f935a7SJussi Kivilinna MODULE_LICENSE("GPL");
136f3f935a7SJussi Kivilinna MODULE_DESCRIPTION("Camellia Cipher Algorithm, AES-NI/AVX2 optimized");
1375d26a105SKees Cook MODULE_ALIAS_CRYPTO("camellia");
1385d26a105SKees Cook MODULE_ALIAS_CRYPTO("camellia-asm");
139