xref: /OK3568_Linux_fs/kernel/arch/x86/crypto/serpent_avx2_glue.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-or-later
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun  * Glue Code for x86_64/AVX2 assembler optimized version of Serpent
4*4882a593Smuzhiyun  *
5*4882a593Smuzhiyun  * Copyright © 2012-2013 Jussi Kivilinna <jussi.kivilinna@mbnet.fi>
6*4882a593Smuzhiyun  */
7*4882a593Smuzhiyun 
8*4882a593Smuzhiyun #include <linux/module.h>
9*4882a593Smuzhiyun #include <linux/types.h>
10*4882a593Smuzhiyun #include <linux/crypto.h>
11*4882a593Smuzhiyun #include <linux/err.h>
12*4882a593Smuzhiyun #include <crypto/algapi.h>
13*4882a593Smuzhiyun #include <crypto/internal/simd.h>
14*4882a593Smuzhiyun #include <crypto/serpent.h>
15*4882a593Smuzhiyun #include <crypto/xts.h>
16*4882a593Smuzhiyun #include <asm/crypto/glue_helper.h>
17*4882a593Smuzhiyun #include <asm/crypto/serpent-avx.h>
18*4882a593Smuzhiyun 
19*4882a593Smuzhiyun #define SERPENT_AVX2_PARALLEL_BLOCKS 16
20*4882a593Smuzhiyun 
21*4882a593Smuzhiyun /* 16-way AVX2 parallel cipher functions */
22*4882a593Smuzhiyun asmlinkage void serpent_ecb_enc_16way(const void *ctx, u8 *dst, const u8 *src);
23*4882a593Smuzhiyun asmlinkage void serpent_ecb_dec_16way(const void *ctx, u8 *dst, const u8 *src);
24*4882a593Smuzhiyun asmlinkage void serpent_cbc_dec_16way(const void *ctx, u8 *dst, const u8 *src);
25*4882a593Smuzhiyun 
26*4882a593Smuzhiyun asmlinkage void serpent_ctr_16way(const void *ctx, u8 *dst, const u8 *src,
27*4882a593Smuzhiyun 				  le128 *iv);
28*4882a593Smuzhiyun asmlinkage void serpent_xts_enc_16way(const void *ctx, u8 *dst, const u8 *src,
29*4882a593Smuzhiyun 				      le128 *iv);
30*4882a593Smuzhiyun asmlinkage void serpent_xts_dec_16way(const void *ctx, u8 *dst, const u8 *src,
31*4882a593Smuzhiyun 				      le128 *iv);
32*4882a593Smuzhiyun 
/*
 * ->setkey handler used by the ECB, CBC and CTR entries of serpent_algs.
 *
 * Looks up the transform's private context and passes it, together with the
 * key and its length, to __serpent_setkey(). The return value of that call
 * is returned unchanged.
 */
static int serpent_setkey_skcipher(struct crypto_skcipher *tfm,
				   const u8 *key, unsigned int keylen)
{
	void *cipher_ctx = crypto_skcipher_ctx(tfm);

	return __serpent_setkey(cipher_ctx, key, keylen);
}
38*4882a593Smuzhiyun 
39*4882a593Smuzhiyun static const struct common_glue_ctx serpent_enc = {
40*4882a593Smuzhiyun 	.num_funcs = 3,
41*4882a593Smuzhiyun 	.fpu_blocks_limit = 8,
42*4882a593Smuzhiyun 
43*4882a593Smuzhiyun 	.funcs = { {
44*4882a593Smuzhiyun 		.num_blocks = 16,
45*4882a593Smuzhiyun 		.fn_u = { .ecb = serpent_ecb_enc_16way }
46*4882a593Smuzhiyun 	}, {
47*4882a593Smuzhiyun 		.num_blocks = 8,
48*4882a593Smuzhiyun 		.fn_u = { .ecb = serpent_ecb_enc_8way_avx }
49*4882a593Smuzhiyun 	}, {
50*4882a593Smuzhiyun 		.num_blocks = 1,
51*4882a593Smuzhiyun 		.fn_u = { .ecb = __serpent_encrypt }
52*4882a593Smuzhiyun 	} }
53*4882a593Smuzhiyun };
54*4882a593Smuzhiyun 
55*4882a593Smuzhiyun static const struct common_glue_ctx serpent_ctr = {
56*4882a593Smuzhiyun 	.num_funcs = 3,
57*4882a593Smuzhiyun 	.fpu_blocks_limit = 8,
58*4882a593Smuzhiyun 
59*4882a593Smuzhiyun 	.funcs = { {
60*4882a593Smuzhiyun 		.num_blocks = 16,
61*4882a593Smuzhiyun 		.fn_u = { .ctr = serpent_ctr_16way }
62*4882a593Smuzhiyun 	},  {
63*4882a593Smuzhiyun 		.num_blocks = 8,
64*4882a593Smuzhiyun 		.fn_u = { .ctr = serpent_ctr_8way_avx }
65*4882a593Smuzhiyun 	}, {
66*4882a593Smuzhiyun 		.num_blocks = 1,
67*4882a593Smuzhiyun 		.fn_u = { .ctr = __serpent_crypt_ctr }
68*4882a593Smuzhiyun 	} }
69*4882a593Smuzhiyun };
70*4882a593Smuzhiyun 
71*4882a593Smuzhiyun static const struct common_glue_ctx serpent_enc_xts = {
72*4882a593Smuzhiyun 	.num_funcs = 3,
73*4882a593Smuzhiyun 	.fpu_blocks_limit = 8,
74*4882a593Smuzhiyun 
75*4882a593Smuzhiyun 	.funcs = { {
76*4882a593Smuzhiyun 		.num_blocks = 16,
77*4882a593Smuzhiyun 		.fn_u = { .xts = serpent_xts_enc_16way }
78*4882a593Smuzhiyun 	}, {
79*4882a593Smuzhiyun 		.num_blocks = 8,
80*4882a593Smuzhiyun 		.fn_u = { .xts = serpent_xts_enc_8way_avx }
81*4882a593Smuzhiyun 	}, {
82*4882a593Smuzhiyun 		.num_blocks = 1,
83*4882a593Smuzhiyun 		.fn_u = { .xts = serpent_xts_enc }
84*4882a593Smuzhiyun 	} }
85*4882a593Smuzhiyun };
86*4882a593Smuzhiyun 
87*4882a593Smuzhiyun static const struct common_glue_ctx serpent_dec = {
88*4882a593Smuzhiyun 	.num_funcs = 3,
89*4882a593Smuzhiyun 	.fpu_blocks_limit = 8,
90*4882a593Smuzhiyun 
91*4882a593Smuzhiyun 	.funcs = { {
92*4882a593Smuzhiyun 		.num_blocks = 16,
93*4882a593Smuzhiyun 		.fn_u = { .ecb = serpent_ecb_dec_16way }
94*4882a593Smuzhiyun 	}, {
95*4882a593Smuzhiyun 		.num_blocks = 8,
96*4882a593Smuzhiyun 		.fn_u = { .ecb = serpent_ecb_dec_8way_avx }
97*4882a593Smuzhiyun 	}, {
98*4882a593Smuzhiyun 		.num_blocks = 1,
99*4882a593Smuzhiyun 		.fn_u = { .ecb = __serpent_decrypt }
100*4882a593Smuzhiyun 	} }
101*4882a593Smuzhiyun };
102*4882a593Smuzhiyun 
103*4882a593Smuzhiyun static const struct common_glue_ctx serpent_dec_cbc = {
104*4882a593Smuzhiyun 	.num_funcs = 3,
105*4882a593Smuzhiyun 	.fpu_blocks_limit = 8,
106*4882a593Smuzhiyun 
107*4882a593Smuzhiyun 	.funcs = { {
108*4882a593Smuzhiyun 		.num_blocks = 16,
109*4882a593Smuzhiyun 		.fn_u = { .cbc = serpent_cbc_dec_16way }
110*4882a593Smuzhiyun 	}, {
111*4882a593Smuzhiyun 		.num_blocks = 8,
112*4882a593Smuzhiyun 		.fn_u = { .cbc = serpent_cbc_dec_8way_avx }
113*4882a593Smuzhiyun 	}, {
114*4882a593Smuzhiyun 		.num_blocks = 1,
115*4882a593Smuzhiyun 		.fn_u = { .cbc = __serpent_decrypt }
116*4882a593Smuzhiyun 	} }
117*4882a593Smuzhiyun };
118*4882a593Smuzhiyun 
119*4882a593Smuzhiyun static const struct common_glue_ctx serpent_dec_xts = {
120*4882a593Smuzhiyun 	.num_funcs = 3,
121*4882a593Smuzhiyun 	.fpu_blocks_limit = 8,
122*4882a593Smuzhiyun 
123*4882a593Smuzhiyun 	.funcs = { {
124*4882a593Smuzhiyun 		.num_blocks = 16,
125*4882a593Smuzhiyun 		.fn_u = { .xts = serpent_xts_dec_16way }
126*4882a593Smuzhiyun 	}, {
127*4882a593Smuzhiyun 		.num_blocks = 8,
128*4882a593Smuzhiyun 		.fn_u = { .xts = serpent_xts_dec_8way_avx }
129*4882a593Smuzhiyun 	}, {
130*4882a593Smuzhiyun 		.num_blocks = 1,
131*4882a593Smuzhiyun 		.fn_u = { .xts = serpent_xts_dec }
132*4882a593Smuzhiyun 	} }
133*4882a593Smuzhiyun };
134*4882a593Smuzhiyun 
ecb_encrypt(struct skcipher_request * req)135*4882a593Smuzhiyun static int ecb_encrypt(struct skcipher_request *req)
136*4882a593Smuzhiyun {
137*4882a593Smuzhiyun 	return glue_ecb_req_128bit(&serpent_enc, req);
138*4882a593Smuzhiyun }
139*4882a593Smuzhiyun 
ecb_decrypt(struct skcipher_request * req)140*4882a593Smuzhiyun static int ecb_decrypt(struct skcipher_request *req)
141*4882a593Smuzhiyun {
142*4882a593Smuzhiyun 	return glue_ecb_req_128bit(&serpent_dec, req);
143*4882a593Smuzhiyun }
144*4882a593Smuzhiyun 
cbc_encrypt(struct skcipher_request * req)145*4882a593Smuzhiyun static int cbc_encrypt(struct skcipher_request *req)
146*4882a593Smuzhiyun {
147*4882a593Smuzhiyun 	return glue_cbc_encrypt_req_128bit(__serpent_encrypt, req);
148*4882a593Smuzhiyun }
149*4882a593Smuzhiyun 
cbc_decrypt(struct skcipher_request * req)150*4882a593Smuzhiyun static int cbc_decrypt(struct skcipher_request *req)
151*4882a593Smuzhiyun {
152*4882a593Smuzhiyun 	return glue_cbc_decrypt_req_128bit(&serpent_dec_cbc, req);
153*4882a593Smuzhiyun }
154*4882a593Smuzhiyun 
ctr_crypt(struct skcipher_request * req)155*4882a593Smuzhiyun static int ctr_crypt(struct skcipher_request *req)
156*4882a593Smuzhiyun {
157*4882a593Smuzhiyun 	return glue_ctr_req_128bit(&serpent_ctr, req);
158*4882a593Smuzhiyun }
159*4882a593Smuzhiyun 
xts_encrypt(struct skcipher_request * req)160*4882a593Smuzhiyun static int xts_encrypt(struct skcipher_request *req)
161*4882a593Smuzhiyun {
162*4882a593Smuzhiyun 	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
163*4882a593Smuzhiyun 	struct serpent_xts_ctx *ctx = crypto_skcipher_ctx(tfm);
164*4882a593Smuzhiyun 
165*4882a593Smuzhiyun 	return glue_xts_req_128bit(&serpent_enc_xts, req,
166*4882a593Smuzhiyun 				   __serpent_encrypt, &ctx->tweak_ctx,
167*4882a593Smuzhiyun 				   &ctx->crypt_ctx, false);
168*4882a593Smuzhiyun }
169*4882a593Smuzhiyun 
xts_decrypt(struct skcipher_request * req)170*4882a593Smuzhiyun static int xts_decrypt(struct skcipher_request *req)
171*4882a593Smuzhiyun {
172*4882a593Smuzhiyun 	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
173*4882a593Smuzhiyun 	struct serpent_xts_ctx *ctx = crypto_skcipher_ctx(tfm);
174*4882a593Smuzhiyun 
175*4882a593Smuzhiyun 	return glue_xts_req_128bit(&serpent_dec_xts, req,
176*4882a593Smuzhiyun 				   __serpent_encrypt, &ctx->tweak_ctx,
177*4882a593Smuzhiyun 				   &ctx->crypt_ctx, true);
178*4882a593Smuzhiyun }
179*4882a593Smuzhiyun 
180*4882a593Smuzhiyun static struct skcipher_alg serpent_algs[] = {
181*4882a593Smuzhiyun 	{
182*4882a593Smuzhiyun 		.base.cra_name		= "__ecb(serpent)",
183*4882a593Smuzhiyun 		.base.cra_driver_name	= "__ecb-serpent-avx2",
184*4882a593Smuzhiyun 		.base.cra_priority	= 600,
185*4882a593Smuzhiyun 		.base.cra_flags		= CRYPTO_ALG_INTERNAL,
186*4882a593Smuzhiyun 		.base.cra_blocksize	= SERPENT_BLOCK_SIZE,
187*4882a593Smuzhiyun 		.base.cra_ctxsize	= sizeof(struct serpent_ctx),
188*4882a593Smuzhiyun 		.base.cra_module	= THIS_MODULE,
189*4882a593Smuzhiyun 		.min_keysize		= SERPENT_MIN_KEY_SIZE,
190*4882a593Smuzhiyun 		.max_keysize		= SERPENT_MAX_KEY_SIZE,
191*4882a593Smuzhiyun 		.setkey			= serpent_setkey_skcipher,
192*4882a593Smuzhiyun 		.encrypt		= ecb_encrypt,
193*4882a593Smuzhiyun 		.decrypt		= ecb_decrypt,
194*4882a593Smuzhiyun 	}, {
195*4882a593Smuzhiyun 		.base.cra_name		= "__cbc(serpent)",
196*4882a593Smuzhiyun 		.base.cra_driver_name	= "__cbc-serpent-avx2",
197*4882a593Smuzhiyun 		.base.cra_priority	= 600,
198*4882a593Smuzhiyun 		.base.cra_flags		= CRYPTO_ALG_INTERNAL,
199*4882a593Smuzhiyun 		.base.cra_blocksize	= SERPENT_BLOCK_SIZE,
200*4882a593Smuzhiyun 		.base.cra_ctxsize	= sizeof(struct serpent_ctx),
201*4882a593Smuzhiyun 		.base.cra_module	= THIS_MODULE,
202*4882a593Smuzhiyun 		.min_keysize		= SERPENT_MIN_KEY_SIZE,
203*4882a593Smuzhiyun 		.max_keysize		= SERPENT_MAX_KEY_SIZE,
204*4882a593Smuzhiyun 		.ivsize			= SERPENT_BLOCK_SIZE,
205*4882a593Smuzhiyun 		.setkey			= serpent_setkey_skcipher,
206*4882a593Smuzhiyun 		.encrypt		= cbc_encrypt,
207*4882a593Smuzhiyun 		.decrypt		= cbc_decrypt,
208*4882a593Smuzhiyun 	}, {
209*4882a593Smuzhiyun 		.base.cra_name		= "__ctr(serpent)",
210*4882a593Smuzhiyun 		.base.cra_driver_name	= "__ctr-serpent-avx2",
211*4882a593Smuzhiyun 		.base.cra_priority	= 600,
212*4882a593Smuzhiyun 		.base.cra_flags		= CRYPTO_ALG_INTERNAL,
213*4882a593Smuzhiyun 		.base.cra_blocksize	= 1,
214*4882a593Smuzhiyun 		.base.cra_ctxsize	= sizeof(struct serpent_ctx),
215*4882a593Smuzhiyun 		.base.cra_module	= THIS_MODULE,
216*4882a593Smuzhiyun 		.min_keysize		= SERPENT_MIN_KEY_SIZE,
217*4882a593Smuzhiyun 		.max_keysize		= SERPENT_MAX_KEY_SIZE,
218*4882a593Smuzhiyun 		.ivsize			= SERPENT_BLOCK_SIZE,
219*4882a593Smuzhiyun 		.chunksize		= SERPENT_BLOCK_SIZE,
220*4882a593Smuzhiyun 		.setkey			= serpent_setkey_skcipher,
221*4882a593Smuzhiyun 		.encrypt		= ctr_crypt,
222*4882a593Smuzhiyun 		.decrypt		= ctr_crypt,
223*4882a593Smuzhiyun 	}, {
224*4882a593Smuzhiyun 		.base.cra_name		= "__xts(serpent)",
225*4882a593Smuzhiyun 		.base.cra_driver_name	= "__xts-serpent-avx2",
226*4882a593Smuzhiyun 		.base.cra_priority	= 600,
227*4882a593Smuzhiyun 		.base.cra_flags		= CRYPTO_ALG_INTERNAL,
228*4882a593Smuzhiyun 		.base.cra_blocksize	= SERPENT_BLOCK_SIZE,
229*4882a593Smuzhiyun 		.base.cra_ctxsize	= sizeof(struct serpent_xts_ctx),
230*4882a593Smuzhiyun 		.base.cra_module	= THIS_MODULE,
231*4882a593Smuzhiyun 		.min_keysize		= 2 * SERPENT_MIN_KEY_SIZE,
232*4882a593Smuzhiyun 		.max_keysize		= 2 * SERPENT_MAX_KEY_SIZE,
233*4882a593Smuzhiyun 		.ivsize			= SERPENT_BLOCK_SIZE,
234*4882a593Smuzhiyun 		.setkey			= xts_serpent_setkey,
235*4882a593Smuzhiyun 		.encrypt		= xts_encrypt,
236*4882a593Smuzhiyun 		.decrypt		= xts_decrypt,
237*4882a593Smuzhiyun 	},
238*4882a593Smuzhiyun };
239*4882a593Smuzhiyun 
240*4882a593Smuzhiyun static struct simd_skcipher_alg *serpent_simd_algs[ARRAY_SIZE(serpent_algs)];
241*4882a593Smuzhiyun 
init(void)242*4882a593Smuzhiyun static int __init init(void)
243*4882a593Smuzhiyun {
244*4882a593Smuzhiyun 	const char *feature_name;
245*4882a593Smuzhiyun 
246*4882a593Smuzhiyun 	if (!boot_cpu_has(X86_FEATURE_AVX2) || !boot_cpu_has(X86_FEATURE_OSXSAVE)) {
247*4882a593Smuzhiyun 		pr_info("AVX2 instructions are not detected.\n");
248*4882a593Smuzhiyun 		return -ENODEV;
249*4882a593Smuzhiyun 	}
250*4882a593Smuzhiyun 	if (!cpu_has_xfeatures(XFEATURE_MASK_SSE | XFEATURE_MASK_YMM,
251*4882a593Smuzhiyun 				&feature_name)) {
252*4882a593Smuzhiyun 		pr_info("CPU feature '%s' is not supported.\n", feature_name);
253*4882a593Smuzhiyun 		return -ENODEV;
254*4882a593Smuzhiyun 	}
255*4882a593Smuzhiyun 
256*4882a593Smuzhiyun 	return simd_register_skciphers_compat(serpent_algs,
257*4882a593Smuzhiyun 					      ARRAY_SIZE(serpent_algs),
258*4882a593Smuzhiyun 					      serpent_simd_algs);
259*4882a593Smuzhiyun }
260*4882a593Smuzhiyun 
fini(void)261*4882a593Smuzhiyun static void __exit fini(void)
262*4882a593Smuzhiyun {
263*4882a593Smuzhiyun 	simd_unregister_skciphers(serpent_algs, ARRAY_SIZE(serpent_algs),
264*4882a593Smuzhiyun 				  serpent_simd_algs);
265*4882a593Smuzhiyun }
266*4882a593Smuzhiyun 
267*4882a593Smuzhiyun module_init(init);
268*4882a593Smuzhiyun module_exit(fini);
269*4882a593Smuzhiyun 
270*4882a593Smuzhiyun MODULE_LICENSE("GPL");
271*4882a593Smuzhiyun MODULE_DESCRIPTION("Serpent Cipher Algorithm, AVX2 optimized");
272*4882a593Smuzhiyun MODULE_ALIAS_CRYPTO("serpent");
273*4882a593Smuzhiyun MODULE_ALIAS_CRYPTO("serpent-asm");
274