xref: /OK3568_Linux_fs/kernel/arch/x86/crypto/cast6_avx_glue.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
// SPDX-License-Identifier: GPL-2.0-or-later
/*
 * Glue Code for the AVX assembler implementation of the Cast6 Cipher
 *
 * Copyright (C) 2012 Johannes Goetzfried
 *     <Johannes.Goetzfried@informatik.stud.uni-erlangen.de>
 *
 * Copyright © 2013 Jussi Kivilinna <jussi.kivilinna@iki.fi>
 */
10*4882a593Smuzhiyun 
11*4882a593Smuzhiyun #include <linux/module.h>
12*4882a593Smuzhiyun #include <linux/types.h>
13*4882a593Smuzhiyun #include <linux/crypto.h>
14*4882a593Smuzhiyun #include <linux/err.h>
15*4882a593Smuzhiyun #include <crypto/algapi.h>
16*4882a593Smuzhiyun #include <crypto/cast6.h>
17*4882a593Smuzhiyun #include <crypto/internal/simd.h>
18*4882a593Smuzhiyun #include <crypto/xts.h>
19*4882a593Smuzhiyun #include <asm/crypto/glue_helper.h>
20*4882a593Smuzhiyun 
21*4882a593Smuzhiyun #define CAST6_PARALLEL_BLOCKS 8
22*4882a593Smuzhiyun 
23*4882a593Smuzhiyun asmlinkage void cast6_ecb_enc_8way(const void *ctx, u8 *dst, const u8 *src);
24*4882a593Smuzhiyun asmlinkage void cast6_ecb_dec_8way(const void *ctx, u8 *dst, const u8 *src);
25*4882a593Smuzhiyun 
26*4882a593Smuzhiyun asmlinkage void cast6_cbc_dec_8way(const void *ctx, u8 *dst, const u8 *src);
27*4882a593Smuzhiyun asmlinkage void cast6_ctr_8way(const void *ctx, u8 *dst, const u8 *src,
28*4882a593Smuzhiyun 			       le128 *iv);
29*4882a593Smuzhiyun 
30*4882a593Smuzhiyun asmlinkage void cast6_xts_enc_8way(const void *ctx, u8 *dst, const u8 *src,
31*4882a593Smuzhiyun 				   le128 *iv);
32*4882a593Smuzhiyun asmlinkage void cast6_xts_dec_8way(const void *ctx, u8 *dst, const u8 *src,
33*4882a593Smuzhiyun 				   le128 *iv);
34*4882a593Smuzhiyun 
cast6_setkey_skcipher(struct crypto_skcipher * tfm,const u8 * key,unsigned int keylen)35*4882a593Smuzhiyun static int cast6_setkey_skcipher(struct crypto_skcipher *tfm,
36*4882a593Smuzhiyun 				 const u8 *key, unsigned int keylen)
37*4882a593Smuzhiyun {
38*4882a593Smuzhiyun 	return cast6_setkey(&tfm->base, key, keylen);
39*4882a593Smuzhiyun }
40*4882a593Smuzhiyun 
/*
 * num_blocks = 1 entry of the cast6_enc_xts table: forwards all four
 * arguments to glue_xts_crypt_128bit_one() with __cast6_encrypt as the
 * block function.
 */
static void cast6_xts_enc(const void *ctx, u8 *dst, const u8 *src,
			  le128 *iv)
{
	glue_xts_crypt_128bit_one(ctx, dst, src, iv,
				  __cast6_encrypt);
}
45*4882a593Smuzhiyun 
/*
 * num_blocks = 1 entry of the cast6_dec_xts table: forwards all four
 * arguments to glue_xts_crypt_128bit_one() with __cast6_decrypt as the
 * block function.
 */
static void cast6_xts_dec(const void *ctx, u8 *dst, const u8 *src,
			  le128 *iv)
{
	glue_xts_crypt_128bit_one(ctx, dst, src, iv,
				  __cast6_decrypt);
}
50*4882a593Smuzhiyun 
/*
 * num_blocks = 1 entry of the cast6_ctr table.
 *
 * @ctx: cipher context handed to __cast6_encrypt()
 * @d:   destination, accessed as one u128
 * @s:   source, accessed as one u128
 * @iv:  counter; read first, then advanced with le128_inc()
 */
static void cast6_crypt_ctr(const void *ctx, u8 *d, const u8 *s, le128 *iv)
{
	be128 block;

	/* Take the be128 copy of the counter before it is incremented. */
	le128_to_be128(&block, iv);
	le128_inc(iv);

	/* Encrypt the copy in place, then XOR it with the source into dst. */
	__cast6_encrypt(ctx, (u8 *)&block, (u8 *)&block);
	u128_xor((u128 *)d, (const u128 *)s, (u128 *)&block);
}
63*4882a593Smuzhiyun 
64*4882a593Smuzhiyun static const struct common_glue_ctx cast6_enc = {
65*4882a593Smuzhiyun 	.num_funcs = 2,
66*4882a593Smuzhiyun 	.fpu_blocks_limit = CAST6_PARALLEL_BLOCKS,
67*4882a593Smuzhiyun 
68*4882a593Smuzhiyun 	.funcs = { {
69*4882a593Smuzhiyun 		.num_blocks = CAST6_PARALLEL_BLOCKS,
70*4882a593Smuzhiyun 		.fn_u = { .ecb = cast6_ecb_enc_8way }
71*4882a593Smuzhiyun 	}, {
72*4882a593Smuzhiyun 		.num_blocks = 1,
73*4882a593Smuzhiyun 		.fn_u = { .ecb = __cast6_encrypt }
74*4882a593Smuzhiyun 	} }
75*4882a593Smuzhiyun };
76*4882a593Smuzhiyun 
77*4882a593Smuzhiyun static const struct common_glue_ctx cast6_ctr = {
78*4882a593Smuzhiyun 	.num_funcs = 2,
79*4882a593Smuzhiyun 	.fpu_blocks_limit = CAST6_PARALLEL_BLOCKS,
80*4882a593Smuzhiyun 
81*4882a593Smuzhiyun 	.funcs = { {
82*4882a593Smuzhiyun 		.num_blocks = CAST6_PARALLEL_BLOCKS,
83*4882a593Smuzhiyun 		.fn_u = { .ctr = cast6_ctr_8way }
84*4882a593Smuzhiyun 	}, {
85*4882a593Smuzhiyun 		.num_blocks = 1,
86*4882a593Smuzhiyun 		.fn_u = { .ctr = cast6_crypt_ctr }
87*4882a593Smuzhiyun 	} }
88*4882a593Smuzhiyun };
89*4882a593Smuzhiyun 
90*4882a593Smuzhiyun static const struct common_glue_ctx cast6_enc_xts = {
91*4882a593Smuzhiyun 	.num_funcs = 2,
92*4882a593Smuzhiyun 	.fpu_blocks_limit = CAST6_PARALLEL_BLOCKS,
93*4882a593Smuzhiyun 
94*4882a593Smuzhiyun 	.funcs = { {
95*4882a593Smuzhiyun 		.num_blocks = CAST6_PARALLEL_BLOCKS,
96*4882a593Smuzhiyun 		.fn_u = { .xts = cast6_xts_enc_8way }
97*4882a593Smuzhiyun 	}, {
98*4882a593Smuzhiyun 		.num_blocks = 1,
99*4882a593Smuzhiyun 		.fn_u = { .xts = cast6_xts_enc }
100*4882a593Smuzhiyun 	} }
101*4882a593Smuzhiyun };
102*4882a593Smuzhiyun 
103*4882a593Smuzhiyun static const struct common_glue_ctx cast6_dec = {
104*4882a593Smuzhiyun 	.num_funcs = 2,
105*4882a593Smuzhiyun 	.fpu_blocks_limit = CAST6_PARALLEL_BLOCKS,
106*4882a593Smuzhiyun 
107*4882a593Smuzhiyun 	.funcs = { {
108*4882a593Smuzhiyun 		.num_blocks = CAST6_PARALLEL_BLOCKS,
109*4882a593Smuzhiyun 		.fn_u = { .ecb = cast6_ecb_dec_8way }
110*4882a593Smuzhiyun 	}, {
111*4882a593Smuzhiyun 		.num_blocks = 1,
112*4882a593Smuzhiyun 		.fn_u = { .ecb = __cast6_decrypt }
113*4882a593Smuzhiyun 	} }
114*4882a593Smuzhiyun };
115*4882a593Smuzhiyun 
116*4882a593Smuzhiyun static const struct common_glue_ctx cast6_dec_cbc = {
117*4882a593Smuzhiyun 	.num_funcs = 2,
118*4882a593Smuzhiyun 	.fpu_blocks_limit = CAST6_PARALLEL_BLOCKS,
119*4882a593Smuzhiyun 
120*4882a593Smuzhiyun 	.funcs = { {
121*4882a593Smuzhiyun 		.num_blocks = CAST6_PARALLEL_BLOCKS,
122*4882a593Smuzhiyun 		.fn_u = { .cbc = cast6_cbc_dec_8way }
123*4882a593Smuzhiyun 	}, {
124*4882a593Smuzhiyun 		.num_blocks = 1,
125*4882a593Smuzhiyun 		.fn_u = { .cbc = __cast6_decrypt }
126*4882a593Smuzhiyun 	} }
127*4882a593Smuzhiyun };
128*4882a593Smuzhiyun 
129*4882a593Smuzhiyun static const struct common_glue_ctx cast6_dec_xts = {
130*4882a593Smuzhiyun 	.num_funcs = 2,
131*4882a593Smuzhiyun 	.fpu_blocks_limit = CAST6_PARALLEL_BLOCKS,
132*4882a593Smuzhiyun 
133*4882a593Smuzhiyun 	.funcs = { {
134*4882a593Smuzhiyun 		.num_blocks = CAST6_PARALLEL_BLOCKS,
135*4882a593Smuzhiyun 		.fn_u = { .xts = cast6_xts_dec_8way }
136*4882a593Smuzhiyun 	}, {
137*4882a593Smuzhiyun 		.num_blocks = 1,
138*4882a593Smuzhiyun 		.fn_u = { .xts = cast6_xts_dec }
139*4882a593Smuzhiyun 	} }
140*4882a593Smuzhiyun };
141*4882a593Smuzhiyun 
ecb_encrypt(struct skcipher_request * req)142*4882a593Smuzhiyun static int ecb_encrypt(struct skcipher_request *req)
143*4882a593Smuzhiyun {
144*4882a593Smuzhiyun 	return glue_ecb_req_128bit(&cast6_enc, req);
145*4882a593Smuzhiyun }
146*4882a593Smuzhiyun 
ecb_decrypt(struct skcipher_request * req)147*4882a593Smuzhiyun static int ecb_decrypt(struct skcipher_request *req)
148*4882a593Smuzhiyun {
149*4882a593Smuzhiyun 	return glue_ecb_req_128bit(&cast6_dec, req);
150*4882a593Smuzhiyun }
151*4882a593Smuzhiyun 
cbc_encrypt(struct skcipher_request * req)152*4882a593Smuzhiyun static int cbc_encrypt(struct skcipher_request *req)
153*4882a593Smuzhiyun {
154*4882a593Smuzhiyun 	return glue_cbc_encrypt_req_128bit(__cast6_encrypt, req);
155*4882a593Smuzhiyun }
156*4882a593Smuzhiyun 
cbc_decrypt(struct skcipher_request * req)157*4882a593Smuzhiyun static int cbc_decrypt(struct skcipher_request *req)
158*4882a593Smuzhiyun {
159*4882a593Smuzhiyun 	return glue_cbc_decrypt_req_128bit(&cast6_dec_cbc, req);
160*4882a593Smuzhiyun }
161*4882a593Smuzhiyun 
ctr_crypt(struct skcipher_request * req)162*4882a593Smuzhiyun static int ctr_crypt(struct skcipher_request *req)
163*4882a593Smuzhiyun {
164*4882a593Smuzhiyun 	return glue_ctr_req_128bit(&cast6_ctr, req);
165*4882a593Smuzhiyun }
166*4882a593Smuzhiyun 
167*4882a593Smuzhiyun struct cast6_xts_ctx {
168*4882a593Smuzhiyun 	struct cast6_ctx tweak_ctx;
169*4882a593Smuzhiyun 	struct cast6_ctx crypt_ctx;
170*4882a593Smuzhiyun };
171*4882a593Smuzhiyun 
xts_cast6_setkey(struct crypto_skcipher * tfm,const u8 * key,unsigned int keylen)172*4882a593Smuzhiyun static int xts_cast6_setkey(struct crypto_skcipher *tfm, const u8 *key,
173*4882a593Smuzhiyun 			    unsigned int keylen)
174*4882a593Smuzhiyun {
175*4882a593Smuzhiyun 	struct cast6_xts_ctx *ctx = crypto_skcipher_ctx(tfm);
176*4882a593Smuzhiyun 	int err;
177*4882a593Smuzhiyun 
178*4882a593Smuzhiyun 	err = xts_verify_key(tfm, key, keylen);
179*4882a593Smuzhiyun 	if (err)
180*4882a593Smuzhiyun 		return err;
181*4882a593Smuzhiyun 
182*4882a593Smuzhiyun 	/* first half of xts-key is for crypt */
183*4882a593Smuzhiyun 	err = __cast6_setkey(&ctx->crypt_ctx, key, keylen / 2);
184*4882a593Smuzhiyun 	if (err)
185*4882a593Smuzhiyun 		return err;
186*4882a593Smuzhiyun 
187*4882a593Smuzhiyun 	/* second half of xts-key is for tweak */
188*4882a593Smuzhiyun 	return __cast6_setkey(&ctx->tweak_ctx, key + keylen / 2, keylen / 2);
189*4882a593Smuzhiyun }
190*4882a593Smuzhiyun 
xts_encrypt(struct skcipher_request * req)191*4882a593Smuzhiyun static int xts_encrypt(struct skcipher_request *req)
192*4882a593Smuzhiyun {
193*4882a593Smuzhiyun 	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
194*4882a593Smuzhiyun 	struct cast6_xts_ctx *ctx = crypto_skcipher_ctx(tfm);
195*4882a593Smuzhiyun 
196*4882a593Smuzhiyun 	return glue_xts_req_128bit(&cast6_enc_xts, req, __cast6_encrypt,
197*4882a593Smuzhiyun 				   &ctx->tweak_ctx, &ctx->crypt_ctx, false);
198*4882a593Smuzhiyun }
199*4882a593Smuzhiyun 
xts_decrypt(struct skcipher_request * req)200*4882a593Smuzhiyun static int xts_decrypt(struct skcipher_request *req)
201*4882a593Smuzhiyun {
202*4882a593Smuzhiyun 	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
203*4882a593Smuzhiyun 	struct cast6_xts_ctx *ctx = crypto_skcipher_ctx(tfm);
204*4882a593Smuzhiyun 
205*4882a593Smuzhiyun 	return glue_xts_req_128bit(&cast6_dec_xts, req, __cast6_encrypt,
206*4882a593Smuzhiyun 				   &ctx->tweak_ctx, &ctx->crypt_ctx, true);
207*4882a593Smuzhiyun }
208*4882a593Smuzhiyun 
209*4882a593Smuzhiyun static struct skcipher_alg cast6_algs[] = {
210*4882a593Smuzhiyun 	{
211*4882a593Smuzhiyun 		.base.cra_name		= "__ecb(cast6)",
212*4882a593Smuzhiyun 		.base.cra_driver_name	= "__ecb-cast6-avx",
213*4882a593Smuzhiyun 		.base.cra_priority	= 200,
214*4882a593Smuzhiyun 		.base.cra_flags		= CRYPTO_ALG_INTERNAL,
215*4882a593Smuzhiyun 		.base.cra_blocksize	= CAST6_BLOCK_SIZE,
216*4882a593Smuzhiyun 		.base.cra_ctxsize	= sizeof(struct cast6_ctx),
217*4882a593Smuzhiyun 		.base.cra_module	= THIS_MODULE,
218*4882a593Smuzhiyun 		.min_keysize		= CAST6_MIN_KEY_SIZE,
219*4882a593Smuzhiyun 		.max_keysize		= CAST6_MAX_KEY_SIZE,
220*4882a593Smuzhiyun 		.setkey			= cast6_setkey_skcipher,
221*4882a593Smuzhiyun 		.encrypt		= ecb_encrypt,
222*4882a593Smuzhiyun 		.decrypt		= ecb_decrypt,
223*4882a593Smuzhiyun 	}, {
224*4882a593Smuzhiyun 		.base.cra_name		= "__cbc(cast6)",
225*4882a593Smuzhiyun 		.base.cra_driver_name	= "__cbc-cast6-avx",
226*4882a593Smuzhiyun 		.base.cra_priority	= 200,
227*4882a593Smuzhiyun 		.base.cra_flags		= CRYPTO_ALG_INTERNAL,
228*4882a593Smuzhiyun 		.base.cra_blocksize	= CAST6_BLOCK_SIZE,
229*4882a593Smuzhiyun 		.base.cra_ctxsize	= sizeof(struct cast6_ctx),
230*4882a593Smuzhiyun 		.base.cra_module	= THIS_MODULE,
231*4882a593Smuzhiyun 		.min_keysize		= CAST6_MIN_KEY_SIZE,
232*4882a593Smuzhiyun 		.max_keysize		= CAST6_MAX_KEY_SIZE,
233*4882a593Smuzhiyun 		.ivsize			= CAST6_BLOCK_SIZE,
234*4882a593Smuzhiyun 		.setkey			= cast6_setkey_skcipher,
235*4882a593Smuzhiyun 		.encrypt		= cbc_encrypt,
236*4882a593Smuzhiyun 		.decrypt		= cbc_decrypt,
237*4882a593Smuzhiyun 	}, {
238*4882a593Smuzhiyun 		.base.cra_name		= "__ctr(cast6)",
239*4882a593Smuzhiyun 		.base.cra_driver_name	= "__ctr-cast6-avx",
240*4882a593Smuzhiyun 		.base.cra_priority	= 200,
241*4882a593Smuzhiyun 		.base.cra_flags		= CRYPTO_ALG_INTERNAL,
242*4882a593Smuzhiyun 		.base.cra_blocksize	= 1,
243*4882a593Smuzhiyun 		.base.cra_ctxsize	= sizeof(struct cast6_ctx),
244*4882a593Smuzhiyun 		.base.cra_module	= THIS_MODULE,
245*4882a593Smuzhiyun 		.min_keysize		= CAST6_MIN_KEY_SIZE,
246*4882a593Smuzhiyun 		.max_keysize		= CAST6_MAX_KEY_SIZE,
247*4882a593Smuzhiyun 		.ivsize			= CAST6_BLOCK_SIZE,
248*4882a593Smuzhiyun 		.chunksize		= CAST6_BLOCK_SIZE,
249*4882a593Smuzhiyun 		.setkey			= cast6_setkey_skcipher,
250*4882a593Smuzhiyun 		.encrypt		= ctr_crypt,
251*4882a593Smuzhiyun 		.decrypt		= ctr_crypt,
252*4882a593Smuzhiyun 	}, {
253*4882a593Smuzhiyun 		.base.cra_name		= "__xts(cast6)",
254*4882a593Smuzhiyun 		.base.cra_driver_name	= "__xts-cast6-avx",
255*4882a593Smuzhiyun 		.base.cra_priority	= 200,
256*4882a593Smuzhiyun 		.base.cra_flags		= CRYPTO_ALG_INTERNAL,
257*4882a593Smuzhiyun 		.base.cra_blocksize	= CAST6_BLOCK_SIZE,
258*4882a593Smuzhiyun 		.base.cra_ctxsize	= sizeof(struct cast6_xts_ctx),
259*4882a593Smuzhiyun 		.base.cra_module	= THIS_MODULE,
260*4882a593Smuzhiyun 		.min_keysize		= 2 * CAST6_MIN_KEY_SIZE,
261*4882a593Smuzhiyun 		.max_keysize		= 2 * CAST6_MAX_KEY_SIZE,
262*4882a593Smuzhiyun 		.ivsize			= CAST6_BLOCK_SIZE,
263*4882a593Smuzhiyun 		.setkey			= xts_cast6_setkey,
264*4882a593Smuzhiyun 		.encrypt		= xts_encrypt,
265*4882a593Smuzhiyun 		.decrypt		= xts_decrypt,
266*4882a593Smuzhiyun 	},
267*4882a593Smuzhiyun };
268*4882a593Smuzhiyun 
269*4882a593Smuzhiyun static struct simd_skcipher_alg *cast6_simd_algs[ARRAY_SIZE(cast6_algs)];
270*4882a593Smuzhiyun 
cast6_init(void)271*4882a593Smuzhiyun static int __init cast6_init(void)
272*4882a593Smuzhiyun {
273*4882a593Smuzhiyun 	const char *feature_name;
274*4882a593Smuzhiyun 
275*4882a593Smuzhiyun 	if (!cpu_has_xfeatures(XFEATURE_MASK_SSE | XFEATURE_MASK_YMM,
276*4882a593Smuzhiyun 				&feature_name)) {
277*4882a593Smuzhiyun 		pr_info("CPU feature '%s' is not supported.\n", feature_name);
278*4882a593Smuzhiyun 		return -ENODEV;
279*4882a593Smuzhiyun 	}
280*4882a593Smuzhiyun 
281*4882a593Smuzhiyun 	return simd_register_skciphers_compat(cast6_algs,
282*4882a593Smuzhiyun 					      ARRAY_SIZE(cast6_algs),
283*4882a593Smuzhiyun 					      cast6_simd_algs);
284*4882a593Smuzhiyun }
285*4882a593Smuzhiyun 
cast6_exit(void)286*4882a593Smuzhiyun static void __exit cast6_exit(void)
287*4882a593Smuzhiyun {
288*4882a593Smuzhiyun 	simd_unregister_skciphers(cast6_algs, ARRAY_SIZE(cast6_algs),
289*4882a593Smuzhiyun 				  cast6_simd_algs);
290*4882a593Smuzhiyun }
291*4882a593Smuzhiyun 
292*4882a593Smuzhiyun module_init(cast6_init);
293*4882a593Smuzhiyun module_exit(cast6_exit);
294*4882a593Smuzhiyun 
295*4882a593Smuzhiyun MODULE_DESCRIPTION("Cast6 Cipher Algorithm, AVX optimized");
296*4882a593Smuzhiyun MODULE_LICENSE("GPL");
297*4882a593Smuzhiyun MODULE_ALIAS_CRYPTO("cast6");
298