xref: /OK3568_Linux_fs/kernel/arch/x86/crypto/cast5_avx_glue.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
// SPDX-License-Identifier: GPL-2.0-or-later
/*
 * Glue Code for the AVX assembler implementation of the Cast5 Cipher
 *
 * Copyright (C) 2012 Johannes Goetzfried
 *     <Johannes.Goetzfried@informatik.stud.uni-erlangen.de>
 */
8*4882a593Smuzhiyun 
9*4882a593Smuzhiyun #include <asm/crypto/glue_helper.h>
10*4882a593Smuzhiyun #include <crypto/algapi.h>
11*4882a593Smuzhiyun #include <crypto/cast5.h>
12*4882a593Smuzhiyun #include <crypto/internal/simd.h>
13*4882a593Smuzhiyun #include <linux/crypto.h>
14*4882a593Smuzhiyun #include <linux/err.h>
15*4882a593Smuzhiyun #include <linux/module.h>
16*4882a593Smuzhiyun #include <linux/types.h>
17*4882a593Smuzhiyun 
18*4882a593Smuzhiyun #define CAST5_PARALLEL_BLOCKS 16
19*4882a593Smuzhiyun 
20*4882a593Smuzhiyun asmlinkage void cast5_ecb_enc_16way(struct cast5_ctx *ctx, u8 *dst,
21*4882a593Smuzhiyun 				    const u8 *src);
22*4882a593Smuzhiyun asmlinkage void cast5_ecb_dec_16way(struct cast5_ctx *ctx, u8 *dst,
23*4882a593Smuzhiyun 				    const u8 *src);
24*4882a593Smuzhiyun asmlinkage void cast5_cbc_dec_16way(struct cast5_ctx *ctx, u8 *dst,
25*4882a593Smuzhiyun 				    const u8 *src);
26*4882a593Smuzhiyun asmlinkage void cast5_ctr_16way(struct cast5_ctx *ctx, u8 *dst, const u8 *src,
27*4882a593Smuzhiyun 				__be64 *iv);
28*4882a593Smuzhiyun 
cast5_setkey_skcipher(struct crypto_skcipher * tfm,const u8 * key,unsigned int keylen)29*4882a593Smuzhiyun static int cast5_setkey_skcipher(struct crypto_skcipher *tfm, const u8 *key,
30*4882a593Smuzhiyun 				 unsigned int keylen)
31*4882a593Smuzhiyun {
32*4882a593Smuzhiyun 	return cast5_setkey(&tfm->base, key, keylen);
33*4882a593Smuzhiyun }
34*4882a593Smuzhiyun 
/*
 * Thin wrapper around glue_fpu_begin() that supplies the CAST5 block size
 * and the 16-block parallel width.  The return value is whatever the helper
 * returns; callers store it back into their own fpu_enabled flag and later
 * pass it to cast5_fpu_end().
 */
static inline bool cast5_fpu_begin(bool fpu_enabled, struct skcipher_walk *walk,
				   unsigned int nbytes)
{
	bool fpu_state;

	fpu_state = glue_fpu_begin(CAST5_BLOCK_SIZE, CAST5_PARALLEL_BLOCKS,
				   walk, fpu_enabled, nbytes);

	return fpu_state;
}
41*4882a593Smuzhiyun 
/*
 * Counterpart of cast5_fpu_begin(): forwards the caller's fpu_enabled flag
 * to glue_fpu_end().
 *
 * The helper is invoked as a plain statement: ISO C does not allow a
 * "return <expression>;" in a function returning void, even when the
 * expression itself has type void.
 */
static inline void cast5_fpu_end(bool fpu_enabled)
{
	glue_fpu_end(fpu_enabled);
}
46*4882a593Smuzhiyun 
/*
 * Common ECB worker for both directions.
 *
 * @req: skcipher request to process
 * @enc: true selects the encrypt routines, false the decrypt routines
 *
 * Walks the request with skcipher_walk_virt().  Within every chunk, groups
 * of CAST5_PARALLEL_BLOCKS blocks go through the 16-way assembler routine
 * and the remaining whole blocks through __cast5_encrypt()/__cast5_decrypt()
 * one block at a time.  Bytes that were not consumed are reported back via
 * skcipher_walk_done().
 *
 * Returns the status of the last skcipher walk call.
 */
static int ecb_crypt(struct skcipher_request *req, bool enc)
{
	const unsigned int bsize = CAST5_BLOCK_SIZE;
	const unsigned int batch = bsize * CAST5_PARALLEL_BLOCKS;
	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
	struct cast5_ctx *ctx = crypto_skcipher_ctx(tfm);
	void (*crypt_batch)(struct cast5_ctx *ctx, u8 *dst, const u8 *src);
	void (*crypt_block)(struct cast5_ctx *ctx, u8 *dst, const u8 *src);
	struct skcipher_walk walk;
	bool fpu_enabled = false;
	unsigned int left;
	int err;

	/* The direction is fixed for the whole request: pick routines once. */
	if (enc) {
		crypt_batch = cast5_ecb_enc_16way;
		crypt_block = __cast5_encrypt;
	} else {
		crypt_batch = cast5_ecb_dec_16way;
		crypt_block = __cast5_decrypt;
	}

	err = skcipher_walk_virt(&walk, req, false);

	for (left = walk.nbytes; left; left = walk.nbytes) {
		u8 *in = walk.src.virt.addr;
		u8 *out = walk.dst.virt.addr;
		bool single_blocks = true;

		fpu_enabled = cast5_fpu_begin(fpu_enabled, &walk, left);

		/* 16 blocks at a time while enough data remains. */
		if (left >= batch) {
			do {
				crypt_batch(ctx, out, in);

				in += batch;
				out += batch;
				left -= batch;
			} while (left >= batch);

			/* Skip the tail loop if no whole block is left. */
			single_blocks = left >= bsize;
		}

		/* Remaining whole blocks, one at a time. */
		if (single_blocks) {
			do {
				crypt_block(ctx, out, in);

				in += bsize;
				out += bsize;
				left -= bsize;
			} while (left >= bsize);
		}

		err = skcipher_walk_done(&walk, left);
	}

	cast5_fpu_end(fpu_enabled);

	return err;
}
99*4882a593Smuzhiyun 
ecb_encrypt(struct skcipher_request * req)100*4882a593Smuzhiyun static int ecb_encrypt(struct skcipher_request *req)
101*4882a593Smuzhiyun {
102*4882a593Smuzhiyun 	return ecb_crypt(req, true);
103*4882a593Smuzhiyun }
104*4882a593Smuzhiyun 
ecb_decrypt(struct skcipher_request * req)105*4882a593Smuzhiyun static int ecb_decrypt(struct skcipher_request *req)
106*4882a593Smuzhiyun {
107*4882a593Smuzhiyun 	return ecb_crypt(req, false);
108*4882a593Smuzhiyun }
109*4882a593Smuzhiyun 
cbc_encrypt(struct skcipher_request * req)110*4882a593Smuzhiyun static int cbc_encrypt(struct skcipher_request *req)
111*4882a593Smuzhiyun {
112*4882a593Smuzhiyun 	const unsigned int bsize = CAST5_BLOCK_SIZE;
113*4882a593Smuzhiyun 	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
114*4882a593Smuzhiyun 	struct cast5_ctx *ctx = crypto_skcipher_ctx(tfm);
115*4882a593Smuzhiyun 	struct skcipher_walk walk;
116*4882a593Smuzhiyun 	unsigned int nbytes;
117*4882a593Smuzhiyun 	int err;
118*4882a593Smuzhiyun 
119*4882a593Smuzhiyun 	err = skcipher_walk_virt(&walk, req, false);
120*4882a593Smuzhiyun 
121*4882a593Smuzhiyun 	while ((nbytes = walk.nbytes)) {
122*4882a593Smuzhiyun 		u64 *src = (u64 *)walk.src.virt.addr;
123*4882a593Smuzhiyun 		u64 *dst = (u64 *)walk.dst.virt.addr;
124*4882a593Smuzhiyun 		u64 *iv = (u64 *)walk.iv;
125*4882a593Smuzhiyun 
126*4882a593Smuzhiyun 		do {
127*4882a593Smuzhiyun 			*dst = *src ^ *iv;
128*4882a593Smuzhiyun 			__cast5_encrypt(ctx, (u8 *)dst, (u8 *)dst);
129*4882a593Smuzhiyun 			iv = dst;
130*4882a593Smuzhiyun 			src++;
131*4882a593Smuzhiyun 			dst++;
132*4882a593Smuzhiyun 			nbytes -= bsize;
133*4882a593Smuzhiyun 		} while (nbytes >= bsize);
134*4882a593Smuzhiyun 
135*4882a593Smuzhiyun 		*(u64 *)walk.iv = *iv;
136*4882a593Smuzhiyun 		err = skcipher_walk_done(&walk, nbytes);
137*4882a593Smuzhiyun 	}
138*4882a593Smuzhiyun 
139*4882a593Smuzhiyun 	return err;
140*4882a593Smuzhiyun }
141*4882a593Smuzhiyun 
__cbc_decrypt(struct cast5_ctx * ctx,struct skcipher_walk * walk)142*4882a593Smuzhiyun static unsigned int __cbc_decrypt(struct cast5_ctx *ctx,
143*4882a593Smuzhiyun 				  struct skcipher_walk *walk)
144*4882a593Smuzhiyun {
145*4882a593Smuzhiyun 	const unsigned int bsize = CAST5_BLOCK_SIZE;
146*4882a593Smuzhiyun 	unsigned int nbytes = walk->nbytes;
147*4882a593Smuzhiyun 	u64 *src = (u64 *)walk->src.virt.addr;
148*4882a593Smuzhiyun 	u64 *dst = (u64 *)walk->dst.virt.addr;
149*4882a593Smuzhiyun 	u64 last_iv;
150*4882a593Smuzhiyun 
151*4882a593Smuzhiyun 	/* Start of the last block. */
152*4882a593Smuzhiyun 	src += nbytes / bsize - 1;
153*4882a593Smuzhiyun 	dst += nbytes / bsize - 1;
154*4882a593Smuzhiyun 
155*4882a593Smuzhiyun 	last_iv = *src;
156*4882a593Smuzhiyun 
157*4882a593Smuzhiyun 	/* Process multi-block batch */
158*4882a593Smuzhiyun 	if (nbytes >= bsize * CAST5_PARALLEL_BLOCKS) {
159*4882a593Smuzhiyun 		do {
160*4882a593Smuzhiyun 			nbytes -= bsize * (CAST5_PARALLEL_BLOCKS - 1);
161*4882a593Smuzhiyun 			src -= CAST5_PARALLEL_BLOCKS - 1;
162*4882a593Smuzhiyun 			dst -= CAST5_PARALLEL_BLOCKS - 1;
163*4882a593Smuzhiyun 
164*4882a593Smuzhiyun 			cast5_cbc_dec_16way(ctx, (u8 *)dst, (u8 *)src);
165*4882a593Smuzhiyun 
166*4882a593Smuzhiyun 			nbytes -= bsize;
167*4882a593Smuzhiyun 			if (nbytes < bsize)
168*4882a593Smuzhiyun 				goto done;
169*4882a593Smuzhiyun 
170*4882a593Smuzhiyun 			*dst ^= *(src - 1);
171*4882a593Smuzhiyun 			src -= 1;
172*4882a593Smuzhiyun 			dst -= 1;
173*4882a593Smuzhiyun 		} while (nbytes >= bsize * CAST5_PARALLEL_BLOCKS);
174*4882a593Smuzhiyun 	}
175*4882a593Smuzhiyun 
176*4882a593Smuzhiyun 	/* Handle leftovers */
177*4882a593Smuzhiyun 	for (;;) {
178*4882a593Smuzhiyun 		__cast5_decrypt(ctx, (u8 *)dst, (u8 *)src);
179*4882a593Smuzhiyun 
180*4882a593Smuzhiyun 		nbytes -= bsize;
181*4882a593Smuzhiyun 		if (nbytes < bsize)
182*4882a593Smuzhiyun 			break;
183*4882a593Smuzhiyun 
184*4882a593Smuzhiyun 		*dst ^= *(src - 1);
185*4882a593Smuzhiyun 		src -= 1;
186*4882a593Smuzhiyun 		dst -= 1;
187*4882a593Smuzhiyun 	}
188*4882a593Smuzhiyun 
189*4882a593Smuzhiyun done:
190*4882a593Smuzhiyun 	*dst ^= *(u64 *)walk->iv;
191*4882a593Smuzhiyun 	*(u64 *)walk->iv = last_iv;
192*4882a593Smuzhiyun 
193*4882a593Smuzhiyun 	return nbytes;
194*4882a593Smuzhiyun }
195*4882a593Smuzhiyun 
cbc_decrypt(struct skcipher_request * req)196*4882a593Smuzhiyun static int cbc_decrypt(struct skcipher_request *req)
197*4882a593Smuzhiyun {
198*4882a593Smuzhiyun 	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
199*4882a593Smuzhiyun 	struct cast5_ctx *ctx = crypto_skcipher_ctx(tfm);
200*4882a593Smuzhiyun 	bool fpu_enabled = false;
201*4882a593Smuzhiyun 	struct skcipher_walk walk;
202*4882a593Smuzhiyun 	unsigned int nbytes;
203*4882a593Smuzhiyun 	int err;
204*4882a593Smuzhiyun 
205*4882a593Smuzhiyun 	err = skcipher_walk_virt(&walk, req, false);
206*4882a593Smuzhiyun 
207*4882a593Smuzhiyun 	while ((nbytes = walk.nbytes)) {
208*4882a593Smuzhiyun 		fpu_enabled = cast5_fpu_begin(fpu_enabled, &walk, nbytes);
209*4882a593Smuzhiyun 		nbytes = __cbc_decrypt(ctx, &walk);
210*4882a593Smuzhiyun 		err = skcipher_walk_done(&walk, nbytes);
211*4882a593Smuzhiyun 	}
212*4882a593Smuzhiyun 
213*4882a593Smuzhiyun 	cast5_fpu_end(fpu_enabled);
214*4882a593Smuzhiyun 	return err;
215*4882a593Smuzhiyun }
216*4882a593Smuzhiyun 
ctr_crypt_final(struct skcipher_walk * walk,struct cast5_ctx * ctx)217*4882a593Smuzhiyun static void ctr_crypt_final(struct skcipher_walk *walk, struct cast5_ctx *ctx)
218*4882a593Smuzhiyun {
219*4882a593Smuzhiyun 	u8 *ctrblk = walk->iv;
220*4882a593Smuzhiyun 	u8 keystream[CAST5_BLOCK_SIZE];
221*4882a593Smuzhiyun 	u8 *src = walk->src.virt.addr;
222*4882a593Smuzhiyun 	u8 *dst = walk->dst.virt.addr;
223*4882a593Smuzhiyun 	unsigned int nbytes = walk->nbytes;
224*4882a593Smuzhiyun 
225*4882a593Smuzhiyun 	__cast5_encrypt(ctx, keystream, ctrblk);
226*4882a593Smuzhiyun 	crypto_xor_cpy(dst, keystream, src, nbytes);
227*4882a593Smuzhiyun 
228*4882a593Smuzhiyun 	crypto_inc(ctrblk, CAST5_BLOCK_SIZE);
229*4882a593Smuzhiyun }
230*4882a593Smuzhiyun 
__ctr_crypt(struct skcipher_walk * walk,struct cast5_ctx * ctx)231*4882a593Smuzhiyun static unsigned int __ctr_crypt(struct skcipher_walk *walk,
232*4882a593Smuzhiyun 				struct cast5_ctx *ctx)
233*4882a593Smuzhiyun {
234*4882a593Smuzhiyun 	const unsigned int bsize = CAST5_BLOCK_SIZE;
235*4882a593Smuzhiyun 	unsigned int nbytes = walk->nbytes;
236*4882a593Smuzhiyun 	u64 *src = (u64 *)walk->src.virt.addr;
237*4882a593Smuzhiyun 	u64 *dst = (u64 *)walk->dst.virt.addr;
238*4882a593Smuzhiyun 
239*4882a593Smuzhiyun 	/* Process multi-block batch */
240*4882a593Smuzhiyun 	if (nbytes >= bsize * CAST5_PARALLEL_BLOCKS) {
241*4882a593Smuzhiyun 		do {
242*4882a593Smuzhiyun 			cast5_ctr_16way(ctx, (u8 *)dst, (u8 *)src,
243*4882a593Smuzhiyun 					(__be64 *)walk->iv);
244*4882a593Smuzhiyun 
245*4882a593Smuzhiyun 			src += CAST5_PARALLEL_BLOCKS;
246*4882a593Smuzhiyun 			dst += CAST5_PARALLEL_BLOCKS;
247*4882a593Smuzhiyun 			nbytes -= bsize * CAST5_PARALLEL_BLOCKS;
248*4882a593Smuzhiyun 		} while (nbytes >= bsize * CAST5_PARALLEL_BLOCKS);
249*4882a593Smuzhiyun 
250*4882a593Smuzhiyun 		if (nbytes < bsize)
251*4882a593Smuzhiyun 			goto done;
252*4882a593Smuzhiyun 	}
253*4882a593Smuzhiyun 
254*4882a593Smuzhiyun 	/* Handle leftovers */
255*4882a593Smuzhiyun 	do {
256*4882a593Smuzhiyun 		u64 ctrblk;
257*4882a593Smuzhiyun 
258*4882a593Smuzhiyun 		if (dst != src)
259*4882a593Smuzhiyun 			*dst = *src;
260*4882a593Smuzhiyun 
261*4882a593Smuzhiyun 		ctrblk = *(u64 *)walk->iv;
262*4882a593Smuzhiyun 		be64_add_cpu((__be64 *)walk->iv, 1);
263*4882a593Smuzhiyun 
264*4882a593Smuzhiyun 		__cast5_encrypt(ctx, (u8 *)&ctrblk, (u8 *)&ctrblk);
265*4882a593Smuzhiyun 		*dst ^= ctrblk;
266*4882a593Smuzhiyun 
267*4882a593Smuzhiyun 		src += 1;
268*4882a593Smuzhiyun 		dst += 1;
269*4882a593Smuzhiyun 		nbytes -= bsize;
270*4882a593Smuzhiyun 	} while (nbytes >= bsize);
271*4882a593Smuzhiyun 
272*4882a593Smuzhiyun done:
273*4882a593Smuzhiyun 	return nbytes;
274*4882a593Smuzhiyun }
275*4882a593Smuzhiyun 
ctr_crypt(struct skcipher_request * req)276*4882a593Smuzhiyun static int ctr_crypt(struct skcipher_request *req)
277*4882a593Smuzhiyun {
278*4882a593Smuzhiyun 	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
279*4882a593Smuzhiyun 	struct cast5_ctx *ctx = crypto_skcipher_ctx(tfm);
280*4882a593Smuzhiyun 	bool fpu_enabled = false;
281*4882a593Smuzhiyun 	struct skcipher_walk walk;
282*4882a593Smuzhiyun 	unsigned int nbytes;
283*4882a593Smuzhiyun 	int err;
284*4882a593Smuzhiyun 
285*4882a593Smuzhiyun 	err = skcipher_walk_virt(&walk, req, false);
286*4882a593Smuzhiyun 
287*4882a593Smuzhiyun 	while ((nbytes = walk.nbytes) >= CAST5_BLOCK_SIZE) {
288*4882a593Smuzhiyun 		fpu_enabled = cast5_fpu_begin(fpu_enabled, &walk, nbytes);
289*4882a593Smuzhiyun 		nbytes = __ctr_crypt(&walk, ctx);
290*4882a593Smuzhiyun 		err = skcipher_walk_done(&walk, nbytes);
291*4882a593Smuzhiyun 	}
292*4882a593Smuzhiyun 
293*4882a593Smuzhiyun 	cast5_fpu_end(fpu_enabled);
294*4882a593Smuzhiyun 
295*4882a593Smuzhiyun 	if (walk.nbytes) {
296*4882a593Smuzhiyun 		ctr_crypt_final(&walk, ctx);
297*4882a593Smuzhiyun 		err = skcipher_walk_done(&walk, 0);
298*4882a593Smuzhiyun 	}
299*4882a593Smuzhiyun 
300*4882a593Smuzhiyun 	return err;
301*4882a593Smuzhiyun }
302*4882a593Smuzhiyun 
303*4882a593Smuzhiyun static struct skcipher_alg cast5_algs[] = {
304*4882a593Smuzhiyun 	{
305*4882a593Smuzhiyun 		.base.cra_name		= "__ecb(cast5)",
306*4882a593Smuzhiyun 		.base.cra_driver_name	= "__ecb-cast5-avx",
307*4882a593Smuzhiyun 		.base.cra_priority	= 200,
308*4882a593Smuzhiyun 		.base.cra_flags		= CRYPTO_ALG_INTERNAL,
309*4882a593Smuzhiyun 		.base.cra_blocksize	= CAST5_BLOCK_SIZE,
310*4882a593Smuzhiyun 		.base.cra_ctxsize	= sizeof(struct cast5_ctx),
311*4882a593Smuzhiyun 		.base.cra_module	= THIS_MODULE,
312*4882a593Smuzhiyun 		.min_keysize		= CAST5_MIN_KEY_SIZE,
313*4882a593Smuzhiyun 		.max_keysize		= CAST5_MAX_KEY_SIZE,
314*4882a593Smuzhiyun 		.setkey			= cast5_setkey_skcipher,
315*4882a593Smuzhiyun 		.encrypt		= ecb_encrypt,
316*4882a593Smuzhiyun 		.decrypt		= ecb_decrypt,
317*4882a593Smuzhiyun 	}, {
318*4882a593Smuzhiyun 		.base.cra_name		= "__cbc(cast5)",
319*4882a593Smuzhiyun 		.base.cra_driver_name	= "__cbc-cast5-avx",
320*4882a593Smuzhiyun 		.base.cra_priority	= 200,
321*4882a593Smuzhiyun 		.base.cra_flags		= CRYPTO_ALG_INTERNAL,
322*4882a593Smuzhiyun 		.base.cra_blocksize	= CAST5_BLOCK_SIZE,
323*4882a593Smuzhiyun 		.base.cra_ctxsize	= sizeof(struct cast5_ctx),
324*4882a593Smuzhiyun 		.base.cra_module	= THIS_MODULE,
325*4882a593Smuzhiyun 		.min_keysize		= CAST5_MIN_KEY_SIZE,
326*4882a593Smuzhiyun 		.max_keysize		= CAST5_MAX_KEY_SIZE,
327*4882a593Smuzhiyun 		.ivsize			= CAST5_BLOCK_SIZE,
328*4882a593Smuzhiyun 		.setkey			= cast5_setkey_skcipher,
329*4882a593Smuzhiyun 		.encrypt		= cbc_encrypt,
330*4882a593Smuzhiyun 		.decrypt		= cbc_decrypt,
331*4882a593Smuzhiyun 	}, {
332*4882a593Smuzhiyun 		.base.cra_name		= "__ctr(cast5)",
333*4882a593Smuzhiyun 		.base.cra_driver_name	= "__ctr-cast5-avx",
334*4882a593Smuzhiyun 		.base.cra_priority	= 200,
335*4882a593Smuzhiyun 		.base.cra_flags		= CRYPTO_ALG_INTERNAL,
336*4882a593Smuzhiyun 		.base.cra_blocksize	= 1,
337*4882a593Smuzhiyun 		.base.cra_ctxsize	= sizeof(struct cast5_ctx),
338*4882a593Smuzhiyun 		.base.cra_module	= THIS_MODULE,
339*4882a593Smuzhiyun 		.min_keysize		= CAST5_MIN_KEY_SIZE,
340*4882a593Smuzhiyun 		.max_keysize		= CAST5_MAX_KEY_SIZE,
341*4882a593Smuzhiyun 		.ivsize			= CAST5_BLOCK_SIZE,
342*4882a593Smuzhiyun 		.chunksize		= CAST5_BLOCK_SIZE,
343*4882a593Smuzhiyun 		.setkey			= cast5_setkey_skcipher,
344*4882a593Smuzhiyun 		.encrypt		= ctr_crypt,
345*4882a593Smuzhiyun 		.decrypt		= ctr_crypt,
346*4882a593Smuzhiyun 	}
347*4882a593Smuzhiyun };
348*4882a593Smuzhiyun 
349*4882a593Smuzhiyun static struct simd_skcipher_alg *cast5_simd_algs[ARRAY_SIZE(cast5_algs)];
350*4882a593Smuzhiyun 
cast5_init(void)351*4882a593Smuzhiyun static int __init cast5_init(void)
352*4882a593Smuzhiyun {
353*4882a593Smuzhiyun 	const char *feature_name;
354*4882a593Smuzhiyun 
355*4882a593Smuzhiyun 	if (!cpu_has_xfeatures(XFEATURE_MASK_SSE | XFEATURE_MASK_YMM,
356*4882a593Smuzhiyun 				&feature_name)) {
357*4882a593Smuzhiyun 		pr_info("CPU feature '%s' is not supported.\n", feature_name);
358*4882a593Smuzhiyun 		return -ENODEV;
359*4882a593Smuzhiyun 	}
360*4882a593Smuzhiyun 
361*4882a593Smuzhiyun 	return simd_register_skciphers_compat(cast5_algs,
362*4882a593Smuzhiyun 					      ARRAY_SIZE(cast5_algs),
363*4882a593Smuzhiyun 					      cast5_simd_algs);
364*4882a593Smuzhiyun }
365*4882a593Smuzhiyun 
cast5_exit(void)366*4882a593Smuzhiyun static void __exit cast5_exit(void)
367*4882a593Smuzhiyun {
368*4882a593Smuzhiyun 	simd_unregister_skciphers(cast5_algs, ARRAY_SIZE(cast5_algs),
369*4882a593Smuzhiyun 				  cast5_simd_algs);
370*4882a593Smuzhiyun }
371*4882a593Smuzhiyun 
372*4882a593Smuzhiyun module_init(cast5_init);
373*4882a593Smuzhiyun module_exit(cast5_exit);
374*4882a593Smuzhiyun 
375*4882a593Smuzhiyun MODULE_DESCRIPTION("Cast5 Cipher Algorithm, AVX optimized");
376*4882a593Smuzhiyun MODULE_LICENSE("GPL");
377*4882a593Smuzhiyun MODULE_ALIAS_CRYPTO("cast5");
378