xref: /OK3568_Linux_fs/kernel/arch/x86/crypto/camellia_aesni_avx_glue.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
// SPDX-License-Identifier: GPL-2.0-or-later
/*
 * Glue Code for x86_64/AVX/AES-NI assembler optimized version of Camellia
 *
 * Copyright © 2012-2013 Jussi Kivilinna <jussi.kivilinna@iki.fi>
 */
7*4882a593Smuzhiyun 
8*4882a593Smuzhiyun #include <asm/crypto/camellia.h>
9*4882a593Smuzhiyun #include <asm/crypto/glue_helper.h>
10*4882a593Smuzhiyun #include <crypto/algapi.h>
11*4882a593Smuzhiyun #include <crypto/internal/simd.h>
12*4882a593Smuzhiyun #include <crypto/xts.h>
13*4882a593Smuzhiyun #include <linux/crypto.h>
14*4882a593Smuzhiyun #include <linux/err.h>
15*4882a593Smuzhiyun #include <linux/module.h>
16*4882a593Smuzhiyun #include <linux/types.h>
17*4882a593Smuzhiyun 
18*4882a593Smuzhiyun #define CAMELLIA_AESNI_PARALLEL_BLOCKS 16
19*4882a593Smuzhiyun 
20*4882a593Smuzhiyun /* 16-way parallel cipher functions (avx/aes-ni) */
21*4882a593Smuzhiyun asmlinkage void camellia_ecb_enc_16way(const void *ctx, u8 *dst, const u8 *src);
22*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(camellia_ecb_enc_16way);
23*4882a593Smuzhiyun 
24*4882a593Smuzhiyun asmlinkage void camellia_ecb_dec_16way(const void *ctx, u8 *dst, const u8 *src);
25*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(camellia_ecb_dec_16way);
26*4882a593Smuzhiyun 
27*4882a593Smuzhiyun asmlinkage void camellia_cbc_dec_16way(const void *ctx, u8 *dst, const u8 *src);
28*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(camellia_cbc_dec_16way);
29*4882a593Smuzhiyun 
30*4882a593Smuzhiyun asmlinkage void camellia_ctr_16way(const void *ctx, u8 *dst, const u8 *src,
31*4882a593Smuzhiyun 				   le128 *iv);
32*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(camellia_ctr_16way);
33*4882a593Smuzhiyun 
34*4882a593Smuzhiyun asmlinkage void camellia_xts_enc_16way(const void *ctx, u8 *dst, const u8 *src,
35*4882a593Smuzhiyun 				       le128 *iv);
36*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(camellia_xts_enc_16way);
37*4882a593Smuzhiyun 
38*4882a593Smuzhiyun asmlinkage void camellia_xts_dec_16way(const void *ctx, u8 *dst, const u8 *src,
39*4882a593Smuzhiyun 				       le128 *iv);
40*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(camellia_xts_dec_16way);
41*4882a593Smuzhiyun 
/*
 * camellia_xts_enc - XTS encryption entry for the single-block case.
 * @ctx: cipher context, forwarded untouched
 * @dst: output buffer
 * @src: input buffer
 * @iv:  128-bit tweak value, forwarded to the glue helper
 *
 * Delegates to glue_xts_crypt_128bit_one() with camellia_enc_blk as the
 * block function.  Used as the num_blocks == 1 entry of camellia_enc_xts.
 */
void camellia_xts_enc(const void *ctx, u8 *dst, const u8 *src, le128 *iv)
{
	glue_xts_crypt_128bit_one(ctx, dst, src, iv, camellia_enc_blk);
}
EXPORT_SYMBOL_GPL(camellia_xts_enc);
47*4882a593Smuzhiyun 
/*
 * camellia_xts_dec - XTS decryption entry for the single-block case.
 * @ctx: cipher context, forwarded untouched
 * @dst: output buffer
 * @src: input buffer
 * @iv:  128-bit tweak value, forwarded to the glue helper
 *
 * Delegates to glue_xts_crypt_128bit_one() with camellia_dec_blk as the
 * block function.  Used as the num_blocks == 1 entry of camellia_dec_xts.
 */
void camellia_xts_dec(const void *ctx, u8 *dst, const u8 *src, le128 *iv)
{
	glue_xts_crypt_128bit_one(ctx, dst, src, iv, camellia_dec_blk);
}
EXPORT_SYMBOL_GPL(camellia_xts_dec);
53*4882a593Smuzhiyun 
54*4882a593Smuzhiyun static const struct common_glue_ctx camellia_enc = {
55*4882a593Smuzhiyun 	.num_funcs = 3,
56*4882a593Smuzhiyun 	.fpu_blocks_limit = CAMELLIA_AESNI_PARALLEL_BLOCKS,
57*4882a593Smuzhiyun 
58*4882a593Smuzhiyun 	.funcs = { {
59*4882a593Smuzhiyun 		.num_blocks = CAMELLIA_AESNI_PARALLEL_BLOCKS,
60*4882a593Smuzhiyun 		.fn_u = { .ecb = camellia_ecb_enc_16way }
61*4882a593Smuzhiyun 	}, {
62*4882a593Smuzhiyun 		.num_blocks = 2,
63*4882a593Smuzhiyun 		.fn_u = { .ecb = camellia_enc_blk_2way }
64*4882a593Smuzhiyun 	}, {
65*4882a593Smuzhiyun 		.num_blocks = 1,
66*4882a593Smuzhiyun 		.fn_u = { .ecb = camellia_enc_blk }
67*4882a593Smuzhiyun 	} }
68*4882a593Smuzhiyun };
69*4882a593Smuzhiyun 
70*4882a593Smuzhiyun static const struct common_glue_ctx camellia_ctr = {
71*4882a593Smuzhiyun 	.num_funcs = 3,
72*4882a593Smuzhiyun 	.fpu_blocks_limit = CAMELLIA_AESNI_PARALLEL_BLOCKS,
73*4882a593Smuzhiyun 
74*4882a593Smuzhiyun 	.funcs = { {
75*4882a593Smuzhiyun 		.num_blocks = CAMELLIA_AESNI_PARALLEL_BLOCKS,
76*4882a593Smuzhiyun 		.fn_u = { .ctr = camellia_ctr_16way }
77*4882a593Smuzhiyun 	}, {
78*4882a593Smuzhiyun 		.num_blocks = 2,
79*4882a593Smuzhiyun 		.fn_u = { .ctr = camellia_crypt_ctr_2way }
80*4882a593Smuzhiyun 	}, {
81*4882a593Smuzhiyun 		.num_blocks = 1,
82*4882a593Smuzhiyun 		.fn_u = { .ctr = camellia_crypt_ctr }
83*4882a593Smuzhiyun 	} }
84*4882a593Smuzhiyun };
85*4882a593Smuzhiyun 
86*4882a593Smuzhiyun static const struct common_glue_ctx camellia_enc_xts = {
87*4882a593Smuzhiyun 	.num_funcs = 2,
88*4882a593Smuzhiyun 	.fpu_blocks_limit = CAMELLIA_AESNI_PARALLEL_BLOCKS,
89*4882a593Smuzhiyun 
90*4882a593Smuzhiyun 	.funcs = { {
91*4882a593Smuzhiyun 		.num_blocks = CAMELLIA_AESNI_PARALLEL_BLOCKS,
92*4882a593Smuzhiyun 		.fn_u = { .xts = camellia_xts_enc_16way }
93*4882a593Smuzhiyun 	}, {
94*4882a593Smuzhiyun 		.num_blocks = 1,
95*4882a593Smuzhiyun 		.fn_u = { .xts = camellia_xts_enc }
96*4882a593Smuzhiyun 	} }
97*4882a593Smuzhiyun };
98*4882a593Smuzhiyun 
99*4882a593Smuzhiyun static const struct common_glue_ctx camellia_dec = {
100*4882a593Smuzhiyun 	.num_funcs = 3,
101*4882a593Smuzhiyun 	.fpu_blocks_limit = CAMELLIA_AESNI_PARALLEL_BLOCKS,
102*4882a593Smuzhiyun 
103*4882a593Smuzhiyun 	.funcs = { {
104*4882a593Smuzhiyun 		.num_blocks = CAMELLIA_AESNI_PARALLEL_BLOCKS,
105*4882a593Smuzhiyun 		.fn_u = { .ecb = camellia_ecb_dec_16way }
106*4882a593Smuzhiyun 	}, {
107*4882a593Smuzhiyun 		.num_blocks = 2,
108*4882a593Smuzhiyun 		.fn_u = { .ecb = camellia_dec_blk_2way }
109*4882a593Smuzhiyun 	}, {
110*4882a593Smuzhiyun 		.num_blocks = 1,
111*4882a593Smuzhiyun 		.fn_u = { .ecb = camellia_dec_blk }
112*4882a593Smuzhiyun 	} }
113*4882a593Smuzhiyun };
114*4882a593Smuzhiyun 
115*4882a593Smuzhiyun static const struct common_glue_ctx camellia_dec_cbc = {
116*4882a593Smuzhiyun 	.num_funcs = 3,
117*4882a593Smuzhiyun 	.fpu_blocks_limit = CAMELLIA_AESNI_PARALLEL_BLOCKS,
118*4882a593Smuzhiyun 
119*4882a593Smuzhiyun 	.funcs = { {
120*4882a593Smuzhiyun 		.num_blocks = CAMELLIA_AESNI_PARALLEL_BLOCKS,
121*4882a593Smuzhiyun 		.fn_u = { .cbc = camellia_cbc_dec_16way }
122*4882a593Smuzhiyun 	}, {
123*4882a593Smuzhiyun 		.num_blocks = 2,
124*4882a593Smuzhiyun 		.fn_u = { .cbc = camellia_decrypt_cbc_2way }
125*4882a593Smuzhiyun 	}, {
126*4882a593Smuzhiyun 		.num_blocks = 1,
127*4882a593Smuzhiyun 		.fn_u = { .cbc = camellia_dec_blk }
128*4882a593Smuzhiyun 	} }
129*4882a593Smuzhiyun };
130*4882a593Smuzhiyun 
131*4882a593Smuzhiyun static const struct common_glue_ctx camellia_dec_xts = {
132*4882a593Smuzhiyun 	.num_funcs = 2,
133*4882a593Smuzhiyun 	.fpu_blocks_limit = CAMELLIA_AESNI_PARALLEL_BLOCKS,
134*4882a593Smuzhiyun 
135*4882a593Smuzhiyun 	.funcs = { {
136*4882a593Smuzhiyun 		.num_blocks = CAMELLIA_AESNI_PARALLEL_BLOCKS,
137*4882a593Smuzhiyun 		.fn_u = { .xts = camellia_xts_dec_16way }
138*4882a593Smuzhiyun 	}, {
139*4882a593Smuzhiyun 		.num_blocks = 1,
140*4882a593Smuzhiyun 		.fn_u = { .xts = camellia_xts_dec }
141*4882a593Smuzhiyun 	} }
142*4882a593Smuzhiyun };
143*4882a593Smuzhiyun 
/*
 * camellia_setkey - .setkey handler for the ECB, CBC and CTR algorithms.
 * @tfm:    transform whose private context receives the key
 * @key:    raw key bytes
 * @keylen: length of @key in bytes
 *
 * Return: whatever __camellia_setkey() returns for the transform context.
 */
static int camellia_setkey(struct crypto_skcipher *tfm, const u8 *key,
			   unsigned int keylen)
{
	return __camellia_setkey(crypto_skcipher_ctx(tfm), key, keylen);
}
149*4882a593Smuzhiyun 
ecb_encrypt(struct skcipher_request * req)150*4882a593Smuzhiyun static int ecb_encrypt(struct skcipher_request *req)
151*4882a593Smuzhiyun {
152*4882a593Smuzhiyun 	return glue_ecb_req_128bit(&camellia_enc, req);
153*4882a593Smuzhiyun }
154*4882a593Smuzhiyun 
ecb_decrypt(struct skcipher_request * req)155*4882a593Smuzhiyun static int ecb_decrypt(struct skcipher_request *req)
156*4882a593Smuzhiyun {
157*4882a593Smuzhiyun 	return glue_ecb_req_128bit(&camellia_dec, req);
158*4882a593Smuzhiyun }
159*4882a593Smuzhiyun 
cbc_encrypt(struct skcipher_request * req)160*4882a593Smuzhiyun static int cbc_encrypt(struct skcipher_request *req)
161*4882a593Smuzhiyun {
162*4882a593Smuzhiyun 	return glue_cbc_encrypt_req_128bit(camellia_enc_blk, req);
163*4882a593Smuzhiyun }
164*4882a593Smuzhiyun 
cbc_decrypt(struct skcipher_request * req)165*4882a593Smuzhiyun static int cbc_decrypt(struct skcipher_request *req)
166*4882a593Smuzhiyun {
167*4882a593Smuzhiyun 	return glue_cbc_decrypt_req_128bit(&camellia_dec_cbc, req);
168*4882a593Smuzhiyun }
169*4882a593Smuzhiyun 
ctr_crypt(struct skcipher_request * req)170*4882a593Smuzhiyun static int ctr_crypt(struct skcipher_request *req)
171*4882a593Smuzhiyun {
172*4882a593Smuzhiyun 	return glue_ctr_req_128bit(&camellia_ctr, req);
173*4882a593Smuzhiyun }
174*4882a593Smuzhiyun 
xts_camellia_setkey(struct crypto_skcipher * tfm,const u8 * key,unsigned int keylen)175*4882a593Smuzhiyun int xts_camellia_setkey(struct crypto_skcipher *tfm, const u8 *key,
176*4882a593Smuzhiyun 			unsigned int keylen)
177*4882a593Smuzhiyun {
178*4882a593Smuzhiyun 	struct camellia_xts_ctx *ctx = crypto_skcipher_ctx(tfm);
179*4882a593Smuzhiyun 	int err;
180*4882a593Smuzhiyun 
181*4882a593Smuzhiyun 	err = xts_verify_key(tfm, key, keylen);
182*4882a593Smuzhiyun 	if (err)
183*4882a593Smuzhiyun 		return err;
184*4882a593Smuzhiyun 
185*4882a593Smuzhiyun 	/* first half of xts-key is for crypt */
186*4882a593Smuzhiyun 	err = __camellia_setkey(&ctx->crypt_ctx, key, keylen / 2);
187*4882a593Smuzhiyun 	if (err)
188*4882a593Smuzhiyun 		return err;
189*4882a593Smuzhiyun 
190*4882a593Smuzhiyun 	/* second half of xts-key is for tweak */
191*4882a593Smuzhiyun 	return __camellia_setkey(&ctx->tweak_ctx, key + keylen / 2, keylen / 2);
192*4882a593Smuzhiyun }
193*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(xts_camellia_setkey);
194*4882a593Smuzhiyun 
xts_encrypt(struct skcipher_request * req)195*4882a593Smuzhiyun static int xts_encrypt(struct skcipher_request *req)
196*4882a593Smuzhiyun {
197*4882a593Smuzhiyun 	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
198*4882a593Smuzhiyun 	struct camellia_xts_ctx *ctx = crypto_skcipher_ctx(tfm);
199*4882a593Smuzhiyun 
200*4882a593Smuzhiyun 	return glue_xts_req_128bit(&camellia_enc_xts, req, camellia_enc_blk,
201*4882a593Smuzhiyun 				   &ctx->tweak_ctx, &ctx->crypt_ctx, false);
202*4882a593Smuzhiyun }
203*4882a593Smuzhiyun 
xts_decrypt(struct skcipher_request * req)204*4882a593Smuzhiyun static int xts_decrypt(struct skcipher_request *req)
205*4882a593Smuzhiyun {
206*4882a593Smuzhiyun 	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
207*4882a593Smuzhiyun 	struct camellia_xts_ctx *ctx = crypto_skcipher_ctx(tfm);
208*4882a593Smuzhiyun 
209*4882a593Smuzhiyun 	return glue_xts_req_128bit(&camellia_dec_xts, req, camellia_enc_blk,
210*4882a593Smuzhiyun 				   &ctx->tweak_ctx, &ctx->crypt_ctx, true);
211*4882a593Smuzhiyun }
212*4882a593Smuzhiyun 
213*4882a593Smuzhiyun static struct skcipher_alg camellia_algs[] = {
214*4882a593Smuzhiyun 	{
215*4882a593Smuzhiyun 		.base.cra_name		= "__ecb(camellia)",
216*4882a593Smuzhiyun 		.base.cra_driver_name	= "__ecb-camellia-aesni",
217*4882a593Smuzhiyun 		.base.cra_priority	= 400,
218*4882a593Smuzhiyun 		.base.cra_flags		= CRYPTO_ALG_INTERNAL,
219*4882a593Smuzhiyun 		.base.cra_blocksize	= CAMELLIA_BLOCK_SIZE,
220*4882a593Smuzhiyun 		.base.cra_ctxsize	= sizeof(struct camellia_ctx),
221*4882a593Smuzhiyun 		.base.cra_module	= THIS_MODULE,
222*4882a593Smuzhiyun 		.min_keysize		= CAMELLIA_MIN_KEY_SIZE,
223*4882a593Smuzhiyun 		.max_keysize		= CAMELLIA_MAX_KEY_SIZE,
224*4882a593Smuzhiyun 		.setkey			= camellia_setkey,
225*4882a593Smuzhiyun 		.encrypt		= ecb_encrypt,
226*4882a593Smuzhiyun 		.decrypt		= ecb_decrypt,
227*4882a593Smuzhiyun 	}, {
228*4882a593Smuzhiyun 		.base.cra_name		= "__cbc(camellia)",
229*4882a593Smuzhiyun 		.base.cra_driver_name	= "__cbc-camellia-aesni",
230*4882a593Smuzhiyun 		.base.cra_priority	= 400,
231*4882a593Smuzhiyun 		.base.cra_flags		= CRYPTO_ALG_INTERNAL,
232*4882a593Smuzhiyun 		.base.cra_blocksize	= CAMELLIA_BLOCK_SIZE,
233*4882a593Smuzhiyun 		.base.cra_ctxsize	= sizeof(struct camellia_ctx),
234*4882a593Smuzhiyun 		.base.cra_module	= THIS_MODULE,
235*4882a593Smuzhiyun 		.min_keysize		= CAMELLIA_MIN_KEY_SIZE,
236*4882a593Smuzhiyun 		.max_keysize		= CAMELLIA_MAX_KEY_SIZE,
237*4882a593Smuzhiyun 		.ivsize			= CAMELLIA_BLOCK_SIZE,
238*4882a593Smuzhiyun 		.setkey			= camellia_setkey,
239*4882a593Smuzhiyun 		.encrypt		= cbc_encrypt,
240*4882a593Smuzhiyun 		.decrypt		= cbc_decrypt,
241*4882a593Smuzhiyun 	}, {
242*4882a593Smuzhiyun 		.base.cra_name		= "__ctr(camellia)",
243*4882a593Smuzhiyun 		.base.cra_driver_name	= "__ctr-camellia-aesni",
244*4882a593Smuzhiyun 		.base.cra_priority	= 400,
245*4882a593Smuzhiyun 		.base.cra_flags		= CRYPTO_ALG_INTERNAL,
246*4882a593Smuzhiyun 		.base.cra_blocksize	= 1,
247*4882a593Smuzhiyun 		.base.cra_ctxsize	= sizeof(struct camellia_ctx),
248*4882a593Smuzhiyun 		.base.cra_module	= THIS_MODULE,
249*4882a593Smuzhiyun 		.min_keysize		= CAMELLIA_MIN_KEY_SIZE,
250*4882a593Smuzhiyun 		.max_keysize		= CAMELLIA_MAX_KEY_SIZE,
251*4882a593Smuzhiyun 		.ivsize			= CAMELLIA_BLOCK_SIZE,
252*4882a593Smuzhiyun 		.chunksize		= CAMELLIA_BLOCK_SIZE,
253*4882a593Smuzhiyun 		.setkey			= camellia_setkey,
254*4882a593Smuzhiyun 		.encrypt		= ctr_crypt,
255*4882a593Smuzhiyun 		.decrypt		= ctr_crypt,
256*4882a593Smuzhiyun 	}, {
257*4882a593Smuzhiyun 		.base.cra_name		= "__xts(camellia)",
258*4882a593Smuzhiyun 		.base.cra_driver_name	= "__xts-camellia-aesni",
259*4882a593Smuzhiyun 		.base.cra_priority	= 400,
260*4882a593Smuzhiyun 		.base.cra_flags		= CRYPTO_ALG_INTERNAL,
261*4882a593Smuzhiyun 		.base.cra_blocksize	= CAMELLIA_BLOCK_SIZE,
262*4882a593Smuzhiyun 		.base.cra_ctxsize	= sizeof(struct camellia_xts_ctx),
263*4882a593Smuzhiyun 		.base.cra_module	= THIS_MODULE,
264*4882a593Smuzhiyun 		.min_keysize		= 2 * CAMELLIA_MIN_KEY_SIZE,
265*4882a593Smuzhiyun 		.max_keysize		= 2 * CAMELLIA_MAX_KEY_SIZE,
266*4882a593Smuzhiyun 		.ivsize			= CAMELLIA_BLOCK_SIZE,
267*4882a593Smuzhiyun 		.setkey			= xts_camellia_setkey,
268*4882a593Smuzhiyun 		.encrypt		= xts_encrypt,
269*4882a593Smuzhiyun 		.decrypt		= xts_decrypt,
270*4882a593Smuzhiyun 	},
271*4882a593Smuzhiyun };
272*4882a593Smuzhiyun 
273*4882a593Smuzhiyun static struct simd_skcipher_alg *camellia_simd_algs[ARRAY_SIZE(camellia_algs)];
274*4882a593Smuzhiyun 
camellia_aesni_init(void)275*4882a593Smuzhiyun static int __init camellia_aesni_init(void)
276*4882a593Smuzhiyun {
277*4882a593Smuzhiyun 	const char *feature_name;
278*4882a593Smuzhiyun 
279*4882a593Smuzhiyun 	if (!boot_cpu_has(X86_FEATURE_AVX) ||
280*4882a593Smuzhiyun 	    !boot_cpu_has(X86_FEATURE_AES) ||
281*4882a593Smuzhiyun 	    !boot_cpu_has(X86_FEATURE_OSXSAVE)) {
282*4882a593Smuzhiyun 		pr_info("AVX or AES-NI instructions are not detected.\n");
283*4882a593Smuzhiyun 		return -ENODEV;
284*4882a593Smuzhiyun 	}
285*4882a593Smuzhiyun 
286*4882a593Smuzhiyun 	if (!cpu_has_xfeatures(XFEATURE_MASK_SSE | XFEATURE_MASK_YMM,
287*4882a593Smuzhiyun 				&feature_name)) {
288*4882a593Smuzhiyun 		pr_info("CPU feature '%s' is not supported.\n", feature_name);
289*4882a593Smuzhiyun 		return -ENODEV;
290*4882a593Smuzhiyun 	}
291*4882a593Smuzhiyun 
292*4882a593Smuzhiyun 	return simd_register_skciphers_compat(camellia_algs,
293*4882a593Smuzhiyun 					      ARRAY_SIZE(camellia_algs),
294*4882a593Smuzhiyun 					      camellia_simd_algs);
295*4882a593Smuzhiyun }
296*4882a593Smuzhiyun 
camellia_aesni_fini(void)297*4882a593Smuzhiyun static void __exit camellia_aesni_fini(void)
298*4882a593Smuzhiyun {
299*4882a593Smuzhiyun 	simd_unregister_skciphers(camellia_algs, ARRAY_SIZE(camellia_algs),
300*4882a593Smuzhiyun 				  camellia_simd_algs);
301*4882a593Smuzhiyun }
302*4882a593Smuzhiyun 
303*4882a593Smuzhiyun module_init(camellia_aesni_init);
304*4882a593Smuzhiyun module_exit(camellia_aesni_fini);
305*4882a593Smuzhiyun 
306*4882a593Smuzhiyun MODULE_LICENSE("GPL");
307*4882a593Smuzhiyun MODULE_DESCRIPTION("Camellia Cipher Algorithm, AES-NI/AVX optimized");
308*4882a593Smuzhiyun MODULE_ALIAS_CRYPTO("camellia");
309*4882a593Smuzhiyun MODULE_ALIAS_CRYPTO("camellia-asm");
310