xref: /OK3568_Linux_fs/kernel/arch/x86/crypto/serpent_sse2_glue.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-or-later
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun  * Glue Code for SSE2 assembler versions of Serpent Cipher
4*4882a593Smuzhiyun  *
5*4882a593Smuzhiyun  * Copyright (c) 2011 Jussi Kivilinna <jussi.kivilinna@mbnet.fi>
6*4882a593Smuzhiyun  *
7*4882a593Smuzhiyun  * Glue code based on aesni-intel_glue.c by:
8*4882a593Smuzhiyun  *  Copyright (C) 2008, Intel Corp.
9*4882a593Smuzhiyun  *    Author: Huang Ying <ying.huang@intel.com>
10*4882a593Smuzhiyun  *
11*4882a593Smuzhiyun  * CBC & ECB parts based on code (crypto/cbc.c,ecb.c) by:
12*4882a593Smuzhiyun  *   Copyright (c) 2006 Herbert Xu <herbert@gondor.apana.org.au>
13*4882a593Smuzhiyun  * CTR part based on code (crypto/ctr.c) by:
14*4882a593Smuzhiyun  *   (C) Copyright IBM Corp. 2007 - Joy Latten <latten@us.ibm.com>
15*4882a593Smuzhiyun  */
16*4882a593Smuzhiyun 
17*4882a593Smuzhiyun #include <linux/module.h>
18*4882a593Smuzhiyun #include <linux/types.h>
19*4882a593Smuzhiyun #include <linux/crypto.h>
20*4882a593Smuzhiyun #include <linux/err.h>
21*4882a593Smuzhiyun #include <crypto/algapi.h>
22*4882a593Smuzhiyun #include <crypto/b128ops.h>
23*4882a593Smuzhiyun #include <crypto/internal/simd.h>
24*4882a593Smuzhiyun #include <crypto/serpent.h>
25*4882a593Smuzhiyun #include <asm/crypto/serpent-sse2.h>
26*4882a593Smuzhiyun #include <asm/crypto/glue_helper.h>
27*4882a593Smuzhiyun 
/*
 * skcipher ->setkey hook shared by all algorithms in serpent_algs[].
 *
 * Hands the raw key to __serpent_setkey() together with the context area of
 * @tfm and returns that function's result unchanged.
 */
static int serpent_setkey_skcipher(struct crypto_skcipher *tfm,
				   const u8 *key, unsigned int keylen)
{
	struct serpent_ctx *sctx = crypto_skcipher_ctx(tfm);

	return __serpent_setkey(sctx, key, keylen);
}
33*4882a593Smuzhiyun 
/*
 * CBC helper for a group of SERPENT_PARALLEL_BLOCKS blocks.
 *
 * The first SERPENT_PARALLEL_BLOCKS - 1 input blocks are copied aside before
 * serpent_dec_blk_xway() runs, then XORed into output blocks 1..N-1 so that
 * each of those blocks is chained with the input block preceding it.
 * Output block 0 is not XORed here.
 *
 * NOTE(review): the copy is presumably needed because @d and @s may refer to
 * the same buffer, and block 0 is presumably chained with the IV by the
 * caller -- confirm against the glue helper.
 */
static void serpent_decrypt_cbc_xway(const void *ctx, u8 *d, const u8 *s)
{
	const unsigned int nr_saved = SERPENT_PARALLEL_BLOCKS - 1;
	u128 saved[SERPENT_PARALLEL_BLOCKS - 1];
	const u128 *in = (const u128 *)s;
	u128 *out = (u128 *)d;
	unsigned int i;

	/* Must happen before the decryption call below. */
	for (i = 0; i < nr_saved; i++)
		saved[i] = in[i];

	serpent_dec_blk_xway(ctx, (u8 *)out, (u8 *)in);

	for (i = 1; i <= nr_saved; i++)
		u128_xor(&out[i], &out[i], &saved[i - 1]);
}
49*4882a593Smuzhiyun 
/*
 * CTR mode, single block.
 *
 * Converts the current counter @iv to a be128 block, advances @iv by one,
 * encrypts the converted block in place with __serpent_encrypt() and writes
 * the XOR of the source block and that encrypted block to the destination.
 */
static void serpent_crypt_ctr(const void *ctx, u8 *d, const u8 *s, le128 *iv)
{
	const u128 *in = (const u128 *)s;
	u128 *out = (u128 *)d;
	be128 keystream;

	le128_to_be128(&keystream, iv);
	le128_inc(iv);

	__serpent_encrypt(ctx, (u8 *)&keystream, (u8 *)&keystream);
	u128_xor(out, in, (u128 *)&keystream);
}
62*4882a593Smuzhiyun 
/*
 * CTR mode for a group of SERPENT_PARALLEL_BLOCKS blocks.
 *
 * For every block the source is first copied to the destination (skipped when
 * both pointers are equal), the current counter @iv is stored as a be128
 * block and @iv is advanced by one. The destination and the prepared counter
 * blocks are then passed to serpent_enc_blk_xway_xor().
 *
 * NOTE(review): serpent_enc_blk_xway_xor() presumably encrypts the counter
 * blocks and XORs the result into the destination -- confirm in the
 * assembler implementation.
 */
static void serpent_crypt_ctr_xway(const void *ctx, u8 *d, const u8 *s,
				   le128 *iv)
{
	be128 counters[SERPENT_PARALLEL_BLOCKS];
	const u128 *in = (const u128 *)s;
	u128 *out = (u128 *)d;
	unsigned int n = 0;

	while (n < SERPENT_PARALLEL_BLOCKS) {
		if (out != in)
			out[n] = in[n];

		le128_to_be128(&counters[n], iv);
		le128_inc(iv);
		n++;
	}

	serpent_enc_blk_xway_xor(ctx, (u8 *)out, (u8 *)counters);
}
81*4882a593Smuzhiyun 
82*4882a593Smuzhiyun static const struct common_glue_ctx serpent_enc = {
83*4882a593Smuzhiyun 	.num_funcs = 2,
84*4882a593Smuzhiyun 	.fpu_blocks_limit = SERPENT_PARALLEL_BLOCKS,
85*4882a593Smuzhiyun 
86*4882a593Smuzhiyun 	.funcs = { {
87*4882a593Smuzhiyun 		.num_blocks = SERPENT_PARALLEL_BLOCKS,
88*4882a593Smuzhiyun 		.fn_u = { .ecb = serpent_enc_blk_xway }
89*4882a593Smuzhiyun 	}, {
90*4882a593Smuzhiyun 		.num_blocks = 1,
91*4882a593Smuzhiyun 		.fn_u = { .ecb = __serpent_encrypt }
92*4882a593Smuzhiyun 	} }
93*4882a593Smuzhiyun };
94*4882a593Smuzhiyun 
95*4882a593Smuzhiyun static const struct common_glue_ctx serpent_ctr = {
96*4882a593Smuzhiyun 	.num_funcs = 2,
97*4882a593Smuzhiyun 	.fpu_blocks_limit = SERPENT_PARALLEL_BLOCKS,
98*4882a593Smuzhiyun 
99*4882a593Smuzhiyun 	.funcs = { {
100*4882a593Smuzhiyun 		.num_blocks = SERPENT_PARALLEL_BLOCKS,
101*4882a593Smuzhiyun 		.fn_u = { .ctr = serpent_crypt_ctr_xway }
102*4882a593Smuzhiyun 	}, {
103*4882a593Smuzhiyun 		.num_blocks = 1,
104*4882a593Smuzhiyun 		.fn_u = { .ctr = serpent_crypt_ctr }
105*4882a593Smuzhiyun 	} }
106*4882a593Smuzhiyun };
107*4882a593Smuzhiyun 
108*4882a593Smuzhiyun static const struct common_glue_ctx serpent_dec = {
109*4882a593Smuzhiyun 	.num_funcs = 2,
110*4882a593Smuzhiyun 	.fpu_blocks_limit = SERPENT_PARALLEL_BLOCKS,
111*4882a593Smuzhiyun 
112*4882a593Smuzhiyun 	.funcs = { {
113*4882a593Smuzhiyun 		.num_blocks = SERPENT_PARALLEL_BLOCKS,
114*4882a593Smuzhiyun 		.fn_u = { .ecb = serpent_dec_blk_xway }
115*4882a593Smuzhiyun 	}, {
116*4882a593Smuzhiyun 		.num_blocks = 1,
117*4882a593Smuzhiyun 		.fn_u = { .ecb = __serpent_decrypt }
118*4882a593Smuzhiyun 	} }
119*4882a593Smuzhiyun };
120*4882a593Smuzhiyun 
121*4882a593Smuzhiyun static const struct common_glue_ctx serpent_dec_cbc = {
122*4882a593Smuzhiyun 	.num_funcs = 2,
123*4882a593Smuzhiyun 	.fpu_blocks_limit = SERPENT_PARALLEL_BLOCKS,
124*4882a593Smuzhiyun 
125*4882a593Smuzhiyun 	.funcs = { {
126*4882a593Smuzhiyun 		.num_blocks = SERPENT_PARALLEL_BLOCKS,
127*4882a593Smuzhiyun 		.fn_u = { .cbc = serpent_decrypt_cbc_xway }
128*4882a593Smuzhiyun 	}, {
129*4882a593Smuzhiyun 		.num_blocks = 1,
130*4882a593Smuzhiyun 		.fn_u = { .cbc = __serpent_decrypt }
131*4882a593Smuzhiyun 	} }
132*4882a593Smuzhiyun };
133*4882a593Smuzhiyun 
ecb_encrypt(struct skcipher_request * req)134*4882a593Smuzhiyun static int ecb_encrypt(struct skcipher_request *req)
135*4882a593Smuzhiyun {
136*4882a593Smuzhiyun 	return glue_ecb_req_128bit(&serpent_enc, req);
137*4882a593Smuzhiyun }
138*4882a593Smuzhiyun 
ecb_decrypt(struct skcipher_request * req)139*4882a593Smuzhiyun static int ecb_decrypt(struct skcipher_request *req)
140*4882a593Smuzhiyun {
141*4882a593Smuzhiyun 	return glue_ecb_req_128bit(&serpent_dec, req);
142*4882a593Smuzhiyun }
143*4882a593Smuzhiyun 
cbc_encrypt(struct skcipher_request * req)144*4882a593Smuzhiyun static int cbc_encrypt(struct skcipher_request *req)
145*4882a593Smuzhiyun {
146*4882a593Smuzhiyun 	return glue_cbc_encrypt_req_128bit(__serpent_encrypt,
147*4882a593Smuzhiyun 					   req);
148*4882a593Smuzhiyun }
149*4882a593Smuzhiyun 
cbc_decrypt(struct skcipher_request * req)150*4882a593Smuzhiyun static int cbc_decrypt(struct skcipher_request *req)
151*4882a593Smuzhiyun {
152*4882a593Smuzhiyun 	return glue_cbc_decrypt_req_128bit(&serpent_dec_cbc, req);
153*4882a593Smuzhiyun }
154*4882a593Smuzhiyun 
ctr_crypt(struct skcipher_request * req)155*4882a593Smuzhiyun static int ctr_crypt(struct skcipher_request *req)
156*4882a593Smuzhiyun {
157*4882a593Smuzhiyun 	return glue_ctr_req_128bit(&serpent_ctr, req);
158*4882a593Smuzhiyun }
159*4882a593Smuzhiyun 
160*4882a593Smuzhiyun static struct skcipher_alg serpent_algs[] = {
161*4882a593Smuzhiyun 	{
162*4882a593Smuzhiyun 		.base.cra_name		= "__ecb(serpent)",
163*4882a593Smuzhiyun 		.base.cra_driver_name	= "__ecb-serpent-sse2",
164*4882a593Smuzhiyun 		.base.cra_priority	= 400,
165*4882a593Smuzhiyun 		.base.cra_flags		= CRYPTO_ALG_INTERNAL,
166*4882a593Smuzhiyun 		.base.cra_blocksize	= SERPENT_BLOCK_SIZE,
167*4882a593Smuzhiyun 		.base.cra_ctxsize	= sizeof(struct serpent_ctx),
168*4882a593Smuzhiyun 		.base.cra_module	= THIS_MODULE,
169*4882a593Smuzhiyun 		.min_keysize		= SERPENT_MIN_KEY_SIZE,
170*4882a593Smuzhiyun 		.max_keysize		= SERPENT_MAX_KEY_SIZE,
171*4882a593Smuzhiyun 		.setkey			= serpent_setkey_skcipher,
172*4882a593Smuzhiyun 		.encrypt		= ecb_encrypt,
173*4882a593Smuzhiyun 		.decrypt		= ecb_decrypt,
174*4882a593Smuzhiyun 	}, {
175*4882a593Smuzhiyun 		.base.cra_name		= "__cbc(serpent)",
176*4882a593Smuzhiyun 		.base.cra_driver_name	= "__cbc-serpent-sse2",
177*4882a593Smuzhiyun 		.base.cra_priority	= 400,
178*4882a593Smuzhiyun 		.base.cra_flags		= CRYPTO_ALG_INTERNAL,
179*4882a593Smuzhiyun 		.base.cra_blocksize	= SERPENT_BLOCK_SIZE,
180*4882a593Smuzhiyun 		.base.cra_ctxsize	= sizeof(struct serpent_ctx),
181*4882a593Smuzhiyun 		.base.cra_module	= THIS_MODULE,
182*4882a593Smuzhiyun 		.min_keysize		= SERPENT_MIN_KEY_SIZE,
183*4882a593Smuzhiyun 		.max_keysize		= SERPENT_MAX_KEY_SIZE,
184*4882a593Smuzhiyun 		.ivsize			= SERPENT_BLOCK_SIZE,
185*4882a593Smuzhiyun 		.setkey			= serpent_setkey_skcipher,
186*4882a593Smuzhiyun 		.encrypt		= cbc_encrypt,
187*4882a593Smuzhiyun 		.decrypt		= cbc_decrypt,
188*4882a593Smuzhiyun 	}, {
189*4882a593Smuzhiyun 		.base.cra_name		= "__ctr(serpent)",
190*4882a593Smuzhiyun 		.base.cra_driver_name	= "__ctr-serpent-sse2",
191*4882a593Smuzhiyun 		.base.cra_priority	= 400,
192*4882a593Smuzhiyun 		.base.cra_flags		= CRYPTO_ALG_INTERNAL,
193*4882a593Smuzhiyun 		.base.cra_blocksize	= 1,
194*4882a593Smuzhiyun 		.base.cra_ctxsize	= sizeof(struct serpent_ctx),
195*4882a593Smuzhiyun 		.base.cra_module	= THIS_MODULE,
196*4882a593Smuzhiyun 		.min_keysize		= SERPENT_MIN_KEY_SIZE,
197*4882a593Smuzhiyun 		.max_keysize		= SERPENT_MAX_KEY_SIZE,
198*4882a593Smuzhiyun 		.ivsize			= SERPENT_BLOCK_SIZE,
199*4882a593Smuzhiyun 		.chunksize		= SERPENT_BLOCK_SIZE,
200*4882a593Smuzhiyun 		.setkey			= serpent_setkey_skcipher,
201*4882a593Smuzhiyun 		.encrypt		= ctr_crypt,
202*4882a593Smuzhiyun 		.decrypt		= ctr_crypt,
203*4882a593Smuzhiyun 	},
204*4882a593Smuzhiyun };
205*4882a593Smuzhiyun 
206*4882a593Smuzhiyun static struct simd_skcipher_alg *serpent_simd_algs[ARRAY_SIZE(serpent_algs)];
207*4882a593Smuzhiyun 
serpent_sse2_init(void)208*4882a593Smuzhiyun static int __init serpent_sse2_init(void)
209*4882a593Smuzhiyun {
210*4882a593Smuzhiyun 	if (!boot_cpu_has(X86_FEATURE_XMM2)) {
211*4882a593Smuzhiyun 		printk(KERN_INFO "SSE2 instructions are not detected.\n");
212*4882a593Smuzhiyun 		return -ENODEV;
213*4882a593Smuzhiyun 	}
214*4882a593Smuzhiyun 
215*4882a593Smuzhiyun 	return simd_register_skciphers_compat(serpent_algs,
216*4882a593Smuzhiyun 					      ARRAY_SIZE(serpent_algs),
217*4882a593Smuzhiyun 					      serpent_simd_algs);
218*4882a593Smuzhiyun }
219*4882a593Smuzhiyun 
serpent_sse2_exit(void)220*4882a593Smuzhiyun static void __exit serpent_sse2_exit(void)
221*4882a593Smuzhiyun {
222*4882a593Smuzhiyun 	simd_unregister_skciphers(serpent_algs, ARRAY_SIZE(serpent_algs),
223*4882a593Smuzhiyun 				  serpent_simd_algs);
224*4882a593Smuzhiyun }
225*4882a593Smuzhiyun 
226*4882a593Smuzhiyun module_init(serpent_sse2_init);
227*4882a593Smuzhiyun module_exit(serpent_sse2_exit);
228*4882a593Smuzhiyun 
229*4882a593Smuzhiyun MODULE_DESCRIPTION("Serpent Cipher Algorithm, SSE2 optimized");
230*4882a593Smuzhiyun MODULE_LICENSE("GPL");
231*4882a593Smuzhiyun MODULE_ALIAS_CRYPTO("serpent");
232