1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-or-later
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun * Glue Code for AVX assembler versions of Serpent Cipher
4*4882a593Smuzhiyun *
5*4882a593Smuzhiyun * Copyright (C) 2012 Johannes Goetzfried
6*4882a593Smuzhiyun * <Johannes.Goetzfried@informatik.stud.uni-erlangen.de>
7*4882a593Smuzhiyun *
8*4882a593Smuzhiyun * Copyright © 2011-2013 Jussi Kivilinna <jussi.kivilinna@iki.fi>
9*4882a593Smuzhiyun */
10*4882a593Smuzhiyun
11*4882a593Smuzhiyun #include <linux/module.h>
12*4882a593Smuzhiyun #include <linux/types.h>
13*4882a593Smuzhiyun #include <linux/crypto.h>
14*4882a593Smuzhiyun #include <linux/err.h>
15*4882a593Smuzhiyun #include <crypto/algapi.h>
16*4882a593Smuzhiyun #include <crypto/internal/simd.h>
17*4882a593Smuzhiyun #include <crypto/serpent.h>
18*4882a593Smuzhiyun #include <crypto/xts.h>
19*4882a593Smuzhiyun #include <asm/crypto/glue_helper.h>
20*4882a593Smuzhiyun #include <asm/crypto/serpent-avx.h>
21*4882a593Smuzhiyun
22*4882a593Smuzhiyun /* 8-way parallel cipher functions */
23*4882a593Smuzhiyun asmlinkage void serpent_ecb_enc_8way_avx(const void *ctx, u8 *dst,
24*4882a593Smuzhiyun const u8 *src);
25*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(serpent_ecb_enc_8way_avx);
26*4882a593Smuzhiyun
27*4882a593Smuzhiyun asmlinkage void serpent_ecb_dec_8way_avx(const void *ctx, u8 *dst,
28*4882a593Smuzhiyun const u8 *src);
29*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(serpent_ecb_dec_8way_avx);
30*4882a593Smuzhiyun
31*4882a593Smuzhiyun asmlinkage void serpent_cbc_dec_8way_avx(const void *ctx, u8 *dst,
32*4882a593Smuzhiyun const u8 *src);
33*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(serpent_cbc_dec_8way_avx);
34*4882a593Smuzhiyun
35*4882a593Smuzhiyun asmlinkage void serpent_ctr_8way_avx(const void *ctx, u8 *dst, const u8 *src,
36*4882a593Smuzhiyun le128 *iv);
37*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(serpent_ctr_8way_avx);
38*4882a593Smuzhiyun
39*4882a593Smuzhiyun asmlinkage void serpent_xts_enc_8way_avx(const void *ctx, u8 *dst,
40*4882a593Smuzhiyun const u8 *src, le128 *iv);
41*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(serpent_xts_enc_8way_avx);
42*4882a593Smuzhiyun
43*4882a593Smuzhiyun asmlinkage void serpent_xts_dec_8way_avx(const void *ctx, u8 *dst,
44*4882a593Smuzhiyun const u8 *src, le128 *iv);
45*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(serpent_xts_dec_8way_avx);
46*4882a593Smuzhiyun
/*
 * Process one block in CTR mode.
 *
 * @ctx: cipher context handed to __serpent_encrypt()
 * @d:   destination block
 * @s:   source block
 * @iv:  little-endian counter; incremented by this call
 *
 * The counter value held in @iv on entry is converted to a be128 block,
 * that block is encrypted in place, and the result is XORed with the
 * source block into the destination block.
 */
void __serpent_crypt_ctr(const void *ctx, u8 *d, const u8 *s, le128 *iv)
{
	const u128 *in = (const u128 *)s;
	u128 *out = (u128 *)d;
	be128 keystream;

	/* Capture the counter before advancing it for the next block. */
	le128_to_be128(&keystream, iv);
	le128_inc(iv);

	/* Encrypt the captured counter in place, then XOR it with the input. */
	__serpent_encrypt(ctx, (u8 *)&keystream, (u8 *)&keystream);
	u128_xor(out, in, (u128 *)&keystream);
}
EXPORT_SYMBOL_GPL(__serpent_crypt_ctr);
60*4882a593Smuzhiyun
/*
 * Single-block XTS encryption: hands the block to
 * glue_xts_crypt_128bit_one() with __serpent_encrypt() as the cipher
 * primitive. Used as the one-block entry of serpent_enc_xts.
 */
void serpent_xts_enc(const void *ctx, u8 *dst, const u8 *src, le128 *iv)
{
	glue_xts_crypt_128bit_one(ctx, dst, src, iv,
				  __serpent_encrypt);
}
EXPORT_SYMBOL_GPL(serpent_xts_enc);
66*4882a593Smuzhiyun
/*
 * Single-block XTS decryption: hands the block to
 * glue_xts_crypt_128bit_one() with __serpent_decrypt() as the cipher
 * primitive. Used as the one-block entry of serpent_dec_xts.
 */
void serpent_xts_dec(const void *ctx, u8 *dst, const u8 *src, le128 *iv)
{
	glue_xts_crypt_128bit_one(ctx, dst, src, iv,
				  __serpent_decrypt);
}
EXPORT_SYMBOL_GPL(serpent_xts_dec);
72*4882a593Smuzhiyun
/*
 * skcipher ->setkey() hook for the ECB, CBC and CTR algorithms: passes
 * the key to __serpent_setkey() together with the transform's context
 * and returns its result.
 */
static int serpent_setkey_skcipher(struct crypto_skcipher *tfm,
				   const u8 *key, unsigned int keylen)
{
	struct serpent_ctx *sctx = crypto_skcipher_ctx(tfm);

	return __serpent_setkey(sctx, key, keylen);
}
78*4882a593Smuzhiyun
xts_serpent_setkey(struct crypto_skcipher * tfm,const u8 * key,unsigned int keylen)79*4882a593Smuzhiyun int xts_serpent_setkey(struct crypto_skcipher *tfm, const u8 *key,
80*4882a593Smuzhiyun unsigned int keylen)
81*4882a593Smuzhiyun {
82*4882a593Smuzhiyun struct serpent_xts_ctx *ctx = crypto_skcipher_ctx(tfm);
83*4882a593Smuzhiyun int err;
84*4882a593Smuzhiyun
85*4882a593Smuzhiyun err = xts_verify_key(tfm, key, keylen);
86*4882a593Smuzhiyun if (err)
87*4882a593Smuzhiyun return err;
88*4882a593Smuzhiyun
89*4882a593Smuzhiyun /* first half of xts-key is for crypt */
90*4882a593Smuzhiyun err = __serpent_setkey(&ctx->crypt_ctx, key, keylen / 2);
91*4882a593Smuzhiyun if (err)
92*4882a593Smuzhiyun return err;
93*4882a593Smuzhiyun
94*4882a593Smuzhiyun /* second half of xts-key is for tweak */
95*4882a593Smuzhiyun return __serpent_setkey(&ctx->tweak_ctx, key + keylen / 2, keylen / 2);
96*4882a593Smuzhiyun }
97*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(xts_serpent_setkey);
98*4882a593Smuzhiyun
99*4882a593Smuzhiyun static const struct common_glue_ctx serpent_enc = {
100*4882a593Smuzhiyun .num_funcs = 2,
101*4882a593Smuzhiyun .fpu_blocks_limit = SERPENT_PARALLEL_BLOCKS,
102*4882a593Smuzhiyun
103*4882a593Smuzhiyun .funcs = { {
104*4882a593Smuzhiyun .num_blocks = SERPENT_PARALLEL_BLOCKS,
105*4882a593Smuzhiyun .fn_u = { .ecb = serpent_ecb_enc_8way_avx }
106*4882a593Smuzhiyun }, {
107*4882a593Smuzhiyun .num_blocks = 1,
108*4882a593Smuzhiyun .fn_u = { .ecb = __serpent_encrypt }
109*4882a593Smuzhiyun } }
110*4882a593Smuzhiyun };
111*4882a593Smuzhiyun
112*4882a593Smuzhiyun static const struct common_glue_ctx serpent_ctr = {
113*4882a593Smuzhiyun .num_funcs = 2,
114*4882a593Smuzhiyun .fpu_blocks_limit = SERPENT_PARALLEL_BLOCKS,
115*4882a593Smuzhiyun
116*4882a593Smuzhiyun .funcs = { {
117*4882a593Smuzhiyun .num_blocks = SERPENT_PARALLEL_BLOCKS,
118*4882a593Smuzhiyun .fn_u = { .ctr = serpent_ctr_8way_avx }
119*4882a593Smuzhiyun }, {
120*4882a593Smuzhiyun .num_blocks = 1,
121*4882a593Smuzhiyun .fn_u = { .ctr = __serpent_crypt_ctr }
122*4882a593Smuzhiyun } }
123*4882a593Smuzhiyun };
124*4882a593Smuzhiyun
125*4882a593Smuzhiyun static const struct common_glue_ctx serpent_enc_xts = {
126*4882a593Smuzhiyun .num_funcs = 2,
127*4882a593Smuzhiyun .fpu_blocks_limit = SERPENT_PARALLEL_BLOCKS,
128*4882a593Smuzhiyun
129*4882a593Smuzhiyun .funcs = { {
130*4882a593Smuzhiyun .num_blocks = SERPENT_PARALLEL_BLOCKS,
131*4882a593Smuzhiyun .fn_u = { .xts = serpent_xts_enc_8way_avx }
132*4882a593Smuzhiyun }, {
133*4882a593Smuzhiyun .num_blocks = 1,
134*4882a593Smuzhiyun .fn_u = { .xts = serpent_xts_enc }
135*4882a593Smuzhiyun } }
136*4882a593Smuzhiyun };
137*4882a593Smuzhiyun
138*4882a593Smuzhiyun static const struct common_glue_ctx serpent_dec = {
139*4882a593Smuzhiyun .num_funcs = 2,
140*4882a593Smuzhiyun .fpu_blocks_limit = SERPENT_PARALLEL_BLOCKS,
141*4882a593Smuzhiyun
142*4882a593Smuzhiyun .funcs = { {
143*4882a593Smuzhiyun .num_blocks = SERPENT_PARALLEL_BLOCKS,
144*4882a593Smuzhiyun .fn_u = { .ecb = serpent_ecb_dec_8way_avx }
145*4882a593Smuzhiyun }, {
146*4882a593Smuzhiyun .num_blocks = 1,
147*4882a593Smuzhiyun .fn_u = { .ecb = __serpent_decrypt }
148*4882a593Smuzhiyun } }
149*4882a593Smuzhiyun };
150*4882a593Smuzhiyun
151*4882a593Smuzhiyun static const struct common_glue_ctx serpent_dec_cbc = {
152*4882a593Smuzhiyun .num_funcs = 2,
153*4882a593Smuzhiyun .fpu_blocks_limit = SERPENT_PARALLEL_BLOCKS,
154*4882a593Smuzhiyun
155*4882a593Smuzhiyun .funcs = { {
156*4882a593Smuzhiyun .num_blocks = SERPENT_PARALLEL_BLOCKS,
157*4882a593Smuzhiyun .fn_u = { .cbc = serpent_cbc_dec_8way_avx }
158*4882a593Smuzhiyun }, {
159*4882a593Smuzhiyun .num_blocks = 1,
160*4882a593Smuzhiyun .fn_u = { .cbc = __serpent_decrypt }
161*4882a593Smuzhiyun } }
162*4882a593Smuzhiyun };
163*4882a593Smuzhiyun
164*4882a593Smuzhiyun static const struct common_glue_ctx serpent_dec_xts = {
165*4882a593Smuzhiyun .num_funcs = 2,
166*4882a593Smuzhiyun .fpu_blocks_limit = SERPENT_PARALLEL_BLOCKS,
167*4882a593Smuzhiyun
168*4882a593Smuzhiyun .funcs = { {
169*4882a593Smuzhiyun .num_blocks = SERPENT_PARALLEL_BLOCKS,
170*4882a593Smuzhiyun .fn_u = { .xts = serpent_xts_dec_8way_avx }
171*4882a593Smuzhiyun }, {
172*4882a593Smuzhiyun .num_blocks = 1,
173*4882a593Smuzhiyun .fn_u = { .xts = serpent_xts_dec }
174*4882a593Smuzhiyun } }
175*4882a593Smuzhiyun };
176*4882a593Smuzhiyun
ecb_encrypt(struct skcipher_request * req)177*4882a593Smuzhiyun static int ecb_encrypt(struct skcipher_request *req)
178*4882a593Smuzhiyun {
179*4882a593Smuzhiyun return glue_ecb_req_128bit(&serpent_enc, req);
180*4882a593Smuzhiyun }
181*4882a593Smuzhiyun
ecb_decrypt(struct skcipher_request * req)182*4882a593Smuzhiyun static int ecb_decrypt(struct skcipher_request *req)
183*4882a593Smuzhiyun {
184*4882a593Smuzhiyun return glue_ecb_req_128bit(&serpent_dec, req);
185*4882a593Smuzhiyun }
186*4882a593Smuzhiyun
cbc_encrypt(struct skcipher_request * req)187*4882a593Smuzhiyun static int cbc_encrypt(struct skcipher_request *req)
188*4882a593Smuzhiyun {
189*4882a593Smuzhiyun return glue_cbc_encrypt_req_128bit(__serpent_encrypt, req);
190*4882a593Smuzhiyun }
191*4882a593Smuzhiyun
cbc_decrypt(struct skcipher_request * req)192*4882a593Smuzhiyun static int cbc_decrypt(struct skcipher_request *req)
193*4882a593Smuzhiyun {
194*4882a593Smuzhiyun return glue_cbc_decrypt_req_128bit(&serpent_dec_cbc, req);
195*4882a593Smuzhiyun }
196*4882a593Smuzhiyun
ctr_crypt(struct skcipher_request * req)197*4882a593Smuzhiyun static int ctr_crypt(struct skcipher_request *req)
198*4882a593Smuzhiyun {
199*4882a593Smuzhiyun return glue_ctr_req_128bit(&serpent_ctr, req);
200*4882a593Smuzhiyun }
201*4882a593Smuzhiyun
xts_encrypt(struct skcipher_request * req)202*4882a593Smuzhiyun static int xts_encrypt(struct skcipher_request *req)
203*4882a593Smuzhiyun {
204*4882a593Smuzhiyun struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
205*4882a593Smuzhiyun struct serpent_xts_ctx *ctx = crypto_skcipher_ctx(tfm);
206*4882a593Smuzhiyun
207*4882a593Smuzhiyun return glue_xts_req_128bit(&serpent_enc_xts, req,
208*4882a593Smuzhiyun __serpent_encrypt, &ctx->tweak_ctx,
209*4882a593Smuzhiyun &ctx->crypt_ctx, false);
210*4882a593Smuzhiyun }
211*4882a593Smuzhiyun
xts_decrypt(struct skcipher_request * req)212*4882a593Smuzhiyun static int xts_decrypt(struct skcipher_request *req)
213*4882a593Smuzhiyun {
214*4882a593Smuzhiyun struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
215*4882a593Smuzhiyun struct serpent_xts_ctx *ctx = crypto_skcipher_ctx(tfm);
216*4882a593Smuzhiyun
217*4882a593Smuzhiyun return glue_xts_req_128bit(&serpent_dec_xts, req,
218*4882a593Smuzhiyun __serpent_encrypt, &ctx->tweak_ctx,
219*4882a593Smuzhiyun &ctx->crypt_ctx, true);
220*4882a593Smuzhiyun }
221*4882a593Smuzhiyun
222*4882a593Smuzhiyun static struct skcipher_alg serpent_algs[] = {
223*4882a593Smuzhiyun {
224*4882a593Smuzhiyun .base.cra_name = "__ecb(serpent)",
225*4882a593Smuzhiyun .base.cra_driver_name = "__ecb-serpent-avx",
226*4882a593Smuzhiyun .base.cra_priority = 500,
227*4882a593Smuzhiyun .base.cra_flags = CRYPTO_ALG_INTERNAL,
228*4882a593Smuzhiyun .base.cra_blocksize = SERPENT_BLOCK_SIZE,
229*4882a593Smuzhiyun .base.cra_ctxsize = sizeof(struct serpent_ctx),
230*4882a593Smuzhiyun .base.cra_module = THIS_MODULE,
231*4882a593Smuzhiyun .min_keysize = SERPENT_MIN_KEY_SIZE,
232*4882a593Smuzhiyun .max_keysize = SERPENT_MAX_KEY_SIZE,
233*4882a593Smuzhiyun .setkey = serpent_setkey_skcipher,
234*4882a593Smuzhiyun .encrypt = ecb_encrypt,
235*4882a593Smuzhiyun .decrypt = ecb_decrypt,
236*4882a593Smuzhiyun }, {
237*4882a593Smuzhiyun .base.cra_name = "__cbc(serpent)",
238*4882a593Smuzhiyun .base.cra_driver_name = "__cbc-serpent-avx",
239*4882a593Smuzhiyun .base.cra_priority = 500,
240*4882a593Smuzhiyun .base.cra_flags = CRYPTO_ALG_INTERNAL,
241*4882a593Smuzhiyun .base.cra_blocksize = SERPENT_BLOCK_SIZE,
242*4882a593Smuzhiyun .base.cra_ctxsize = sizeof(struct serpent_ctx),
243*4882a593Smuzhiyun .base.cra_module = THIS_MODULE,
244*4882a593Smuzhiyun .min_keysize = SERPENT_MIN_KEY_SIZE,
245*4882a593Smuzhiyun .max_keysize = SERPENT_MAX_KEY_SIZE,
246*4882a593Smuzhiyun .ivsize = SERPENT_BLOCK_SIZE,
247*4882a593Smuzhiyun .setkey = serpent_setkey_skcipher,
248*4882a593Smuzhiyun .encrypt = cbc_encrypt,
249*4882a593Smuzhiyun .decrypt = cbc_decrypt,
250*4882a593Smuzhiyun }, {
251*4882a593Smuzhiyun .base.cra_name = "__ctr(serpent)",
252*4882a593Smuzhiyun .base.cra_driver_name = "__ctr-serpent-avx",
253*4882a593Smuzhiyun .base.cra_priority = 500,
254*4882a593Smuzhiyun .base.cra_flags = CRYPTO_ALG_INTERNAL,
255*4882a593Smuzhiyun .base.cra_blocksize = 1,
256*4882a593Smuzhiyun .base.cra_ctxsize = sizeof(struct serpent_ctx),
257*4882a593Smuzhiyun .base.cra_module = THIS_MODULE,
258*4882a593Smuzhiyun .min_keysize = SERPENT_MIN_KEY_SIZE,
259*4882a593Smuzhiyun .max_keysize = SERPENT_MAX_KEY_SIZE,
260*4882a593Smuzhiyun .ivsize = SERPENT_BLOCK_SIZE,
261*4882a593Smuzhiyun .chunksize = SERPENT_BLOCK_SIZE,
262*4882a593Smuzhiyun .setkey = serpent_setkey_skcipher,
263*4882a593Smuzhiyun .encrypt = ctr_crypt,
264*4882a593Smuzhiyun .decrypt = ctr_crypt,
265*4882a593Smuzhiyun }, {
266*4882a593Smuzhiyun .base.cra_name = "__xts(serpent)",
267*4882a593Smuzhiyun .base.cra_driver_name = "__xts-serpent-avx",
268*4882a593Smuzhiyun .base.cra_priority = 500,
269*4882a593Smuzhiyun .base.cra_flags = CRYPTO_ALG_INTERNAL,
270*4882a593Smuzhiyun .base.cra_blocksize = SERPENT_BLOCK_SIZE,
271*4882a593Smuzhiyun .base.cra_ctxsize = sizeof(struct serpent_xts_ctx),
272*4882a593Smuzhiyun .base.cra_module = THIS_MODULE,
273*4882a593Smuzhiyun .min_keysize = 2 * SERPENT_MIN_KEY_SIZE,
274*4882a593Smuzhiyun .max_keysize = 2 * SERPENT_MAX_KEY_SIZE,
275*4882a593Smuzhiyun .ivsize = SERPENT_BLOCK_SIZE,
276*4882a593Smuzhiyun .setkey = xts_serpent_setkey,
277*4882a593Smuzhiyun .encrypt = xts_encrypt,
278*4882a593Smuzhiyun .decrypt = xts_decrypt,
279*4882a593Smuzhiyun },
280*4882a593Smuzhiyun };
281*4882a593Smuzhiyun
282*4882a593Smuzhiyun static struct simd_skcipher_alg *serpent_simd_algs[ARRAY_SIZE(serpent_algs)];
283*4882a593Smuzhiyun
serpent_init(void)284*4882a593Smuzhiyun static int __init serpent_init(void)
285*4882a593Smuzhiyun {
286*4882a593Smuzhiyun const char *feature_name;
287*4882a593Smuzhiyun
288*4882a593Smuzhiyun if (!cpu_has_xfeatures(XFEATURE_MASK_SSE | XFEATURE_MASK_YMM,
289*4882a593Smuzhiyun &feature_name)) {
290*4882a593Smuzhiyun pr_info("CPU feature '%s' is not supported.\n", feature_name);
291*4882a593Smuzhiyun return -ENODEV;
292*4882a593Smuzhiyun }
293*4882a593Smuzhiyun
294*4882a593Smuzhiyun return simd_register_skciphers_compat(serpent_algs,
295*4882a593Smuzhiyun ARRAY_SIZE(serpent_algs),
296*4882a593Smuzhiyun serpent_simd_algs);
297*4882a593Smuzhiyun }
298*4882a593Smuzhiyun
serpent_exit(void)299*4882a593Smuzhiyun static void __exit serpent_exit(void)
300*4882a593Smuzhiyun {
301*4882a593Smuzhiyun simd_unregister_skciphers(serpent_algs, ARRAY_SIZE(serpent_algs),
302*4882a593Smuzhiyun serpent_simd_algs);
303*4882a593Smuzhiyun }
304*4882a593Smuzhiyun
305*4882a593Smuzhiyun module_init(serpent_init);
306*4882a593Smuzhiyun module_exit(serpent_exit);
307*4882a593Smuzhiyun
308*4882a593Smuzhiyun MODULE_DESCRIPTION("Serpent Cipher Algorithm, AVX optimized");
309*4882a593Smuzhiyun MODULE_LICENSE("GPL");
310*4882a593Smuzhiyun MODULE_ALIAS_CRYPTO("serpent");
311