// SPDX-License-Identifier: GPL-2.0-or-later
/*
 * Glue Code for x86_64/AVX/AES-NI assembler optimized version of Camellia
 *
 * Copyright © 2012-2013 Jussi Kivilinna <jussi.kivilinna@iki.fi>
 */
7*4882a593Smuzhiyun
8*4882a593Smuzhiyun #include <asm/crypto/camellia.h>
9*4882a593Smuzhiyun #include <asm/crypto/glue_helper.h>
10*4882a593Smuzhiyun #include <crypto/algapi.h>
11*4882a593Smuzhiyun #include <crypto/internal/simd.h>
12*4882a593Smuzhiyun #include <crypto/xts.h>
13*4882a593Smuzhiyun #include <linux/crypto.h>
14*4882a593Smuzhiyun #include <linux/err.h>
15*4882a593Smuzhiyun #include <linux/module.h>
16*4882a593Smuzhiyun #include <linux/types.h>
17*4882a593Smuzhiyun
18*4882a593Smuzhiyun #define CAMELLIA_AESNI_PARALLEL_BLOCKS 16
19*4882a593Smuzhiyun
20*4882a593Smuzhiyun /* 16-way parallel cipher functions (avx/aes-ni) */
21*4882a593Smuzhiyun asmlinkage void camellia_ecb_enc_16way(const void *ctx, u8 *dst, const u8 *src);
22*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(camellia_ecb_enc_16way);
23*4882a593Smuzhiyun
24*4882a593Smuzhiyun asmlinkage void camellia_ecb_dec_16way(const void *ctx, u8 *dst, const u8 *src);
25*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(camellia_ecb_dec_16way);
26*4882a593Smuzhiyun
27*4882a593Smuzhiyun asmlinkage void camellia_cbc_dec_16way(const void *ctx, u8 *dst, const u8 *src);
28*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(camellia_cbc_dec_16way);
29*4882a593Smuzhiyun
30*4882a593Smuzhiyun asmlinkage void camellia_ctr_16way(const void *ctx, u8 *dst, const u8 *src,
31*4882a593Smuzhiyun le128 *iv);
32*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(camellia_ctr_16way);
33*4882a593Smuzhiyun
34*4882a593Smuzhiyun asmlinkage void camellia_xts_enc_16way(const void *ctx, u8 *dst, const u8 *src,
35*4882a593Smuzhiyun le128 *iv);
36*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(camellia_xts_enc_16way);
37*4882a593Smuzhiyun
38*4882a593Smuzhiyun asmlinkage void camellia_xts_dec_16way(const void *ctx, u8 *dst, const u8 *src,
39*4882a593Smuzhiyun le128 *iv);
40*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(camellia_xts_dec_16way);
41*4882a593Smuzhiyun
/*
 * XTS encryption helper registered as the num_blocks = 1 entry of
 * camellia_enc_xts.  It hands its arguments straight to
 * glue_xts_crypt_128bit_one(), supplying camellia_enc_blk as the block
 * function.
 */
void camellia_xts_enc(const void *ctx, u8 *dst, const u8 *src, le128 *iv)
{
	glue_xts_crypt_128bit_one(ctx, dst, src, iv, camellia_enc_blk);
}
EXPORT_SYMBOL_GPL(camellia_xts_enc);
47*4882a593Smuzhiyun
/*
 * XTS decryption helper registered as the num_blocks = 1 entry of
 * camellia_dec_xts.  It hands its arguments straight to
 * glue_xts_crypt_128bit_one(), supplying camellia_dec_blk as the block
 * function.
 */
void camellia_xts_dec(const void *ctx, u8 *dst, const u8 *src, le128 *iv)
{
	glue_xts_crypt_128bit_one(ctx, dst, src, iv, camellia_dec_blk);
}
EXPORT_SYMBOL_GPL(camellia_xts_dec);
53*4882a593Smuzhiyun
54*4882a593Smuzhiyun static const struct common_glue_ctx camellia_enc = {
55*4882a593Smuzhiyun .num_funcs = 3,
56*4882a593Smuzhiyun .fpu_blocks_limit = CAMELLIA_AESNI_PARALLEL_BLOCKS,
57*4882a593Smuzhiyun
58*4882a593Smuzhiyun .funcs = { {
59*4882a593Smuzhiyun .num_blocks = CAMELLIA_AESNI_PARALLEL_BLOCKS,
60*4882a593Smuzhiyun .fn_u = { .ecb = camellia_ecb_enc_16way }
61*4882a593Smuzhiyun }, {
62*4882a593Smuzhiyun .num_blocks = 2,
63*4882a593Smuzhiyun .fn_u = { .ecb = camellia_enc_blk_2way }
64*4882a593Smuzhiyun }, {
65*4882a593Smuzhiyun .num_blocks = 1,
66*4882a593Smuzhiyun .fn_u = { .ecb = camellia_enc_blk }
67*4882a593Smuzhiyun } }
68*4882a593Smuzhiyun };
69*4882a593Smuzhiyun
70*4882a593Smuzhiyun static const struct common_glue_ctx camellia_ctr = {
71*4882a593Smuzhiyun .num_funcs = 3,
72*4882a593Smuzhiyun .fpu_blocks_limit = CAMELLIA_AESNI_PARALLEL_BLOCKS,
73*4882a593Smuzhiyun
74*4882a593Smuzhiyun .funcs = { {
75*4882a593Smuzhiyun .num_blocks = CAMELLIA_AESNI_PARALLEL_BLOCKS,
76*4882a593Smuzhiyun .fn_u = { .ctr = camellia_ctr_16way }
77*4882a593Smuzhiyun }, {
78*4882a593Smuzhiyun .num_blocks = 2,
79*4882a593Smuzhiyun .fn_u = { .ctr = camellia_crypt_ctr_2way }
80*4882a593Smuzhiyun }, {
81*4882a593Smuzhiyun .num_blocks = 1,
82*4882a593Smuzhiyun .fn_u = { .ctr = camellia_crypt_ctr }
83*4882a593Smuzhiyun } }
84*4882a593Smuzhiyun };
85*4882a593Smuzhiyun
86*4882a593Smuzhiyun static const struct common_glue_ctx camellia_enc_xts = {
87*4882a593Smuzhiyun .num_funcs = 2,
88*4882a593Smuzhiyun .fpu_blocks_limit = CAMELLIA_AESNI_PARALLEL_BLOCKS,
89*4882a593Smuzhiyun
90*4882a593Smuzhiyun .funcs = { {
91*4882a593Smuzhiyun .num_blocks = CAMELLIA_AESNI_PARALLEL_BLOCKS,
92*4882a593Smuzhiyun .fn_u = { .xts = camellia_xts_enc_16way }
93*4882a593Smuzhiyun }, {
94*4882a593Smuzhiyun .num_blocks = 1,
95*4882a593Smuzhiyun .fn_u = { .xts = camellia_xts_enc }
96*4882a593Smuzhiyun } }
97*4882a593Smuzhiyun };
98*4882a593Smuzhiyun
99*4882a593Smuzhiyun static const struct common_glue_ctx camellia_dec = {
100*4882a593Smuzhiyun .num_funcs = 3,
101*4882a593Smuzhiyun .fpu_blocks_limit = CAMELLIA_AESNI_PARALLEL_BLOCKS,
102*4882a593Smuzhiyun
103*4882a593Smuzhiyun .funcs = { {
104*4882a593Smuzhiyun .num_blocks = CAMELLIA_AESNI_PARALLEL_BLOCKS,
105*4882a593Smuzhiyun .fn_u = { .ecb = camellia_ecb_dec_16way }
106*4882a593Smuzhiyun }, {
107*4882a593Smuzhiyun .num_blocks = 2,
108*4882a593Smuzhiyun .fn_u = { .ecb = camellia_dec_blk_2way }
109*4882a593Smuzhiyun }, {
110*4882a593Smuzhiyun .num_blocks = 1,
111*4882a593Smuzhiyun .fn_u = { .ecb = camellia_dec_blk }
112*4882a593Smuzhiyun } }
113*4882a593Smuzhiyun };
114*4882a593Smuzhiyun
115*4882a593Smuzhiyun static const struct common_glue_ctx camellia_dec_cbc = {
116*4882a593Smuzhiyun .num_funcs = 3,
117*4882a593Smuzhiyun .fpu_blocks_limit = CAMELLIA_AESNI_PARALLEL_BLOCKS,
118*4882a593Smuzhiyun
119*4882a593Smuzhiyun .funcs = { {
120*4882a593Smuzhiyun .num_blocks = CAMELLIA_AESNI_PARALLEL_BLOCKS,
121*4882a593Smuzhiyun .fn_u = { .cbc = camellia_cbc_dec_16way }
122*4882a593Smuzhiyun }, {
123*4882a593Smuzhiyun .num_blocks = 2,
124*4882a593Smuzhiyun .fn_u = { .cbc = camellia_decrypt_cbc_2way }
125*4882a593Smuzhiyun }, {
126*4882a593Smuzhiyun .num_blocks = 1,
127*4882a593Smuzhiyun .fn_u = { .cbc = camellia_dec_blk }
128*4882a593Smuzhiyun } }
129*4882a593Smuzhiyun };
130*4882a593Smuzhiyun
131*4882a593Smuzhiyun static const struct common_glue_ctx camellia_dec_xts = {
132*4882a593Smuzhiyun .num_funcs = 2,
133*4882a593Smuzhiyun .fpu_blocks_limit = CAMELLIA_AESNI_PARALLEL_BLOCKS,
134*4882a593Smuzhiyun
135*4882a593Smuzhiyun .funcs = { {
136*4882a593Smuzhiyun .num_blocks = CAMELLIA_AESNI_PARALLEL_BLOCKS,
137*4882a593Smuzhiyun .fn_u = { .xts = camellia_xts_dec_16way }
138*4882a593Smuzhiyun }, {
139*4882a593Smuzhiyun .num_blocks = 1,
140*4882a593Smuzhiyun .fn_u = { .xts = camellia_xts_dec }
141*4882a593Smuzhiyun } }
142*4882a593Smuzhiyun };
143*4882a593Smuzhiyun
/*
 * skcipher ->setkey hook for the ECB, CBC and CTR entries of camellia_algs[].
 * Looks up the transform's context and passes it, with the key, to
 * __camellia_setkey(), whose result is returned unchanged.
 */
static int camellia_setkey(struct crypto_skcipher *tfm, const u8 *key,
			   unsigned int keylen)
{
	struct camellia_ctx *cctx = crypto_skcipher_ctx(tfm);

	return __camellia_setkey(cctx, key, keylen);
}
149*4882a593Smuzhiyun
ecb_encrypt(struct skcipher_request * req)150*4882a593Smuzhiyun static int ecb_encrypt(struct skcipher_request *req)
151*4882a593Smuzhiyun {
152*4882a593Smuzhiyun return glue_ecb_req_128bit(&camellia_enc, req);
153*4882a593Smuzhiyun }
154*4882a593Smuzhiyun
ecb_decrypt(struct skcipher_request * req)155*4882a593Smuzhiyun static int ecb_decrypt(struct skcipher_request *req)
156*4882a593Smuzhiyun {
157*4882a593Smuzhiyun return glue_ecb_req_128bit(&camellia_dec, req);
158*4882a593Smuzhiyun }
159*4882a593Smuzhiyun
cbc_encrypt(struct skcipher_request * req)160*4882a593Smuzhiyun static int cbc_encrypt(struct skcipher_request *req)
161*4882a593Smuzhiyun {
162*4882a593Smuzhiyun return glue_cbc_encrypt_req_128bit(camellia_enc_blk, req);
163*4882a593Smuzhiyun }
164*4882a593Smuzhiyun
cbc_decrypt(struct skcipher_request * req)165*4882a593Smuzhiyun static int cbc_decrypt(struct skcipher_request *req)
166*4882a593Smuzhiyun {
167*4882a593Smuzhiyun return glue_cbc_decrypt_req_128bit(&camellia_dec_cbc, req);
168*4882a593Smuzhiyun }
169*4882a593Smuzhiyun
ctr_crypt(struct skcipher_request * req)170*4882a593Smuzhiyun static int ctr_crypt(struct skcipher_request *req)
171*4882a593Smuzhiyun {
172*4882a593Smuzhiyun return glue_ctr_req_128bit(&camellia_ctr, req);
173*4882a593Smuzhiyun }
174*4882a593Smuzhiyun
xts_camellia_setkey(struct crypto_skcipher * tfm,const u8 * key,unsigned int keylen)175*4882a593Smuzhiyun int xts_camellia_setkey(struct crypto_skcipher *tfm, const u8 *key,
176*4882a593Smuzhiyun unsigned int keylen)
177*4882a593Smuzhiyun {
178*4882a593Smuzhiyun struct camellia_xts_ctx *ctx = crypto_skcipher_ctx(tfm);
179*4882a593Smuzhiyun int err;
180*4882a593Smuzhiyun
181*4882a593Smuzhiyun err = xts_verify_key(tfm, key, keylen);
182*4882a593Smuzhiyun if (err)
183*4882a593Smuzhiyun return err;
184*4882a593Smuzhiyun
185*4882a593Smuzhiyun /* first half of xts-key is for crypt */
186*4882a593Smuzhiyun err = __camellia_setkey(&ctx->crypt_ctx, key, keylen / 2);
187*4882a593Smuzhiyun if (err)
188*4882a593Smuzhiyun return err;
189*4882a593Smuzhiyun
190*4882a593Smuzhiyun /* second half of xts-key is for tweak */
191*4882a593Smuzhiyun return __camellia_setkey(&ctx->tweak_ctx, key + keylen / 2, keylen / 2);
192*4882a593Smuzhiyun }
193*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(xts_camellia_setkey);
194*4882a593Smuzhiyun
xts_encrypt(struct skcipher_request * req)195*4882a593Smuzhiyun static int xts_encrypt(struct skcipher_request *req)
196*4882a593Smuzhiyun {
197*4882a593Smuzhiyun struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
198*4882a593Smuzhiyun struct camellia_xts_ctx *ctx = crypto_skcipher_ctx(tfm);
199*4882a593Smuzhiyun
200*4882a593Smuzhiyun return glue_xts_req_128bit(&camellia_enc_xts, req, camellia_enc_blk,
201*4882a593Smuzhiyun &ctx->tweak_ctx, &ctx->crypt_ctx, false);
202*4882a593Smuzhiyun }
203*4882a593Smuzhiyun
xts_decrypt(struct skcipher_request * req)204*4882a593Smuzhiyun static int xts_decrypt(struct skcipher_request *req)
205*4882a593Smuzhiyun {
206*4882a593Smuzhiyun struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
207*4882a593Smuzhiyun struct camellia_xts_ctx *ctx = crypto_skcipher_ctx(tfm);
208*4882a593Smuzhiyun
209*4882a593Smuzhiyun return glue_xts_req_128bit(&camellia_dec_xts, req, camellia_enc_blk,
210*4882a593Smuzhiyun &ctx->tweak_ctx, &ctx->crypt_ctx, true);
211*4882a593Smuzhiyun }
212*4882a593Smuzhiyun
213*4882a593Smuzhiyun static struct skcipher_alg camellia_algs[] = {
214*4882a593Smuzhiyun {
215*4882a593Smuzhiyun .base.cra_name = "__ecb(camellia)",
216*4882a593Smuzhiyun .base.cra_driver_name = "__ecb-camellia-aesni",
217*4882a593Smuzhiyun .base.cra_priority = 400,
218*4882a593Smuzhiyun .base.cra_flags = CRYPTO_ALG_INTERNAL,
219*4882a593Smuzhiyun .base.cra_blocksize = CAMELLIA_BLOCK_SIZE,
220*4882a593Smuzhiyun .base.cra_ctxsize = sizeof(struct camellia_ctx),
221*4882a593Smuzhiyun .base.cra_module = THIS_MODULE,
222*4882a593Smuzhiyun .min_keysize = CAMELLIA_MIN_KEY_SIZE,
223*4882a593Smuzhiyun .max_keysize = CAMELLIA_MAX_KEY_SIZE,
224*4882a593Smuzhiyun .setkey = camellia_setkey,
225*4882a593Smuzhiyun .encrypt = ecb_encrypt,
226*4882a593Smuzhiyun .decrypt = ecb_decrypt,
227*4882a593Smuzhiyun }, {
228*4882a593Smuzhiyun .base.cra_name = "__cbc(camellia)",
229*4882a593Smuzhiyun .base.cra_driver_name = "__cbc-camellia-aesni",
230*4882a593Smuzhiyun .base.cra_priority = 400,
231*4882a593Smuzhiyun .base.cra_flags = CRYPTO_ALG_INTERNAL,
232*4882a593Smuzhiyun .base.cra_blocksize = CAMELLIA_BLOCK_SIZE,
233*4882a593Smuzhiyun .base.cra_ctxsize = sizeof(struct camellia_ctx),
234*4882a593Smuzhiyun .base.cra_module = THIS_MODULE,
235*4882a593Smuzhiyun .min_keysize = CAMELLIA_MIN_KEY_SIZE,
236*4882a593Smuzhiyun .max_keysize = CAMELLIA_MAX_KEY_SIZE,
237*4882a593Smuzhiyun .ivsize = CAMELLIA_BLOCK_SIZE,
238*4882a593Smuzhiyun .setkey = camellia_setkey,
239*4882a593Smuzhiyun .encrypt = cbc_encrypt,
240*4882a593Smuzhiyun .decrypt = cbc_decrypt,
241*4882a593Smuzhiyun }, {
242*4882a593Smuzhiyun .base.cra_name = "__ctr(camellia)",
243*4882a593Smuzhiyun .base.cra_driver_name = "__ctr-camellia-aesni",
244*4882a593Smuzhiyun .base.cra_priority = 400,
245*4882a593Smuzhiyun .base.cra_flags = CRYPTO_ALG_INTERNAL,
246*4882a593Smuzhiyun .base.cra_blocksize = 1,
247*4882a593Smuzhiyun .base.cra_ctxsize = sizeof(struct camellia_ctx),
248*4882a593Smuzhiyun .base.cra_module = THIS_MODULE,
249*4882a593Smuzhiyun .min_keysize = CAMELLIA_MIN_KEY_SIZE,
250*4882a593Smuzhiyun .max_keysize = CAMELLIA_MAX_KEY_SIZE,
251*4882a593Smuzhiyun .ivsize = CAMELLIA_BLOCK_SIZE,
252*4882a593Smuzhiyun .chunksize = CAMELLIA_BLOCK_SIZE,
253*4882a593Smuzhiyun .setkey = camellia_setkey,
254*4882a593Smuzhiyun .encrypt = ctr_crypt,
255*4882a593Smuzhiyun .decrypt = ctr_crypt,
256*4882a593Smuzhiyun }, {
257*4882a593Smuzhiyun .base.cra_name = "__xts(camellia)",
258*4882a593Smuzhiyun .base.cra_driver_name = "__xts-camellia-aesni",
259*4882a593Smuzhiyun .base.cra_priority = 400,
260*4882a593Smuzhiyun .base.cra_flags = CRYPTO_ALG_INTERNAL,
261*4882a593Smuzhiyun .base.cra_blocksize = CAMELLIA_BLOCK_SIZE,
262*4882a593Smuzhiyun .base.cra_ctxsize = sizeof(struct camellia_xts_ctx),
263*4882a593Smuzhiyun .base.cra_module = THIS_MODULE,
264*4882a593Smuzhiyun .min_keysize = 2 * CAMELLIA_MIN_KEY_SIZE,
265*4882a593Smuzhiyun .max_keysize = 2 * CAMELLIA_MAX_KEY_SIZE,
266*4882a593Smuzhiyun .ivsize = CAMELLIA_BLOCK_SIZE,
267*4882a593Smuzhiyun .setkey = xts_camellia_setkey,
268*4882a593Smuzhiyun .encrypt = xts_encrypt,
269*4882a593Smuzhiyun .decrypt = xts_decrypt,
270*4882a593Smuzhiyun },
271*4882a593Smuzhiyun };
272*4882a593Smuzhiyun
273*4882a593Smuzhiyun static struct simd_skcipher_alg *camellia_simd_algs[ARRAY_SIZE(camellia_algs)];
274*4882a593Smuzhiyun
camellia_aesni_init(void)275*4882a593Smuzhiyun static int __init camellia_aesni_init(void)
276*4882a593Smuzhiyun {
277*4882a593Smuzhiyun const char *feature_name;
278*4882a593Smuzhiyun
279*4882a593Smuzhiyun if (!boot_cpu_has(X86_FEATURE_AVX) ||
280*4882a593Smuzhiyun !boot_cpu_has(X86_FEATURE_AES) ||
281*4882a593Smuzhiyun !boot_cpu_has(X86_FEATURE_OSXSAVE)) {
282*4882a593Smuzhiyun pr_info("AVX or AES-NI instructions are not detected.\n");
283*4882a593Smuzhiyun return -ENODEV;
284*4882a593Smuzhiyun }
285*4882a593Smuzhiyun
286*4882a593Smuzhiyun if (!cpu_has_xfeatures(XFEATURE_MASK_SSE | XFEATURE_MASK_YMM,
287*4882a593Smuzhiyun &feature_name)) {
288*4882a593Smuzhiyun pr_info("CPU feature '%s' is not supported.\n", feature_name);
289*4882a593Smuzhiyun return -ENODEV;
290*4882a593Smuzhiyun }
291*4882a593Smuzhiyun
292*4882a593Smuzhiyun return simd_register_skciphers_compat(camellia_algs,
293*4882a593Smuzhiyun ARRAY_SIZE(camellia_algs),
294*4882a593Smuzhiyun camellia_simd_algs);
295*4882a593Smuzhiyun }
296*4882a593Smuzhiyun
camellia_aesni_fini(void)297*4882a593Smuzhiyun static void __exit camellia_aesni_fini(void)
298*4882a593Smuzhiyun {
299*4882a593Smuzhiyun simd_unregister_skciphers(camellia_algs, ARRAY_SIZE(camellia_algs),
300*4882a593Smuzhiyun camellia_simd_algs);
301*4882a593Smuzhiyun }
302*4882a593Smuzhiyun
303*4882a593Smuzhiyun module_init(camellia_aesni_init);
304*4882a593Smuzhiyun module_exit(camellia_aesni_fini);
305*4882a593Smuzhiyun
306*4882a593Smuzhiyun MODULE_LICENSE("GPL");
307*4882a593Smuzhiyun MODULE_DESCRIPTION("Camellia Cipher Algorithm, AES-NI/AVX optimized");
308*4882a593Smuzhiyun MODULE_ALIAS_CRYPTO("camellia");
309*4882a593Smuzhiyun MODULE_ALIAS_CRYPTO("camellia-asm");
310