1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun * OpenSSL/Cryptogams accelerated Poly1305 transform for MIPS
4*4882a593Smuzhiyun *
5*4882a593Smuzhiyun * Copyright (C) 2019 Linaro Ltd. <ard.biesheuvel@linaro.org>
6*4882a593Smuzhiyun */
7*4882a593Smuzhiyun
8*4882a593Smuzhiyun #include <asm/unaligned.h>
9*4882a593Smuzhiyun #include <crypto/algapi.h>
10*4882a593Smuzhiyun #include <crypto/internal/hash.h>
11*4882a593Smuzhiyun #include <crypto/internal/poly1305.h>
12*4882a593Smuzhiyun #include <linux/cpufeature.h>
13*4882a593Smuzhiyun #include <linux/crypto.h>
14*4882a593Smuzhiyun #include <linux/module.h>
15*4882a593Smuzhiyun
16*4882a593Smuzhiyun asmlinkage void poly1305_init_mips(void *state, const u8 *key);
17*4882a593Smuzhiyun asmlinkage void poly1305_blocks_mips(void *state, const u8 *src, u32 len, u32 hibit);
18*4882a593Smuzhiyun asmlinkage void poly1305_emit_mips(void *state, u8 *digest, const u32 *nonce);
19*4882a593Smuzhiyun
poly1305_init_arch(struct poly1305_desc_ctx * dctx,const u8 key[POLY1305_KEY_SIZE])20*4882a593Smuzhiyun void poly1305_init_arch(struct poly1305_desc_ctx *dctx, const u8 key[POLY1305_KEY_SIZE])
21*4882a593Smuzhiyun {
22*4882a593Smuzhiyun poly1305_init_mips(&dctx->h, key);
23*4882a593Smuzhiyun dctx->s[0] = get_unaligned_le32(key + 16);
24*4882a593Smuzhiyun dctx->s[1] = get_unaligned_le32(key + 20);
25*4882a593Smuzhiyun dctx->s[2] = get_unaligned_le32(key + 24);
26*4882a593Smuzhiyun dctx->s[3] = get_unaligned_le32(key + 28);
27*4882a593Smuzhiyun dctx->buflen = 0;
28*4882a593Smuzhiyun }
29*4882a593Smuzhiyun EXPORT_SYMBOL(poly1305_init_arch);
30*4882a593Smuzhiyun
mips_poly1305_init(struct shash_desc * desc)31*4882a593Smuzhiyun static int mips_poly1305_init(struct shash_desc *desc)
32*4882a593Smuzhiyun {
33*4882a593Smuzhiyun struct poly1305_desc_ctx *dctx = shash_desc_ctx(desc);
34*4882a593Smuzhiyun
35*4882a593Smuzhiyun dctx->buflen = 0;
36*4882a593Smuzhiyun dctx->rset = 0;
37*4882a593Smuzhiyun dctx->sset = false;
38*4882a593Smuzhiyun
39*4882a593Smuzhiyun return 0;
40*4882a593Smuzhiyun }
41*4882a593Smuzhiyun
mips_poly1305_blocks(struct poly1305_desc_ctx * dctx,const u8 * src,u32 len,u32 hibit)42*4882a593Smuzhiyun static void mips_poly1305_blocks(struct poly1305_desc_ctx *dctx, const u8 *src,
43*4882a593Smuzhiyun u32 len, u32 hibit)
44*4882a593Smuzhiyun {
45*4882a593Smuzhiyun if (unlikely(!dctx->sset)) {
46*4882a593Smuzhiyun if (!dctx->rset) {
47*4882a593Smuzhiyun poly1305_init_mips(&dctx->h, src);
48*4882a593Smuzhiyun src += POLY1305_BLOCK_SIZE;
49*4882a593Smuzhiyun len -= POLY1305_BLOCK_SIZE;
50*4882a593Smuzhiyun dctx->rset = 1;
51*4882a593Smuzhiyun }
52*4882a593Smuzhiyun if (len >= POLY1305_BLOCK_SIZE) {
53*4882a593Smuzhiyun dctx->s[0] = get_unaligned_le32(src + 0);
54*4882a593Smuzhiyun dctx->s[1] = get_unaligned_le32(src + 4);
55*4882a593Smuzhiyun dctx->s[2] = get_unaligned_le32(src + 8);
56*4882a593Smuzhiyun dctx->s[3] = get_unaligned_le32(src + 12);
57*4882a593Smuzhiyun src += POLY1305_BLOCK_SIZE;
58*4882a593Smuzhiyun len -= POLY1305_BLOCK_SIZE;
59*4882a593Smuzhiyun dctx->sset = true;
60*4882a593Smuzhiyun }
61*4882a593Smuzhiyun if (len < POLY1305_BLOCK_SIZE)
62*4882a593Smuzhiyun return;
63*4882a593Smuzhiyun }
64*4882a593Smuzhiyun
65*4882a593Smuzhiyun len &= ~(POLY1305_BLOCK_SIZE - 1);
66*4882a593Smuzhiyun
67*4882a593Smuzhiyun poly1305_blocks_mips(&dctx->h, src, len, hibit);
68*4882a593Smuzhiyun }
69*4882a593Smuzhiyun
mips_poly1305_update(struct shash_desc * desc,const u8 * src,unsigned int len)70*4882a593Smuzhiyun static int mips_poly1305_update(struct shash_desc *desc, const u8 *src,
71*4882a593Smuzhiyun unsigned int len)
72*4882a593Smuzhiyun {
73*4882a593Smuzhiyun struct poly1305_desc_ctx *dctx = shash_desc_ctx(desc);
74*4882a593Smuzhiyun
75*4882a593Smuzhiyun if (unlikely(dctx->buflen)) {
76*4882a593Smuzhiyun u32 bytes = min(len, POLY1305_BLOCK_SIZE - dctx->buflen);
77*4882a593Smuzhiyun
78*4882a593Smuzhiyun memcpy(dctx->buf + dctx->buflen, src, bytes);
79*4882a593Smuzhiyun src += bytes;
80*4882a593Smuzhiyun len -= bytes;
81*4882a593Smuzhiyun dctx->buflen += bytes;
82*4882a593Smuzhiyun
83*4882a593Smuzhiyun if (dctx->buflen == POLY1305_BLOCK_SIZE) {
84*4882a593Smuzhiyun mips_poly1305_blocks(dctx, dctx->buf, POLY1305_BLOCK_SIZE, 1);
85*4882a593Smuzhiyun dctx->buflen = 0;
86*4882a593Smuzhiyun }
87*4882a593Smuzhiyun }
88*4882a593Smuzhiyun
89*4882a593Smuzhiyun if (likely(len >= POLY1305_BLOCK_SIZE)) {
90*4882a593Smuzhiyun mips_poly1305_blocks(dctx, src, len, 1);
91*4882a593Smuzhiyun src += round_down(len, POLY1305_BLOCK_SIZE);
92*4882a593Smuzhiyun len %= POLY1305_BLOCK_SIZE;
93*4882a593Smuzhiyun }
94*4882a593Smuzhiyun
95*4882a593Smuzhiyun if (unlikely(len)) {
96*4882a593Smuzhiyun dctx->buflen = len;
97*4882a593Smuzhiyun memcpy(dctx->buf, src, len);
98*4882a593Smuzhiyun }
99*4882a593Smuzhiyun return 0;
100*4882a593Smuzhiyun }
101*4882a593Smuzhiyun
poly1305_update_arch(struct poly1305_desc_ctx * dctx,const u8 * src,unsigned int nbytes)102*4882a593Smuzhiyun void poly1305_update_arch(struct poly1305_desc_ctx *dctx, const u8 *src,
103*4882a593Smuzhiyun unsigned int nbytes)
104*4882a593Smuzhiyun {
105*4882a593Smuzhiyun if (unlikely(dctx->buflen)) {
106*4882a593Smuzhiyun u32 bytes = min(nbytes, POLY1305_BLOCK_SIZE - dctx->buflen);
107*4882a593Smuzhiyun
108*4882a593Smuzhiyun memcpy(dctx->buf + dctx->buflen, src, bytes);
109*4882a593Smuzhiyun src += bytes;
110*4882a593Smuzhiyun nbytes -= bytes;
111*4882a593Smuzhiyun dctx->buflen += bytes;
112*4882a593Smuzhiyun
113*4882a593Smuzhiyun if (dctx->buflen == POLY1305_BLOCK_SIZE) {
114*4882a593Smuzhiyun poly1305_blocks_mips(&dctx->h, dctx->buf,
115*4882a593Smuzhiyun POLY1305_BLOCK_SIZE, 1);
116*4882a593Smuzhiyun dctx->buflen = 0;
117*4882a593Smuzhiyun }
118*4882a593Smuzhiyun }
119*4882a593Smuzhiyun
120*4882a593Smuzhiyun if (likely(nbytes >= POLY1305_BLOCK_SIZE)) {
121*4882a593Smuzhiyun unsigned int len = round_down(nbytes, POLY1305_BLOCK_SIZE);
122*4882a593Smuzhiyun
123*4882a593Smuzhiyun poly1305_blocks_mips(&dctx->h, src, len, 1);
124*4882a593Smuzhiyun src += len;
125*4882a593Smuzhiyun nbytes %= POLY1305_BLOCK_SIZE;
126*4882a593Smuzhiyun }
127*4882a593Smuzhiyun
128*4882a593Smuzhiyun if (unlikely(nbytes)) {
129*4882a593Smuzhiyun dctx->buflen = nbytes;
130*4882a593Smuzhiyun memcpy(dctx->buf, src, nbytes);
131*4882a593Smuzhiyun }
132*4882a593Smuzhiyun }
133*4882a593Smuzhiyun EXPORT_SYMBOL(poly1305_update_arch);
134*4882a593Smuzhiyun
poly1305_final_arch(struct poly1305_desc_ctx * dctx,u8 * dst)135*4882a593Smuzhiyun void poly1305_final_arch(struct poly1305_desc_ctx *dctx, u8 *dst)
136*4882a593Smuzhiyun {
137*4882a593Smuzhiyun if (unlikely(dctx->buflen)) {
138*4882a593Smuzhiyun dctx->buf[dctx->buflen++] = 1;
139*4882a593Smuzhiyun memset(dctx->buf + dctx->buflen, 0,
140*4882a593Smuzhiyun POLY1305_BLOCK_SIZE - dctx->buflen);
141*4882a593Smuzhiyun poly1305_blocks_mips(&dctx->h, dctx->buf, POLY1305_BLOCK_SIZE, 0);
142*4882a593Smuzhiyun }
143*4882a593Smuzhiyun
144*4882a593Smuzhiyun poly1305_emit_mips(&dctx->h, dst, dctx->s);
145*4882a593Smuzhiyun *dctx = (struct poly1305_desc_ctx){};
146*4882a593Smuzhiyun }
147*4882a593Smuzhiyun EXPORT_SYMBOL(poly1305_final_arch);
148*4882a593Smuzhiyun
mips_poly1305_final(struct shash_desc * desc,u8 * dst)149*4882a593Smuzhiyun static int mips_poly1305_final(struct shash_desc *desc, u8 *dst)
150*4882a593Smuzhiyun {
151*4882a593Smuzhiyun struct poly1305_desc_ctx *dctx = shash_desc_ctx(desc);
152*4882a593Smuzhiyun
153*4882a593Smuzhiyun if (unlikely(!dctx->sset))
154*4882a593Smuzhiyun return -ENOKEY;
155*4882a593Smuzhiyun
156*4882a593Smuzhiyun poly1305_final_arch(dctx, dst);
157*4882a593Smuzhiyun return 0;
158*4882a593Smuzhiyun }
159*4882a593Smuzhiyun
160*4882a593Smuzhiyun static struct shash_alg mips_poly1305_alg = {
161*4882a593Smuzhiyun .init = mips_poly1305_init,
162*4882a593Smuzhiyun .update = mips_poly1305_update,
163*4882a593Smuzhiyun .final = mips_poly1305_final,
164*4882a593Smuzhiyun .digestsize = POLY1305_DIGEST_SIZE,
165*4882a593Smuzhiyun .descsize = sizeof(struct poly1305_desc_ctx),
166*4882a593Smuzhiyun
167*4882a593Smuzhiyun .base.cra_name = "poly1305",
168*4882a593Smuzhiyun .base.cra_driver_name = "poly1305-mips",
169*4882a593Smuzhiyun .base.cra_priority = 200,
170*4882a593Smuzhiyun .base.cra_blocksize = POLY1305_BLOCK_SIZE,
171*4882a593Smuzhiyun .base.cra_module = THIS_MODULE,
172*4882a593Smuzhiyun };
173*4882a593Smuzhiyun
mips_poly1305_mod_init(void)174*4882a593Smuzhiyun static int __init mips_poly1305_mod_init(void)
175*4882a593Smuzhiyun {
176*4882a593Smuzhiyun return IS_REACHABLE(CONFIG_CRYPTO_HASH) ?
177*4882a593Smuzhiyun crypto_register_shash(&mips_poly1305_alg) : 0;
178*4882a593Smuzhiyun }
179*4882a593Smuzhiyun
mips_poly1305_mod_exit(void)180*4882a593Smuzhiyun static void __exit mips_poly1305_mod_exit(void)
181*4882a593Smuzhiyun {
182*4882a593Smuzhiyun if (IS_REACHABLE(CONFIG_CRYPTO_HASH))
183*4882a593Smuzhiyun crypto_unregister_shash(&mips_poly1305_alg);
184*4882a593Smuzhiyun }
185*4882a593Smuzhiyun
186*4882a593Smuzhiyun module_init(mips_poly1305_mod_init);
187*4882a593Smuzhiyun module_exit(mips_poly1305_mod_exit);
188*4882a593Smuzhiyun
189*4882a593Smuzhiyun MODULE_LICENSE("GPL v2");
190*4882a593Smuzhiyun MODULE_ALIAS_CRYPTO("poly1305");
191*4882a593Smuzhiyun MODULE_ALIAS_CRYPTO("poly1305-mips");
192