1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-only
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun * Accelerated CRC32(C) using ARM CRC, NEON and Crypto Extensions instructions
4*4882a593Smuzhiyun *
5*4882a593Smuzhiyun * Copyright (C) 2016 Linaro Ltd <ard.biesheuvel@linaro.org>
6*4882a593Smuzhiyun */
7*4882a593Smuzhiyun
8*4882a593Smuzhiyun #include <linux/cpufeature.h>
9*4882a593Smuzhiyun #include <linux/crc32.h>
10*4882a593Smuzhiyun #include <linux/init.h>
11*4882a593Smuzhiyun #include <linux/kernel.h>
12*4882a593Smuzhiyun #include <linux/module.h>
13*4882a593Smuzhiyun #include <linux/string.h>
14*4882a593Smuzhiyun
15*4882a593Smuzhiyun #include <crypto/internal/hash.h>
16*4882a593Smuzhiyun #include <crypto/internal/simd.h>
17*4882a593Smuzhiyun
18*4882a593Smuzhiyun #include <asm/hwcap.h>
19*4882a593Smuzhiyun #include <asm/neon.h>
20*4882a593Smuzhiyun #include <asm/simd.h>
21*4882a593Smuzhiyun #include <asm/unaligned.h>
22*4882a593Smuzhiyun
23*4882a593Smuzhiyun #define PMULL_MIN_LEN 64L /* minimum size of buffer
24*4882a593Smuzhiyun * for crc32_pmull_le_16 */
25*4882a593Smuzhiyun #define SCALE_F 16L /* size of NEON register */
26*4882a593Smuzhiyun
27*4882a593Smuzhiyun asmlinkage u32 crc32_pmull_le(const u8 buf[], u32 len, u32 init_crc);
28*4882a593Smuzhiyun asmlinkage u32 crc32_armv8_le(u32 init_crc, const u8 buf[], u32 len);
29*4882a593Smuzhiyun
30*4882a593Smuzhiyun asmlinkage u32 crc32c_pmull_le(const u8 buf[], u32 len, u32 init_crc);
31*4882a593Smuzhiyun asmlinkage u32 crc32c_armv8_le(u32 init_crc, const u8 buf[], u32 len);
32*4882a593Smuzhiyun
33*4882a593Smuzhiyun static u32 (*fallback_crc32)(u32 init_crc, const u8 buf[], u32 len);
34*4882a593Smuzhiyun static u32 (*fallback_crc32c)(u32 init_crc, const u8 buf[], u32 len);
35*4882a593Smuzhiyun
crc32_cra_init(struct crypto_tfm * tfm)36*4882a593Smuzhiyun static int crc32_cra_init(struct crypto_tfm *tfm)
37*4882a593Smuzhiyun {
38*4882a593Smuzhiyun u32 *key = crypto_tfm_ctx(tfm);
39*4882a593Smuzhiyun
40*4882a593Smuzhiyun *key = 0;
41*4882a593Smuzhiyun return 0;
42*4882a593Smuzhiyun }
43*4882a593Smuzhiyun
crc32c_cra_init(struct crypto_tfm * tfm)44*4882a593Smuzhiyun static int crc32c_cra_init(struct crypto_tfm *tfm)
45*4882a593Smuzhiyun {
46*4882a593Smuzhiyun u32 *key = crypto_tfm_ctx(tfm);
47*4882a593Smuzhiyun
48*4882a593Smuzhiyun *key = ~0;
49*4882a593Smuzhiyun return 0;
50*4882a593Smuzhiyun }
51*4882a593Smuzhiyun
crc32_setkey(struct crypto_shash * hash,const u8 * key,unsigned int keylen)52*4882a593Smuzhiyun static int crc32_setkey(struct crypto_shash *hash, const u8 *key,
53*4882a593Smuzhiyun unsigned int keylen)
54*4882a593Smuzhiyun {
55*4882a593Smuzhiyun u32 *mctx = crypto_shash_ctx(hash);
56*4882a593Smuzhiyun
57*4882a593Smuzhiyun if (keylen != sizeof(u32))
58*4882a593Smuzhiyun return -EINVAL;
59*4882a593Smuzhiyun *mctx = le32_to_cpup((__le32 *)key);
60*4882a593Smuzhiyun return 0;
61*4882a593Smuzhiyun }
62*4882a593Smuzhiyun
crc32_init(struct shash_desc * desc)63*4882a593Smuzhiyun static int crc32_init(struct shash_desc *desc)
64*4882a593Smuzhiyun {
65*4882a593Smuzhiyun u32 *mctx = crypto_shash_ctx(desc->tfm);
66*4882a593Smuzhiyun u32 *crc = shash_desc_ctx(desc);
67*4882a593Smuzhiyun
68*4882a593Smuzhiyun *crc = *mctx;
69*4882a593Smuzhiyun return 0;
70*4882a593Smuzhiyun }
71*4882a593Smuzhiyun
crc32_update(struct shash_desc * desc,const u8 * data,unsigned int length)72*4882a593Smuzhiyun static int crc32_update(struct shash_desc *desc, const u8 *data,
73*4882a593Smuzhiyun unsigned int length)
74*4882a593Smuzhiyun {
75*4882a593Smuzhiyun u32 *crc = shash_desc_ctx(desc);
76*4882a593Smuzhiyun
77*4882a593Smuzhiyun *crc = crc32_armv8_le(*crc, data, length);
78*4882a593Smuzhiyun return 0;
79*4882a593Smuzhiyun }
80*4882a593Smuzhiyun
crc32c_update(struct shash_desc * desc,const u8 * data,unsigned int length)81*4882a593Smuzhiyun static int crc32c_update(struct shash_desc *desc, const u8 *data,
82*4882a593Smuzhiyun unsigned int length)
83*4882a593Smuzhiyun {
84*4882a593Smuzhiyun u32 *crc = shash_desc_ctx(desc);
85*4882a593Smuzhiyun
86*4882a593Smuzhiyun *crc = crc32c_armv8_le(*crc, data, length);
87*4882a593Smuzhiyun return 0;
88*4882a593Smuzhiyun }
89*4882a593Smuzhiyun
/*
 * Emit the CRC32 digest: the request state is written to @out as a
 * little-endian 32-bit value, with no alignment requirement on @out.
 *
 * Always returns 0.
 */
static int crc32_final(struct shash_desc *desc, u8 *out)
{
	const u32 *state = shash_desc_ctx(desc);
	u32 digest = *state;

	put_unaligned_le32(digest, out);

	return 0;
}
97*4882a593Smuzhiyun
/*
 * Emit the CRC32C digest: the bitwise complement of the request state is
 * written to @out as a little-endian 32-bit value, with no alignment
 * requirement on @out.
 *
 * Always returns 0.
 */
static int crc32c_final(struct shash_desc *desc, u8 *out)
{
	const u32 *state = shash_desc_ctx(desc);
	u32 digest = ~*state;

	put_unaligned_le32(digest, out);

	return 0;
}
105*4882a593Smuzhiyun
crc32_pmull_update(struct shash_desc * desc,const u8 * data,unsigned int length)106*4882a593Smuzhiyun static int crc32_pmull_update(struct shash_desc *desc, const u8 *data,
107*4882a593Smuzhiyun unsigned int length)
108*4882a593Smuzhiyun {
109*4882a593Smuzhiyun u32 *crc = shash_desc_ctx(desc);
110*4882a593Smuzhiyun unsigned int l;
111*4882a593Smuzhiyun
112*4882a593Smuzhiyun if (crypto_simd_usable()) {
113*4882a593Smuzhiyun if ((u32)data % SCALE_F) {
114*4882a593Smuzhiyun l = min_t(u32, length, SCALE_F - ((u32)data % SCALE_F));
115*4882a593Smuzhiyun
116*4882a593Smuzhiyun *crc = fallback_crc32(*crc, data, l);
117*4882a593Smuzhiyun
118*4882a593Smuzhiyun data += l;
119*4882a593Smuzhiyun length -= l;
120*4882a593Smuzhiyun }
121*4882a593Smuzhiyun
122*4882a593Smuzhiyun if (length >= PMULL_MIN_LEN) {
123*4882a593Smuzhiyun l = round_down(length, SCALE_F);
124*4882a593Smuzhiyun
125*4882a593Smuzhiyun kernel_neon_begin();
126*4882a593Smuzhiyun *crc = crc32_pmull_le(data, l, *crc);
127*4882a593Smuzhiyun kernel_neon_end();
128*4882a593Smuzhiyun
129*4882a593Smuzhiyun data += l;
130*4882a593Smuzhiyun length -= l;
131*4882a593Smuzhiyun }
132*4882a593Smuzhiyun }
133*4882a593Smuzhiyun
134*4882a593Smuzhiyun if (length > 0)
135*4882a593Smuzhiyun *crc = fallback_crc32(*crc, data, length);
136*4882a593Smuzhiyun
137*4882a593Smuzhiyun return 0;
138*4882a593Smuzhiyun }
139*4882a593Smuzhiyun
crc32c_pmull_update(struct shash_desc * desc,const u8 * data,unsigned int length)140*4882a593Smuzhiyun static int crc32c_pmull_update(struct shash_desc *desc, const u8 *data,
141*4882a593Smuzhiyun unsigned int length)
142*4882a593Smuzhiyun {
143*4882a593Smuzhiyun u32 *crc = shash_desc_ctx(desc);
144*4882a593Smuzhiyun unsigned int l;
145*4882a593Smuzhiyun
146*4882a593Smuzhiyun if (crypto_simd_usable()) {
147*4882a593Smuzhiyun if ((u32)data % SCALE_F) {
148*4882a593Smuzhiyun l = min_t(u32, length, SCALE_F - ((u32)data % SCALE_F));
149*4882a593Smuzhiyun
150*4882a593Smuzhiyun *crc = fallback_crc32c(*crc, data, l);
151*4882a593Smuzhiyun
152*4882a593Smuzhiyun data += l;
153*4882a593Smuzhiyun length -= l;
154*4882a593Smuzhiyun }
155*4882a593Smuzhiyun
156*4882a593Smuzhiyun if (length >= PMULL_MIN_LEN) {
157*4882a593Smuzhiyun l = round_down(length, SCALE_F);
158*4882a593Smuzhiyun
159*4882a593Smuzhiyun kernel_neon_begin();
160*4882a593Smuzhiyun *crc = crc32c_pmull_le(data, l, *crc);
161*4882a593Smuzhiyun kernel_neon_end();
162*4882a593Smuzhiyun
163*4882a593Smuzhiyun data += l;
164*4882a593Smuzhiyun length -= l;
165*4882a593Smuzhiyun }
166*4882a593Smuzhiyun }
167*4882a593Smuzhiyun
168*4882a593Smuzhiyun if (length > 0)
169*4882a593Smuzhiyun *crc = fallback_crc32c(*crc, data, length);
170*4882a593Smuzhiyun
171*4882a593Smuzhiyun return 0;
172*4882a593Smuzhiyun }
173*4882a593Smuzhiyun
174*4882a593Smuzhiyun static struct shash_alg crc32_pmull_algs[] = { {
175*4882a593Smuzhiyun .setkey = crc32_setkey,
176*4882a593Smuzhiyun .init = crc32_init,
177*4882a593Smuzhiyun .update = crc32_update,
178*4882a593Smuzhiyun .final = crc32_final,
179*4882a593Smuzhiyun .descsize = sizeof(u32),
180*4882a593Smuzhiyun .digestsize = sizeof(u32),
181*4882a593Smuzhiyun
182*4882a593Smuzhiyun .base.cra_ctxsize = sizeof(u32),
183*4882a593Smuzhiyun .base.cra_init = crc32_cra_init,
184*4882a593Smuzhiyun .base.cra_name = "crc32",
185*4882a593Smuzhiyun .base.cra_driver_name = "crc32-arm-ce",
186*4882a593Smuzhiyun .base.cra_priority = 200,
187*4882a593Smuzhiyun .base.cra_flags = CRYPTO_ALG_OPTIONAL_KEY,
188*4882a593Smuzhiyun .base.cra_blocksize = 1,
189*4882a593Smuzhiyun .base.cra_module = THIS_MODULE,
190*4882a593Smuzhiyun }, {
191*4882a593Smuzhiyun .setkey = crc32_setkey,
192*4882a593Smuzhiyun .init = crc32_init,
193*4882a593Smuzhiyun .update = crc32c_update,
194*4882a593Smuzhiyun .final = crc32c_final,
195*4882a593Smuzhiyun .descsize = sizeof(u32),
196*4882a593Smuzhiyun .digestsize = sizeof(u32),
197*4882a593Smuzhiyun
198*4882a593Smuzhiyun .base.cra_ctxsize = sizeof(u32),
199*4882a593Smuzhiyun .base.cra_init = crc32c_cra_init,
200*4882a593Smuzhiyun .base.cra_name = "crc32c",
201*4882a593Smuzhiyun .base.cra_driver_name = "crc32c-arm-ce",
202*4882a593Smuzhiyun .base.cra_priority = 200,
203*4882a593Smuzhiyun .base.cra_flags = CRYPTO_ALG_OPTIONAL_KEY,
204*4882a593Smuzhiyun .base.cra_blocksize = 1,
205*4882a593Smuzhiyun .base.cra_module = THIS_MODULE,
206*4882a593Smuzhiyun } };
207*4882a593Smuzhiyun
crc32_pmull_mod_init(void)208*4882a593Smuzhiyun static int __init crc32_pmull_mod_init(void)
209*4882a593Smuzhiyun {
210*4882a593Smuzhiyun if (elf_hwcap2 & HWCAP2_PMULL) {
211*4882a593Smuzhiyun crc32_pmull_algs[0].update = crc32_pmull_update;
212*4882a593Smuzhiyun crc32_pmull_algs[1].update = crc32c_pmull_update;
213*4882a593Smuzhiyun
214*4882a593Smuzhiyun if (elf_hwcap2 & HWCAP2_CRC32) {
215*4882a593Smuzhiyun fallback_crc32 = crc32_armv8_le;
216*4882a593Smuzhiyun fallback_crc32c = crc32c_armv8_le;
217*4882a593Smuzhiyun } else {
218*4882a593Smuzhiyun fallback_crc32 = crc32_le;
219*4882a593Smuzhiyun fallback_crc32c = __crc32c_le;
220*4882a593Smuzhiyun }
221*4882a593Smuzhiyun } else if (!(elf_hwcap2 & HWCAP2_CRC32)) {
222*4882a593Smuzhiyun return -ENODEV;
223*4882a593Smuzhiyun }
224*4882a593Smuzhiyun
225*4882a593Smuzhiyun return crypto_register_shashes(crc32_pmull_algs,
226*4882a593Smuzhiyun ARRAY_SIZE(crc32_pmull_algs));
227*4882a593Smuzhiyun }
228*4882a593Smuzhiyun
crc32_pmull_mod_exit(void)229*4882a593Smuzhiyun static void __exit crc32_pmull_mod_exit(void)
230*4882a593Smuzhiyun {
231*4882a593Smuzhiyun crypto_unregister_shashes(crc32_pmull_algs,
232*4882a593Smuzhiyun ARRAY_SIZE(crc32_pmull_algs));
233*4882a593Smuzhiyun }
234*4882a593Smuzhiyun
235*4882a593Smuzhiyun static const struct cpu_feature __maybe_unused crc32_cpu_feature[] = {
236*4882a593Smuzhiyun { cpu_feature(CRC32) }, { cpu_feature(PMULL) }, { }
237*4882a593Smuzhiyun };
238*4882a593Smuzhiyun MODULE_DEVICE_TABLE(cpu, crc32_cpu_feature);
239*4882a593Smuzhiyun
240*4882a593Smuzhiyun module_init(crc32_pmull_mod_init);
241*4882a593Smuzhiyun module_exit(crc32_pmull_mod_exit);
242*4882a593Smuzhiyun
243*4882a593Smuzhiyun MODULE_AUTHOR("Ard Biesheuvel <ard.biesheuvel@linaro.org>");
244*4882a593Smuzhiyun MODULE_LICENSE("GPL v2");
245*4882a593Smuzhiyun MODULE_ALIAS_CRYPTO("crc32");
246*4882a593Smuzhiyun MODULE_ALIAS_CRYPTO("crc32c");
247