1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-only
2*4882a593Smuzhiyun #include <linux/crc32.h>
3*4882a593Smuzhiyun #include <crypto/internal/hash.h>
4*4882a593Smuzhiyun #include <crypto/internal/simd.h>
5*4882a593Smuzhiyun #include <linux/init.h>
6*4882a593Smuzhiyun #include <linux/module.h>
7*4882a593Smuzhiyun #include <linux/string.h>
8*4882a593Smuzhiyun #include <linux/kernel.h>
9*4882a593Smuzhiyun #include <linux/cpufeature.h>
10*4882a593Smuzhiyun #include <asm/simd.h>
11*4882a593Smuzhiyun #include <asm/switch_to.h>
12*4882a593Smuzhiyun
13*4882a593Smuzhiyun #define CHKSUM_BLOCK_SIZE 1
14*4882a593Smuzhiyun #define CHKSUM_DIGEST_SIZE 4
15*4882a593Smuzhiyun
16*4882a593Smuzhiyun #define VMX_ALIGN 16
17*4882a593Smuzhiyun #define VMX_ALIGN_MASK (VMX_ALIGN-1)
18*4882a593Smuzhiyun
19*4882a593Smuzhiyun #define VECTOR_BREAKPOINT 512
20*4882a593Smuzhiyun
21*4882a593Smuzhiyun u32 __crc32c_vpmsum(u32 crc, unsigned char const *p, size_t len);
22*4882a593Smuzhiyun
/*
 * crc32c_vpmsum() - fold @len bytes at @p into the running CRC32C @crc.
 *
 * The buffer is processed in up to three pieces:
 *   head - bytes before the first VMX_ALIGN boundary, via __crc32c_le()
 *   bulk - the largest multiple of VMX_ALIGN that follows, via
 *          __crc32c_vpmsum()
 *   rest - whatever is left (fewer than VMX_ALIGN bytes), via __crc32c_le()
 *
 * Inputs shorter than VECTOR_BREAKPOINT + VMX_ALIGN bytes, or calls made
 * while crypto_simd_usable() reports false, are handled entirely by
 * __crc32c_le().
 *
 * Returns the updated CRC value.
 */
static u32 crc32c_vpmsum(u32 crc, unsigned char const *p, size_t len)
{
	unsigned long misalign;
	size_t head;
	size_t bulk;
	size_t rest;

	/* Length is tested first, so SIMD usability is only queried for large inputs. */
	if (!(len >= (VECTOR_BREAKPOINT + VMX_ALIGN) && crypto_simd_usable()))
		return __crc32c_le(crc, p, len);

	/* Consume the unaligned leading bytes so that p lands on a boundary. */
	misalign = (unsigned long)p & VMX_ALIGN_MASK;
	if (misalign) {
		head = VMX_ALIGN - misalign;
		crc = __crc32c_le(crc, p, head);
		p += head;
		len -= head;
	}

	/* Whole VMX_ALIGN-sized chunks go through the vector routine. */
	bulk = len & ~VMX_ALIGN_MASK;
	if (bulk) {
		/*
		 * The vector call is bracketed by preemption and page-fault
		 * disabling, with AltiVec enabled for kernel use in between.
		 */
		preempt_disable();
		pagefault_disable();
		enable_kernel_altivec();
		crc = __crc32c_vpmsum(crc, p, bulk);
		disable_kernel_altivec();
		pagefault_enable();
		preempt_enable();
	}

	/* Trailing bytes that do not fill a whole chunk. */
	rest = len & VMX_ALIGN_MASK;
	if (rest)
		crc = __crc32c_le(crc, p + bulk, rest);

	return crc;
}
56*4882a593Smuzhiyun
crc32c_vpmsum_cra_init(struct crypto_tfm * tfm)57*4882a593Smuzhiyun static int crc32c_vpmsum_cra_init(struct crypto_tfm *tfm)
58*4882a593Smuzhiyun {
59*4882a593Smuzhiyun u32 *key = crypto_tfm_ctx(tfm);
60*4882a593Smuzhiyun
61*4882a593Smuzhiyun *key = ~0;
62*4882a593Smuzhiyun
63*4882a593Smuzhiyun return 0;
64*4882a593Smuzhiyun }
65*4882a593Smuzhiyun
66*4882a593Smuzhiyun /*
67*4882a593Smuzhiyun * Setting the seed allows arbitrary accumulators and flexible XOR policy
68*4882a593Smuzhiyun * If your algorithm starts with ~0, then XOR with ~0 before you set
69*4882a593Smuzhiyun * the seed.
70*4882a593Smuzhiyun */
crc32c_vpmsum_setkey(struct crypto_shash * hash,const u8 * key,unsigned int keylen)71*4882a593Smuzhiyun static int crc32c_vpmsum_setkey(struct crypto_shash *hash, const u8 *key,
72*4882a593Smuzhiyun unsigned int keylen)
73*4882a593Smuzhiyun {
74*4882a593Smuzhiyun u32 *mctx = crypto_shash_ctx(hash);
75*4882a593Smuzhiyun
76*4882a593Smuzhiyun if (keylen != sizeof(u32))
77*4882a593Smuzhiyun return -EINVAL;
78*4882a593Smuzhiyun *mctx = le32_to_cpup((__le32 *)key);
79*4882a593Smuzhiyun return 0;
80*4882a593Smuzhiyun }
81*4882a593Smuzhiyun
crc32c_vpmsum_init(struct shash_desc * desc)82*4882a593Smuzhiyun static int crc32c_vpmsum_init(struct shash_desc *desc)
83*4882a593Smuzhiyun {
84*4882a593Smuzhiyun u32 *mctx = crypto_shash_ctx(desc->tfm);
85*4882a593Smuzhiyun u32 *crcp = shash_desc_ctx(desc);
86*4882a593Smuzhiyun
87*4882a593Smuzhiyun *crcp = *mctx;
88*4882a593Smuzhiyun
89*4882a593Smuzhiyun return 0;
90*4882a593Smuzhiyun }
91*4882a593Smuzhiyun
crc32c_vpmsum_update(struct shash_desc * desc,const u8 * data,unsigned int len)92*4882a593Smuzhiyun static int crc32c_vpmsum_update(struct shash_desc *desc, const u8 *data,
93*4882a593Smuzhiyun unsigned int len)
94*4882a593Smuzhiyun {
95*4882a593Smuzhiyun u32 *crcp = shash_desc_ctx(desc);
96*4882a593Smuzhiyun
97*4882a593Smuzhiyun *crcp = crc32c_vpmsum(*crcp, data, len);
98*4882a593Smuzhiyun
99*4882a593Smuzhiyun return 0;
100*4882a593Smuzhiyun }
101*4882a593Smuzhiyun
/*
 * __crc32c_vpmsum_finup() - process the last chunk and emit the digest.
 *
 * Starts from the value at @crcp, folds in @len bytes of @data, then stores
 * the bitwise complement of the result at @out as a little-endian 32-bit
 * value.  The value at @crcp itself is left unmodified.  Always returns 0.
 */
static int __crc32c_vpmsum_finup(u32 *crcp, const u8 *data, unsigned int len,
				 u8 *out)
{
	u32 crc = crc32c_vpmsum(*crcp, data, len);
	__le32 *digest = (__le32 *)out;

	*digest = ~cpu_to_le32(crc);

	return 0;
}
109*4882a593Smuzhiyun
/*
 * crc32c_vpmsum_finup() - shash .finup hook.
 *
 * Finishes the operation using the running CRC held in the descriptor
 * state as the starting value; see __crc32c_vpmsum_finup() for the output
 * format.
 */
static int crc32c_vpmsum_finup(struct shash_desc *desc, const u8 *data,
			       unsigned int len, u8 *out)
{
	u32 *state = shash_desc_ctx(desc);

	return __crc32c_vpmsum_finup(state, data, len, out);
}
115*4882a593Smuzhiyun
/*
 * crc32c_vpmsum_final() - shash .final hook.
 *
 * Stores the bitwise complement of the running CRC from the descriptor
 * state at @out as a little-endian 32-bit value.  No further data is
 * consumed.  Always returns 0.
 */
static int crc32c_vpmsum_final(struct shash_desc *desc, u8 *out)
{
	const u32 *state = shash_desc_ctx(desc);
	__le32 *digest = (__le32 *)out;

	*digest = ~cpu_to_le32p(state);

	return 0;
}
124*4882a593Smuzhiyun
/*
 * crc32c_vpmsum_digest() - shash .digest hook (one-shot hashing).
 *
 * Uses the seed held in the transform context as the starting value, so
 * the descriptor state is neither read nor written; see
 * __crc32c_vpmsum_finup() for the output format.
 */
static int crc32c_vpmsum_digest(struct shash_desc *desc, const u8 *data,
				unsigned int len, u8 *out)
{
	u32 *seed = crypto_shash_ctx(desc->tfm);

	return __crc32c_vpmsum_finup(seed, data, len, out);
}
131*4882a593Smuzhiyun
132*4882a593Smuzhiyun static struct shash_alg alg = {
133*4882a593Smuzhiyun .setkey = crc32c_vpmsum_setkey,
134*4882a593Smuzhiyun .init = crc32c_vpmsum_init,
135*4882a593Smuzhiyun .update = crc32c_vpmsum_update,
136*4882a593Smuzhiyun .final = crc32c_vpmsum_final,
137*4882a593Smuzhiyun .finup = crc32c_vpmsum_finup,
138*4882a593Smuzhiyun .digest = crc32c_vpmsum_digest,
139*4882a593Smuzhiyun .descsize = sizeof(u32),
140*4882a593Smuzhiyun .digestsize = CHKSUM_DIGEST_SIZE,
141*4882a593Smuzhiyun .base = {
142*4882a593Smuzhiyun .cra_name = "crc32c",
143*4882a593Smuzhiyun .cra_driver_name = "crc32c-vpmsum",
144*4882a593Smuzhiyun .cra_priority = 200,
145*4882a593Smuzhiyun .cra_flags = CRYPTO_ALG_OPTIONAL_KEY,
146*4882a593Smuzhiyun .cra_blocksize = CHKSUM_BLOCK_SIZE,
147*4882a593Smuzhiyun .cra_ctxsize = sizeof(u32),
148*4882a593Smuzhiyun .cra_module = THIS_MODULE,
149*4882a593Smuzhiyun .cra_init = crc32c_vpmsum_cra_init,
150*4882a593Smuzhiyun }
151*4882a593Smuzhiyun };
152*4882a593Smuzhiyun
crc32c_vpmsum_mod_init(void)153*4882a593Smuzhiyun static int __init crc32c_vpmsum_mod_init(void)
154*4882a593Smuzhiyun {
155*4882a593Smuzhiyun if (!cpu_has_feature(CPU_FTR_ARCH_207S))
156*4882a593Smuzhiyun return -ENODEV;
157*4882a593Smuzhiyun
158*4882a593Smuzhiyun return crypto_register_shash(&alg);
159*4882a593Smuzhiyun }
160*4882a593Smuzhiyun
crc32c_vpmsum_mod_fini(void)161*4882a593Smuzhiyun static void __exit crc32c_vpmsum_mod_fini(void)
162*4882a593Smuzhiyun {
163*4882a593Smuzhiyun crypto_unregister_shash(&alg);
164*4882a593Smuzhiyun }
165*4882a593Smuzhiyun
166*4882a593Smuzhiyun module_cpu_feature_match(PPC_MODULE_FEATURE_VEC_CRYPTO, crc32c_vpmsum_mod_init);
167*4882a593Smuzhiyun module_exit(crc32c_vpmsum_mod_fini);
168*4882a593Smuzhiyun
169*4882a593Smuzhiyun MODULE_AUTHOR("Anton Blanchard <anton@samba.org>");
170*4882a593Smuzhiyun MODULE_DESCRIPTION("CRC32C using vector polynomial multiply-sum instructions");
171*4882a593Smuzhiyun MODULE_LICENSE("GPL");
172*4882a593Smuzhiyun MODULE_ALIAS_CRYPTO("crc32c");
173*4882a593Smuzhiyun MODULE_ALIAS_CRYPTO("crc32c-vpmsum");
174