1*4882a593Smuzhiyun /* GPL HEADER START
2*4882a593Smuzhiyun *
3*4882a593Smuzhiyun * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
4*4882a593Smuzhiyun *
5*4882a593Smuzhiyun * This program is free software; you can redistribute it and/or modify
6*4882a593Smuzhiyun * it under the terms of the GNU General Public License version 2 only,
7*4882a593Smuzhiyun * as published by the Free Software Foundation.
8*4882a593Smuzhiyun *
9*4882a593Smuzhiyun * This program is distributed in the hope that it will be useful, but
10*4882a593Smuzhiyun * WITHOUT ANY WARRANTY; without even the implied warranty of
11*4882a593Smuzhiyun * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
12*4882a593Smuzhiyun * General Public License version 2 for more details (a copy is included
13*4882a593Smuzhiyun * in the LICENSE file that accompanied this code).
14*4882a593Smuzhiyun *
15*4882a593Smuzhiyun * You should have received a copy of the GNU General Public License
16*4882a593Smuzhiyun * version 2 along with this program; If not, see http://www.gnu.org/licenses
17*4882a593Smuzhiyun *
18*4882a593Smuzhiyun * Please visit http://www.xyratex.com/contact if you need additional
19*4882a593Smuzhiyun * information or have any questions.
20*4882a593Smuzhiyun *
21*4882a593Smuzhiyun * GPL HEADER END
22*4882a593Smuzhiyun */
23*4882a593Smuzhiyun
/*
 * Copyright 2012 Xyratex Technology Limited
 *
 * Wrappers for kernel crypto shash api to pclmulqdq crc32 implementation.
 */
29*4882a593Smuzhiyun #include <linux/init.h>
30*4882a593Smuzhiyun #include <linux/module.h>
31*4882a593Smuzhiyun #include <linux/string.h>
32*4882a593Smuzhiyun #include <linux/kernel.h>
33*4882a593Smuzhiyun #include <linux/crc32.h>
34*4882a593Smuzhiyun #include <crypto/internal/hash.h>
35*4882a593Smuzhiyun #include <crypto/internal/simd.h>
36*4882a593Smuzhiyun
37*4882a593Smuzhiyun #include <asm/cpufeatures.h>
38*4882a593Smuzhiyun #include <asm/cpu_device_id.h>
39*4882a593Smuzhiyun #include <asm/simd.h>
40*4882a593Smuzhiyun
/* Values advertised in the shash algorithm descriptor (bytes). */
#define CHKSUM_BLOCK_SIZE	1
#define CHKSUM_DIGEST_SIZE	4

/* Minimum size of buffer for crc32_pclmul_le_16. */
#define PCLMUL_MIN_LEN		64L

/* Size of an xmm register, and the mask for offsets within one. */
#define SCALE_F			16L
#define SCALE_F_MASK		(SCALE_F - 1)
48*4882a593Smuzhiyun
49*4882a593Smuzhiyun u32 crc32_pclmul_le_16(unsigned char const *buffer, size_t len, u32 crc32);
50*4882a593Smuzhiyun
51*4882a593Smuzhiyun static u32 __attribute__((pure))
crc32_pclmul_le(u32 crc,unsigned char const * p,size_t len)52*4882a593Smuzhiyun crc32_pclmul_le(u32 crc, unsigned char const *p, size_t len)
53*4882a593Smuzhiyun {
54*4882a593Smuzhiyun unsigned int iquotient;
55*4882a593Smuzhiyun unsigned int iremainder;
56*4882a593Smuzhiyun unsigned int prealign;
57*4882a593Smuzhiyun
58*4882a593Smuzhiyun if (len < PCLMUL_MIN_LEN + SCALE_F_MASK || !crypto_simd_usable())
59*4882a593Smuzhiyun return crc32_le(crc, p, len);
60*4882a593Smuzhiyun
61*4882a593Smuzhiyun if ((long)p & SCALE_F_MASK) {
62*4882a593Smuzhiyun /* align p to 16 byte */
63*4882a593Smuzhiyun prealign = SCALE_F - ((long)p & SCALE_F_MASK);
64*4882a593Smuzhiyun
65*4882a593Smuzhiyun crc = crc32_le(crc, p, prealign);
66*4882a593Smuzhiyun len -= prealign;
67*4882a593Smuzhiyun p = (unsigned char *)(((unsigned long)p + SCALE_F_MASK) &
68*4882a593Smuzhiyun ~SCALE_F_MASK);
69*4882a593Smuzhiyun }
70*4882a593Smuzhiyun iquotient = len & (~SCALE_F_MASK);
71*4882a593Smuzhiyun iremainder = len & SCALE_F_MASK;
72*4882a593Smuzhiyun
73*4882a593Smuzhiyun kernel_fpu_begin();
74*4882a593Smuzhiyun crc = crc32_pclmul_le_16(p, iquotient, crc);
75*4882a593Smuzhiyun kernel_fpu_end();
76*4882a593Smuzhiyun
77*4882a593Smuzhiyun if (iremainder)
78*4882a593Smuzhiyun crc = crc32_le(crc, p + iquotient, iremainder);
79*4882a593Smuzhiyun
80*4882a593Smuzhiyun return crc;
81*4882a593Smuzhiyun }
82*4882a593Smuzhiyun
crc32_pclmul_cra_init(struct crypto_tfm * tfm)83*4882a593Smuzhiyun static int crc32_pclmul_cra_init(struct crypto_tfm *tfm)
84*4882a593Smuzhiyun {
85*4882a593Smuzhiyun u32 *key = crypto_tfm_ctx(tfm);
86*4882a593Smuzhiyun
87*4882a593Smuzhiyun *key = 0;
88*4882a593Smuzhiyun
89*4882a593Smuzhiyun return 0;
90*4882a593Smuzhiyun }
91*4882a593Smuzhiyun
crc32_pclmul_setkey(struct crypto_shash * hash,const u8 * key,unsigned int keylen)92*4882a593Smuzhiyun static int crc32_pclmul_setkey(struct crypto_shash *hash, const u8 *key,
93*4882a593Smuzhiyun unsigned int keylen)
94*4882a593Smuzhiyun {
95*4882a593Smuzhiyun u32 *mctx = crypto_shash_ctx(hash);
96*4882a593Smuzhiyun
97*4882a593Smuzhiyun if (keylen != sizeof(u32))
98*4882a593Smuzhiyun return -EINVAL;
99*4882a593Smuzhiyun *mctx = le32_to_cpup((__le32 *)key);
100*4882a593Smuzhiyun return 0;
101*4882a593Smuzhiyun }
102*4882a593Smuzhiyun
crc32_pclmul_init(struct shash_desc * desc)103*4882a593Smuzhiyun static int crc32_pclmul_init(struct shash_desc *desc)
104*4882a593Smuzhiyun {
105*4882a593Smuzhiyun u32 *mctx = crypto_shash_ctx(desc->tfm);
106*4882a593Smuzhiyun u32 *crcp = shash_desc_ctx(desc);
107*4882a593Smuzhiyun
108*4882a593Smuzhiyun *crcp = *mctx;
109*4882a593Smuzhiyun
110*4882a593Smuzhiyun return 0;
111*4882a593Smuzhiyun }
112*4882a593Smuzhiyun
crc32_pclmul_update(struct shash_desc * desc,const u8 * data,unsigned int len)113*4882a593Smuzhiyun static int crc32_pclmul_update(struct shash_desc *desc, const u8 *data,
114*4882a593Smuzhiyun unsigned int len)
115*4882a593Smuzhiyun {
116*4882a593Smuzhiyun u32 *crcp = shash_desc_ctx(desc);
117*4882a593Smuzhiyun
118*4882a593Smuzhiyun *crcp = crc32_pclmul_le(*crcp, data, len);
119*4882a593Smuzhiyun return 0;
120*4882a593Smuzhiyun }
121*4882a593Smuzhiyun
122*4882a593Smuzhiyun /* No final XOR 0xFFFFFFFF, like crc32_le */
__crc32_pclmul_finup(u32 * crcp,const u8 * data,unsigned int len,u8 * out)123*4882a593Smuzhiyun static int __crc32_pclmul_finup(u32 *crcp, const u8 *data, unsigned int len,
124*4882a593Smuzhiyun u8 *out)
125*4882a593Smuzhiyun {
126*4882a593Smuzhiyun *(__le32 *)out = cpu_to_le32(crc32_pclmul_le(*crcp, data, len));
127*4882a593Smuzhiyun return 0;
128*4882a593Smuzhiyun }
129*4882a593Smuzhiyun
/*
 * .finup hook: process the last chunk of data starting from the
 * per-request CRC state and emit the digest to @out.
 */
static int crc32_pclmul_finup(struct shash_desc *desc, const u8 *data,
			      unsigned int len, u8 *out)
{
	u32 *state = shash_desc_ctx(desc);

	return __crc32_pclmul_finup(state, data, len, out);
}
135*4882a593Smuzhiyun
/*
 * .final hook: write the current per-request CRC state to @out as a
 * little-endian 32-bit value. Always returns 0.
 */
static int crc32_pclmul_final(struct shash_desc *desc, u8 *out)
{
	const u32 *state = shash_desc_ctx(desc);
	__le32 *digest = (__le32 *)out;

	*digest = cpu_to_le32p(state);
	return 0;
}
143*4882a593Smuzhiyun
/*
 * .digest hook: one-shot CRC of @data, starting from the value held in the
 * tfm context rather than from the per-request state.
 */
static int crc32_pclmul_digest(struct shash_desc *desc, const u8 *data,
			       unsigned int len, u8 *out)
{
	u32 *seed = crypto_shash_ctx(desc->tfm);

	return __crc32_pclmul_finup(seed, data, len, out);
}
150*4882a593Smuzhiyun
151*4882a593Smuzhiyun static struct shash_alg alg = {
152*4882a593Smuzhiyun .setkey = crc32_pclmul_setkey,
153*4882a593Smuzhiyun .init = crc32_pclmul_init,
154*4882a593Smuzhiyun .update = crc32_pclmul_update,
155*4882a593Smuzhiyun .final = crc32_pclmul_final,
156*4882a593Smuzhiyun .finup = crc32_pclmul_finup,
157*4882a593Smuzhiyun .digest = crc32_pclmul_digest,
158*4882a593Smuzhiyun .descsize = sizeof(u32),
159*4882a593Smuzhiyun .digestsize = CHKSUM_DIGEST_SIZE,
160*4882a593Smuzhiyun .base = {
161*4882a593Smuzhiyun .cra_name = "crc32",
162*4882a593Smuzhiyun .cra_driver_name = "crc32-pclmul",
163*4882a593Smuzhiyun .cra_priority = 200,
164*4882a593Smuzhiyun .cra_flags = CRYPTO_ALG_OPTIONAL_KEY,
165*4882a593Smuzhiyun .cra_blocksize = CHKSUM_BLOCK_SIZE,
166*4882a593Smuzhiyun .cra_ctxsize = sizeof(u32),
167*4882a593Smuzhiyun .cra_module = THIS_MODULE,
168*4882a593Smuzhiyun .cra_init = crc32_pclmul_cra_init,
169*4882a593Smuzhiyun }
170*4882a593Smuzhiyun };
171*4882a593Smuzhiyun
172*4882a593Smuzhiyun static const struct x86_cpu_id crc32pclmul_cpu_id[] = {
173*4882a593Smuzhiyun X86_MATCH_FEATURE(X86_FEATURE_PCLMULQDQ, NULL),
174*4882a593Smuzhiyun {}
175*4882a593Smuzhiyun };
176*4882a593Smuzhiyun MODULE_DEVICE_TABLE(x86cpu, crc32pclmul_cpu_id);
177*4882a593Smuzhiyun
178*4882a593Smuzhiyun
crc32_pclmul_mod_init(void)179*4882a593Smuzhiyun static int __init crc32_pclmul_mod_init(void)
180*4882a593Smuzhiyun {
181*4882a593Smuzhiyun
182*4882a593Smuzhiyun if (!x86_match_cpu(crc32pclmul_cpu_id)) {
183*4882a593Smuzhiyun pr_info("PCLMULQDQ-NI instructions are not detected.\n");
184*4882a593Smuzhiyun return -ENODEV;
185*4882a593Smuzhiyun }
186*4882a593Smuzhiyun return crypto_register_shash(&alg);
187*4882a593Smuzhiyun }
188*4882a593Smuzhiyun
crc32_pclmul_mod_fini(void)189*4882a593Smuzhiyun static void __exit crc32_pclmul_mod_fini(void)
190*4882a593Smuzhiyun {
191*4882a593Smuzhiyun crypto_unregister_shash(&alg);
192*4882a593Smuzhiyun }
193*4882a593Smuzhiyun
194*4882a593Smuzhiyun module_init(crc32_pclmul_mod_init);
195*4882a593Smuzhiyun module_exit(crc32_pclmul_mod_fini);
196*4882a593Smuzhiyun
197*4882a593Smuzhiyun MODULE_AUTHOR("Alexander Boyko <alexander_boyko@xyratex.com>");
198*4882a593Smuzhiyun MODULE_LICENSE("GPL");
199*4882a593Smuzhiyun
200*4882a593Smuzhiyun MODULE_ALIAS_CRYPTO("crc32");
201*4882a593Smuzhiyun MODULE_ALIAS_CRYPTO("crc32-pclmul");
202