// SPDX-License-Identifier: GPL-2.0-or-later
/*
 * Linux/arm64 port of the OpenSSL SHA256 implementation for AArch64
 *
 * Copyright (c) 2016 Linaro Ltd. <ard.biesheuvel@linaro.org>
 */
7*4882a593Smuzhiyun
8*4882a593Smuzhiyun #include <asm/hwcap.h>
9*4882a593Smuzhiyun #include <asm/neon.h>
10*4882a593Smuzhiyun #include <asm/simd.h>
11*4882a593Smuzhiyun #include <crypto/internal/hash.h>
12*4882a593Smuzhiyun #include <crypto/internal/simd.h>
13*4882a593Smuzhiyun #include <crypto/sha.h>
14*4882a593Smuzhiyun #include <crypto/sha256_base.h>
15*4882a593Smuzhiyun #include <linux/types.h>
16*4882a593Smuzhiyun #include <linux/string.h>
17*4882a593Smuzhiyun
18*4882a593Smuzhiyun MODULE_DESCRIPTION("SHA-224/SHA-256 secure hash for arm64");
19*4882a593Smuzhiyun MODULE_AUTHOR("Andy Polyakov <appro@openssl.org>");
20*4882a593Smuzhiyun MODULE_AUTHOR("Ard Biesheuvel <ard.biesheuvel@linaro.org>");
21*4882a593Smuzhiyun MODULE_LICENSE("GPL v2");
22*4882a593Smuzhiyun MODULE_ALIAS_CRYPTO("sha224");
23*4882a593Smuzhiyun MODULE_ALIAS_CRYPTO("sha256");
24*4882a593Smuzhiyun
25*4882a593Smuzhiyun asmlinkage void sha256_block_data_order(u32 *digest, const void *data,
26*4882a593Smuzhiyun unsigned int num_blks);
27*4882a593Smuzhiyun EXPORT_SYMBOL(sha256_block_data_order);
28*4882a593Smuzhiyun
/*
 * Adapter passed as the block callback to the sha256_base_* helpers:
 * pulls the state array out of @sst and forwards it, together with @src
 * and @blocks, to sha256_block_data_order().
 */
static void __sha256_block_data_order(struct sha256_state *sst, u8 const *src,
				      int blocks)
{
	sha256_block_data_order(sst->state,
				src,
				blocks);
}
34*4882a593Smuzhiyun
35*4882a593Smuzhiyun asmlinkage void sha256_block_neon(u32 *digest, const void *data,
36*4882a593Smuzhiyun unsigned int num_blks);
37*4882a593Smuzhiyun
/*
 * Adapter passed as the block callback to the sha256_base_* helpers:
 * pulls the state array out of @sst and forwards it, together with @src
 * and @blocks, to sha256_block_neon().
 */
static void __sha256_block_neon(struct sha256_state *sst, u8 const *src,
				int blocks)
{
	sha256_block_neon(sst->state,
			  src,
			  blocks);
}
43*4882a593Smuzhiyun
crypto_sha256_arm64_update(struct shash_desc * desc,const u8 * data,unsigned int len)44*4882a593Smuzhiyun static int crypto_sha256_arm64_update(struct shash_desc *desc, const u8 *data,
45*4882a593Smuzhiyun unsigned int len)
46*4882a593Smuzhiyun {
47*4882a593Smuzhiyun return sha256_base_do_update(desc, data, len,
48*4882a593Smuzhiyun __sha256_block_data_order);
49*4882a593Smuzhiyun }
50*4882a593Smuzhiyun
/*
 * .finup handler for the non-NEON algorithms.
 *
 * Absorbs any trailing input (@len bytes at @data, skipped when @len is 0),
 * finalizes the hash with __sha256_block_data_order as the block callback,
 * and returns whatever sha256_base_finish() returns after it is given @out.
 */
static int crypto_sha256_arm64_finup(struct shash_desc *desc, const u8 *data,
				     unsigned int len, u8 *out)
{
	if (len != 0) {
		sha256_base_do_update(desc, data, len,
				      __sha256_block_data_order);
	}

	sha256_base_do_finalize(desc, __sha256_block_data_order);
	return sha256_base_finish(desc, out);
}
61*4882a593Smuzhiyun
/*
 * .final handler for the non-NEON algorithms: a finup with no extra input
 * (NULL data pointer, zero length).
 */
static int crypto_sha256_arm64_final(struct shash_desc *desc, u8 *out)
{
	const u8 *no_data = NULL;

	return crypto_sha256_arm64_finup(desc, no_data, 0, out);
}
66*4882a593Smuzhiyun
67*4882a593Smuzhiyun static struct shash_alg algs[] = { {
68*4882a593Smuzhiyun .digestsize = SHA256_DIGEST_SIZE,
69*4882a593Smuzhiyun .init = sha256_base_init,
70*4882a593Smuzhiyun .update = crypto_sha256_arm64_update,
71*4882a593Smuzhiyun .final = crypto_sha256_arm64_final,
72*4882a593Smuzhiyun .finup = crypto_sha256_arm64_finup,
73*4882a593Smuzhiyun .descsize = sizeof(struct sha256_state),
74*4882a593Smuzhiyun .base.cra_name = "sha256",
75*4882a593Smuzhiyun .base.cra_driver_name = "sha256-arm64",
76*4882a593Smuzhiyun .base.cra_priority = 125,
77*4882a593Smuzhiyun .base.cra_blocksize = SHA256_BLOCK_SIZE,
78*4882a593Smuzhiyun .base.cra_module = THIS_MODULE,
79*4882a593Smuzhiyun }, {
80*4882a593Smuzhiyun .digestsize = SHA224_DIGEST_SIZE,
81*4882a593Smuzhiyun .init = sha224_base_init,
82*4882a593Smuzhiyun .update = crypto_sha256_arm64_update,
83*4882a593Smuzhiyun .final = crypto_sha256_arm64_final,
84*4882a593Smuzhiyun .finup = crypto_sha256_arm64_finup,
85*4882a593Smuzhiyun .descsize = sizeof(struct sha256_state),
86*4882a593Smuzhiyun .base.cra_name = "sha224",
87*4882a593Smuzhiyun .base.cra_driver_name = "sha224-arm64",
88*4882a593Smuzhiyun .base.cra_priority = 125,
89*4882a593Smuzhiyun .base.cra_blocksize = SHA224_BLOCK_SIZE,
90*4882a593Smuzhiyun .base.cra_module = THIS_MODULE,
91*4882a593Smuzhiyun } };
92*4882a593Smuzhiyun
sha256_update_neon(struct shash_desc * desc,const u8 * data,unsigned int len)93*4882a593Smuzhiyun static int sha256_update_neon(struct shash_desc *desc, const u8 *data,
94*4882a593Smuzhiyun unsigned int len)
95*4882a593Smuzhiyun {
96*4882a593Smuzhiyun struct sha256_state *sctx = shash_desc_ctx(desc);
97*4882a593Smuzhiyun
98*4882a593Smuzhiyun if (!crypto_simd_usable())
99*4882a593Smuzhiyun return sha256_base_do_update(desc, data, len,
100*4882a593Smuzhiyun __sha256_block_data_order);
101*4882a593Smuzhiyun
102*4882a593Smuzhiyun while (len > 0) {
103*4882a593Smuzhiyun unsigned int chunk = len;
104*4882a593Smuzhiyun
105*4882a593Smuzhiyun /*
106*4882a593Smuzhiyun * Don't hog the CPU for the entire time it takes to process all
107*4882a593Smuzhiyun * input when running on a preemptible kernel, but process the
108*4882a593Smuzhiyun * data block by block instead.
109*4882a593Smuzhiyun */
110*4882a593Smuzhiyun if (IS_ENABLED(CONFIG_PREEMPTION) &&
111*4882a593Smuzhiyun chunk + sctx->count % SHA256_BLOCK_SIZE > SHA256_BLOCK_SIZE)
112*4882a593Smuzhiyun chunk = SHA256_BLOCK_SIZE -
113*4882a593Smuzhiyun sctx->count % SHA256_BLOCK_SIZE;
114*4882a593Smuzhiyun
115*4882a593Smuzhiyun kernel_neon_begin();
116*4882a593Smuzhiyun sha256_base_do_update(desc, data, chunk, __sha256_block_neon);
117*4882a593Smuzhiyun kernel_neon_end();
118*4882a593Smuzhiyun data += chunk;
119*4882a593Smuzhiyun len -= chunk;
120*4882a593Smuzhiyun }
121*4882a593Smuzhiyun return 0;
122*4882a593Smuzhiyun }
123*4882a593Smuzhiyun
/*
 * .finup handler for the NEON algorithms.
 *
 * With SIMD usable, trailing input goes through sha256_update_neon() and
 * finalization runs with the NEON block callback inside a
 * kernel_neon_begin()/kernel_neon_end() section.  Otherwise both steps use
 * the non-NEON block callback.  In either case the return value is that of
 * sha256_base_finish() after it is given @out.
 */
static int sha256_finup_neon(struct shash_desc *desc, const u8 *data,
			     unsigned int len, u8 *out)
{
	if (crypto_simd_usable()) {
		if (len != 0)
			sha256_update_neon(desc, data, len);

		kernel_neon_begin();
		sha256_base_do_finalize(desc, __sha256_block_neon);
		kernel_neon_end();
	} else {
		if (len != 0)
			sha256_base_do_update(desc, data, len,
					      __sha256_block_data_order);

		sha256_base_do_finalize(desc, __sha256_block_data_order);
	}

	return sha256_base_finish(desc, out);
}
141*4882a593Smuzhiyun
/*
 * .final handler for the NEON algorithms: a finup with no extra input
 * (NULL data pointer, zero length).
 */
static int sha256_final_neon(struct shash_desc *desc, u8 *out)
{
	const u8 *no_data = NULL;

	return sha256_finup_neon(desc, no_data, 0, out);
}
146*4882a593Smuzhiyun
147*4882a593Smuzhiyun static struct shash_alg neon_algs[] = { {
148*4882a593Smuzhiyun .digestsize = SHA256_DIGEST_SIZE,
149*4882a593Smuzhiyun .init = sha256_base_init,
150*4882a593Smuzhiyun .update = sha256_update_neon,
151*4882a593Smuzhiyun .final = sha256_final_neon,
152*4882a593Smuzhiyun .finup = sha256_finup_neon,
153*4882a593Smuzhiyun .descsize = sizeof(struct sha256_state),
154*4882a593Smuzhiyun .base.cra_name = "sha256",
155*4882a593Smuzhiyun .base.cra_driver_name = "sha256-arm64-neon",
156*4882a593Smuzhiyun .base.cra_priority = 150,
157*4882a593Smuzhiyun .base.cra_blocksize = SHA256_BLOCK_SIZE,
158*4882a593Smuzhiyun .base.cra_module = THIS_MODULE,
159*4882a593Smuzhiyun }, {
160*4882a593Smuzhiyun .digestsize = SHA224_DIGEST_SIZE,
161*4882a593Smuzhiyun .init = sha224_base_init,
162*4882a593Smuzhiyun .update = sha256_update_neon,
163*4882a593Smuzhiyun .final = sha256_final_neon,
164*4882a593Smuzhiyun .finup = sha256_finup_neon,
165*4882a593Smuzhiyun .descsize = sizeof(struct sha256_state),
166*4882a593Smuzhiyun .base.cra_name = "sha224",
167*4882a593Smuzhiyun .base.cra_driver_name = "sha224-arm64-neon",
168*4882a593Smuzhiyun .base.cra_priority = 150,
169*4882a593Smuzhiyun .base.cra_blocksize = SHA224_BLOCK_SIZE,
170*4882a593Smuzhiyun .base.cra_module = THIS_MODULE,
171*4882a593Smuzhiyun } };
172*4882a593Smuzhiyun
sha256_mod_init(void)173*4882a593Smuzhiyun static int __init sha256_mod_init(void)
174*4882a593Smuzhiyun {
175*4882a593Smuzhiyun int ret = crypto_register_shashes(algs, ARRAY_SIZE(algs));
176*4882a593Smuzhiyun if (ret)
177*4882a593Smuzhiyun return ret;
178*4882a593Smuzhiyun
179*4882a593Smuzhiyun if (cpu_have_named_feature(ASIMD)) {
180*4882a593Smuzhiyun ret = crypto_register_shashes(neon_algs, ARRAY_SIZE(neon_algs));
181*4882a593Smuzhiyun if (ret)
182*4882a593Smuzhiyun crypto_unregister_shashes(algs, ARRAY_SIZE(algs));
183*4882a593Smuzhiyun }
184*4882a593Smuzhiyun return ret;
185*4882a593Smuzhiyun }
186*4882a593Smuzhiyun
sha256_mod_fini(void)187*4882a593Smuzhiyun static void __exit sha256_mod_fini(void)
188*4882a593Smuzhiyun {
189*4882a593Smuzhiyun if (cpu_have_named_feature(ASIMD))
190*4882a593Smuzhiyun crypto_unregister_shashes(neon_algs, ARRAY_SIZE(neon_algs));
191*4882a593Smuzhiyun crypto_unregister_shashes(algs, ARRAY_SIZE(algs));
192*4882a593Smuzhiyun }
193*4882a593Smuzhiyun
/* Hook the init and exit routines defined above into the module machinery. */
module_init(sha256_mod_init);
module_exit(sha256_mod_fini);
196