// SPDX-License-Identifier: GPL-2.0-only
/*
 * sha2-ce-glue.c - SHA-224/SHA-256 using ARMv8 Crypto Extensions
 *
 * Copyright (C) 2014 - 2017 Linaro Ltd <ard.biesheuvel@linaro.org>
 */
7*4882a593Smuzhiyun
8*4882a593Smuzhiyun #include <asm/neon.h>
9*4882a593Smuzhiyun #include <asm/simd.h>
10*4882a593Smuzhiyun #include <asm/unaligned.h>
11*4882a593Smuzhiyun #include <crypto/internal/hash.h>
12*4882a593Smuzhiyun #include <crypto/internal/simd.h>
13*4882a593Smuzhiyun #include <crypto/sha.h>
14*4882a593Smuzhiyun #include <crypto/sha256_base.h>
15*4882a593Smuzhiyun #include <linux/cpufeature.h>
16*4882a593Smuzhiyun #include <linux/crypto.h>
17*4882a593Smuzhiyun #include <linux/module.h>
18*4882a593Smuzhiyun
19*4882a593Smuzhiyun MODULE_DESCRIPTION("SHA-224/SHA-256 secure hash using ARMv8 Crypto Extensions");
20*4882a593Smuzhiyun MODULE_AUTHOR("Ard Biesheuvel <ard.biesheuvel@linaro.org>");
21*4882a593Smuzhiyun MODULE_LICENSE("GPL v2");
22*4882a593Smuzhiyun MODULE_ALIAS_CRYPTO("sha224");
23*4882a593Smuzhiyun MODULE_ALIAS_CRYPTO("sha256");
24*4882a593Smuzhiyun
25*4882a593Smuzhiyun struct sha256_ce_state {
26*4882a593Smuzhiyun struct sha256_state sst;
27*4882a593Smuzhiyun u32 finalize;
28*4882a593Smuzhiyun };
29*4882a593Smuzhiyun
30*4882a593Smuzhiyun extern const u32 sha256_ce_offsetof_count;
31*4882a593Smuzhiyun extern const u32 sha256_ce_offsetof_finalize;
32*4882a593Smuzhiyun
33*4882a593Smuzhiyun asmlinkage int sha2_ce_transform(struct sha256_ce_state *sst, u8 const *src,
34*4882a593Smuzhiyun int blocks);
35*4882a593Smuzhiyun
__sha2_ce_transform(struct sha256_state * sst,u8 const * src,int blocks)36*4882a593Smuzhiyun static void __sha2_ce_transform(struct sha256_state *sst, u8 const *src,
37*4882a593Smuzhiyun int blocks)
38*4882a593Smuzhiyun {
39*4882a593Smuzhiyun while (blocks) {
40*4882a593Smuzhiyun int rem;
41*4882a593Smuzhiyun
42*4882a593Smuzhiyun kernel_neon_begin();
43*4882a593Smuzhiyun rem = sha2_ce_transform(container_of(sst, struct sha256_ce_state,
44*4882a593Smuzhiyun sst), src, blocks);
45*4882a593Smuzhiyun kernel_neon_end();
46*4882a593Smuzhiyun src += (blocks - rem) * SHA256_BLOCK_SIZE;
47*4882a593Smuzhiyun blocks = rem;
48*4882a593Smuzhiyun }
49*4882a593Smuzhiyun }
50*4882a593Smuzhiyun
51*4882a593Smuzhiyun const u32 sha256_ce_offsetof_count = offsetof(struct sha256_ce_state,
52*4882a593Smuzhiyun sst.count);
53*4882a593Smuzhiyun const u32 sha256_ce_offsetof_finalize = offsetof(struct sha256_ce_state,
54*4882a593Smuzhiyun finalize);
55*4882a593Smuzhiyun
56*4882a593Smuzhiyun asmlinkage void sha256_block_data_order(u32 *digest, u8 const *src, int blocks);
57*4882a593Smuzhiyun
__sha256_block_data_order(struct sha256_state * sst,u8 const * src,int blocks)58*4882a593Smuzhiyun static void __sha256_block_data_order(struct sha256_state *sst, u8 const *src,
59*4882a593Smuzhiyun int blocks)
60*4882a593Smuzhiyun {
61*4882a593Smuzhiyun sha256_block_data_order(sst->state, src, blocks);
62*4882a593Smuzhiyun }
63*4882a593Smuzhiyun
sha256_ce_update(struct shash_desc * desc,const u8 * data,unsigned int len)64*4882a593Smuzhiyun static int sha256_ce_update(struct shash_desc *desc, const u8 *data,
65*4882a593Smuzhiyun unsigned int len)
66*4882a593Smuzhiyun {
67*4882a593Smuzhiyun struct sha256_ce_state *sctx = shash_desc_ctx(desc);
68*4882a593Smuzhiyun
69*4882a593Smuzhiyun if (!crypto_simd_usable())
70*4882a593Smuzhiyun return sha256_base_do_update(desc, data, len,
71*4882a593Smuzhiyun __sha256_block_data_order);
72*4882a593Smuzhiyun
73*4882a593Smuzhiyun sctx->finalize = 0;
74*4882a593Smuzhiyun sha256_base_do_update(desc, data, len, __sha2_ce_transform);
75*4882a593Smuzhiyun
76*4882a593Smuzhiyun return 0;
77*4882a593Smuzhiyun }
78*4882a593Smuzhiyun
/*
 * sha256_ce_finup() - hash the last chunk of input and emit the digest.
 * @desc: shash descriptor whose context is a struct sha256_ce_state
 * @data: final input bytes
 * @len:  number of bytes at @data (may be zero)
 * @out:  destination for the digest
 *
 * Returns the result of sha256_base_finish().
 */
static int sha256_ce_finup(struct shash_desc *desc, const u8 *data,
			   unsigned int len, u8 *out)
{
	struct sha256_ce_state *ce_state = shash_desc_ctx(desc);
	bool asm_finalizes;

	/* SIMD not usable: do everything with the fallback block function. */
	if (!crypto_simd_usable()) {
		if (len != 0)
			sha256_base_do_update(desc, data, len,
					      __sha256_block_data_order);
		sha256_base_do_finalize(desc, __sha256_block_data_order);
		return sha256_base_finish(desc, out);
	}

	/*
	 * The asm code may perform the finalization itself, but only when
	 * the state's count is still zero (so there is no partial data) and
	 * the input is a non-empty round multiple of the block size.  This
	 * must be decided before the update below touches the state.
	 */
	asm_finalizes = len != 0 && (len % SHA256_BLOCK_SIZE) == 0 &&
			ce_state->sst.count == 0;
	ce_state->finalize = asm_finalizes;

	sha256_base_do_update(desc, data, len, __sha2_ce_transform);

	/* Otherwise finalize through the generic helper. */
	if (!asm_finalizes)
		sha256_base_do_finalize(desc, __sha2_ce_transform);

	return sha256_base_finish(desc, out);
}
104*4882a593Smuzhiyun
/*
 * sha256_ce_final() - finalize the hash and write the digest to @out.
 * @desc: shash descriptor whose context is a struct sha256_ce_state
 * @out:  destination for the digest
 *
 * Returns the result of sha256_base_finish().
 */
static int sha256_ce_final(struct shash_desc *desc, u8 *out)
{
	if (crypto_simd_usable()) {
		struct sha256_ce_state *ce_state = shash_desc_ctx(desc);

		/*
		 * Finalization is driven by sha256_base_do_finalize() here,
		 * so clear the flag that would let the asm code do it.
		 */
		ce_state->finalize = 0;
		sha256_base_do_finalize(desc, __sha2_ce_transform);
	} else {
		sha256_base_do_finalize(desc, __sha256_block_data_order);
	}

	return sha256_base_finish(desc, out);
}
118*4882a593Smuzhiyun
sha256_ce_export(struct shash_desc * desc,void * out)119*4882a593Smuzhiyun static int sha256_ce_export(struct shash_desc *desc, void *out)
120*4882a593Smuzhiyun {
121*4882a593Smuzhiyun struct sha256_ce_state *sctx = shash_desc_ctx(desc);
122*4882a593Smuzhiyun
123*4882a593Smuzhiyun memcpy(out, &sctx->sst, sizeof(struct sha256_state));
124*4882a593Smuzhiyun return 0;
125*4882a593Smuzhiyun }
126*4882a593Smuzhiyun
sha256_ce_import(struct shash_desc * desc,const void * in)127*4882a593Smuzhiyun static int sha256_ce_import(struct shash_desc *desc, const void *in)
128*4882a593Smuzhiyun {
129*4882a593Smuzhiyun struct sha256_ce_state *sctx = shash_desc_ctx(desc);
130*4882a593Smuzhiyun
131*4882a593Smuzhiyun memcpy(&sctx->sst, in, sizeof(struct sha256_state));
132*4882a593Smuzhiyun sctx->finalize = 0;
133*4882a593Smuzhiyun return 0;
134*4882a593Smuzhiyun }
135*4882a593Smuzhiyun
136*4882a593Smuzhiyun static struct shash_alg algs[] = { {
137*4882a593Smuzhiyun .init = sha224_base_init,
138*4882a593Smuzhiyun .update = sha256_ce_update,
139*4882a593Smuzhiyun .final = sha256_ce_final,
140*4882a593Smuzhiyun .finup = sha256_ce_finup,
141*4882a593Smuzhiyun .export = sha256_ce_export,
142*4882a593Smuzhiyun .import = sha256_ce_import,
143*4882a593Smuzhiyun .descsize = sizeof(struct sha256_ce_state),
144*4882a593Smuzhiyun .statesize = sizeof(struct sha256_state),
145*4882a593Smuzhiyun .digestsize = SHA224_DIGEST_SIZE,
146*4882a593Smuzhiyun .base = {
147*4882a593Smuzhiyun .cra_name = "sha224",
148*4882a593Smuzhiyun .cra_driver_name = "sha224-ce",
149*4882a593Smuzhiyun .cra_priority = 200,
150*4882a593Smuzhiyun .cra_blocksize = SHA256_BLOCK_SIZE,
151*4882a593Smuzhiyun .cra_module = THIS_MODULE,
152*4882a593Smuzhiyun }
153*4882a593Smuzhiyun }, {
154*4882a593Smuzhiyun .init = sha256_base_init,
155*4882a593Smuzhiyun .update = sha256_ce_update,
156*4882a593Smuzhiyun .final = sha256_ce_final,
157*4882a593Smuzhiyun .finup = sha256_ce_finup,
158*4882a593Smuzhiyun .export = sha256_ce_export,
159*4882a593Smuzhiyun .import = sha256_ce_import,
160*4882a593Smuzhiyun .descsize = sizeof(struct sha256_ce_state),
161*4882a593Smuzhiyun .statesize = sizeof(struct sha256_state),
162*4882a593Smuzhiyun .digestsize = SHA256_DIGEST_SIZE,
163*4882a593Smuzhiyun .base = {
164*4882a593Smuzhiyun .cra_name = "sha256",
165*4882a593Smuzhiyun .cra_driver_name = "sha256-ce",
166*4882a593Smuzhiyun .cra_priority = 200,
167*4882a593Smuzhiyun .cra_blocksize = SHA256_BLOCK_SIZE,
168*4882a593Smuzhiyun .cra_module = THIS_MODULE,
169*4882a593Smuzhiyun }
170*4882a593Smuzhiyun } };
171*4882a593Smuzhiyun
sha2_ce_mod_init(void)172*4882a593Smuzhiyun static int __init sha2_ce_mod_init(void)
173*4882a593Smuzhiyun {
174*4882a593Smuzhiyun return crypto_register_shashes(algs, ARRAY_SIZE(algs));
175*4882a593Smuzhiyun }
176*4882a593Smuzhiyun
sha2_ce_mod_fini(void)177*4882a593Smuzhiyun static void __exit sha2_ce_mod_fini(void)
178*4882a593Smuzhiyun {
179*4882a593Smuzhiyun crypto_unregister_shashes(algs, ARRAY_SIZE(algs));
180*4882a593Smuzhiyun }
181*4882a593Smuzhiyun
/*
 * The init routine is hooked up through the SHA2 CPU feature match rather
 * than a plain module_init(); the exit routine is registered as usual.
 */
module_cpu_feature_match(SHA2, sha2_ce_mod_init);
module_exit(sha2_ce_mod_fini);
184