1*4882a593Smuzhiyun /* ====================================================================
2*4882a593Smuzhiyun * Copyright (c) 2014 - 2017 The GmSSL Project. All rights reserved.
3*4882a593Smuzhiyun *
4*4882a593Smuzhiyun * Redistribution and use in source and binary forms, with or without
5*4882a593Smuzhiyun * modification, are permitted provided that the following conditions
6*4882a593Smuzhiyun * are met:
7*4882a593Smuzhiyun *
8*4882a593Smuzhiyun * 1. Redistributions of source code must retain the above copyright
9*4882a593Smuzhiyun * notice, this list of conditions and the following disclaimer.
10*4882a593Smuzhiyun *
11*4882a593Smuzhiyun * 2. Redistributions in binary form must reproduce the above copyright
12*4882a593Smuzhiyun * notice, this list of conditions and the following disclaimer in
13*4882a593Smuzhiyun * the documentation and/or other materials provided with the
14*4882a593Smuzhiyun * distribution.
15*4882a593Smuzhiyun *
16*4882a593Smuzhiyun * 3. All advertising materials mentioning features or use of this
17*4882a593Smuzhiyun * software must display the following acknowledgment:
18*4882a593Smuzhiyun * "This product includes software developed by the GmSSL Project.
19*4882a593Smuzhiyun * (http://gmssl.org/)"
20*4882a593Smuzhiyun *
21*4882a593Smuzhiyun * 4. The name "GmSSL Project" must not be used to endorse or promote
22*4882a593Smuzhiyun * products derived from this software without prior written
23*4882a593Smuzhiyun * permission. For written permission, please contact
24*4882a593Smuzhiyun * guanzhi1980@gmail.com.
25*4882a593Smuzhiyun *
26*4882a593Smuzhiyun * 5. Products derived from this software may not be called "GmSSL"
27*4882a593Smuzhiyun * nor may "GmSSL" appear in their names without prior written
28*4882a593Smuzhiyun * permission of the GmSSL Project.
29*4882a593Smuzhiyun *
30*4882a593Smuzhiyun * 6. Redistributions of any form whatsoever must retain the following
31*4882a593Smuzhiyun * acknowledgment:
32*4882a593Smuzhiyun * "This product includes software developed by the GmSSL Project
33*4882a593Smuzhiyun * (http://gmssl.org/)"
34*4882a593Smuzhiyun *
35*4882a593Smuzhiyun * THIS SOFTWARE IS PROVIDED BY THE GmSSL PROJECT ``AS IS'' AND ANY
36*4882a593Smuzhiyun * EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
37*4882a593Smuzhiyun * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
38*4882a593Smuzhiyun * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE GmSSL PROJECT OR
39*4882a593Smuzhiyun * ITS CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
40*4882a593Smuzhiyun * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
41*4882a593Smuzhiyun * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
42*4882a593Smuzhiyun * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
43*4882a593Smuzhiyun * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
44*4882a593Smuzhiyun * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
45*4882a593Smuzhiyun * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED
46*4882a593Smuzhiyun * OF THE POSSIBILITY OF SUCH DAMAGE.
47*4882a593Smuzhiyun * ====================================================================
48*4882a593Smuzhiyun */
49*4882a593Smuzhiyun #include <stdint.h>
50*4882a593Smuzhiyun #include <string.h>
51*4882a593Smuzhiyun #include "modes_lcl.h"
52*4882a593Smuzhiyun
53*4882a593Smuzhiyun typedef struct {
54*4882a593Smuzhiyun uint32_t digest[8];
55*4882a593Smuzhiyun uint64_t nblocks;
56*4882a593Smuzhiyun unsigned char block[64];
57*4882a593Smuzhiyun int num;
58*4882a593Smuzhiyun } rkgm_sm3_ctx_t;
59*4882a593Smuzhiyun
60*4882a593Smuzhiyun #define SM3_DIGEST_LENGTH 32
61*4882a593Smuzhiyun #define SM3_BLOCK_SIZE 64
62*4882a593Smuzhiyun #define SM3_CBLOCK (SM3_BLOCK_SIZE)
63*4882a593Smuzhiyun #define SM3_HMAC_SIZE (SM3_DIGEST_LENGTH)
64*4882a593Smuzhiyun
65*4882a593Smuzhiyun void rkgm_sm3_init(rkgm_sm3_ctx_t *ctx);
66*4882a593Smuzhiyun void rkgm_sm3_update(rkgm_sm3_ctx_t *ctx, const unsigned char* data, size_t data_len);
67*4882a593Smuzhiyun void rkgm_sm3_final(rkgm_sm3_ctx_t *ctx, unsigned char digest[SM3_DIGEST_LENGTH]);
68*4882a593Smuzhiyun void rkgm_sm3_compress(uint32_t digest[8], const unsigned char block[SM3_BLOCK_SIZE]);
69*4882a593Smuzhiyun
70*4882a593Smuzhiyun static void sm3_compress_blocks(uint32_t digest[8],
71*4882a593Smuzhiyun const unsigned char *data, size_t blocks);
72*4882a593Smuzhiyun
73*4882a593Smuzhiyun
rkgm_sm3_init(rkgm_sm3_ctx_t * ctx)74*4882a593Smuzhiyun void rkgm_sm3_init(rkgm_sm3_ctx_t *ctx)
75*4882a593Smuzhiyun {
76*4882a593Smuzhiyun memset(ctx, 0, sizeof(*ctx));
77*4882a593Smuzhiyun ctx->digest[0] = 0x7380166F;
78*4882a593Smuzhiyun ctx->digest[1] = 0x4914B2B9;
79*4882a593Smuzhiyun ctx->digest[2] = 0x172442D7;
80*4882a593Smuzhiyun ctx->digest[3] = 0xDA8A0600;
81*4882a593Smuzhiyun ctx->digest[4] = 0xA96F30BC;
82*4882a593Smuzhiyun ctx->digest[5] = 0x163138AA;
83*4882a593Smuzhiyun ctx->digest[6] = 0xE38DEE4D;
84*4882a593Smuzhiyun ctx->digest[7] = 0xB0FB0E4E;
85*4882a593Smuzhiyun }
86*4882a593Smuzhiyun
sm3_compute_id_digest(unsigned char z[32],const char * id,const unsigned char x[32],const unsigned char y[32])87*4882a593Smuzhiyun void sm3_compute_id_digest(unsigned char z[32], const char *id,
88*4882a593Smuzhiyun const unsigned char x[32], const unsigned char y[32])
89*4882a593Smuzhiyun {
90*4882a593Smuzhiyun unsigned char zin[] = {
91*4882a593Smuzhiyun 0x00, 0x80,
92*4882a593Smuzhiyun 0x31, 0x32, 0x33, 0x34, 0x35, 0x36, 0x37, 0x38,
93*4882a593Smuzhiyun 0x31, 0x32, 0x33, 0x34, 0x35, 0x36, 0x37, 0x38,
94*4882a593Smuzhiyun 0xFF, 0xFF, 0xFF, 0xFE, 0xFF, 0xFF, 0xFF, 0xFF,
95*4882a593Smuzhiyun 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
96*4882a593Smuzhiyun 0xFF, 0xFF, 0xFF, 0xFF, 0x00, 0x00, 0x00, 0x00,
97*4882a593Smuzhiyun 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFC,
98*4882a593Smuzhiyun 0x28, 0xE9, 0xFA, 0x9E, 0x9D, 0x9F, 0x5E, 0x34,
99*4882a593Smuzhiyun 0x4D, 0x5A, 0x9E, 0x4B, 0xCF, 0x65, 0x09, 0xA7,
100*4882a593Smuzhiyun 0xF3, 0x97, 0x89, 0xF5, 0x15, 0xAB, 0x8F, 0x92,
101*4882a593Smuzhiyun 0xDD, 0xBC, 0xBD, 0x41, 0x4D, 0x94, 0x0E, 0x93,
102*4882a593Smuzhiyun 0x32, 0xC4, 0xAE, 0x2C, 0x1F, 0x19, 0x81, 0x19,
103*4882a593Smuzhiyun 0x5F, 0x99, 0x04, 0x46, 0x6A, 0x39, 0xC9, 0x94,
104*4882a593Smuzhiyun 0x8F, 0xE3, 0x0B, 0xBF, 0xF2, 0x66, 0x0B, 0xE1,
105*4882a593Smuzhiyun 0x71, 0x5A, 0x45, 0x89, 0x33, 0x4C, 0x74, 0xC7,
106*4882a593Smuzhiyun 0xBC, 0x37, 0x36, 0xA2, 0xF4, 0xF6, 0x77, 0x9C,
107*4882a593Smuzhiyun 0x59, 0xBD, 0xCE, 0xE3, 0x6B, 0x69, 0x21, 0x53,
108*4882a593Smuzhiyun 0xD0, 0xA9, 0x87, 0x7C, 0xC6, 0x2A, 0x47, 0x40,
109*4882a593Smuzhiyun 0x02, 0xDF, 0x32, 0xE5, 0x21, 0x39, 0xF0, 0xA0,
110*4882a593Smuzhiyun 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
111*4882a593Smuzhiyun 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
112*4882a593Smuzhiyun 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
113*4882a593Smuzhiyun 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
114*4882a593Smuzhiyun 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
115*4882a593Smuzhiyun 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
116*4882a593Smuzhiyun 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
117*4882a593Smuzhiyun 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
118*4882a593Smuzhiyun 0x80, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
119*4882a593Smuzhiyun 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
120*4882a593Smuzhiyun 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
121*4882a593Smuzhiyun 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
122*4882a593Smuzhiyun 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
123*4882a593Smuzhiyun 0x00, 0x00, 0x00, 0x00, 0x06, 0x90,
124*4882a593Smuzhiyun };
125*4882a593Smuzhiyun
126*4882a593Smuzhiyun if (!id || strcmp(id, "1234567812345678")) {
127*4882a593Smuzhiyun unsigned int digest[8] = {
128*4882a593Smuzhiyun 0xadadedb5U, 0x0446043fU, 0x08a87aceU, 0xe86d2243U,
129*4882a593Smuzhiyun 0x8e232383U, 0xbfc81fe2U, 0xcf9117c8U, 0x4707011dU,
130*4882a593Smuzhiyun };
131*4882a593Smuzhiyun memcpy(&zin[128], x, 32);
132*4882a593Smuzhiyun memcpy(&zin[160], y, 32);
133*4882a593Smuzhiyun sm3_compress_blocks(digest, zin, 2);
134*4882a593Smuzhiyun PUTU32(z , digest[0]);
135*4882a593Smuzhiyun PUTU32(z + 4, digest[1]);
136*4882a593Smuzhiyun PUTU32(z + 8, digest[2]);
137*4882a593Smuzhiyun PUTU32(z + 12, digest[3]);
138*4882a593Smuzhiyun PUTU32(z + 16, digest[4]);
139*4882a593Smuzhiyun PUTU32(z + 20, digest[5]);
140*4882a593Smuzhiyun PUTU32(z + 24, digest[6]);
141*4882a593Smuzhiyun PUTU32(z + 28, digest[7]);
142*4882a593Smuzhiyun
143*4882a593Smuzhiyun } else {
144*4882a593Smuzhiyun rkgm_sm3_ctx_t ctx;
145*4882a593Smuzhiyun unsigned char idbits[2];
146*4882a593Smuzhiyun size_t len;
147*4882a593Smuzhiyun
148*4882a593Smuzhiyun len = strlen(id);
149*4882a593Smuzhiyun idbits[0] = (unsigned char)(len >> 5);
150*4882a593Smuzhiyun idbits[1] = (unsigned char)(len << 3);
151*4882a593Smuzhiyun
152*4882a593Smuzhiyun rkgm_sm3_init(&ctx);
153*4882a593Smuzhiyun rkgm_sm3_update(&ctx, idbits, 2);
154*4882a593Smuzhiyun rkgm_sm3_update(&ctx, (unsigned char *)id, len);
155*4882a593Smuzhiyun rkgm_sm3_update(&ctx, zin + 18, 128);
156*4882a593Smuzhiyun rkgm_sm3_update(&ctx, x, 32);
157*4882a593Smuzhiyun rkgm_sm3_update(&ctx, y, 32);
158*4882a593Smuzhiyun rkgm_sm3_final(&ctx, z);
159*4882a593Smuzhiyun }
160*4882a593Smuzhiyun }
161*4882a593Smuzhiyun
sm3_sm2_init(rkgm_sm3_ctx_t * ctx,const char * id,const unsigned char * x,const unsigned char * y)162*4882a593Smuzhiyun int sm3_sm2_init(rkgm_sm3_ctx_t *ctx, const char *id,
163*4882a593Smuzhiyun const unsigned char *x, const unsigned char *y)
164*4882a593Smuzhiyun {
165*4882a593Smuzhiyun unsigned char z[32];
166*4882a593Smuzhiyun if ((id && strlen(id) > 65535/8) || !x || !y) {
167*4882a593Smuzhiyun return 0;
168*4882a593Smuzhiyun }
169*4882a593Smuzhiyun sm3_compute_id_digest(z, id, x, y);
170*4882a593Smuzhiyun rkgm_sm3_init(ctx);
171*4882a593Smuzhiyun rkgm_sm3_update(ctx, z, 32);
172*4882a593Smuzhiyun return 1;
173*4882a593Smuzhiyun }
174*4882a593Smuzhiyun
rkgm_sm3_update(rkgm_sm3_ctx_t * ctx,const unsigned char * data,size_t data_len)175*4882a593Smuzhiyun void rkgm_sm3_update(rkgm_sm3_ctx_t *ctx, const unsigned char *data, size_t data_len)
176*4882a593Smuzhiyun {
177*4882a593Smuzhiyun size_t blocks;
178*4882a593Smuzhiyun
179*4882a593Smuzhiyun if (ctx->num) {
180*4882a593Smuzhiyun unsigned int left = SM3_BLOCK_SIZE - ctx->num;
181*4882a593Smuzhiyun if (data_len < left) {
182*4882a593Smuzhiyun memcpy(ctx->block + ctx->num, data, data_len);
183*4882a593Smuzhiyun ctx->num += data_len;
184*4882a593Smuzhiyun return;
185*4882a593Smuzhiyun } else {
186*4882a593Smuzhiyun memcpy(ctx->block + ctx->num, data, left);
187*4882a593Smuzhiyun sm3_compress_blocks(ctx->digest, ctx->block, 1);
188*4882a593Smuzhiyun ctx->nblocks++;
189*4882a593Smuzhiyun data += left;
190*4882a593Smuzhiyun data_len -= left;
191*4882a593Smuzhiyun }
192*4882a593Smuzhiyun }
193*4882a593Smuzhiyun
194*4882a593Smuzhiyun blocks = data_len / SM3_BLOCK_SIZE;
195*4882a593Smuzhiyun sm3_compress_blocks(ctx->digest, data, blocks);
196*4882a593Smuzhiyun ctx->nblocks += blocks;
197*4882a593Smuzhiyun data += SM3_BLOCK_SIZE * blocks;
198*4882a593Smuzhiyun data_len -= SM3_BLOCK_SIZE * blocks;
199*4882a593Smuzhiyun
200*4882a593Smuzhiyun ctx->num = data_len;
201*4882a593Smuzhiyun if (data_len) {
202*4882a593Smuzhiyun memcpy(ctx->block, data, data_len);
203*4882a593Smuzhiyun }
204*4882a593Smuzhiyun }
205*4882a593Smuzhiyun
rkgm_sm3_final(rkgm_sm3_ctx_t * ctx,unsigned char * digest)206*4882a593Smuzhiyun void rkgm_sm3_final(rkgm_sm3_ctx_t *ctx, unsigned char *digest)
207*4882a593Smuzhiyun {
208*4882a593Smuzhiyun int i;
209*4882a593Smuzhiyun
210*4882a593Smuzhiyun ctx->block[ctx->num] = 0x80;
211*4882a593Smuzhiyun
212*4882a593Smuzhiyun if (ctx->num + 9 <= SM3_BLOCK_SIZE) {
213*4882a593Smuzhiyun memset(ctx->block + ctx->num + 1, 0, SM3_BLOCK_SIZE - ctx->num - 9);
214*4882a593Smuzhiyun } else {
215*4882a593Smuzhiyun memset(ctx->block + ctx->num + 1, 0, SM3_BLOCK_SIZE - ctx->num - 1);
216*4882a593Smuzhiyun rkgm_sm3_compress(ctx->digest, ctx->block);
217*4882a593Smuzhiyun memset(ctx->block, 0, SM3_BLOCK_SIZE - 8);
218*4882a593Smuzhiyun }
219*4882a593Smuzhiyun PUTU32(ctx->block + 56, ctx->nblocks >> 23);
220*4882a593Smuzhiyun PUTU32(ctx->block + 60, (ctx->nblocks << 9) + (ctx->num << 3));
221*4882a593Smuzhiyun
222*4882a593Smuzhiyun rkgm_sm3_compress(ctx->digest, ctx->block);
223*4882a593Smuzhiyun for (i = 0; i < 8; i++) {
224*4882a593Smuzhiyun PUTU32(digest + i*4, ctx->digest[i]);
225*4882a593Smuzhiyun }
226*4882a593Smuzhiyun }
227*4882a593Smuzhiyun
228*4882a593Smuzhiyun #define ROTL(x,n) (((x)<<(n)) | ((x)>>(32-(n))))
229*4882a593Smuzhiyun #define P0(x) ((x) ^ ROL32((x), 9) ^ ROL32((x),17))
230*4882a593Smuzhiyun #define P1(x) ((x) ^ ROL32((x),15) ^ ROL32((x),23))
231*4882a593Smuzhiyun
232*4882a593Smuzhiyun #define FF00(x,y,z) ((x) ^ (y) ^ (z))
233*4882a593Smuzhiyun #define FF16(x,y,z) (((x)&(y)) | ((x)&(z)) | ((y)&(z)))
234*4882a593Smuzhiyun #define GG00(x,y,z) ((x) ^ (y) ^ (z))
235*4882a593Smuzhiyun #define GG16(x,y,z) ((((y)^(z)) & (x)) ^ (z))
236*4882a593Smuzhiyun
237*4882a593Smuzhiyun #define R(A, B, C, D, E, F, G, H, xx) \
238*4882a593Smuzhiyun SS1 = ROL32((ROL32(A, 12) + E + K[j]), 7); \
239*4882a593Smuzhiyun SS2 = SS1 ^ ROL32(A, 12); \
240*4882a593Smuzhiyun TT1 = FF##xx(A, B, C) + D + SS2 + (W[j] ^ W[j + 4]); \
241*4882a593Smuzhiyun TT2 = GG##xx(E, F, G) + H + SS1 + W[j]; \
242*4882a593Smuzhiyun B = ROL32(B, 9); \
243*4882a593Smuzhiyun H = TT1; \
244*4882a593Smuzhiyun F = ROL32(F, 19); \
245*4882a593Smuzhiyun D = P0(TT2); \
246*4882a593Smuzhiyun j++
247*4882a593Smuzhiyun
248*4882a593Smuzhiyun #define R8(A, B, C, D, E, F, G, H, xx) \
249*4882a593Smuzhiyun R(A, B, C, D, E, F, G, H, xx); \
250*4882a593Smuzhiyun R(H, A, B, C, D, E, F, G, xx); \
251*4882a593Smuzhiyun R(G, H, A, B, C, D, E, F, xx); \
252*4882a593Smuzhiyun R(F, G, H, A, B, C, D, E, xx); \
253*4882a593Smuzhiyun R(E, F, G, H, A, B, C, D, xx); \
254*4882a593Smuzhiyun R(D, E, F, G, H, A, B, C, xx); \
255*4882a593Smuzhiyun R(C, D, E, F, G, H, A, B, xx); \
256*4882a593Smuzhiyun R(B, C, D, E, F, G, H, A, xx)
257*4882a593Smuzhiyun
258*4882a593Smuzhiyun
259*4882a593Smuzhiyun
260*4882a593Smuzhiyun #define T00 0x79cc4519U
261*4882a593Smuzhiyun #define T16 0x7a879d8aU
262*4882a593Smuzhiyun
263*4882a593Smuzhiyun #define K0 0x79cc4519U
264*4882a593Smuzhiyun #define K1 0xf3988a32U
265*4882a593Smuzhiyun #define K2 0xe7311465U
266*4882a593Smuzhiyun #define K3 0xce6228cbU
267*4882a593Smuzhiyun #define K4 0x9cc45197U
268*4882a593Smuzhiyun #define K5 0x3988a32fU
269*4882a593Smuzhiyun #define K6 0x7311465eU
270*4882a593Smuzhiyun #define K7 0xe6228cbcU
271*4882a593Smuzhiyun #define K8 0xcc451979U
272*4882a593Smuzhiyun #define K9 0x988a32f3U
273*4882a593Smuzhiyun #define K10 0x311465e7U
274*4882a593Smuzhiyun #define K11 0x6228cbceU
275*4882a593Smuzhiyun #define K12 0xc451979cU
276*4882a593Smuzhiyun #define K13 0x88a32f39U
277*4882a593Smuzhiyun #define K14 0x11465e73U
278*4882a593Smuzhiyun #define K15 0x228cbce6U
279*4882a593Smuzhiyun #define K16 0x9d8a7a87U
280*4882a593Smuzhiyun #define K17 0x3b14f50fU
281*4882a593Smuzhiyun #define K18 0x7629ea1eU
282*4882a593Smuzhiyun #define K19 0xec53d43cU
283*4882a593Smuzhiyun #define K20 0xd8a7a879U
284*4882a593Smuzhiyun #define K21 0xb14f50f3U
285*4882a593Smuzhiyun #define K22 0x629ea1e7U
286*4882a593Smuzhiyun #define K23 0xc53d43ceU
287*4882a593Smuzhiyun #define K24 0x8a7a879dU
288*4882a593Smuzhiyun #define K25 0x14f50f3bU
289*4882a593Smuzhiyun #define K26 0x29ea1e76U
290*4882a593Smuzhiyun #define K27 0x53d43cecU
291*4882a593Smuzhiyun #define K28 0xa7a879d8U
292*4882a593Smuzhiyun #define K29 0x4f50f3b1U
293*4882a593Smuzhiyun #define K30 0x9ea1e762U
294*4882a593Smuzhiyun #define K31 0x3d43cec5U
295*4882a593Smuzhiyun #define K32 0x7a879d8aU
296*4882a593Smuzhiyun #define K33 0xf50f3b14U
297*4882a593Smuzhiyun #define K34 0xea1e7629U
298*4882a593Smuzhiyun #define K35 0xd43cec53U
299*4882a593Smuzhiyun #define K36 0xa879d8a7U
300*4882a593Smuzhiyun #define K37 0x50f3b14fU
301*4882a593Smuzhiyun #define K38 0xa1e7629eU
302*4882a593Smuzhiyun #define K39 0x43cec53dU
303*4882a593Smuzhiyun #define K40 0x879d8a7aU
304*4882a593Smuzhiyun #define K41 0x0f3b14f5U
305*4882a593Smuzhiyun #define K42 0x1e7629eaU
306*4882a593Smuzhiyun #define K43 0x3cec53d4U
307*4882a593Smuzhiyun #define K44 0x79d8a7a8U
308*4882a593Smuzhiyun #define K45 0xf3b14f50U
309*4882a593Smuzhiyun #define K46 0xe7629ea1U
310*4882a593Smuzhiyun #define K47 0xcec53d43U
311*4882a593Smuzhiyun #define K48 0x9d8a7a87U
312*4882a593Smuzhiyun #define K49 0x3b14f50fU
313*4882a593Smuzhiyun #define K50 0x7629ea1eU
314*4882a593Smuzhiyun #define K51 0xec53d43cU
315*4882a593Smuzhiyun #define K52 0xd8a7a879U
316*4882a593Smuzhiyun #define K53 0xb14f50f3U
317*4882a593Smuzhiyun #define K54 0x629ea1e7U
318*4882a593Smuzhiyun #define K55 0xc53d43ceU
319*4882a593Smuzhiyun #define K56 0x8a7a879dU
320*4882a593Smuzhiyun #define K57 0x14f50f3bU
321*4882a593Smuzhiyun #define K58 0x29ea1e76U
322*4882a593Smuzhiyun #define K59 0x53d43cecU
323*4882a593Smuzhiyun #define K60 0xa7a879d8U
324*4882a593Smuzhiyun #define K61 0x4f50f3b1U
325*4882a593Smuzhiyun #define K62 0x9ea1e762U
326*4882a593Smuzhiyun #define K63 0x3d43cec5U
327*4882a593Smuzhiyun
328*4882a593Smuzhiyun uint32_t K[64] = {
329*4882a593Smuzhiyun K0, K1, K2, K3, K4, K5, K6, K7,
330*4882a593Smuzhiyun K8, K9, K10, K11, K12, K13, K14, K15,
331*4882a593Smuzhiyun K16, K17, K18, K19, K20, K21, K22, K23,
332*4882a593Smuzhiyun K24, K25, K26, K27, K28, K29, K30, K31,
333*4882a593Smuzhiyun K32, K33, K34, K35, K36, K37, K38, K39,
334*4882a593Smuzhiyun K40, K41, K42, K43, K44, K45, K46, K47,
335*4882a593Smuzhiyun K48, K49, K50, K51, K52, K53, K54, K55,
336*4882a593Smuzhiyun K56, K57, K58, K59, K60, K61, K62, K63,
337*4882a593Smuzhiyun /*
338*4882a593Smuzhiyun 0x79cc4519U, 0xf3988a32U, 0xe7311465U, 0xce6228cbU,
339*4882a593Smuzhiyun 0x9cc45197U, 0x3988a32fU, 0x7311465eU, 0xe6228cbcU,
340*4882a593Smuzhiyun 0xcc451979U, 0x988a32f3U, 0x311465e7U, 0x6228cbceU,
341*4882a593Smuzhiyun 0xc451979cU, 0x88a32f39U, 0x11465e73U, 0x228cbce6U,
342*4882a593Smuzhiyun 0x9d8a7a87U, 0x3b14f50fU, 0x7629ea1eU, 0xec53d43cU,
343*4882a593Smuzhiyun 0xd8a7a879U, 0xb14f50f3U, 0x629ea1e7U, 0xc53d43ceU,
344*4882a593Smuzhiyun 0x8a7a879dU, 0x14f50f3bU, 0x29ea1e76U, 0x53d43cecU,
345*4882a593Smuzhiyun 0xa7a879d8U, 0x4f50f3b1U, 0x9ea1e762U, 0x3d43cec5U,
346*4882a593Smuzhiyun 0x7a879d8aU, 0xf50f3b14U, 0xea1e7629U, 0xd43cec53U,
347*4882a593Smuzhiyun 0xa879d8a7U, 0x50f3b14fU, 0xa1e7629eU, 0x43cec53dU,
348*4882a593Smuzhiyun 0x879d8a7aU, 0x0f3b14f5U, 0x1e7629eaU, 0x3cec53d4U,
349*4882a593Smuzhiyun 0x79d8a7a8U, 0xf3b14f50U, 0xe7629ea1U, 0xcec53d43U,
350*4882a593Smuzhiyun 0x9d8a7a87U, 0x3b14f50fU, 0x7629ea1eU, 0xec53d43cU,
351*4882a593Smuzhiyun 0xd8a7a879U, 0xb14f50f3U, 0x629ea1e7U, 0xc53d43ceU,
352*4882a593Smuzhiyun 0x8a7a879dU, 0x14f50f3bU, 0x29ea1e76U, 0x53d43cecU,
353*4882a593Smuzhiyun 0xa7a879d8U, 0x4f50f3b1U, 0x9ea1e762U, 0x3d43cec5U,
354*4882a593Smuzhiyun */
355*4882a593Smuzhiyun };
356*4882a593Smuzhiyun
sm3_compress_blocks(uint32_t digest[8],const unsigned char * data,size_t blocks)357*4882a593Smuzhiyun static void sm3_compress_blocks(uint32_t digest[8],
358*4882a593Smuzhiyun const unsigned char *data, size_t blocks)
359*4882a593Smuzhiyun {
360*4882a593Smuzhiyun uint32_t A;
361*4882a593Smuzhiyun uint32_t B;
362*4882a593Smuzhiyun uint32_t C;
363*4882a593Smuzhiyun uint32_t D;
364*4882a593Smuzhiyun uint32_t E;
365*4882a593Smuzhiyun uint32_t F;
366*4882a593Smuzhiyun uint32_t G;
367*4882a593Smuzhiyun uint32_t H;
368*4882a593Smuzhiyun uint32_t W[68];
369*4882a593Smuzhiyun uint32_t SS1, SS2, TT1, TT2;
370*4882a593Smuzhiyun int j;
371*4882a593Smuzhiyun
372*4882a593Smuzhiyun #ifdef SM3_SSE3
373*4882a593Smuzhiyun __m128i X, T, R;
374*4882a593Smuzhiyun __m128i M = _mm_setr_epi32(0, 0, 0, 0xffffffff);
375*4882a593Smuzhiyun __m128i V = _mm_setr_epi8(3,2,1,0,7,6,5,4,11,10,9,8,15,14,13,12);
376*4882a593Smuzhiyun #endif
377*4882a593Smuzhiyun
378*4882a593Smuzhiyun while (blocks--) {
379*4882a593Smuzhiyun
380*4882a593Smuzhiyun A = digest[0];
381*4882a593Smuzhiyun B = digest[1];
382*4882a593Smuzhiyun C = digest[2];
383*4882a593Smuzhiyun D = digest[3];
384*4882a593Smuzhiyun E = digest[4];
385*4882a593Smuzhiyun F = digest[5];
386*4882a593Smuzhiyun G = digest[6];
387*4882a593Smuzhiyun H = digest[7];
388*4882a593Smuzhiyun
389*4882a593Smuzhiyun
390*4882a593Smuzhiyun #ifdef SM3_SSE3
391*4882a593Smuzhiyun
392*4882a593Smuzhiyun for (j = 0; j < 16; j += 4) {
393*4882a593Smuzhiyun X = _mm_loadu_si128((__m128i *)(data + j * 4));
394*4882a593Smuzhiyun X = _mm_shuffle_epi8(X, V);
395*4882a593Smuzhiyun _mm_storeu_si128((__m128i *)(W + j), X);
396*4882a593Smuzhiyun }
397*4882a593Smuzhiyun
398*4882a593Smuzhiyun for (j = 16; j < 68; j += 4) {
399*4882a593Smuzhiyun /* X = (W[j - 3], W[j - 2], W[j - 1], 0) */
400*4882a593Smuzhiyun X = _mm_loadu_si128((__m128i *)(W + j - 3));
401*4882a593Smuzhiyun X = _mm_andnot_si128(M, X);
402*4882a593Smuzhiyun
403*4882a593Smuzhiyun X = _mm_rotl_epi32(X, 15);
404*4882a593Smuzhiyun T = _mm_loadu_si128((__m128i *)(W + j - 9));
405*4882a593Smuzhiyun X = _mm_xor_si128(X, T);
406*4882a593Smuzhiyun T = _mm_loadu_si128((__m128i *)(W + j - 16));
407*4882a593Smuzhiyun X = _mm_xor_si128(X, T);
408*4882a593Smuzhiyun
409*4882a593Smuzhiyun /* P1() */
410*4882a593Smuzhiyun T = _mm_rotl_epi32(X, (23 - 15));
411*4882a593Smuzhiyun T = _mm_xor_si128(T, X);
412*4882a593Smuzhiyun T = _mm_rotl_epi32(T, 15);
413*4882a593Smuzhiyun X = _mm_xor_si128(X, T);
414*4882a593Smuzhiyun
415*4882a593Smuzhiyun T = _mm_loadu_si128((__m128i *)(W + j - 13));
416*4882a593Smuzhiyun T = _mm_rotl_epi32(T, 7);
417*4882a593Smuzhiyun X = _mm_xor_si128(X, T);
418*4882a593Smuzhiyun T = _mm_loadu_si128((__m128i *)(W + j - 6));
419*4882a593Smuzhiyun X = _mm_xor_si128(X, T);
420*4882a593Smuzhiyun
421*4882a593Smuzhiyun /* W[j + 3] ^= P1(ROL32(W[j + 1], 15)) */
422*4882a593Smuzhiyun R = _mm_shuffle_epi32(X, 0);
423*4882a593Smuzhiyun R = _mm_and_si128(R, M);
424*4882a593Smuzhiyun T = _mm_rotl_epi32(R, 15);
425*4882a593Smuzhiyun T = _mm_xor_si128(T, R);
426*4882a593Smuzhiyun T = _mm_rotl_epi32(T, 9);
427*4882a593Smuzhiyun R = _mm_xor_si128(R, T);
428*4882a593Smuzhiyun R = _mm_rotl_epi32(R, 6);
429*4882a593Smuzhiyun X = _mm_xor_si128(X, R);
430*4882a593Smuzhiyun
431*4882a593Smuzhiyun _mm_storeu_si128((__m128i *)(W + j), X);
432*4882a593Smuzhiyun }
433*4882a593Smuzhiyun #else
434*4882a593Smuzhiyun for (j = 0; j < 16; j++)
435*4882a593Smuzhiyun W[j] = GETU32(data + j*4);
436*4882a593Smuzhiyun
437*4882a593Smuzhiyun for (; j < 68; j++)
438*4882a593Smuzhiyun W[j] = P1(W[j - 16] ^ W[j - 9] ^ ROL32(W[j - 3], 15))
439*4882a593Smuzhiyun ^ ROL32(W[j - 13], 7) ^ W[j - 6];
440*4882a593Smuzhiyun #endif
441*4882a593Smuzhiyun
442*4882a593Smuzhiyun
443*4882a593Smuzhiyun j = 0;
444*4882a593Smuzhiyun
445*4882a593Smuzhiyun #define FULL_UNROLL
446*4882a593Smuzhiyun #ifdef FULL_UNROLL
447*4882a593Smuzhiyun R8(A, B, C, D, E, F, G, H, 00);
448*4882a593Smuzhiyun R8(A, B, C, D, E, F, G, H, 00);
449*4882a593Smuzhiyun R8(A, B, C, D, E, F, G, H, 16);
450*4882a593Smuzhiyun R8(A, B, C, D, E, F, G, H, 16);
451*4882a593Smuzhiyun R8(A, B, C, D, E, F, G, H, 16);
452*4882a593Smuzhiyun R8(A, B, C, D, E, F, G, H, 16);
453*4882a593Smuzhiyun R8(A, B, C, D, E, F, G, H, 16);
454*4882a593Smuzhiyun R8(A, B, C, D, E, F, G, H, 16);
455*4882a593Smuzhiyun #else
456*4882a593Smuzhiyun for (; j < 16; j++) {
457*4882a593Smuzhiyun SS1 = ROL32((ROL32(A, 12) + E + K(j)), 7);
458*4882a593Smuzhiyun SS2 = SS1 ^ ROL32(A, 12);
459*4882a593Smuzhiyun TT1 = FF00(A, B, C) + D + SS2 + (W[j] ^ W[j + 4]);
460*4882a593Smuzhiyun TT2 = GG00(E, F, G) + H + SS1 + W[j];
461*4882a593Smuzhiyun D = C;
462*4882a593Smuzhiyun C = ROL32(B, 9);
463*4882a593Smuzhiyun B = A;
464*4882a593Smuzhiyun A = TT1;
465*4882a593Smuzhiyun H = G;
466*4882a593Smuzhiyun G = ROL32(F, 19);
467*4882a593Smuzhiyun F = E;
468*4882a593Smuzhiyun E = P0(TT2);
469*4882a593Smuzhiyun }
470*4882a593Smuzhiyun
471*4882a593Smuzhiyun for (; j < 64; j++) {
472*4882a593Smuzhiyun SS1 = ROL32((ROL32(A, 12) + E + K(j)), 7);
473*4882a593Smuzhiyun SS2 = SS1 ^ ROL32(A, 12);
474*4882a593Smuzhiyun TT1 = FF16(A, B, C) + D + SS2 + (W[j] ^ W[j + 4]);
475*4882a593Smuzhiyun TT2 = GG16(E, F, G) + H + SS1 + W[j];
476*4882a593Smuzhiyun D = C;
477*4882a593Smuzhiyun C = ROL32(B, 9);
478*4882a593Smuzhiyun B = A;
479*4882a593Smuzhiyun A = TT1;
480*4882a593Smuzhiyun H = G;
481*4882a593Smuzhiyun G = ROL32(F, 19);
482*4882a593Smuzhiyun F = E;
483*4882a593Smuzhiyun E = P0(TT2);
484*4882a593Smuzhiyun }
485*4882a593Smuzhiyun #endif
486*4882a593Smuzhiyun
487*4882a593Smuzhiyun digest[0] ^= A;
488*4882a593Smuzhiyun digest[1] ^= B;
489*4882a593Smuzhiyun digest[2] ^= C;
490*4882a593Smuzhiyun digest[3] ^= D;
491*4882a593Smuzhiyun digest[4] ^= E;
492*4882a593Smuzhiyun digest[5] ^= F;
493*4882a593Smuzhiyun digest[6] ^= G;
494*4882a593Smuzhiyun digest[7] ^= H;
495*4882a593Smuzhiyun
496*4882a593Smuzhiyun data += 64;
497*4882a593Smuzhiyun }
498*4882a593Smuzhiyun }
499*4882a593Smuzhiyun
rkgm_sm3_compress(uint32_t digest[8],const unsigned char block[64])500*4882a593Smuzhiyun void rkgm_sm3_compress(uint32_t digest[8], const unsigned char block[64])
501*4882a593Smuzhiyun {
502*4882a593Smuzhiyun return sm3_compress_blocks(digest, block, 1);
503*4882a593Smuzhiyun }
504*4882a593Smuzhiyun
rk_hash_sm3(const unsigned char * in,unsigned int in_len,unsigned char * out,unsigned int * out_len)505*4882a593Smuzhiyun int rk_hash_sm3(const unsigned char *in, unsigned int in_len,
506*4882a593Smuzhiyun unsigned char *out, unsigned int *out_len)
507*4882a593Smuzhiyun {
508*4882a593Smuzhiyun rkgm_sm3_ctx_t ctx;
509*4882a593Smuzhiyun
510*4882a593Smuzhiyun rkgm_sm3_init(&ctx);
511*4882a593Smuzhiyun rkgm_sm3_update(&ctx, in, in_len);
512*4882a593Smuzhiyun rkgm_sm3_final(&ctx, out);
513*4882a593Smuzhiyun
514*4882a593Smuzhiyun memset(&ctx, 0, sizeof(rkgm_sm3_ctx_t));
515*4882a593Smuzhiyun
516*4882a593Smuzhiyun *out_len = SM3_DIGEST_LENGTH;
517*4882a593Smuzhiyun
518*4882a593Smuzhiyun return 0;
519*4882a593Smuzhiyun }
520