/*
 *  Core bignum functions
 *
 *  Copyright The Mbed TLS Contributors
 *  SPDX-License-Identifier: Apache-2.0 OR GPL-2.0-or-later
 */
732b31808SJens Wiklander
832b31808SJens Wiklander #include "common.h"
932b31808SJens Wiklander
1032b31808SJens Wiklander #if defined(MBEDTLS_BIGNUM_C)
1132b31808SJens Wiklander
1232b31808SJens Wiklander #include <string.h>
1332b31808SJens Wiklander
1432b31808SJens Wiklander #include "mbedtls/error.h"
1532b31808SJens Wiklander #include "mbedtls/platform_util.h"
1632b31808SJens Wiklander #include "constant_time_internal.h"
1732b31808SJens Wiklander
1832b31808SJens Wiklander #include "mbedtls/platform.h"
1932b31808SJens Wiklander
2032b31808SJens Wiklander #include "bignum_core.h"
2132b31808SJens Wiklander #include "bn_mul.h"
2232b31808SJens Wiklander #include "constant_time_internal.h"
2332b31808SJens Wiklander
/*
 * Count the leading zero bits of a single limb.
 *
 * When the compiler advertises a __builtin_clz* variant whose operand width
 * matches mbedtls_mpi_uint, that builtin is used. Otherwise the limb is
 * scanned from its most significant bit downwards.
 *
 * NOTE(review): the portable loop returns biL for a == 0; the builtin path
 * just forwards to the compiler builtin, whose result for 0 is presumably
 * unspecified -- callers should pass a non-zero value.
 */
size_t mbedtls_mpi_core_clz(mbedtls_mpi_uint a)
{
#if defined(__has_builtin)
#if (MBEDTLS_MPI_UINT_MAX == UINT_MAX) && __has_builtin(__builtin_clz)
    #define core_clz __builtin_clz
#elif (MBEDTLS_MPI_UINT_MAX == ULONG_MAX) && __has_builtin(__builtin_clzl)
    #define core_clz __builtin_clzl
#elif (MBEDTLS_MPI_UINT_MAX == ULLONG_MAX) && __has_builtin(__builtin_clzll)
    #define core_clz __builtin_clzll
#endif
#endif
#if defined(core_clz)
    return (size_t) core_clz(a);
#else
    /* Walk a single-bit probe down from the top bit until it hits a set
     * bit of a, counting the positions skipped on the way. */
    size_t zeros = 0;
    mbedtls_mpi_uint probe = (mbedtls_mpi_uint) 1 << (biL - 1);

    while (zeros < biL && (a & probe) == 0) {
        probe >>= 1;
        zeros++;
    }

    return zeros;
#endif
}
5232b31808SJens Wiklander
mbedtls_mpi_core_bitlen(const mbedtls_mpi_uint * A,size_t A_limbs)5332b31808SJens Wiklander size_t mbedtls_mpi_core_bitlen(const mbedtls_mpi_uint *A, size_t A_limbs)
5432b31808SJens Wiklander {
55b0563631STom Van Eyck int i;
56b0563631STom Van Eyck size_t j;
5732b31808SJens Wiklander
58b0563631STom Van Eyck for (i = ((int) A_limbs) - 1; i >= 0; i--) {
5932b31808SJens Wiklander if (A[i] != 0) {
6032b31808SJens Wiklander j = biL - mbedtls_mpi_core_clz(A[i]);
6132b31808SJens Wiklander return (i * biL) + j;
6232b31808SJens Wiklander }
6332b31808SJens Wiklander }
6432b31808SJens Wiklander
65b0563631STom Van Eyck return 0;
6632b31808SJens Wiklander }
6732b31808SJens Wiklander
/*
 * Convert one limb from big-endian byte order to host byte order.
 *
 * On a big-endian host the value is returned unchanged; otherwise its bytes
 * are reversed with the byte-swap macro matching the limb width.
 */
static mbedtls_mpi_uint mpi_bigendian_to_host(mbedtls_mpi_uint a)
{
    if (MBEDTLS_IS_BIG_ENDIAN) {
        /* Already in host order. */
        return a;
    }

#if defined(MBEDTLS_HAVE_INT32)
    return (mbedtls_mpi_uint) MBEDTLS_BSWAP32(a);
#elif defined(MBEDTLS_HAVE_INT64)
    return (mbedtls_mpi_uint) MBEDTLS_BSWAP64(a);
#endif
}
8132b31808SJens Wiklander
/*
 * Convert a whole limb array, in place, from big-endian layout to the host
 * layout: the order of the limbs is reversed and each limb is passed through
 * mpi_bigendian_to_host().
 *
 * A        Limb array to convert in place.
 * A_limbs  Number of limbs in A; nothing is done when it is 0.
 */
void mbedtls_mpi_core_bigendian_to_host(mbedtls_mpi_uint *A,
                                        size_t A_limbs)
{
    if (A_limbs == 0) {
        return;
    }

    /* Two cursors move towards each other from both ends of the array.
     * Each step converts both limbs and exchanges them. With an odd limb
     * count the cursors meet on the middle limb, which is then converted
     * exactly once (the second store overwrites the first with the same
     * converted value). */
    mbedtls_mpi_uint *low = A;
    mbedtls_mpi_uint *high = A + (A_limbs - 1);

    while (low <= high) {
        const mbedtls_mpi_uint converted_low = mpi_bigendian_to_host(*low);

        *low = mpi_bigendian_to_host(*high);
        *high = converted_low;

        low++;
        high--;
    }
}
11132b31808SJens Wiklander
11232b31808SJens Wiklander /* Whether min <= A, in constant time.
11332b31808SJens Wiklander * A_limbs must be at least 1. */
mbedtls_mpi_core_uint_le_mpi(mbedtls_mpi_uint min,const mbedtls_mpi_uint * A,size_t A_limbs)114b0563631STom Van Eyck mbedtls_ct_condition_t mbedtls_mpi_core_uint_le_mpi(mbedtls_mpi_uint min,
11532b31808SJens Wiklander const mbedtls_mpi_uint *A,
11632b31808SJens Wiklander size_t A_limbs)
11732b31808SJens Wiklander {
11832b31808SJens Wiklander /* min <= least significant limb? */
119b0563631STom Van Eyck mbedtls_ct_condition_t min_le_lsl = mbedtls_ct_uint_ge(A[0], min);
12032b31808SJens Wiklander
12132b31808SJens Wiklander /* limbs other than the least significant one are all zero? */
122b0563631STom Van Eyck mbedtls_ct_condition_t msll_mask = MBEDTLS_CT_FALSE;
12332b31808SJens Wiklander for (size_t i = 1; i < A_limbs; i++) {
124b0563631STom Van Eyck msll_mask = mbedtls_ct_bool_or(msll_mask, mbedtls_ct_bool(A[i]));
12532b31808SJens Wiklander }
12632b31808SJens Wiklander
12732b31808SJens Wiklander /* min <= A iff the lowest limb of A is >= min or the other limbs
12832b31808SJens Wiklander * are not all zero. */
129b0563631STom Van Eyck return mbedtls_ct_bool_or(msll_mask, min_le_lsl);
130b0563631STom Van Eyck }
131b0563631STom Van Eyck
mbedtls_mpi_core_lt_ct(const mbedtls_mpi_uint * A,const mbedtls_mpi_uint * B,size_t limbs)132b0563631STom Van Eyck mbedtls_ct_condition_t mbedtls_mpi_core_lt_ct(const mbedtls_mpi_uint *A,
133b0563631STom Van Eyck const mbedtls_mpi_uint *B,
134b0563631STom Van Eyck size_t limbs)
135b0563631STom Van Eyck {
136b0563631STom Van Eyck mbedtls_ct_condition_t ret = MBEDTLS_CT_FALSE, cond = MBEDTLS_CT_FALSE, done = MBEDTLS_CT_FALSE;
137b0563631STom Van Eyck
138b0563631STom Van Eyck for (size_t i = limbs; i > 0; i--) {
139b0563631STom Van Eyck /*
140b0563631STom Van Eyck * If B[i - 1] < A[i - 1] then A < B is false and the result must
141b0563631STom Van Eyck * remain 0.
142b0563631STom Van Eyck *
143b0563631STom Van Eyck * Again even if we can make a decision, we just mark the result and
144b0563631STom Van Eyck * the fact that we are done and continue looping.
145b0563631STom Van Eyck */
146b0563631STom Van Eyck cond = mbedtls_ct_uint_lt(B[i - 1], A[i - 1]);
147b0563631STom Van Eyck done = mbedtls_ct_bool_or(done, cond);
148b0563631STom Van Eyck
149b0563631STom Van Eyck /*
150b0563631STom Van Eyck * If A[i - 1] < B[i - 1] then A < B is true.
151b0563631STom Van Eyck *
152b0563631STom Van Eyck * Again even if we can make a decision, we just mark the result and
153b0563631STom Van Eyck * the fact that we are done and continue looping.
154b0563631STom Van Eyck */
155b0563631STom Van Eyck cond = mbedtls_ct_uint_lt(A[i - 1], B[i - 1]);
156b0563631STom Van Eyck ret = mbedtls_ct_bool_or(ret, mbedtls_ct_bool_and(cond, mbedtls_ct_bool_not(done)));
157b0563631STom Van Eyck done = mbedtls_ct_bool_or(done, cond);
158b0563631STom Van Eyck }
159b0563631STom Van Eyck
160b0563631STom Van Eyck /*
161b0563631STom Van Eyck * If all the limbs were equal, then the numbers are equal, A < B is false
162b0563631STom Van Eyck * and leaving the result 0 is correct.
163b0563631STom Van Eyck */
164b0563631STom Van Eyck
165b0563631STom Van Eyck return ret;
16632b31808SJens Wiklander }
16732b31808SJens Wiklander
/*
 * Conditionally copy A into X, limb by limb, via mbedtls_ct_mpi_uint_if().
 *
 * X       Destination limbs.
 * A       Source limbs.
 * limbs   Number of limbs in both X and A.
 * assign  Condition: when true X receives A, otherwise X keeps its value.
 *
 * Nothing is done when X and A are the same buffer.
 */
void mbedtls_mpi_core_cond_assign(mbedtls_mpi_uint *X,
                                  const mbedtls_mpi_uint *A,
                                  size_t limbs,
                                  mbedtls_ct_condition_t assign)
{
    if (X != A) {
        /* A plain per-limb loop is used rather than mbedtls_ct_memcpy_if:
         * this routine is hot for RSA and, working on whole limbs, it never
         * has to deal with awkwardly sized data. */
        for (size_t idx = 0; idx != limbs; idx++) {
            X[idx] = mbedtls_ct_mpi_uint_if(assign, A[idx], X[idx]);
        }
    }
}
18632b31808SJens Wiklander
/*
 * Conditionally exchange the contents of X and Y, limb by limb, via
 * mbedtls_ct_mpi_uint_if().
 *
 * X, Y   Limb arrays of equal size.
 * limbs  Number of limbs in both arrays.
 * swap   Condition: when true the contents are exchanged, otherwise both
 *        arrays keep their values.
 *
 * Nothing is done when X and Y are the same buffer.
 */
void mbedtls_mpi_core_cond_swap(mbedtls_mpi_uint *X,
                                mbedtls_mpi_uint *Y,
                                size_t limbs,
                                mbedtls_ct_condition_t swap)
{
    if (X == Y) {
        return;
    }

    for (size_t idx = 0; idx < limbs; idx++) {
        /* Snapshot both limbs, then select each side's new value. */
        const mbedtls_mpi_uint x_before = X[idx];
        const mbedtls_mpi_uint y_before = Y[idx];

        X[idx] = mbedtls_ct_mpi_uint_if(swap, y_before, x_before);
        Y[idx] = mbedtls_ct_mpi_uint_if(swap, x_before, y_before);
    }
}
20232b31808SJens Wiklander
/*
 * Import a little-endian byte string into the limb array X.
 *
 * X             Destination limbs (may be NULL, in which case nothing is
 *               written).
 * X_limbs       Number of limbs available in X.
 * input         Bytes to import, least significant byte first.
 * input_length  Number of bytes in input.
 *
 * Returns 0 on success, or MBEDTLS_ERR_MPI_BUFFER_TOO_SMALL when X_limbs
 * limbs cannot hold input_length bytes.
 */
int mbedtls_mpi_core_read_le(mbedtls_mpi_uint *X,
                             size_t X_limbs,
                             const unsigned char *input,
                             size_t input_length)
{
    if (X_limbs < CHARS_TO_LIMBS(input_length)) {
        return MBEDTLS_ERR_MPI_BUFFER_TOO_SMALL;
    }

    if (X == NULL) {
        return 0;
    }

    /* Start from all-zero so limbs beyond the input end up cleared. */
    memset(X, 0, X_limbs * ciL);

    for (size_t byte_idx = 0; byte_idx < input_length; byte_idx++) {
        /* Byte k lands in limb k / ciL, shifted by 8 * (k % ciL) bits. */
        const size_t limb_idx = byte_idx / ciL;
        const size_t bit_shift = (byte_idx % ciL) << 3;

        X[limb_idx] |= ((mbedtls_mpi_uint) input[byte_idx]) << bit_shift;
    }

    return 0;
}
22532b31808SJens Wiklander
/*
 * Import a big-endian byte string into the limb array X.
 *
 * X             Destination limbs.
 * X_limbs       Number of limbs available in X.
 * input         Bytes to import, most significant byte first.
 * input_length  Number of bytes in input.
 *
 * Returns 0 on success, or MBEDTLS_ERR_MPI_BUFFER_TOO_SMALL when X_limbs
 * limbs cannot hold input_length bytes.
 */
int mbedtls_mpi_core_read_be(mbedtls_mpi_uint *X,
                             size_t X_limbs,
                             const unsigned char *input,
                             size_t input_length)
{
    if (X_limbs < CHARS_TO_LIMBS(input_length)) {
        return MBEDTLS_ERR_MPI_BUFFER_TOO_SMALL;
    }

    /* With no limbs at all, the size check above implies there is no input
     * either, so there is nothing to store. */
    if (X_limbs == 0) {
        return 0;
    }

    const size_t total_bytes = X_limbs * ciL;
    memset(X, 0, total_bytes);

    /* Right-align the input in the byte view of X. The copy is skipped for
     * empty input because memcpy() with (NULL, 0) is undefined behaviour. */
    if (input_length != 0) {
        unsigned char *raw = (unsigned char *) X;
        const size_t leading_pad = total_bytes - input_length;

        memcpy(raw + leading_pad, input, input_length);
    }

    /* X now holds a big-endian image; turn it into host limb layout. */
    mbedtls_mpi_core_bigendian_to_host(X, X_limbs);

    return 0;
}
25632b31808SJens Wiklander
mbedtls_mpi_core_write_le(const mbedtls_mpi_uint * A,size_t A_limbs,unsigned char * output,size_t output_length)25732b31808SJens Wiklander int mbedtls_mpi_core_write_le(const mbedtls_mpi_uint *A,
25832b31808SJens Wiklander size_t A_limbs,
25932b31808SJens Wiklander unsigned char *output,
26032b31808SJens Wiklander size_t output_length)
26132b31808SJens Wiklander {
26232b31808SJens Wiklander size_t stored_bytes = A_limbs * ciL;
26332b31808SJens Wiklander size_t bytes_to_copy;
26432b31808SJens Wiklander
26532b31808SJens Wiklander if (stored_bytes < output_length) {
26632b31808SJens Wiklander bytes_to_copy = stored_bytes;
26732b31808SJens Wiklander } else {
26832b31808SJens Wiklander bytes_to_copy = output_length;
26932b31808SJens Wiklander
27032b31808SJens Wiklander /* The output buffer is smaller than the allocated size of A.
27132b31808SJens Wiklander * However A may fit if its leading bytes are zero. */
27232b31808SJens Wiklander for (size_t i = bytes_to_copy; i < stored_bytes; i++) {
27332b31808SJens Wiklander if (GET_BYTE(A, i) != 0) {
27432b31808SJens Wiklander return MBEDTLS_ERR_MPI_BUFFER_TOO_SMALL;
27532b31808SJens Wiklander }
27632b31808SJens Wiklander }
27732b31808SJens Wiklander }
27832b31808SJens Wiklander
27932b31808SJens Wiklander for (size_t i = 0; i < bytes_to_copy; i++) {
28032b31808SJens Wiklander output[i] = GET_BYTE(A, i);
28132b31808SJens Wiklander }
28232b31808SJens Wiklander
28332b31808SJens Wiklander if (stored_bytes < output_length) {
28432b31808SJens Wiklander /* Write trailing 0 bytes */
28532b31808SJens Wiklander memset(output + stored_bytes, 0, output_length - stored_bytes);
28632b31808SJens Wiklander }
28732b31808SJens Wiklander
28832b31808SJens Wiklander return 0;
28932b31808SJens Wiklander }
29032b31808SJens Wiklander
mbedtls_mpi_core_write_be(const mbedtls_mpi_uint * X,size_t X_limbs,unsigned char * output,size_t output_length)29132b31808SJens Wiklander int mbedtls_mpi_core_write_be(const mbedtls_mpi_uint *X,
29232b31808SJens Wiklander size_t X_limbs,
29332b31808SJens Wiklander unsigned char *output,
29432b31808SJens Wiklander size_t output_length)
29532b31808SJens Wiklander {
29632b31808SJens Wiklander size_t stored_bytes;
29732b31808SJens Wiklander size_t bytes_to_copy;
29832b31808SJens Wiklander unsigned char *p;
29932b31808SJens Wiklander
30032b31808SJens Wiklander stored_bytes = X_limbs * ciL;
30132b31808SJens Wiklander
30232b31808SJens Wiklander if (stored_bytes < output_length) {
30332b31808SJens Wiklander /* There is enough space in the output buffer. Write initial
30432b31808SJens Wiklander * null bytes and record the position at which to start
30532b31808SJens Wiklander * writing the significant bytes. In this case, the execution
30632b31808SJens Wiklander * trace of this function does not depend on the value of the
30732b31808SJens Wiklander * number. */
30832b31808SJens Wiklander bytes_to_copy = stored_bytes;
30932b31808SJens Wiklander p = output + output_length - stored_bytes;
31032b31808SJens Wiklander memset(output, 0, output_length - stored_bytes);
31132b31808SJens Wiklander } else {
31232b31808SJens Wiklander /* The output buffer is smaller than the allocated size of X.
31332b31808SJens Wiklander * However X may fit if its leading bytes are zero. */
31432b31808SJens Wiklander bytes_to_copy = output_length;
31532b31808SJens Wiklander p = output;
31632b31808SJens Wiklander for (size_t i = bytes_to_copy; i < stored_bytes; i++) {
31732b31808SJens Wiklander if (GET_BYTE(X, i) != 0) {
31832b31808SJens Wiklander return MBEDTLS_ERR_MPI_BUFFER_TOO_SMALL;
31932b31808SJens Wiklander }
32032b31808SJens Wiklander }
32132b31808SJens Wiklander }
32232b31808SJens Wiklander
32332b31808SJens Wiklander for (size_t i = 0; i < bytes_to_copy; i++) {
32432b31808SJens Wiklander p[bytes_to_copy - i - 1] = GET_BYTE(X, i);
32532b31808SJens Wiklander }
32632b31808SJens Wiklander
32732b31808SJens Wiklander return 0;
32832b31808SJens Wiklander }
32932b31808SJens Wiklander
/*
 * Shift the limb array X right by count bits, in place. Bits shifted out at
 * the low end are discarded and zeros enter at the high end.
 *
 * X      Limbs to shift, least significant first.
 * limbs  Number of limbs in X.
 * count  Number of bit positions to shift by.
 */
void mbedtls_mpi_core_shift_r(mbedtls_mpi_uint *X, size_t limbs,
                              size_t count)
{
    const size_t limb_shift = count / biL;       /* whole limbs */
    const size_t bit_shift = count & (biL - 1);  /* remaining bits */

    /* Shifting by more bits than X holds leaves nothing but zeros. */
    if (limb_shift > limbs || (limb_shift == limbs && bit_shift > 0)) {
        memset(X, 0, limbs * ciL);
        return;
    }

    /* Whole-limb part: move limbs down, then clear the vacated top. */
    if (limb_shift > 0) {
        size_t idx = 0;

        for (; idx < limbs - limb_shift; idx++) {
            X[idx] = X[idx + limb_shift];
        }
        for (; idx < limbs; idx++) {
            X[idx] = 0;
        }
    }

    /* Sub-limb part: go from the top limb down, handing the bits that fall
     * off each limb to the limb below it. */
    if (bit_shift > 0) {
        mbedtls_mpi_uint carried = 0;

        for (size_t idx = limbs; idx > 0; idx--) {
            const mbedtls_mpi_uint limb = X[idx - 1];

            X[idx - 1] = (limb >> bit_shift) | carried;
            carried = limb << (biL - bit_shift);
        }
    }
}
36932b31808SJens Wiklander
/*
 * Shift the limb array X left by count bits, in place. Bits shifted out at
 * the high end are discarded and zeros enter at the low end.
 *
 * X      Limbs to shift, least significant first.
 * limbs  Number of limbs in X.
 * count  Number of bit positions to shift by.
 */
void mbedtls_mpi_core_shift_l(mbedtls_mpi_uint *X, size_t limbs,
                              size_t count)
{
    const size_t limb_shift = count / (biL);     /* whole limbs */
    const size_t bit_shift = count & (biL - 1);  /* remaining bits */

    /* Whole-limb part: move limbs up starting from the top so nothing is
     * overwritten before it is read, then clear the vacated bottom. */
    if (limb_shift > 0) {
        size_t idx = limbs;

        for (; idx > limb_shift; idx--) {
            X[idx - 1] = X[idx - limb_shift - 1];
        }
        for (; idx > 0; idx--) {
            X[idx - 1] = 0;
        }
    }

    /* Sub-limb part: limbs below limb_shift are already zero, so start
     * there and hand the bits that fall off each limb to the one above. */
    if (bit_shift > 0) {
        mbedtls_mpi_uint carried = 0;

        for (size_t idx = limb_shift; idx < limbs; idx++) {
            const mbedtls_mpi_uint limb = X[idx];

            X[idx] = (limb << bit_shift) | carried;
            carried = limb >> (biL - bit_shift);
        }
    }
}
404b0563631STom Van Eyck
/*
 * Compute X = A + B over limb arrays of equal size.
 *
 * X      Destination limbs.
 * A, B   Operands, least significant limb first.
 * limbs  Number of limbs in X, A and B.
 *
 * Returns the carry out of the most significant limb (0 or 1).
 */
mbedtls_mpi_uint mbedtls_mpi_core_add(mbedtls_mpi_uint *X,
                                      const mbedtls_mpi_uint *A,
                                      const mbedtls_mpi_uint *B,
                                      size_t limbs)
{
    mbedtls_mpi_uint carry = 0;

    for (size_t idx = 0; idx < limbs; idx++) {
        const mbedtls_mpi_uint a_limb = A[idx];
        const mbedtls_mpi_uint b_limb = B[idx];

        /* Add in two steps; an unsigned sum smaller than one of its
         * addends means that step wrapped around. */
        mbedtls_mpi_uint sum = carry + a_limb;
        carry = (sum < a_limb);
        sum += b_limb;
        carry += (sum < b_limb);

        X[idx] = sum;
    }

    return carry;
}
42232b31808SJens Wiklander
/*
 * Conditionally add A to X in place: X += A when cond is non-zero, X is
 * left with the same value otherwise. The addend is selected through
 * mbedtls_ct_mpi_uint_if_else_0() and the same additions are executed in
 * both cases.
 *
 * X      Accumulator limbs, updated in place.
 * A      Limbs to add.
 * limbs  Number of limbs in X and A.
 * cond   Non-zero to perform the addition.
 *
 * Returns the carry out of the most significant limb.
 */
mbedtls_mpi_uint mbedtls_mpi_core_add_if(mbedtls_mpi_uint *X,
                                         const mbedtls_mpi_uint *A,
                                         size_t limbs,
                                         unsigned cond)
{
    const mbedtls_ct_condition_t do_add = mbedtls_ct_bool(cond);
    mbedtls_mpi_uint carry = 0;

    for (size_t idx = 0; idx < limbs; idx++) {
        /* Either A[idx] or 0, depending on the condition. */
        const mbedtls_mpi_uint addend =
            mbedtls_ct_mpi_uint_if_else_0(do_add, A[idx]);
        const mbedtls_mpi_uint x_limb = X[idx];

        mbedtls_mpi_uint sum = carry + x_limb;
        carry = (sum < x_limb);
        sum += addend;
        carry += (sum < addend);

        X[idx] = sum;
    }

    return carry;
}
44332b31808SJens Wiklander
/*
 * Compute X = A - B over limb arrays of equal size.
 *
 * X      Destination limbs.
 * A, B   Operands, least significant limb first.
 * limbs  Number of limbs in X, A and B.
 *
 * Returns the borrow out of the most significant limb (0 or 1).
 */
mbedtls_mpi_uint mbedtls_mpi_core_sub(mbedtls_mpi_uint *X,
                                      const mbedtls_mpi_uint *A,
                                      const mbedtls_mpi_uint *B,
                                      size_t limbs)
{
    mbedtls_mpi_uint borrow = 0;

    for (size_t idx = 0; idx < limbs; idx++) {
        const mbedtls_mpi_uint a_limb = A[idx];
        const mbedtls_mpi_uint b_limb = B[idx];

        /* First take the incoming borrow off A's limb, then subtract B's
         * limb; either step may underflow. */
        const mbedtls_mpi_uint borrow_from_carry = (a_limb < borrow);
        const mbedtls_mpi_uint partial = a_limb - borrow;

        borrow = (partial < b_limb) + borrow_from_carry;
        X[idx] = partial - b_limb;
    }

    return borrow;
}
46032b31808SJens Wiklander
/*
 * Multiply-accumulate: d += s * b, where b is a single limb.
 *
 * d      Accumulator limbs, updated in place.
 * d_len  Number of limbs in d.
 * s      Limbs to multiply by b.
 * s_len  Number of limbs in s; expected to be at most d_len.
 * b      Scalar multiplier.
 *
 * Returns the carry left over after the last limb of d.
 *
 * The names d, s, c and b are kept as-is because the MULADDC_* macros from
 * bn_mul.h operate on variables with exactly these names.
 */
mbedtls_mpi_uint mbedtls_mpi_core_mla(mbedtls_mpi_uint *d, size_t d_len,
                                      const mbedtls_mpi_uint *s, size_t s_len,
                                      mbedtls_mpi_uint b)
{
    mbedtls_mpi_uint c = 0; /* carry */

    /* d_len >= s_len is a precondition. If it is violated, clamp s_len to
     * d_len: the result is then wrong, but nothing is written past d. */
    if (d_len < s_len) {
        s_len = d_len;
    }

    const size_t tail_limbs = d_len - s_len;

    /* Process s eight limbs at a time... */
    for (size_t blocks = s_len / 8; blocks > 0; blocks--) {
        MULADDC_X8_INIT
        MULADDC_X8_CORE
            MULADDC_X8_STOP
    }

    /* ...then the remaining (s_len % 8) limbs one by one. */
    for (size_t singles = s_len & 7; singles > 0; singles--) {
        MULADDC_X1_INIT
        MULADDC_X1_CORE
            MULADDC_X1_STOP
    }

    /* Ripple the carry through the limbs of d that lie beyond s. */
    for (size_t left = tail_limbs; left > 0; left--) {
        *d += c;
        c = (*d < c);
        d++;
    }

    return c;
}
49832b31808SJens Wiklander
/*
 * Compute the full product X = A * B.
 *
 * X        Destination; A_limbs + B_limbs limbs are cleared and written.
 * A        First operand, A_limbs limbs.
 * B        Second operand, B_limbs limbs.
 *
 * The product is built up one limb of B at a time: for each B[i], A * B[i]
 * is accumulated into X at an offset of i limbs.
 */
void mbedtls_mpi_core_mul(mbedtls_mpi_uint *X,
                          const mbedtls_mpi_uint *A, size_t A_limbs,
                          const mbedtls_mpi_uint *B, size_t B_limbs)
{
    memset(X, 0, (A_limbs + B_limbs) * ciL);

    mbedtls_mpi_uint *partial = X;
    for (size_t idx = 0; idx < B_limbs; idx++, partial++) {
        /* One extra destination limb absorbs the carry of this row. */
        (void) mbedtls_mpi_core_mla(partial, A_limbs + 1,
                                    A, A_limbs, B[idx]);
    }
}
509b0563631STom Van Eyck
51032b31808SJens Wiklander /*
51132b31808SJens Wiklander * Fast Montgomery initialization (thanks to Tom St Denis).
51232b31808SJens Wiklander */
mbedtls_mpi_core_montmul_init(const mbedtls_mpi_uint * N)51332b31808SJens Wiklander mbedtls_mpi_uint mbedtls_mpi_core_montmul_init(const mbedtls_mpi_uint *N)
51432b31808SJens Wiklander {
51532b31808SJens Wiklander mbedtls_mpi_uint x = N[0];
51632b31808SJens Wiklander
51732b31808SJens Wiklander x += ((N[0] + 2) & 4) << 1;
51832b31808SJens Wiklander
51932b31808SJens Wiklander for (unsigned int i = biL; i >= 8; i /= 2) {
52032b31808SJens Wiklander x *= (2 - (N[0] * x));
52132b31808SJens Wiklander }
52232b31808SJens Wiklander
52332b31808SJens Wiklander return ~x + 1;
52432b31808SJens Wiklander }
52532b31808SJens Wiklander
/*
 * Montgomery multiplication: X = A * B * R^-1 mod N, where R is
 * 2^(biL * AN_limbs).
 *
 * X         Result, AN_limbs limbs.
 * A         First operand, AN_limbs limbs.
 * B         Second operand, B_limbs limbs.
 * B_limbs   Number of limbs in B.
 * N         Modulus, AN_limbs limbs.
 * AN_limbs  Number of limbs in X, A and N.
 * mm        Montgomery constant for N (see mbedtls_mpi_core_montmul_init()).
 * T         Scratch space of 2 * AN_limbs + 1 limbs; its contents are
 *           overwritten.
 */
void mbedtls_mpi_core_montmul(mbedtls_mpi_uint *X,
                              const mbedtls_mpi_uint *A,
                              const mbedtls_mpi_uint *B,
                              size_t B_limbs,
                              const mbedtls_mpi_uint *N,
                              size_t AN_limbs,
                              mbedtls_mpi_uint mm,
                              mbedtls_mpi_uint *T)
{
    memset(T, 0, (2 * AN_limbs + 1) * ciL);

    /* The running value lives in a window of T that slides up by one limb
     * per iteration; sliding the window is the division by 2^biL. */
    mbedtls_mpi_uint *acc = T;

    for (size_t idx = 0; idx < AN_limbs; idx++, acc++) {
        /* acc = (acc + u0*B + u1*N) / 2^biL */
        const mbedtls_mpi_uint u0 = A[idx];
        const mbedtls_mpi_uint u1 = (acc[0] + u0 * B[0]) * mm;

        (void) mbedtls_mpi_core_mla(acc, AN_limbs + 2, B, B_limbs, u0);
        (void) mbedtls_mpi_core_mla(acc, AN_limbs + 2, N, AN_limbs, u1);
    }

    /*
     * The wanted result is (acc >= N) ? acc - N : acc.
     *
     * To keep the execution flow independent of the data, the subtraction
     * is always carried out, with its result going to X, and the limb just
     * above the window is inspected for a carry from the final additions.
     */
    const mbedtls_mpi_uint carry = acc[AN_limbs];
    const mbedtls_mpi_uint borrow = mbedtls_mpi_core_sub(X, acc, N, AN_limbs);

    /*
     * With R = 2^(biL * AN_limbs), acc falls in one of three ranges:
     *
     *   acc < N       : (carry, borrow) = (0, 1) -> keep acc
     *   N <= acc < R  : (carry, borrow) = (0, 0) -> keep X
     *   acc >= R      : (carry, borrow) = (1, 1) -> keep X
     *
     * (carry, borrow) = (1, 0) cannot occur. Hence X is already correct
     * when carry ^ borrow is 0, and must be replaced by the low AN_limbs
     * limbs of acc when carry ^ borrow is 1.
     */
    mbedtls_ct_memcpy_if(mbedtls_ct_bool(carry ^ borrow),
                         (unsigned char *) X,
                         (unsigned char *) acc,
                         NULL,
                         AN_limbs * sizeof(mbedtls_mpi_uint));
}
58132b31808SJens Wiklander
/*
 * Compute X = 2^(2 * biL * N->n) mod N, i.e. R^2 mod N for the Montgomery
 * radix R = 2^(biL * N->n).
 *
 * X  Receives the result.
 * N  Modulus.
 *
 * Returns 0 on success, or the error code of the first mbedtls_mpi_*
 * call that fails.
 */
int mbedtls_mpi_core_get_mont_r2_unsafe(mbedtls_mpi *X,
                                        const mbedtls_mpi *N)
{
    int ret = MBEDTLS_ERR_ERROR_CORRUPTION_DETECTED;
    const size_t n_limbs = N->n;

    /* Build 2^(2 * biL * n_limbs) as 1 shifted left, then reduce it. */
    MBEDTLS_MPI_CHK(mbedtls_mpi_lset(X, 1));
    MBEDTLS_MPI_CHK(mbedtls_mpi_shift_l(X, n_limbs * 2 * biL));
    MBEDTLS_MPI_CHK(mbedtls_mpi_mod_mpi(X, X, N));

    /* Bring X's limb allocation in line with N's. */
    MBEDTLS_MPI_CHK(mbedtls_mpi_shrink(X, n_limbs));

cleanup:
    return ret;
}
59532b31808SJens Wiklander
59632b31808SJens Wiklander MBEDTLS_STATIC_TESTABLE
mbedtls_mpi_core_ct_uint_table_lookup(mbedtls_mpi_uint * dest,const mbedtls_mpi_uint * table,size_t limbs,size_t count,size_t index)59732b31808SJens Wiklander void mbedtls_mpi_core_ct_uint_table_lookup(mbedtls_mpi_uint *dest,
59832b31808SJens Wiklander const mbedtls_mpi_uint *table,
59932b31808SJens Wiklander size_t limbs,
60032b31808SJens Wiklander size_t count,
60132b31808SJens Wiklander size_t index)
60232b31808SJens Wiklander {
60332b31808SJens Wiklander for (size_t i = 0; i < count; i++, table += limbs) {
604b0563631STom Van Eyck mbedtls_ct_condition_t assign = mbedtls_ct_uint_eq(i, index);
60532b31808SJens Wiklander mbedtls_mpi_core_cond_assign(dest, table, limbs, assign);
60632b31808SJens Wiklander }
60732b31808SJens Wiklander }
60832b31808SJens Wiklander
60932b31808SJens Wiklander /* Fill X with n_bytes random bytes.
61032b31808SJens Wiklander * X must already have room for those bytes.
61132b31808SJens Wiklander * The ordering of the bytes returned from the RNG is suitable for
61232b31808SJens Wiklander * deterministic ECDSA (see RFC 6979 §3.3 and the specification of
61332b31808SJens Wiklander * mbedtls_mpi_core_random()).
61432b31808SJens Wiklander */
mbedtls_mpi_core_fill_random(mbedtls_mpi_uint * X,size_t X_limbs,size_t n_bytes,int (* f_rng)(void *,unsigned char *,size_t),void * p_rng)61532b31808SJens Wiklander int mbedtls_mpi_core_fill_random(
61632b31808SJens Wiklander mbedtls_mpi_uint *X, size_t X_limbs,
61732b31808SJens Wiklander size_t n_bytes,
61832b31808SJens Wiklander int (*f_rng)(void *, unsigned char *, size_t), void *p_rng)
61932b31808SJens Wiklander {
62032b31808SJens Wiklander int ret = MBEDTLS_ERR_ERROR_CORRUPTION_DETECTED;
62132b31808SJens Wiklander const size_t limbs = CHARS_TO_LIMBS(n_bytes);
62232b31808SJens Wiklander const size_t overhead = (limbs * ciL) - n_bytes;
62332b31808SJens Wiklander
62432b31808SJens Wiklander if (X_limbs < limbs) {
62532b31808SJens Wiklander return MBEDTLS_ERR_MPI_BAD_INPUT_DATA;
62632b31808SJens Wiklander }
62732b31808SJens Wiklander
62832b31808SJens Wiklander memset(X, 0, overhead);
62932b31808SJens Wiklander memset((unsigned char *) X + limbs * ciL, 0, (X_limbs - limbs) * ciL);
63032b31808SJens Wiklander MBEDTLS_MPI_CHK(f_rng(p_rng, (unsigned char *) X + overhead, n_bytes));
63132b31808SJens Wiklander mbedtls_mpi_core_bigendian_to_host(X, limbs);
63232b31808SJens Wiklander
63332b31808SJens Wiklander cleanup:
63432b31808SJens Wiklander return ret;
63532b31808SJens Wiklander }
63632b31808SJens Wiklander
/*
 * Draw a random X with min <= X < N by rejection sampling.
 *
 * X and N both have `limbs` limbs. Each attempt fills X with as many random
 * bytes as needed to cover the bit length of N, shifts away the surplus low
 * bits, and checks the range.
 *
 * Returns 0 once a candidate in range has been found, the error from
 * mbedtls_mpi_core_fill_random() if the RNG fails, or
 * MBEDTLS_ERR_MPI_NOT_ACCEPTABLE when the attempt budget is exhausted. The
 * budget is checked before the range test, so the candidate produced by the
 * final permitted attempt is never accepted.
 */
int mbedtls_mpi_core_random(mbedtls_mpi_uint *X,
                            mbedtls_mpi_uint min,
                            const mbedtls_mpi_uint *N,
                            size_t limbs,
                            int (*f_rng)(void *, unsigned char *, size_t),
                            void *p_rng)
{
    int ret = MBEDTLS_ERR_ERROR_CORRUPTION_DETECTED;
    const size_t bit_len = mbedtls_mpi_core_bitlen(N, limbs);
    const size_t byte_len = (bit_len + 7) / 8;
    /* Bits generated beyond the bit length of N; dropped on every attempt. */
    const size_t surplus_bits = 8 * byte_len - bit_len;

    /*
     * With min == 0, a single attempt fails with probability at most 1/2
     * (the most significant bit is 0 with probability 1/2, and then the
     * candidate is below N), so after 30 attempts the failure probability
     * is at most 2**(-30).
     *
     * If N is just below a power of 2, as for random scalars on most
     * elliptic curves, one attempt suffices with overwhelming probability.
     * If N is just above a power of 2, as for random scalars on secp224k1,
     * each attempt fails with probability close to 1/2.
     *
     * The picture is nearly the same when min is nonzero but negligible
     * compared to N, which always holds for crypto-sized N. Small N is
     * supported for testing convenience; it gets a larger budget because
     * otherwise the failure probability would be macroscopic.
     */
    int tries_left = 250;
    if (byte_len > 4) {
        tries_left = 30;
    }

    /*
     * Follow the procedure of RFC 6979 §3.3 (deterministic ECDSA) when f_rng
     * is a suitably parametrized HMAC_DRBG instance:
     * - same byte ordering;
     * - keep the leftmost bit_len bits of the generated octet string;
     * - retry until the result lies in the desired range.
     * This also avoids any bias, which matters especially for ECDSA.
     */
    for (;;) {
        MBEDTLS_MPI_CHK(mbedtls_mpi_core_fill_random(X, limbs,
                                                     byte_len,
                                                     f_rng, p_rng));
        mbedtls_mpi_core_shift_r(X, limbs, surplus_bits);

        tries_left--;
        if (tries_left == 0) {
            ret = MBEDTLS_ERR_MPI_NOT_ACCEPTABLE;
            break;
        }

        mbedtls_ct_condition_t min_ok = mbedtls_mpi_core_uint_le_mpi(min, X, limbs);
        mbedtls_ct_condition_t max_ok = mbedtls_mpi_core_lt_ct(X, N, limbs);

        if (mbedtls_ct_bool_and(min_ok, max_ok) != MBEDTLS_CT_FALSE) {
            /* Candidate accepted; ret is 0 from the successful fill. */
            break;
        }
    }

cleanup:
    return ret;
}
69432b31808SJens Wiklander
/*
 * Choose the exponentiation window size (in bits) for an exponent of Ebits
 * bits.
 *
 * Larger exponents get larger windows, capped by the compile-time setting
 * MBEDTLS_MPI_WINDOW_SIZE. Exponents of at most 79 bits, or a configuration
 * with MBEDTLS_MPI_WINDOW_SIZE <= 1, always yield a window of 1.
 */
static size_t exp_mod_get_window_size(size_t Ebits)
{
#if MBEDTLS_MPI_WINDOW_SIZE >= 6
    if (Ebits > 671) {
        return 6;
    }
    if (Ebits > 239) {
        return 5;
    }
    if (Ebits > 79) {
        return 4;
    }
    return 1;
#elif MBEDTLS_MPI_WINDOW_SIZE == 5
    if (Ebits > 239) {
        return 5;
    }
    if (Ebits > 79) {
        return 4;
    }
    return 1;
#elif MBEDTLS_MPI_WINDOW_SIZE > 1
    if (Ebits > 79) {
        return MBEDTLS_MPI_WINDOW_SIZE;
    }
    return 1;
#else
    /* Windowing disabled: the exponent size is irrelevant. */
    (void) Ebits;
    return 1;
#endif
}
70832b31808SJens Wiklander
mbedtls_mpi_core_exp_mod_working_limbs(size_t AN_limbs,size_t E_limbs)70932b31808SJens Wiklander size_t mbedtls_mpi_core_exp_mod_working_limbs(size_t AN_limbs, size_t E_limbs)
71032b31808SJens Wiklander {
71132b31808SJens Wiklander const size_t wsize = exp_mod_get_window_size(E_limbs * biL);
71232b31808SJens Wiklander const size_t welem = ((size_t) 1) << wsize;
71332b31808SJens Wiklander
71432b31808SJens Wiklander /* How big does each part of the working memory pool need to be? */
71532b31808SJens Wiklander const size_t table_limbs = welem * AN_limbs;
71632b31808SJens Wiklander const size_t select_limbs = AN_limbs;
71732b31808SJens Wiklander const size_t temp_limbs = 2 * AN_limbs + 1;
71832b31808SJens Wiklander
71932b31808SJens Wiklander return table_limbs + select_limbs + temp_limbs;
72032b31808SJens Wiklander }
72132b31808SJens Wiklander
/*
 * Fill Wtable with welem consecutive entries of AN_limbs limbs each:
 * entry 0 is 1 and entry 1 is A, both in Montgomery presentation, and every
 * later entry is the Montgomery product of its predecessor with entry 1.
 *
 * A must already be in Montgomery presentation. mm and temp are passed
 * through to mbedtls_mpi_core_montmul(). The first two entries are written
 * unconditionally, so Wtable must hold at least two entries.
 */
static void exp_mod_precompute_window(const mbedtls_mpi_uint *A,
                                      const mbedtls_mpi_uint *N,
                                      size_t AN_limbs,
                                      mbedtls_mpi_uint mm,
                                      const mbedtls_mpi_uint *RR,
                                      size_t welem,
                                      mbedtls_mpi_uint *Wtable,
                                      mbedtls_mpi_uint *temp)
{
    const size_t entry_bytes = AN_limbs * ciL;
    mbedtls_mpi_uint *const base = Wtable + AN_limbs;   /* W[1] */

    /* W[0] = 1 (in Montgomery presentation): start from the plain integer 1
     * and multiply it by RR. */
    memset(Wtable, 0, entry_bytes);
    Wtable[0] = 1;
    mbedtls_mpi_core_montmul(Wtable, Wtable, RR, AN_limbs, N, AN_limbs, mm, temp);

    /* W[1] = A (already in Montgomery presentation) */
    memcpy(base, A, entry_bytes);

    /* W[k] = W[k-1] * W[1] for k >= 2 */
    for (size_t k = 2; k < welem; k++) {
        mbedtls_mpi_uint *const dst = Wtable + k * AN_limbs;
        const mbedtls_mpi_uint *const prev = dst - AN_limbs;

        mbedtls_mpi_core_montmul(dst, prev, base, AN_limbs, N, AN_limbs, mm, temp);
    }
}
74832b31808SJens Wiklander
#if defined(MBEDTLS_TEST_HOOKS) && !defined(MBEDTLS_THREADING_C)
/*
 * Optional test callbacks, unset (NULL) by default. When set, the
 * exponentiation helpers in this file call the "safe" hook each time they
 * take the code path meant for secret data, and the "unsafe" hook each time
 * they take the code path meant for public data.
 */
void (*mbedtls_safe_codepath_hook)(void) = NULL;
void (*mbedtls_unsafe_codepath_hook)(void) = NULL;
#endif
753cb034002SJerome Forissier
754cb034002SJerome Forissier /*
755cb034002SJerome Forissier * This function calculates the indices of the exponent where the exponentiation algorithm should
756cb034002SJerome Forissier * start processing.
757cb034002SJerome Forissier *
758cb034002SJerome Forissier * Warning! If the parameter E_public has MBEDTLS_MPI_IS_PUBLIC as its value,
759cb034002SJerome Forissier * this function is not constant time with respect to the exponent (parameter E).
760cb034002SJerome Forissier */
exp_mod_calc_first_bit_optionally_safe(const mbedtls_mpi_uint * E,size_t E_limbs,int E_public,size_t * E_limb_index,size_t * E_bit_index)761cb034002SJerome Forissier static inline void exp_mod_calc_first_bit_optionally_safe(const mbedtls_mpi_uint *E,
762cb034002SJerome Forissier size_t E_limbs,
763cb034002SJerome Forissier int E_public,
764cb034002SJerome Forissier size_t *E_limb_index,
765cb034002SJerome Forissier size_t *E_bit_index)
766cb034002SJerome Forissier {
767cb034002SJerome Forissier if (E_public == MBEDTLS_MPI_IS_PUBLIC) {
768cb034002SJerome Forissier /*
769cb034002SJerome Forissier * Skip leading zero bits.
770cb034002SJerome Forissier */
771cb034002SJerome Forissier size_t E_bits = mbedtls_mpi_core_bitlen(E, E_limbs);
772cb034002SJerome Forissier if (E_bits == 0) {
773cb034002SJerome Forissier /*
774cb034002SJerome Forissier * If E is 0 mbedtls_mpi_core_bitlen() returns 0. Even if that is the case, we will want
775cb034002SJerome Forissier * to represent it as a single 0 bit and as such the bitlength will be 1.
776cb034002SJerome Forissier */
777cb034002SJerome Forissier E_bits = 1;
778cb034002SJerome Forissier }
779cb034002SJerome Forissier
780cb034002SJerome Forissier *E_limb_index = E_bits / biL;
781cb034002SJerome Forissier *E_bit_index = E_bits % biL;
782cb034002SJerome Forissier
783cb034002SJerome Forissier #if defined(MBEDTLS_TEST_HOOKS) && !defined(MBEDTLS_THREADING_C)
784*c3deb3d6SEtienne Carriere if (mbedtls_unsafe_codepath_hook != NULL) {
785*c3deb3d6SEtienne Carriere mbedtls_unsafe_codepath_hook();
786*c3deb3d6SEtienne Carriere }
787cb034002SJerome Forissier #endif
788cb034002SJerome Forissier } else {
789cb034002SJerome Forissier /*
790cb034002SJerome Forissier * Here we need to be constant time with respect to E and can't do anything better than
791cb034002SJerome Forissier * start at the first allocated bit.
792cb034002SJerome Forissier */
793cb034002SJerome Forissier *E_limb_index = E_limbs;
794cb034002SJerome Forissier *E_bit_index = 0;
795cb034002SJerome Forissier #if defined(MBEDTLS_TEST_HOOKS) && !defined(MBEDTLS_THREADING_C)
796*c3deb3d6SEtienne Carriere if (mbedtls_safe_codepath_hook != NULL) {
797*c3deb3d6SEtienne Carriere mbedtls_safe_codepath_hook();
798cb034002SJerome Forissier }
799cb034002SJerome Forissier #endif
800cb034002SJerome Forissier }
801cb034002SJerome Forissier }
802cb034002SJerome Forissier
803cb034002SJerome Forissier /*
804cb034002SJerome Forissier * Warning! If the parameter window_public has MBEDTLS_MPI_IS_PUBLIC as its value, this function is
805cb034002SJerome Forissier * not constant time with respect to the window parameter and consequently the exponent of the
806cb034002SJerome Forissier * exponentiation (parameter E of mbedtls_mpi_core_exp_mod_optionally_safe).
807cb034002SJerome Forissier */
exp_mod_table_lookup_optionally_safe(mbedtls_mpi_uint * Wselect,mbedtls_mpi_uint * Wtable,size_t AN_limbs,size_t welem,mbedtls_mpi_uint window,int window_public)808cb034002SJerome Forissier static inline void exp_mod_table_lookup_optionally_safe(mbedtls_mpi_uint *Wselect,
809cb034002SJerome Forissier mbedtls_mpi_uint *Wtable,
810cb034002SJerome Forissier size_t AN_limbs, size_t welem,
811cb034002SJerome Forissier mbedtls_mpi_uint window,
812cb034002SJerome Forissier int window_public)
813cb034002SJerome Forissier {
814cb034002SJerome Forissier if (window_public == MBEDTLS_MPI_IS_PUBLIC) {
815cb034002SJerome Forissier memcpy(Wselect, Wtable + window * AN_limbs, AN_limbs * ciL);
816cb034002SJerome Forissier #if defined(MBEDTLS_TEST_HOOKS) && !defined(MBEDTLS_THREADING_C)
817*c3deb3d6SEtienne Carriere if (mbedtls_unsafe_codepath_hook != NULL) {
818*c3deb3d6SEtienne Carriere mbedtls_unsafe_codepath_hook();
819*c3deb3d6SEtienne Carriere }
820cb034002SJerome Forissier #endif
821cb034002SJerome Forissier } else {
822cb034002SJerome Forissier /* Select Wtable[window] without leaking window through
823cb034002SJerome Forissier * memory access patterns. */
824cb034002SJerome Forissier mbedtls_mpi_core_ct_uint_table_lookup(Wselect, Wtable,
825cb034002SJerome Forissier AN_limbs, welem, window);
826cb034002SJerome Forissier #if defined(MBEDTLS_TEST_HOOKS) && !defined(MBEDTLS_THREADING_C)
827*c3deb3d6SEtienne Carriere if (mbedtls_safe_codepath_hook != NULL) {
828*c3deb3d6SEtienne Carriere mbedtls_safe_codepath_hook();
829cb034002SJerome Forissier }
830cb034002SJerome Forissier #endif
831cb034002SJerome Forissier }
832cb034002SJerome Forissier }
833cb034002SJerome Forissier
83432b31808SJens Wiklander /* Exponentiation: X := A^E mod N.
83532b31808SJens Wiklander *
836cb034002SJerome Forissier * Warning! If the parameter E_public has MBEDTLS_MPI_IS_PUBLIC as its value,
837cb034002SJerome Forissier * this function is not constant time with respect to the exponent (parameter E).
838cb034002SJerome Forissier *
83932b31808SJens Wiklander * A must already be in Montgomery form.
84032b31808SJens Wiklander *
84132b31808SJens Wiklander * As in other bignum functions, assume that AN_limbs and E_limbs are nonzero.
84232b31808SJens Wiklander *
84332b31808SJens Wiklander * RR must contain 2^{2*biL} mod N.
84432b31808SJens Wiklander *
84532b31808SJens Wiklander * The algorithm is a variant of Left-to-right k-ary exponentiation: HAC 14.82
84632b31808SJens Wiklander * (The difference is that the body in our loop processes a single bit instead
84732b31808SJens Wiklander * of a full window.)
84832b31808SJens Wiklander */
mbedtls_mpi_core_exp_mod_optionally_safe(mbedtls_mpi_uint * X,const mbedtls_mpi_uint * A,const mbedtls_mpi_uint * N,size_t AN_limbs,const mbedtls_mpi_uint * E,size_t E_limbs,int E_public,const mbedtls_mpi_uint * RR,mbedtls_mpi_uint * T)849cb034002SJerome Forissier static void mbedtls_mpi_core_exp_mod_optionally_safe(mbedtls_mpi_uint *X,
85032b31808SJens Wiklander const mbedtls_mpi_uint *A,
85132b31808SJens Wiklander const mbedtls_mpi_uint *N,
85232b31808SJens Wiklander size_t AN_limbs,
85332b31808SJens Wiklander const mbedtls_mpi_uint *E,
85432b31808SJens Wiklander size_t E_limbs,
855cb034002SJerome Forissier int E_public,
85632b31808SJens Wiklander const mbedtls_mpi_uint *RR,
85732b31808SJens Wiklander mbedtls_mpi_uint *T)
85832b31808SJens Wiklander {
859cb034002SJerome Forissier /* We'll process the bits of E from most significant
860cb034002SJerome Forissier * (limb_index=E_limbs-1, E_bit_index=biL-1) to least significant
861cb034002SJerome Forissier * (limb_index=0, E_bit_index=0). */
862*c3deb3d6SEtienne Carriere size_t E_limb_index = E_limbs;
863*c3deb3d6SEtienne Carriere size_t E_bit_index = 0;
864cb034002SJerome Forissier exp_mod_calc_first_bit_optionally_safe(E, E_limbs, E_public,
865cb034002SJerome Forissier &E_limb_index, &E_bit_index);
866cb034002SJerome Forissier
867cb034002SJerome Forissier const size_t wsize = exp_mod_get_window_size(E_limb_index * biL);
86832b31808SJens Wiklander const size_t welem = ((size_t) 1) << wsize;
86932b31808SJens Wiklander
87032b31808SJens Wiklander /* This is how we will use the temporary storage T, which must have space
87132b31808SJens Wiklander * for table_limbs, select_limbs and (2 * AN_limbs + 1) for montmul. */
87232b31808SJens Wiklander const size_t table_limbs = welem * AN_limbs;
87332b31808SJens Wiklander const size_t select_limbs = AN_limbs;
87432b31808SJens Wiklander
87532b31808SJens Wiklander /* Pointers to specific parts of the temporary working memory pool */
87632b31808SJens Wiklander mbedtls_mpi_uint *const Wtable = T;
87732b31808SJens Wiklander mbedtls_mpi_uint *const Wselect = Wtable + table_limbs;
87832b31808SJens Wiklander mbedtls_mpi_uint *const temp = Wselect + select_limbs;
87932b31808SJens Wiklander
88032b31808SJens Wiklander /*
88132b31808SJens Wiklander * Window precomputation
88232b31808SJens Wiklander */
88332b31808SJens Wiklander
88432b31808SJens Wiklander const mbedtls_mpi_uint mm = mbedtls_mpi_core_montmul_init(N);
88532b31808SJens Wiklander
886cb034002SJerome Forissier /* Set Wtable[i] = A^i (in Montgomery representation) */
88732b31808SJens Wiklander exp_mod_precompute_window(A, N, AN_limbs,
88832b31808SJens Wiklander mm, RR,
88932b31808SJens Wiklander welem, Wtable, temp);
89032b31808SJens Wiklander
89132b31808SJens Wiklander /*
89232b31808SJens Wiklander * Fixed window exponentiation
89332b31808SJens Wiklander */
89432b31808SJens Wiklander
89532b31808SJens Wiklander /* X = 1 (in Montgomery presentation) initially */
89632b31808SJens Wiklander memcpy(X, Wtable, AN_limbs * ciL);
89732b31808SJens Wiklander
89832b31808SJens Wiklander /* At any given time, window contains window_bits bits from E.
89932b31808SJens Wiklander * window_bits can go up to wsize. */
90032b31808SJens Wiklander size_t window_bits = 0;
90132b31808SJens Wiklander mbedtls_mpi_uint window = 0;
90232b31808SJens Wiklander
90332b31808SJens Wiklander do {
90432b31808SJens Wiklander /* Square */
90532b31808SJens Wiklander mbedtls_mpi_core_montmul(X, X, X, AN_limbs, N, AN_limbs, mm, temp);
90632b31808SJens Wiklander
90732b31808SJens Wiklander /* Move to the next bit of the exponent */
90832b31808SJens Wiklander if (E_bit_index == 0) {
90932b31808SJens Wiklander --E_limb_index;
91032b31808SJens Wiklander E_bit_index = biL - 1;
91132b31808SJens Wiklander } else {
91232b31808SJens Wiklander --E_bit_index;
91332b31808SJens Wiklander }
91432b31808SJens Wiklander /* Insert next exponent bit into window */
91532b31808SJens Wiklander ++window_bits;
91632b31808SJens Wiklander window <<= 1;
91732b31808SJens Wiklander window |= (E[E_limb_index] >> E_bit_index) & 1;
91832b31808SJens Wiklander
91932b31808SJens Wiklander /* Clear window if it's full. Also clear the window at the end,
92032b31808SJens Wiklander * when we've finished processing the exponent. */
92132b31808SJens Wiklander if (window_bits == wsize ||
92232b31808SJens Wiklander (E_bit_index == 0 && E_limb_index == 0)) {
923cb034002SJerome Forissier
924cb034002SJerome Forissier exp_mod_table_lookup_optionally_safe(Wselect, Wtable, AN_limbs, welem,
925cb034002SJerome Forissier window, E_public);
92632b31808SJens Wiklander /* Multiply X by the selected element. */
92732b31808SJens Wiklander mbedtls_mpi_core_montmul(X, X, Wselect, AN_limbs, N, AN_limbs, mm,
92832b31808SJens Wiklander temp);
92932b31808SJens Wiklander window = 0;
93032b31808SJens Wiklander window_bits = 0;
93132b31808SJens Wiklander }
93232b31808SJens Wiklander } while (!(E_bit_index == 0 && E_limb_index == 0));
93332b31808SJens Wiklander }
93432b31808SJens Wiklander
/*
 * Exponentiation X := A^E mod N for an exponent that must be treated as
 * secret: forwards every argument unchanged to
 * mbedtls_mpi_core_exp_mod_optionally_safe() with MBEDTLS_MPI_IS_SECRET.
 */
void mbedtls_mpi_core_exp_mod(mbedtls_mpi_uint *X,
                              const mbedtls_mpi_uint *A,
                              const mbedtls_mpi_uint *N, size_t AN_limbs,
                              const mbedtls_mpi_uint *E, size_t E_limbs,
                              const mbedtls_mpi_uint *RR,
                              mbedtls_mpi_uint *T)
{
    mbedtls_mpi_core_exp_mod_optionally_safe(X, A, N, AN_limbs,
                                             E, E_limbs, MBEDTLS_MPI_IS_SECRET,
                                             RR, T);
}
952cb034002SJerome Forissier
/*
 * Exponentiation X := A^E mod N for a public exponent: forwards every
 * argument unchanged to mbedtls_mpi_core_exp_mod_optionally_safe() with
 * MBEDTLS_MPI_IS_PUBLIC.
 *
 * Warning! With that setting the callee is not constant time with respect
 * to the exponent E.
 */
void mbedtls_mpi_core_exp_mod_unsafe(mbedtls_mpi_uint *X,
                                     const mbedtls_mpi_uint *A,
                                     const mbedtls_mpi_uint *N, size_t AN_limbs,
                                     const mbedtls_mpi_uint *E, size_t E_limbs,
                                     const mbedtls_mpi_uint *RR,
                                     mbedtls_mpi_uint *T)
{
    mbedtls_mpi_core_exp_mod_optionally_safe(X, A, N, AN_limbs,
                                             E, E_limbs, MBEDTLS_MPI_IS_PUBLIC,
                                             RR, T);
}
970cb034002SJerome Forissier
/*
 * Subtract the single-limb value c from the limbs-limb number A and store
 * the result in X, propagating the borrow from the least significant limb
 * upwards.
 *
 * Each limb of A is read before the corresponding limb of X is written.
 *
 * Returns the final borrow: 1 if the subtraction wrapped around in the last
 * limb, 0 otherwise. With limbs == 0, c is returned unchanged.
 */
mbedtls_mpi_uint mbedtls_mpi_core_sub_int(mbedtls_mpi_uint *X,
                                          const mbedtls_mpi_uint *A,
                                          mbedtls_mpi_uint c, /* doubles as carry */
                                          size_t limbs)
{
    mbedtls_mpi_uint borrow = c;
    size_t pos = 0;

    while (pos < limbs) {
        const mbedtls_mpi_uint minuend = A[pos];
        const mbedtls_mpi_uint diff = minuend - borrow;

        /* Unsigned wrap-around shows up as a result larger than the input. */
        borrow = (diff > minuend);
        X[pos] = diff;
        pos++;
    }

    return borrow;
}
98532b31808SJens Wiklander
mbedtls_mpi_core_check_zero_ct(const mbedtls_mpi_uint * A,size_t limbs)986b0563631STom Van Eyck mbedtls_ct_condition_t mbedtls_mpi_core_check_zero_ct(const mbedtls_mpi_uint *A,
98732b31808SJens Wiklander size_t limbs)
98832b31808SJens Wiklander {
989b0563631STom Van Eyck volatile const mbedtls_mpi_uint *force_read_A = A;
99032b31808SJens Wiklander mbedtls_mpi_uint bits = 0;
99132b31808SJens Wiklander
99232b31808SJens Wiklander for (size_t i = 0; i < limbs; i++) {
993b0563631STom Van Eyck bits |= force_read_A[i];
99432b31808SJens Wiklander }
99532b31808SJens Wiklander
996b0563631STom Van Eyck return mbedtls_ct_bool(bits);
99732b31808SJens Wiklander }
99832b31808SJens Wiklander
/*
 * Convert A to Montgomery representation: X is set to the Montgomery product
 * of A and rr modulo N.
 *
 * A, N and rr all have AN_limbs limbs. mm and the scratch buffer T are
 * passed straight to mbedtls_mpi_core_montmul().
 */
void mbedtls_mpi_core_to_mont_rep(mbedtls_mpi_uint *X,
                                  const mbedtls_mpi_uint *A,
                                  const mbedtls_mpi_uint *N,
                                  size_t AN_limbs,
                                  mbedtls_mpi_uint mm,
                                  const mbedtls_mpi_uint *rr,
                                  mbedtls_mpi_uint *T)
{
    mbedtls_mpi_core_montmul(X,
                             A, rr, AN_limbs,
                             N, AN_limbs,
                             mm, T);
}
100932b31808SJens Wiklander
/*
 * Convert A out of Montgomery representation: X is set to the Montgomery
 * product of A and the single-limb value 1 modulo N.
 *
 * A and N have AN_limbs limbs. mm and the scratch buffer T are passed
 * straight to mbedtls_mpi_core_montmul().
 */
void mbedtls_mpi_core_from_mont_rep(mbedtls_mpi_uint *X,
                                    const mbedtls_mpi_uint *A,
                                    const mbedtls_mpi_uint *N,
                                    size_t AN_limbs,
                                    mbedtls_mpi_uint mm,
                                    mbedtls_mpi_uint *T)
{
    /* 1/R in Montgomery representation is simply 1, and it fits in one limb. */
    const mbedtls_mpi_uint one = 1;

    mbedtls_mpi_core_montmul(X,
                             A, &one, 1,
                             N, AN_limbs,
                             mm, T);
}
102132b31808SJens Wiklander
102232b31808SJens Wiklander #endif /* MBEDTLS_BIGNUM_C */
1023