xref: /OK3568_Linux_fs/kernel/lib/mpi/mpi-internal.h (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun /* SPDX-License-Identifier: GPL-2.0-or-later */
2*4882a593Smuzhiyun /* mpi-internal.h  -  Internal to the Multi Precision Integers
3*4882a593Smuzhiyun  *	Copyright (C) 1994, 1996 Free Software Foundation, Inc.
4*4882a593Smuzhiyun  *	Copyright (C) 1998, 2000 Free Software Foundation, Inc.
5*4882a593Smuzhiyun  *
6*4882a593Smuzhiyun  * This file is part of GnuPG.
7*4882a593Smuzhiyun  *
8*4882a593Smuzhiyun  * Note: This code is heavily based on the GNU MP Library.
9*4882a593Smuzhiyun  *	 Actually it's the same code with only minor changes in the
10*4882a593Smuzhiyun  *	 way the data is stored; this is to support the abstraction
11*4882a593Smuzhiyun  *	 of an optional secure memory allocation which may be used
12*4882a593Smuzhiyun  *	 to avoid revealing of sensitive data due to paging etc.
13*4882a593Smuzhiyun  *	 The GNU MP Library itself is published under the LGPL;
14*4882a593Smuzhiyun  *	 however I decided to publish this code under the plain GPL.
15*4882a593Smuzhiyun  */
16*4882a593Smuzhiyun 
17*4882a593Smuzhiyun #ifndef G10_MPI_INTERNAL_H
18*4882a593Smuzhiyun #define G10_MPI_INTERNAL_H
19*4882a593Smuzhiyun 
20*4882a593Smuzhiyun #include <linux/module.h>
21*4882a593Smuzhiyun #include <linux/kernel.h>
22*4882a593Smuzhiyun #include <linux/slab.h>
23*4882a593Smuzhiyun #include <linux/string.h>
24*4882a593Smuzhiyun #include <linux/mpi.h>
25*4882a593Smuzhiyun #include <linux/errno.h>
26*4882a593Smuzhiyun 
/* Both logging names used by the MPI code expand directly to printk, so
 * their arguments are a printk format string followed by its values. */
#define log_debug printk
#define log_bug printk
29*4882a593Smuzhiyun 
30*4882a593Smuzhiyun #define assert(x) \
31*4882a593Smuzhiyun 	do { \
32*4882a593Smuzhiyun 		if (!x) \
33*4882a593Smuzhiyun 			log_bug("failed assertion\n"); \
34*4882a593Smuzhiyun 	} while (0);
35*4882a593Smuzhiyun 
/* If KARATSUBA_THRESHOLD is not already defined, define it to a
 * value which is good on most machines.
 *
 * Tested 4, 16, 32 and 64, where 16 gave the best performance when
 * checking a 768 and a 1024 bit ElGamal signature.
 * (wk 22.12.97) */
#ifndef KARATSUBA_THRESHOLD
#define KARATSUBA_THRESHOLD 16
#endif

/* The code can't handle KARATSUBA_THRESHOLD smaller than 2, so a smaller
 * value supplied from outside is replaced by 2.  */
#if KARATSUBA_THRESHOLD < 2
#undef KARATSUBA_THRESHOLD
#define KARATSUBA_THRESHOLD 2
#endif
51*4882a593Smuzhiyun 
typedef mpi_limb_t *mpi_ptr_t;	/* pointer to a limb */
/* Type used for limb counts and loop indices.  It has to stay signed:
 * MPN_COPY_DECR counts an mpi_size_t index downwards and terminates only
 * when "_i >= 0" becomes false. */
typedef int mpi_size_t;		/* (must be a signed type) */
54*4882a593Smuzhiyun 
/*
 * Call mpi_resize(A, B) when B exceeds A->alloced; do nothing otherwise.
 * Whatever mpi_resize() returns is discarded by this macro.
 * A and B each appear twice in the expansion, so pass expressions
 * without side effects.
 */
#define RESIZE_IF_NEEDED(a, b)				\
	do {						\
		if ((b) > (a)->alloced)			\
			mpi_resize((a), (b));		\
	} while (0)
60*4882a593Smuzhiyun 
/*
 * Copy N limbs from S to D, element by element, starting at index 0.
 * The local index is named _i; D, S and N are re-evaluated on every
 * iteration, so they should be free of side effects.
 */
#define MPN_COPY(d, s, n)				\
	do {						\
		mpi_size_t _i = 0;			\
		while (_i < (n)) {			\
			(d)[_i] = (s)[_i];		\
			_i++;				\
		}					\
	} while (0)
68*4882a593Smuzhiyun 
/*
 * Copy N limbs from S to D in increasing index order (index 0 first).
 * Because low indices are written first, an overlapping copy is only
 * well-behaved when D starts at or below S.
 */
#define MPN_COPY_INCR(d, s, n)				\
	do {						\
		mpi_size_t _i;				\
		for (_i = 0; ; _i++) {			\
			if (_i >= (n))			\
				break;			\
			(d)[_i] = (s)[_i];		\
		}					\
	} while (0)
75*4882a593Smuzhiyun 
76*4882a593Smuzhiyun 
/*
 * Copy N limbs from S to D in decreasing index order (index N-1 first).
 * Because high indices are written first, an overlapping copy is only
 * well-behaved when D starts at or above S.  The index is a signed
 * mpi_size_t so that the loop can run past zero and stop.
 */
#define MPN_COPY_DECR(d, s, n)				\
	do {						\
		mpi_size_t _i = (n) - 1;		\
		while (_i >= 0) {			\
			(d)[_i] = (s)[_i];		\
			_i--;				\
		}					\
	} while (0)
83*4882a593Smuzhiyun 
/*
 * Store 0 into the N limbs D[0] .. D[N-1].
 * D and N are re-evaluated on every iteration; the local index is _i.
 */
#define MPN_ZERO(d, n)					\
	do {						\
		int _i = 0;				\
		while (_i < (n)) {			\
			(d)[_i] = 0;			\
			_i++;				\
		}					\
	} while (0)
91*4882a593Smuzhiyun 
/*
 * Strip leading zero limbs: decrement N while it is positive and the
 * most significant limb D[N-1] is zero.  N must be a modifiable lvalue;
 * it ends up as 0 when every limb is zero.
 */
#define MPN_NORMALIZE(d, n)				\
	do {						\
		while ((n) > 0 && !(d)[(n) - 1])	\
			(n)--;				\
	} while (0)
100*4882a593Smuzhiyun 
/*
 * Dispatch a multiplication on SIZE: below KARATSUBA_THRESHOLD call
 * mul_n_basecase(prodp, up, vp, size), otherwise call
 * mul_n(prodp, up, vp, size, tspace).  Neither function is declared in
 * this header, so both must be visible wherever the macro is expanded.
 *
 * NOTE(review): the expansion ends in "while (0);", so "MACRO(...);"
 * yields an extra empty statement and cannot be used in an unbraced
 * if/else.  Left unchanged here: if another definition of this macro
 * exists elsewhere in the tree it must stay token-identical - confirm
 * before dropping the semicolon.
 */
#define MPN_MUL_N_RECURSE(prodp, up, vp, size, tspace) \
	do {							\
		if ((size) < KARATSUBA_THRESHOLD)		\
			mul_n_basecase(prodp, up, vp, size);	\
		else						\
			mul_n(prodp, up, vp, size, tspace);	\
	} while (0);
108*4882a593Smuzhiyun 
/* Divide the two-limb number in (NH,,NL) by D, with DI being the largest
 * limb not larger than (2**(2*BITS_PER_MPI_LIMB))/D - (2**BITS_PER_MPI_LIMB).
 * If this would yield overflow, DI should be the largest possible number
 * (i.e., only ones).  For correct operation, the most significant bit of D
 * has to be set.  Put the quotient in Q and the remainder in R.
 *
 * Steps, as written below:
 *  - estimate the quotient as the high limb of NH*DI plus NH (the low
 *    limb of that product, _ql, is not used afterwards);
 *  - multiply the estimate by D and subtract the two-limb product from
 *    (NH,,NL), leaving (_xh,,_r);
 *  - while the high limb _xh is non-zero (checked at most twice),
 *    subtract D once more and bump the estimate;
 *  - finally, if _r is still >= D, subtract D one last time.
 *
 * Q and R are assigned only at the very end, after the last read of the
 * inputs.  NH and D appear several times in the expansion, so they should
 * be expressions without side effects.  umul_ppmm() and sub_ddmmss() are
 * not defined in this header; presumably they come from longlong.h -
 * confirm.
 */
#define UDIV_QRNND_PREINV(q, r, nh, nl, d, di)				\
	do {								\
		mpi_limb_t _ql __maybe_unused;				\
		mpi_limb_t _q, _r;					\
		mpi_limb_t _xh, _xl;					\
		umul_ppmm(_q, _ql, (nh), (di));				\
		_q += (nh);	/* DI is 2**BITS_PER_MPI_LIMB too small */ \
		umul_ppmm(_xh, _xl, _q, (d));				\
		sub_ddmmss(_xh, _r, (nh), (nl), _xh, _xl);		\
		if (_xh) {						\
			sub_ddmmss(_xh, _r, _xh, _r, 0, (d));		\
			_q++;						\
			if (_xh) {					\
				sub_ddmmss(_xh, _r, _xh, _r, 0, (d));	\
				_q++;					\
			}						\
		}							\
		if (_r >= (d)) {					\
			_r -= (d);					\
			_q++;						\
		}							\
		(r) = _r;						\
		(q) = _q;						\
	} while (0)
139*4882a593Smuzhiyun 
140*4882a593Smuzhiyun 
/*-- mpiutil.c --*/
/* Limb-array management.  Only the prototypes are visible here; judging by
 * the names these allocate, free and attach a limb array of NLIMBS limbs -
 * confirm ownership rules against the definitions. */
mpi_ptr_t mpi_alloc_limb_space(unsigned nlimbs);
void mpi_free_limb_space(mpi_ptr_t a);
void mpi_assign_limb_space(MPI a, mpi_ptr_t ap, unsigned nlimbs);
145*4882a593Smuzhiyun 
/*
 * Limb-vector addition.  The two "static inline" entries are forward
 * declarations only: no body appears in this header, so each including
 * file needs the definitions from elsewhere (presumably mpi-inline.h,
 * which is included at the end of this header under __GNUC__ - confirm).
 * mpihelp_add_n() is an ordinary external function.  All three return an
 * mpi_limb_t (presumably the carry out - confirm).
 */
static inline mpi_limb_t mpihelp_add_1(mpi_ptr_t res_ptr, mpi_ptr_t s1_ptr,
			 mpi_size_t s1_size, mpi_limb_t s2_limb);
mpi_limb_t mpihelp_add_n(mpi_ptr_t res_ptr, mpi_ptr_t s1_ptr,
			 mpi_ptr_t s2_ptr, mpi_size_t size);
static inline mpi_limb_t mpihelp_add(mpi_ptr_t res_ptr, mpi_ptr_t s1_ptr, mpi_size_t s1_size,
		       mpi_ptr_t s2_ptr, mpi_size_t s2_size);

/*
 * Limb-vector subtraction; same declaration pattern as the addition
 * helpers above (two static inline forward declarations plus the external
 * mpihelp_sub_n()).  The mpi_limb_t result is presumably the borrow -
 * confirm.
 */
static inline mpi_limb_t mpihelp_sub_1(mpi_ptr_t res_ptr, mpi_ptr_t s1_ptr,
			 mpi_size_t s1_size, mpi_limb_t s2_limb);
mpi_limb_t mpihelp_sub_n(mpi_ptr_t res_ptr, mpi_ptr_t s1_ptr,
			 mpi_ptr_t s2_ptr, mpi_size_t size);
static inline mpi_limb_t mpihelp_sub(mpi_ptr_t res_ptr, mpi_ptr_t s1_ptr, mpi_size_t s1_size,
		       mpi_ptr_t s2_ptr, mpi_size_t s2_size);
159*4882a593Smuzhiyun 
/*-- mpih-cmp.c --*/
/* Compare two limb vectors that share one length SIZE.  The meaning of the
 * int result is not visible here (presumably <0 / 0 / >0 - confirm). */
int mpihelp_cmp(mpi_ptr_t op1_ptr, mpi_ptr_t op2_ptr, mpi_size_t size);
162*4882a593Smuzhiyun 
/*-- mpih-mul.c --*/

/*
 * Context passed to mpihelp_mul_karatsuba_case() and released with
 * mpihelp_release_karatsuba_ctx().  It holds two limb buffers, each paired
 * with an mpi_size_t (presumably the buffer's size in limbs - confirm),
 * and can be chained through NEXT.
 */
struct karatsuba_ctx {
	struct karatsuba_ctx *next;	/* link to another context */
	mpi_ptr_t tspace;		/* first limb buffer */
	mpi_size_t tspace_size;		/* size recorded for tspace */
	mpi_ptr_t tp;			/* second limb buffer */
	mpi_size_t tp_size;		/* size recorded for tp */
};
172*4882a593Smuzhiyun 
/* Releases a karatsuba_ctx; what exactly is freed is defined by the
 * implementation, not visible here. */
void mpihelp_release_karatsuba_ctx(struct karatsuba_ctx *ctx);

/* Single-limb multiply-accumulate / multiply-subtract over S1_SIZE limbs;
 * each returns an mpi_limb_t (presumably the carry/borrow - confirm). */
mpi_limb_t mpihelp_addmul_1(mpi_ptr_t res_ptr, mpi_ptr_t s1_ptr,
			    mpi_size_t s1_size, mpi_limb_t s2_limb);
mpi_limb_t mpihelp_submul_1(mpi_ptr_t res_ptr, mpi_ptr_t s1_ptr,
			    mpi_size_t s1_size, mpi_limb_t s2_limb);
/* General multiply of a USIZE-limb by a VSIZE-limb operand.  Returns int
 * (presumably 0 or a negative errno - confirm) and hands a limb back
 * through _RESULT. */
int mpihelp_mul(mpi_ptr_t prodp, mpi_ptr_t up, mpi_size_t usize,
		mpi_ptr_t vp, mpi_size_t vsize, mpi_limb_t *_result);
/* Squaring of a SIZE-limb operand; the second variant takes caller-supplied
 * scratch space TSPACE. */
void mpih_sqr_n_basecase(mpi_ptr_t prodp, mpi_ptr_t up, mpi_size_t size);
void mpih_sqr_n(mpi_ptr_t prodp, mpi_ptr_t up, mpi_size_t size,
		mpi_ptr_t tspace);
/* Multiply two operands that share one length SIZE. */
void mpihelp_mul_n(mpi_ptr_t prodp,
		mpi_ptr_t up, mpi_ptr_t vp, mpi_size_t size);

/* Multiply using a caller-provided karatsuba_ctx; returns int (presumably
 * an error code - confirm). */
int mpihelp_mul_karatsuba_case(mpi_ptr_t prodp,
			       mpi_ptr_t up, mpi_size_t usize,
			       mpi_ptr_t vp, mpi_size_t vsize,
			       struct karatsuba_ctx *ctx);
191*4882a593Smuzhiyun 
/*-- generic_mpih-mul1.c --*/
/* Multiply the S1_SIZE limbs at S1_PTR by the single limb S2_LIMB into
 * RES_PTR; returns an mpi_limb_t (presumably the high carry limb -
 * confirm). */
mpi_limb_t mpihelp_mul_1(mpi_ptr_t res_ptr, mpi_ptr_t s1_ptr,
			 mpi_size_t s1_size, mpi_limb_t s2_limb);
195*4882a593Smuzhiyun 
/*-- mpih-div.c --*/
/* Division helpers.  The "_1" variants take a single-limb divisor;
 * mpihelp_divrem() takes a DSIZE-limb divisor at DP.  Each returns an
 * mpi_limb_t whose exact meaning (remainder or top quotient limb) is
 * defined by the implementation - confirm there. */
mpi_limb_t mpihelp_mod_1(mpi_ptr_t dividend_ptr, mpi_size_t dividend_size,
			 mpi_limb_t divisor_limb);
mpi_limb_t mpihelp_divrem(mpi_ptr_t qp, mpi_size_t qextra_limbs,
			  mpi_ptr_t np, mpi_size_t nsize,
			  mpi_ptr_t dp, mpi_size_t dsize);
mpi_limb_t mpihelp_divmod_1(mpi_ptr_t quot_ptr,
			    mpi_ptr_t dividend_ptr, mpi_size_t dividend_size,
			    mpi_limb_t divisor_limb);
205*4882a593Smuzhiyun 
/*-- generic_mpih-[lr]shift.c --*/
/* Shift the USIZE limbs at UP left/right by CNT and store the result at
 * WP.  The returned limb presumably holds the bits shifted out, and CNT is
 * presumably a bit count below the limb width - confirm both against the
 * implementation. */
mpi_limb_t mpihelp_lshift(mpi_ptr_t wp, mpi_ptr_t up, mpi_size_t usize,
			  unsigned cnt);
mpi_limb_t mpihelp_rshift(mpi_ptr_t wp, mpi_ptr_t up, mpi_size_t usize,
			  unsigned cnt);
211*4882a593Smuzhiyun 
/* Define stuff for longlong.h.
 *
 * W_TYPE_SIZE is set to the limb width and UWtype to the limb type itself.
 * With a GNU-compatible compiler the remaining types are requested by
 * machine mode (QI, SI, DI) via __attribute__((mode(...))).  The fallback
 * branch uses plain C types and defines neither DItype nor UDItype.
 */
#define W_TYPE_SIZE BITS_PER_MPI_LIMB
typedef mpi_limb_t UWtype;
typedef unsigned int UHWtype;
#if defined(__GNUC__)
typedef unsigned int UQItype __attribute__ ((mode(QI)));
typedef int SItype __attribute__ ((mode(SI)));
typedef unsigned int USItype __attribute__ ((mode(SI)));
typedef int DItype __attribute__ ((mode(DI)));
typedef unsigned int UDItype __attribute__ ((mode(DI)));
#else
typedef unsigned char UQItype;
typedef long SItype;
typedef unsigned long USItype;
#endif
227*4882a593Smuzhiyun 
228*4882a593Smuzhiyun #ifdef __GNUC__
229*4882a593Smuzhiyun #include "mpi-inline.h"
230*4882a593Smuzhiyun #endif
231*4882a593Smuzhiyun 
232*4882a593Smuzhiyun #endif /*G10_MPI_INTERNAL_H */
233