xref: /OK3568_Linux_fs/kernel/lib/reed_solomon/decode_rs.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun  * Generic Reed Solomon encoder / decoder library
4*4882a593Smuzhiyun  *
5*4882a593Smuzhiyun  * Copyright 2002, Phil Karn, KA9Q
6*4882a593Smuzhiyun  * May be used under the terms of the GNU General Public License (GPL)
7*4882a593Smuzhiyun  *
8*4882a593Smuzhiyun  * Adaption to the kernel by Thomas Gleixner (tglx@linutronix.de)
9*4882a593Smuzhiyun  *
10*4882a593Smuzhiyun  * Generic data width independent code which is included by the wrappers.
11*4882a593Smuzhiyun  */
12*4882a593Smuzhiyun {
	/*
	 * Reed-Solomon decoder body.
	 *
	 * This fragment carries no signature of its own. The names rsc, data,
	 * par, len, s, no_eras, eras_pos, invmsk and corr are used below but
	 * not declared here; presumably they are the parameters of the wrapper
	 * function that includes this file (TODO confirm against the wrappers).
	 *
	 * Steps performed:
	 *  1. Check len against the codec geometry (BUG_ON on violation).
	 *  2. Obtain the syndrome: either use the caller supplied s (index
	 *     form, read only) or compute it from data[0..len-1] and
	 *     par[0..nroots-1] into the syn buffer. Return 0 if it is zero.
	 *  3. Seed lambda with the erasure locator built from
	 *     eras_pos[0..no_eras-1] when no_eras > 0.
	 *  4. Run Berlekamp-Massey, then a Chien search for the roots.
	 *  5. Compute omega and the error values, then verify that the
	 *     syndrome of the computed error pattern equals s.
	 *  6. Either report the corrections through corr[]/eras_pos[] (when
	 *     both are non-NULL; eras_pos is overwritten) or, failing that,
	 *     XOR them into data[]/par[] when both of those are non-NULL.
	 *
	 * Return: 0 when the syndrome is zero, -EBADMSG when the word is
	 * found to be uncorrectable, otherwise num_corrected, the number of
	 * located positions for which a correction value was computed.
	 */
13*4882a593Smuzhiyun 	struct rs_codec *rs = rsc->codec;
14*4882a593Smuzhiyun 	int deg_lambda, el, deg_omega;
15*4882a593Smuzhiyun 	int i, j, r, k, pad;
16*4882a593Smuzhiyun 	int nn = rs->nn;
17*4882a593Smuzhiyun 	int nroots = rs->nroots;
18*4882a593Smuzhiyun 	int fcr = rs->fcr;
19*4882a593Smuzhiyun 	int prim = rs->prim;
20*4882a593Smuzhiyun 	int iprim = rs->iprim;
21*4882a593Smuzhiyun 	uint16_t *alpha_to = rs->alpha_to;
22*4882a593Smuzhiyun 	uint16_t *index_of = rs->index_of;
23*4882a593Smuzhiyun 	uint16_t u, q, tmp, num1, num2, den, discr_r, syn_error;
24*4882a593Smuzhiyun 	int count = 0;
25*4882a593Smuzhiyun 	int num_corrected;
	/* nn doubles as the mask applied to every input symbol below */
26*4882a593Smuzhiyun 	uint16_t msk = (uint16_t) rs->nn;
27*4882a593Smuzhiyun 
28*4882a593Smuzhiyun 	/*
29*4882a593Smuzhiyun 	 * The decoder buffers are in the rs control struct. They are
30*4882a593Smuzhiyun 	 * arrays sized [nroots + 1]
31*4882a593Smuzhiyun 	 */
32*4882a593Smuzhiyun 	uint16_t *lambda = rsc->buffers + RS_DECODE_LAMBDA * (nroots + 1);
33*4882a593Smuzhiyun 	uint16_t *syn = rsc->buffers + RS_DECODE_SYN * (nroots + 1);
34*4882a593Smuzhiyun 	uint16_t *b = rsc->buffers + RS_DECODE_B * (nroots + 1);
35*4882a593Smuzhiyun 	uint16_t *t = rsc->buffers + RS_DECODE_T * (nroots + 1);
36*4882a593Smuzhiyun 	uint16_t *omega = rsc->buffers + RS_DECODE_OMEGA * (nroots + 1);
37*4882a593Smuzhiyun 	uint16_t *root = rsc->buffers + RS_DECODE_ROOT * (nroots + 1);
38*4882a593Smuzhiyun 	uint16_t *reg = rsc->buffers + RS_DECODE_REG * (nroots + 1);
39*4882a593Smuzhiyun 	uint16_t *loc = rsc->buffers + RS_DECODE_LOC * (nroots + 1);
40*4882a593Smuzhiyun 
41*4882a593Smuzhiyun 	/* Check length parameter for validity */
	/*
	 * pad is how many symbols len falls short of a full nn - nroots data
	 * block. The check below is equivalent to 0 < len <= nn - nroots.
	 */
42*4882a593Smuzhiyun 	pad = nn - nroots - len;
43*4882a593Smuzhiyun 	BUG_ON(pad < 0 || pad >= nn - nroots);
44*4882a593Smuzhiyun 
45*4882a593Smuzhiyun 	/* Does the caller provide the syndrome ? */
46*4882a593Smuzhiyun 	if (s != NULL) {
47*4882a593Smuzhiyun 		for (i = 0; i < nroots; i++) {
48*4882a593Smuzhiyun 			/* The syndrome is in index form,
49*4882a593Smuzhiyun 			 * so nn represents zero
50*4882a593Smuzhiyun 			 */
51*4882a593Smuzhiyun 			if (s[i] != nn)
52*4882a593Smuzhiyun 				goto decode;
53*4882a593Smuzhiyun 		}
54*4882a593Smuzhiyun 
55*4882a593Smuzhiyun 		/* syndrome is zero, no errors to correct  */
56*4882a593Smuzhiyun 		return 0;
57*4882a593Smuzhiyun 	}
58*4882a593Smuzhiyun 
59*4882a593Smuzhiyun 	/* form the syndromes; i.e., evaluate data(x) at roots of
60*4882a593Smuzhiyun 	 * g(x) */
	/* Every accumulator starts from the first (inverted, masked) symbol */
61*4882a593Smuzhiyun 	for (i = 0; i < nroots; i++)
62*4882a593Smuzhiyun 		syn[i] = (((uint16_t) data[0]) ^ invmsk) & msk;
63*4882a593Smuzhiyun 
	/*
	 * Fold in the remaining data symbols: each step multiplies syn[i] by
	 * alpha^((fcr + i) * prim) and adds the next symbol. A zero syn[i] is
	 * special-cased so that index_of[] is only applied to non-zero values.
	 */
64*4882a593Smuzhiyun 	for (j = 1; j < len; j++) {
65*4882a593Smuzhiyun 		for (i = 0; i < nroots; i++) {
66*4882a593Smuzhiyun 			if (syn[i] == 0) {
67*4882a593Smuzhiyun 				syn[i] = (((uint16_t) data[j]) ^
68*4882a593Smuzhiyun 					  invmsk) & msk;
69*4882a593Smuzhiyun 			} else {
70*4882a593Smuzhiyun 				syn[i] = ((((uint16_t) data[j]) ^
71*4882a593Smuzhiyun 					   invmsk) & msk) ^
72*4882a593Smuzhiyun 					alpha_to[rs_modnn(rs, index_of[syn[i]] +
73*4882a593Smuzhiyun 						       (fcr + i) * prim)];
74*4882a593Smuzhiyun 			}
75*4882a593Smuzhiyun 		}
76*4882a593Smuzhiyun 	}
77*4882a593Smuzhiyun 
	/* Same recurrence over the parity symbols; invmsk is not applied here */
78*4882a593Smuzhiyun 	for (j = 0; j < nroots; j++) {
79*4882a593Smuzhiyun 		for (i = 0; i < nroots; i++) {
80*4882a593Smuzhiyun 			if (syn[i] == 0) {
81*4882a593Smuzhiyun 				syn[i] = ((uint16_t) par[j]) & msk;
82*4882a593Smuzhiyun 			} else {
83*4882a593Smuzhiyun 				syn[i] = (((uint16_t) par[j]) & msk) ^
84*4882a593Smuzhiyun 					alpha_to[rs_modnn(rs, index_of[syn[i]] +
85*4882a593Smuzhiyun 						       (fcr+i)*prim)];
86*4882a593Smuzhiyun 			}
87*4882a593Smuzhiyun 		}
88*4882a593Smuzhiyun 	}
	/* From here on s aliases the internal syn buffer */
89*4882a593Smuzhiyun 	s = syn;
90*4882a593Smuzhiyun 
91*4882a593Smuzhiyun 	/* Convert syndromes to index form, checking for nonzero condition */
92*4882a593Smuzhiyun 	syn_error = 0;
93*4882a593Smuzhiyun 	for (i = 0; i < nroots; i++) {
94*4882a593Smuzhiyun 		syn_error |= s[i];
95*4882a593Smuzhiyun 		s[i] = index_of[s[i]];
96*4882a593Smuzhiyun 	}
97*4882a593Smuzhiyun 
98*4882a593Smuzhiyun 	if (!syn_error) {
99*4882a593Smuzhiyun 		/* if syndrome is zero, data[] is a codeword and there are no
100*4882a593Smuzhiyun 		 * errors to correct. So return data[] unmodified
101*4882a593Smuzhiyun 		 */
102*4882a593Smuzhiyun 		return 0;
103*4882a593Smuzhiyun 	}
104*4882a593Smuzhiyun 
105*4882a593Smuzhiyun  decode:
	/* lambda(x) = 1 in poly form: constant term 1, all other terms 0 */
106*4882a593Smuzhiyun 	memset(&lambda[1], 0, nroots * sizeof(lambda[0]));
107*4882a593Smuzhiyun 	lambda[0] = 1;
108*4882a593Smuzhiyun 
109*4882a593Smuzhiyun 	if (no_eras > 0) {
110*4882a593Smuzhiyun 		/* Init lambda to be the erasure locator polynomial */
		/* eras_pos[] is offset by pad before being turned into a root */
111*4882a593Smuzhiyun 		lambda[1] = alpha_to[rs_modnn(rs,
112*4882a593Smuzhiyun 					prim * (nn - 1 - (eras_pos[0] + pad)))];
113*4882a593Smuzhiyun 		for (i = 1; i < no_eras; i++) {
114*4882a593Smuzhiyun 			u = rs_modnn(rs, prim * (nn - 1 - (eras_pos[i] + pad)));
			/*
			 * Walk j downwards so that lambda[j - 1] is still the
			 * value from before this erasure was folded in.
			 */
115*4882a593Smuzhiyun 			for (j = i + 1; j > 0; j--) {
116*4882a593Smuzhiyun 				tmp = index_of[lambda[j - 1]];
117*4882a593Smuzhiyun 				if (tmp != nn) {
118*4882a593Smuzhiyun 					lambda[j] ^=
119*4882a593Smuzhiyun 						alpha_to[rs_modnn(rs, u + tmp)];
120*4882a593Smuzhiyun 				}
121*4882a593Smuzhiyun 			}
122*4882a593Smuzhiyun 		}
123*4882a593Smuzhiyun 	}
124*4882a593Smuzhiyun 
	/* b starts as lambda converted to index form */
125*4882a593Smuzhiyun 	for (i = 0; i < nroots + 1; i++)
126*4882a593Smuzhiyun 		b[i] = index_of[lambda[i]];
127*4882a593Smuzhiyun 
128*4882a593Smuzhiyun 	/*
129*4882a593Smuzhiyun 	 * Begin Berlekamp-Massey algorithm to determine error+erasure
130*4882a593Smuzhiyun 	 * locator polynomial
131*4882a593Smuzhiyun 	 */
	/* lambda and t are kept in poly form here; b, s and discr_r in index form */
132*4882a593Smuzhiyun 	r = no_eras;
133*4882a593Smuzhiyun 	el = no_eras;
134*4882a593Smuzhiyun 	while (++r <= nroots) {	/* r is the step number */
135*4882a593Smuzhiyun 		/* Compute discrepancy at the r-th step in poly-form */
136*4882a593Smuzhiyun 		discr_r = 0;
137*4882a593Smuzhiyun 		for (i = 0; i < r; i++) {
138*4882a593Smuzhiyun 			if ((lambda[i] != 0) && (s[r - i - 1] != nn)) {
139*4882a593Smuzhiyun 				discr_r ^=
140*4882a593Smuzhiyun 					alpha_to[rs_modnn(rs,
141*4882a593Smuzhiyun 							  index_of[lambda[i]] +
142*4882a593Smuzhiyun 							  s[r - i - 1])];
143*4882a593Smuzhiyun 			}
144*4882a593Smuzhiyun 		}
145*4882a593Smuzhiyun 		discr_r = index_of[discr_r];	/* Index form */
146*4882a593Smuzhiyun 		if (discr_r == nn) {
147*4882a593Smuzhiyun 			/* 2 lines below: B(x) <-- x*B(x) */
148*4882a593Smuzhiyun 			memmove (&b[1], b, nroots * sizeof (b[0]));
149*4882a593Smuzhiyun 			b[0] = nn;
150*4882a593Smuzhiyun 		} else {
151*4882a593Smuzhiyun 			/* Statements below: T(x) <-- lambda(x)-discr_r*x*b(x) */
152*4882a593Smuzhiyun 			t[0] = lambda[0];
153*4882a593Smuzhiyun 			for (i = 0; i < nroots; i++) {
154*4882a593Smuzhiyun 				if (b[i] != nn) {
155*4882a593Smuzhiyun 					t[i + 1] = lambda[i + 1] ^
156*4882a593Smuzhiyun 						alpha_to[rs_modnn(rs, discr_r +
157*4882a593Smuzhiyun 								  b[i])];
158*4882a593Smuzhiyun 				} else
159*4882a593Smuzhiyun 					t[i + 1] = lambda[i + 1];
160*4882a593Smuzhiyun 			}
161*4882a593Smuzhiyun 			if (2 * el <= r + no_eras - 1) {
162*4882a593Smuzhiyun 				el = r + no_eras - el;
163*4882a593Smuzhiyun 				/*
164*4882a593Smuzhiyun 				 * Loop below: B(x) <-- inv(discr_r) *
165*4882a593Smuzhiyun 				 * lambda(x)
166*4882a593Smuzhiyun 				 */
167*4882a593Smuzhiyun 				for (i = 0; i <= nroots; i++) {
168*4882a593Smuzhiyun 					b[i] = (lambda[i] == 0) ? nn :
169*4882a593Smuzhiyun 						rs_modnn(rs, index_of[lambda[i]]
170*4882a593Smuzhiyun 							 - discr_r + nn);
171*4882a593Smuzhiyun 				}
172*4882a593Smuzhiyun 			} else {
173*4882a593Smuzhiyun 				/* 2 lines below: B(x) <-- x*B(x) */
174*4882a593Smuzhiyun 				memmove(&b[1], b, nroots * sizeof(b[0]));
175*4882a593Smuzhiyun 				b[0] = nn;
176*4882a593Smuzhiyun 			}
			/* lambda is replaced only after b was derived from the old lambda */
177*4882a593Smuzhiyun 			memcpy(lambda, t, (nroots + 1) * sizeof(t[0]));
178*4882a593Smuzhiyun 		}
179*4882a593Smuzhiyun 	}
180*4882a593Smuzhiyun 
181*4882a593Smuzhiyun 	/* Convert lambda to index form and compute deg(lambda(x)) */
182*4882a593Smuzhiyun 	deg_lambda = 0;
183*4882a593Smuzhiyun 	for (i = 0; i < nroots + 1; i++) {
184*4882a593Smuzhiyun 		lambda[i] = index_of[lambda[i]];
185*4882a593Smuzhiyun 		if (lambda[i] != nn)
186*4882a593Smuzhiyun 			deg_lambda = i;
187*4882a593Smuzhiyun 	}
188*4882a593Smuzhiyun 
189*4882a593Smuzhiyun 	if (deg_lambda == 0) {
190*4882a593Smuzhiyun 		/*
191*4882a593Smuzhiyun 		 * deg(lambda) is zero even though the syndrome is non-zero
192*4882a593Smuzhiyun 		 * => uncorrectable error detected
193*4882a593Smuzhiyun 		 */
194*4882a593Smuzhiyun 		return -EBADMSG;
195*4882a593Smuzhiyun 	}
196*4882a593Smuzhiyun 
197*4882a593Smuzhiyun 	/* Find roots of error+erasure locator polynomial by Chien search */
	/*
	 * reg[j] holds the running exponent of the j-th term and is advanced
	 * by j on every step. i is the candidate root (1..nn) and k, stepped
	 * by iprim modulo nn, is the location number recorded for it.
	 */
198*4882a593Smuzhiyun 	memcpy(&reg[1], &lambda[1], nroots * sizeof(reg[0]));
199*4882a593Smuzhiyun 	count = 0;		/* Number of roots of lambda(x) */
200*4882a593Smuzhiyun 	for (i = 1, k = iprim - 1; i <= nn; i++, k = rs_modnn(rs, k + iprim)) {
201*4882a593Smuzhiyun 		q = 1;		/* lambda[0] is always 0 */
202*4882a593Smuzhiyun 		for (j = deg_lambda; j > 0; j--) {
203*4882a593Smuzhiyun 			if (reg[j] != nn) {
204*4882a593Smuzhiyun 				reg[j] = rs_modnn(rs, reg[j] + j);
205*4882a593Smuzhiyun 				q ^= alpha_to[reg[j]];
206*4882a593Smuzhiyun 			}
207*4882a593Smuzhiyun 		}
208*4882a593Smuzhiyun 		if (q != 0)
209*4882a593Smuzhiyun 			continue;	/* Not a root */
210*4882a593Smuzhiyun 
		/* Locations below pad are not backed by any symbol in data[] */
211*4882a593Smuzhiyun 		if (k < pad) {
212*4882a593Smuzhiyun 			/* Impossible error location. Uncorrectable error. */
213*4882a593Smuzhiyun 			return -EBADMSG;
214*4882a593Smuzhiyun 		}
215*4882a593Smuzhiyun 
216*4882a593Smuzhiyun 		/* store root (index-form) and error location number */
217*4882a593Smuzhiyun 		root[count] = i;
218*4882a593Smuzhiyun 		loc[count] = k;
219*4882a593Smuzhiyun 		/* If we've already found max possible roots,
220*4882a593Smuzhiyun 		 * abort the search to save time
221*4882a593Smuzhiyun 		 */
222*4882a593Smuzhiyun 		if (++count == deg_lambda)
223*4882a593Smuzhiyun 			break;
224*4882a593Smuzhiyun 	}
225*4882a593Smuzhiyun 	if (deg_lambda != count) {
226*4882a593Smuzhiyun 		/*
227*4882a593Smuzhiyun 		 * deg(lambda) unequal to number of roots => uncorrectable
228*4882a593Smuzhiyun 		 * error detected
229*4882a593Smuzhiyun 		 */
230*4882a593Smuzhiyun 		return -EBADMSG;
231*4882a593Smuzhiyun 	}
232*4882a593Smuzhiyun 	/*
233*4882a593Smuzhiyun 	 * Compute err+eras evaluator poly omega(x) = s(x)*lambda(x) (modulo
234*4882a593Smuzhiyun 	 * x**nroots). in index form. Also find deg(omega).
235*4882a593Smuzhiyun 	 */
236*4882a593Smuzhiyun 	deg_omega = deg_lambda - 1;
237*4882a593Smuzhiyun 	for (i = 0; i <= deg_omega; i++) {
238*4882a593Smuzhiyun 		tmp = 0;
239*4882a593Smuzhiyun 		for (j = i; j >= 0; j--) {
240*4882a593Smuzhiyun 			if ((s[i - j] != nn) && (lambda[j] != nn))
241*4882a593Smuzhiyun 				tmp ^=
242*4882a593Smuzhiyun 				    alpha_to[rs_modnn(rs, s[i - j] + lambda[j])];
243*4882a593Smuzhiyun 		}
244*4882a593Smuzhiyun 		omega[i] = index_of[tmp];
245*4882a593Smuzhiyun 	}
246*4882a593Smuzhiyun 
247*4882a593Smuzhiyun 	/*
248*4882a593Smuzhiyun 	 * Compute error values in poly-form. num1 = omega(inv(X(l))), num2 =
249*4882a593Smuzhiyun 	 * inv(X(l))**(fcr-1) and den = lambda_pr(inv(X(l))) all in poly-form
250*4882a593Smuzhiyun 	 * Note: we reuse the buffer for b to store the correction pattern
251*4882a593Smuzhiyun 	 */
252*4882a593Smuzhiyun 	num_corrected = 0;
253*4882a593Smuzhiyun 	for (j = count - 1; j >= 0; j--) {
254*4882a593Smuzhiyun 		num1 = 0;
255*4882a593Smuzhiyun 		for (i = deg_omega; i >= 0; i--) {
256*4882a593Smuzhiyun 			if (omega[i] != nn)
257*4882a593Smuzhiyun 				num1 ^= alpha_to[rs_modnn(rs, omega[i] +
258*4882a593Smuzhiyun 							i * root[j])];
259*4882a593Smuzhiyun 		}
260*4882a593Smuzhiyun 
261*4882a593Smuzhiyun 		if (num1 == 0) {
262*4882a593Smuzhiyun 			/* Nothing to correct at this position */
263*4882a593Smuzhiyun 			b[j] = 0;
264*4882a593Smuzhiyun 			continue;
265*4882a593Smuzhiyun 		}
266*4882a593Smuzhiyun 
267*4882a593Smuzhiyun 		num2 = alpha_to[rs_modnn(rs, root[j] * (fcr - 1) + nn)];
268*4882a593Smuzhiyun 		den = 0;
269*4882a593Smuzhiyun 
270*4882a593Smuzhiyun 		/* lambda[i+1] for i even is the formal derivative
271*4882a593Smuzhiyun 		 * lambda_pr of lambda[i] */
		/* "& ~1" rounds the start index down to an even value */
272*4882a593Smuzhiyun 		for (i = min(deg_lambda, nroots - 1) & ~1; i >= 0; i -= 2) {
273*4882a593Smuzhiyun 			if (lambda[i + 1] != nn) {
274*4882a593Smuzhiyun 				den ^= alpha_to[rs_modnn(rs, lambda[i + 1] +
275*4882a593Smuzhiyun 						       i * root[j])];
276*4882a593Smuzhiyun 			}
277*4882a593Smuzhiyun 		}
278*4882a593Smuzhiyun 
		/* Correction value = num1 * num2 / den, evaluated in index form */
279*4882a593Smuzhiyun 		b[j] = alpha_to[rs_modnn(rs, index_of[num1] +
280*4882a593Smuzhiyun 					       index_of[num2] +
281*4882a593Smuzhiyun 					       nn - index_of[den])];
282*4882a593Smuzhiyun 		num_corrected++;
283*4882a593Smuzhiyun 	}
284*4882a593Smuzhiyun 
285*4882a593Smuzhiyun 	/*
286*4882a593Smuzhiyun 	 * We compute the syndrome of the 'error' and check that it matches
287*4882a593Smuzhiyun 	 * the syndrome of the received word
288*4882a593Smuzhiyun 	 */
289*4882a593Smuzhiyun 	for (i = 0; i < nroots; i++) {
290*4882a593Smuzhiyun 		tmp = 0;
291*4882a593Smuzhiyun 		for (j = 0; j < count; j++) {
292*4882a593Smuzhiyun 			if (b[j] == 0)
293*4882a593Smuzhiyun 				continue;
294*4882a593Smuzhiyun 
295*4882a593Smuzhiyun 			k = (fcr + i) * prim * (nn-loc[j]-1);
296*4882a593Smuzhiyun 			tmp ^= alpha_to[rs_modnn(rs, index_of[b[j]] + k)];
297*4882a593Smuzhiyun 		}
298*4882a593Smuzhiyun 
		/* s[] is in index form, so map it back to poly form to compare */
299*4882a593Smuzhiyun 		if (tmp != alpha_to[s[i]])
300*4882a593Smuzhiyun 			return -EBADMSG;
301*4882a593Smuzhiyun 	}
302*4882a593Smuzhiyun 
303*4882a593Smuzhiyun 	/*
304*4882a593Smuzhiyun 	 * Store the error correction pattern, if a
305*4882a593Smuzhiyun 	 * correction buffer is available
306*4882a593Smuzhiyun 	 */
307*4882a593Smuzhiyun 	if (corr && eras_pos) {
		/* Only non-zero corrections are reported; positions drop the pad offset */
308*4882a593Smuzhiyun 		j = 0;
309*4882a593Smuzhiyun 		for (i = 0; i < count; i++) {
310*4882a593Smuzhiyun 			if (b[i]) {
311*4882a593Smuzhiyun 				corr[j] = b[i];
312*4882a593Smuzhiyun 				eras_pos[j++] = loc[i] - pad;
313*4882a593Smuzhiyun 			}
314*4882a593Smuzhiyun 		}
315*4882a593Smuzhiyun 	} else if (data && par) {
316*4882a593Smuzhiyun 		/* Apply error to data and parity */
		/* Locations below nn - nroots index data[], the rest index par[] */
317*4882a593Smuzhiyun 		for (i = 0; i < count; i++) {
318*4882a593Smuzhiyun 			if (loc[i] < (nn - nroots))
319*4882a593Smuzhiyun 				data[loc[i] - pad] ^= b[i];
320*4882a593Smuzhiyun 			else
321*4882a593Smuzhiyun 				par[loc[i] - pad - len] ^= b[i];
322*4882a593Smuzhiyun 		}
323*4882a593Smuzhiyun 	}
324*4882a593Smuzhiyun 
325*4882a593Smuzhiyun 	return  num_corrected;
326*4882a593Smuzhiyun }
327