1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0 2*4882a593Smuzhiyun /* 3*4882a593Smuzhiyun * Generic Reed Solomon encoder / decoder library 4*4882a593Smuzhiyun * 5*4882a593Smuzhiyun * Copyright 2002, Phil Karn, KA9Q 6*4882a593Smuzhiyun * May be used under the terms of the GNU General Public License (GPL) 7*4882a593Smuzhiyun * 8*4882a593Smuzhiyun * Adaption to the kernel by Thomas Gleixner (tglx@linutronix.de) 9*4882a593Smuzhiyun * 10*4882a593Smuzhiyun * Generic data width independent code which is included by the wrappers. 11*4882a593Smuzhiyun */ 12*4882a593Smuzhiyun { 13*4882a593Smuzhiyun struct rs_codec *rs = rsc->codec; 14*4882a593Smuzhiyun int deg_lambda, el, deg_omega; 15*4882a593Smuzhiyun int i, j, r, k, pad; 16*4882a593Smuzhiyun int nn = rs->nn; 17*4882a593Smuzhiyun int nroots = rs->nroots; 18*4882a593Smuzhiyun int fcr = rs->fcr; 19*4882a593Smuzhiyun int prim = rs->prim; 20*4882a593Smuzhiyun int iprim = rs->iprim; 21*4882a593Smuzhiyun uint16_t *alpha_to = rs->alpha_to; 22*4882a593Smuzhiyun uint16_t *index_of = rs->index_of; 23*4882a593Smuzhiyun uint16_t u, q, tmp, num1, num2, den, discr_r, syn_error; 24*4882a593Smuzhiyun int count = 0; 25*4882a593Smuzhiyun int num_corrected; 26*4882a593Smuzhiyun uint16_t msk = (uint16_t) rs->nn; 27*4882a593Smuzhiyun 28*4882a593Smuzhiyun /* 29*4882a593Smuzhiyun * The decoder buffers are in the rs control struct. They are 30*4882a593Smuzhiyun * arrays sized [nroots + 1] 31*4882a593Smuzhiyun */ 32*4882a593Smuzhiyun uint16_t *lambda = rsc->buffers + RS_DECODE_LAMBDA * (nroots + 1); 33*4882a593Smuzhiyun uint16_t *syn = rsc->buffers + RS_DECODE_SYN * (nroots + 1); 34*4882a593Smuzhiyun uint16_t *b = rsc->buffers + RS_DECODE_B * (nroots + 1); 35*4882a593Smuzhiyun uint16_t *t = rsc->buffers + RS_DECODE_T * (nroots + 1); 36*4882a593Smuzhiyun uint16_t *omega = rsc->buffers + RS_DECODE_OMEGA * (nroots + 1); 37*4882a593Smuzhiyun uint16_t *root = rsc->buffers + RS_DECODE_ROOT * (nroots + 1); 38*4882a593Smuzhiyun uint16_t *reg = rsc->buffers + RS_DECODE_REG * (nroots + 1); 39*4882a593Smuzhiyun uint16_t *loc = rsc->buffers + RS_DECODE_LOC * (nroots + 1); 40*4882a593Smuzhiyun 41*4882a593Smuzhiyun /* Check length parameter for validity */ 42*4882a593Smuzhiyun pad = nn - nroots - len; 43*4882a593Smuzhiyun BUG_ON(pad < 0 || pad >= nn - nroots); 44*4882a593Smuzhiyun 45*4882a593Smuzhiyun /* Does the caller provide the syndrome ? */ 46*4882a593Smuzhiyun if (s != NULL) { 47*4882a593Smuzhiyun for (i = 0; i < nroots; i++) { 48*4882a593Smuzhiyun /* The syndrome is in index form, 49*4882a593Smuzhiyun * so nn represents zero 50*4882a593Smuzhiyun */ 51*4882a593Smuzhiyun if (s[i] != nn) 52*4882a593Smuzhiyun goto decode; 53*4882a593Smuzhiyun } 54*4882a593Smuzhiyun 55*4882a593Smuzhiyun /* syndrome is zero, no errors to correct */ 56*4882a593Smuzhiyun return 0; 57*4882a593Smuzhiyun } 58*4882a593Smuzhiyun 59*4882a593Smuzhiyun /* form the syndromes; i.e., evaluate data(x) at roots of 60*4882a593Smuzhiyun * g(x) */ 61*4882a593Smuzhiyun for (i = 0; i < nroots; i++) 62*4882a593Smuzhiyun syn[i] = (((uint16_t) data[0]) ^ invmsk) & msk; 63*4882a593Smuzhiyun 64*4882a593Smuzhiyun for (j = 1; j < len; j++) { 65*4882a593Smuzhiyun for (i = 0; i < nroots; i++) { 66*4882a593Smuzhiyun if (syn[i] == 0) { 67*4882a593Smuzhiyun syn[i] = (((uint16_t) data[j]) ^ 68*4882a593Smuzhiyun invmsk) & msk; 69*4882a593Smuzhiyun } else { 70*4882a593Smuzhiyun syn[i] = ((((uint16_t) data[j]) ^ 71*4882a593Smuzhiyun invmsk) & msk) ^ 72*4882a593Smuzhiyun alpha_to[rs_modnn(rs, index_of[syn[i]] + 73*4882a593Smuzhiyun (fcr + i) * prim)]; 74*4882a593Smuzhiyun } 75*4882a593Smuzhiyun } 76*4882a593Smuzhiyun } 77*4882a593Smuzhiyun 78*4882a593Smuzhiyun for (j = 0; j < nroots; j++) { 79*4882a593Smuzhiyun for (i = 0; i < nroots; i++) { 80*4882a593Smuzhiyun if (syn[i] == 0) { 81*4882a593Smuzhiyun syn[i] = ((uint16_t) par[j]) & msk; 82*4882a593Smuzhiyun } else { 83*4882a593Smuzhiyun syn[i] = (((uint16_t) par[j]) & msk) ^ 84*4882a593Smuzhiyun alpha_to[rs_modnn(rs, index_of[syn[i]] + 85*4882a593Smuzhiyun (fcr+i)*prim)]; 86*4882a593Smuzhiyun } 87*4882a593Smuzhiyun } 88*4882a593Smuzhiyun } 89*4882a593Smuzhiyun s = syn; 90*4882a593Smuzhiyun 91*4882a593Smuzhiyun /* Convert syndromes to index form, checking for nonzero condition */ 92*4882a593Smuzhiyun syn_error = 0; 93*4882a593Smuzhiyun for (i = 0; i < nroots; i++) { 94*4882a593Smuzhiyun syn_error |= s[i]; 95*4882a593Smuzhiyun s[i] = index_of[s[i]]; 96*4882a593Smuzhiyun } 97*4882a593Smuzhiyun 98*4882a593Smuzhiyun if (!syn_error) { 99*4882a593Smuzhiyun /* if syndrome is zero, data[] is a codeword and there are no 100*4882a593Smuzhiyun * errors to correct. So return data[] unmodified 101*4882a593Smuzhiyun */ 102*4882a593Smuzhiyun return 0; 103*4882a593Smuzhiyun } 104*4882a593Smuzhiyun 105*4882a593Smuzhiyun decode: 106*4882a593Smuzhiyun memset(&lambda[1], 0, nroots * sizeof(lambda[0])); 107*4882a593Smuzhiyun lambda[0] = 1; 108*4882a593Smuzhiyun 109*4882a593Smuzhiyun if (no_eras > 0) { 110*4882a593Smuzhiyun /* Init lambda to be the erasure locator polynomial */ 111*4882a593Smuzhiyun lambda[1] = alpha_to[rs_modnn(rs, 112*4882a593Smuzhiyun prim * (nn - 1 - (eras_pos[0] + pad)))]; 113*4882a593Smuzhiyun for (i = 1; i < no_eras; i++) { 114*4882a593Smuzhiyun u = rs_modnn(rs, prim * (nn - 1 - (eras_pos[i] + pad))); 115*4882a593Smuzhiyun for (j = i + 1; j > 0; j--) { 116*4882a593Smuzhiyun tmp = index_of[lambda[j - 1]]; 117*4882a593Smuzhiyun if (tmp != nn) { 118*4882a593Smuzhiyun lambda[j] ^= 119*4882a593Smuzhiyun alpha_to[rs_modnn(rs, u + tmp)]; 120*4882a593Smuzhiyun } 121*4882a593Smuzhiyun } 122*4882a593Smuzhiyun } 123*4882a593Smuzhiyun } 124*4882a593Smuzhiyun 125*4882a593Smuzhiyun for (i = 0; i < nroots + 1; i++) 126*4882a593Smuzhiyun b[i] = index_of[lambda[i]]; 127*4882a593Smuzhiyun 128*4882a593Smuzhiyun /* 129*4882a593Smuzhiyun * Begin Berlekamp-Massey algorithm to determine error+erasure 130*4882a593Smuzhiyun * locator polynomial 131*4882a593Smuzhiyun */ 132*4882a593Smuzhiyun r = no_eras; 133*4882a593Smuzhiyun el = no_eras; 134*4882a593Smuzhiyun while (++r <= nroots) { /* r is the step number */ 135*4882a593Smuzhiyun /* Compute discrepancy at the r-th step in poly-form */ 136*4882a593Smuzhiyun discr_r = 0; 137*4882a593Smuzhiyun for (i = 0; i < r; i++) { 138*4882a593Smuzhiyun if ((lambda[i] != 0) && (s[r - i - 1] != nn)) { 139*4882a593Smuzhiyun discr_r ^= 140*4882a593Smuzhiyun alpha_to[rs_modnn(rs, 141*4882a593Smuzhiyun index_of[lambda[i]] + 142*4882a593Smuzhiyun s[r - i - 1])]; 143*4882a593Smuzhiyun } 144*4882a593Smuzhiyun } 145*4882a593Smuzhiyun discr_r = index_of[discr_r]; /* Index form */ 146*4882a593Smuzhiyun if (discr_r == nn) { 147*4882a593Smuzhiyun /* 2 lines below: B(x) <-- x*B(x) */ 148*4882a593Smuzhiyun memmove (&b[1], b, nroots * sizeof (b[0])); 149*4882a593Smuzhiyun b[0] = nn; 150*4882a593Smuzhiyun } else { 151*4882a593Smuzhiyun /* 7 lines below: T(x) <-- lambda(x)-discr_r*x*b(x) */ 152*4882a593Smuzhiyun t[0] = lambda[0]; 153*4882a593Smuzhiyun for (i = 0; i < nroots; i++) { 154*4882a593Smuzhiyun if (b[i] != nn) { 155*4882a593Smuzhiyun t[i + 1] = lambda[i + 1] ^ 156*4882a593Smuzhiyun alpha_to[rs_modnn(rs, discr_r + 157*4882a593Smuzhiyun b[i])]; 158*4882a593Smuzhiyun } else 159*4882a593Smuzhiyun t[i + 1] = lambda[i + 1]; 160*4882a593Smuzhiyun } 161*4882a593Smuzhiyun if (2 * el <= r + no_eras - 1) { 162*4882a593Smuzhiyun el = r + no_eras - el; 163*4882a593Smuzhiyun /* 164*4882a593Smuzhiyun * 2 lines below: B(x) <-- inv(discr_r) * 165*4882a593Smuzhiyun * lambda(x) 166*4882a593Smuzhiyun */ 167*4882a593Smuzhiyun for (i = 0; i <= nroots; i++) { 168*4882a593Smuzhiyun b[i] = (lambda[i] == 0) ? nn : 169*4882a593Smuzhiyun rs_modnn(rs, index_of[lambda[i]] 170*4882a593Smuzhiyun - discr_r + nn); 171*4882a593Smuzhiyun } 172*4882a593Smuzhiyun } else { 173*4882a593Smuzhiyun /* 2 lines below: B(x) <-- x*B(x) */ 174*4882a593Smuzhiyun memmove(&b[1], b, nroots * sizeof(b[0])); 175*4882a593Smuzhiyun b[0] = nn; 176*4882a593Smuzhiyun } 177*4882a593Smuzhiyun memcpy(lambda, t, (nroots + 1) * sizeof(t[0])); 178*4882a593Smuzhiyun } 179*4882a593Smuzhiyun } 180*4882a593Smuzhiyun 181*4882a593Smuzhiyun /* Convert lambda to index form and compute deg(lambda(x)) */ 182*4882a593Smuzhiyun deg_lambda = 0; 183*4882a593Smuzhiyun for (i = 0; i < nroots + 1; i++) { 184*4882a593Smuzhiyun lambda[i] = index_of[lambda[i]]; 185*4882a593Smuzhiyun if (lambda[i] != nn) 186*4882a593Smuzhiyun deg_lambda = i; 187*4882a593Smuzhiyun } 188*4882a593Smuzhiyun 189*4882a593Smuzhiyun if (deg_lambda == 0) { 190*4882a593Smuzhiyun /* 191*4882a593Smuzhiyun * deg(lambda) is zero even though the syndrome is non-zero 192*4882a593Smuzhiyun * => uncorrectable error detected 193*4882a593Smuzhiyun */ 194*4882a593Smuzhiyun return -EBADMSG; 195*4882a593Smuzhiyun } 196*4882a593Smuzhiyun 197*4882a593Smuzhiyun /* Find roots of error+erasure locator polynomial by Chien search */ 198*4882a593Smuzhiyun memcpy(®[1], &lambda[1], nroots * sizeof(reg[0])); 199*4882a593Smuzhiyun count = 0; /* Number of roots of lambda(x) */ 200*4882a593Smuzhiyun for (i = 1, k = iprim - 1; i <= nn; i++, k = rs_modnn(rs, k + iprim)) { 201*4882a593Smuzhiyun q = 1; /* lambda[0] is always 0 */ 202*4882a593Smuzhiyun for (j = deg_lambda; j > 0; j--) { 203*4882a593Smuzhiyun if (reg[j] != nn) { 204*4882a593Smuzhiyun reg[j] = rs_modnn(rs, reg[j] + j); 205*4882a593Smuzhiyun q ^= alpha_to[reg[j]]; 206*4882a593Smuzhiyun } 207*4882a593Smuzhiyun } 208*4882a593Smuzhiyun if (q != 0) 209*4882a593Smuzhiyun continue; /* Not a root */ 210*4882a593Smuzhiyun 211*4882a593Smuzhiyun if (k < pad) { 212*4882a593Smuzhiyun /* Impossible error location. Uncorrectable error. */ 213*4882a593Smuzhiyun return -EBADMSG; 214*4882a593Smuzhiyun } 215*4882a593Smuzhiyun 216*4882a593Smuzhiyun /* store root (index-form) and error location number */ 217*4882a593Smuzhiyun root[count] = i; 218*4882a593Smuzhiyun loc[count] = k; 219*4882a593Smuzhiyun /* If we've already found max possible roots, 220*4882a593Smuzhiyun * abort the search to save time 221*4882a593Smuzhiyun */ 222*4882a593Smuzhiyun if (++count == deg_lambda) 223*4882a593Smuzhiyun break; 224*4882a593Smuzhiyun } 225*4882a593Smuzhiyun if (deg_lambda != count) { 226*4882a593Smuzhiyun /* 227*4882a593Smuzhiyun * deg(lambda) unequal to number of roots => uncorrectable 228*4882a593Smuzhiyun * error detected 229*4882a593Smuzhiyun */ 230*4882a593Smuzhiyun return -EBADMSG; 231*4882a593Smuzhiyun } 232*4882a593Smuzhiyun /* 233*4882a593Smuzhiyun * Compute err+eras evaluator poly omega(x) = s(x)*lambda(x) (modulo 234*4882a593Smuzhiyun * x**nroots). in index form. Also find deg(omega). 235*4882a593Smuzhiyun */ 236*4882a593Smuzhiyun deg_omega = deg_lambda - 1; 237*4882a593Smuzhiyun for (i = 0; i <= deg_omega; i++) { 238*4882a593Smuzhiyun tmp = 0; 239*4882a593Smuzhiyun for (j = i; j >= 0; j--) { 240*4882a593Smuzhiyun if ((s[i - j] != nn) && (lambda[j] != nn)) 241*4882a593Smuzhiyun tmp ^= 242*4882a593Smuzhiyun alpha_to[rs_modnn(rs, s[i - j] + lambda[j])]; 243*4882a593Smuzhiyun } 244*4882a593Smuzhiyun omega[i] = index_of[tmp]; 245*4882a593Smuzhiyun } 246*4882a593Smuzhiyun 247*4882a593Smuzhiyun /* 248*4882a593Smuzhiyun * Compute error values in poly-form. num1 = omega(inv(X(l))), num2 = 249*4882a593Smuzhiyun * inv(X(l))**(fcr-1) and den = lambda_pr(inv(X(l))) all in poly-form 250*4882a593Smuzhiyun * Note: we reuse the buffer for b to store the correction pattern 251*4882a593Smuzhiyun */ 252*4882a593Smuzhiyun num_corrected = 0; 253*4882a593Smuzhiyun for (j = count - 1; j >= 0; j--) { 254*4882a593Smuzhiyun num1 = 0; 255*4882a593Smuzhiyun for (i = deg_omega; i >= 0; i--) { 256*4882a593Smuzhiyun if (omega[i] != nn) 257*4882a593Smuzhiyun num1 ^= alpha_to[rs_modnn(rs, omega[i] + 258*4882a593Smuzhiyun i * root[j])]; 259*4882a593Smuzhiyun } 260*4882a593Smuzhiyun 261*4882a593Smuzhiyun if (num1 == 0) { 262*4882a593Smuzhiyun /* Nothing to correct at this position */ 263*4882a593Smuzhiyun b[j] = 0; 264*4882a593Smuzhiyun continue; 265*4882a593Smuzhiyun } 266*4882a593Smuzhiyun 267*4882a593Smuzhiyun num2 = alpha_to[rs_modnn(rs, root[j] * (fcr - 1) + nn)]; 268*4882a593Smuzhiyun den = 0; 269*4882a593Smuzhiyun 270*4882a593Smuzhiyun /* lambda[i+1] for i even is the formal derivative 271*4882a593Smuzhiyun * lambda_pr of lambda[i] */ 272*4882a593Smuzhiyun for (i = min(deg_lambda, nroots - 1) & ~1; i >= 0; i -= 2) { 273*4882a593Smuzhiyun if (lambda[i + 1] != nn) { 274*4882a593Smuzhiyun den ^= alpha_to[rs_modnn(rs, lambda[i + 1] + 275*4882a593Smuzhiyun i * root[j])]; 276*4882a593Smuzhiyun } 277*4882a593Smuzhiyun } 278*4882a593Smuzhiyun 279*4882a593Smuzhiyun b[j] = alpha_to[rs_modnn(rs, index_of[num1] + 280*4882a593Smuzhiyun index_of[num2] + 281*4882a593Smuzhiyun nn - index_of[den])]; 282*4882a593Smuzhiyun num_corrected++; 283*4882a593Smuzhiyun } 284*4882a593Smuzhiyun 285*4882a593Smuzhiyun /* 286*4882a593Smuzhiyun * We compute the syndrome of the 'error' and check that it matches 287*4882a593Smuzhiyun * the syndrome of the received word 288*4882a593Smuzhiyun */ 289*4882a593Smuzhiyun for (i = 0; i < nroots; i++) { 290*4882a593Smuzhiyun tmp = 0; 291*4882a593Smuzhiyun for (j = 0; j < count; j++) { 292*4882a593Smuzhiyun if (b[j] == 0) 293*4882a593Smuzhiyun continue; 294*4882a593Smuzhiyun 295*4882a593Smuzhiyun k = (fcr + i) * prim * (nn-loc[j]-1); 296*4882a593Smuzhiyun tmp ^= alpha_to[rs_modnn(rs, index_of[b[j]] + k)]; 297*4882a593Smuzhiyun } 298*4882a593Smuzhiyun 299*4882a593Smuzhiyun if (tmp != alpha_to[s[i]]) 300*4882a593Smuzhiyun return -EBADMSG; 301*4882a593Smuzhiyun } 302*4882a593Smuzhiyun 303*4882a593Smuzhiyun /* 304*4882a593Smuzhiyun * Store the error correction pattern, if a 305*4882a593Smuzhiyun * correction buffer is available 306*4882a593Smuzhiyun */ 307*4882a593Smuzhiyun if (corr && eras_pos) { 308*4882a593Smuzhiyun j = 0; 309*4882a593Smuzhiyun for (i = 0; i < count; i++) { 310*4882a593Smuzhiyun if (b[i]) { 311*4882a593Smuzhiyun corr[j] = b[i]; 312*4882a593Smuzhiyun eras_pos[j++] = loc[i] - pad; 313*4882a593Smuzhiyun } 314*4882a593Smuzhiyun } 315*4882a593Smuzhiyun } else if (data && par) { 316*4882a593Smuzhiyun /* Apply error to data and parity */ 317*4882a593Smuzhiyun for (i = 0; i < count; i++) { 318*4882a593Smuzhiyun if (loc[i] < (nn - nroots)) 319*4882a593Smuzhiyun data[loc[i] - pad] ^= b[i]; 320*4882a593Smuzhiyun else 321*4882a593Smuzhiyun par[loc[i] - pad - len] ^= b[i]; 322*4882a593Smuzhiyun } 323*4882a593Smuzhiyun } 324*4882a593Smuzhiyun 325*4882a593Smuzhiyun return num_corrected; 326*4882a593Smuzhiyun } 327