1*4882a593Smuzhiyun /*
2*4882a593Smuzhiyun * LZ4 - Fast LZ compression algorithm
3*4882a593Smuzhiyun * Copyright (C) 2011 - 2016, Yann Collet.
4*4882a593Smuzhiyun * BSD 2-Clause License (http://www.opensource.org/licenses/bsd-license.php)
5*4882a593Smuzhiyun * Redistribution and use in source and binary forms, with or without
6*4882a593Smuzhiyun * modification, are permitted provided that the following conditions are
7*4882a593Smuzhiyun * met:
8*4882a593Smuzhiyun * * Redistributions of source code must retain the above copyright
9*4882a593Smuzhiyun * notice, this list of conditions and the following disclaimer.
10*4882a593Smuzhiyun * * Redistributions in binary form must reproduce the above
11*4882a593Smuzhiyun * copyright notice, this list of conditions and the following disclaimer
12*4882a593Smuzhiyun * in the documentation and/or other materials provided with the
13*4882a593Smuzhiyun * distribution.
14*4882a593Smuzhiyun * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
15*4882a593Smuzhiyun * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
16*4882a593Smuzhiyun * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
17*4882a593Smuzhiyun * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
18*4882a593Smuzhiyun * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
19*4882a593Smuzhiyun * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
20*4882a593Smuzhiyun * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
21*4882a593Smuzhiyun * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
22*4882a593Smuzhiyun * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
23*4882a593Smuzhiyun * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
24*4882a593Smuzhiyun * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
25*4882a593Smuzhiyun * You can contact the author at :
26*4882a593Smuzhiyun * - LZ4 homepage : http://www.lz4.org
27*4882a593Smuzhiyun * - LZ4 source repository : https://github.com/lz4/lz4
28*4882a593Smuzhiyun *
29*4882a593Smuzhiyun * Changed for kernel usage by:
30*4882a593Smuzhiyun * Sven Schmidt <4sschmid@informatik.uni-hamburg.de>
31*4882a593Smuzhiyun */
32*4882a593Smuzhiyun
33*4882a593Smuzhiyun /*-************************************
34*4882a593Smuzhiyun * Dependencies
35*4882a593Smuzhiyun **************************************/
36*4882a593Smuzhiyun #include <linux/lz4.h>
37*4882a593Smuzhiyun #include "lz4defs.h"
38*4882a593Smuzhiyun #include <linux/init.h>
39*4882a593Smuzhiyun #include <linux/module.h>
40*4882a593Smuzhiyun #include <linux/kernel.h>
41*4882a593Smuzhiyun #include <asm/unaligned.h>
42*4882a593Smuzhiyun
43*4882a593Smuzhiyun /*-*****************************
44*4882a593Smuzhiyun * Decompression functions
45*4882a593Smuzhiyun *******************************/
46*4882a593Smuzhiyun
/*
 * Debug tracing is compiled out: every DEBUGLOG() invocation expands to
 * an empty block, so its arguments are never evaluated.
 */
47*4882a593Smuzhiyun #define DEBUGLOG(l, ...) {} /* disabled */
48*4882a593Smuzhiyun
/* Provide a no-op assert() only when no assert macro is defined yet. */
49*4882a593Smuzhiyun #ifndef assert
50*4882a593Smuzhiyun #define assert(condition) ((void)0)
51*4882a593Smuzhiyun #endif
52*4882a593Smuzhiyun
53*4882a593Smuzhiyun /*
54*4882a593Smuzhiyun * LZ4_decompress_generic() :
55*4882a593Smuzhiyun * This generic decompression function covers all use cases.
56*4882a593Smuzhiyun * It shall be instantiated several times, using different sets of directives.
57*4882a593Smuzhiyun * Note that it is important for performance that this function really gets inlined,
58*4882a593Smuzhiyun * in order to remove useless branches during compilation optimization.
59*4882a593Smuzhiyun */
/*
 * Shared decoder body used by every LZ4_decompress_*() entry point in
 * this file. It reads sequences from src (token, optional extra length
 * bytes, literals, 2-byte little-endian offset, match length) and writes
 * the decoded bytes to dst until one of the end conditions is reached.
 *
 * Return value:
 *  - endOnInput set   : number of bytes written to dst;
 *  - endOnInput clear : number of bytes read from src;
 *  - on a detected error: the negative value -(bytes of src consumed) - 1;
 *  - the empty-buffer special cases at the top return 0, 1 or -1 directly.
 */
LZ4_decompress_generic(const char * const src,char * const dst,int srcSize,int outputSize,endCondition_directive endOnInput,earlyEnd_directive partialDecoding,dict_directive dict,const BYTE * const lowPrefix,const BYTE * const dictStart,const size_t dictSize)60*4882a593Smuzhiyun static FORCE_INLINE int LZ4_decompress_generic(
61*4882a593Smuzhiyun const char * const src,
62*4882a593Smuzhiyun char * const dst,
63*4882a593Smuzhiyun int srcSize,
64*4882a593Smuzhiyun /*
65*4882a593Smuzhiyun * If endOnInput == endOnInputSize,
66*4882a593Smuzhiyun * this value is `dstCapacity`
67*4882a593Smuzhiyun */
68*4882a593Smuzhiyun int outputSize,
69*4882a593Smuzhiyun /* endOnOutputSize, endOnInputSize */
70*4882a593Smuzhiyun endCondition_directive endOnInput,
71*4882a593Smuzhiyun /* full, partial */
72*4882a593Smuzhiyun earlyEnd_directive partialDecoding,
73*4882a593Smuzhiyun /* noDict, withPrefix64k, usingExtDict */
74*4882a593Smuzhiyun dict_directive dict,
75*4882a593Smuzhiyun /* always <= dst, == dst when no prefix */
76*4882a593Smuzhiyun const BYTE * const lowPrefix,
77*4882a593Smuzhiyun /* only if dict == usingExtDict */
78*4882a593Smuzhiyun const BYTE * const dictStart,
79*4882a593Smuzhiyun /* note : = 0 if noDict */
80*4882a593Smuzhiyun const size_t dictSize
81*4882a593Smuzhiyun )
82*4882a593Smuzhiyun {
/* ip/iend : read cursor and end of the compressed input */
83*4882a593Smuzhiyun const BYTE *ip = (const BYTE *) src;
84*4882a593Smuzhiyun const BYTE * const iend = ip + srcSize;
85*4882a593Smuzhiyun
/* op/oend : write cursor and end of the output; cpy : end of the current copy */
86*4882a593Smuzhiyun BYTE *op = (BYTE *) dst;
87*4882a593Smuzhiyun BYTE * const oend = op + outputSize;
88*4882a593Smuzhiyun BYTE *cpy;
89*4882a593Smuzhiyun
90*4882a593Smuzhiyun const BYTE * const dictEnd = (const BYTE *)dictStart + dictSize;
/*
 * Adjustments applied to `match`, indexed by offset, in the
 * offset < 8 branch of the in-block match copy further down.
 */
91*4882a593Smuzhiyun static const unsigned int inc32table[8] = {0, 1, 2, 1, 0, 4, 4, 4};
92*4882a593Smuzhiyun static const int dec64table[8] = {0, 0, 0, -1, -4, 1, 2, 3};
93*4882a593Smuzhiyun
/*
 * safeDecode  : input-bounded mode, enables the overflow checks below.
 * checkOffset : match offsets are validated only in safe mode and only
 *               when the dictionary is smaller than 64 KB.
 */
94*4882a593Smuzhiyun const int safeDecode = (endOnInput == endOnInputSize);
95*4882a593Smuzhiyun const int checkOffset = ((safeDecode) && (dictSize < (int)(64 * KB)));
96*4882a593Smuzhiyun
97*4882a593Smuzhiyun /* Set up the "end" pointers for the shortcut. */
98*4882a593Smuzhiyun const BYTE *const shortiend = iend -
99*4882a593Smuzhiyun (endOnInput ? 14 : 8) /*maxLL*/ - 2 /*offset*/;
100*4882a593Smuzhiyun const BYTE *const shortoend = oend -
101*4882a593Smuzhiyun (endOnInput ? 14 : 8) /*maxLL*/ - 18 /*maxML*/;
102*4882a593Smuzhiyun
103*4882a593Smuzhiyun DEBUGLOG(5, "%s (srcSize:%i, dstSize:%i)", __func__,
104*4882a593Smuzhiyun srcSize, outputSize);
105*4882a593Smuzhiyun
106*4882a593Smuzhiyun /* Special cases */
107*4882a593Smuzhiyun assert(lowPrefix <= op);
108*4882a593Smuzhiyun assert(src != NULL);
109*4882a593Smuzhiyun
110*4882a593Smuzhiyun /* Empty output buffer */
/* Safe mode: only a one-byte input holding a zero token is accepted. */
111*4882a593Smuzhiyun if ((endOnInput) && (unlikely(outputSize == 0)))
112*4882a593Smuzhiyun return ((srcSize == 1) && (*ip == 0)) ? 0 : -1;
113*4882a593Smuzhiyun
/* Fast mode: a zero token is accepted and counts as one input byte read. */
114*4882a593Smuzhiyun if ((!endOnInput) && (unlikely(outputSize == 0)))
115*4882a593Smuzhiyun return (*ip == 0 ? 1 : -1);
116*4882a593Smuzhiyun
/* Safe mode with no input at all is an error. */
117*4882a593Smuzhiyun if ((endOnInput) && unlikely(srcSize == 0))
118*4882a593Smuzhiyun return -1;
119*4882a593Smuzhiyun
120*4882a593Smuzhiyun /* Main Loop : decode sequences */
121*4882a593Smuzhiyun while (1) {
122*4882a593Smuzhiyun size_t length;
123*4882a593Smuzhiyun const BYTE *match;
124*4882a593Smuzhiyun size_t offset;
125*4882a593Smuzhiyun
126*4882a593Smuzhiyun /* get literal length */
127*4882a593Smuzhiyun unsigned int const token = *ip++;
128*4882a593Smuzhiyun length = token>>ML_BITS;
129*4882a593Smuzhiyun
130*4882a593Smuzhiyun /* ip < iend before the increment */
131*4882a593Smuzhiyun assert(!endOnInput || ip <= iend);
132*4882a593Smuzhiyun
133*4882a593Smuzhiyun /*
134*4882a593Smuzhiyun * A two-stage shortcut for the most common case:
135*4882a593Smuzhiyun * 1) If the literal length is 0..14, and there is enough
136*4882a593Smuzhiyun * space, enter the shortcut and copy 16 bytes on behalf
137*4882a593Smuzhiyun * of the literals (in the fast mode, only 8 bytes can be
138*4882a593Smuzhiyun * safely copied this way).
139*4882a593Smuzhiyun * 2) Further if the match length is 4..18, copy 18 bytes
140*4882a593Smuzhiyun * in a similar manner; but we ensure that there's enough
141*4882a593Smuzhiyun * space in the output for those 18 bytes earlier, upon
142*4882a593Smuzhiyun * entering the shortcut (in other words, there is a
143*4882a593Smuzhiyun * combined check for both stages).
144*4882a593Smuzhiyun *
145*4882a593Smuzhiyun * The & in the likely() below is intentionally not && so that
146*4882a593Smuzhiyun * some compilers can produce better parallelized runtime code
147*4882a593Smuzhiyun */
148*4882a593Smuzhiyun if ((endOnInput ? length != RUN_MASK : length <= 8)
149*4882a593Smuzhiyun /*
150*4882a593Smuzhiyun * strictly "less than" on input, to re-enter
151*4882a593Smuzhiyun * the loop with at least one byte
152*4882a593Smuzhiyun */
153*4882a593Smuzhiyun && likely((endOnInput ? ip < shortiend : 1) &
154*4882a593Smuzhiyun (op <= shortoend))) {
155*4882a593Smuzhiyun /* Copy the literals */
/* A fixed-size copy is issued; the cursors advance by `length` only. */
156*4882a593Smuzhiyun LZ4_memcpy(op, ip, endOnInput ? 16 : 8);
157*4882a593Smuzhiyun op += length; ip += length;
158*4882a593Smuzhiyun
159*4882a593Smuzhiyun /*
160*4882a593Smuzhiyun * The second stage:
161*4882a593Smuzhiyun * prepare for match copying, decode full info.
162*4882a593Smuzhiyun * If it doesn't work out, the info won't be wasted.
163*4882a593Smuzhiyun */
164*4882a593Smuzhiyun length = token & ML_MASK; /* match length */
165*4882a593Smuzhiyun offset = LZ4_readLE16(ip);
166*4882a593Smuzhiyun ip += 2;
167*4882a593Smuzhiyun match = op - offset;
168*4882a593Smuzhiyun assert(match <= op); /* check overflow */
169*4882a593Smuzhiyun
170*4882a593Smuzhiyun /* Do not deal with overlapping matches. */
171*4882a593Smuzhiyun if ((length != ML_MASK) &&
172*4882a593Smuzhiyun (offset >= 8) &&
173*4882a593Smuzhiyun (dict == withPrefix64k || match >= lowPrefix)) {
174*4882a593Smuzhiyun /* Copy the match. */
175*4882a593Smuzhiyun LZ4_memcpy(op + 0, match + 0, 8);
176*4882a593Smuzhiyun LZ4_memcpy(op + 8, match + 8, 8);
177*4882a593Smuzhiyun LZ4_memcpy(op + 16, match + 16, 2);
178*4882a593Smuzhiyun op += length + MINMATCH;
179*4882a593Smuzhiyun /* Both stages worked, load the next token. */
180*4882a593Smuzhiyun continue;
181*4882a593Smuzhiyun }
182*4882a593Smuzhiyun
183*4882a593Smuzhiyun /*
184*4882a593Smuzhiyun * The second stage didn't work out, but the info
185*4882a593Smuzhiyun * is ready. Propel it right to the point of match
186*4882a593Smuzhiyun * copying.
187*4882a593Smuzhiyun */
188*4882a593Smuzhiyun goto _copy_match;
189*4882a593Smuzhiyun }
190*4882a593Smuzhiyun
191*4882a593Smuzhiyun /* decode literal length */
/*
 * A token field equal to RUN_MASK means the length continues in the
 * following bytes: each is added to the total, and the loop stops at
 * the first byte that is not 255 (or, in safe mode, when ip gets
 * within RUN_MASK bytes of the end of input).
 */
192*4882a593Smuzhiyun if (length == RUN_MASK) {
193*4882a593Smuzhiyun unsigned int s;
194*4882a593Smuzhiyun
195*4882a593Smuzhiyun if (unlikely(endOnInput ? ip >= iend - RUN_MASK : 0)) {
196*4882a593Smuzhiyun /* overflow detection */
197*4882a593Smuzhiyun goto _output_error;
198*4882a593Smuzhiyun }
199*4882a593Smuzhiyun do {
200*4882a593Smuzhiyun s = *ip++;
201*4882a593Smuzhiyun length += s;
202*4882a593Smuzhiyun } while (likely(endOnInput
203*4882a593Smuzhiyun ? ip < iend - RUN_MASK
204*4882a593Smuzhiyun : 1) & (s == 255));
205*4882a593Smuzhiyun
206*4882a593Smuzhiyun if ((safeDecode)
207*4882a593Smuzhiyun && unlikely((uptrval)(op) +
208*4882a593Smuzhiyun length < (uptrval)(op))) {
209*4882a593Smuzhiyun /* overflow detection */
210*4882a593Smuzhiyun goto _output_error;
211*4882a593Smuzhiyun }
212*4882a593Smuzhiyun if ((safeDecode)
213*4882a593Smuzhiyun && unlikely((uptrval)(ip) +
214*4882a593Smuzhiyun length < (uptrval)(ip))) {
215*4882a593Smuzhiyun /* overflow detection */
216*4882a593Smuzhiyun goto _output_error;
217*4882a593Smuzhiyun }
218*4882a593Smuzhiyun }
219*4882a593Smuzhiyun
220*4882a593Smuzhiyun /* copy literals */
221*4882a593Smuzhiyun cpy = op + length;
222*4882a593Smuzhiyun LZ4_STATIC_ASSERT(MFLIMIT >= WILDCOPYLENGTH);
223*4882a593Smuzhiyun
/*
 * The literal run ends too close to the end of the output (or, in
 * safe mode, of the input) for the wild copy in the else branch:
 * validate the end condition and copy exactly `length` bytes.
 */
224*4882a593Smuzhiyun if (((endOnInput) && ((cpy > oend - MFLIMIT)
225*4882a593Smuzhiyun || (ip + length > iend - (2 + 1 + LASTLITERALS))))
226*4882a593Smuzhiyun || ((!endOnInput) && (cpy > oend - WILDCOPYLENGTH))) {
227*4882a593Smuzhiyun if (partialDecoding) {
228*4882a593Smuzhiyun if (cpy > oend) {
229*4882a593Smuzhiyun /*
230*4882a593Smuzhiyun * Partial decoding :
231*4882a593Smuzhiyun * stop in the middle of literal segment
232*4882a593Smuzhiyun */
233*4882a593Smuzhiyun cpy = oend;
234*4882a593Smuzhiyun length = oend - op;
235*4882a593Smuzhiyun }
236*4882a593Smuzhiyun if ((endOnInput)
237*4882a593Smuzhiyun && (ip + length > iend)) {
238*4882a593Smuzhiyun /*
239*4882a593Smuzhiyun * Error :
240*4882a593Smuzhiyun * read attempt beyond
241*4882a593Smuzhiyun * end of input buffer
242*4882a593Smuzhiyun */
243*4882a593Smuzhiyun goto _output_error;
244*4882a593Smuzhiyun }
245*4882a593Smuzhiyun } else {
246*4882a593Smuzhiyun if ((!endOnInput)
247*4882a593Smuzhiyun && (cpy != oend)) {
248*4882a593Smuzhiyun /*
249*4882a593Smuzhiyun * Error :
250*4882a593Smuzhiyun * block decoding must
251*4882a593Smuzhiyun * stop exactly there
252*4882a593Smuzhiyun */
253*4882a593Smuzhiyun goto _output_error;
254*4882a593Smuzhiyun }
255*4882a593Smuzhiyun if ((endOnInput)
256*4882a593Smuzhiyun && ((ip + length != iend)
257*4882a593Smuzhiyun || (cpy > oend))) {
258*4882a593Smuzhiyun /*
259*4882a593Smuzhiyun * Error :
260*4882a593Smuzhiyun * input must be consumed
261*4882a593Smuzhiyun */
262*4882a593Smuzhiyun goto _output_error;
263*4882a593Smuzhiyun }
264*4882a593Smuzhiyun }
265*4882a593Smuzhiyun
266*4882a593Smuzhiyun /*
267*4882a593Smuzhiyun * supports overlapping memory regions; only matters
268*4882a593Smuzhiyun * for in-place decompression scenarios
269*4882a593Smuzhiyun */
270*4882a593Smuzhiyun LZ4_memmove(op, ip, length);
271*4882a593Smuzhiyun ip += length;
272*4882a593Smuzhiyun op += length;
273*4882a593Smuzhiyun
274*4882a593Smuzhiyun /* Necessarily EOF when !partialDecoding.
275*4882a593Smuzhiyun * When partialDecoding, it is EOF if we've either
276*4882a593Smuzhiyun * filled the output buffer or
277*4882a593Smuzhiyun * can't proceed with reading an offset for following match.
278*4882a593Smuzhiyun */
279*4882a593Smuzhiyun if (!partialDecoding || (cpy == oend) || (ip >= (iend - 2)))
280*4882a593Smuzhiyun break;
281*4882a593Smuzhiyun } else {
282*4882a593Smuzhiyun /* may overwrite up to WILDCOPYLENGTH beyond cpy */
283*4882a593Smuzhiyun LZ4_wildCopy(op, ip, cpy);
284*4882a593Smuzhiyun ip += length;
285*4882a593Smuzhiyun op = cpy;
286*4882a593Smuzhiyun }
287*4882a593Smuzhiyun
288*4882a593Smuzhiyun /* get offset */
289*4882a593Smuzhiyun offset = LZ4_readLE16(ip);
290*4882a593Smuzhiyun ip += 2;
291*4882a593Smuzhiyun match = op - offset;
292*4882a593Smuzhiyun
293*4882a593Smuzhiyun /* get matchlength */
294*4882a593Smuzhiyun length = token & ML_MASK;
295*4882a593Smuzhiyun
/*
 * Entered either by falling through from above or by the goto in the
 * shortcut; in both cases offset, match and length (the match-length
 * field of the token) are already set.
 */
296*4882a593Smuzhiyun _copy_match:
297*4882a593Smuzhiyun if ((checkOffset) && (unlikely(match + dictSize < lowPrefix))) {
298*4882a593Smuzhiyun /* Error : offset outside buffers */
299*4882a593Smuzhiyun goto _output_error;
300*4882a593Smuzhiyun }
301*4882a593Smuzhiyun
302*4882a593Smuzhiyun /* costs ~1%; silence an msan warning when offset == 0 */
303*4882a593Smuzhiyun /*
304*4882a593Smuzhiyun * note : when partialDecoding, there is no guarantee that
305*4882a593Smuzhiyun * at least 4 bytes remain available in output buffer
306*4882a593Smuzhiyun */
307*4882a593Smuzhiyun if (!partialDecoding) {
308*4882a593Smuzhiyun assert(oend > op);
309*4882a593Smuzhiyun assert(oend - op >= 4);
310*4882a593Smuzhiyun
311*4882a593Smuzhiyun LZ4_write32(op, (U32)offset);
312*4882a593Smuzhiyun }
313*4882a593Smuzhiyun
/* Extended match length: same 255-terminated byte encoding as literals. */
314*4882a593Smuzhiyun if (length == ML_MASK) {
315*4882a593Smuzhiyun unsigned int s;
316*4882a593Smuzhiyun
317*4882a593Smuzhiyun do {
318*4882a593Smuzhiyun s = *ip++;
319*4882a593Smuzhiyun
320*4882a593Smuzhiyun if ((endOnInput) && (ip > iend - LASTLITERALS))
321*4882a593Smuzhiyun goto _output_error;
322*4882a593Smuzhiyun
323*4882a593Smuzhiyun length += s;
324*4882a593Smuzhiyun } while (s == 255);
325*4882a593Smuzhiyun
326*4882a593Smuzhiyun if ((safeDecode)
327*4882a593Smuzhiyun && unlikely(
328*4882a593Smuzhiyun (uptrval)(op) + length < (uptrval)op)) {
329*4882a593Smuzhiyun /* overflow detection */
330*4882a593Smuzhiyun goto _output_error;
331*4882a593Smuzhiyun }
332*4882a593Smuzhiyun }
333*4882a593Smuzhiyun
/* The stored match length is biased by MINMATCH. */
334*4882a593Smuzhiyun length += MINMATCH;
335*4882a593Smuzhiyun
336*4882a593Smuzhiyun /* match starting within external dictionary */
337*4882a593Smuzhiyun if ((dict == usingExtDict) && (match < lowPrefix)) {
338*4882a593Smuzhiyun if (unlikely(op + length > oend - LASTLITERALS)) {
339*4882a593Smuzhiyun /* doesn't respect parsing restriction */
340*4882a593Smuzhiyun if (!partialDecoding)
341*4882a593Smuzhiyun goto _output_error;
342*4882a593Smuzhiyun length = min(length, (size_t)(oend - op));
343*4882a593Smuzhiyun }
344*4882a593Smuzhiyun
345*4882a593Smuzhiyun if (length <= (size_t)(lowPrefix - match)) {
346*4882a593Smuzhiyun /*
347*4882a593Smuzhiyun * match fits entirely within external
348*4882a593Smuzhiyun * dictionary : just copy
349*4882a593Smuzhiyun */
350*4882a593Smuzhiyun memmove(op, dictEnd - (lowPrefix - match),
351*4882a593Smuzhiyun length);
352*4882a593Smuzhiyun op += length;
353*4882a593Smuzhiyun } else {
354*4882a593Smuzhiyun /*
355*4882a593Smuzhiyun * match stretches into both external
356*4882a593Smuzhiyun * dictionary and current block
357*4882a593Smuzhiyun */
/* copySize bytes come from the dictionary tail, restSize from lowPrefix on. */
358*4882a593Smuzhiyun size_t const copySize = (size_t)(lowPrefix - match);
359*4882a593Smuzhiyun size_t const restSize = length - copySize;
360*4882a593Smuzhiyun
361*4882a593Smuzhiyun LZ4_memcpy(op, dictEnd - copySize, copySize);
362*4882a593Smuzhiyun op += copySize;
363*4882a593Smuzhiyun if (restSize > (size_t)(op - lowPrefix)) {
364*4882a593Smuzhiyun /* overlap copy */
365*4882a593Smuzhiyun BYTE * const endOfMatch = op + restSize;
366*4882a593Smuzhiyun const BYTE *copyFrom = lowPrefix;
367*4882a593Smuzhiyun
368*4882a593Smuzhiyun while (op < endOfMatch)
369*4882a593Smuzhiyun *op++ = *copyFrom++;
370*4882a593Smuzhiyun } else {
371*4882a593Smuzhiyun LZ4_memcpy(op, lowPrefix, restSize);
372*4882a593Smuzhiyun op += restSize;
373*4882a593Smuzhiyun }
374*4882a593Smuzhiyun }
375*4882a593Smuzhiyun continue;
376*4882a593Smuzhiyun }
377*4882a593Smuzhiyun
378*4882a593Smuzhiyun /* copy match within block */
379*4882a593Smuzhiyun cpy = op + length;
380*4882a593Smuzhiyun
381*4882a593Smuzhiyun /*
382*4882a593Smuzhiyun * partialDecoding :
383*4882a593Smuzhiyun * may not respect endBlock parsing restrictions
384*4882a593Smuzhiyun */
385*4882a593Smuzhiyun assert(op <= oend);
386*4882a593Smuzhiyun if (partialDecoding &&
387*4882a593Smuzhiyun (cpy > oend - MATCH_SAFEGUARD_DISTANCE)) {
/* Clamp the match to the remaining output space; no over-copy here. */
388*4882a593Smuzhiyun size_t const mlen = min(length, (size_t)(oend - op));
389*4882a593Smuzhiyun const BYTE * const matchEnd = match + mlen;
390*4882a593Smuzhiyun BYTE * const copyEnd = op + mlen;
391*4882a593Smuzhiyun
392*4882a593Smuzhiyun if (matchEnd > op) {
393*4882a593Smuzhiyun /* overlap copy */
394*4882a593Smuzhiyun while (op < copyEnd)
395*4882a593Smuzhiyun *op++ = *match++;
396*4882a593Smuzhiyun } else {
397*4882a593Smuzhiyun LZ4_memcpy(op, match, mlen);
398*4882a593Smuzhiyun }
399*4882a593Smuzhiyun op = copyEnd;
400*4882a593Smuzhiyun if (op == oend)
401*4882a593Smuzhiyun break;
402*4882a593Smuzhiyun continue;
403*4882a593Smuzhiyun }
404*4882a593Smuzhiyun
/*
 * offset < 8: source and destination lie less than 8 bytes apart, so
 * a plain 8-byte copy would overlap. The first four bytes are copied
 * one at a time and `match` is then adjusted through inc32table /
 * dec64table before the wider copies that follow.
 */
405*4882a593Smuzhiyun if (unlikely(offset < 8)) {
406*4882a593Smuzhiyun op[0] = match[0];
407*4882a593Smuzhiyun op[1] = match[1];
408*4882a593Smuzhiyun op[2] = match[2];
409*4882a593Smuzhiyun op[3] = match[3];
410*4882a593Smuzhiyun match += inc32table[offset];
411*4882a593Smuzhiyun LZ4_memcpy(op + 4, match, 4);
412*4882a593Smuzhiyun match -= dec64table[offset];
413*4882a593Smuzhiyun } else {
414*4882a593Smuzhiyun LZ4_copy8(op, match);
415*4882a593Smuzhiyun match += 8;
416*4882a593Smuzhiyun }
417*4882a593Smuzhiyun
418*4882a593Smuzhiyun op += 8;
419*4882a593Smuzhiyun
/* Near the end of the output: wild-copy only up to oCopyLimit, then byte by byte. */
420*4882a593Smuzhiyun if (unlikely(cpy > oend - MATCH_SAFEGUARD_DISTANCE)) {
421*4882a593Smuzhiyun BYTE * const oCopyLimit = oend - (WILDCOPYLENGTH - 1);
422*4882a593Smuzhiyun
423*4882a593Smuzhiyun if (cpy > oend - LASTLITERALS) {
424*4882a593Smuzhiyun /*
425*4882a593Smuzhiyun * Error : last LASTLITERALS bytes
426*4882a593Smuzhiyun * must be literals (uncompressed)
427*4882a593Smuzhiyun */
428*4882a593Smuzhiyun goto _output_error;
429*4882a593Smuzhiyun }
430*4882a593Smuzhiyun
431*4882a593Smuzhiyun if (op < oCopyLimit) {
432*4882a593Smuzhiyun LZ4_wildCopy(op, match, oCopyLimit);
433*4882a593Smuzhiyun match += oCopyLimit - op;
434*4882a593Smuzhiyun op = oCopyLimit;
435*4882a593Smuzhiyun }
436*4882a593Smuzhiyun while (op < cpy)
437*4882a593Smuzhiyun *op++ = *match++;
438*4882a593Smuzhiyun } else {
439*4882a593Smuzhiyun LZ4_copy8(op, match);
440*4882a593Smuzhiyun if (length > 16)
441*4882a593Smuzhiyun LZ4_wildCopy(op + 8, match + 8, cpy);
442*4882a593Smuzhiyun }
443*4882a593Smuzhiyun op = cpy; /* wildcopy correction */
444*4882a593Smuzhiyun }
445*4882a593Smuzhiyun
446*4882a593Smuzhiyun /* end of decoding */
447*4882a593Smuzhiyun if (endOnInput) {
448*4882a593Smuzhiyun /* Nb of output bytes decoded */
449*4882a593Smuzhiyun return (int) (((char *)op) - dst);
450*4882a593Smuzhiyun } else {
451*4882a593Smuzhiyun /* Nb of input bytes read */
452*4882a593Smuzhiyun return (int) (((const char *)ip) - src);
453*4882a593Smuzhiyun }
454*4882a593Smuzhiyun
455*4882a593Smuzhiyun /* Overflow error detected */
/* The result is always negative: -(input bytes consumed so far) - 1. */
456*4882a593Smuzhiyun _output_error:
457*4882a593Smuzhiyun return (int) (-(((const char *)ip) - src)) - 1;
458*4882a593Smuzhiyun }
459*4882a593Smuzhiyun
LZ4_decompress_safe(const char * source,char * dest,int compressedSize,int maxDecompressedSize)460*4882a593Smuzhiyun int LZ4_decompress_safe(const char *source, char *dest,
461*4882a593Smuzhiyun int compressedSize, int maxDecompressedSize)
462*4882a593Smuzhiyun {
463*4882a593Smuzhiyun return LZ4_decompress_generic(source, dest,
464*4882a593Smuzhiyun compressedSize, maxDecompressedSize,
465*4882a593Smuzhiyun endOnInputSize, decode_full_block,
466*4882a593Smuzhiyun noDict, (BYTE *)dest, NULL, 0);
467*4882a593Smuzhiyun }
468*4882a593Smuzhiyun
LZ4_decompress_safe_partial(const char * src,char * dst,int compressedSize,int targetOutputSize,int dstCapacity)469*4882a593Smuzhiyun int LZ4_decompress_safe_partial(const char *src, char *dst,
470*4882a593Smuzhiyun int compressedSize, int targetOutputSize, int dstCapacity)
471*4882a593Smuzhiyun {
472*4882a593Smuzhiyun dstCapacity = min(targetOutputSize, dstCapacity);
473*4882a593Smuzhiyun return LZ4_decompress_generic(src, dst, compressedSize, dstCapacity,
474*4882a593Smuzhiyun endOnInputSize, partial_decode,
475*4882a593Smuzhiyun noDict, (BYTE *)dst, NULL, 0);
476*4882a593Smuzhiyun }
477*4882a593Smuzhiyun
LZ4_decompress_fast(const char * source,char * dest,int originalSize)478*4882a593Smuzhiyun int LZ4_decompress_fast(const char *source, char *dest, int originalSize)
479*4882a593Smuzhiyun {
480*4882a593Smuzhiyun return LZ4_decompress_generic(source, dest, 0, originalSize,
481*4882a593Smuzhiyun endOnOutputSize, decode_full_block,
482*4882a593Smuzhiyun withPrefix64k,
483*4882a593Smuzhiyun (BYTE *)dest - 64 * KB, NULL, 0);
484*4882a593Smuzhiyun }
485*4882a593Smuzhiyun
486*4882a593Smuzhiyun /* ===== Instantiate a few more decoding cases, used more than once. ===== */
487*4882a593Smuzhiyun
LZ4_decompress_safe_withPrefix64k(const char * source,char * dest,int compressedSize,int maxOutputSize)488*4882a593Smuzhiyun int LZ4_decompress_safe_withPrefix64k(const char *source, char *dest,
489*4882a593Smuzhiyun int compressedSize, int maxOutputSize)
490*4882a593Smuzhiyun {
491*4882a593Smuzhiyun return LZ4_decompress_generic(source, dest,
492*4882a593Smuzhiyun compressedSize, maxOutputSize,
493*4882a593Smuzhiyun endOnInputSize, decode_full_block,
494*4882a593Smuzhiyun withPrefix64k,
495*4882a593Smuzhiyun (BYTE *)dest - 64 * KB, NULL, 0);
496*4882a593Smuzhiyun }
497*4882a593Smuzhiyun
LZ4_decompress_safe_withSmallPrefix(const char * source,char * dest,int compressedSize,int maxOutputSize,size_t prefixSize)498*4882a593Smuzhiyun static int LZ4_decompress_safe_withSmallPrefix(const char *source, char *dest,
499*4882a593Smuzhiyun int compressedSize,
500*4882a593Smuzhiyun int maxOutputSize,
501*4882a593Smuzhiyun size_t prefixSize)
502*4882a593Smuzhiyun {
503*4882a593Smuzhiyun return LZ4_decompress_generic(source, dest,
504*4882a593Smuzhiyun compressedSize, maxOutputSize,
505*4882a593Smuzhiyun endOnInputSize, decode_full_block,
506*4882a593Smuzhiyun noDict,
507*4882a593Smuzhiyun (BYTE *)dest - prefixSize, NULL, 0);
508*4882a593Smuzhiyun }
509*4882a593Smuzhiyun
LZ4_decompress_safe_forceExtDict(const char * source,char * dest,int compressedSize,int maxOutputSize,const void * dictStart,size_t dictSize)510*4882a593Smuzhiyun int LZ4_decompress_safe_forceExtDict(const char *source, char *dest,
511*4882a593Smuzhiyun int compressedSize, int maxOutputSize,
512*4882a593Smuzhiyun const void *dictStart, size_t dictSize)
513*4882a593Smuzhiyun {
514*4882a593Smuzhiyun return LZ4_decompress_generic(source, dest,
515*4882a593Smuzhiyun compressedSize, maxOutputSize,
516*4882a593Smuzhiyun endOnInputSize, decode_full_block,
517*4882a593Smuzhiyun usingExtDict, (BYTE *)dest,
518*4882a593Smuzhiyun (const BYTE *)dictStart, dictSize);
519*4882a593Smuzhiyun }
520*4882a593Smuzhiyun
LZ4_decompress_fast_extDict(const char * source,char * dest,int originalSize,const void * dictStart,size_t dictSize)521*4882a593Smuzhiyun static int LZ4_decompress_fast_extDict(const char *source, char *dest,
522*4882a593Smuzhiyun int originalSize,
523*4882a593Smuzhiyun const void *dictStart, size_t dictSize)
524*4882a593Smuzhiyun {
525*4882a593Smuzhiyun return LZ4_decompress_generic(source, dest,
526*4882a593Smuzhiyun 0, originalSize,
527*4882a593Smuzhiyun endOnOutputSize, decode_full_block,
528*4882a593Smuzhiyun usingExtDict, (BYTE *)dest,
529*4882a593Smuzhiyun (const BYTE *)dictStart, dictSize);
530*4882a593Smuzhiyun }
531*4882a593Smuzhiyun
532*4882a593Smuzhiyun /*
533*4882a593Smuzhiyun * The "double dictionary" mode, for use with e.g. ring buffers: the first part
534*4882a593Smuzhiyun * of the dictionary is passed as prefix, and the second via dictStart + dictSize.
535*4882a593Smuzhiyun * These routines are used only once, in LZ4_decompress_*_continue().
536*4882a593Smuzhiyun */
537*4882a593Smuzhiyun static FORCE_INLINE
LZ4_decompress_safe_doubleDict(const char * source,char * dest,int compressedSize,int maxOutputSize,size_t prefixSize,const void * dictStart,size_t dictSize)538*4882a593Smuzhiyun int LZ4_decompress_safe_doubleDict(const char *source, char *dest,
539*4882a593Smuzhiyun int compressedSize, int maxOutputSize,
540*4882a593Smuzhiyun size_t prefixSize,
541*4882a593Smuzhiyun const void *dictStart, size_t dictSize)
542*4882a593Smuzhiyun {
543*4882a593Smuzhiyun return LZ4_decompress_generic(source, dest,
544*4882a593Smuzhiyun compressedSize, maxOutputSize,
545*4882a593Smuzhiyun endOnInputSize, decode_full_block,
546*4882a593Smuzhiyun usingExtDict, (BYTE *)dest - prefixSize,
547*4882a593Smuzhiyun (const BYTE *)dictStart, dictSize);
548*4882a593Smuzhiyun }
549*4882a593Smuzhiyun
550*4882a593Smuzhiyun static FORCE_INLINE
LZ4_decompress_fast_doubleDict(const char * source,char * dest,int originalSize,size_t prefixSize,const void * dictStart,size_t dictSize)551*4882a593Smuzhiyun int LZ4_decompress_fast_doubleDict(const char *source, char *dest,
552*4882a593Smuzhiyun int originalSize, size_t prefixSize,
553*4882a593Smuzhiyun const void *dictStart, size_t dictSize)
554*4882a593Smuzhiyun {
555*4882a593Smuzhiyun return LZ4_decompress_generic(source, dest,
556*4882a593Smuzhiyun 0, originalSize,
557*4882a593Smuzhiyun endOnOutputSize, decode_full_block,
558*4882a593Smuzhiyun usingExtDict, (BYTE *)dest - prefixSize,
559*4882a593Smuzhiyun (const BYTE *)dictStart, dictSize);
560*4882a593Smuzhiyun }
561*4882a593Smuzhiyun
562*4882a593Smuzhiyun /* ===== streaming decompression functions ===== */
563*4882a593Smuzhiyun
/*
 * LZ4_setStreamDecode() - (re)initialise a streaming decode state.
 * @LZ4_streamDecode: state to initialise
 * @dictionary: start of the data to use as prefix; may be NULL when
 *	@dictSize is 0
 * @dictSize: size of that data in bytes
 *
 * Records @dictionary/@dictSize as the current prefix (prefixEnd points one
 * past its last byte) and clears any external dictionary.
 *
 * Return: always 1.
 */
int LZ4_setStreamDecode(LZ4_streamDecode_t *LZ4_streamDecode,
	const char *dictionary, int dictSize)
{
	LZ4_streamDecode_t_internal *lz4sd =
		&LZ4_streamDecode->internal_donotuse;

	lz4sd->prefixSize = (size_t) dictSize;
	/*
	 * Skip the pointer arithmetic when there is no dictionary: adding
	 * to a NULL pointer is undefined behaviour in C, even for 0.
	 */
	if (dictSize)
		lz4sd->prefixEnd = (const BYTE *) dictionary + dictSize;
	else
		lz4sd->prefixEnd = (const BYTE *) dictionary;
	lz4sd->externalDict = NULL;
	lz4sd->extDictSize = 0;
	return 1;
}
576*4882a593Smuzhiyun
577*4882a593Smuzhiyun /*
578*4882a593Smuzhiyun * *_continue() :
579*4882a593Smuzhiyun * These decoding functions allow decompression of multiple blocks
580*4882a593Smuzhiyun * in "streaming" mode.
581*4882a593Smuzhiyun * Previously decoded blocks must still be available at the memory
582*4882a593Smuzhiyun * position where they were decoded.
583*4882a593Smuzhiyun * If it's not possible, save the relevant part of
584*4882a593Smuzhiyun * decoded data into a safe buffer,
585*4882a593Smuzhiyun * and indicate where it stands using LZ4_setStreamDecode()
586*4882a593Smuzhiyun */
/*
 * LZ4_decompress_safe_continue() - decode the next block of a stream (safe mode).
 * @LZ4_streamDecode: streaming state, updated on success
 * @source: compressed block
 * @dest: output buffer
 * @compressedSize: number of bytes available at @source
 * @maxOutputSize: capacity of @dest
 *
 * Three situations are distinguished from the recorded state:
 *  - no prefix yet: plain LZ4_decompress_safe();
 *  - @dest directly follows the recorded prefix: decode with that prefix
 *    (64 KB variant, small-prefix variant, or prefix + external dictionary);
 *  - anything else: the recorded prefix becomes the external dictionary and
 *    @dest starts a new prefix.
 *
 * Return: the number of bytes decoded into @dest, or the decoder's
 * non-positive result unchanged on failure (the prefix fields are then left
 * untouched).
 */
int LZ4_decompress_safe_continue(LZ4_streamDecode_t *LZ4_streamDecode,
	const char *source, char *dest, int compressedSize, int maxOutputSize)
{
	LZ4_streamDecode_t_internal * const state =
		&LZ4_streamDecode->internal_donotuse;
	BYTE * const out = (BYTE *)dest;
	const int firstBlock = (state->prefixSize == 0);
	const int contiguous = !firstBlock && (state->prefixEnd == out);
	int decoded;

	if (firstBlock) {
		/* The first call, no dictionary yet. */
		assert(state->extDictSize == 0);
		decoded = LZ4_decompress_safe(source, dest,
					      compressedSize, maxOutputSize);
	} else if (contiguous) {
		/* The caller keeps appending to the current segment. */
		if (state->prefixSize >= 64 * KB - 1) {
			decoded = LZ4_decompress_safe_withPrefix64k(source,
					dest, compressedSize, maxOutputSize);
		} else if (state->extDictSize == 0) {
			decoded = LZ4_decompress_safe_withSmallPrefix(source,
					dest, compressedSize, maxOutputSize,
					state->prefixSize);
		} else {
			decoded = LZ4_decompress_safe_doubleDict(source, dest,
					compressedSize, maxOutputSize,
					state->prefixSize,
					state->externalDict,
					state->extDictSize);
		}
	} else {
		/*
		 * The buffer wrapped around, or the caller switched to
		 * another buffer: the old prefix is demoted to external
		 * dictionary before decoding.
		 */
		state->extDictSize = state->prefixSize;
		state->externalDict = state->prefixEnd - state->extDictSize;
		decoded = LZ4_decompress_safe_forceExtDict(source, dest,
					compressedSize, maxOutputSize,
					state->externalDict,
					state->extDictSize);
	}

	if (decoded <= 0)
		return decoded;

	if (contiguous) {
		/* Extend the existing prefix by the freshly decoded bytes. */
		state->prefixSize += decoded;
		state->prefixEnd += decoded;
	} else {
		/* The decoded block becomes the new prefix. */
		state->prefixSize = decoded;
		state->prefixEnd = out + decoded;
	}

	return decoded;
}
639*4882a593Smuzhiyun
/*
 * LZ4_decompress_fast_continue() - decode the next block of a stream (fast mode).
 * @LZ4_streamDecode: streaming state, updated on success
 * @source: compressed block
 * @dest: output buffer
 * @originalSize: exact number of bytes to produce
 *
 * Mirrors LZ4_decompress_safe_continue(), using the output-bounded decoders.
 * On success the prefix bookkeeping advances by @originalSize.
 *
 * Return: the decoder's result (bytes read from @source), or its
 * non-positive result unchanged on failure (the prefix fields are then left
 * untouched).
 */
int LZ4_decompress_fast_continue(LZ4_streamDecode_t *LZ4_streamDecode,
	const char *source, char *dest, int originalSize)
{
	LZ4_streamDecode_t_internal * const state =
		&LZ4_streamDecode->internal_donotuse;
	BYTE * const out = (BYTE *)dest;
	const int firstBlock = (state->prefixSize == 0);
	const int contiguous = !firstBlock && (state->prefixEnd == out);
	int consumed;

	if (firstBlock) {
		/* First block of the stream: nothing to refer back to. */
		assert(state->extDictSize == 0);
		consumed = LZ4_decompress_fast(source, dest, originalSize);
	} else if (contiguous) {
		/*
		 * Appending to the current segment. The external dictionary
		 * is only consulted when one exists and the prefix is still
		 * shorter than 64 KB - 1.
		 */
		const int useExtDict = (state->prefixSize < 64 * KB - 1) &&
				       (state->extDictSize != 0);

		if (useExtDict) {
			consumed = LZ4_decompress_fast_doubleDict(source, dest,
					originalSize, state->prefixSize,
					state->externalDict,
					state->extDictSize);
		} else {
			consumed = LZ4_decompress_fast(source, dest,
						       originalSize);
		}
	} else {
		/* New output location: the old prefix becomes the dictionary. */
		state->extDictSize = state->prefixSize;
		state->externalDict = state->prefixEnd - state->extDictSize;
		consumed = LZ4_decompress_fast_extDict(source, dest,
					originalSize,
					state->externalDict,
					state->extDictSize);
	}

	if (consumed <= 0)
		return consumed;

	if (contiguous) {
		state->prefixSize += originalSize;
		state->prefixEnd += originalSize;
	} else {
		state->prefixSize = originalSize;
		state->prefixEnd = out + originalSize;
	}

	return consumed;
}
678*4882a593Smuzhiyun
LZ4_decompress_safe_usingDict(const char * source,char * dest,int compressedSize,int maxOutputSize,const char * dictStart,int dictSize)679*4882a593Smuzhiyun int LZ4_decompress_safe_usingDict(const char *source, char *dest,
680*4882a593Smuzhiyun int compressedSize, int maxOutputSize,
681*4882a593Smuzhiyun const char *dictStart, int dictSize)
682*4882a593Smuzhiyun {
683*4882a593Smuzhiyun if (dictSize == 0)
684*4882a593Smuzhiyun return LZ4_decompress_safe(source, dest,
685*4882a593Smuzhiyun compressedSize, maxOutputSize);
686*4882a593Smuzhiyun if (dictStart+dictSize == dest) {
687*4882a593Smuzhiyun if (dictSize >= 64 * KB - 1)
688*4882a593Smuzhiyun return LZ4_decompress_safe_withPrefix64k(source, dest,
689*4882a593Smuzhiyun compressedSize, maxOutputSize);
690*4882a593Smuzhiyun return LZ4_decompress_safe_withSmallPrefix(source, dest,
691*4882a593Smuzhiyun compressedSize, maxOutputSize, dictSize);
692*4882a593Smuzhiyun }
693*4882a593Smuzhiyun return LZ4_decompress_safe_forceExtDict(source, dest,
694*4882a593Smuzhiyun compressedSize, maxOutputSize, dictStart, dictSize);
695*4882a593Smuzhiyun }
696*4882a593Smuzhiyun
/*
 * LZ4_decompress_fast_usingDict() - one-shot "fast" decode with an
 * optional dictionary.
 *
 * @source: compressed input
 * @dest: output buffer
 * @originalSize: handed unchanged to the selected decoder
 * @dictStart: start of the dictionary; only used when @dictSize != 0
 * @dictSize: dictionary size; 0 means no dictionary
 *
 * The extDict decoder is used only when a dictionary is present and it
 * does not end exactly at @dest; in every other case the plain
 * LZ4_decompress_fast() is called.
 *
 * Return: the value returned by the selected decoder.
 */
int LZ4_decompress_fast_usingDict(const char *source, char *dest,
	int originalSize,
	const char *dictStart, int dictSize)
{
	/* dictSize is tested first so the pointer sum is skipped when it is 0 */
	const int detached_dict =
		dictSize != 0 && dictStart + dictSize != dest;

	if (detached_dict)
		return LZ4_decompress_fast_extDict(source, dest, originalSize,
			dictStart, dictSize);

	return LZ4_decompress_fast(source, dest, originalSize);
}
707*4882a593Smuzhiyun
708*4882a593Smuzhiyun #ifndef STATIC
709*4882a593Smuzhiyun EXPORT_SYMBOL(LZ4_decompress_safe);
710*4882a593Smuzhiyun EXPORT_SYMBOL(LZ4_decompress_safe_partial);
711*4882a593Smuzhiyun EXPORT_SYMBOL(LZ4_decompress_fast);
712*4882a593Smuzhiyun EXPORT_SYMBOL(LZ4_setStreamDecode);
713*4882a593Smuzhiyun EXPORT_SYMBOL(LZ4_decompress_safe_continue);
714*4882a593Smuzhiyun EXPORT_SYMBOL(LZ4_decompress_fast_continue);
715*4882a593Smuzhiyun EXPORT_SYMBOL(LZ4_decompress_safe_usingDict);
716*4882a593Smuzhiyun EXPORT_SYMBOL(LZ4_decompress_fast_usingDict);
717*4882a593Smuzhiyun
718*4882a593Smuzhiyun MODULE_LICENSE("Dual BSD/GPL");
719*4882a593Smuzhiyun MODULE_DESCRIPTION("LZ4 decompressor");
720*4882a593Smuzhiyun #endif
721