xref: /OK3568_Linux_fs/kernel/lib/zstd/zstd_opt.h (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun /**
2*4882a593Smuzhiyun  * Copyright (c) 2016-present, Przemyslaw Skibinski, Yann Collet, Facebook, Inc.
3*4882a593Smuzhiyun  * All rights reserved.
4*4882a593Smuzhiyun  *
5*4882a593Smuzhiyun  * This source code is licensed under the BSD-style license found in the
6*4882a593Smuzhiyun  * LICENSE file in the root directory of https://github.com/facebook/zstd.
7*4882a593Smuzhiyun  * An additional grant of patent rights can be found in the PATENTS file in the
8*4882a593Smuzhiyun  * same directory.
9*4882a593Smuzhiyun  *
10*4882a593Smuzhiyun  * This program is free software; you can redistribute it and/or modify it under
11*4882a593Smuzhiyun  * the terms of the GNU General Public License version 2 as published by the
12*4882a593Smuzhiyun  * Free Software Foundation. This program is dual-licensed; you may select
13*4882a593Smuzhiyun  * either version 2 of the GNU General Public License ("GPL") or BSD license
14*4882a593Smuzhiyun  * ("BSD").
15*4882a593Smuzhiyun  */
16*4882a593Smuzhiyun 
17*4882a593Smuzhiyun /* Note : this file is intended to be included within zstd_compress.c */
18*4882a593Smuzhiyun 
19*4882a593Smuzhiyun #ifndef ZSTD_OPT_H_91842398743
20*4882a593Smuzhiyun #define ZSTD_OPT_H_91842398743
21*4882a593Smuzhiyun 
22*4882a593Smuzhiyun #define ZSTD_LITFREQ_ADD 2
23*4882a593Smuzhiyun #define ZSTD_FREQ_DIV 4
24*4882a593Smuzhiyun #define ZSTD_MAX_PRICE (1 << 30)
25*4882a593Smuzhiyun 
26*4882a593Smuzhiyun /*-*************************************
27*4882a593Smuzhiyun *  Price functions for optimal parser
28*4882a593Smuzhiyun ***************************************/
ZSTD_setLog2Prices(seqStore_t * ssPtr)29*4882a593Smuzhiyun FORCE_INLINE void ZSTD_setLog2Prices(seqStore_t *ssPtr)
30*4882a593Smuzhiyun {
31*4882a593Smuzhiyun 	ssPtr->log2matchLengthSum = ZSTD_highbit32(ssPtr->matchLengthSum + 1);
32*4882a593Smuzhiyun 	ssPtr->log2litLengthSum = ZSTD_highbit32(ssPtr->litLengthSum + 1);
33*4882a593Smuzhiyun 	ssPtr->log2litSum = ZSTD_highbit32(ssPtr->litSum + 1);
34*4882a593Smuzhiyun 	ssPtr->log2offCodeSum = ZSTD_highbit32(ssPtr->offCodeSum + 1);
35*4882a593Smuzhiyun 	ssPtr->factor = 1 + ((ssPtr->litSum >> 5) / ssPtr->litLengthSum) + ((ssPtr->litSum << 1) / (ssPtr->litSum + ssPtr->matchSum));
36*4882a593Smuzhiyun }
37*4882a593Smuzhiyun 
ZSTD_rescaleFreqs(seqStore_t * ssPtr,const BYTE * src,size_t srcSize)38*4882a593Smuzhiyun ZSTD_STATIC void ZSTD_rescaleFreqs(seqStore_t *ssPtr, const BYTE *src, size_t srcSize)
39*4882a593Smuzhiyun {
40*4882a593Smuzhiyun 	unsigned u;
41*4882a593Smuzhiyun 
42*4882a593Smuzhiyun 	ssPtr->cachedLiterals = NULL;
43*4882a593Smuzhiyun 	ssPtr->cachedPrice = ssPtr->cachedLitLength = 0;
44*4882a593Smuzhiyun 	ssPtr->staticPrices = 0;
45*4882a593Smuzhiyun 
46*4882a593Smuzhiyun 	if (ssPtr->litLengthSum == 0) {
47*4882a593Smuzhiyun 		if (srcSize <= 1024)
48*4882a593Smuzhiyun 			ssPtr->staticPrices = 1;
49*4882a593Smuzhiyun 
50*4882a593Smuzhiyun 		for (u = 0; u <= MaxLit; u++)
51*4882a593Smuzhiyun 			ssPtr->litFreq[u] = 0;
52*4882a593Smuzhiyun 		for (u = 0; u < srcSize; u++)
53*4882a593Smuzhiyun 			ssPtr->litFreq[src[u]]++;
54*4882a593Smuzhiyun 
55*4882a593Smuzhiyun 		ssPtr->litSum = 0;
56*4882a593Smuzhiyun 		ssPtr->litLengthSum = MaxLL + 1;
57*4882a593Smuzhiyun 		ssPtr->matchLengthSum = MaxML + 1;
58*4882a593Smuzhiyun 		ssPtr->offCodeSum = (MaxOff + 1);
59*4882a593Smuzhiyun 		ssPtr->matchSum = (ZSTD_LITFREQ_ADD << Litbits);
60*4882a593Smuzhiyun 
61*4882a593Smuzhiyun 		for (u = 0; u <= MaxLit; u++) {
62*4882a593Smuzhiyun 			ssPtr->litFreq[u] = 1 + (ssPtr->litFreq[u] >> ZSTD_FREQ_DIV);
63*4882a593Smuzhiyun 			ssPtr->litSum += ssPtr->litFreq[u];
64*4882a593Smuzhiyun 		}
65*4882a593Smuzhiyun 		for (u = 0; u <= MaxLL; u++)
66*4882a593Smuzhiyun 			ssPtr->litLengthFreq[u] = 1;
67*4882a593Smuzhiyun 		for (u = 0; u <= MaxML; u++)
68*4882a593Smuzhiyun 			ssPtr->matchLengthFreq[u] = 1;
69*4882a593Smuzhiyun 		for (u = 0; u <= MaxOff; u++)
70*4882a593Smuzhiyun 			ssPtr->offCodeFreq[u] = 1;
71*4882a593Smuzhiyun 	} else {
72*4882a593Smuzhiyun 		ssPtr->matchLengthSum = 0;
73*4882a593Smuzhiyun 		ssPtr->litLengthSum = 0;
74*4882a593Smuzhiyun 		ssPtr->offCodeSum = 0;
75*4882a593Smuzhiyun 		ssPtr->matchSum = 0;
76*4882a593Smuzhiyun 		ssPtr->litSum = 0;
77*4882a593Smuzhiyun 
78*4882a593Smuzhiyun 		for (u = 0; u <= MaxLit; u++) {
79*4882a593Smuzhiyun 			ssPtr->litFreq[u] = 1 + (ssPtr->litFreq[u] >> (ZSTD_FREQ_DIV + 1));
80*4882a593Smuzhiyun 			ssPtr->litSum += ssPtr->litFreq[u];
81*4882a593Smuzhiyun 		}
82*4882a593Smuzhiyun 		for (u = 0; u <= MaxLL; u++) {
83*4882a593Smuzhiyun 			ssPtr->litLengthFreq[u] = 1 + (ssPtr->litLengthFreq[u] >> (ZSTD_FREQ_DIV + 1));
84*4882a593Smuzhiyun 			ssPtr->litLengthSum += ssPtr->litLengthFreq[u];
85*4882a593Smuzhiyun 		}
86*4882a593Smuzhiyun 		for (u = 0; u <= MaxML; u++) {
87*4882a593Smuzhiyun 			ssPtr->matchLengthFreq[u] = 1 + (ssPtr->matchLengthFreq[u] >> ZSTD_FREQ_DIV);
88*4882a593Smuzhiyun 			ssPtr->matchLengthSum += ssPtr->matchLengthFreq[u];
89*4882a593Smuzhiyun 			ssPtr->matchSum += ssPtr->matchLengthFreq[u] * (u + 3);
90*4882a593Smuzhiyun 		}
91*4882a593Smuzhiyun 		ssPtr->matchSum *= ZSTD_LITFREQ_ADD;
92*4882a593Smuzhiyun 		for (u = 0; u <= MaxOff; u++) {
93*4882a593Smuzhiyun 			ssPtr->offCodeFreq[u] = 1 + (ssPtr->offCodeFreq[u] >> ZSTD_FREQ_DIV);
94*4882a593Smuzhiyun 			ssPtr->offCodeSum += ssPtr->offCodeFreq[u];
95*4882a593Smuzhiyun 		}
96*4882a593Smuzhiyun 	}
97*4882a593Smuzhiyun 
98*4882a593Smuzhiyun 	ZSTD_setLog2Prices(ssPtr);
99*4882a593Smuzhiyun }
100*4882a593Smuzhiyun 
ZSTD_getLiteralPrice(seqStore_t * ssPtr,U32 litLength,const BYTE * literals)101*4882a593Smuzhiyun FORCE_INLINE U32 ZSTD_getLiteralPrice(seqStore_t *ssPtr, U32 litLength, const BYTE *literals)
102*4882a593Smuzhiyun {
103*4882a593Smuzhiyun 	U32 price, u;
104*4882a593Smuzhiyun 
105*4882a593Smuzhiyun 	if (ssPtr->staticPrices)
106*4882a593Smuzhiyun 		return ZSTD_highbit32((U32)litLength + 1) + (litLength * 6);
107*4882a593Smuzhiyun 
108*4882a593Smuzhiyun 	if (litLength == 0)
109*4882a593Smuzhiyun 		return ssPtr->log2litLengthSum - ZSTD_highbit32(ssPtr->litLengthFreq[0] + 1);
110*4882a593Smuzhiyun 
111*4882a593Smuzhiyun 	/* literals */
112*4882a593Smuzhiyun 	if (ssPtr->cachedLiterals == literals) {
113*4882a593Smuzhiyun 		U32 const additional = litLength - ssPtr->cachedLitLength;
114*4882a593Smuzhiyun 		const BYTE *literals2 = ssPtr->cachedLiterals + ssPtr->cachedLitLength;
115*4882a593Smuzhiyun 		price = ssPtr->cachedPrice + additional * ssPtr->log2litSum;
116*4882a593Smuzhiyun 		for (u = 0; u < additional; u++)
117*4882a593Smuzhiyun 			price -= ZSTD_highbit32(ssPtr->litFreq[literals2[u]] + 1);
118*4882a593Smuzhiyun 		ssPtr->cachedPrice = price;
119*4882a593Smuzhiyun 		ssPtr->cachedLitLength = litLength;
120*4882a593Smuzhiyun 	} else {
121*4882a593Smuzhiyun 		price = litLength * ssPtr->log2litSum;
122*4882a593Smuzhiyun 		for (u = 0; u < litLength; u++)
123*4882a593Smuzhiyun 			price -= ZSTD_highbit32(ssPtr->litFreq[literals[u]] + 1);
124*4882a593Smuzhiyun 
125*4882a593Smuzhiyun 		if (litLength >= 12) {
126*4882a593Smuzhiyun 			ssPtr->cachedLiterals = literals;
127*4882a593Smuzhiyun 			ssPtr->cachedPrice = price;
128*4882a593Smuzhiyun 			ssPtr->cachedLitLength = litLength;
129*4882a593Smuzhiyun 		}
130*4882a593Smuzhiyun 	}
131*4882a593Smuzhiyun 
132*4882a593Smuzhiyun 	/* literal Length */
133*4882a593Smuzhiyun 	{
134*4882a593Smuzhiyun 		const BYTE LL_deltaCode = 19;
135*4882a593Smuzhiyun 		const BYTE llCode = (litLength > 63) ? (BYTE)ZSTD_highbit32(litLength) + LL_deltaCode : LL_Code[litLength];
136*4882a593Smuzhiyun 		price += LL_bits[llCode] + ssPtr->log2litLengthSum - ZSTD_highbit32(ssPtr->litLengthFreq[llCode] + 1);
137*4882a593Smuzhiyun 	}
138*4882a593Smuzhiyun 
139*4882a593Smuzhiyun 	return price;
140*4882a593Smuzhiyun }
141*4882a593Smuzhiyun 
ZSTD_getPrice(seqStore_t * seqStorePtr,U32 litLength,const BYTE * literals,U32 offset,U32 matchLength,const int ultra)142*4882a593Smuzhiyun FORCE_INLINE U32 ZSTD_getPrice(seqStore_t *seqStorePtr, U32 litLength, const BYTE *literals, U32 offset, U32 matchLength, const int ultra)
143*4882a593Smuzhiyun {
144*4882a593Smuzhiyun 	/* offset */
145*4882a593Smuzhiyun 	U32 price;
146*4882a593Smuzhiyun 	BYTE const offCode = (BYTE)ZSTD_highbit32(offset + 1);
147*4882a593Smuzhiyun 
148*4882a593Smuzhiyun 	if (seqStorePtr->staticPrices)
149*4882a593Smuzhiyun 		return ZSTD_getLiteralPrice(seqStorePtr, litLength, literals) + ZSTD_highbit32((U32)matchLength + 1) + 16 + offCode;
150*4882a593Smuzhiyun 
151*4882a593Smuzhiyun 	price = offCode + seqStorePtr->log2offCodeSum - ZSTD_highbit32(seqStorePtr->offCodeFreq[offCode] + 1);
152*4882a593Smuzhiyun 	if (!ultra && offCode >= 20)
153*4882a593Smuzhiyun 		price += (offCode - 19) * 2;
154*4882a593Smuzhiyun 
155*4882a593Smuzhiyun 	/* match Length */
156*4882a593Smuzhiyun 	{
157*4882a593Smuzhiyun 		const BYTE ML_deltaCode = 36;
158*4882a593Smuzhiyun 		const BYTE mlCode = (matchLength > 127) ? (BYTE)ZSTD_highbit32(matchLength) + ML_deltaCode : ML_Code[matchLength];
159*4882a593Smuzhiyun 		price += ML_bits[mlCode] + seqStorePtr->log2matchLengthSum - ZSTD_highbit32(seqStorePtr->matchLengthFreq[mlCode] + 1);
160*4882a593Smuzhiyun 	}
161*4882a593Smuzhiyun 
162*4882a593Smuzhiyun 	return price + ZSTD_getLiteralPrice(seqStorePtr, litLength, literals) + seqStorePtr->factor;
163*4882a593Smuzhiyun }
164*4882a593Smuzhiyun 
ZSTD_updatePrice(seqStore_t * seqStorePtr,U32 litLength,const BYTE * literals,U32 offset,U32 matchLength)165*4882a593Smuzhiyun ZSTD_STATIC void ZSTD_updatePrice(seqStore_t *seqStorePtr, U32 litLength, const BYTE *literals, U32 offset, U32 matchLength)
166*4882a593Smuzhiyun {
167*4882a593Smuzhiyun 	U32 u;
168*4882a593Smuzhiyun 
169*4882a593Smuzhiyun 	/* literals */
170*4882a593Smuzhiyun 	seqStorePtr->litSum += litLength * ZSTD_LITFREQ_ADD;
171*4882a593Smuzhiyun 	for (u = 0; u < litLength; u++)
172*4882a593Smuzhiyun 		seqStorePtr->litFreq[literals[u]] += ZSTD_LITFREQ_ADD;
173*4882a593Smuzhiyun 
174*4882a593Smuzhiyun 	/* literal Length */
175*4882a593Smuzhiyun 	{
176*4882a593Smuzhiyun 		const BYTE LL_deltaCode = 19;
177*4882a593Smuzhiyun 		const BYTE llCode = (litLength > 63) ? (BYTE)ZSTD_highbit32(litLength) + LL_deltaCode : LL_Code[litLength];
178*4882a593Smuzhiyun 		seqStorePtr->litLengthFreq[llCode]++;
179*4882a593Smuzhiyun 		seqStorePtr->litLengthSum++;
180*4882a593Smuzhiyun 	}
181*4882a593Smuzhiyun 
182*4882a593Smuzhiyun 	/* match offset */
183*4882a593Smuzhiyun 	{
184*4882a593Smuzhiyun 		BYTE const offCode = (BYTE)ZSTD_highbit32(offset + 1);
185*4882a593Smuzhiyun 		seqStorePtr->offCodeSum++;
186*4882a593Smuzhiyun 		seqStorePtr->offCodeFreq[offCode]++;
187*4882a593Smuzhiyun 	}
188*4882a593Smuzhiyun 
189*4882a593Smuzhiyun 	/* match Length */
190*4882a593Smuzhiyun 	{
191*4882a593Smuzhiyun 		const BYTE ML_deltaCode = 36;
192*4882a593Smuzhiyun 		const BYTE mlCode = (matchLength > 127) ? (BYTE)ZSTD_highbit32(matchLength) + ML_deltaCode : ML_Code[matchLength];
193*4882a593Smuzhiyun 		seqStorePtr->matchLengthFreq[mlCode]++;
194*4882a593Smuzhiyun 		seqStorePtr->matchLengthSum++;
195*4882a593Smuzhiyun 	}
196*4882a593Smuzhiyun 
197*4882a593Smuzhiyun 	ZSTD_setLog2Prices(seqStorePtr);
198*4882a593Smuzhiyun }
199*4882a593Smuzhiyun 
/*
 * SET_PRICE() : store (mlen_, offset_, litlen_, price_) into opt[pos].
 *
 * Relies on two names from the caller's scope : the `opt` table and the
 * `last_pos` counter. While last_pos < pos, the slot opt[last_pos + 1] gets
 * ZSTD_MAX_PRICE and last_pos is advanced, so on exit last_pos >= pos.
 *
 * Wrapped in do { } while (0) so it behaves as a single statement (safe in
 * an unbraced if / else); every argument is parenthesized.
 * Note : `pos` is evaluated several times, so it must have no side effects.
 */
#define SET_PRICE(pos, mlen_, offset_, litlen_, price_)           \
	do {                                                      \
		while (last_pos < (pos)) {                        \
			opt[last_pos + 1].price = ZSTD_MAX_PRICE; \
			last_pos++;                               \
		}                                                 \
		opt[(pos)].mlen = (mlen_);                        \
		opt[(pos)].off = (offset_);                       \
		opt[(pos)].litlen = (litlen_);                    \
		opt[(pos)].price = (price_);                      \
	} while (0)
211*4882a593Smuzhiyun 
212*4882a593Smuzhiyun /* Update hashTable3 up to ip (excluded)
213*4882a593Smuzhiyun    Assumption : always within prefix (i.e. not within extDict) */
214*4882a593Smuzhiyun FORCE_INLINE
ZSTD_insertAndFindFirstIndexHash3(ZSTD_CCtx * zc,const BYTE * ip)215*4882a593Smuzhiyun U32 ZSTD_insertAndFindFirstIndexHash3(ZSTD_CCtx *zc, const BYTE *ip)
216*4882a593Smuzhiyun {
217*4882a593Smuzhiyun 	U32 *const hashTable3 = zc->hashTable3;
218*4882a593Smuzhiyun 	U32 const hashLog3 = zc->hashLog3;
219*4882a593Smuzhiyun 	const BYTE *const base = zc->base;
220*4882a593Smuzhiyun 	U32 idx = zc->nextToUpdate3;
221*4882a593Smuzhiyun 	const U32 target = zc->nextToUpdate3 = (U32)(ip - base);
222*4882a593Smuzhiyun 	const size_t hash3 = ZSTD_hash3Ptr(ip, hashLog3);
223*4882a593Smuzhiyun 
224*4882a593Smuzhiyun 	while (idx < target) {
225*4882a593Smuzhiyun 		hashTable3[ZSTD_hash3Ptr(base + idx, hashLog3)] = idx;
226*4882a593Smuzhiyun 		idx++;
227*4882a593Smuzhiyun 	}
228*4882a593Smuzhiyun 
229*4882a593Smuzhiyun 	return hashTable3[hash3];
230*4882a593Smuzhiyun }
231*4882a593Smuzhiyun 
232*4882a593Smuzhiyun /*-*************************************
233*4882a593Smuzhiyun *  Binary Tree search
234*4882a593Smuzhiyun ***************************************/
/*
 * ZSTD_insertBtAndGetAllMatches() :
 * Insert position `ip` into the binary tree stored in zc->chainTable and
 * collect, in `matches`, every candidate strictly longer than the previous
 * best, so the stored lengths are increasing. The first accepted match must
 * be at least `minMatchLen` long.
 *
 * When mls == 3, a candidate from the 3-byte hash table is tried first.
 * With `extDict` set, candidates below dictLimit are read through dictBase.
 * At most `nbCompares` tree nodes are visited.
 *
 * Updates zc->nextToUpdate and returns the number of matches stored.
 */
static U32 ZSTD_insertBtAndGetAllMatches(ZSTD_CCtx *zc, const BYTE *const ip, const BYTE *const iLimit, U32 nbCompares, const U32 mls, U32 extDict,
					 ZSTD_match_t *matches, const U32 minMatchLen)
{
	/* window geometry */
	const BYTE *const base = zc->base;
	const U32 curr = (U32)(ip - base);
	const BYTE *const dictBase = zc->dictBase;
	const U32 dictLimit = zc->dictLimit;
	const BYTE *const dictEnd = dictBase + dictLimit;
	const BYTE *const prefixStart = base + dictLimit;
	const U32 windowLow = zc->lowLimit;

	/* hash table entry for ip */
	const U32 hashLog = zc->params.cParams.hashLog;
	const size_t slot = ZSTD_hashPtr(ip, hashLog, mls);
	U32 *const hashTable = zc->hashTable;
	U32 candidate = hashTable[slot];

	/* binary tree */
	U32 *const bt = zc->chainTable;
	const U32 btLog = zc->params.cParams.chainLog - 1;
	const U32 btMask = (1U << btLog) - 1;
	const U32 btLow = (btMask >= curr) ? 0 : curr - btMask;
	U32 *smallerPtr = bt + 2 * (curr & btMask);
	U32 *largerPtr = smallerPtr + 1;
	size_t sharedSmaller = 0, sharedLarger = 0;
	U32 dummy32; /* write sink, used once the search leaves the tree range */

	U32 matchEndIdx = curr + 8;
	size_t bestLength = minMatchLen - 1;
	U32 found = 0;

	if (mls == 3) { /* HC3 match finder */
		U32 const idx3 = ZSTD_insertAndFindFirstIndexHash3(zc, ip);

		if (idx3 > windowLow && (curr - idx3 < (1 << 18))) {
			const BYTE *match;
			size_t len3 = 0;

			if (extDict && idx3 < dictLimit) {
				match = dictBase + idx3;
				/* assumption : matchIndex3 <= dictLimit-4 (by table construction) */
				if (ZSTD_readMINMATCH(match, MINMATCH) == ZSTD_readMINMATCH(ip, MINMATCH))
					len3 = ZSTD_count_2segments(ip + MINMATCH, match + MINMATCH, iLimit, dictEnd, prefixStart) + MINMATCH;
			} else {
				match = base + idx3;
				if (match[bestLength] == ip[bestLength])
					len3 = ZSTD_count(ip, match, iLimit);
			}

			/* save best solution */
			if (len3 > bestLength) {
				bestLength = len3;
				matches[found].off = ZSTD_REP_MOVE_OPT + curr - idx3;
				matches[found].len = (U32)len3;
				found++;
				/* long enough, or best possible (also avoids read overflow) */
				if (len3 > ZSTD_OPT_NUM || ip + len3 == iLimit)
					goto update;
			}
		}
	}

	hashTable[slot] = curr; /* Update Hash Table */

	while (nbCompares-- && (candidate > windowLow)) {
		U32 *const node = bt + 2 * (candidate & btMask);
		size_t len = MIN(sharedSmaller, sharedLarger); /* guaranteed minimum nb of common bytes */
		const BYTE *match;

		if (extDict && (candidate + len < dictLimit)) {
			match = dictBase + candidate;
			len += ZSTD_count_2segments(ip + len, match + len, iLimit, dictEnd, prefixStart);
			if (candidate + len >= dictLimit)
				match = base + candidate; /* to prepare for next usage of match[len] */
		} else {
			match = base + candidate;
			if (match[len] == ip[len])
				len += ZSTD_count(ip + len + 1, match + len + 1, iLimit) + 1;
		}

		if (len > bestLength) {
			if (len > matchEndIdx - candidate)
				matchEndIdx = candidate + (U32)len;
			bestLength = len;
			matches[found].off = ZSTD_REP_MOVE_OPT + curr - candidate;
			matches[found].len = (U32)len;
			found++;
			/*
			 * Stop when long enough. Also stop when reaching iLimit :
			 * no way to know if inf or sup, so drop to guarantee
			 * consistency (miss a little bit of compression).
			 */
			if (len > ZSTD_OPT_NUM || ip + len == iLimit)
				break;
		}

		if (match[len] >= ip[len]) {
			/* match is larger than curr */
			*largerPtr = candidate;
			sharedLarger = len;
			if (candidate <= btLow) { /* beyond tree size, stop the search */
				largerPtr = &dummy32;
				break;
			}
			largerPtr = node;
			candidate = node[0];
		} else {
			/* match is smaller than curr */
			*smallerPtr = candidate; /* update smaller idx */
			sharedSmaller = len;	 /* all smaller will now have at least this guaranteed common length */
			if (candidate <= btLow) { /* beyond tree size, stop the search */
				smallerPtr = &dummy32;
				break;
			}
			smallerPtr = node + 1; /* new "smaller" => larger of match */
			candidate = node[1];   /* new candidate larger than previous (closer to curr) */
		}
	}

	/* terminate both open branches */
	*largerPtr = 0;
	*smallerPtr = 0;

update:
	if (matchEndIdx > curr + 8)
		zc->nextToUpdate = matchEndIdx - 8;
	else
		zc->nextToUpdate = curr + 1;
	return found;
}
354*4882a593Smuzhiyun 
355*4882a593Smuzhiyun /** Tree updater, providing best match */
ZSTD_BtGetAllMatches(ZSTD_CCtx * zc,const BYTE * const ip,const BYTE * const iLimit,const U32 maxNbAttempts,const U32 mls,ZSTD_match_t * matches,const U32 minMatchLen)356*4882a593Smuzhiyun static U32 ZSTD_BtGetAllMatches(ZSTD_CCtx *zc, const BYTE *const ip, const BYTE *const iLimit, const U32 maxNbAttempts, const U32 mls, ZSTD_match_t *matches,
357*4882a593Smuzhiyun 				const U32 minMatchLen)
358*4882a593Smuzhiyun {
359*4882a593Smuzhiyun 	if (ip < zc->base + zc->nextToUpdate)
360*4882a593Smuzhiyun 		return 0; /* skipped area */
361*4882a593Smuzhiyun 	ZSTD_updateTree(zc, ip, iLimit, maxNbAttempts, mls);
362*4882a593Smuzhiyun 	return ZSTD_insertBtAndGetAllMatches(zc, ip, iLimit, maxNbAttempts, mls, 0, matches, minMatchLen);
363*4882a593Smuzhiyun }
364*4882a593Smuzhiyun 
/*
 * ZSTD_BtGetAllMatches_selectMLS() :
 * Dispatch to ZSTD_BtGetAllMatches() with a literal `mls` argument.
 * 3 and 5 map to themselves, 6 and 7 both map to 6, and every other
 * value (including 4) maps to 4. The index tables of `zc` will be updated.
 */
static U32 ZSTD_BtGetAllMatches_selectMLS(ZSTD_CCtx *zc, /* Index table will be updated */
					  const BYTE *ip, const BYTE *const iHighLimit, const U32 maxNbAttempts, const U32 matchLengthSearch,
					  ZSTD_match_t *matches, const U32 minMatchLen)
{
	switch (matchLengthSearch) {
	case 3:
		return ZSTD_BtGetAllMatches(zc, ip, iHighLimit, maxNbAttempts, 3, matches, minMatchLen);
	case 5:
		return ZSTD_BtGetAllMatches(zc, ip, iHighLimit, maxNbAttempts, 5, matches, minMatchLen);
	case 6:
	case 7:
		return ZSTD_BtGetAllMatches(zc, ip, iHighLimit, maxNbAttempts, 6, matches, minMatchLen);
	case 4:
	default:
		return ZSTD_BtGetAllMatches(zc, ip, iHighLimit, maxNbAttempts, 4, matches, minMatchLen);
	}
}
378*4882a593Smuzhiyun 
379*4882a593Smuzhiyun /** Tree updater, providing best match */
ZSTD_BtGetAllMatches_extDict(ZSTD_CCtx * zc,const BYTE * const ip,const BYTE * const iLimit,const U32 maxNbAttempts,const U32 mls,ZSTD_match_t * matches,const U32 minMatchLen)380*4882a593Smuzhiyun static U32 ZSTD_BtGetAllMatches_extDict(ZSTD_CCtx *zc, const BYTE *const ip, const BYTE *const iLimit, const U32 maxNbAttempts, const U32 mls,
381*4882a593Smuzhiyun 					ZSTD_match_t *matches, const U32 minMatchLen)
382*4882a593Smuzhiyun {
383*4882a593Smuzhiyun 	if (ip < zc->base + zc->nextToUpdate)
384*4882a593Smuzhiyun 		return 0; /* skipped area */
385*4882a593Smuzhiyun 	ZSTD_updateTree_extDict(zc, ip, iLimit, maxNbAttempts, mls);
386*4882a593Smuzhiyun 	return ZSTD_insertBtAndGetAllMatches(zc, ip, iLimit, maxNbAttempts, mls, 1, matches, minMatchLen);
387*4882a593Smuzhiyun }
388*4882a593Smuzhiyun 
/*
 * ZSTD_BtGetAllMatches_selectMLS_extDict() :
 * Dispatch to ZSTD_BtGetAllMatches_extDict() with a literal `mls` argument.
 * 3 and 5 map to themselves, 6 and 7 both map to 6, and every other
 * value (including 4) maps to 4. The index tables of `zc` will be updated.
 */
static U32 ZSTD_BtGetAllMatches_selectMLS_extDict(ZSTD_CCtx *zc, /* Index table will be updated */
						  const BYTE *ip, const BYTE *const iHighLimit, const U32 maxNbAttempts, const U32 matchLengthSearch,
						  ZSTD_match_t *matches, const U32 minMatchLen)
{
	switch (matchLengthSearch) {
	case 3:
		return ZSTD_BtGetAllMatches_extDict(zc, ip, iHighLimit, maxNbAttempts, 3, matches, minMatchLen);
	case 5:
		return ZSTD_BtGetAllMatches_extDict(zc, ip, iHighLimit, maxNbAttempts, 5, matches, minMatchLen);
	case 6:
	case 7:
		return ZSTD_BtGetAllMatches_extDict(zc, ip, iHighLimit, maxNbAttempts, 6, matches, minMatchLen);
	case 4:
	default:
		return ZSTD_BtGetAllMatches_extDict(zc, ip, iHighLimit, maxNbAttempts, 4, matches, minMatchLen);
	}
}
402*4882a593Smuzhiyun 
403*4882a593Smuzhiyun /*-*******************************
404*4882a593Smuzhiyun *  Optimal parser
405*4882a593Smuzhiyun *********************************/
406*4882a593Smuzhiyun FORCE_INLINE
ZSTD_compressBlock_opt_generic(ZSTD_CCtx * ctx,const void * src,size_t srcSize,const int ultra)407*4882a593Smuzhiyun void ZSTD_compressBlock_opt_generic(ZSTD_CCtx *ctx, const void *src, size_t srcSize, const int ultra)
408*4882a593Smuzhiyun {
409*4882a593Smuzhiyun 	seqStore_t *seqStorePtr = &(ctx->seqStore);
410*4882a593Smuzhiyun 	const BYTE *const istart = (const BYTE *)src;
411*4882a593Smuzhiyun 	const BYTE *ip = istart;
412*4882a593Smuzhiyun 	const BYTE *anchor = istart;
413*4882a593Smuzhiyun 	const BYTE *const iend = istart + srcSize;
414*4882a593Smuzhiyun 	const BYTE *const ilimit = iend - 8;
415*4882a593Smuzhiyun 	const BYTE *const base = ctx->base;
416*4882a593Smuzhiyun 	const BYTE *const prefixStart = base + ctx->dictLimit;
417*4882a593Smuzhiyun 
418*4882a593Smuzhiyun 	const U32 maxSearches = 1U << ctx->params.cParams.searchLog;
419*4882a593Smuzhiyun 	const U32 sufficient_len = ctx->params.cParams.targetLength;
420*4882a593Smuzhiyun 	const U32 mls = ctx->params.cParams.searchLength;
421*4882a593Smuzhiyun 	const U32 minMatch = (ctx->params.cParams.searchLength == 3) ? 3 : 4;
422*4882a593Smuzhiyun 
423*4882a593Smuzhiyun 	ZSTD_optimal_t *opt = seqStorePtr->priceTable;
424*4882a593Smuzhiyun 	ZSTD_match_t *matches = seqStorePtr->matchTable;
425*4882a593Smuzhiyun 	const BYTE *inr;
426*4882a593Smuzhiyun 	U32 offset, rep[ZSTD_REP_NUM];
427*4882a593Smuzhiyun 
428*4882a593Smuzhiyun 	/* init */
429*4882a593Smuzhiyun 	ctx->nextToUpdate3 = ctx->nextToUpdate;
430*4882a593Smuzhiyun 	ZSTD_rescaleFreqs(seqStorePtr, (const BYTE *)src, srcSize);
431*4882a593Smuzhiyun 	ip += (ip == prefixStart);
432*4882a593Smuzhiyun 	{
433*4882a593Smuzhiyun 		U32 i;
434*4882a593Smuzhiyun 		for (i = 0; i < ZSTD_REP_NUM; i++)
435*4882a593Smuzhiyun 			rep[i] = ctx->rep[i];
436*4882a593Smuzhiyun 	}
437*4882a593Smuzhiyun 
438*4882a593Smuzhiyun 	/* Match Loop */
439*4882a593Smuzhiyun 	while (ip < ilimit) {
440*4882a593Smuzhiyun 		U32 cur, match_num, last_pos, litlen, price;
441*4882a593Smuzhiyun 		U32 u, mlen, best_mlen, best_off, litLength;
442*4882a593Smuzhiyun 		memset(opt, 0, sizeof(ZSTD_optimal_t));
443*4882a593Smuzhiyun 		last_pos = 0;
444*4882a593Smuzhiyun 		litlen = (U32)(ip - anchor);
445*4882a593Smuzhiyun 
446*4882a593Smuzhiyun 		/* check repCode */
447*4882a593Smuzhiyun 		{
448*4882a593Smuzhiyun 			U32 i, last_i = ZSTD_REP_CHECK + (ip == anchor);
449*4882a593Smuzhiyun 			for (i = (ip == anchor); i < last_i; i++) {
450*4882a593Smuzhiyun 				const S32 repCur = (i == ZSTD_REP_MOVE_OPT) ? (rep[0] - 1) : rep[i];
451*4882a593Smuzhiyun 				if ((repCur > 0) && (repCur < (S32)(ip - prefixStart)) &&
452*4882a593Smuzhiyun 				    (ZSTD_readMINMATCH(ip, minMatch) == ZSTD_readMINMATCH(ip - repCur, minMatch))) {
453*4882a593Smuzhiyun 					mlen = (U32)ZSTD_count(ip + minMatch, ip + minMatch - repCur, iend) + minMatch;
454*4882a593Smuzhiyun 					if (mlen > sufficient_len || mlen >= ZSTD_OPT_NUM) {
455*4882a593Smuzhiyun 						best_mlen = mlen;
456*4882a593Smuzhiyun 						best_off = i;
457*4882a593Smuzhiyun 						cur = 0;
458*4882a593Smuzhiyun 						last_pos = 1;
459*4882a593Smuzhiyun 						goto _storeSequence;
460*4882a593Smuzhiyun 					}
461*4882a593Smuzhiyun 					best_off = i - (ip == anchor);
462*4882a593Smuzhiyun 					do {
463*4882a593Smuzhiyun 						price = ZSTD_getPrice(seqStorePtr, litlen, anchor, best_off, mlen - MINMATCH, ultra);
464*4882a593Smuzhiyun 						if (mlen > last_pos || price < opt[mlen].price)
465*4882a593Smuzhiyun 							SET_PRICE(mlen, mlen, i, litlen, price); /* note : macro modifies last_pos */
466*4882a593Smuzhiyun 						mlen--;
467*4882a593Smuzhiyun 					} while (mlen >= minMatch);
468*4882a593Smuzhiyun 				}
469*4882a593Smuzhiyun 			}
470*4882a593Smuzhiyun 		}
471*4882a593Smuzhiyun 
472*4882a593Smuzhiyun 		match_num = ZSTD_BtGetAllMatches_selectMLS(ctx, ip, iend, maxSearches, mls, matches, minMatch);
473*4882a593Smuzhiyun 
474*4882a593Smuzhiyun 		if (!last_pos && !match_num) {
475*4882a593Smuzhiyun 			ip++;
476*4882a593Smuzhiyun 			continue;
477*4882a593Smuzhiyun 		}
478*4882a593Smuzhiyun 
479*4882a593Smuzhiyun 		if (match_num && (matches[match_num - 1].len > sufficient_len || matches[match_num - 1].len >= ZSTD_OPT_NUM)) {
480*4882a593Smuzhiyun 			best_mlen = matches[match_num - 1].len;
481*4882a593Smuzhiyun 			best_off = matches[match_num - 1].off;
482*4882a593Smuzhiyun 			cur = 0;
483*4882a593Smuzhiyun 			last_pos = 1;
484*4882a593Smuzhiyun 			goto _storeSequence;
485*4882a593Smuzhiyun 		}
486*4882a593Smuzhiyun 
487*4882a593Smuzhiyun 		/* set prices using matches at position = 0 */
488*4882a593Smuzhiyun 		best_mlen = (last_pos) ? last_pos : minMatch;
489*4882a593Smuzhiyun 		for (u = 0; u < match_num; u++) {
490*4882a593Smuzhiyun 			mlen = (u > 0) ? matches[u - 1].len + 1 : best_mlen;
491*4882a593Smuzhiyun 			best_mlen = matches[u].len;
492*4882a593Smuzhiyun 			while (mlen <= best_mlen) {
493*4882a593Smuzhiyun 				price = ZSTD_getPrice(seqStorePtr, litlen, anchor, matches[u].off - 1, mlen - MINMATCH, ultra);
494*4882a593Smuzhiyun 				if (mlen > last_pos || price < opt[mlen].price)
495*4882a593Smuzhiyun 					SET_PRICE(mlen, mlen, matches[u].off, litlen, price); /* note : macro modifies last_pos */
496*4882a593Smuzhiyun 				mlen++;
497*4882a593Smuzhiyun 			}
498*4882a593Smuzhiyun 		}
499*4882a593Smuzhiyun 
500*4882a593Smuzhiyun 		if (last_pos < minMatch) {
501*4882a593Smuzhiyun 			ip++;
502*4882a593Smuzhiyun 			continue;
503*4882a593Smuzhiyun 		}
504*4882a593Smuzhiyun 
505*4882a593Smuzhiyun 		/* initialize opt[0] */
506*4882a593Smuzhiyun 		{
507*4882a593Smuzhiyun 			U32 i;
508*4882a593Smuzhiyun 			for (i = 0; i < ZSTD_REP_NUM; i++)
509*4882a593Smuzhiyun 				opt[0].rep[i] = rep[i];
510*4882a593Smuzhiyun 		}
511*4882a593Smuzhiyun 		opt[0].mlen = 1;
512*4882a593Smuzhiyun 		opt[0].litlen = litlen;
513*4882a593Smuzhiyun 
514*4882a593Smuzhiyun 		/* check further positions */
515*4882a593Smuzhiyun 		for (cur = 1; cur <= last_pos; cur++) {
516*4882a593Smuzhiyun 			inr = ip + cur;
517*4882a593Smuzhiyun 
518*4882a593Smuzhiyun 			if (opt[cur - 1].mlen == 1) {
519*4882a593Smuzhiyun 				litlen = opt[cur - 1].litlen + 1;
520*4882a593Smuzhiyun 				if (cur > litlen) {
521*4882a593Smuzhiyun 					price = opt[cur - litlen].price + ZSTD_getLiteralPrice(seqStorePtr, litlen, inr - litlen);
522*4882a593Smuzhiyun 				} else
523*4882a593Smuzhiyun 					price = ZSTD_getLiteralPrice(seqStorePtr, litlen, anchor);
524*4882a593Smuzhiyun 			} else {
525*4882a593Smuzhiyun 				litlen = 1;
526*4882a593Smuzhiyun 				price = opt[cur - 1].price + ZSTD_getLiteralPrice(seqStorePtr, litlen, inr - 1);
527*4882a593Smuzhiyun 			}
528*4882a593Smuzhiyun 
529*4882a593Smuzhiyun 			if (cur > last_pos || price <= opt[cur].price)
530*4882a593Smuzhiyun 				SET_PRICE(cur, 1, 0, litlen, price);
531*4882a593Smuzhiyun 
532*4882a593Smuzhiyun 			if (cur == last_pos)
533*4882a593Smuzhiyun 				break;
534*4882a593Smuzhiyun 
535*4882a593Smuzhiyun 			if (inr > ilimit) /* last match must start at a minimum distance of 8 from oend */
536*4882a593Smuzhiyun 				continue;
537*4882a593Smuzhiyun 
538*4882a593Smuzhiyun 			mlen = opt[cur].mlen;
539*4882a593Smuzhiyun 			if (opt[cur].off > ZSTD_REP_MOVE_OPT) {
540*4882a593Smuzhiyun 				opt[cur].rep[2] = opt[cur - mlen].rep[1];
541*4882a593Smuzhiyun 				opt[cur].rep[1] = opt[cur - mlen].rep[0];
542*4882a593Smuzhiyun 				opt[cur].rep[0] = opt[cur].off - ZSTD_REP_MOVE_OPT;
543*4882a593Smuzhiyun 			} else {
544*4882a593Smuzhiyun 				opt[cur].rep[2] = (opt[cur].off > 1) ? opt[cur - mlen].rep[1] : opt[cur - mlen].rep[2];
545*4882a593Smuzhiyun 				opt[cur].rep[1] = (opt[cur].off > 0) ? opt[cur - mlen].rep[0] : opt[cur - mlen].rep[1];
546*4882a593Smuzhiyun 				opt[cur].rep[0] =
547*4882a593Smuzhiyun 				    ((opt[cur].off == ZSTD_REP_MOVE_OPT) && (mlen != 1)) ? (opt[cur - mlen].rep[0] - 1) : (opt[cur - mlen].rep[opt[cur].off]);
548*4882a593Smuzhiyun 			}
549*4882a593Smuzhiyun 
550*4882a593Smuzhiyun 			best_mlen = minMatch;
551*4882a593Smuzhiyun 			{
552*4882a593Smuzhiyun 				U32 i, last_i = ZSTD_REP_CHECK + (mlen != 1);
553*4882a593Smuzhiyun 				for (i = (opt[cur].mlen != 1); i < last_i; i++) { /* check rep */
554*4882a593Smuzhiyun 					const S32 repCur = (i == ZSTD_REP_MOVE_OPT) ? (opt[cur].rep[0] - 1) : opt[cur].rep[i];
555*4882a593Smuzhiyun 					if ((repCur > 0) && (repCur < (S32)(inr - prefixStart)) &&
556*4882a593Smuzhiyun 					    (ZSTD_readMINMATCH(inr, minMatch) == ZSTD_readMINMATCH(inr - repCur, minMatch))) {
557*4882a593Smuzhiyun 						mlen = (U32)ZSTD_count(inr + minMatch, inr + minMatch - repCur, iend) + minMatch;
558*4882a593Smuzhiyun 
559*4882a593Smuzhiyun 						if (mlen > sufficient_len || cur + mlen >= ZSTD_OPT_NUM) {
560*4882a593Smuzhiyun 							best_mlen = mlen;
561*4882a593Smuzhiyun 							best_off = i;
562*4882a593Smuzhiyun 							last_pos = cur + 1;
563*4882a593Smuzhiyun 							goto _storeSequence;
564*4882a593Smuzhiyun 						}
565*4882a593Smuzhiyun 
566*4882a593Smuzhiyun 						best_off = i - (opt[cur].mlen != 1);
567*4882a593Smuzhiyun 						if (mlen > best_mlen)
568*4882a593Smuzhiyun 							best_mlen = mlen;
569*4882a593Smuzhiyun 
570*4882a593Smuzhiyun 						do {
571*4882a593Smuzhiyun 							if (opt[cur].mlen == 1) {
572*4882a593Smuzhiyun 								litlen = opt[cur].litlen;
573*4882a593Smuzhiyun 								if (cur > litlen) {
574*4882a593Smuzhiyun 									price = opt[cur - litlen].price + ZSTD_getPrice(seqStorePtr, litlen, inr - litlen,
575*4882a593Smuzhiyun 															best_off, mlen - MINMATCH, ultra);
576*4882a593Smuzhiyun 								} else
577*4882a593Smuzhiyun 									price = ZSTD_getPrice(seqStorePtr, litlen, anchor, best_off, mlen - MINMATCH, ultra);
578*4882a593Smuzhiyun 							} else {
579*4882a593Smuzhiyun 								litlen = 0;
580*4882a593Smuzhiyun 								price = opt[cur].price + ZSTD_getPrice(seqStorePtr, 0, NULL, best_off, mlen - MINMATCH, ultra);
581*4882a593Smuzhiyun 							}
582*4882a593Smuzhiyun 
583*4882a593Smuzhiyun 							if (cur + mlen > last_pos || price <= opt[cur + mlen].price)
584*4882a593Smuzhiyun 								SET_PRICE(cur + mlen, mlen, i, litlen, price);
585*4882a593Smuzhiyun 							mlen--;
586*4882a593Smuzhiyun 						} while (mlen >= minMatch);
587*4882a593Smuzhiyun 					}
588*4882a593Smuzhiyun 				}
589*4882a593Smuzhiyun 			}
590*4882a593Smuzhiyun 
591*4882a593Smuzhiyun 			match_num = ZSTD_BtGetAllMatches_selectMLS(ctx, inr, iend, maxSearches, mls, matches, best_mlen);
592*4882a593Smuzhiyun 
593*4882a593Smuzhiyun 			if (match_num > 0 && (matches[match_num - 1].len > sufficient_len || cur + matches[match_num - 1].len >= ZSTD_OPT_NUM)) {
594*4882a593Smuzhiyun 				best_mlen = matches[match_num - 1].len;
595*4882a593Smuzhiyun 				best_off = matches[match_num - 1].off;
596*4882a593Smuzhiyun 				last_pos = cur + 1;
597*4882a593Smuzhiyun 				goto _storeSequence;
598*4882a593Smuzhiyun 			}
599*4882a593Smuzhiyun 
600*4882a593Smuzhiyun 			/* set prices using matches at position = cur */
601*4882a593Smuzhiyun 			for (u = 0; u < match_num; u++) {
602*4882a593Smuzhiyun 				mlen = (u > 0) ? matches[u - 1].len + 1 : best_mlen;
603*4882a593Smuzhiyun 				best_mlen = matches[u].len;
604*4882a593Smuzhiyun 
605*4882a593Smuzhiyun 				while (mlen <= best_mlen) {
606*4882a593Smuzhiyun 					if (opt[cur].mlen == 1) {
607*4882a593Smuzhiyun 						litlen = opt[cur].litlen;
608*4882a593Smuzhiyun 						if (cur > litlen)
609*4882a593Smuzhiyun 							price = opt[cur - litlen].price + ZSTD_getPrice(seqStorePtr, litlen, ip + cur - litlen,
610*4882a593Smuzhiyun 													matches[u].off - 1, mlen - MINMATCH, ultra);
611*4882a593Smuzhiyun 						else
612*4882a593Smuzhiyun 							price = ZSTD_getPrice(seqStorePtr, litlen, anchor, matches[u].off - 1, mlen - MINMATCH, ultra);
613*4882a593Smuzhiyun 					} else {
614*4882a593Smuzhiyun 						litlen = 0;
615*4882a593Smuzhiyun 						price = opt[cur].price + ZSTD_getPrice(seqStorePtr, 0, NULL, matches[u].off - 1, mlen - MINMATCH, ultra);
616*4882a593Smuzhiyun 					}
617*4882a593Smuzhiyun 
618*4882a593Smuzhiyun 					if (cur + mlen > last_pos || (price < opt[cur + mlen].price))
619*4882a593Smuzhiyun 						SET_PRICE(cur + mlen, mlen, matches[u].off, litlen, price);
620*4882a593Smuzhiyun 
621*4882a593Smuzhiyun 					mlen++;
622*4882a593Smuzhiyun 				}
623*4882a593Smuzhiyun 			}
624*4882a593Smuzhiyun 		}
625*4882a593Smuzhiyun 
626*4882a593Smuzhiyun 		best_mlen = opt[last_pos].mlen;
627*4882a593Smuzhiyun 		best_off = opt[last_pos].off;
628*4882a593Smuzhiyun 		cur = last_pos - best_mlen;
629*4882a593Smuzhiyun 
630*4882a593Smuzhiyun 	/* store sequence */
631*4882a593Smuzhiyun _storeSequence: /* cur, last_pos, best_mlen, best_off have to be set */
632*4882a593Smuzhiyun 		opt[0].mlen = 1;
633*4882a593Smuzhiyun 
634*4882a593Smuzhiyun 		while (1) {
635*4882a593Smuzhiyun 			mlen = opt[cur].mlen;
636*4882a593Smuzhiyun 			offset = opt[cur].off;
637*4882a593Smuzhiyun 			opt[cur].mlen = best_mlen;
638*4882a593Smuzhiyun 			opt[cur].off = best_off;
639*4882a593Smuzhiyun 			best_mlen = mlen;
640*4882a593Smuzhiyun 			best_off = offset;
641*4882a593Smuzhiyun 			if (mlen > cur)
642*4882a593Smuzhiyun 				break;
643*4882a593Smuzhiyun 			cur -= mlen;
644*4882a593Smuzhiyun 		}
645*4882a593Smuzhiyun 
646*4882a593Smuzhiyun 		for (u = 0; u <= last_pos;) {
647*4882a593Smuzhiyun 			u += opt[u].mlen;
648*4882a593Smuzhiyun 		}
649*4882a593Smuzhiyun 
650*4882a593Smuzhiyun 		for (cur = 0; cur < last_pos;) {
651*4882a593Smuzhiyun 			mlen = opt[cur].mlen;
652*4882a593Smuzhiyun 			if (mlen == 1) {
653*4882a593Smuzhiyun 				ip++;
654*4882a593Smuzhiyun 				cur++;
655*4882a593Smuzhiyun 				continue;
656*4882a593Smuzhiyun 			}
657*4882a593Smuzhiyun 			offset = opt[cur].off;
658*4882a593Smuzhiyun 			cur += mlen;
659*4882a593Smuzhiyun 			litLength = (U32)(ip - anchor);
660*4882a593Smuzhiyun 
661*4882a593Smuzhiyun 			if (offset > ZSTD_REP_MOVE_OPT) {
662*4882a593Smuzhiyun 				rep[2] = rep[1];
663*4882a593Smuzhiyun 				rep[1] = rep[0];
664*4882a593Smuzhiyun 				rep[0] = offset - ZSTD_REP_MOVE_OPT;
665*4882a593Smuzhiyun 				offset--;
666*4882a593Smuzhiyun 			} else {
667*4882a593Smuzhiyun 				if (offset != 0) {
668*4882a593Smuzhiyun 					best_off = (offset == ZSTD_REP_MOVE_OPT) ? (rep[0] - 1) : (rep[offset]);
669*4882a593Smuzhiyun 					if (offset != 1)
670*4882a593Smuzhiyun 						rep[2] = rep[1];
671*4882a593Smuzhiyun 					rep[1] = rep[0];
672*4882a593Smuzhiyun 					rep[0] = best_off;
673*4882a593Smuzhiyun 				}
674*4882a593Smuzhiyun 				if (litLength == 0)
675*4882a593Smuzhiyun 					offset--;
676*4882a593Smuzhiyun 			}
677*4882a593Smuzhiyun 
678*4882a593Smuzhiyun 			ZSTD_updatePrice(seqStorePtr, litLength, anchor, offset, mlen - MINMATCH);
679*4882a593Smuzhiyun 			ZSTD_storeSeq(seqStorePtr, litLength, anchor, offset, mlen - MINMATCH);
680*4882a593Smuzhiyun 			anchor = ip = ip + mlen;
681*4882a593Smuzhiyun 		}
682*4882a593Smuzhiyun 	} /* for (cur=0; cur < last_pos; ) */
683*4882a593Smuzhiyun 
684*4882a593Smuzhiyun 	/* Save reps for next block */
685*4882a593Smuzhiyun 	{
686*4882a593Smuzhiyun 		int i;
687*4882a593Smuzhiyun 		for (i = 0; i < ZSTD_REP_NUM; i++)
688*4882a593Smuzhiyun 			ctx->repToConfirm[i] = rep[i];
689*4882a593Smuzhiyun 	}
690*4882a593Smuzhiyun 
691*4882a593Smuzhiyun 	/* Last Literals */
692*4882a593Smuzhiyun 	{
693*4882a593Smuzhiyun 		size_t const lastLLSize = iend - anchor;
694*4882a593Smuzhiyun 		memcpy(seqStorePtr->lit, anchor, lastLLSize);
695*4882a593Smuzhiyun 		seqStorePtr->lit += lastLLSize;
696*4882a593Smuzhiyun 	}
697*4882a593Smuzhiyun }
698*4882a593Smuzhiyun 
699*4882a593Smuzhiyun FORCE_INLINE
ZSTD_compressBlock_opt_extDict_generic(ZSTD_CCtx * ctx,const void * src,size_t srcSize,const int ultra)700*4882a593Smuzhiyun void ZSTD_compressBlock_opt_extDict_generic(ZSTD_CCtx *ctx, const void *src, size_t srcSize, const int ultra)
701*4882a593Smuzhiyun {
702*4882a593Smuzhiyun 	seqStore_t *seqStorePtr = &(ctx->seqStore);
703*4882a593Smuzhiyun 	const BYTE *const istart = (const BYTE *)src;
704*4882a593Smuzhiyun 	const BYTE *ip = istart;
705*4882a593Smuzhiyun 	const BYTE *anchor = istart;
706*4882a593Smuzhiyun 	const BYTE *const iend = istart + srcSize;
707*4882a593Smuzhiyun 	const BYTE *const ilimit = iend - 8;
708*4882a593Smuzhiyun 	const BYTE *const base = ctx->base;
709*4882a593Smuzhiyun 	const U32 lowestIndex = ctx->lowLimit;
710*4882a593Smuzhiyun 	const U32 dictLimit = ctx->dictLimit;
711*4882a593Smuzhiyun 	const BYTE *const prefixStart = base + dictLimit;
712*4882a593Smuzhiyun 	const BYTE *const dictBase = ctx->dictBase;
713*4882a593Smuzhiyun 	const BYTE *const dictEnd = dictBase + dictLimit;
714*4882a593Smuzhiyun 
715*4882a593Smuzhiyun 	const U32 maxSearches = 1U << ctx->params.cParams.searchLog;
716*4882a593Smuzhiyun 	const U32 sufficient_len = ctx->params.cParams.targetLength;
717*4882a593Smuzhiyun 	const U32 mls = ctx->params.cParams.searchLength;
718*4882a593Smuzhiyun 	const U32 minMatch = (ctx->params.cParams.searchLength == 3) ? 3 : 4;
719*4882a593Smuzhiyun 
720*4882a593Smuzhiyun 	ZSTD_optimal_t *opt = seqStorePtr->priceTable;
721*4882a593Smuzhiyun 	ZSTD_match_t *matches = seqStorePtr->matchTable;
722*4882a593Smuzhiyun 	const BYTE *inr;
723*4882a593Smuzhiyun 
724*4882a593Smuzhiyun 	/* init */
725*4882a593Smuzhiyun 	U32 offset, rep[ZSTD_REP_NUM];
726*4882a593Smuzhiyun 	{
727*4882a593Smuzhiyun 		U32 i;
728*4882a593Smuzhiyun 		for (i = 0; i < ZSTD_REP_NUM; i++)
729*4882a593Smuzhiyun 			rep[i] = ctx->rep[i];
730*4882a593Smuzhiyun 	}
731*4882a593Smuzhiyun 
732*4882a593Smuzhiyun 	ctx->nextToUpdate3 = ctx->nextToUpdate;
733*4882a593Smuzhiyun 	ZSTD_rescaleFreqs(seqStorePtr, (const BYTE *)src, srcSize);
734*4882a593Smuzhiyun 	ip += (ip == prefixStart);
735*4882a593Smuzhiyun 
736*4882a593Smuzhiyun 	/* Match Loop */
737*4882a593Smuzhiyun 	while (ip < ilimit) {
738*4882a593Smuzhiyun 		U32 cur, match_num, last_pos, litlen, price;
739*4882a593Smuzhiyun 		U32 u, mlen, best_mlen, best_off, litLength;
740*4882a593Smuzhiyun 		U32 curr = (U32)(ip - base);
741*4882a593Smuzhiyun 		memset(opt, 0, sizeof(ZSTD_optimal_t));
742*4882a593Smuzhiyun 		last_pos = 0;
743*4882a593Smuzhiyun 		opt[0].litlen = (U32)(ip - anchor);
744*4882a593Smuzhiyun 
745*4882a593Smuzhiyun 		/* check repCode */
746*4882a593Smuzhiyun 		{
747*4882a593Smuzhiyun 			U32 i, last_i = ZSTD_REP_CHECK + (ip == anchor);
748*4882a593Smuzhiyun 			for (i = (ip == anchor); i < last_i; i++) {
749*4882a593Smuzhiyun 				const S32 repCur = (i == ZSTD_REP_MOVE_OPT) ? (rep[0] - 1) : rep[i];
750*4882a593Smuzhiyun 				const U32 repIndex = (U32)(curr - repCur);
751*4882a593Smuzhiyun 				const BYTE *const repBase = repIndex < dictLimit ? dictBase : base;
752*4882a593Smuzhiyun 				const BYTE *const repMatch = repBase + repIndex;
753*4882a593Smuzhiyun 				if ((repCur > 0 && repCur <= (S32)curr) &&
754*4882a593Smuzhiyun 				    (((U32)((dictLimit - 1) - repIndex) >= 3) & (repIndex > lowestIndex)) /* intentional overflow */
755*4882a593Smuzhiyun 				    && (ZSTD_readMINMATCH(ip, minMatch) == ZSTD_readMINMATCH(repMatch, minMatch))) {
756*4882a593Smuzhiyun 					/* repcode detected we should take it */
757*4882a593Smuzhiyun 					const BYTE *const repEnd = repIndex < dictLimit ? dictEnd : iend;
758*4882a593Smuzhiyun 					mlen = (U32)ZSTD_count_2segments(ip + minMatch, repMatch + minMatch, iend, repEnd, prefixStart) + minMatch;
759*4882a593Smuzhiyun 
760*4882a593Smuzhiyun 					if (mlen > sufficient_len || mlen >= ZSTD_OPT_NUM) {
761*4882a593Smuzhiyun 						best_mlen = mlen;
762*4882a593Smuzhiyun 						best_off = i;
763*4882a593Smuzhiyun 						cur = 0;
764*4882a593Smuzhiyun 						last_pos = 1;
765*4882a593Smuzhiyun 						goto _storeSequence;
766*4882a593Smuzhiyun 					}
767*4882a593Smuzhiyun 
768*4882a593Smuzhiyun 					best_off = i - (ip == anchor);
769*4882a593Smuzhiyun 					litlen = opt[0].litlen;
770*4882a593Smuzhiyun 					do {
771*4882a593Smuzhiyun 						price = ZSTD_getPrice(seqStorePtr, litlen, anchor, best_off, mlen - MINMATCH, ultra);
772*4882a593Smuzhiyun 						if (mlen > last_pos || price < opt[mlen].price)
773*4882a593Smuzhiyun 							SET_PRICE(mlen, mlen, i, litlen, price); /* note : macro modifies last_pos */
774*4882a593Smuzhiyun 						mlen--;
775*4882a593Smuzhiyun 					} while (mlen >= minMatch);
776*4882a593Smuzhiyun 				}
777*4882a593Smuzhiyun 			}
778*4882a593Smuzhiyun 		}
779*4882a593Smuzhiyun 
780*4882a593Smuzhiyun 		match_num = ZSTD_BtGetAllMatches_selectMLS_extDict(ctx, ip, iend, maxSearches, mls, matches, minMatch); /* first search (depth 0) */
781*4882a593Smuzhiyun 
782*4882a593Smuzhiyun 		if (!last_pos && !match_num) {
783*4882a593Smuzhiyun 			ip++;
784*4882a593Smuzhiyun 			continue;
785*4882a593Smuzhiyun 		}
786*4882a593Smuzhiyun 
787*4882a593Smuzhiyun 		{
788*4882a593Smuzhiyun 			U32 i;
789*4882a593Smuzhiyun 			for (i = 0; i < ZSTD_REP_NUM; i++)
790*4882a593Smuzhiyun 				opt[0].rep[i] = rep[i];
791*4882a593Smuzhiyun 		}
792*4882a593Smuzhiyun 		opt[0].mlen = 1;
793*4882a593Smuzhiyun 
794*4882a593Smuzhiyun 		if (match_num && (matches[match_num - 1].len > sufficient_len || matches[match_num - 1].len >= ZSTD_OPT_NUM)) {
795*4882a593Smuzhiyun 			best_mlen = matches[match_num - 1].len;
796*4882a593Smuzhiyun 			best_off = matches[match_num - 1].off;
797*4882a593Smuzhiyun 			cur = 0;
798*4882a593Smuzhiyun 			last_pos = 1;
799*4882a593Smuzhiyun 			goto _storeSequence;
800*4882a593Smuzhiyun 		}
801*4882a593Smuzhiyun 
802*4882a593Smuzhiyun 		best_mlen = (last_pos) ? last_pos : minMatch;
803*4882a593Smuzhiyun 
804*4882a593Smuzhiyun 		/* set prices using matches at position = 0 */
805*4882a593Smuzhiyun 		for (u = 0; u < match_num; u++) {
806*4882a593Smuzhiyun 			mlen = (u > 0) ? matches[u - 1].len + 1 : best_mlen;
807*4882a593Smuzhiyun 			best_mlen = matches[u].len;
808*4882a593Smuzhiyun 			litlen = opt[0].litlen;
809*4882a593Smuzhiyun 			while (mlen <= best_mlen) {
810*4882a593Smuzhiyun 				price = ZSTD_getPrice(seqStorePtr, litlen, anchor, matches[u].off - 1, mlen - MINMATCH, ultra);
811*4882a593Smuzhiyun 				if (mlen > last_pos || price < opt[mlen].price)
812*4882a593Smuzhiyun 					SET_PRICE(mlen, mlen, matches[u].off, litlen, price);
813*4882a593Smuzhiyun 				mlen++;
814*4882a593Smuzhiyun 			}
815*4882a593Smuzhiyun 		}
816*4882a593Smuzhiyun 
817*4882a593Smuzhiyun 		if (last_pos < minMatch) {
818*4882a593Smuzhiyun 			ip++;
819*4882a593Smuzhiyun 			continue;
820*4882a593Smuzhiyun 		}
821*4882a593Smuzhiyun 
822*4882a593Smuzhiyun 		/* check further positions */
823*4882a593Smuzhiyun 		for (cur = 1; cur <= last_pos; cur++) {
824*4882a593Smuzhiyun 			inr = ip + cur;
825*4882a593Smuzhiyun 
826*4882a593Smuzhiyun 			if (opt[cur - 1].mlen == 1) {
827*4882a593Smuzhiyun 				litlen = opt[cur - 1].litlen + 1;
828*4882a593Smuzhiyun 				if (cur > litlen) {
829*4882a593Smuzhiyun 					price = opt[cur - litlen].price + ZSTD_getLiteralPrice(seqStorePtr, litlen, inr - litlen);
830*4882a593Smuzhiyun 				} else
831*4882a593Smuzhiyun 					price = ZSTD_getLiteralPrice(seqStorePtr, litlen, anchor);
832*4882a593Smuzhiyun 			} else {
833*4882a593Smuzhiyun 				litlen = 1;
834*4882a593Smuzhiyun 				price = opt[cur - 1].price + ZSTD_getLiteralPrice(seqStorePtr, litlen, inr - 1);
835*4882a593Smuzhiyun 			}
836*4882a593Smuzhiyun 
837*4882a593Smuzhiyun 			if (cur > last_pos || price <= opt[cur].price)
838*4882a593Smuzhiyun 				SET_PRICE(cur, 1, 0, litlen, price);
839*4882a593Smuzhiyun 
840*4882a593Smuzhiyun 			if (cur == last_pos)
841*4882a593Smuzhiyun 				break;
842*4882a593Smuzhiyun 
843*4882a593Smuzhiyun 			if (inr > ilimit) /* last match must start at a minimum distance of 8 from oend */
844*4882a593Smuzhiyun 				continue;
845*4882a593Smuzhiyun 
846*4882a593Smuzhiyun 			mlen = opt[cur].mlen;
847*4882a593Smuzhiyun 			if (opt[cur].off > ZSTD_REP_MOVE_OPT) {
848*4882a593Smuzhiyun 				opt[cur].rep[2] = opt[cur - mlen].rep[1];
849*4882a593Smuzhiyun 				opt[cur].rep[1] = opt[cur - mlen].rep[0];
850*4882a593Smuzhiyun 				opt[cur].rep[0] = opt[cur].off - ZSTD_REP_MOVE_OPT;
851*4882a593Smuzhiyun 			} else {
852*4882a593Smuzhiyun 				opt[cur].rep[2] = (opt[cur].off > 1) ? opt[cur - mlen].rep[1] : opt[cur - mlen].rep[2];
853*4882a593Smuzhiyun 				opt[cur].rep[1] = (opt[cur].off > 0) ? opt[cur - mlen].rep[0] : opt[cur - mlen].rep[1];
854*4882a593Smuzhiyun 				opt[cur].rep[0] =
855*4882a593Smuzhiyun 				    ((opt[cur].off == ZSTD_REP_MOVE_OPT) && (mlen != 1)) ? (opt[cur - mlen].rep[0] - 1) : (opt[cur - mlen].rep[opt[cur].off]);
856*4882a593Smuzhiyun 			}
857*4882a593Smuzhiyun 
858*4882a593Smuzhiyun 			best_mlen = minMatch;
859*4882a593Smuzhiyun 			{
860*4882a593Smuzhiyun 				U32 i, last_i = ZSTD_REP_CHECK + (mlen != 1);
861*4882a593Smuzhiyun 				for (i = (mlen != 1); i < last_i; i++) {
862*4882a593Smuzhiyun 					const S32 repCur = (i == ZSTD_REP_MOVE_OPT) ? (opt[cur].rep[0] - 1) : opt[cur].rep[i];
863*4882a593Smuzhiyun 					const U32 repIndex = (U32)(curr + cur - repCur);
864*4882a593Smuzhiyun 					const BYTE *const repBase = repIndex < dictLimit ? dictBase : base;
865*4882a593Smuzhiyun 					const BYTE *const repMatch = repBase + repIndex;
866*4882a593Smuzhiyun 					if ((repCur > 0 && repCur <= (S32)(curr + cur)) &&
867*4882a593Smuzhiyun 					    (((U32)((dictLimit - 1) - repIndex) >= 3) & (repIndex > lowestIndex)) /* intentional overflow */
868*4882a593Smuzhiyun 					    && (ZSTD_readMINMATCH(inr, minMatch) == ZSTD_readMINMATCH(repMatch, minMatch))) {
869*4882a593Smuzhiyun 						/* repcode detected */
870*4882a593Smuzhiyun 						const BYTE *const repEnd = repIndex < dictLimit ? dictEnd : iend;
871*4882a593Smuzhiyun 						mlen = (U32)ZSTD_count_2segments(inr + minMatch, repMatch + minMatch, iend, repEnd, prefixStart) + minMatch;
872*4882a593Smuzhiyun 
873*4882a593Smuzhiyun 						if (mlen > sufficient_len || cur + mlen >= ZSTD_OPT_NUM) {
874*4882a593Smuzhiyun 							best_mlen = mlen;
875*4882a593Smuzhiyun 							best_off = i;
876*4882a593Smuzhiyun 							last_pos = cur + 1;
877*4882a593Smuzhiyun 							goto _storeSequence;
878*4882a593Smuzhiyun 						}
879*4882a593Smuzhiyun 
880*4882a593Smuzhiyun 						best_off = i - (opt[cur].mlen != 1);
881*4882a593Smuzhiyun 						if (mlen > best_mlen)
882*4882a593Smuzhiyun 							best_mlen = mlen;
883*4882a593Smuzhiyun 
884*4882a593Smuzhiyun 						do {
885*4882a593Smuzhiyun 							if (opt[cur].mlen == 1) {
886*4882a593Smuzhiyun 								litlen = opt[cur].litlen;
887*4882a593Smuzhiyun 								if (cur > litlen) {
888*4882a593Smuzhiyun 									price = opt[cur - litlen].price + ZSTD_getPrice(seqStorePtr, litlen, inr - litlen,
889*4882a593Smuzhiyun 															best_off, mlen - MINMATCH, ultra);
890*4882a593Smuzhiyun 								} else
891*4882a593Smuzhiyun 									price = ZSTD_getPrice(seqStorePtr, litlen, anchor, best_off, mlen - MINMATCH, ultra);
892*4882a593Smuzhiyun 							} else {
893*4882a593Smuzhiyun 								litlen = 0;
894*4882a593Smuzhiyun 								price = opt[cur].price + ZSTD_getPrice(seqStorePtr, 0, NULL, best_off, mlen - MINMATCH, ultra);
895*4882a593Smuzhiyun 							}
896*4882a593Smuzhiyun 
897*4882a593Smuzhiyun 							if (cur + mlen > last_pos || price <= opt[cur + mlen].price)
898*4882a593Smuzhiyun 								SET_PRICE(cur + mlen, mlen, i, litlen, price);
899*4882a593Smuzhiyun 							mlen--;
900*4882a593Smuzhiyun 						} while (mlen >= minMatch);
901*4882a593Smuzhiyun 					}
902*4882a593Smuzhiyun 				}
903*4882a593Smuzhiyun 			}
904*4882a593Smuzhiyun 
905*4882a593Smuzhiyun 			match_num = ZSTD_BtGetAllMatches_selectMLS_extDict(ctx, inr, iend, maxSearches, mls, matches, minMatch);
906*4882a593Smuzhiyun 
907*4882a593Smuzhiyun 			if (match_num > 0 && (matches[match_num - 1].len > sufficient_len || cur + matches[match_num - 1].len >= ZSTD_OPT_NUM)) {
908*4882a593Smuzhiyun 				best_mlen = matches[match_num - 1].len;
909*4882a593Smuzhiyun 				best_off = matches[match_num - 1].off;
910*4882a593Smuzhiyun 				last_pos = cur + 1;
911*4882a593Smuzhiyun 				goto _storeSequence;
912*4882a593Smuzhiyun 			}
913*4882a593Smuzhiyun 
914*4882a593Smuzhiyun 			/* set prices using matches at position = cur */
915*4882a593Smuzhiyun 			for (u = 0; u < match_num; u++) {
916*4882a593Smuzhiyun 				mlen = (u > 0) ? matches[u - 1].len + 1 : best_mlen;
917*4882a593Smuzhiyun 				best_mlen = matches[u].len;
918*4882a593Smuzhiyun 
919*4882a593Smuzhiyun 				while (mlen <= best_mlen) {
920*4882a593Smuzhiyun 					if (opt[cur].mlen == 1) {
921*4882a593Smuzhiyun 						litlen = opt[cur].litlen;
922*4882a593Smuzhiyun 						if (cur > litlen)
923*4882a593Smuzhiyun 							price = opt[cur - litlen].price + ZSTD_getPrice(seqStorePtr, litlen, ip + cur - litlen,
924*4882a593Smuzhiyun 													matches[u].off - 1, mlen - MINMATCH, ultra);
925*4882a593Smuzhiyun 						else
926*4882a593Smuzhiyun 							price = ZSTD_getPrice(seqStorePtr, litlen, anchor, matches[u].off - 1, mlen - MINMATCH, ultra);
927*4882a593Smuzhiyun 					} else {
928*4882a593Smuzhiyun 						litlen = 0;
929*4882a593Smuzhiyun 						price = opt[cur].price + ZSTD_getPrice(seqStorePtr, 0, NULL, matches[u].off - 1, mlen - MINMATCH, ultra);
930*4882a593Smuzhiyun 					}
931*4882a593Smuzhiyun 
932*4882a593Smuzhiyun 					if (cur + mlen > last_pos || (price < opt[cur + mlen].price))
933*4882a593Smuzhiyun 						SET_PRICE(cur + mlen, mlen, matches[u].off, litlen, price);
934*4882a593Smuzhiyun 
935*4882a593Smuzhiyun 					mlen++;
936*4882a593Smuzhiyun 				}
937*4882a593Smuzhiyun 			}
938*4882a593Smuzhiyun 		} /* for (cur = 1; cur <= last_pos; cur++) */
939*4882a593Smuzhiyun 
940*4882a593Smuzhiyun 		best_mlen = opt[last_pos].mlen;
941*4882a593Smuzhiyun 		best_off = opt[last_pos].off;
942*4882a593Smuzhiyun 		cur = last_pos - best_mlen;
943*4882a593Smuzhiyun 
944*4882a593Smuzhiyun 	/* store sequence */
945*4882a593Smuzhiyun _storeSequence: /* cur, last_pos, best_mlen, best_off have to be set */
946*4882a593Smuzhiyun 		opt[0].mlen = 1;
947*4882a593Smuzhiyun 
948*4882a593Smuzhiyun 		while (1) {
949*4882a593Smuzhiyun 			mlen = opt[cur].mlen;
950*4882a593Smuzhiyun 			offset = opt[cur].off;
951*4882a593Smuzhiyun 			opt[cur].mlen = best_mlen;
952*4882a593Smuzhiyun 			opt[cur].off = best_off;
953*4882a593Smuzhiyun 			best_mlen = mlen;
954*4882a593Smuzhiyun 			best_off = offset;
955*4882a593Smuzhiyun 			if (mlen > cur)
956*4882a593Smuzhiyun 				break;
957*4882a593Smuzhiyun 			cur -= mlen;
958*4882a593Smuzhiyun 		}
959*4882a593Smuzhiyun 
960*4882a593Smuzhiyun 		for (u = 0; u <= last_pos;) {
961*4882a593Smuzhiyun 			u += opt[u].mlen;
962*4882a593Smuzhiyun 		}
963*4882a593Smuzhiyun 
964*4882a593Smuzhiyun 		for (cur = 0; cur < last_pos;) {
965*4882a593Smuzhiyun 			mlen = opt[cur].mlen;
966*4882a593Smuzhiyun 			if (mlen == 1) {
967*4882a593Smuzhiyun 				ip++;
968*4882a593Smuzhiyun 				cur++;
969*4882a593Smuzhiyun 				continue;
970*4882a593Smuzhiyun 			}
971*4882a593Smuzhiyun 			offset = opt[cur].off;
972*4882a593Smuzhiyun 			cur += mlen;
973*4882a593Smuzhiyun 			litLength = (U32)(ip - anchor);
974*4882a593Smuzhiyun 
975*4882a593Smuzhiyun 			if (offset > ZSTD_REP_MOVE_OPT) {
976*4882a593Smuzhiyun 				rep[2] = rep[1];
977*4882a593Smuzhiyun 				rep[1] = rep[0];
978*4882a593Smuzhiyun 				rep[0] = offset - ZSTD_REP_MOVE_OPT;
979*4882a593Smuzhiyun 				offset--;
980*4882a593Smuzhiyun 			} else {
981*4882a593Smuzhiyun 				if (offset != 0) {
982*4882a593Smuzhiyun 					best_off = (offset == ZSTD_REP_MOVE_OPT) ? (rep[0] - 1) : (rep[offset]);
983*4882a593Smuzhiyun 					if (offset != 1)
984*4882a593Smuzhiyun 						rep[2] = rep[1];
985*4882a593Smuzhiyun 					rep[1] = rep[0];
986*4882a593Smuzhiyun 					rep[0] = best_off;
987*4882a593Smuzhiyun 				}
988*4882a593Smuzhiyun 
989*4882a593Smuzhiyun 				if (litLength == 0)
990*4882a593Smuzhiyun 					offset--;
991*4882a593Smuzhiyun 			}
992*4882a593Smuzhiyun 
993*4882a593Smuzhiyun 			ZSTD_updatePrice(seqStorePtr, litLength, anchor, offset, mlen - MINMATCH);
994*4882a593Smuzhiyun 			ZSTD_storeSeq(seqStorePtr, litLength, anchor, offset, mlen - MINMATCH);
995*4882a593Smuzhiyun 			anchor = ip = ip + mlen;
996*4882a593Smuzhiyun 		}
997*4882a593Smuzhiyun 	} /* for (cur=0; cur < last_pos; ) */
998*4882a593Smuzhiyun 
999*4882a593Smuzhiyun 	/* Save reps for next block */
1000*4882a593Smuzhiyun 	{
1001*4882a593Smuzhiyun 		int i;
1002*4882a593Smuzhiyun 		for (i = 0; i < ZSTD_REP_NUM; i++)
1003*4882a593Smuzhiyun 			ctx->repToConfirm[i] = rep[i];
1004*4882a593Smuzhiyun 	}
1005*4882a593Smuzhiyun 
1006*4882a593Smuzhiyun 	/* Last Literals */
1007*4882a593Smuzhiyun 	{
1008*4882a593Smuzhiyun 		size_t lastLLSize = iend - anchor;
1009*4882a593Smuzhiyun 		memcpy(seqStorePtr->lit, anchor, lastLLSize);
1010*4882a593Smuzhiyun 		seqStorePtr->lit += lastLLSize;
1011*4882a593Smuzhiyun 	}
1012*4882a593Smuzhiyun }
1013*4882a593Smuzhiyun 
1014*4882a593Smuzhiyun #endif /* ZSTD_OPT_H_91842398743 */
1015