xref: /freebsd/sys/contrib/zstd/lib/compress/zstd_compress_internal.h (revision a521f2116473fbd8c09db395518f060a27d02334)
1 /*
2  * Copyright (c) 2016-2020, Yann Collet, Facebook, Inc.
3  * All rights reserved.
4  *
5  * This source code is licensed under both the BSD-style license (found in the
6  * LICENSE file in the root directory of this source tree) and the GPLv2 (found
7  * in the COPYING file in the root directory of this source tree).
8  * You may select, at your option, one of the above-listed licenses.
9  */
10 
11 /* This header contains definitions
12  * that shall **only** be used by modules within lib/compress.
13  */
14 
15 #ifndef ZSTD_COMPRESS_H
16 #define ZSTD_COMPRESS_H
17 
18 /*-*************************************
19 *  Dependencies
20 ***************************************/
21 #include "../common/zstd_internal.h"
22 #include "zstd_cwksp.h"
23 #ifdef ZSTD_MULTITHREAD
24 #  include "zstdmt_compress.h"
25 #endif
26 
27 #if defined (__cplusplus)
28 extern "C" {
29 #endif
30 
31 
32 /*-*************************************
33 *  Constants
34 ***************************************/
35 #define kSearchStrength      8
36 #define HASH_READ_SIZE       8
37 #define ZSTD_DUBT_UNSORTED_MARK 1   /* For btlazy2 strategy, index ZSTD_DUBT_UNSORTED_MARK==1 means "unsorted".
38                                        It could be confused for a real successor at index "1", if sorted as larger than its predecessor.
39                                        It's not a big deal though : candidate will just be sorted again.
40                                        Additionally, candidate position 1 will be lost.
41                                        But candidate 1 cannot hide a large tree of candidates, so it's a minimal loss.
42                                        The benefit is that ZSTD_DUBT_UNSORTED_MARK cannot be mishandled after table re-use with a different strategy.
43                                        This constant is required by ZSTD_compressBlock_btlazy2() and ZSTD_reduceTable_internal() */
44 
45 
46 /*-*************************************
47 *  Context memory management
48 ***************************************/
49 typedef enum { ZSTDcs_created=0, ZSTDcs_init, ZSTDcs_ongoing, ZSTDcs_ending } ZSTD_compressionStage_e;
50 typedef enum { zcss_init=0, zcss_load, zcss_flush } ZSTD_cStreamStage;
51 
52 typedef struct ZSTD_prefixDict_s {
53     const void* dict;
54     size_t dictSize;
55     ZSTD_dictContentType_e dictContentType;
56 } ZSTD_prefixDict;
57 
58 typedef struct {
59     void* dictBuffer;
60     void const* dict;
61     size_t dictSize;
62     ZSTD_dictContentType_e dictContentType;
63     ZSTD_CDict* cdict;
64 } ZSTD_localDict;
65 
66 typedef struct {
67     U32 CTable[HUF_CTABLE_SIZE_U32(255)];
68     HUF_repeat repeatMode;
69 } ZSTD_hufCTables_t;
70 
71 typedef struct {
72     FSE_CTable offcodeCTable[FSE_CTABLE_SIZE_U32(OffFSELog, MaxOff)];
73     FSE_CTable matchlengthCTable[FSE_CTABLE_SIZE_U32(MLFSELog, MaxML)];
74     FSE_CTable litlengthCTable[FSE_CTABLE_SIZE_U32(LLFSELog, MaxLL)];
75     FSE_repeat offcode_repeatMode;
76     FSE_repeat matchlength_repeatMode;
77     FSE_repeat litlength_repeatMode;
78 } ZSTD_fseCTables_t;
79 
80 typedef struct {
81     ZSTD_hufCTables_t huf;
82     ZSTD_fseCTables_t fse;
83 } ZSTD_entropyCTables_t;
84 
85 typedef struct {
86     U32 off;
87     U32 len;
88 } ZSTD_match_t;
89 
90 typedef struct {
91     int price;
92     U32 off;
93     U32 mlen;
94     U32 litlen;
95     U32 rep[ZSTD_REP_NUM];
96 } ZSTD_optimal_t;
97 
98 typedef enum { zop_dynamic=0, zop_predef } ZSTD_OptPrice_e;
99 
100 typedef struct {
101     /* All tables are allocated inside cctx->workspace by ZSTD_resetCCtx_internal() */
102     unsigned* litFreq;           /* table of literals statistics, of size 256 */
103     unsigned* litLengthFreq;     /* table of litLength statistics, of size (MaxLL+1) */
104     unsigned* matchLengthFreq;   /* table of matchLength statistics, of size (MaxML+1) */
105     unsigned* offCodeFreq;       /* table of offCode statistics, of size (MaxOff+1) */
106     ZSTD_match_t* matchTable;    /* list of found matches, of size ZSTD_OPT_NUM+1 */
107     ZSTD_optimal_t* priceTable;  /* All positions tracked by optimal parser, of size ZSTD_OPT_NUM+1 */
108 
109     U32  litSum;                 /* nb of literals */
110     U32  litLengthSum;           /* nb of litLength codes */
111     U32  matchLengthSum;         /* nb of matchLength codes */
112     U32  offCodeSum;             /* nb of offset codes */
113     U32  litSumBasePrice;        /* to compare to log2(litfreq) */
114     U32  litLengthSumBasePrice;  /* to compare to log2(llfreq)  */
115     U32  matchLengthSumBasePrice;/* to compare to log2(mlfreq)  */
116     U32  offCodeSumBasePrice;    /* to compare to log2(offreq)  */
117     ZSTD_OptPrice_e priceType;   /* prices can be determined dynamically, or follow a pre-defined cost structure */
118     const ZSTD_entropyCTables_t* symbolCosts;  /* pre-calculated dictionary statistics */
119     ZSTD_literalCompressionMode_e literalCompressionMode;
120 } optState_t;
121 
122 typedef struct {
123   ZSTD_entropyCTables_t entropy;
124   U32 rep[ZSTD_REP_NUM];
125 } ZSTD_compressedBlockState_t;
126 
127 typedef struct {
128     BYTE const* nextSrc;    /* next block here to continue on current prefix */
129     BYTE const* base;       /* All regular indexes relative to this position */
130     BYTE const* dictBase;   /* extDict indexes relative to this position */
131     U32 dictLimit;          /* below that point, need extDict */
132     U32 lowLimit;           /* below that point, no more valid data */
133 } ZSTD_window_t;
134 
135 typedef struct ZSTD_matchState_t ZSTD_matchState_t;
136 struct ZSTD_matchState_t {
137     ZSTD_window_t window;   /* State for window round buffer management */
138     U32 loadedDictEnd;      /* index of end of dictionary, within context's referential.
139                              * When loadedDictEnd != 0, a dictionary is in use, and still valid.
140                              * This relies on a mechanism to set loadedDictEnd=0 when dictionary is no longer within distance.
141                              * Such mechanism is provided within ZSTD_window_enforceMaxDist() and ZSTD_checkDictValidity().
142                              * When dict referential is copied into active context (i.e. not attached),
143                              * loadedDictEnd == dictSize, since referential starts from zero.
144                              */
145     U32 nextToUpdate;       /* index from which to continue table update */
146     U32 hashLog3;           /* dispatch table for matches of len==3 : larger == faster, more memory */
147     U32* hashTable;
148     U32* hashTable3;
149     U32* chainTable;
150     optState_t opt;         /* optimal parser state */
151     const ZSTD_matchState_t* dictMatchState;
152     ZSTD_compressionParameters cParams;
153 };
154 
155 typedef struct {
156     ZSTD_compressedBlockState_t* prevCBlock;
157     ZSTD_compressedBlockState_t* nextCBlock;
158     ZSTD_matchState_t matchState;
159 } ZSTD_blockState_t;
160 
161 typedef struct {
162     U32 offset;
163     U32 checksum;
164 } ldmEntry_t;
165 
166 typedef struct {
167     ZSTD_window_t window;   /* State for the window round buffer management */
168     ldmEntry_t* hashTable;
169     U32 loadedDictEnd;
170     BYTE* bucketOffsets;    /* Next position in bucket to insert entry */
171     U64 hashPower;          /* Used to compute the rolling hash.
172                              * Depends on ldmParams.minMatchLength */
173 } ldmState_t;
174 
175 typedef struct {
176     U32 enableLdm;          /* 1 if enable long distance matching */
177     U32 hashLog;            /* Log size of hashTable */
178     U32 bucketSizeLog;      /* Log bucket size for collision resolution, at most 8 */
179     U32 minMatchLength;     /* Minimum match length */
180     U32 hashRateLog;       /* Log number of entries to skip */
181     U32 windowLog;          /* Window log for the LDM */
182 } ldmParams_t;
183 
184 typedef struct {
185     U32 offset;
186     U32 litLength;
187     U32 matchLength;
188 } rawSeq;
189 
190 typedef struct {
191   rawSeq* seq;     /* The start of the sequences */
192   size_t pos;      /* The position where reading stopped. <= size. */
193   size_t size;     /* The number of sequences. <= capacity. */
194   size_t capacity; /* The capacity starting from `seq` pointer */
195 } rawSeqStore_t;
196 
197 typedef struct {
198     int collectSequences;
199     ZSTD_Sequence* seqStart;
200     size_t seqIndex;
201     size_t maxSequences;
202 } SeqCollector;
203 
204 struct ZSTD_CCtx_params_s {
205     ZSTD_format_e format;
206     ZSTD_compressionParameters cParams;
207     ZSTD_frameParameters fParams;
208 
209     int compressionLevel;
210     int forceWindow;           /* force back-references to respect limit of
211                                 * 1<<wLog, even for dictionary */
212     size_t targetCBlockSize;   /* Tries to fit compressed block size to be around targetCBlockSize.
213                                 * No target when targetCBlockSize == 0.
214                                 * There is no guarantee on compressed block size */
215     int srcSizeHint;           /* User's best guess of source size.
216                                 * Hint is not valid when srcSizeHint == 0.
217                                 * There is no guarantee that hint is close to actual source size */
218 
219     ZSTD_dictAttachPref_e attachDictPref;
220     ZSTD_literalCompressionMode_e literalCompressionMode;
221 
222     /* Multithreading: used to pass parameters to mtctx */
223     int nbWorkers;
224     size_t jobSize;
225     int overlapLog;
226     int rsyncable;
227 
228     /* Long distance matching parameters */
229     ldmParams_t ldmParams;
230 
231     /* Internal use, for createCCtxParams() and freeCCtxParams() only */
232     ZSTD_customMem customMem;
233 };  /* typedef'd to ZSTD_CCtx_params within "zstd.h" */
234 
235 struct ZSTD_CCtx_s {
236     ZSTD_compressionStage_e stage;
237     int cParamsChanged;                  /* == 1 if cParams(except wlog) or compression level are changed in requestedParams. Triggers transmission of new params to ZSTDMT (if available) then reset to 0. */
238     int bmi2;                            /* == 1 if the CPU supports BMI2 and 0 otherwise. CPU support is determined dynamically once per context lifetime. */
239     ZSTD_CCtx_params requestedParams;
240     ZSTD_CCtx_params appliedParams;
241     U32   dictID;
242 
243     ZSTD_cwksp workspace; /* manages buffer for dynamic allocations */
244     size_t blockSize;
245     unsigned long long pledgedSrcSizePlusOne;  /* this way, 0 (default) == unknown */
246     unsigned long long consumedSrcSize;
247     unsigned long long producedCSize;
248     XXH64_state_t xxhState;
249     ZSTD_customMem customMem;
250     size_t staticSize;
251     SeqCollector seqCollector;
252     int isFirstBlock;
253     int initialized;
254 
255     seqStore_t seqStore;      /* sequences storage ptrs */
256     ldmState_t ldmState;      /* long distance matching state */
257     rawSeq* ldmSequences;     /* Storage for the ldm output sequences */
258     size_t maxNbLdmSequences;
259     rawSeqStore_t externSeqStore; /* Mutable reference to external sequences */
260     ZSTD_blockState_t blockState;
261     U32* entropyWorkspace;  /* entropy workspace of HUF_WORKSPACE_SIZE bytes */
262 
263     /* streaming */
264     char*  inBuff;
265     size_t inBuffSize;
266     size_t inToCompress;
267     size_t inBuffPos;
268     size_t inBuffTarget;
269     char*  outBuff;
270     size_t outBuffSize;
271     size_t outBuffContentSize;
272     size_t outBuffFlushedSize;
273     ZSTD_cStreamStage streamStage;
274     U32    frameEnded;
275 
276     /* Dictionary */
277     ZSTD_localDict localDict;
278     const ZSTD_CDict* cdict;
279     ZSTD_prefixDict prefixDict;   /* single-usage dictionary */
280 
281     /* Multi-threading */
282 #ifdef ZSTD_MULTITHREAD
283     ZSTDMT_CCtx* mtctx;
284 #endif
285 };
286 
287 typedef enum { ZSTD_dtlm_fast, ZSTD_dtlm_full } ZSTD_dictTableLoadMethod_e;
288 
289 typedef enum { ZSTD_noDict = 0, ZSTD_extDict = 1, ZSTD_dictMatchState = 2 } ZSTD_dictMode_e;
290 
291 
292 typedef size_t (*ZSTD_blockCompressor) (
293         ZSTD_matchState_t* bs, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM],
294         void const* src, size_t srcSize);
295 ZSTD_blockCompressor ZSTD_selectBlockCompressor(ZSTD_strategy strat, ZSTD_dictMode_e dictMode);
296 
297 
298 MEM_STATIC U32 ZSTD_LLcode(U32 litLength)
299 {
300     static const BYTE LL_Code[64] = {  0,  1,  2,  3,  4,  5,  6,  7,
301                                        8,  9, 10, 11, 12, 13, 14, 15,
302                                       16, 16, 17, 17, 18, 18, 19, 19,
303                                       20, 20, 20, 20, 21, 21, 21, 21,
304                                       22, 22, 22, 22, 22, 22, 22, 22,
305                                       23, 23, 23, 23, 23, 23, 23, 23,
306                                       24, 24, 24, 24, 24, 24, 24, 24,
307                                       24, 24, 24, 24, 24, 24, 24, 24 };
308     static const U32 LL_deltaCode = 19;
309     return (litLength > 63) ? ZSTD_highbit32(litLength) + LL_deltaCode : LL_Code[litLength];
310 }
311 
312 /* ZSTD_MLcode() :
313  * note : mlBase = matchLength - MINMATCH;
314  *        because it's the format it's stored in seqStore->sequences */
315 MEM_STATIC U32 ZSTD_MLcode(U32 mlBase)
316 {
317     static const BYTE ML_Code[128] = { 0,  1,  2,  3,  4,  5,  6,  7,  8,  9, 10, 11, 12, 13, 14, 15,
318                                       16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31,
319                                       32, 32, 33, 33, 34, 34, 35, 35, 36, 36, 36, 36, 37, 37, 37, 37,
320                                       38, 38, 38, 38, 38, 38, 38, 38, 39, 39, 39, 39, 39, 39, 39, 39,
321                                       40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40,
322                                       41, 41, 41, 41, 41, 41, 41, 41, 41, 41, 41, 41, 41, 41, 41, 41,
323                                       42, 42, 42, 42, 42, 42, 42, 42, 42, 42, 42, 42, 42, 42, 42, 42,
324                                       42, 42, 42, 42, 42, 42, 42, 42, 42, 42, 42, 42, 42, 42, 42, 42 };
325     static const U32 ML_deltaCode = 36;
326     return (mlBase > 127) ? ZSTD_highbit32(mlBase) + ML_deltaCode : ML_Code[mlBase];
327 }
328 
329 typedef struct repcodes_s {
330     U32 rep[3];
331 } repcodes_t;
332 
333 MEM_STATIC repcodes_t ZSTD_updateRep(U32 const rep[3], U32 const offset, U32 const ll0)
334 {
335     repcodes_t newReps;
336     if (offset >= ZSTD_REP_NUM) {  /* full offset */
337         newReps.rep[2] = rep[1];
338         newReps.rep[1] = rep[0];
339         newReps.rep[0] = offset - ZSTD_REP_MOVE;
340     } else {   /* repcode */
341         U32 const repCode = offset + ll0;
342         if (repCode > 0) {  /* note : if repCode==0, no change */
343             U32 const currentOffset = (repCode==ZSTD_REP_NUM) ? (rep[0] - 1) : rep[repCode];
344             newReps.rep[2] = (repCode >= 2) ? rep[1] : rep[2];
345             newReps.rep[1] = rep[0];
346             newReps.rep[0] = currentOffset;
347         } else {   /* repCode == 0 */
348             memcpy(&newReps, rep, sizeof(newReps));
349         }
350     }
351     return newReps;
352 }
353 
354 /* ZSTD_cParam_withinBounds:
355  * @return 1 if value is within cParam bounds,
356  * 0 otherwise */
357 MEM_STATIC int ZSTD_cParam_withinBounds(ZSTD_cParameter cParam, int value)
358 {
359     ZSTD_bounds const bounds = ZSTD_cParam_getBounds(cParam);
360     if (ZSTD_isError(bounds.error)) return 0;
361     if (value < bounds.lowerBound) return 0;
362     if (value > bounds.upperBound) return 0;
363     return 1;
364 }
365 
366 /* ZSTD_noCompressBlock() :
367  * Writes uncompressed block to dst buffer from given src.
368  * Returns the size of the block */
369 MEM_STATIC size_t ZSTD_noCompressBlock (void* dst, size_t dstCapacity, const void* src, size_t srcSize, U32 lastBlock)
370 {
371     U32 const cBlockHeader24 = lastBlock + (((U32)bt_raw)<<1) + (U32)(srcSize << 3);
372     RETURN_ERROR_IF(srcSize + ZSTD_blockHeaderSize > dstCapacity,
373                     dstSize_tooSmall, "dst buf too small for uncompressed block");
374     MEM_writeLE24(dst, cBlockHeader24);
375     memcpy((BYTE*)dst + ZSTD_blockHeaderSize, src, srcSize);
376     return ZSTD_blockHeaderSize + srcSize;
377 }
378 
379 MEM_STATIC size_t ZSTD_rleCompressBlock (void* dst, size_t dstCapacity, BYTE src, size_t srcSize, U32 lastBlock)
380 {
381     BYTE* const op = (BYTE*)dst;
382     U32 const cBlockHeader = lastBlock + (((U32)bt_rle)<<1) + (U32)(srcSize << 3);
383     RETURN_ERROR_IF(dstCapacity < 4, dstSize_tooSmall, "");
384     MEM_writeLE24(op, cBlockHeader);
385     op[3] = src;
386     return 4;
387 }
388 
389 
390 /* ZSTD_minGain() :
391  * minimum compression required
392  * to generate a compress block or a compressed literals section.
393  * note : use same formula for both situations */
394 MEM_STATIC size_t ZSTD_minGain(size_t srcSize, ZSTD_strategy strat)
395 {
396     U32 const minlog = (strat>=ZSTD_btultra) ? (U32)(strat) - 1 : 6;
397     ZSTD_STATIC_ASSERT(ZSTD_btultra == 8);
398     assert(ZSTD_cParam_withinBounds(ZSTD_c_strategy, strat));
399     return (srcSize >> minlog) + 2;
400 }
401 
402 MEM_STATIC int ZSTD_disableLiteralsCompression(const ZSTD_CCtx_params* cctxParams)
403 {
404     switch (cctxParams->literalCompressionMode) {
405     case ZSTD_lcm_huffman:
406         return 0;
407     case ZSTD_lcm_uncompressed:
408         return 1;
409     default:
410         assert(0 /* impossible: pre-validated */);
411         /* fall-through */
412     case ZSTD_lcm_auto:
413         return (cctxParams->cParams.strategy == ZSTD_fast) && (cctxParams->cParams.targetLength > 0);
414     }
415 }
416 
417 /*! ZSTD_safecopyLiterals() :
418  *  memcpy() function that won't read beyond more than WILDCOPY_OVERLENGTH bytes past ilimit_w.
419  *  Only called when the sequence ends past ilimit_w, so it only needs to be optimized for single
420  *  large copies.
421  */
422 static void ZSTD_safecopyLiterals(BYTE* op, BYTE const* ip, BYTE const* const iend, BYTE const* ilimit_w) {
423     assert(iend > ilimit_w);
424     if (ip <= ilimit_w) {
425         ZSTD_wildcopy(op, ip, ilimit_w - ip, ZSTD_no_overlap);
426         op += ilimit_w - ip;
427         ip = ilimit_w;
428     }
429     while (ip < iend) *op++ = *ip++;
430 }
431 
432 /*! ZSTD_storeSeq() :
433  *  Store a sequence (litlen, litPtr, offCode and mlBase) into seqStore_t.
434  *  `offCode` : distance to match + ZSTD_REP_MOVE (values <= ZSTD_REP_MOVE are repCodes).
435  *  `mlBase` : matchLength - MINMATCH
436  *  Allowed to overread literals up to litLimit.
437 */
438 HINT_INLINE UNUSED_ATTR
439 void ZSTD_storeSeq(seqStore_t* seqStorePtr, size_t litLength, const BYTE* literals, const BYTE* litLimit, U32 offCode, size_t mlBase)
440 {
441     BYTE const* const litLimit_w = litLimit - WILDCOPY_OVERLENGTH;
442     BYTE const* const litEnd = literals + litLength;
443 #if defined(DEBUGLEVEL) && (DEBUGLEVEL >= 6)
444     static const BYTE* g_start = NULL;
445     if (g_start==NULL) g_start = (const BYTE*)literals;  /* note : index only works for compression within a single segment */
446     {   U32 const pos = (U32)((const BYTE*)literals - g_start);
447         DEBUGLOG(6, "Cpos%7u :%3u literals, match%4u bytes at offCode%7u",
448                pos, (U32)litLength, (U32)mlBase+MINMATCH, (U32)offCode);
449     }
450 #endif
451     assert((size_t)(seqStorePtr->sequences - seqStorePtr->sequencesStart) < seqStorePtr->maxNbSeq);
452     /* copy Literals */
453     assert(seqStorePtr->maxNbLit <= 128 KB);
454     assert(seqStorePtr->lit + litLength <= seqStorePtr->litStart + seqStorePtr->maxNbLit);
455     assert(literals + litLength <= litLimit);
456     if (litEnd <= litLimit_w) {
457         /* Common case we can use wildcopy.
458 	 * First copy 16 bytes, because literals are likely short.
459 	 */
460         assert(WILDCOPY_OVERLENGTH >= 16);
461         ZSTD_copy16(seqStorePtr->lit, literals);
462         if (litLength > 16) {
463             ZSTD_wildcopy(seqStorePtr->lit+16, literals+16, (ptrdiff_t)litLength-16, ZSTD_no_overlap);
464         }
465     } else {
466         ZSTD_safecopyLiterals(seqStorePtr->lit, literals, litEnd, litLimit_w);
467     }
468     seqStorePtr->lit += litLength;
469 
470     /* literal Length */
471     if (litLength>0xFFFF) {
472         assert(seqStorePtr->longLengthID == 0); /* there can only be a single long length */
473         seqStorePtr->longLengthID = 1;
474         seqStorePtr->longLengthPos = (U32)(seqStorePtr->sequences - seqStorePtr->sequencesStart);
475     }
476     seqStorePtr->sequences[0].litLength = (U16)litLength;
477 
478     /* match offset */
479     seqStorePtr->sequences[0].offset = offCode + 1;
480 
481     /* match Length */
482     if (mlBase>0xFFFF) {
483         assert(seqStorePtr->longLengthID == 0); /* there can only be a single long length */
484         seqStorePtr->longLengthID = 2;
485         seqStorePtr->longLengthPos = (U32)(seqStorePtr->sequences - seqStorePtr->sequencesStart);
486     }
487     seqStorePtr->sequences[0].matchLength = (U16)mlBase;
488 
489     seqStorePtr->sequences++;
490 }
491 
492 
493 /*-*************************************
494 *  Match length counter
495 ***************************************/
496 static unsigned ZSTD_NbCommonBytes (size_t val)
497 {
498     if (MEM_isLittleEndian()) {
499         if (MEM_64bits()) {
500 #       if defined(_MSC_VER) && defined(_WIN64)
501             unsigned long r = 0;
502             return _BitScanForward64( &r, (U64)val ) ? (unsigned)(r >> 3) : 0;
503 #       elif defined(__GNUC__) && (__GNUC__ >= 4)
504             return (__builtin_ctzll((U64)val) >> 3);
505 #       else
506             static const int DeBruijnBytePos[64] = { 0, 0, 0, 0, 0, 1, 1, 2,
507                                                      0, 3, 1, 3, 1, 4, 2, 7,
508                                                      0, 2, 3, 6, 1, 5, 3, 5,
509                                                      1, 3, 4, 4, 2, 5, 6, 7,
510                                                      7, 0, 1, 2, 3, 3, 4, 6,
511                                                      2, 6, 5, 5, 3, 4, 5, 6,
512                                                      7, 1, 2, 4, 6, 4, 4, 5,
513                                                      7, 2, 6, 5, 7, 6, 7, 7 };
514             return DeBruijnBytePos[((U64)((val & -(long long)val) * 0x0218A392CDABBD3FULL)) >> 58];
515 #       endif
516         } else { /* 32 bits */
517 #       if defined(_MSC_VER)
518             unsigned long r=0;
519             return _BitScanForward( &r, (U32)val ) ? (unsigned)(r >> 3) : 0;
520 #       elif defined(__GNUC__) && (__GNUC__ >= 3)
521             return (__builtin_ctz((U32)val) >> 3);
522 #       else
523             static const int DeBruijnBytePos[32] = { 0, 0, 3, 0, 3, 1, 3, 0,
524                                                      3, 2, 2, 1, 3, 2, 0, 1,
525                                                      3, 3, 1, 2, 2, 2, 2, 0,
526                                                      3, 1, 2, 0, 1, 0, 1, 1 };
527             return DeBruijnBytePos[((U32)((val & -(S32)val) * 0x077CB531U)) >> 27];
528 #       endif
529         }
530     } else {  /* Big Endian CPU */
531         if (MEM_64bits()) {
532 #       if defined(_MSC_VER) && defined(_WIN64)
533             unsigned long r = 0;
534             return _BitScanReverse64( &r, val ) ? (unsigned)(r >> 3) : 0;
535 #       elif defined(__GNUC__) && (__GNUC__ >= 4)
536             return (__builtin_clzll(val) >> 3);
537 #       else
538             unsigned r;
539             const unsigned n32 = sizeof(size_t)*4;   /* calculate this way due to compiler complaining in 32-bits mode */
540             if (!(val>>n32)) { r=4; } else { r=0; val>>=n32; }
541             if (!(val>>16)) { r+=2; val>>=8; } else { val>>=24; }
542             r += (!val);
543             return r;
544 #       endif
545         } else { /* 32 bits */
546 #       if defined(_MSC_VER)
547             unsigned long r = 0;
548             return _BitScanReverse( &r, (unsigned long)val ) ? (unsigned)(r >> 3) : 0;
549 #       elif defined(__GNUC__) && (__GNUC__ >= 3)
550             return (__builtin_clz((U32)val) >> 3);
551 #       else
552             unsigned r;
553             if (!(val>>16)) { r=2; val>>=8; } else { r=0; val>>=24; }
554             r += (!val);
555             return r;
556 #       endif
557     }   }
558 }
559 
560 
561 MEM_STATIC size_t ZSTD_count(const BYTE* pIn, const BYTE* pMatch, const BYTE* const pInLimit)
562 {
563     const BYTE* const pStart = pIn;
564     const BYTE* const pInLoopLimit = pInLimit - (sizeof(size_t)-1);
565 
566     if (pIn < pInLoopLimit) {
567         { size_t const diff = MEM_readST(pMatch) ^ MEM_readST(pIn);
568           if (diff) return ZSTD_NbCommonBytes(diff); }
569         pIn+=sizeof(size_t); pMatch+=sizeof(size_t);
570         while (pIn < pInLoopLimit) {
571             size_t const diff = MEM_readST(pMatch) ^ MEM_readST(pIn);
572             if (!diff) { pIn+=sizeof(size_t); pMatch+=sizeof(size_t); continue; }
573             pIn += ZSTD_NbCommonBytes(diff);
574             return (size_t)(pIn - pStart);
575     }   }
576     if (MEM_64bits() && (pIn<(pInLimit-3)) && (MEM_read32(pMatch) == MEM_read32(pIn))) { pIn+=4; pMatch+=4; }
577     if ((pIn<(pInLimit-1)) && (MEM_read16(pMatch) == MEM_read16(pIn))) { pIn+=2; pMatch+=2; }
578     if ((pIn<pInLimit) && (*pMatch == *pIn)) pIn++;
579     return (size_t)(pIn - pStart);
580 }
581 
582 /** ZSTD_count_2segments() :
583  *  can count match length with `ip` & `match` in 2 different segments.
584  *  convention : on reaching mEnd, match count continue starting from iStart
585  */
586 MEM_STATIC size_t
587 ZSTD_count_2segments(const BYTE* ip, const BYTE* match,
588                      const BYTE* iEnd, const BYTE* mEnd, const BYTE* iStart)
589 {
590     const BYTE* const vEnd = MIN( ip + (mEnd - match), iEnd);
591     size_t const matchLength = ZSTD_count(ip, match, vEnd);
592     if (match + matchLength != mEnd) return matchLength;
593     DEBUGLOG(7, "ZSTD_count_2segments: found a 2-parts match (current length==%zu)", matchLength);
594     DEBUGLOG(7, "distance from match beginning to end dictionary = %zi", mEnd - match);
595     DEBUGLOG(7, "distance from current pos to end buffer = %zi", iEnd - ip);
596     DEBUGLOG(7, "next byte : ip==%02X, istart==%02X", ip[matchLength], *iStart);
597     DEBUGLOG(7, "final match length = %zu", matchLength + ZSTD_count(ip+matchLength, iStart, iEnd));
598     return matchLength + ZSTD_count(ip+matchLength, iStart, iEnd);
599 }
600 
601 
602 /*-*************************************
603  *  Hashes
604  ***************************************/
605 static const U32 prime3bytes = 506832829U;
606 static U32    ZSTD_hash3(U32 u, U32 h) { return ((u << (32-24)) * prime3bytes)  >> (32-h) ; }
607 MEM_STATIC size_t ZSTD_hash3Ptr(const void* ptr, U32 h) { return ZSTD_hash3(MEM_readLE32(ptr), h); } /* only in zstd_opt.h */
608 
609 static const U32 prime4bytes = 2654435761U;
610 static U32    ZSTD_hash4(U32 u, U32 h) { return (u * prime4bytes) >> (32-h) ; }
611 static size_t ZSTD_hash4Ptr(const void* ptr, U32 h) { return ZSTD_hash4(MEM_read32(ptr), h); }
612 
613 static const U64 prime5bytes = 889523592379ULL;
614 static size_t ZSTD_hash5(U64 u, U32 h) { return (size_t)(((u  << (64-40)) * prime5bytes) >> (64-h)) ; }
615 static size_t ZSTD_hash5Ptr(const void* p, U32 h) { return ZSTD_hash5(MEM_readLE64(p), h); }
616 
617 static const U64 prime6bytes = 227718039650203ULL;
618 static size_t ZSTD_hash6(U64 u, U32 h) { return (size_t)(((u  << (64-48)) * prime6bytes) >> (64-h)) ; }
619 static size_t ZSTD_hash6Ptr(const void* p, U32 h) { return ZSTD_hash6(MEM_readLE64(p), h); }
620 
621 static const U64 prime7bytes = 58295818150454627ULL;
622 static size_t ZSTD_hash7(U64 u, U32 h) { return (size_t)(((u  << (64-56)) * prime7bytes) >> (64-h)) ; }
623 static size_t ZSTD_hash7Ptr(const void* p, U32 h) { return ZSTD_hash7(MEM_readLE64(p), h); }
624 
625 static const U64 prime8bytes = 0xCF1BBCDCB7A56463ULL;
626 static size_t ZSTD_hash8(U64 u, U32 h) { return (size_t)(((u) * prime8bytes) >> (64-h)) ; }
627 static size_t ZSTD_hash8Ptr(const void* p, U32 h) { return ZSTD_hash8(MEM_readLE64(p), h); }
628 
629 MEM_STATIC size_t ZSTD_hashPtr(const void* p, U32 hBits, U32 mls)
630 {
631     switch(mls)
632     {
633     default:
634     case 4: return ZSTD_hash4Ptr(p, hBits);
635     case 5: return ZSTD_hash5Ptr(p, hBits);
636     case 6: return ZSTD_hash6Ptr(p, hBits);
637     case 7: return ZSTD_hash7Ptr(p, hBits);
638     case 8: return ZSTD_hash8Ptr(p, hBits);
639     }
640 }
641 
642 /** ZSTD_ipow() :
643  * Return base^exponent.
644  */
645 static U64 ZSTD_ipow(U64 base, U64 exponent)
646 {
647     U64 power = 1;
648     while (exponent) {
649       if (exponent & 1) power *= base;
650       exponent >>= 1;
651       base *= base;
652     }
653     return power;
654 }
655 
656 #define ZSTD_ROLL_HASH_CHAR_OFFSET 10
657 
658 /** ZSTD_rollingHash_append() :
659  * Add the buffer to the hash value.
660  */
661 static U64 ZSTD_rollingHash_append(U64 hash, void const* buf, size_t size)
662 {
663     BYTE const* istart = (BYTE const*)buf;
664     size_t pos;
665     for (pos = 0; pos < size; ++pos) {
666         hash *= prime8bytes;
667         hash += istart[pos] + ZSTD_ROLL_HASH_CHAR_OFFSET;
668     }
669     return hash;
670 }
671 
672 /** ZSTD_rollingHash_compute() :
673  * Compute the rolling hash value of the buffer.
674  */
675 MEM_STATIC U64 ZSTD_rollingHash_compute(void const* buf, size_t size)
676 {
677     return ZSTD_rollingHash_append(0, buf, size);
678 }
679 
680 /** ZSTD_rollingHash_primePower() :
681  * Compute the primePower to be passed to ZSTD_rollingHash_rotate() for a hash
682  * over a window of length bytes.
683  */
684 MEM_STATIC U64 ZSTD_rollingHash_primePower(U32 length)
685 {
686     return ZSTD_ipow(prime8bytes, length - 1);
687 }
688 
689 /** ZSTD_rollingHash_rotate() :
690  * Rotate the rolling hash by one byte.
691  */
692 MEM_STATIC U64 ZSTD_rollingHash_rotate(U64 hash, BYTE toRemove, BYTE toAdd, U64 primePower)
693 {
694     hash -= (toRemove + ZSTD_ROLL_HASH_CHAR_OFFSET) * primePower;
695     hash *= prime8bytes;
696     hash += toAdd + ZSTD_ROLL_HASH_CHAR_OFFSET;
697     return hash;
698 }
699 
700 /*-*************************************
701 *  Round buffer management
702 ***************************************/
703 #if (ZSTD_WINDOWLOG_MAX_64 > 31)
704 # error "ZSTD_WINDOWLOG_MAX is too large : would overflow ZSTD_CURRENT_MAX"
705 #endif
706 /* Max current allowed */
707 #define ZSTD_CURRENT_MAX ((3U << 29) + (1U << ZSTD_WINDOWLOG_MAX))
708 /* Maximum chunk size before overflow correction needs to be called again */
709 #define ZSTD_CHUNKSIZE_MAX                                                     \
710     ( ((U32)-1)                  /* Maximum ending current index */            \
711     - ZSTD_CURRENT_MAX)          /* Maximum beginning lowLimit */
712 
713 /**
714  * ZSTD_window_clear():
715  * Clears the window containing the history by simply setting it to empty.
716  */
717 MEM_STATIC void ZSTD_window_clear(ZSTD_window_t* window)
718 {
719     size_t const endT = (size_t)(window->nextSrc - window->base);
720     U32 const end = (U32)endT;
721 
722     window->lowLimit = end;
723     window->dictLimit = end;
724 }
725 
726 /**
727  * ZSTD_window_hasExtDict():
728  * Returns non-zero if the window has a non-empty extDict.
729  */
730 MEM_STATIC U32 ZSTD_window_hasExtDict(ZSTD_window_t const window)
731 {
732     return window.lowLimit < window.dictLimit;
733 }
734 
735 /**
736  * ZSTD_matchState_dictMode():
737  * Inspects the provided matchState and figures out what dictMode should be
738  * passed to the compressor.
739  */
740 MEM_STATIC ZSTD_dictMode_e ZSTD_matchState_dictMode(const ZSTD_matchState_t *ms)
741 {
742     return ZSTD_window_hasExtDict(ms->window) ?
743         ZSTD_extDict :
744         ms->dictMatchState != NULL ?
745             ZSTD_dictMatchState :
746             ZSTD_noDict;
747 }
748 
749 /**
750  * ZSTD_window_needOverflowCorrection():
751  * Returns non-zero if the indices are getting too large and need overflow
752  * protection.
753  */
754 MEM_STATIC U32 ZSTD_window_needOverflowCorrection(ZSTD_window_t const window,
755                                                   void const* srcEnd)
756 {
757     U32 const current = (U32)((BYTE const*)srcEnd - window.base);
758     return current > ZSTD_CURRENT_MAX;
759 }
760 
761 /**
762  * ZSTD_window_correctOverflow():
763  * Reduces the indices to protect from index overflow.
764  * Returns the correction made to the indices, which must be applied to every
765  * stored index.
766  *
767  * The least significant cycleLog bits of the indices must remain the same,
768  * which may be 0. Every index up to maxDist in the past must be valid.
769  * NOTE: (maxDist & cycleMask) must be zero.
770  */
771 MEM_STATIC U32 ZSTD_window_correctOverflow(ZSTD_window_t* window, U32 cycleLog,
772                                            U32 maxDist, void const* src)
773 {
774     /* preemptive overflow correction:
775      * 1. correction is large enough:
776      *    lowLimit > (3<<29) ==> current > 3<<29 + 1<<windowLog
777      *    1<<windowLog <= newCurrent < 1<<chainLog + 1<<windowLog
778      *
779      *    current - newCurrent
780      *    > (3<<29 + 1<<windowLog) - (1<<windowLog + 1<<chainLog)
781      *    > (3<<29) - (1<<chainLog)
782      *    > (3<<29) - (1<<30)             (NOTE: chainLog <= 30)
783      *    > 1<<29
784      *
785      * 2. (ip+ZSTD_CHUNKSIZE_MAX - cctx->base) doesn't overflow:
786      *    After correction, current is less than (1<<chainLog + 1<<windowLog).
787      *    In 64-bit mode we are safe, because we have 64-bit ptrdiff_t.
788      *    In 32-bit mode we are safe, because (chainLog <= 29), so
789      *    ip+ZSTD_CHUNKSIZE_MAX - cctx->base < 1<<32.
790      * 3. (cctx->lowLimit + 1<<windowLog) < 1<<32:
791      *    windowLog <= 31 ==> 3<<29 + 1<<windowLog < 7<<29 < 1<<32.
792      */
793     U32 const cycleMask = (1U << cycleLog) - 1;
794     U32 const current = (U32)((BYTE const*)src - window->base);
795     U32 const currentCycle0 = current & cycleMask;
796     /* Exclude zero so that newCurrent - maxDist >= 1. */
797     U32 const currentCycle1 = currentCycle0 == 0 ? (1U << cycleLog) : currentCycle0;
798     U32 const newCurrent = currentCycle1 + maxDist;
799     U32 const correction = current - newCurrent;
800     assert((maxDist & cycleMask) == 0);
801     assert(current > newCurrent);
802     /* Loose bound, should be around 1<<29 (see above) */
803     assert(correction > 1<<28);
804 
805     window->base += correction;
806     window->dictBase += correction;
807     if (window->lowLimit <= correction) window->lowLimit = 1;
808     else window->lowLimit -= correction;
809     if (window->dictLimit <= correction) window->dictLimit = 1;
810     else window->dictLimit -= correction;
811 
812     /* Ensure we can still reference the full window. */
813     assert(newCurrent >= maxDist);
814     assert(newCurrent - maxDist >= 1);
815     /* Ensure that lowLimit and dictLimit didn't underflow. */
816     assert(window->lowLimit <= newCurrent);
817     assert(window->dictLimit <= newCurrent);
818 
819     DEBUGLOG(4, "Correction of 0x%x bytes to lowLimit=0x%x", correction,
820              window->lowLimit);
821     return correction;
822 }
823 
824 /**
825  * ZSTD_window_enforceMaxDist():
826  * Updates lowLimit so that:
827  *    (srcEnd - base) - lowLimit == maxDist + loadedDictEnd
828  *
829  * It ensures index is valid as long as index >= lowLimit.
830  * This must be called before a block compression call.
831  *
832  * loadedDictEnd is only defined if a dictionary is in use for current compression.
833  * As the name implies, loadedDictEnd represents the index at end of dictionary.
834  * The value lies within context's referential, it can be directly compared to blockEndIdx.
835  *
836  * If loadedDictEndPtr is NULL, no dictionary is in use, and we use loadedDictEnd == 0.
837  * If loadedDictEndPtr is not NULL, we set it to zero after updating lowLimit.
838  * This is because dictionaries are allowed to be referenced fully
839  * as long as the last byte of the dictionary is in the window.
840  * Once input has progressed beyond window size, dictionary cannot be referenced anymore.
841  *
842  * In normal dict mode, the dictionary lies between lowLimit and dictLimit.
843  * In dictMatchState mode, lowLimit and dictLimit are the same,
844  * and the dictionary is below them.
845  * forceWindow and dictMatchState are therefore incompatible.
846  */
847 MEM_STATIC void
848 ZSTD_window_enforceMaxDist(ZSTD_window_t* window,
849                      const void* blockEnd,
850                            U32   maxDist,
851                            U32*  loadedDictEndPtr,
852                      const ZSTD_matchState_t** dictMatchStatePtr)
853 {
854     U32 const blockEndIdx = (U32)((BYTE const*)blockEnd - window->base);
855     U32 const loadedDictEnd = (loadedDictEndPtr != NULL) ? *loadedDictEndPtr : 0;
856     DEBUGLOG(5, "ZSTD_window_enforceMaxDist: blockEndIdx=%u, maxDist=%u, loadedDictEnd=%u",
857                 (unsigned)blockEndIdx, (unsigned)maxDist, (unsigned)loadedDictEnd);
858 
859     /* - When there is no dictionary : loadedDictEnd == 0.
860          In which case, the test (blockEndIdx > maxDist) is merely to avoid
861          overflowing next operation `newLowLimit = blockEndIdx - maxDist`.
862        - When there is a standard dictionary :
863          Index referential is copied from the dictionary,
864          which means it starts from 0.
865          In which case, loadedDictEnd == dictSize,
866          and it makes sense to compare `blockEndIdx > maxDist + dictSize`
867          since `blockEndIdx` also starts from zero.
868        - When there is an attached dictionary :
869          loadedDictEnd is expressed within the referential of the context,
870          so it can be directly compared against blockEndIdx.
871     */
872     if (blockEndIdx > maxDist + loadedDictEnd) {
873         U32 const newLowLimit = blockEndIdx - maxDist;
874         if (window->lowLimit < newLowLimit) window->lowLimit = newLowLimit;
875         if (window->dictLimit < window->lowLimit) {
876             DEBUGLOG(5, "Update dictLimit to match lowLimit, from %u to %u",
877                         (unsigned)window->dictLimit, (unsigned)window->lowLimit);
878             window->dictLimit = window->lowLimit;
879         }
880         /* On reaching window size, dictionaries are invalidated */
881         if (loadedDictEndPtr) *loadedDictEndPtr = 0;
882         if (dictMatchStatePtr) *dictMatchStatePtr = NULL;
883     }
884 }
885 
886 /* Similar to ZSTD_window_enforceMaxDist(),
887  * but only invalidates dictionary
888  * when input progresses beyond window size.
889  * assumption : loadedDictEndPtr and dictMatchStatePtr are valid (non NULL)
890  *              loadedDictEnd uses same referential as window->base
891  *              maxDist is the window size */
892 MEM_STATIC void
893 ZSTD_checkDictValidity(const ZSTD_window_t* window,
894                        const void* blockEnd,
895                              U32   maxDist,
896                              U32*  loadedDictEndPtr,
897                        const ZSTD_matchState_t** dictMatchStatePtr)
898 {
899     assert(loadedDictEndPtr != NULL);
900     assert(dictMatchStatePtr != NULL);
901     {   U32 const blockEndIdx = (U32)((BYTE const*)blockEnd - window->base);
902         U32 const loadedDictEnd = *loadedDictEndPtr;
903         DEBUGLOG(5, "ZSTD_checkDictValidity: blockEndIdx=%u, maxDist=%u, loadedDictEnd=%u",
904                     (unsigned)blockEndIdx, (unsigned)maxDist, (unsigned)loadedDictEnd);
905         assert(blockEndIdx >= loadedDictEnd);
906 
907         if (blockEndIdx > loadedDictEnd + maxDist) {
908             /* On reaching window size, dictionaries are invalidated.
909              * For simplification, if window size is reached anywhere within next block,
910              * the dictionary is invalidated for the full block.
911              */
912             DEBUGLOG(6, "invalidating dictionary for current block (distance > windowSize)");
913             *loadedDictEndPtr = 0;
914             *dictMatchStatePtr = NULL;
915         } else {
916             if (*loadedDictEndPtr != 0) {
917                 DEBUGLOG(6, "dictionary considered valid for current block");
918     }   }   }
919 }
920 
921 MEM_STATIC void ZSTD_window_init(ZSTD_window_t* window) {
922     memset(window, 0, sizeof(*window));
923     window->base = (BYTE const*)"";
924     window->dictBase = (BYTE const*)"";
925     window->dictLimit = 1;    /* start from 1, so that 1st position is valid */
926     window->lowLimit = 1;     /* it ensures first and later CCtx usages compress the same */
927     window->nextSrc = window->base + 1;   /* see issue #1241 */
928 }
929 
930 /**
931  * ZSTD_window_update():
932  * Updates the window by appending [src, src + srcSize) to the window.
933  * If it is not contiguous, the current prefix becomes the extDict, and we
934  * forget about the extDict. Handles overlap of the prefix and extDict.
935  * Returns non-zero if the segment is contiguous.
936  */
937 MEM_STATIC U32 ZSTD_window_update(ZSTD_window_t* window,
938                                   void const* src, size_t srcSize)
939 {
940     BYTE const* const ip = (BYTE const*)src;
941     U32 contiguous = 1;
942     DEBUGLOG(5, "ZSTD_window_update");
943     if (srcSize == 0)
944         return contiguous;
945     assert(window->base != NULL);
946     assert(window->dictBase != NULL);
947     /* Check if blocks follow each other */
948     if (src != window->nextSrc) {
949         /* not contiguous */
950         size_t const distanceFromBase = (size_t)(window->nextSrc - window->base);
951         DEBUGLOG(5, "Non contiguous blocks, new segment starts at %u", window->dictLimit);
952         window->lowLimit = window->dictLimit;
953         assert(distanceFromBase == (size_t)(U32)distanceFromBase);  /* should never overflow */
954         window->dictLimit = (U32)distanceFromBase;
955         window->dictBase = window->base;
956         window->base = ip - distanceFromBase;
957         /* ms->nextToUpdate = window->dictLimit; */
958         if (window->dictLimit - window->lowLimit < HASH_READ_SIZE) window->lowLimit = window->dictLimit;   /* too small extDict */
959         contiguous = 0;
960     }
961     window->nextSrc = ip + srcSize;
962     /* if input and dictionary overlap : reduce dictionary (area presumed modified by input) */
963     if ( (ip+srcSize > window->dictBase + window->lowLimit)
964        & (ip < window->dictBase + window->dictLimit)) {
965         ptrdiff_t const highInputIdx = (ip + srcSize) - window->dictBase;
966         U32 const lowLimitMax = (highInputIdx > (ptrdiff_t)window->dictLimit) ? window->dictLimit : (U32)highInputIdx;
967         window->lowLimit = lowLimitMax;
968         DEBUGLOG(5, "Overlapping extDict and input : new lowLimit = %u", window->lowLimit);
969     }
970     return contiguous;
971 }
972 
973 /**
974  * Returns the lowest allowed match index. It may either be in the ext-dict or the prefix.
975  */
976 MEM_STATIC U32 ZSTD_getLowestMatchIndex(const ZSTD_matchState_t* ms, U32 current, unsigned windowLog)
977 {
978     U32    const maxDistance = 1U << windowLog;
979     U32    const lowestValid = ms->window.lowLimit;
980     U32    const withinWindow = (current - lowestValid > maxDistance) ? current - maxDistance : lowestValid;
981     U32    const isDictionary = (ms->loadedDictEnd != 0);
982     U32    const matchLowest = isDictionary ? lowestValid : withinWindow;
983     return matchLowest;
984 }
985 
986 /**
987  * Returns the lowest allowed match index in the prefix.
988  */
989 MEM_STATIC U32 ZSTD_getLowestPrefixIndex(const ZSTD_matchState_t* ms, U32 current, unsigned windowLog)
990 {
991     U32    const maxDistance = 1U << windowLog;
992     U32    const lowestValid = ms->window.dictLimit;
993     U32    const withinWindow = (current - lowestValid > maxDistance) ? current - maxDistance : lowestValid;
994     U32    const isDictionary = (ms->loadedDictEnd != 0);
995     U32    const matchLowest = isDictionary ? lowestValid : withinWindow;
996     return matchLowest;
997 }
998 
999 
1000 
1001 /* debug functions */
1002 #if (DEBUGLEVEL>=2)
1003 
1004 MEM_STATIC double ZSTD_fWeight(U32 rawStat)
1005 {
1006     U32 const fp_accuracy = 8;
1007     U32 const fp_multiplier = (1 << fp_accuracy);
1008     U32 const newStat = rawStat + 1;
1009     U32 const hb = ZSTD_highbit32(newStat);
1010     U32 const BWeight = hb * fp_multiplier;
1011     U32 const FWeight = (newStat << fp_accuracy) >> hb;
1012     U32 const weight = BWeight + FWeight;
1013     assert(hb + fp_accuracy < 31);
1014     return (double)weight / fp_multiplier;
1015 }
1016 
1017 /* display a table content,
1018  * listing each element, its frequency, and its predicted bit cost */
1019 MEM_STATIC void ZSTD_debugTable(const U32* table, U32 max)
1020 {
1021     unsigned u, sum;
1022     for (u=0, sum=0; u<=max; u++) sum += table[u];
1023     DEBUGLOG(2, "total nb elts: %u", sum);
1024     for (u=0; u<=max; u++) {
1025         DEBUGLOG(2, "%2u: %5u  (%.2f)",
1026                 u, table[u], ZSTD_fWeight(sum) - ZSTD_fWeight(table[u]) );
1027     }
1028 }
1029 
1030 #endif
1031 
1032 
1033 #if defined (__cplusplus)
1034 }
1035 #endif
1036 
1037 /* ===============================================================
1038  * Shared internal declarations
1039  * These prototypes may be called from sources not in lib/compress
1040  * =============================================================== */
1041 
1042 /* ZSTD_loadCEntropy() :
1043  * dict : must point at beginning of a valid zstd dictionary.
1044  * return : size of dictionary header (size of magic number + dict ID + entropy tables)
1045  * assumptions : magic number supposed already checked
1046  *               and dictSize >= 8 */
1047 size_t ZSTD_loadCEntropy(ZSTD_compressedBlockState_t* bs, void* workspace,
1048                          short* offcodeNCount, unsigned* offcodeMaxValue,
1049                          const void* const dict, size_t dictSize);
1050 
1051 void ZSTD_reset_compressedBlockState(ZSTD_compressedBlockState_t* bs);
1052 
1053 /* ==============================================================
1054  * Private declarations
1055  * These prototypes shall only be called from within lib/compress
1056  * ============================================================== */
1057 
1058 /* ZSTD_getCParamsFromCCtxParams() :
1059  * cParams are built depending on compressionLevel, src size hints,
1060  * LDM and manually set compression parameters.
1061  * Note: srcSizeHint == 0 means 0!
1062  */
1063 ZSTD_compressionParameters ZSTD_getCParamsFromCCtxParams(
1064         const ZSTD_CCtx_params* CCtxParams, U64 srcSizeHint, size_t dictSize);
1065 
1066 /*! ZSTD_initCStream_internal() :
1067  *  Private use only. Init streaming operation.
1068  *  expects params to be valid.
1069  *  must receive dict, or cdict, or none, but not both.
1070  *  @return : 0, or an error code */
1071 size_t ZSTD_initCStream_internal(ZSTD_CStream* zcs,
1072                      const void* dict, size_t dictSize,
1073                      const ZSTD_CDict* cdict,
1074                      const ZSTD_CCtx_params* params, unsigned long long pledgedSrcSize);
1075 
1076 void ZSTD_resetSeqStore(seqStore_t* ssPtr);
1077 
1078 /*! ZSTD_getCParamsFromCDict() :
1079  *  as the name implies */
1080 ZSTD_compressionParameters ZSTD_getCParamsFromCDict(const ZSTD_CDict* cdict);
1081 
1082 /* ZSTD_compressBegin_advanced_internal() :
1083  * Private use only. To be called from zstdmt_compress.c. */
1084 size_t ZSTD_compressBegin_advanced_internal(ZSTD_CCtx* cctx,
1085                                     const void* dict, size_t dictSize,
1086                                     ZSTD_dictContentType_e dictContentType,
1087                                     ZSTD_dictTableLoadMethod_e dtlm,
1088                                     const ZSTD_CDict* cdict,
1089                                     const ZSTD_CCtx_params* params,
1090                                     unsigned long long pledgedSrcSize);
1091 
1092 /* ZSTD_compress_advanced_internal() :
1093  * Private use only. To be called from zstdmt_compress.c. */
1094 size_t ZSTD_compress_advanced_internal(ZSTD_CCtx* cctx,
1095                                        void* dst, size_t dstCapacity,
1096                                  const void* src, size_t srcSize,
1097                                  const void* dict,size_t dictSize,
1098                                  const ZSTD_CCtx_params* params);
1099 
1100 
1101 /* ZSTD_writeLastEmptyBlock() :
1102  * output an empty Block with end-of-frame mark to complete a frame
1103  * @return : size of data written into `dst` (== ZSTD_blockHeaderSize (defined in zstd_internal.h))
1104  *           or an error code if `dstCapacity` is too small (<ZSTD_blockHeaderSize)
1105  */
1106 size_t ZSTD_writeLastEmptyBlock(void* dst, size_t dstCapacity);
1107 
1108 
1109 /* ZSTD_referenceExternalSequences() :
1110  * Must be called before starting a compression operation.
1111  * seqs must parse a prefix of the source.
1112  * This cannot be used when long range matching is enabled.
1113  * Zstd will use these sequences, and pass the literals to a secondary block
1114  * compressor.
1115  * @return : An error code on failure.
1116  * NOTE: seqs are not verified! Invalid sequences can cause out-of-bounds memory
1117  * access and data corruption.
1118  */
1119 size_t ZSTD_referenceExternalSequences(ZSTD_CCtx* cctx, rawSeq* seq, size_t nbSeq);
1120 
1121 /** ZSTD_cycleLog() :
1122  *  condition for correct operation : hashLog > 1 */
1123 #ifdef	__FreeBSD__	/* This symbol is needed by dll-linked CLI zstd(1). */
1124 ZSTDLIB_API U32 ZSTD_cycleLog(U32 hashLog, ZSTD_strategy strat);
1125 #endif
1126 
1127 #endif /* ZSTD_COMPRESS_H */
1128