10c16b537SWarner Losh /* 237f1f268SConrad Meyer * Copyright (c) 2016-2020, Yann Collet, Facebook, Inc. 30c16b537SWarner Losh * All rights reserved. 40c16b537SWarner Losh * 50c16b537SWarner Losh * This source code is licensed under both the BSD-style license (found in the 60c16b537SWarner Losh * LICENSE file in the root directory of this source tree) and the GPLv2 (found 70c16b537SWarner Losh * in the COPYING file in the root directory of this source tree). 80c16b537SWarner Losh * You may select, at your option, one of the above-listed licenses. 90c16b537SWarner Losh */ 100c16b537SWarner Losh #if defined (__cplusplus) 110c16b537SWarner Losh extern "C" { 120c16b537SWarner Losh #endif 130c16b537SWarner Losh 140c16b537SWarner Losh #ifndef ZSTD_H_235446 150c16b537SWarner Losh #define ZSTD_H_235446 160c16b537SWarner Losh 170c16b537SWarner Losh /* ====== Dependency ======*/ 189cbefe25SConrad Meyer #include <limits.h> /* INT_MAX */ 190c16b537SWarner Losh #include <stddef.h> /* size_t */ 200c16b537SWarner Losh 210c16b537SWarner Losh 220c16b537SWarner Losh /* ===== ZSTDLIB_API : control library symbols visibility ===== */ 230c16b537SWarner Losh #ifndef ZSTDLIB_VISIBILITY 240c16b537SWarner Losh # if defined(__GNUC__) && (__GNUC__ >= 4) 250c16b537SWarner Losh # define ZSTDLIB_VISIBILITY __attribute__ ((visibility ("default"))) 260c16b537SWarner Losh # else 270c16b537SWarner Losh # define ZSTDLIB_VISIBILITY 280c16b537SWarner Losh # endif 290c16b537SWarner Losh #endif 300c16b537SWarner Losh #if defined(ZSTD_DLL_EXPORT) && (ZSTD_DLL_EXPORT==1) 310c16b537SWarner Losh # define ZSTDLIB_API __declspec(dllexport) ZSTDLIB_VISIBILITY 320c16b537SWarner Losh #elif defined(ZSTD_DLL_IMPORT) && (ZSTD_DLL_IMPORT==1) 330c16b537SWarner Losh # define ZSTDLIB_API __declspec(dllimport) ZSTDLIB_VISIBILITY /* It isn't required but allows to generate better code, saving a function pointer load from the IAT and an indirect jump.*/ 340c16b537SWarner Losh #else 350c16b537SWarner Losh # define 
ZSTDLIB_API ZSTDLIB_VISIBILITY 360c16b537SWarner Losh #endif 370c16b537SWarner Losh 380c16b537SWarner Losh 390f743729SConrad Meyer /******************************************************************************* 400c16b537SWarner Losh Introduction 410c16b537SWarner Losh 420f743729SConrad Meyer zstd, short for Zstandard, is a fast lossless compression algorithm, targeting 430f743729SConrad Meyer real-time compression scenarios at zlib-level and better compression ratios. 440f743729SConrad Meyer The zstd compression library provides in-memory compression and decompression 450f743729SConrad Meyer functions. 460f743729SConrad Meyer 470f743729SConrad Meyer The library supports regular compression levels from 1 up to ZSTD_maxCLevel(), 480f743729SConrad Meyer which is currently 22. Levels >= 20, labeled `--ultra`, should be used with 490f743729SConrad Meyer caution, as they require more memory. The library also offers negative 500f743729SConrad Meyer compression levels, which extend the range of speed vs. ratio preferences. 510f743729SConrad Meyer The lower the level, the faster the speed (at the cost of compression). 520f743729SConrad Meyer 530c16b537SWarner Losh Compression can be done in: 540c16b537SWarner Losh - a single step (described as Simple API) 5519fcbaf1SConrad Meyer - a single step, reusing a context (described as Explicit context) 560c16b537SWarner Losh - unbounded multiple steps (described as Streaming compression) 570c16b537SWarner Losh 580f743729SConrad Meyer The compression ratio achievable on small data can be highly improved using 590f743729SConrad Meyer a dictionary. 
Dictionary compression can be performed in: 600f743729SConrad Meyer - a single step (described as Simple dictionary API) 610f743729SConrad Meyer - a single step, reusing a dictionary (described as Bulk-processing 620f743729SConrad Meyer dictionary API) 630f743729SConrad Meyer 640f743729SConrad Meyer Advanced experimental functions can be accessed using 650f743729SConrad Meyer `#define ZSTD_STATIC_LINKING_ONLY` before including zstd.h. 660f743729SConrad Meyer 670f743729SConrad Meyer Advanced experimental APIs should never be used with a dynamically-linked 680f743729SConrad Meyer library. They are not "stable"; their definitions or signatures may change in 690f743729SConrad Meyer the future. Only static linking is allowed. 700f743729SConrad Meyer *******************************************************************************/ 710c16b537SWarner Losh 720c16b537SWarner Losh /*------ Version ------*/ 730c16b537SWarner Losh #define ZSTD_VERSION_MAJOR 1 742b9c00cbSConrad Meyer #define ZSTD_VERSION_MINOR 4 75*f7cd7fe5SConrad Meyer #define ZSTD_VERSION_RELEASE 8 760c16b537SWarner Losh #define ZSTD_VERSION_NUMBER (ZSTD_VERSION_MAJOR *100*100 + ZSTD_VERSION_MINOR *100 + ZSTD_VERSION_RELEASE) 77*f7cd7fe5SConrad Meyer 78*f7cd7fe5SConrad Meyer /*! ZSTD_versionNumber() : 79*f7cd7fe5SConrad Meyer * Return runtime library version, the value is (MAJOR*100*100 + MINOR*100 + RELEASE). */ 80*f7cd7fe5SConrad Meyer ZSTDLIB_API unsigned ZSTD_versionNumber(void); 810c16b537SWarner Losh 820c16b537SWarner Losh #define ZSTD_LIB_VERSION ZSTD_VERSION_MAJOR.ZSTD_VERSION_MINOR.ZSTD_VERSION_RELEASE 830c16b537SWarner Losh #define ZSTD_QUOTE(str) #str 840c16b537SWarner Losh #define ZSTD_EXPAND_AND_QUOTE(str) ZSTD_QUOTE(str) 850c16b537SWarner Losh #define ZSTD_VERSION_STRING ZSTD_EXPAND_AND_QUOTE(ZSTD_LIB_VERSION) 86*f7cd7fe5SConrad Meyer 87*f7cd7fe5SConrad Meyer /*! ZSTD_versionString() : 88*f7cd7fe5SConrad Meyer * Return runtime library version, like "1.4.5". Requires v1.3.0+. 
*/ 89*f7cd7fe5SConrad Meyer ZSTDLIB_API const char* ZSTD_versionString(void); 900c16b537SWarner Losh 914d3f1eafSConrad Meyer /* ************************************* 920f743729SConrad Meyer * Default constant 930f743729SConrad Meyer ***************************************/ 940f743729SConrad Meyer #ifndef ZSTD_CLEVEL_DEFAULT 950f743729SConrad Meyer # define ZSTD_CLEVEL_DEFAULT 3 960f743729SConrad Meyer #endif 970c16b537SWarner Losh 984d3f1eafSConrad Meyer /* ************************************* 992b9c00cbSConrad Meyer * Constants 1002b9c00cbSConrad Meyer ***************************************/ 1012b9c00cbSConrad Meyer 1022b9c00cbSConrad Meyer /* All magic numbers are supposed read/written to/from files/memory using little-endian convention */ 1032b9c00cbSConrad Meyer #define ZSTD_MAGICNUMBER 0xFD2FB528 /* valid since v0.8.0 */ 1042b9c00cbSConrad Meyer #define ZSTD_MAGIC_DICTIONARY 0xEC30A437 /* valid since v0.7.0 */ 1052b9c00cbSConrad Meyer #define ZSTD_MAGIC_SKIPPABLE_START 0x184D2A50 /* all 16 values, from 0x184D2A50 to 0x184D2A5F, signal the beginning of a skippable frame */ 1062b9c00cbSConrad Meyer #define ZSTD_MAGIC_SKIPPABLE_MASK 0xFFFFFFF0 1072b9c00cbSConrad Meyer 1082b9c00cbSConrad Meyer #define ZSTD_BLOCKSIZELOG_MAX 17 1092b9c00cbSConrad Meyer #define ZSTD_BLOCKSIZE_MAX (1<<ZSTD_BLOCKSIZELOG_MAX) 1102b9c00cbSConrad Meyer 1112b9c00cbSConrad Meyer 1122b9c00cbSConrad Meyer 1132b9c00cbSConrad Meyer /*************************************** 1140c16b537SWarner Losh * Simple API 1150c16b537SWarner Losh ***************************************/ 1160c16b537SWarner Losh /*! ZSTD_compress() : 1170c16b537SWarner Losh * Compresses `src` content as a single zstd compressed frame into already allocated `dst`. 1180c16b537SWarner Losh * Hint : compression runs faster if `dstCapacity` >= `ZSTD_compressBound(srcSize)`. 
1190c16b537SWarner Losh * @return : compressed size written into `dst` (<= `dstCapacity), 1200c16b537SWarner Losh * or an error code if it fails (which can be tested using ZSTD_isError()). */ 1210c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_compress( void* dst, size_t dstCapacity, 1220c16b537SWarner Losh const void* src, size_t srcSize, 1230c16b537SWarner Losh int compressionLevel); 1240c16b537SWarner Losh 1250c16b537SWarner Losh /*! ZSTD_decompress() : 1260c16b537SWarner Losh * `compressedSize` : must be the _exact_ size of some number of compressed and/or skippable frames. 1270c16b537SWarner Losh * `dstCapacity` is an upper bound of originalSize to regenerate. 1280c16b537SWarner Losh * If user cannot imply a maximum upper bound, it's better to use streaming mode to decompress data. 1290c16b537SWarner Losh * @return : the number of bytes decompressed into `dst` (<= `dstCapacity`), 1300c16b537SWarner Losh * or an errorCode if it fails (which can be tested using ZSTD_isError()). */ 1310c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_decompress( void* dst, size_t dstCapacity, 1320c16b537SWarner Losh const void* src, size_t compressedSize); 1330c16b537SWarner Losh 134a0483764SConrad Meyer /*! ZSTD_getFrameContentSize() : requires v1.3.0+ 1350c16b537SWarner Losh * `src` should point to the start of a ZSTD encoded frame. 1360c16b537SWarner Losh * `srcSize` must be at least as large as the frame header. 1370c16b537SWarner Losh * hint : any size >= `ZSTD_frameHeaderSize_max` is large enough. 1380f743729SConrad Meyer * @return : - decompressed size of `src` frame content, if known 1390c16b537SWarner Losh * - ZSTD_CONTENTSIZE_UNKNOWN if the size cannot be determined 1400c16b537SWarner Losh * - ZSTD_CONTENTSIZE_ERROR if an error occurred (e.g. invalid magic number, srcSize too small) 1410c16b537SWarner Losh * note 1 : a 0 return value means the frame is valid but "empty". 
1420c16b537SWarner Losh * note 2 : decompressed size is an optional field, it may not be present, typically in streaming mode. 1430c16b537SWarner Losh * When `return==ZSTD_CONTENTSIZE_UNKNOWN`, data to decompress could be any size. 1440c16b537SWarner Losh * In which case, it's necessary to use streaming mode to decompress data. 1450c16b537SWarner Losh * Optionally, application can rely on some implicit limit, 1460c16b537SWarner Losh * as ZSTD_decompress() only needs an upper bound of decompressed size. 1470c16b537SWarner Losh * (For example, data could be necessarily cut into blocks <= 16 KB). 1480f743729SConrad Meyer * note 3 : decompressed size is always present when compression is completed using single-pass functions, 1490f743729SConrad Meyer * such as ZSTD_compress(), ZSTD_compressCCtx() ZSTD_compress_usingDict() or ZSTD_compress_usingCDict(). 1500c16b537SWarner Losh * note 4 : decompressed size can be very large (64-bits value), 1510c16b537SWarner Losh * potentially larger than what local system can handle as a single memory segment. 1520c16b537SWarner Losh * In which case, it's necessary to use streaming mode to decompress data. 1530c16b537SWarner Losh * note 5 : If source is untrusted, decompressed size could be wrong or intentionally modified. 1540c16b537SWarner Losh * Always ensure return value fits within application's authorized limits. 1550c16b537SWarner Losh * Each application can set its own limits. 1560c16b537SWarner Losh * note 6 : This function replaces ZSTD_getDecompressedSize() */ 1570c16b537SWarner Losh #define ZSTD_CONTENTSIZE_UNKNOWN (0ULL - 1) 1580c16b537SWarner Losh #define ZSTD_CONTENTSIZE_ERROR (0ULL - 2) 1590c16b537SWarner Losh ZSTDLIB_API unsigned long long ZSTD_getFrameContentSize(const void *src, size_t srcSize); 1600c16b537SWarner Losh 1610c16b537SWarner Losh /*! ZSTD_getDecompressedSize() : 1620c16b537SWarner Losh * NOTE: This function is now obsolete, in favor of ZSTD_getFrameContentSize(). 
16319fcbaf1SConrad Meyer * Both functions work the same way, but ZSTD_getDecompressedSize() blends 16419fcbaf1SConrad Meyer * "empty", "unknown" and "error" results to the same return value (0), 16519fcbaf1SConrad Meyer * while ZSTD_getFrameContentSize() gives them separate return values. 1660f743729SConrad Meyer * @return : decompressed size of `src` frame content _if known and not empty_, 0 otherwise. */ 1670c16b537SWarner Losh ZSTDLIB_API unsigned long long ZSTD_getDecompressedSize(const void* src, size_t srcSize); 1680c16b537SWarner Losh 1692b9c00cbSConrad Meyer /*! ZSTD_findFrameCompressedSize() : 1702b9c00cbSConrad Meyer * `src` should point to the start of a ZSTD frame or skippable frame. 1712b9c00cbSConrad Meyer * `srcSize` must be >= first frame size 1722b9c00cbSConrad Meyer * @return : the compressed size of the first frame starting at `src`, 1732b9c00cbSConrad Meyer * suitable to pass as `srcSize` to `ZSTD_decompress` or similar, 1742b9c00cbSConrad Meyer * or an error code if input is invalid */ 1752b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_findFrameCompressedSize(const void* src, size_t srcSize); 1762b9c00cbSConrad Meyer 1770c16b537SWarner Losh 1780c16b537SWarner Losh /*====== Helper functions ======*/ 179052d3c12SConrad Meyer #define ZSTD_COMPRESSBOUND(srcSize) ((srcSize) + ((srcSize)>>8) + (((srcSize) < (128<<10)) ? 
(((128<<10) - (srcSize)) >> 11) /* margin, from 64 to 0 */ : 0)) /* this formula ensures that bound(A) + bound(B) <= bound(A+B) as long as A and B >= 128 KB */ 18019fcbaf1SConrad Meyer ZSTDLIB_API size_t ZSTD_compressBound(size_t srcSize); /*!< maximum compressed size in worst case single-pass scenario */ 1810c16b537SWarner Losh ZSTDLIB_API unsigned ZSTD_isError(size_t code); /*!< tells if a `size_t` function result is an error code */ 1820c16b537SWarner Losh ZSTDLIB_API const char* ZSTD_getErrorName(size_t code); /*!< provides readable string from an error code */ 1832b9c00cbSConrad Meyer ZSTDLIB_API int ZSTD_minCLevel(void); /*!< minimum negative compression level allowed */ 1840c16b537SWarner Losh ZSTDLIB_API int ZSTD_maxCLevel(void); /*!< maximum compression level available */ 1850c16b537SWarner Losh 1860c16b537SWarner Losh 1870c16b537SWarner Losh /*************************************** 18819fcbaf1SConrad Meyer * Explicit context 1890c16b537SWarner Losh ***************************************/ 1900c16b537SWarner Losh /*= Compression context 1910c16b537SWarner Losh * When compressing many times, 1924d3f1eafSConrad Meyer * it is recommended to allocate a context just once, 1934d3f1eafSConrad Meyer * and re-use it for each successive compression operation. 1940c16b537SWarner Losh * This will make workload friendlier for system's memory. 1954d3f1eafSConrad Meyer * Note : re-using context is just a speed / resource optimization. 1964d3f1eafSConrad Meyer * It doesn't change the compression ratio, which remains identical. 1974d3f1eafSConrad Meyer * Note 2 : In multi-threaded environments, 1984d3f1eafSConrad Meyer * use one different context per thread for parallel execution. 1994d3f1eafSConrad Meyer */ 2000c16b537SWarner Losh typedef struct ZSTD_CCtx_s ZSTD_CCtx; 2010c16b537SWarner Losh ZSTDLIB_API ZSTD_CCtx* ZSTD_createCCtx(void); 2020c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_freeCCtx(ZSTD_CCtx* cctx); 2030c16b537SWarner Losh 2040c16b537SWarner Losh /*! 
ZSTD_compressCCtx() : 2059cbefe25SConrad Meyer * Same as ZSTD_compress(), using an explicit ZSTD_CCtx. 2069cbefe25SConrad Meyer * Important : in order to behave similarly to `ZSTD_compress()`, 2079cbefe25SConrad Meyer * this function compresses at requested compression level, 2089cbefe25SConrad Meyer * __ignoring any other parameter__ . 2099cbefe25SConrad Meyer * If any advanced parameter was set using the advanced API, 2109cbefe25SConrad Meyer * they will all be reset. Only `compressionLevel` remains. 2119cbefe25SConrad Meyer */ 212a0483764SConrad Meyer ZSTDLIB_API size_t ZSTD_compressCCtx(ZSTD_CCtx* cctx, 2130c16b537SWarner Losh void* dst, size_t dstCapacity, 2140c16b537SWarner Losh const void* src, size_t srcSize, 2150c16b537SWarner Losh int compressionLevel); 2160c16b537SWarner Losh 2170c16b537SWarner Losh /*= Decompression context 2180c16b537SWarner Losh * When decompressing many times, 2190c16b537SWarner Losh * it is recommended to allocate a context only once, 2200c16b537SWarner Losh * and re-use it for each successive compression operation. 2210c16b537SWarner Losh * This will make workload friendlier for system's memory. 2220c16b537SWarner Losh * Use one context per thread for parallel execution. */ 2230c16b537SWarner Losh typedef struct ZSTD_DCtx_s ZSTD_DCtx; 2240c16b537SWarner Losh ZSTDLIB_API ZSTD_DCtx* ZSTD_createDCtx(void); 2250c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_freeDCtx(ZSTD_DCtx* dctx); 2260c16b537SWarner Losh 2270c16b537SWarner Losh /*! ZSTD_decompressDCtx() : 228a0483764SConrad Meyer * Same as ZSTD_decompress(), 229a0483764SConrad Meyer * requires an allocated ZSTD_DCtx. 230a0483764SConrad Meyer * Compatible with sticky parameters. 
231a0483764SConrad Meyer */ 232a0483764SConrad Meyer ZSTDLIB_API size_t ZSTD_decompressDCtx(ZSTD_DCtx* dctx, 2330c16b537SWarner Losh void* dst, size_t dstCapacity, 2340c16b537SWarner Losh const void* src, size_t srcSize); 2350c16b537SWarner Losh 2360c16b537SWarner Losh 237a0483764SConrad Meyer /*************************************** 238a0483764SConrad Meyer * Advanced compression API 239a0483764SConrad Meyer ***************************************/ 240a0483764SConrad Meyer 241a0483764SConrad Meyer /* API design : 242a0483764SConrad Meyer * Parameters are pushed one by one into an existing context, 243a0483764SConrad Meyer * using ZSTD_CCtx_set*() functions. 244a0483764SConrad Meyer * Pushed parameters are sticky : they are valid for next compressed frame, and any subsequent frame. 245a0483764SConrad Meyer * "sticky" parameters are applicable to `ZSTD_compress2()` and `ZSTD_compressStream*()` ! 2469cbefe25SConrad Meyer * __They do not apply to "simple" one-shot variants such as ZSTD_compressCCtx()__ . 247a0483764SConrad Meyer * 248a0483764SConrad Meyer * It's possible to reset all parameters to "default" using ZSTD_CCtx_reset(). 249a0483764SConrad Meyer * 250a0483764SConrad Meyer * This API supercedes all other "advanced" API entry points in the experimental section. 251a0483764SConrad Meyer * In the future, we expect to remove from experimental API entry points which are redundant with this API. 
252a0483764SConrad Meyer */ 253a0483764SConrad Meyer 254a0483764SConrad Meyer 255a0483764SConrad Meyer /* Compression strategies, listed from fastest to strongest */ 256a0483764SConrad Meyer typedef enum { ZSTD_fast=1, 257a0483764SConrad Meyer ZSTD_dfast=2, 258a0483764SConrad Meyer ZSTD_greedy=3, 259a0483764SConrad Meyer ZSTD_lazy=4, 260a0483764SConrad Meyer ZSTD_lazy2=5, 261a0483764SConrad Meyer ZSTD_btlazy2=6, 262a0483764SConrad Meyer ZSTD_btopt=7, 263a0483764SConrad Meyer ZSTD_btultra=8, 264a0483764SConrad Meyer ZSTD_btultra2=9 265a0483764SConrad Meyer /* note : new strategies _might_ be added in the future. 266a0483764SConrad Meyer Only the order (from fast to strong) is guaranteed */ 267a0483764SConrad Meyer } ZSTD_strategy; 268a0483764SConrad Meyer 269a0483764SConrad Meyer 270a0483764SConrad Meyer typedef enum { 271a0483764SConrad Meyer 2722b9c00cbSConrad Meyer /* compression parameters 2732b9c00cbSConrad Meyer * Note: When compressing with a ZSTD_CDict these parameters are superseded 2749cbefe25SConrad Meyer * by the parameters used to construct the ZSTD_CDict. 2759cbefe25SConrad Meyer * See ZSTD_CCtx_refCDict() for more info (superseded-by-cdict). */ 2769cbefe25SConrad Meyer ZSTD_c_compressionLevel=100, /* Set compression parameters according to pre-defined cLevel table. 2779cbefe25SConrad Meyer * Note that exact compression parameters are dynamically determined, 2789cbefe25SConrad Meyer * depending on both compression level and srcSize (when known). 279a0483764SConrad Meyer * Default level is ZSTD_CLEVEL_DEFAULT==3. 280a0483764SConrad Meyer * Special: value 0 means default, which is controlled by ZSTD_CLEVEL_DEFAULT. 281a0483764SConrad Meyer * Note 1 : it's possible to pass a negative compression level. 28237f1f268SConrad Meyer * Note 2 : setting a level does not automatically set all other compression parameters 28337f1f268SConrad Meyer * to default. 
Setting this will however eventually dynamically impact the compression 28437f1f268SConrad Meyer * parameters which have not been manually set. The manually set 28537f1f268SConrad Meyer * ones will 'stick'. */ 2869cbefe25SConrad Meyer /* Advanced compression parameters : 2879cbefe25SConrad Meyer * It's possible to pin down compression parameters to some specific values. 2889cbefe25SConrad Meyer * In which case, these values are no longer dynamically selected by the compressor */ 289a0483764SConrad Meyer ZSTD_c_windowLog=101, /* Maximum allowed back-reference distance, expressed as power of 2. 2909cbefe25SConrad Meyer * This will set a memory budget for streaming decompression, 2919cbefe25SConrad Meyer * with larger values requiring more memory 2929cbefe25SConrad Meyer * and typically compressing more. 293a0483764SConrad Meyer * Must be clamped between ZSTD_WINDOWLOG_MIN and ZSTD_WINDOWLOG_MAX. 294a0483764SConrad Meyer * Special: value 0 means "use default windowLog". 295a0483764SConrad Meyer * Note: Using a windowLog greater than ZSTD_WINDOWLOG_LIMIT_DEFAULT 2969cbefe25SConrad Meyer * requires explicitly allowing such size at streaming decompression stage. */ 297a0483764SConrad Meyer ZSTD_c_hashLog=102, /* Size of the initial probe table, as a power of 2. 298a0483764SConrad Meyer * Resulting memory usage is (1 << (hashLog+2)). 299a0483764SConrad Meyer * Must be clamped between ZSTD_HASHLOG_MIN and ZSTD_HASHLOG_MAX. 300a0483764SConrad Meyer * Larger tables improve compression ratio of strategies <= dFast, 301a0483764SConrad Meyer * and improve speed of strategies > dFast. 302a0483764SConrad Meyer * Special: value 0 means "use default hashLog". */ 303a0483764SConrad Meyer ZSTD_c_chainLog=103, /* Size of the multi-probe search table, as a power of 2. 304a0483764SConrad Meyer * Resulting memory usage is (1 << (chainLog+2)). 305a0483764SConrad Meyer * Must be clamped between ZSTD_CHAINLOG_MIN and ZSTD_CHAINLOG_MAX. 
306a0483764SConrad Meyer * Larger tables result in better and slower compression. 3079cbefe25SConrad Meyer * This parameter is useless for "fast" strategy. 308a0483764SConrad Meyer * It's still useful when using "dfast" strategy, 309a0483764SConrad Meyer * in which case it defines a secondary probe table. 310a0483764SConrad Meyer * Special: value 0 means "use default chainLog". */ 311a0483764SConrad Meyer ZSTD_c_searchLog=104, /* Number of search attempts, as a power of 2. 312a0483764SConrad Meyer * More attempts result in better and slower compression. 3139cbefe25SConrad Meyer * This parameter is useless for "fast" and "dFast" strategies. 314a0483764SConrad Meyer * Special: value 0 means "use default searchLog". */ 315a0483764SConrad Meyer ZSTD_c_minMatch=105, /* Minimum size of searched matches. 316a0483764SConrad Meyer * Note that Zstandard can still find matches of smaller size, 317a0483764SConrad Meyer * it just tweaks its search algorithm to look for this size and larger. 318a0483764SConrad Meyer * Larger values increase compression and decompression speed, but decrease ratio. 319a0483764SConrad Meyer * Must be clamped between ZSTD_MINMATCH_MIN and ZSTD_MINMATCH_MAX. 320a0483764SConrad Meyer * Note that currently, for all strategies < btopt, effective minimum is 4. 321a0483764SConrad Meyer * , for all strategies > fast, effective maximum is 6. 322a0483764SConrad Meyer * Special: value 0 means "use default minMatchLength". */ 323a0483764SConrad Meyer ZSTD_c_targetLength=106, /* Impact of this field depends on strategy. 324a0483764SConrad Meyer * For strategies btopt, btultra & btultra2: 325a0483764SConrad Meyer * Length of Match considered "good enough" to stop search. 326a0483764SConrad Meyer * Larger values make compression stronger, and slower. 327a0483764SConrad Meyer * For strategy fast: 328a0483764SConrad Meyer * Distance between match sampling. 329a0483764SConrad Meyer * Larger values make compression faster, and weaker. 
330a0483764SConrad Meyer * Special: value 0 means "use default targetLength". */ 331a0483764SConrad Meyer ZSTD_c_strategy=107, /* See ZSTD_strategy enum definition. 332a0483764SConrad Meyer * The higher the value of selected strategy, the more complex it is, 333a0483764SConrad Meyer * resulting in stronger and slower compression. 334a0483764SConrad Meyer * Special: value 0 means "use default strategy". */ 335a0483764SConrad Meyer 336a0483764SConrad Meyer /* LDM mode parameters */ 337a0483764SConrad Meyer ZSTD_c_enableLongDistanceMatching=160, /* Enable long distance matching. 338a0483764SConrad Meyer * This parameter is designed to improve compression ratio 339a0483764SConrad Meyer * for large inputs, by finding large matches at long distance. 340a0483764SConrad Meyer * It increases memory usage and window size. 341a0483764SConrad Meyer * Note: enabling this parameter increases default ZSTD_c_windowLog to 128 MB 342*f7cd7fe5SConrad Meyer * except when expressly set to a different value. 343*f7cd7fe5SConrad Meyer * Note: will be enabled by default if ZSTD_c_windowLog >= 128 MB and 344*f7cd7fe5SConrad Meyer * compression strategy >= ZSTD_btopt (== compression level 16+) */ 345a0483764SConrad Meyer ZSTD_c_ldmHashLog=161, /* Size of the table for long distance matching, as a power of 2. 346a0483764SConrad Meyer * Larger values increase memory usage and compression ratio, 347a0483764SConrad Meyer * but decrease compression speed. 348a0483764SConrad Meyer * Must be clamped between ZSTD_HASHLOG_MIN and ZSTD_HASHLOG_MAX 349a0483764SConrad Meyer * default: windowlog - 7. 350a0483764SConrad Meyer * Special: value 0 means "automatically determine hashlog". */ 351a0483764SConrad Meyer ZSTD_c_ldmMinMatch=162, /* Minimum match size for long distance matcher. 352a0483764SConrad Meyer * Larger/too small values usually decrease compression ratio. 353a0483764SConrad Meyer * Must be clamped between ZSTD_LDM_MINMATCH_MIN and ZSTD_LDM_MINMATCH_MAX. 
354a0483764SConrad Meyer * Special: value 0 means "use default value" (default: 64). */ 355a0483764SConrad Meyer ZSTD_c_ldmBucketSizeLog=163, /* Log size of each bucket in the LDM hash table for collision resolution. 356a0483764SConrad Meyer * Larger values improve collision resolution but decrease compression speed. 357a0483764SConrad Meyer * The maximum value is ZSTD_LDM_BUCKETSIZELOG_MAX. 358a0483764SConrad Meyer * Special: value 0 means "use default value" (default: 3). */ 359a0483764SConrad Meyer ZSTD_c_ldmHashRateLog=164, /* Frequency of inserting/looking up entries into the LDM hash table. 360a0483764SConrad Meyer * Must be clamped between 0 and (ZSTD_WINDOWLOG_MAX - ZSTD_HASHLOG_MIN). 361a0483764SConrad Meyer * Default is MAX(0, (windowLog - ldmHashLog)), optimizing hash table usage. 362a0483764SConrad Meyer * Larger values improve compression speed. 363a0483764SConrad Meyer * Deviating far from default value will likely result in a compression ratio decrease. 364a0483764SConrad Meyer * Special: value 0 means "automatically determine hashRateLog". */ 365a0483764SConrad Meyer 366a0483764SConrad Meyer /* frame parameters */ 367a0483764SConrad Meyer ZSTD_c_contentSizeFlag=200, /* Content size will be written into frame header _whenever known_ (default:1) 368a0483764SConrad Meyer * Content size must be known at the beginning of compression. 
369a0483764SConrad Meyer * This is automatically the case when using ZSTD_compress2(), 3709cbefe25SConrad Meyer * For streaming scenarios, content size must be provided with ZSTD_CCtx_setPledgedSrcSize() */ 371a0483764SConrad Meyer ZSTD_c_checksumFlag=201, /* A 32-bits checksum of content is written at end of frame (default:0) */ 372a0483764SConrad Meyer ZSTD_c_dictIDFlag=202, /* When applicable, dictionary's ID is written into frame header (default:1) */ 373a0483764SConrad Meyer 374a0483764SConrad Meyer /* multi-threading parameters */ 375*f7cd7fe5SConrad Meyer /* These parameters are only active if multi-threading is enabled (compiled with build macro ZSTD_MULTITHREAD). 376*f7cd7fe5SConrad Meyer * Otherwise, trying to set any other value than default (0) will be a no-op and return an error. 377*f7cd7fe5SConrad Meyer * In a situation where it's unknown if the linked library supports multi-threading or not, 378*f7cd7fe5SConrad Meyer * setting ZSTD_c_nbWorkers to any value >= 1 and consulting the return value provides a quick way to check this property. 379*f7cd7fe5SConrad Meyer */ 380a0483764SConrad Meyer ZSTD_c_nbWorkers=400, /* Select how many threads will be spawned to compress in parallel. 381*f7cd7fe5SConrad Meyer * When nbWorkers >= 1, triggers asynchronous mode when invoking ZSTD_compressStream*() : 382a0483764SConrad Meyer * ZSTD_compressStream*() consumes input and flush output if possible, but immediately gives back control to caller, 383*f7cd7fe5SConrad Meyer * while compression is performed in parallel, within worker thread(s). 384a0483764SConrad Meyer * (note : a strong exception to this rule is when first invocation of ZSTD_compressStream2() sets ZSTD_e_end : 385a0483764SConrad Meyer * in which case, ZSTD_compressStream2() delegates to ZSTD_compress2(), which is always a blocking call). 386a0483764SConrad Meyer * More workers improve speed, but also increase memory usage. 
387*f7cd7fe5SConrad Meyer * Default value is `0`, aka "single-threaded mode" : no worker is spawned, 388*f7cd7fe5SConrad Meyer * compression is performed inside Caller's thread, and all invocations are blocking */ 389a0483764SConrad Meyer ZSTD_c_jobSize=401, /* Size of a compression job. This value is enforced only when nbWorkers >= 1. 390a0483764SConrad Meyer * Each compression job is completed in parallel, so this value can indirectly impact the nb of active threads. 391a0483764SConrad Meyer * 0 means default, which is dynamically determined based on compression parameters. 392a0483764SConrad Meyer * Job size must be a minimum of overlap size, or 1 MB, whichever is largest. 3939cbefe25SConrad Meyer * The minimum size is automatically and transparently enforced. */ 394a0483764SConrad Meyer ZSTD_c_overlapLog=402, /* Control the overlap size, as a fraction of window size. 395a0483764SConrad Meyer * The overlap size is an amount of data reloaded from previous job at the beginning of a new job. 396a0483764SConrad Meyer * It helps preserve compression ratio, while each job is compressed in parallel. 397a0483764SConrad Meyer * This value is enforced only when nbWorkers >= 1. 398a0483764SConrad Meyer * Larger values increase compression ratio, but decrease speed. 399a0483764SConrad Meyer * Possible values range from 0 to 9 : 400a0483764SConrad Meyer * - 0 means "default" : value will be determined by the library, depending on strategy 401a0483764SConrad Meyer * - 1 means "no overlap" 402a0483764SConrad Meyer * - 9 means "full overlap", using a full window size. 
403a0483764SConrad Meyer * Each intermediate rank increases/decreases load size by a factor 2 : 404a0483764SConrad Meyer * 9: full window; 8: w/2; 7: w/4; 6: w/8; 5:w/16; 4: w/32; 3:w/64; 2:w/128; 1:no overlap; 0:default 405a0483764SConrad Meyer * default value varies between 6 and 9, depending on strategy */ 406a0483764SConrad Meyer 407a0483764SConrad Meyer /* note : additional experimental parameters are also available 408a0483764SConrad Meyer * within the experimental section of the API. 409a0483764SConrad Meyer * At the time of this writing, they include : 410a0483764SConrad Meyer * ZSTD_c_rsyncable 411a0483764SConrad Meyer * ZSTD_c_format 412a0483764SConrad Meyer * ZSTD_c_forceMaxWindow 413a0483764SConrad Meyer * ZSTD_c_forceAttachDict 4142b9c00cbSConrad Meyer * ZSTD_c_literalCompressionMode 4154d3f1eafSConrad Meyer * ZSTD_c_targetCBlockSize 4169cbefe25SConrad Meyer * ZSTD_c_srcSizeHint 417*f7cd7fe5SConrad Meyer * ZSTD_c_enableDedicatedDictSearch 418*f7cd7fe5SConrad Meyer * ZSTD_c_stableInBuffer 419*f7cd7fe5SConrad Meyer * ZSTD_c_stableOutBuffer 420*f7cd7fe5SConrad Meyer * ZSTD_c_blockDelimiters 421*f7cd7fe5SConrad Meyer * ZSTD_c_validateSequences 422a0483764SConrad Meyer * Because they are not stable, it's necessary to define ZSTD_STATIC_LINKING_ONLY to access them. 423a0483764SConrad Meyer * note : never ever use experimentalParam? names directly; 424a0483764SConrad Meyer * also, the enums values themselves are unstable and can still change. 
425a0483764SConrad Meyer */ 426a0483764SConrad Meyer ZSTD_c_experimentalParam1=500, 427a0483764SConrad Meyer ZSTD_c_experimentalParam2=10, 428a0483764SConrad Meyer ZSTD_c_experimentalParam3=1000, 4292b9c00cbSConrad Meyer ZSTD_c_experimentalParam4=1001, 4302b9c00cbSConrad Meyer ZSTD_c_experimentalParam5=1002, 4314d3f1eafSConrad Meyer ZSTD_c_experimentalParam6=1003, 432*f7cd7fe5SConrad Meyer ZSTD_c_experimentalParam7=1004, 433*f7cd7fe5SConrad Meyer ZSTD_c_experimentalParam8=1005, 434*f7cd7fe5SConrad Meyer ZSTD_c_experimentalParam9=1006, 435*f7cd7fe5SConrad Meyer ZSTD_c_experimentalParam10=1007, 436*f7cd7fe5SConrad Meyer ZSTD_c_experimentalParam11=1008, 437*f7cd7fe5SConrad Meyer ZSTD_c_experimentalParam12=1009 438a0483764SConrad Meyer } ZSTD_cParameter; 439a0483764SConrad Meyer 440a0483764SConrad Meyer typedef struct { 441a0483764SConrad Meyer size_t error; 442a0483764SConrad Meyer int lowerBound; 443a0483764SConrad Meyer int upperBound; 444a0483764SConrad Meyer } ZSTD_bounds; 445a0483764SConrad Meyer 446a0483764SConrad Meyer /*! ZSTD_cParam_getBounds() : 447a0483764SConrad Meyer * All parameters must belong to an interval with lower and upper bounds, 448a0483764SConrad Meyer * otherwise they will either trigger an error or be automatically clamped. 449a0483764SConrad Meyer * @return : a structure, ZSTD_bounds, which contains 450a0483764SConrad Meyer * - an error status field, which must be tested using ZSTD_isError() 451a0483764SConrad Meyer * - lower and upper bounds, both inclusive 452a0483764SConrad Meyer */ 453a0483764SConrad Meyer ZSTDLIB_API ZSTD_bounds ZSTD_cParam_getBounds(ZSTD_cParameter cParam); 454a0483764SConrad Meyer 455a0483764SConrad Meyer /*! ZSTD_CCtx_setParameter() : 456a0483764SConrad Meyer * Set one compression parameter, selected by enum ZSTD_cParameter. 457a0483764SConrad Meyer * All parameters have valid bounds. Bounds can be queried using ZSTD_cParam_getBounds(). 
458a0483764SConrad Meyer * Providing a value beyond bound will either clamp it, or trigger an error (depending on parameter). 459a0483764SConrad Meyer * Setting a parameter is generally only possible during frame initialization (before starting compression). 460a0483764SConrad Meyer * Exception : when using multi-threading mode (nbWorkers >= 1), 461a0483764SConrad Meyer * the following parameters can be updated _during_ compression (within same frame): 462a0483764SConrad Meyer * => compressionLevel, hashLog, chainLog, searchLog, minMatch, targetLength and strategy. 463a0483764SConrad Meyer * new parameters will be active for next job only (after a flush()). 464a0483764SConrad Meyer * @return : an error code (which can be tested using ZSTD_isError()). 465a0483764SConrad Meyer */ 466a0483764SConrad Meyer ZSTDLIB_API size_t ZSTD_CCtx_setParameter(ZSTD_CCtx* cctx, ZSTD_cParameter param, int value); 467a0483764SConrad Meyer 468a0483764SConrad Meyer /*! ZSTD_CCtx_setPledgedSrcSize() : 469a0483764SConrad Meyer * Total input data size to be compressed as a single frame. 470a0483764SConrad Meyer * Value will be written in frame header, unless explicitly forbidden using ZSTD_c_contentSizeFlag. 471a0483764SConrad Meyer * This value will also be checked at end of frame, and trigger an error if not respected. 472a0483764SConrad Meyer * @return : 0, or an error code (which can be tested with ZSTD_isError()). 473a0483764SConrad Meyer * Note 1 : pledgedSrcSize==0 actually means zero, aka an empty frame. 474a0483764SConrad Meyer * In order to mean "unknown content size", pass constant ZSTD_CONTENTSIZE_UNKNOWN. 475a0483764SConrad Meyer * ZSTD_CONTENTSIZE_UNKNOWN is default value for any new frame. 476a0483764SConrad Meyer * Note 2 : pledgedSrcSize is only valid once, for the next frame. 477a0483764SConrad Meyer * It's discarded at the end of the frame, and replaced by ZSTD_CONTENTSIZE_UNKNOWN.
478a0483764SConrad Meyer * Note 3 : Whenever all input data is provided and consumed in a single round, 479a0483764SConrad Meyer * for example with ZSTD_compress2(), 480a0483764SConrad Meyer * or invoking immediately ZSTD_compressStream2(,,,ZSTD_e_end), 4812b9c00cbSConrad Meyer * this value is automatically overridden by srcSize instead. 482a0483764SConrad Meyer */ 483a0483764SConrad Meyer ZSTDLIB_API size_t ZSTD_CCtx_setPledgedSrcSize(ZSTD_CCtx* cctx, unsigned long long pledgedSrcSize); 484a0483764SConrad Meyer 4852b9c00cbSConrad Meyer typedef enum { 4862b9c00cbSConrad Meyer ZSTD_reset_session_only = 1, 4872b9c00cbSConrad Meyer ZSTD_reset_parameters = 2, 4882b9c00cbSConrad Meyer ZSTD_reset_session_and_parameters = 3 4892b9c00cbSConrad Meyer } ZSTD_ResetDirective; 4902b9c00cbSConrad Meyer 4912b9c00cbSConrad Meyer /*! ZSTD_CCtx_reset() : 4922b9c00cbSConrad Meyer * There are 2 different things that can be reset, independently or jointly : 4932b9c00cbSConrad Meyer * - The session : will stop compressing current frame, and make CCtx ready to start a new one. 4942b9c00cbSConrad Meyer * Useful after an error, or to interrupt any ongoing compression. 4952b9c00cbSConrad Meyer * Any internal data not yet flushed is cancelled. 4962b9c00cbSConrad Meyer * Compression parameters and dictionary remain unchanged. 4972b9c00cbSConrad Meyer * They will be used to compress next frame. 4982b9c00cbSConrad Meyer * Resetting session never fails. 4992b9c00cbSConrad Meyer * - The parameters : changes all parameters back to "default". 5002b9c00cbSConrad Meyer * This removes any reference to any dictionary too. 5012b9c00cbSConrad Meyer * Parameters can only be changed between 2 sessions (i.e. no compression is currently ongoing) 5022b9c00cbSConrad Meyer * otherwise the reset fails, and function returns an error value (which can be tested using ZSTD_isError()) 5032b9c00cbSConrad Meyer * - Both : similar to resetting the session, followed by resetting parameters. 
5042b9c00cbSConrad Meyer */ 5052b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_CCtx_reset(ZSTD_CCtx* cctx, ZSTD_ResetDirective reset); 5062b9c00cbSConrad Meyer 5072b9c00cbSConrad Meyer /*! ZSTD_compress2() : 5082b9c00cbSConrad Meyer * Behaves the same as ZSTD_compressCCtx(), but compression parameters are set using the advanced API. 5092b9c00cbSConrad Meyer * ZSTD_compress2() always starts a new frame. 5102b9c00cbSConrad Meyer * Should cctx hold data from a previously unfinished frame, everything about it is forgotten. 5112b9c00cbSConrad Meyer * - Compression parameters are pushed into CCtx before starting compression, using ZSTD_CCtx_set*() 5122b9c00cbSConrad Meyer * - The function is always blocking, returns when compression is completed. 5132b9c00cbSConrad Meyer * Hint : compression runs faster if `dstCapacity` >= `ZSTD_compressBound(srcSize)`. 5142b9c00cbSConrad Meyer * @return : compressed size written into `dst` (<= `dstCapacity`), 5152b9c00cbSConrad Meyer * or an error code if it fails (which can be tested using ZSTD_isError()). 5162b9c00cbSConrad Meyer */ 5172b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_compress2( ZSTD_CCtx* cctx, 5182b9c00cbSConrad Meyer void* dst, size_t dstCapacity, 5192b9c00cbSConrad Meyer const void* src, size_t srcSize); 5202b9c00cbSConrad Meyer 5212b9c00cbSConrad Meyer 5222b9c00cbSConrad Meyer /*************************************** 5232b9c00cbSConrad Meyer * Advanced decompression API 5242b9c00cbSConrad Meyer ***************************************/ 5252b9c00cbSConrad Meyer 5262b9c00cbSConrad Meyer /* The advanced API pushes parameters one by one into an existing DCtx context. 5272b9c00cbSConrad Meyer * Parameters are sticky, and remain valid for all following frames 5282b9c00cbSConrad Meyer * using the same DCtx context. 5292b9c00cbSConrad Meyer * It's possible to reset parameters to default values using ZSTD_DCtx_reset().
5302b9c00cbSConrad Meyer * Note : This API is compatible with existing ZSTD_decompressDCtx() and ZSTD_decompressStream(). 5312b9c00cbSConrad Meyer * Therefore, no new decompression function is necessary. 5322b9c00cbSConrad Meyer */ 5332b9c00cbSConrad Meyer 5342b9c00cbSConrad Meyer typedef enum { 5352b9c00cbSConrad Meyer 5362b9c00cbSConrad Meyer ZSTD_d_windowLogMax=100, /* Select a size limit (in power of 2) beyond which 5372b9c00cbSConrad Meyer * the streaming API will refuse to allocate memory buffer 5382b9c00cbSConrad Meyer * in order to protect the host from unreasonable memory requirements. 5392b9c00cbSConrad Meyer * This parameter is only useful in streaming mode, since no internal buffer is allocated in single-pass mode. 5402b9c00cbSConrad Meyer * By default, a decompression context accepts window sizes <= (1 << ZSTD_WINDOWLOG_LIMIT_DEFAULT). 5412b9c00cbSConrad Meyer * Special: value 0 means "use default maximum windowLog". */ 5422b9c00cbSConrad Meyer 5432b9c00cbSConrad Meyer /* note : additional experimental parameters are also available 5442b9c00cbSConrad Meyer * within the experimental section of the API. 5452b9c00cbSConrad Meyer * At the time of this writing, they include : 54637f1f268SConrad Meyer * ZSTD_d_format 54737f1f268SConrad Meyer * ZSTD_d_stableOutBuffer 548*f7cd7fe5SConrad Meyer * ZSTD_d_forceIgnoreChecksum 5492b9c00cbSConrad Meyer * Because they are not stable, it's necessary to define ZSTD_STATIC_LINKING_ONLY to access them. 5502b9c00cbSConrad Meyer * note : never ever use experimentalParam? names directly 5512b9c00cbSConrad Meyer */ 55237f1f268SConrad Meyer ZSTD_d_experimentalParam1=1000, 553*f7cd7fe5SConrad Meyer ZSTD_d_experimentalParam2=1001, 554*f7cd7fe5SConrad Meyer ZSTD_d_experimentalParam3=1002 5552b9c00cbSConrad Meyer 5562b9c00cbSConrad Meyer } ZSTD_dParameter; 5572b9c00cbSConrad Meyer 5582b9c00cbSConrad Meyer /*! 
ZSTD_dParam_getBounds() : 5592b9c00cbSConrad Meyer * All parameters must belong to an interval with lower and upper bounds, 5602b9c00cbSConrad Meyer * otherwise they will either trigger an error or be automatically clamped. 5612b9c00cbSConrad Meyer * @return : a structure, ZSTD_bounds, which contains 5622b9c00cbSConrad Meyer * - an error status field, which must be tested using ZSTD_isError() 5632b9c00cbSConrad Meyer * - both lower and upper bounds, inclusive 5642b9c00cbSConrad Meyer */ 5652b9c00cbSConrad Meyer ZSTDLIB_API ZSTD_bounds ZSTD_dParam_getBounds(ZSTD_dParameter dParam); 5662b9c00cbSConrad Meyer 5672b9c00cbSConrad Meyer /*! ZSTD_DCtx_setParameter() : 5682b9c00cbSConrad Meyer * Set one decompression parameter, selected by enum ZSTD_dParameter. 5692b9c00cbSConrad Meyer * All parameters have valid bounds. Bounds can be queried using ZSTD_dParam_getBounds(). 5702b9c00cbSConrad Meyer * Providing a value beyond bound will either clamp it, or trigger an error (depending on parameter). 5712b9c00cbSConrad Meyer * Setting a parameter is only possible during frame initialization (before starting decompression). 5722b9c00cbSConrad Meyer * @return : 0, or an error code (which can be tested using ZSTD_isError()). 5732b9c00cbSConrad Meyer */ 5742b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_DCtx_setParameter(ZSTD_DCtx* dctx, ZSTD_dParameter param, int value); 5752b9c00cbSConrad Meyer 5762b9c00cbSConrad Meyer /*! ZSTD_DCtx_reset() : 5772b9c00cbSConrad Meyer * Return a DCtx to clean state. 5782b9c00cbSConrad Meyer * Session and parameters can be reset jointly or separately. 5792b9c00cbSConrad Meyer * Parameters can only be reset when no active frame is being decompressed.
5802b9c00cbSConrad Meyer * @return : 0, or an error code, which can be tested with ZSTD_isError() 5812b9c00cbSConrad Meyer */ 5822b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_DCtx_reset(ZSTD_DCtx* dctx, ZSTD_ResetDirective reset); 5832b9c00cbSConrad Meyer 5842b9c00cbSConrad Meyer 5852b9c00cbSConrad Meyer /**************************** 5862b9c00cbSConrad Meyer * Streaming 5872b9c00cbSConrad Meyer ****************************/ 5882b9c00cbSConrad Meyer 5892b9c00cbSConrad Meyer typedef struct ZSTD_inBuffer_s { 5902b9c00cbSConrad Meyer const void* src; /**< start of input buffer */ 5912b9c00cbSConrad Meyer size_t size; /**< size of input buffer */ 5922b9c00cbSConrad Meyer size_t pos; /**< position where reading stopped. Will be updated. Necessarily 0 <= pos <= size */ 5932b9c00cbSConrad Meyer } ZSTD_inBuffer; 5942b9c00cbSConrad Meyer 5952b9c00cbSConrad Meyer typedef struct ZSTD_outBuffer_s { 5962b9c00cbSConrad Meyer void* dst; /**< start of output buffer */ 5972b9c00cbSConrad Meyer size_t size; /**< size of output buffer */ 5982b9c00cbSConrad Meyer size_t pos; /**< position where writing stopped. Will be updated. Necessarily 0 <= pos <= size */ 5992b9c00cbSConrad Meyer } ZSTD_outBuffer; 6002b9c00cbSConrad Meyer 6012b9c00cbSConrad Meyer 6022b9c00cbSConrad Meyer 6032b9c00cbSConrad Meyer /*-*********************************************************************** 6042b9c00cbSConrad Meyer * Streaming compression - HowTo 6052b9c00cbSConrad Meyer * 6062b9c00cbSConrad Meyer * A ZSTD_CStream object is required to track streaming operation. 6072b9c00cbSConrad Meyer * Use ZSTD_createCStream() and ZSTD_freeCStream() to create/release resources. 6082b9c00cbSConrad Meyer * ZSTD_CStream objects can be reused multiple times on consecutive compression operations. 6092b9c00cbSConrad Meyer * It is recommended to re-use ZSTD_CStream since it will play nicer with system's memory, by re-using already allocated memory. 
6102b9c00cbSConrad Meyer * 6112b9c00cbSConrad Meyer * For parallel execution, use one separate ZSTD_CStream per thread. 6122b9c00cbSConrad Meyer * 6132b9c00cbSConrad Meyer * note : since v1.3.0, ZSTD_CStream and ZSTD_CCtx are the same thing. 6142b9c00cbSConrad Meyer * 6152b9c00cbSConrad Meyer * Parameters are sticky : when starting a new compression on the same context, 6162b9c00cbSConrad Meyer * it will re-use the same sticky parameters as previous compression session. 6172b9c00cbSConrad Meyer * When in doubt, it's recommended to fully initialize the context before usage. 6182b9c00cbSConrad Meyer * Use ZSTD_CCtx_reset() to reset the context and ZSTD_CCtx_setParameter(), 6192b9c00cbSConrad Meyer * ZSTD_CCtx_setPledgedSrcSize(), or ZSTD_CCtx_loadDictionary() and friends to 6202b9c00cbSConrad Meyer * set more specific parameters, the pledged source size, or load a dictionary. 6212b9c00cbSConrad Meyer * 6222b9c00cbSConrad Meyer * Use ZSTD_compressStream2() with ZSTD_e_continue as many times as necessary to 6232b9c00cbSConrad Meyer * consume input stream. The function will automatically update both `pos` 6242b9c00cbSConrad Meyer * fields within `input` and `output`. 6252b9c00cbSConrad Meyer * Note that the function may not consume the entire input, for example, because 6262b9c00cbSConrad Meyer * the output buffer is already full, in which case `input.pos < input.size`. 6272b9c00cbSConrad Meyer * The caller must check if input has been entirely consumed. 6282b9c00cbSConrad Meyer * If not, the caller must make some room to receive more compressed data, 6292b9c00cbSConrad Meyer * and then present again remaining input data. 6302b9c00cbSConrad Meyer * note: ZSTD_e_continue is guaranteed to make some forward progress when called, 6312b9c00cbSConrad Meyer * but doesn't guarantee maximal forward progress. This is especially relevant 6322b9c00cbSConrad Meyer * when compressing with multiple threads. 
The call won't block if it can 6332b9c00cbSConrad Meyer * consume some input, but if it can't it will wait for some, but not all, 6342b9c00cbSConrad Meyer * output to be flushed. 6352b9c00cbSConrad Meyer * @return : provides a minimum amount of data remaining to be flushed from internal buffers 6362b9c00cbSConrad Meyer * or an error code, which can be tested using ZSTD_isError(). 6372b9c00cbSConrad Meyer * 6382b9c00cbSConrad Meyer * At any moment, it's possible to flush whatever data might remain stuck within internal buffer, 6392b9c00cbSConrad Meyer * using ZSTD_compressStream2() with ZSTD_e_flush. `output->pos` will be updated. 6402b9c00cbSConrad Meyer * Note that, if `output->size` is too small, a single invocation with ZSTD_e_flush might not be enough (return code > 0). 6412b9c00cbSConrad Meyer * In which case, make some room to receive more compressed data, and call again ZSTD_compressStream2() with ZSTD_e_flush. 6422b9c00cbSConrad Meyer * You must continue calling ZSTD_compressStream2() with ZSTD_e_flush until it returns 0, at which point you can change the 6432b9c00cbSConrad Meyer * operation. 6442b9c00cbSConrad Meyer * note: ZSTD_e_flush will flush as much output as possible, meaning when compressing with multiple threads, it will 6452b9c00cbSConrad Meyer * block until the flush is complete or the output buffer is full. 6462b9c00cbSConrad Meyer * @return : 0 if internal buffers are entirely flushed, 6472b9c00cbSConrad Meyer * >0 if some data still present within internal buffer (the value is minimal estimation of remaining size), 6482b9c00cbSConrad Meyer * or an error code, which can be tested using ZSTD_isError(). 6492b9c00cbSConrad Meyer * 6502b9c00cbSConrad Meyer * Calling ZSTD_compressStream2() with ZSTD_e_end instructs to finish a frame. 6512b9c00cbSConrad Meyer * It will perform a flush and write frame epilogue. 6522b9c00cbSConrad Meyer * The epilogue is required for decoders to consider a frame completed. 
6532b9c00cbSConrad Meyer * flush operation is the same, and follows same rules as calling ZSTD_compressStream2() with ZSTD_e_flush. 6542b9c00cbSConrad Meyer * You must continue calling ZSTD_compressStream2() with ZSTD_e_end until it returns 0, at which point you are free to 6552b9c00cbSConrad Meyer * start a new frame. 6562b9c00cbSConrad Meyer * note: ZSTD_e_end will flush as much output as possible, meaning when compressing with multiple threads, it will 6572b9c00cbSConrad Meyer * block until the flush is complete or the output buffer is full. 6582b9c00cbSConrad Meyer * @return : 0 if frame fully completed and fully flushed, 6592b9c00cbSConrad Meyer * >0 if some data still present within internal buffer (the value is minimal estimation of remaining size), 6602b9c00cbSConrad Meyer * or an error code, which can be tested using ZSTD_isError(). 6612b9c00cbSConrad Meyer * 6622b9c00cbSConrad Meyer * *******************************************************************/ 6632b9c00cbSConrad Meyer 6642b9c00cbSConrad Meyer typedef ZSTD_CCtx ZSTD_CStream; /**< CCtx and CStream are now effectively same object (>= v1.3.0) */ 6652b9c00cbSConrad Meyer /* Continue to distinguish them for compatibility with older versions <= v1.2.0 */ 6662b9c00cbSConrad Meyer /*===== ZSTD_CStream management functions =====*/ 6672b9c00cbSConrad Meyer ZSTDLIB_API ZSTD_CStream* ZSTD_createCStream(void); 6682b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_freeCStream(ZSTD_CStream* zcs); 6692b9c00cbSConrad Meyer 6702b9c00cbSConrad Meyer /*===== Streaming compression functions =====*/ 6712b9c00cbSConrad Meyer typedef enum { 6722b9c00cbSConrad Meyer ZSTD_e_continue=0, /* collect more data, encoder decides when to output compressed result, for optimal compression ratio */ 6732b9c00cbSConrad Meyer ZSTD_e_flush=1, /* flush any data provided so far, 6742b9c00cbSConrad Meyer * it creates (at least) one new block, that can be decoded immediately on reception; 6752b9c00cbSConrad Meyer * frame will continue: any 
future data can still reference previously compressed data, improving compression. 6762b9c00cbSConrad Meyer * note : multithreaded compression will block to flush as much output as possible. */ 6772b9c00cbSConrad Meyer ZSTD_e_end=2 /* flush any remaining data _and_ close current frame. 6782b9c00cbSConrad Meyer * note that frame is only closed after compressed data is fully flushed (return value == 0). 6792b9c00cbSConrad Meyer * After that point, any additional data starts a new frame. 6802b9c00cbSConrad Meyer * note : each frame is independent (does not reference any content from previous frame). 6812b9c00cbSConrad Meyer * note : multithreaded compression will block to flush as much output as possible. */ 6822b9c00cbSConrad Meyer } ZSTD_EndDirective; 6832b9c00cbSConrad Meyer 6842b9c00cbSConrad Meyer /*! ZSTD_compressStream2() : 6852b9c00cbSConrad Meyer * Behaves about the same as ZSTD_compressStream, with additional control on end directive. 6862b9c00cbSConrad Meyer * - Compression parameters are pushed into CCtx before starting compression, using ZSTD_CCtx_set*() 6872b9c00cbSConrad Meyer * - Compression parameters cannot be changed once compression is started (save a list of exceptions in multi-threading mode) 6882b9c00cbSConrad Meyer * - output->pos must be <= output->size, input->pos must be <= input->size 6892b9c00cbSConrad Meyer * - output->pos and input->pos will be updated. They are guaranteed to never exceed their respective limit. 690*f7cd7fe5SConrad Meyer * - endOp must be a valid directive 6912b9c00cbSConrad Meyer * - When nbWorkers==0 (default), function is blocking : it completes its job before returning to caller. 692*f7cd7fe5SConrad Meyer * - When nbWorkers>=1, function is non-blocking : it copies a portion of input, distributes jobs to internal worker threads, flushes to output whatever is available, 6932b9c00cbSConrad Meyer * and then immediately returns, just indicating that there is some data remaining to be flushed.
6942b9c00cbSConrad Meyer * The function nonetheless guarantees forward progress : it will return only after it reads or writes at least 1 byte. 6952b9c00cbSConrad Meyer * - Exception : if the first call requests a ZSTD_e_end directive and provides enough dstCapacity, the function delegates to ZSTD_compress2() which is always blocking. 6962b9c00cbSConrad Meyer * - @return provides a minimum amount of data remaining to be flushed from internal buffers 6972b9c00cbSConrad Meyer * or an error code, which can be tested using ZSTD_isError(). 6982b9c00cbSConrad Meyer * if @return != 0, flush is not fully completed, there is still some data left within internal buffers. 6992b9c00cbSConrad Meyer * This is useful for ZSTD_e_flush, since in this case more flushes are necessary to empty all buffers. 7002b9c00cbSConrad Meyer * For ZSTD_e_end, @return == 0 when internal buffers are fully flushed and frame is completed. 7012b9c00cbSConrad Meyer * - after a ZSTD_e_end directive, if internal buffer is not fully flushed (@return != 0), 7022b9c00cbSConrad Meyer * only ZSTD_e_end or ZSTD_e_flush operations are allowed. 7032b9c00cbSConrad Meyer * Before starting a new compression job, or changing compression parameters, 7042b9c00cbSConrad Meyer * it is required to fully flush internal buffers. 7052b9c00cbSConrad Meyer */ 7062b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_compressStream2( ZSTD_CCtx* cctx, 7072b9c00cbSConrad Meyer ZSTD_outBuffer* output, 7082b9c00cbSConrad Meyer ZSTD_inBuffer* input, 7092b9c00cbSConrad Meyer ZSTD_EndDirective endOp); 7102b9c00cbSConrad Meyer 7112b9c00cbSConrad Meyer 7124d3f1eafSConrad Meyer /* These buffer sizes are softly recommended. 7134d3f1eafSConrad Meyer * They are not required : ZSTD_compressStream*() happily accepts any buffer size, for both input and output.
7144d3f1eafSConrad Meyer * Respecting the recommended size just makes it a bit easier for ZSTD_compressStream*(), 7154d3f1eafSConrad Meyer * reducing the amount of memory shuffling and buffering, resulting in minor performance savings. 7164d3f1eafSConrad Meyer * 7174d3f1eafSConrad Meyer * However, note that these recommendations are from the perspective of a C caller program. 7184d3f1eafSConrad Meyer * If the streaming interface is invoked from some other language, 7194d3f1eafSConrad Meyer * especially managed ones such as Java or Go, through a foreign function interface such as jni or cgo, 7204d3f1eafSConrad Meyer * a major performance rule is to reduce crossings of such an interface to an absolute minimum. 7214d3f1eafSConrad Meyer * It's not rare for more time to be spent crossing the interface than in compression itself. 7224d3f1eafSConrad Meyer * In such cases, prefer using large buffers, as large as practical, 7234d3f1eafSConrad Meyer * for both input and output, to reduce the number of round trips. 7244d3f1eafSConrad Meyer */ 7254d3f1eafSConrad Meyer ZSTDLIB_API size_t ZSTD_CStreamInSize(void); /**< recommended size for input buffer */ 7264d3f1eafSConrad Meyer ZSTDLIB_API size_t ZSTD_CStreamOutSize(void); /**< recommended size for output buffer. Guaranteed to successfully flush at least one complete compressed block. */ 7274d3f1eafSConrad Meyer 7284d3f1eafSConrad Meyer 7294d3f1eafSConrad Meyer /* ***************************************************************************** 7304d3f1eafSConrad Meyer * The following is a legacy streaming API. 7314d3f1eafSConrad Meyer * It can be replaced by ZSTD_CCtx_reset() and ZSTD_compressStream2(). 7324d3f1eafSConrad Meyer * It is redundant, but remains fully supported. 7332b9c00cbSConrad Meyer * Advanced parameters and dictionary compression can only be used through the 7342b9c00cbSConrad Meyer * new API.
7352b9c00cbSConrad Meyer ******************************************************************************/ 7362b9c00cbSConrad Meyer 7374d3f1eafSConrad Meyer /*! 7382b9c00cbSConrad Meyer * Equivalent to: 7392b9c00cbSConrad Meyer * 7402b9c00cbSConrad Meyer * ZSTD_CCtx_reset(zcs, ZSTD_reset_session_only); 7412b9c00cbSConrad Meyer * ZSTD_CCtx_refCDict(zcs, NULL); // clear the dictionary (if any) 7422b9c00cbSConrad Meyer * ZSTD_CCtx_setParameter(zcs, ZSTD_c_compressionLevel, compressionLevel); 7432b9c00cbSConrad Meyer */ 7442b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_initCStream(ZSTD_CStream* zcs, int compressionLevel); 7454d3f1eafSConrad Meyer /*! 7462b9c00cbSConrad Meyer * Alternative for ZSTD_compressStream2(zcs, output, input, ZSTD_e_continue). 7472b9c00cbSConrad Meyer * NOTE: The return value is different. ZSTD_compressStream() returns a hint for 7482b9c00cbSConrad Meyer * the next read size (if non-zero and not an error). ZSTD_compressStream2() 7494d3f1eafSConrad Meyer * returns the minimum nb of bytes left to flush (if non-zero and not an error). 7502b9c00cbSConrad Meyer */ 7512b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_compressStream(ZSTD_CStream* zcs, ZSTD_outBuffer* output, ZSTD_inBuffer* input); 7524d3f1eafSConrad Meyer /*! Equivalent to ZSTD_compressStream2(zcs, output, &emptyInput, ZSTD_e_flush). */ 7532b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_flushStream(ZSTD_CStream* zcs, ZSTD_outBuffer* output); 7544d3f1eafSConrad Meyer /*! Equivalent to ZSTD_compressStream2(zcs, output, &emptyInput, ZSTD_e_end). */ 7552b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_endStream(ZSTD_CStream* zcs, ZSTD_outBuffer* output); 7562b9c00cbSConrad Meyer 7572b9c00cbSConrad Meyer 7582b9c00cbSConrad Meyer /*-*************************************************************************** 7592b9c00cbSConrad Meyer * Streaming decompression - HowTo 7602b9c00cbSConrad Meyer * 7612b9c00cbSConrad Meyer * A ZSTD_DStream object is required to track streaming operations. 
7622b9c00cbSConrad Meyer * Use ZSTD_createDStream() and ZSTD_freeDStream() to create/release resources. 7632b9c00cbSConrad Meyer * ZSTD_DStream objects can be re-used multiple times. 7642b9c00cbSConrad Meyer * 7652b9c00cbSConrad Meyer * Use ZSTD_initDStream() to start a new decompression operation. 7662b9c00cbSConrad Meyer * @return : recommended first input size 7672b9c00cbSConrad Meyer * Alternatively, use advanced API to set specific properties. 7682b9c00cbSConrad Meyer * 7692b9c00cbSConrad Meyer * Use ZSTD_decompressStream() repeatedly to consume your input. 7702b9c00cbSConrad Meyer * The function will update both `pos` fields. 7712b9c00cbSConrad Meyer * If `input.pos < input.size`, some input has not been consumed. 7722b9c00cbSConrad Meyer * It's up to the caller to present the remaining data again. 7732b9c00cbSConrad Meyer * The function tries to flush all data decoded immediately, respecting output buffer size. 7742b9c00cbSConrad Meyer * If `output.pos < output.size`, decoder has flushed everything it could. 7752b9c00cbSConrad Meyer * But if `output.pos == output.size`, there might be some data left within internal buffers, 7762b9c00cbSConrad Meyer * in which case, call ZSTD_decompressStream() again to flush whatever remains in the buffer. 7772b9c00cbSConrad Meyer * Note : with no additional input provided, amount of data flushed is necessarily <= ZSTD_BLOCKSIZE_MAX. 7782b9c00cbSConrad Meyer * @return : 0 when a frame is completely decoded and fully flushed, 7792b9c00cbSConrad Meyer * or an error code, which can be tested using ZSTD_isError(), 7802b9c00cbSConrad Meyer * or any other value > 0, which means there is still some decoding or flushing to do to complete current frame : 7812b9c00cbSConrad Meyer * the return value is a suggested next input size (just a hint for better latency) 7822b9c00cbSConrad Meyer * that will never request more than the remaining frame size.
7832b9c00cbSConrad Meyer * *******************************************************************************/ 7842b9c00cbSConrad Meyer 7852b9c00cbSConrad Meyer typedef ZSTD_DCtx ZSTD_DStream; /**< DCtx and DStream are now effectively same object (>= v1.3.0) */ 7862b9c00cbSConrad Meyer /* For compatibility with versions <= v1.2.0, prefer differentiating them. */ 7872b9c00cbSConrad Meyer /*===== ZSTD_DStream management functions =====*/ 7882b9c00cbSConrad Meyer ZSTDLIB_API ZSTD_DStream* ZSTD_createDStream(void); 7892b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_freeDStream(ZSTD_DStream* zds); 7902b9c00cbSConrad Meyer 7912b9c00cbSConrad Meyer /*===== Streaming decompression functions =====*/ 7922b9c00cbSConrad Meyer 7932b9c00cbSConrad Meyer /* This function is redundant with the advanced API and equivalent to: 7942b9c00cbSConrad Meyer * 79537f1f268SConrad Meyer * ZSTD_DCtx_reset(zds, ZSTD_reset_session_only); 7962b9c00cbSConrad Meyer * ZSTD_DCtx_refDDict(zds, NULL); 7972b9c00cbSConrad Meyer */ 7982b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_initDStream(ZSTD_DStream* zds); 7992b9c00cbSConrad Meyer 8002b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_decompressStream(ZSTD_DStream* zds, ZSTD_outBuffer* output, ZSTD_inBuffer* input); 8012b9c00cbSConrad Meyer 8022b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_DStreamInSize(void); /*!< recommended size for input buffer */ 8032b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_DStreamOutSize(void); /*!< recommended size for output buffer. Guarantee to successfully flush at least one complete block in all circumstances. */ 8042b9c00cbSConrad Meyer 8052b9c00cbSConrad Meyer 8062b9c00cbSConrad Meyer /************************** 8072b9c00cbSConrad Meyer * Simple dictionary API 8082b9c00cbSConrad Meyer ***************************/ 8092b9c00cbSConrad Meyer /*! ZSTD_compress_usingDict() : 8102b9c00cbSConrad Meyer * Compression at an explicit compression level using a Dictionary. 
8112b9c00cbSConrad Meyer * A dictionary can be any arbitrary data segment (also called a prefix), 8122b9c00cbSConrad Meyer * or a buffer with specified information (see dictBuilder/zdict.h). 8132b9c00cbSConrad Meyer * Note : This function loads the dictionary, resulting in significant startup delay. 8142b9c00cbSConrad Meyer * It's intended for a dictionary used only once. 8152b9c00cbSConrad Meyer * Note 2 : When `dict == NULL || dictSize < 8` no dictionary is used. */ 8162b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_compress_usingDict(ZSTD_CCtx* ctx, 8172b9c00cbSConrad Meyer void* dst, size_t dstCapacity, 8182b9c00cbSConrad Meyer const void* src, size_t srcSize, 8192b9c00cbSConrad Meyer const void* dict,size_t dictSize, 8202b9c00cbSConrad Meyer int compressionLevel); 8212b9c00cbSConrad Meyer 8222b9c00cbSConrad Meyer /*! ZSTD_decompress_usingDict() : 8232b9c00cbSConrad Meyer * Decompression using a known Dictionary. 8242b9c00cbSConrad Meyer * Dictionary must be identical to the one used during compression. 8252b9c00cbSConrad Meyer * Note : This function loads the dictionary, resulting in significant startup delay. 8262b9c00cbSConrad Meyer * It's intended for a dictionary used only once. 8272b9c00cbSConrad Meyer * Note : When `dict == NULL || dictSize < 8` no dictionary is used. */ 8282b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_decompress_usingDict(ZSTD_DCtx* dctx, 8292b9c00cbSConrad Meyer void* dst, size_t dstCapacity, 8302b9c00cbSConrad Meyer const void* src, size_t srcSize, 8312b9c00cbSConrad Meyer const void* dict,size_t dictSize); 8322b9c00cbSConrad Meyer 8332b9c00cbSConrad Meyer 8342b9c00cbSConrad Meyer /*********************************** 8352b9c00cbSConrad Meyer * Bulk processing dictionary API 8362b9c00cbSConrad Meyer **********************************/ 8372b9c00cbSConrad Meyer typedef struct ZSTD_CDict_s ZSTD_CDict; 8382b9c00cbSConrad Meyer 8392b9c00cbSConrad Meyer /*! 
ZSTD_createCDict() : 8409cbefe25SConrad Meyer * When compressing multiple messages or blocks using the same dictionary, 8419cbefe25SConrad Meyer * it's recommended to digest the dictionary only once, since it's a costly operation. 8429cbefe25SConrad Meyer * ZSTD_createCDict() will create a state from digesting a dictionary. 8439cbefe25SConrad Meyer * The resulting state can be used for future compression operations with very limited startup cost. 8442b9c00cbSConrad Meyer * ZSTD_CDict can be created once and shared by multiple threads concurrently, since its usage is read-only. 8459cbefe25SConrad Meyer * @dictBuffer can be released after ZSTD_CDict creation, because its content is copied within CDict. 8469cbefe25SConrad Meyer * Note 1 : Consider experimental function `ZSTD_createCDict_byReference()` if you prefer to not duplicate @dictBuffer content. 8479cbefe25SConrad Meyer * Note 2 : A ZSTD_CDict can be created from an empty @dictBuffer, 8489cbefe25SConrad Meyer * in which case the only thing that it transports is the @compressionLevel. 8499cbefe25SConrad Meyer * This can be useful in a pipeline featuring ZSTD_compress_usingCDict() exclusively, 8509cbefe25SConrad Meyer * expecting a ZSTD_CDict parameter with any data, including those without a known dictionary. */ 8512b9c00cbSConrad Meyer ZSTDLIB_API ZSTD_CDict* ZSTD_createCDict(const void* dictBuffer, size_t dictSize, 8522b9c00cbSConrad Meyer int compressionLevel); 8532b9c00cbSConrad Meyer 8542b9c00cbSConrad Meyer /*! ZSTD_freeCDict() : 8552b9c00cbSConrad Meyer * Function frees memory allocated by ZSTD_createCDict(). */ 8562b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_freeCDict(ZSTD_CDict* CDict); 8572b9c00cbSConrad Meyer 8582b9c00cbSConrad Meyer /*! ZSTD_compress_usingCDict() : 8592b9c00cbSConrad Meyer * Compression using a digested Dictionary. 8602b9c00cbSConrad Meyer * Recommended when same dictionary is used multiple times. 
8612b9c00cbSConrad Meyer * Note : compression level is _decided at dictionary creation time_, 8622b9c00cbSConrad Meyer * and frame parameters are hardcoded (dictID=yes, contentSize=yes, checksum=no) */ 8632b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_compress_usingCDict(ZSTD_CCtx* cctx, 8642b9c00cbSConrad Meyer void* dst, size_t dstCapacity, 8652b9c00cbSConrad Meyer const void* src, size_t srcSize, 8662b9c00cbSConrad Meyer const ZSTD_CDict* cdict); 8672b9c00cbSConrad Meyer 8682b9c00cbSConrad Meyer 8692b9c00cbSConrad Meyer typedef struct ZSTD_DDict_s ZSTD_DDict; 8702b9c00cbSConrad Meyer 8712b9c00cbSConrad Meyer /*! ZSTD_createDDict() : 8722b9c00cbSConrad Meyer * Create a digested dictionary, ready to start decompression operation without startup delay. 8732b9c00cbSConrad Meyer * dictBuffer can be released after DDict creation, as its content is copied inside DDict. */ 8742b9c00cbSConrad Meyer ZSTDLIB_API ZSTD_DDict* ZSTD_createDDict(const void* dictBuffer, size_t dictSize); 8752b9c00cbSConrad Meyer 8762b9c00cbSConrad Meyer /*! ZSTD_freeDDict() : 8772b9c00cbSConrad Meyer * Function frees memory allocated with ZSTD_createDDict() */ 8782b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_freeDDict(ZSTD_DDict* ddict); 8792b9c00cbSConrad Meyer 8802b9c00cbSConrad Meyer /*! ZSTD_decompress_usingDDict() : 8812b9c00cbSConrad Meyer * Decompression using a digested Dictionary. 8822b9c00cbSConrad Meyer * Recommended when same dictionary is used multiple times. */ 8832b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_decompress_usingDDict(ZSTD_DCtx* dctx, 8842b9c00cbSConrad Meyer void* dst, size_t dstCapacity, 8852b9c00cbSConrad Meyer const void* src, size_t srcSize, 8862b9c00cbSConrad Meyer const ZSTD_DDict* ddict); 8872b9c00cbSConrad Meyer 8882b9c00cbSConrad Meyer 8892b9c00cbSConrad Meyer /******************************** 8902b9c00cbSConrad Meyer * Dictionary helper functions 8912b9c00cbSConrad Meyer *******************************/ 8922b9c00cbSConrad Meyer 8932b9c00cbSConrad Meyer /*! 
ZSTD_getDictID_fromDict() : 8942b9c00cbSConrad Meyer * Provides the dictID stored within dictionary. 8952b9c00cbSConrad Meyer * if @return == 0, the dictionary is not conformant with Zstandard specification. 8962b9c00cbSConrad Meyer * It can still be loaded, but as a content-only dictionary. */ 8972b9c00cbSConrad Meyer ZSTDLIB_API unsigned ZSTD_getDictID_fromDict(const void* dict, size_t dictSize); 8982b9c00cbSConrad Meyer 8992b9c00cbSConrad Meyer /*! ZSTD_getDictID_fromDDict() : 9002b9c00cbSConrad Meyer * Provides the dictID of the dictionary loaded into `ddict`. 9012b9c00cbSConrad Meyer * If @return == 0, the dictionary is not conformant to Zstandard specification, or empty. 9022b9c00cbSConrad Meyer * Non-conformant dictionaries can still be loaded, but as content-only dictionaries. */ 9032b9c00cbSConrad Meyer ZSTDLIB_API unsigned ZSTD_getDictID_fromDDict(const ZSTD_DDict* ddict); 9042b9c00cbSConrad Meyer 9052b9c00cbSConrad Meyer /*! ZSTD_getDictID_fromFrame() : 9062b9c00cbSConrad Meyer * Provides the dictID required to decompress the frame stored within `src`. 9072b9c00cbSConrad Meyer * If @return == 0, the dictID could not be decoded. 9082b9c00cbSConrad Meyer * This could be for one of the following reasons : 9092b9c00cbSConrad Meyer * - The frame does not require a dictionary to be decoded (most common case). 9102b9c00cbSConrad Meyer * - The frame was built with dictID intentionally removed. Whatever dictionary is necessary is a hidden information. 9112b9c00cbSConrad Meyer * Note : this use case also happens when using a non-conformant dictionary. 9122b9c00cbSConrad Meyer * - `srcSize` is too small, and as a result, the frame header could not be decoded (only possible if `srcSize < ZSTD_FRAMEHEADERSIZE_MAX`). 9132b9c00cbSConrad Meyer * - This is not a Zstandard frame. 9142b9c00cbSConrad Meyer * When identifying the exact failure cause, it's possible to use ZSTD_getFrameHeader(), which will provide a more precise error code.
*/ 9152b9c00cbSConrad Meyer ZSTDLIB_API unsigned ZSTD_getDictID_fromFrame(const void* src, size_t srcSize); 9162b9c00cbSConrad Meyer 9172b9c00cbSConrad Meyer 9182b9c00cbSConrad Meyer /******************************************************************************* 9192b9c00cbSConrad Meyer * Advanced dictionary and prefix API 9202b9c00cbSConrad Meyer * 9212b9c00cbSConrad Meyer * This API allows dictionaries to be used with ZSTD_compress2(), 9222b9c00cbSConrad Meyer * ZSTD_compressStream2(), and ZSTD_decompress(). Dictionaries are sticky, and 9232b9c00cbSConrad Meyer * only reset when the context is reset with ZSTD_reset_parameters or 9242b9c00cbSConrad Meyer * ZSTD_reset_session_and_parameters. Prefixes are single-use. 9252b9c00cbSConrad Meyer ******************************************************************************/ 9262b9c00cbSConrad Meyer 9272b9c00cbSConrad Meyer 928a0483764SConrad Meyer /*! ZSTD_CCtx_loadDictionary() : 929a0483764SConrad Meyer * Create an internal CDict from `dict` buffer. 930a0483764SConrad Meyer * Decompression will have to use same dictionary. 931a0483764SConrad Meyer * @result : 0, or an error code (which can be tested with ZSTD_isError()). 932a0483764SConrad Meyer * Special: Loading a NULL (or 0-size) dictionary invalidates previous dictionary, 933a0483764SConrad Meyer * meaning "return to no-dictionary mode". 934a0483764SConrad Meyer * Note 1 : Dictionary is sticky, it will be used for all future compressed frames. 935a0483764SConrad Meyer * To return to "no-dictionary" situation, load a NULL dictionary (or reset parameters). 936a0483764SConrad Meyer * Note 2 : Loading a dictionary involves building tables. 937a0483764SConrad Meyer * It's also a CPU consuming operation, with non-negligible impact on latency. 938a0483764SConrad Meyer * Tables are dependent on compression parameters, and for this reason, 939a0483764SConrad Meyer * compression parameters can no longer be changed after loading a dictionary.
940a0483764SConrad Meyer * Note 3 :`dict` content will be copied internally. 941a0483764SConrad Meyer * Use experimental ZSTD_CCtx_loadDictionary_byReference() to reference content instead. 942a0483764SConrad Meyer * In such a case, dictionary buffer must outlive its users. 943a0483764SConrad Meyer * Note 4 : Use ZSTD_CCtx_loadDictionary_advanced() 944a0483764SConrad Meyer * to precisely select how dictionary content must be interpreted. */ 945a0483764SConrad Meyer ZSTDLIB_API size_t ZSTD_CCtx_loadDictionary(ZSTD_CCtx* cctx, const void* dict, size_t dictSize); 946a0483764SConrad Meyer 947a0483764SConrad Meyer /*! ZSTD_CCtx_refCDict() : 948a0483764SConrad Meyer * Reference a prepared dictionary, to be used for all next compressed frames. 949a0483764SConrad Meyer * Note that compression parameters are enforced from within CDict, 9502b9c00cbSConrad Meyer * and supersede any compression parameter previously set within CCtx. 9512b9c00cbSConrad Meyer * The parameters ignored are labeled as "superseded-by-cdict" in the ZSTD_cParameter enum docs. 9522b9c00cbSConrad Meyer * The ignored parameters will be used again if the CCtx is returned to no-dictionary mode. 953a0483764SConrad Meyer * The dictionary will remain valid for future compressed frames using same CCtx. 954a0483764SConrad Meyer * @result : 0, or an error code (which can be tested with ZSTD_isError()). 955a0483764SConrad Meyer * Special : Referencing a NULL CDict means "return to no-dictionary mode". 956a0483764SConrad Meyer * Note 1 : Currently, only one dictionary can be managed. 957a0483764SConrad Meyer * Referencing a new dictionary effectively "discards" any previous one. 958a0483764SConrad Meyer * Note 2 : CDict is just referenced, its lifetime must outlive its usage within CCtx. */ 959a0483764SConrad Meyer ZSTDLIB_API size_t ZSTD_CCtx_refCDict(ZSTD_CCtx* cctx, const ZSTD_CDict* cdict); 960a0483764SConrad Meyer 961a0483764SConrad Meyer /*!
ZSTD_CCtx_refPrefix() : 962a0483764SConrad Meyer * Reference a prefix (single-usage dictionary) for next compressed frame. 963a0483764SConrad Meyer * A prefix is **only used once**. Tables are discarded at end of frame (ZSTD_e_end). 964a0483764SConrad Meyer * Decompression will need same prefix to properly regenerate data. 965a0483764SConrad Meyer * Compressing with a prefix is similar in outcome as performing a diff and compressing it, 966a0483764SConrad Meyer * but performs much faster, especially during decompression (compression speed is tunable with compression level). 967a0483764SConrad Meyer * @result : 0, or an error code (which can be tested with ZSTD_isError()). 968a0483764SConrad Meyer * Special: Adding any prefix (including NULL) invalidates any previous prefix or dictionary 969a0483764SConrad Meyer * Note 1 : Prefix buffer is referenced. It **must** outlive compression. 970a0483764SConrad Meyer * Its content must remain unmodified during compression. 971a0483764SConrad Meyer * Note 2 : If the intention is to diff some large src data blob with some prior version of itself, 972a0483764SConrad Meyer * ensure that the window size is large enough to contain the entire source. 973a0483764SConrad Meyer * See ZSTD_c_windowLog. 974a0483764SConrad Meyer * Note 3 : Referencing a prefix involves building tables, which are dependent on compression parameters. 975a0483764SConrad Meyer * It's a CPU consuming operation, with non-negligible impact on latency. 976a0483764SConrad Meyer * If there is a need to use the same prefix multiple times, consider loadDictionary instead. 9779cbefe25SConrad Meyer * Note 4 : By default, the prefix is interpreted as raw content (ZSTD_dct_rawContent). 978a0483764SConrad Meyer * Use experimental ZSTD_CCtx_refPrefix_advanced() to alter dictionary interpretation. 
*/ 979a0483764SConrad Meyer ZSTDLIB_API size_t ZSTD_CCtx_refPrefix(ZSTD_CCtx* cctx, 980a0483764SConrad Meyer const void* prefix, size_t prefixSize); 981a0483764SConrad Meyer 982a0483764SConrad Meyer /*! ZSTD_DCtx_loadDictionary() : 983a0483764SConrad Meyer * Create an internal DDict from dict buffer, 984a0483764SConrad Meyer * to be used to decompress next frames. 985a0483764SConrad Meyer * The dictionary remains valid for all future frames, until explicitly invalidated. 986a0483764SConrad Meyer * @result : 0, or an error code (which can be tested with ZSTD_isError()). 987a0483764SConrad Meyer * Special : Adding a NULL (or 0-size) dictionary invalidates any previous dictionary, 988a0483764SConrad Meyer * meaning "return to no-dictionary mode". 989a0483764SConrad Meyer * Note 1 : Loading a dictionary involves building tables, 990a0483764SConrad Meyer * which has a non-negligible impact on CPU usage and latency. 991a0483764SConrad Meyer * It's recommended to "load once, use many times", to amortize the cost 992a0483764SConrad Meyer * Note 2 :`dict` content will be copied internally, so `dict` can be released after loading. 993a0483764SConrad Meyer * Use ZSTD_DCtx_loadDictionary_byReference() to reference dictionary content instead. 994a0483764SConrad Meyer * Note 3 : Use ZSTD_DCtx_loadDictionary_advanced() to take control of 995a0483764SConrad Meyer * how dictionary content is loaded and interpreted. 996a0483764SConrad Meyer */ 997a0483764SConrad Meyer ZSTDLIB_API size_t ZSTD_DCtx_loadDictionary(ZSTD_DCtx* dctx, const void* dict, size_t dictSize); 998a0483764SConrad Meyer 999a0483764SConrad Meyer /*! ZSTD_DCtx_refDDict() : 1000a0483764SConrad Meyer * Reference a prepared dictionary, to be used to decompress next frames. 1001a0483764SConrad Meyer * The dictionary remains active for decompression of future frames using same DCtx. 1002a0483764SConrad Meyer * @result : 0, or an error code (which can be tested with ZSTD_isError()). 
1003a0483764SConrad Meyer * Note 1 : Currently, only one dictionary can be managed. 1004a0483764SConrad Meyer * Referencing a new dictionary effectively "discards" any previous one. 1005a0483764SConrad Meyer * Special: referencing a NULL DDict means "return to no-dictionary mode". 1006a0483764SConrad Meyer * Note 2 : DDict is just referenced, its lifetime must outlive its usage from DCtx. 1007a0483764SConrad Meyer */ 1008a0483764SConrad Meyer ZSTDLIB_API size_t ZSTD_DCtx_refDDict(ZSTD_DCtx* dctx, const ZSTD_DDict* ddict); 1009a0483764SConrad Meyer 1010a0483764SConrad Meyer /*! ZSTD_DCtx_refPrefix() : 1011a0483764SConrad Meyer * Reference a prefix (single-usage dictionary) to decompress next frame. 1012a0483764SConrad Meyer * This is the reverse operation of ZSTD_CCtx_refPrefix(), 1013a0483764SConrad Meyer * and must use the same prefix as the one used during compression. 1014a0483764SConrad Meyer * Prefix is **only used once**. Reference is discarded at end of frame. 1015a0483764SConrad Meyer * End of frame is reached when ZSTD_decompressStream() returns 0. 1016a0483764SConrad Meyer * @result : 0, or an error code (which can be tested with ZSTD_isError()). 1017a0483764SConrad Meyer * Note 1 : Adding any prefix (including NULL) invalidates any previously set prefix or dictionary 1018a0483764SConrad Meyer * Note 2 : Prefix buffer is referenced. It **must** outlive decompression. 1019a0483764SConrad Meyer * Prefix buffer must remain unmodified up to the end of frame, 1020a0483764SConrad Meyer * reached when ZSTD_decompressStream() returns 0. 10219cbefe25SConrad Meyer * Note 3 : By default, the prefix is treated as raw content (ZSTD_dct_rawContent). 1022a0483764SConrad Meyer * Use ZSTD_DCtx_refPrefix_advanced() to alter dictMode (Experimental section) 1023a0483764SConrad Meyer * Note 4 : Referencing a raw content prefix has almost no cpu nor memory cost. 1024a0483764SConrad Meyer * A full dictionary is more costly, as it requires building tables.
1025a0483764SConrad Meyer */ 1026a0483764SConrad Meyer ZSTDLIB_API size_t ZSTD_DCtx_refPrefix(ZSTD_DCtx* dctx, 1027a0483764SConrad Meyer const void* prefix, size_t prefixSize); 1028a0483764SConrad Meyer 10292b9c00cbSConrad Meyer /* === Memory management === */ 10302b9c00cbSConrad Meyer 10312b9c00cbSConrad Meyer /*! ZSTD_sizeof_*() : 10322b9c00cbSConrad Meyer * These functions give the _current_ memory usage of selected object. 10332b9c00cbSConrad Meyer * Note that object memory usage can evolve (increase or decrease) over time. */ 10342b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_sizeof_CCtx(const ZSTD_CCtx* cctx); 10352b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_sizeof_DCtx(const ZSTD_DCtx* dctx); 10362b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_sizeof_CStream(const ZSTD_CStream* zcs); 10372b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_sizeof_DStream(const ZSTD_DStream* zds); 10382b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_sizeof_CDict(const ZSTD_CDict* cdict); 10392b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_sizeof_DDict(const ZSTD_DDict* ddict); 10402b9c00cbSConrad Meyer 10412b9c00cbSConrad Meyer #endif /* ZSTD_H_235446 */ 1042a0483764SConrad Meyer 1043a0483764SConrad Meyer 10444d3f1eafSConrad Meyer /* ************************************************************************************** 10452b9c00cbSConrad Meyer * ADVANCED AND EXPERIMENTAL FUNCTIONS 10462b9c00cbSConrad Meyer **************************************************************************************** 10472b9c00cbSConrad Meyer * The definitions in the following section are considered experimental. 10482b9c00cbSConrad Meyer * They are provided for advanced scenarios. 10492b9c00cbSConrad Meyer * They should never be used with a dynamic library, as prototypes may change in the future. 10502b9c00cbSConrad Meyer * Use them only in association with static linking. 
10512b9c00cbSConrad Meyer * ***************************************************************************************/ 10522b9c00cbSConrad Meyer 10532b9c00cbSConrad Meyer #if defined(ZSTD_STATIC_LINKING_ONLY) && !defined(ZSTD_H_ZSTD_STATIC_LINKING_ONLY) 10542b9c00cbSConrad Meyer #define ZSTD_H_ZSTD_STATIC_LINKING_ONLY 1055a0483764SConrad Meyer 1056a0483764SConrad Meyer /**************************************************************************************** 1057a0483764SConrad Meyer * experimental API (static linking only) 1058a0483764SConrad Meyer **************************************************************************************** 1059a0483764SConrad Meyer * The following symbols and constants 1060a0483764SConrad Meyer * are not planned to join "stable API" status in the near future. 1061a0483764SConrad Meyer * They can still change in future versions. 1062a0483764SConrad Meyer * Some of them are planned to remain in the static_only section indefinitely. 1063a0483764SConrad Meyer * Some of them might be removed in the future (especially when redundant with existing stable functions) 1064a0483764SConrad Meyer * ***************************************************************************************/ 1065a0483764SConrad Meyer 10669cbefe25SConrad Meyer #define ZSTD_FRAMEHEADERSIZE_PREFIX(format) ((format) == ZSTD_f_zstd1 ? 5 : 1) /* minimum input size required to query frame header size */ 10679cbefe25SConrad Meyer #define ZSTD_FRAMEHEADERSIZE_MIN(format) ((format) == ZSTD_f_zstd1 ? 6 : 2) 1068a0483764SConrad Meyer #define ZSTD_FRAMEHEADERSIZE_MAX 18 /* can be useful for static allocation */ 1069a0483764SConrad Meyer #define ZSTD_SKIPPABLEHEADERSIZE 8 1070a0483764SConrad Meyer 1071a0483764SConrad Meyer /* compression parameter bounds */ 10720c16b537SWarner Losh #define ZSTD_WINDOWLOG_MAX_32 30 10730c16b537SWarner Losh #define ZSTD_WINDOWLOG_MAX_64 31 1074a0483764SConrad Meyer #define ZSTD_WINDOWLOG_MAX ((int)(sizeof(size_t) == 4 ? 
ZSTD_WINDOWLOG_MAX_32 : ZSTD_WINDOWLOG_MAX_64)) 10750c16b537SWarner Losh #define ZSTD_WINDOWLOG_MIN 10 107619fcbaf1SConrad Meyer #define ZSTD_HASHLOG_MAX ((ZSTD_WINDOWLOG_MAX < 30) ? ZSTD_WINDOWLOG_MAX : 30) 10770c16b537SWarner Losh #define ZSTD_HASHLOG_MIN 6 107819fcbaf1SConrad Meyer #define ZSTD_CHAINLOG_MAX_32 29 107919fcbaf1SConrad Meyer #define ZSTD_CHAINLOG_MAX_64 30 1080a0483764SConrad Meyer #define ZSTD_CHAINLOG_MAX ((int)(sizeof(size_t) == 4 ? ZSTD_CHAINLOG_MAX_32 : ZSTD_CHAINLOG_MAX_64)) 10810c16b537SWarner Losh #define ZSTD_CHAINLOG_MIN ZSTD_HASHLOG_MIN 10820c16b537SWarner Losh #define ZSTD_SEARCHLOG_MAX (ZSTD_WINDOWLOG_MAX-1) 10830c16b537SWarner Losh #define ZSTD_SEARCHLOG_MIN 1 1084a0483764SConrad Meyer #define ZSTD_MINMATCH_MAX 7 /* only for ZSTD_fast, other strategies are limited to 6 */ 1085a0483764SConrad Meyer #define ZSTD_MINMATCH_MIN 3 /* only for ZSTD_btopt+, faster strategies are limited to 4 */ 10860f743729SConrad Meyer #define ZSTD_TARGETLENGTH_MAX ZSTD_BLOCKSIZE_MAX 10870f743729SConrad Meyer #define ZSTD_TARGETLENGTH_MIN 0 /* note : comparing this constant to an unsigned results in a tautological test */ 1088a0483764SConrad Meyer #define ZSTD_STRATEGY_MIN ZSTD_fast 1089a0483764SConrad Meyer #define ZSTD_STRATEGY_MAX ZSTD_btultra2 1090a0483764SConrad Meyer 1091a0483764SConrad Meyer 1092a0483764SConrad Meyer #define ZSTD_OVERLAPLOG_MIN 0 1093a0483764SConrad Meyer #define ZSTD_OVERLAPLOG_MAX 9 1094a0483764SConrad Meyer 1095a0483764SConrad Meyer #define ZSTD_WINDOWLOG_LIMIT_DEFAULT 27 /* by default, the streaming decoder will refuse any frame 1096a0483764SConrad Meyer * requiring larger than (1<<ZSTD_WINDOWLOG_LIMIT_DEFAULT) window size, 1097a0483764SConrad Meyer * to preserve host's memory from unreasonable requirements. 10982b9c00cbSConrad Meyer * This limit can be overridden using ZSTD_DCtx_setParameter(,ZSTD_d_windowLogMax,). 
1099a0483764SConrad Meyer * The limit does not apply for one-pass decoders (such as ZSTD_decompress()), since no additional memory is allocated */ 1100a0483764SConrad Meyer 1101a0483764SConrad Meyer 1102a0483764SConrad Meyer /* LDM parameter bounds */ 1103a0483764SConrad Meyer #define ZSTD_LDM_HASHLOG_MIN ZSTD_HASHLOG_MIN 1104a0483764SConrad Meyer #define ZSTD_LDM_HASHLOG_MAX ZSTD_HASHLOG_MAX 11050f743729SConrad Meyer #define ZSTD_LDM_MINMATCH_MIN 4 1106a0483764SConrad Meyer #define ZSTD_LDM_MINMATCH_MAX 4096 1107a0483764SConrad Meyer #define ZSTD_LDM_BUCKETSIZELOG_MIN 1 11080c16b537SWarner Losh #define ZSTD_LDM_BUCKETSIZELOG_MAX 8 1109a0483764SConrad Meyer #define ZSTD_LDM_HASHRATELOG_MIN 0 1110a0483764SConrad Meyer #define ZSTD_LDM_HASHRATELOG_MAX (ZSTD_WINDOWLOG_MAX - ZSTD_HASHLOG_MIN) 11110c16b537SWarner Losh 11124d3f1eafSConrad Meyer /* Advanced parameter bounds */ 11134d3f1eafSConrad Meyer #define ZSTD_TARGETCBLOCKSIZE_MIN 64 11144d3f1eafSConrad Meyer #define ZSTD_TARGETCBLOCKSIZE_MAX ZSTD_BLOCKSIZE_MAX 11159cbefe25SConrad Meyer #define ZSTD_SRCSIZEHINT_MIN 0 11169cbefe25SConrad Meyer #define ZSTD_SRCSIZEHINT_MAX INT_MAX 11174d3f1eafSConrad Meyer 1118a0483764SConrad Meyer /* internal */ 1119a0483764SConrad Meyer #define ZSTD_HASHLOG3_MAX 17 11200c16b537SWarner Losh 11210f743729SConrad Meyer 11220c16b537SWarner Losh /* --- Advanced types --- */ 1123a0483764SConrad Meyer 1124a0483764SConrad Meyer typedef struct ZSTD_CCtx_params_s ZSTD_CCtx_params; 11250c16b537SWarner Losh 11260c16b537SWarner Losh typedef struct { 1127*f7cd7fe5SConrad Meyer unsigned int offset; /* The offset of the match. (NOT the same as the offset code) 1128*f7cd7fe5SConrad Meyer * If offset == 0 and matchLength == 0, this sequence represents the last 1129*f7cd7fe5SConrad Meyer * literals in the block of litLength size. 11309cbefe25SConrad Meyer */ 1131*f7cd7fe5SConrad Meyer 1132*f7cd7fe5SConrad Meyer unsigned int litLength; /* Literal length of the sequence. 
*/ 1133*f7cd7fe5SConrad Meyer unsigned int matchLength; /* Match length of the sequence. */ 1134*f7cd7fe5SConrad Meyer 1135*f7cd7fe5SConrad Meyer /* Note: Users of this API may provide a sequence with matchLength == litLength == offset == 0. 1136*f7cd7fe5SConrad Meyer * In this case, we will treat the sequence as a marker for a block boundary. 11379cbefe25SConrad Meyer */ 1138*f7cd7fe5SConrad Meyer 1139*f7cd7fe5SConrad Meyer unsigned int rep; /* Represents which repeat offset is represented by the field 'offset'. 1140*f7cd7fe5SConrad Meyer * Ranges from [0, 3]. 1141*f7cd7fe5SConrad Meyer * 1142*f7cd7fe5SConrad Meyer * Repeat offsets are essentially previous offsets from previous sequences sorted in 1143*f7cd7fe5SConrad Meyer * recency order. For more detail, see doc/zstd_compression_format.md 1144*f7cd7fe5SConrad Meyer * 1145*f7cd7fe5SConrad Meyer * If rep == 0, then 'offset' does not contain a repeat offset. 1146*f7cd7fe5SConrad Meyer * If rep > 0: 1147*f7cd7fe5SConrad Meyer * If litLength != 0: 1148*f7cd7fe5SConrad Meyer * rep == 1 --> offset == repeat_offset_1 1149*f7cd7fe5SConrad Meyer * rep == 2 --> offset == repeat_offset_2 1150*f7cd7fe5SConrad Meyer * rep == 3 --> offset == repeat_offset_3 1151*f7cd7fe5SConrad Meyer * If litLength == 0: 1152*f7cd7fe5SConrad Meyer * rep == 1 --> offset == repeat_offset_2 1153*f7cd7fe5SConrad Meyer * rep == 2 --> offset == repeat_offset_3 1154*f7cd7fe5SConrad Meyer * rep == 3 --> offset == repeat_offset_1 - 1 1155*f7cd7fe5SConrad Meyer * 1156*f7cd7fe5SConrad Meyer * Note: This field is optional. ZSTD_generateSequences() will calculate the value of 1157*f7cd7fe5SConrad Meyer * 'rep', but repeat offsets do not necessarily need to be calculated from an external 1158*f7cd7fe5SConrad Meyer * sequence provider's perspective. For example, ZSTD_compressSequences() does not 1159*f7cd7fe5SConrad Meyer * use this 'rep' field at all (as of now). 
1160*f7cd7fe5SConrad Meyer */ 11619cbefe25SConrad Meyer } ZSTD_Sequence; 11629cbefe25SConrad Meyer 11639cbefe25SConrad Meyer typedef struct { 11640c16b537SWarner Losh unsigned windowLog; /**< largest match distance : larger == more compression, more memory needed during decompression */ 11650c16b537SWarner Losh unsigned chainLog; /**< fully searched segment : larger == more compression, slower, more memory (useless for fast) */ 11660c16b537SWarner Losh unsigned hashLog; /**< dispatch table : larger == faster, more memory */ 11670c16b537SWarner Losh unsigned searchLog; /**< nb of searches : larger == more compression, slower */ 1168a0483764SConrad Meyer unsigned minMatch; /**< match length searched : larger == faster decompression, sometimes less compression */ 11690c16b537SWarner Losh unsigned targetLength; /**< acceptable match size for optimal parser (only) : larger == more compression, slower */ 1170a0483764SConrad Meyer ZSTD_strategy strategy; /**< see ZSTD_strategy definition above */ 11710c16b537SWarner Losh } ZSTD_compressionParameters; 11720c16b537SWarner Losh 11730c16b537SWarner Losh typedef struct { 1174a0483764SConrad Meyer int contentSizeFlag; /**< 1: content size will be in frame header (when known) */ 1175a0483764SConrad Meyer int checksumFlag; /**< 1: generate a 32-bits checksum using XXH64 algorithm at end of frame, for error detection */ 1176a0483764SConrad Meyer int noDictIDFlag; /**< 1: no dictID will be saved into frame header (dictID is only useful for dictionary compression) */ 11770c16b537SWarner Losh } ZSTD_frameParameters; 11780c16b537SWarner Losh 11790c16b537SWarner Losh typedef struct { 11800c16b537SWarner Losh ZSTD_compressionParameters cParams; 11810c16b537SWarner Losh ZSTD_frameParameters fParams; 11820c16b537SWarner Losh } ZSTD_parameters; 11830c16b537SWarner Losh 118419fcbaf1SConrad Meyer typedef enum { 118519fcbaf1SConrad Meyer ZSTD_dct_auto = 0, /* dictionary is "full" when starting with ZSTD_MAGIC_DICTIONARY, otherwise it is 
"rawContent" */ 1186a0483764SConrad Meyer ZSTD_dct_rawContent = 1, /* ensures dictionary is always loaded as rawContent, even if it starts with ZSTD_MAGIC_DICTIONARY */ 1187a0483764SConrad Meyer ZSTD_dct_fullDict = 2 /* refuses to load a dictionary if it does not respect Zstandard's specification, starting with ZSTD_MAGIC_DICTIONARY */ 118819fcbaf1SConrad Meyer } ZSTD_dictContentType_e; 118919fcbaf1SConrad Meyer 119019fcbaf1SConrad Meyer typedef enum { 119119fcbaf1SConrad Meyer ZSTD_dlm_byCopy = 0, /**< Copy dictionary content internally */ 11929cbefe25SConrad Meyer ZSTD_dlm_byRef = 1 /**< Reference dictionary content -- the dictionary buffer must outlive its users. */ 119319fcbaf1SConrad Meyer } ZSTD_dictLoadMethod_e; 119419fcbaf1SConrad Meyer 1195a0483764SConrad Meyer typedef enum { 1196a0483764SConrad Meyer ZSTD_f_zstd1 = 0, /* zstd frame format, specified in zstd_compression_format.md (default) */ 11979cbefe25SConrad Meyer ZSTD_f_zstd1_magicless = 1 /* Variant of zstd frame format, without initial 4-bytes magic number. 1198a0483764SConrad Meyer * Useful to save 4 bytes per generated frame. 1199a0483764SConrad Meyer * Decoder cannot recognise automatically this format, requiring this instruction. */ 1200a0483764SConrad Meyer } ZSTD_format_e; 1201a0483764SConrad Meyer 1202a0483764SConrad Meyer typedef enum { 1203*f7cd7fe5SConrad Meyer /* Note: this enum controls ZSTD_d_forceIgnoreChecksum */ 1204*f7cd7fe5SConrad Meyer ZSTD_d_validateChecksum = 0, 1205*f7cd7fe5SConrad Meyer ZSTD_d_ignoreChecksum = 1 1206*f7cd7fe5SConrad Meyer } ZSTD_forceIgnoreChecksum_e; 1207*f7cd7fe5SConrad Meyer 1208*f7cd7fe5SConrad Meyer typedef enum { 1209a0483764SConrad Meyer /* Note: this enum and the behavior it controls are effectively internal 1210a0483764SConrad Meyer * implementation details of the compressor. 
They are expected to continue 1211a0483764SConrad Meyer * to evolve and should be considered only in the context of extremely 1212a0483764SConrad Meyer * advanced performance tuning. 1213a0483764SConrad Meyer * 12149cbefe25SConrad Meyer * Zstd currently supports the use of a CDict in three ways: 1215a0483764SConrad Meyer * 1216a0483764SConrad Meyer * - The contents of the CDict can be copied into the working context. This 1217a0483764SConrad Meyer * means that the compression can search both the dictionary and input 1218a0483764SConrad Meyer * while operating on a single set of internal tables. This makes 1219a0483764SConrad Meyer * the compression faster per-byte of input. However, the initial copy of 1220a0483764SConrad Meyer * the CDict's tables incurs a fixed cost at the beginning of the 1221a0483764SConrad Meyer * compression. For small compressions (< 8 KB), that copy can dominate 1222a0483764SConrad Meyer * the cost of the compression. 1223a0483764SConrad Meyer * 1224a0483764SConrad Meyer * - The CDict's tables can be used in-place. In this model, compression is 1225a0483764SConrad Meyer * slower per input byte, because the compressor has to search two sets of 1226a0483764SConrad Meyer * tables. However, this model incurs no start-up cost (as long as the 1227a0483764SConrad Meyer * working context's tables can be reused). For small inputs, this can be 1228a0483764SConrad Meyer * faster than copying the CDict's tables. 1229a0483764SConrad Meyer * 12309cbefe25SConrad Meyer * - The CDict's tables are not used at all, and instead we use the working 12319cbefe25SConrad Meyer * context alone to reload the dictionary and use params based on the source 12329cbefe25SConrad Meyer * size. See ZSTD_compress_insertDictionary() and ZSTD_compress_usingDict(). 12339cbefe25SConrad Meyer * This method is effective when the dictionary sizes are very small relative 12349cbefe25SConrad Meyer * to the input size, and the input size is fairly large to begin with. 
12359cbefe25SConrad Meyer * 1236a0483764SConrad Meyer * Zstd has a simple internal heuristic that selects which strategy to use 1237a0483764SConrad Meyer * at the beginning of a compression. However, if experimentation shows that 1238a0483764SConrad Meyer * Zstd is making poor choices, it is possible to override that choice with 1239a0483764SConrad Meyer * this enum. 1240a0483764SConrad Meyer */ 1241a0483764SConrad Meyer ZSTD_dictDefaultAttach = 0, /* Use the default heuristic. */ 1242a0483764SConrad Meyer ZSTD_dictForceAttach = 1, /* Never copy the dictionary. */ 1243a0483764SConrad Meyer ZSTD_dictForceCopy = 2, /* Always copy the dictionary. */ 12449cbefe25SConrad Meyer ZSTD_dictForceLoad = 3 /* Always reload the dictionary */ 1245a0483764SConrad Meyer } ZSTD_dictAttachPref_e; 12460c16b537SWarner Losh 12472b9c00cbSConrad Meyer typedef enum { 12482b9c00cbSConrad Meyer ZSTD_lcm_auto = 0, /**< Automatically determine the compression mode based on the compression level. 12492b9c00cbSConrad Meyer * Negative compression levels will be uncompressed, and positive compression 12502b9c00cbSConrad Meyer * levels will be compressed. */ 12512b9c00cbSConrad Meyer ZSTD_lcm_huffman = 1, /**< Always attempt Huffman compression. Uncompressed literals will still be 12522b9c00cbSConrad Meyer * emitted if Huffman compression is not profitable. */ 12539cbefe25SConrad Meyer ZSTD_lcm_uncompressed = 2 /**< Always emit uncompressed literals. */ 12542b9c00cbSConrad Meyer } ZSTD_literalCompressionMode_e; 12552b9c00cbSConrad Meyer 12560c16b537SWarner Losh 12570c16b537SWarner Losh /*************************************** 12580c16b537SWarner Losh * Frame size functions 12590c16b537SWarner Losh ***************************************/ 12600c16b537SWarner Losh 12610c16b537SWarner Losh /*! 
ZSTD_findDecompressedSize() : 12622b9c00cbSConrad Meyer * `src` should point to the start of a series of ZSTD encoded and/or skippable frames 12630c16b537SWarner Losh * `srcSize` must be the _exact_ size of this series 12642b9c00cbSConrad Meyer * (i.e. there should be a frame boundary at `src + srcSize`) 12650c16b537SWarner Losh * @return : - decompressed size of all data in all successive frames 12660c16b537SWarner Losh * - if the decompressed size cannot be determined: ZSTD_CONTENTSIZE_UNKNOWN 12670c16b537SWarner Losh * - if an error occurred: ZSTD_CONTENTSIZE_ERROR 12680c16b537SWarner Losh * 12690c16b537SWarner Losh * note 1 : decompressed size is an optional field, that may not be present, especially in streaming mode. 12700c16b537SWarner Losh * When `return==ZSTD_CONTENTSIZE_UNKNOWN`, data to decompress could be any size. 12710c16b537SWarner Losh * In which case, it's necessary to use streaming mode to decompress data. 12720c16b537SWarner Losh * note 2 : decompressed size is always present when compression is done with ZSTD_compress() 12730c16b537SWarner Losh * note 3 : decompressed size can be very large (64-bits value), 12740c16b537SWarner Losh * potentially larger than what local system can handle as a single memory segment. 12750c16b537SWarner Losh * In which case, it's necessary to use streaming mode to decompress data. 12760c16b537SWarner Losh * note 4 : If source is untrusted, decompressed size could be wrong or intentionally modified. 12770c16b537SWarner Losh * Always ensure result fits within application's authorized limits. 12780c16b537SWarner Losh * Each application can set its own limits. 12790c16b537SWarner Losh * note 5 : ZSTD_findDecompressedSize handles multiple frames, and so it must traverse the input to 12800c16b537SWarner Losh * read each contained frame header. This is fast as most of the data is skipped, 12810c16b537SWarner Losh * however it does mean that all frame data must be present and valid. 
*/ 12820c16b537SWarner Losh ZSTDLIB_API unsigned long long ZSTD_findDecompressedSize(const void* src, size_t srcSize); 12830c16b537SWarner Losh 12844d3f1eafSConrad Meyer /*! ZSTD_decompressBound() : 12852b9c00cbSConrad Meyer * `src` should point to the start of a series of ZSTD encoded and/or skippable frames 12862b9c00cbSConrad Meyer * `srcSize` must be the _exact_ size of this series 12872b9c00cbSConrad Meyer * (i.e. there should be a frame boundary at `src + srcSize`) 12882b9c00cbSConrad Meyer * @return : - upper-bound for the decompressed size of all data in all successive frames 12892b9c00cbSConrad Meyer * - if an error occurred: ZSTD_CONTENTSIZE_ERROR 12902b9c00cbSConrad Meyer * 12912b9c00cbSConrad Meyer * note 1 : an error can occur if `src` contains an invalid or incorrectly formatted frame. 12922b9c00cbSConrad Meyer * note 2 : the upper-bound is exact when the decompressed size field is available in every ZSTD encoded frame of `src`. 12932b9c00cbSConrad Meyer * in this case, `ZSTD_findDecompressedSize` and `ZSTD_decompressBound` return the same value. 12942b9c00cbSConrad Meyer * note 3 : when the decompressed size field isn't available, the upper-bound for that frame is calculated by: 12952b9c00cbSConrad Meyer * upper-bound = # blocks * min(128 KB, Window_Size) 12962b9c00cbSConrad Meyer */ 12972b9c00cbSConrad Meyer ZSTDLIB_API unsigned long long ZSTD_decompressBound(const void* src, size_t srcSize); 12982b9c00cbSConrad Meyer 12990c16b537SWarner Losh /*! ZSTD_frameHeaderSize() : 1300a0483764SConrad Meyer * srcSize must be >= ZSTD_FRAMEHEADERSIZE_PREFIX. 
13010f743729SConrad Meyer * @return : size of the Frame Header, 13020f743729SConrad Meyer * or an error code (if srcSize is too small) */ 13030c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_frameHeaderSize(const void* src, size_t srcSize); 13040c16b537SWarner Losh 1305*f7cd7fe5SConrad Meyer typedef enum { 1306*f7cd7fe5SConrad Meyer ZSTD_sf_noBlockDelimiters = 0, /* Representation of ZSTD_Sequence has no block delimiters, sequences only */ 1307*f7cd7fe5SConrad Meyer ZSTD_sf_explicitBlockDelimiters = 1 /* Representation of ZSTD_Sequence contains explicit block delimiters */ 1308*f7cd7fe5SConrad Meyer } ZSTD_sequenceFormat_e; 1309*f7cd7fe5SConrad Meyer 1310*f7cd7fe5SConrad Meyer /*! ZSTD_generateSequences() : 1311*f7cd7fe5SConrad Meyer * Generate sequences using ZSTD_compress2, given a source buffer. 1312*f7cd7fe5SConrad Meyer * 1313*f7cd7fe5SConrad Meyer * Each block will end with a dummy sequence 1314*f7cd7fe5SConrad Meyer * with offset == 0, matchLength == 0, and litLength == length of last literals. 1315*f7cd7fe5SConrad Meyer * litLength may be == 0, and if so, then the sequence of (of: 0 ml: 0 ll: 0) 1316*f7cd7fe5SConrad Meyer * simply acts as a block delimiter. 1317*f7cd7fe5SConrad Meyer * 13189cbefe25SConrad Meyer * zc can be used to insert custom compression params. 13199cbefe25SConrad Meyer * This function invokes ZSTD_compress2 1320*f7cd7fe5SConrad Meyer * 1321*f7cd7fe5SConrad Meyer * The output of this function can be fed into ZSTD_compressSequences() with CCtx 1322*f7cd7fe5SConrad Meyer * setting of ZSTD_c_blockDelimiters as ZSTD_sf_explicitBlockDelimiters 1323*f7cd7fe5SConrad Meyer * @return : number of sequences generated 13249cbefe25SConrad Meyer */ 1325*f7cd7fe5SConrad Meyer 1326*f7cd7fe5SConrad Meyer ZSTDLIB_API size_t ZSTD_generateSequences(ZSTD_CCtx* zc, ZSTD_Sequence* outSeqs, 13279cbefe25SConrad Meyer size_t outSeqsSize, const void* src, size_t srcSize); 13289cbefe25SConrad Meyer 1329*f7cd7fe5SConrad Meyer /*! 
ZSTD_mergeBlockDelimiters() : 1330*f7cd7fe5SConrad Meyer * Given an array of ZSTD_Sequence, remove all sequences that represent block delimiters/last literals 1331*f7cd7fe5SConrad Meyer * by merging them into the literals of the next sequence. 1332*f7cd7fe5SConrad Meyer * 1333*f7cd7fe5SConrad Meyer * As such, the final generated result has no explicit representation of block boundaries, 1334*f7cd7fe5SConrad Meyer * and the final last literals segment is not represented in the sequences. 1335*f7cd7fe5SConrad Meyer * 1336*f7cd7fe5SConrad Meyer * The output of this function can be fed into ZSTD_compressSequences() with CCtx 1337*f7cd7fe5SConrad Meyer * setting of ZSTD_c_blockDelimiters as ZSTD_sf_noBlockDelimiters 1338*f7cd7fe5SConrad Meyer * @return : number of sequences left after merging 1339*f7cd7fe5SConrad Meyer */ 1340*f7cd7fe5SConrad Meyer ZSTDLIB_API size_t ZSTD_mergeBlockDelimiters(ZSTD_Sequence* sequences, size_t seqsSize); 1341*f7cd7fe5SConrad Meyer 1342*f7cd7fe5SConrad Meyer /*! ZSTD_compressSequences() : 1343*f7cd7fe5SConrad Meyer * Compress an array of ZSTD_Sequence, generated from the original source buffer, into dst. 1344*f7cd7fe5SConrad Meyer * If a dictionary is included, then the cctx should reference the dict. (see: ZSTD_CCtx_refCDict(), ZSTD_CCtx_loadDictionary(), etc.) 1345*f7cd7fe5SConrad Meyer * The entire source is compressed into a single frame. 1346*f7cd7fe5SConrad Meyer * 1347*f7cd7fe5SConrad Meyer * The compression behavior changes based on cctx params. In particular: 1348*f7cd7fe5SConrad Meyer * If ZSTD_c_blockDelimiters == ZSTD_sf_noBlockDelimiters, the array of ZSTD_Sequence is expected to contain 1349*f7cd7fe5SConrad Meyer * no block delimiters (defined in ZSTD_Sequence). Block boundaries are roughly determined based on 1350*f7cd7fe5SConrad Meyer * the block size derived from the cctx, and sequences may be split. This is the default setting. 
1351*f7cd7fe5SConrad Meyer * 1352*f7cd7fe5SConrad Meyer * If ZSTD_c_blockDelimiters == ZSTD_sf_explicitBlockDelimiters, the array of ZSTD_Sequence is expected to contain 1353*f7cd7fe5SConrad Meyer * block delimiters (defined in ZSTD_Sequence). Behavior is undefined if no block delimiters are provided. 1354*f7cd7fe5SConrad Meyer * 1355*f7cd7fe5SConrad Meyer * If ZSTD_c_validateSequences == 0, this function will blindly accept the sequences provided. Invalid sequences cause undefined 1356*f7cd7fe5SConrad Meyer * behavior. If ZSTD_c_validateSequences == 1, then if sequence is invalid (see doc/zstd_compression_format.md for 1357*f7cd7fe5SConrad Meyer * specifics regarding offset/matchlength requirements) then the function will bail out and return an error. 1358*f7cd7fe5SConrad Meyer * 1359*f7cd7fe5SConrad Meyer * In addition to the two adjustable experimental params, there are other important cctx params. 1360*f7cd7fe5SConrad Meyer * - ZSTD_c_minMatch MUST be set as less than or equal to the smallest match generated by the match finder. It has a minimum value of ZSTD_MINMATCH_MIN. 1361*f7cd7fe5SConrad Meyer * - ZSTD_c_compressionLevel accordingly adjusts the strength of the entropy coder, as it would in typical compression. 1362*f7cd7fe5SConrad Meyer * - ZSTD_c_windowLog affects offset validation: this function will return an error at higher debug levels if a provided offset 1363*f7cd7fe5SConrad Meyer * is larger than what the spec allows for a given window log and dictionary (if present). See: doc/zstd_compression_format.md 1364*f7cd7fe5SConrad Meyer * 1365*f7cd7fe5SConrad Meyer * Note: Repcodes are, as of now, always re-calculated within this function, so ZSTD_Sequence::rep is unused. 
1366*f7cd7fe5SConrad Meyer * Note 2: Once we integrate ability to ingest repcodes, the explicit block delims mode must respect those repcodes exactly, 1367*f7cd7fe5SConrad Meyer * and cannot emit an RLE block that disagrees with the repcode history 1368*f7cd7fe5SConrad Meyer * @return : final compressed size or a ZSTD error. 1369*f7cd7fe5SConrad Meyer */ 1370*f7cd7fe5SConrad Meyer ZSTDLIB_API size_t ZSTD_compressSequences(ZSTD_CCtx* const cctx, void* dst, size_t dstSize, 1371*f7cd7fe5SConrad Meyer const ZSTD_Sequence* inSeqs, size_t inSeqsSize, 1372*f7cd7fe5SConrad Meyer const void* src, size_t srcSize); 1373*f7cd7fe5SConrad Meyer 13740c16b537SWarner Losh 13750c16b537SWarner Losh /*************************************** 137619fcbaf1SConrad Meyer * Memory management 13770c16b537SWarner Losh ***************************************/ 13780c16b537SWarner Losh 13790c16b537SWarner Losh /*! ZSTD_estimate*() : 138037f1f268SConrad Meyer * These functions make it possible to estimate memory usage 138137f1f268SConrad Meyer * of a future {D,C}Ctx, before its creation. 13829cbefe25SConrad Meyer * 138337f1f268SConrad Meyer * ZSTD_estimateCCtxSize() will provide a memory budget large enough 138437f1f268SConrad Meyer * for any compression level up to selected one. 138537f1f268SConrad Meyer * Note : Unlike ZSTD_estimateCStreamSize*(), this estimate 138637f1f268SConrad Meyer * does not include space for a window buffer. 138737f1f268SConrad Meyer * Therefore, the estimation is only guaranteed for single-shot compressions, not streaming. 138837f1f268SConrad Meyer * The estimate will assume the input may be arbitrarily large, 138937f1f268SConrad Meyer * which is the worst case. 13909cbefe25SConrad Meyer * 139137f1f268SConrad Meyer * When srcSize can be bound by a known and rather "small" value, 139237f1f268SConrad Meyer * this fact can be used to provide a tighter estimation 139337f1f268SConrad Meyer * because the CCtx compression context will need less memory. 
139437f1f268SConrad Meyer * This tighter estimation can be provided by more advanced functions 139537f1f268SConrad Meyer * ZSTD_estimateCCtxSize_usingCParams(), which can be used in tandem with ZSTD_getCParams(), 139637f1f268SConrad Meyer * and ZSTD_estimateCCtxSize_usingCCtxParams(), which can be used in tandem with ZSTD_CCtxParams_setParameter(). 139737f1f268SConrad Meyer * Both can be used to estimate memory using custom compression parameters and arbitrary srcSize limits. 139837f1f268SConrad Meyer * 139937f1f268SConrad Meyer * Note 2 : only single-threaded compression is supported. 140037f1f268SConrad Meyer * ZSTD_estimateCCtxSize_usingCCtxParams() will return an error code if ZSTD_c_nbWorkers is >= 1. 140137f1f268SConrad Meyer */ 14020c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_estimateCCtxSize(int compressionLevel); 14030c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_estimateCCtxSize_usingCParams(ZSTD_compressionParameters cParams); 14040c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_estimateCCtxSize_usingCCtxParams(const ZSTD_CCtx_params* params); 14050c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_estimateDCtxSize(void); 14060c16b537SWarner Losh 14070c16b537SWarner Losh /*! ZSTD_estimateCStreamSize() : 14080c16b537SWarner Losh * ZSTD_estimateCStreamSize() will provide a budget large enough for any compression level up to selected one. 14090c16b537SWarner Losh * It will also consider src size to be arbitrarily "large", which is worst case. 14100c16b537SWarner Losh * If srcSize is known to always be small, ZSTD_estimateCStreamSize_usingCParams() can provide a tighter estimation. 14110c16b537SWarner Losh * ZSTD_estimateCStreamSize_usingCParams() can be used in tandem with ZSTD_getCParams() to create cParams from compressionLevel. 14122b9c00cbSConrad Meyer * ZSTD_estimateCStreamSize_usingCCtxParams() can be used in tandem with ZSTD_CCtxParams_setParameter(). Only single-threaded compression is supported. 
This function will return an error code if ZSTD_c_nbWorkers is >= 1. 141319fcbaf1SConrad Meyer * Note : CStream size estimation is only correct for single-threaded compression. 14140c16b537SWarner Losh * ZSTD_DStream memory budget depends on window Size. 14150c16b537SWarner Losh * This information can be passed manually, using ZSTD_estimateDStreamSize, 14160c16b537SWarner Losh * or deduced from a valid frame Header, using ZSTD_estimateDStreamSize_fromFrame(); 14170c16b537SWarner Losh * Note : if streaming is init with function ZSTD_init?Stream_usingDict(), 14180c16b537SWarner Losh * an internal ?Dict will be created, which additional size is not estimated here. 14190c16b537SWarner Losh * In this case, get total size by adding ZSTD_estimate?DictSize */ 14200c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_estimateCStreamSize(int compressionLevel); 14210c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_estimateCStreamSize_usingCParams(ZSTD_compressionParameters cParams); 14220c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_estimateCStreamSize_usingCCtxParams(const ZSTD_CCtx_params* params); 14230c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_estimateDStreamSize(size_t windowSize); 14240c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_estimateDStreamSize_fromFrame(const void* src, size_t srcSize); 14250c16b537SWarner Losh 14260c16b537SWarner Losh /*! ZSTD_estimate?DictSize() : 14270c16b537SWarner Losh * ZSTD_estimateCDictSize() will bet that src size is relatively "small", and content is copied, like ZSTD_createCDict(). 142819fcbaf1SConrad Meyer * ZSTD_estimateCDictSize_advanced() makes it possible to control compression parameters precisely, like ZSTD_createCDict_advanced(). 142919fcbaf1SConrad Meyer * Note : dictionaries created by reference (`ZSTD_dlm_byRef`) are logically smaller. 
14300c16b537SWarner Losh */ 14310c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_estimateCDictSize(size_t dictSize, int compressionLevel); 14320c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_estimateCDictSize_advanced(size_t dictSize, ZSTD_compressionParameters cParams, ZSTD_dictLoadMethod_e dictLoadMethod); 14330c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_estimateDDictSize(size_t dictSize, ZSTD_dictLoadMethod_e dictLoadMethod); 14340c16b537SWarner Losh 143519fcbaf1SConrad Meyer /*! ZSTD_initStatic*() : 143619fcbaf1SConrad Meyer * Initialize an object using a pre-allocated fixed-size buffer. 143719fcbaf1SConrad Meyer * workspace: The memory area to emplace the object into. 143819fcbaf1SConrad Meyer * Provided pointer *must be 8-bytes aligned*. 143919fcbaf1SConrad Meyer * Buffer must outlive object. 144019fcbaf1SConrad Meyer * workspaceSize: Use ZSTD_estimate*Size() to determine 144119fcbaf1SConrad Meyer * how large workspace must be to support target scenario. 144219fcbaf1SConrad Meyer * @return : pointer to object (same address as workspace, just different type), 144319fcbaf1SConrad Meyer * or NULL if error (size too small, incorrect alignment, etc.) 144419fcbaf1SConrad Meyer * Note : zstd will never resize nor malloc() when using a static buffer. 144519fcbaf1SConrad Meyer * If the object requires more memory than available, 144619fcbaf1SConrad Meyer * zstd will just error out (typically ZSTD_error_memory_allocation). 144719fcbaf1SConrad Meyer * Note 2 : there is no corresponding "free" function. 144819fcbaf1SConrad Meyer * Since workspace is allocated externally, it must be freed externally too. 144919fcbaf1SConrad Meyer * Note 3 : cParams : use ZSTD_getCParams() to convert a compression level 145019fcbaf1SConrad Meyer * into its associated cParams. 
145119fcbaf1SConrad Meyer * Limitation 1 : currently not compatible with internal dictionary creation, triggered by 145219fcbaf1SConrad Meyer * ZSTD_CCtx_loadDictionary(), ZSTD_initCStream_usingDict() or ZSTD_initDStream_usingDict(). 145319fcbaf1SConrad Meyer * Limitation 2 : static cctx currently not compatible with multi-threading. 145419fcbaf1SConrad Meyer * Limitation 3 : static dctx is incompatible with legacy support. 145519fcbaf1SConrad Meyer */ 145619fcbaf1SConrad Meyer ZSTDLIB_API ZSTD_CCtx* ZSTD_initStaticCCtx(void* workspace, size_t workspaceSize); 145719fcbaf1SConrad Meyer ZSTDLIB_API ZSTD_CStream* ZSTD_initStaticCStream(void* workspace, size_t workspaceSize); /**< same as ZSTD_initStaticCCtx() */ 145819fcbaf1SConrad Meyer 145919fcbaf1SConrad Meyer ZSTDLIB_API ZSTD_DCtx* ZSTD_initStaticDCtx(void* workspace, size_t workspaceSize); 146019fcbaf1SConrad Meyer ZSTDLIB_API ZSTD_DStream* ZSTD_initStaticDStream(void* workspace, size_t workspaceSize); /**< same as ZSTD_initStaticDCtx() */ 146119fcbaf1SConrad Meyer 146219fcbaf1SConrad Meyer ZSTDLIB_API const ZSTD_CDict* ZSTD_initStaticCDict( 146319fcbaf1SConrad Meyer void* workspace, size_t workspaceSize, 146419fcbaf1SConrad Meyer const void* dict, size_t dictSize, 146519fcbaf1SConrad Meyer ZSTD_dictLoadMethod_e dictLoadMethod, 146619fcbaf1SConrad Meyer ZSTD_dictContentType_e dictContentType, 146719fcbaf1SConrad Meyer ZSTD_compressionParameters cParams); 146819fcbaf1SConrad Meyer 146919fcbaf1SConrad Meyer ZSTDLIB_API const ZSTD_DDict* ZSTD_initStaticDDict( 147019fcbaf1SConrad Meyer void* workspace, size_t workspaceSize, 147119fcbaf1SConrad Meyer const void* dict, size_t dictSize, 147219fcbaf1SConrad Meyer ZSTD_dictLoadMethod_e dictLoadMethod, 147319fcbaf1SConrad Meyer ZSTD_dictContentType_e dictContentType); 147419fcbaf1SConrad Meyer 1475a0483764SConrad Meyer 147619fcbaf1SConrad Meyer /*! 
Custom memory allocation : 147719fcbaf1SConrad Meyer * These prototypes make it possible to pass your own allocation/free functions. 147819fcbaf1SConrad Meyer * ZSTD_customMem is provided at creation time, using ZSTD_create*_advanced() variants listed below. 147919fcbaf1SConrad Meyer * All allocation/free operations will be completed using these custom variants instead of regular <stdlib.h> ones. 148019fcbaf1SConrad Meyer */ 148119fcbaf1SConrad Meyer typedef void* (*ZSTD_allocFunction) (void* opaque, size_t size); 148219fcbaf1SConrad Meyer typedef void (*ZSTD_freeFunction) (void* opaque, void* address); 148319fcbaf1SConrad Meyer typedef struct { ZSTD_allocFunction customAlloc; ZSTD_freeFunction customFree; void* opaque; } ZSTD_customMem; 1484*f7cd7fe5SConrad Meyer static 1485*f7cd7fe5SConrad Meyer #ifdef __GNUC__ 1486*f7cd7fe5SConrad Meyer __attribute__((__unused__)) 1487*f7cd7fe5SConrad Meyer #endif 1488*f7cd7fe5SConrad Meyer ZSTD_customMem const ZSTD_defaultCMem = { NULL, NULL, NULL }; /**< this constant defers to stdlib's functions */ 148919fcbaf1SConrad Meyer 149019fcbaf1SConrad Meyer ZSTDLIB_API ZSTD_CCtx* ZSTD_createCCtx_advanced(ZSTD_customMem customMem); 149119fcbaf1SConrad Meyer ZSTDLIB_API ZSTD_CStream* ZSTD_createCStream_advanced(ZSTD_customMem customMem); 149219fcbaf1SConrad Meyer ZSTDLIB_API ZSTD_DCtx* ZSTD_createDCtx_advanced(ZSTD_customMem customMem); 149319fcbaf1SConrad Meyer ZSTDLIB_API ZSTD_DStream* ZSTD_createDStream_advanced(ZSTD_customMem customMem); 149419fcbaf1SConrad Meyer 149519fcbaf1SConrad Meyer ZSTDLIB_API ZSTD_CDict* ZSTD_createCDict_advanced(const void* dict, size_t dictSize, 149619fcbaf1SConrad Meyer ZSTD_dictLoadMethod_e dictLoadMethod, 149719fcbaf1SConrad Meyer ZSTD_dictContentType_e dictContentType, 149819fcbaf1SConrad Meyer ZSTD_compressionParameters cParams, 149919fcbaf1SConrad Meyer ZSTD_customMem customMem); 150019fcbaf1SConrad Meyer 1501*f7cd7fe5SConrad Meyer /* ! 
Thread pool : 1502*f7cd7fe5SConrad Meyer * These prototypes make it possible to share a thread pool among multiple compression contexts. 1503*f7cd7fe5SConrad Meyer * This can limit resources for applications with multiple threads where each one uses 1504*f7cd7fe5SConrad Meyer * a threaded compression mode (via ZSTD_c_nbWorkers parameter). 1505*f7cd7fe5SConrad Meyer * ZSTD_createThreadPool creates a new thread pool with a given number of threads. 1506*f7cd7fe5SConrad Meyer * Note that such a pool must remain alive for as long as it is being used. 1507*f7cd7fe5SConrad Meyer * ZSTD_CCtx_refThreadPool assigns a thread pool to a context (use NULL argument value 1508*f7cd7fe5SConrad Meyer * to use an internal thread pool). 1509*f7cd7fe5SConrad Meyer * ZSTD_freeThreadPool frees a thread pool. 1510*f7cd7fe5SConrad Meyer */ 1511*f7cd7fe5SConrad Meyer typedef struct POOL_ctx_s ZSTD_threadPool; 1512*f7cd7fe5SConrad Meyer ZSTDLIB_API ZSTD_threadPool* ZSTD_createThreadPool(size_t numThreads); 1513*f7cd7fe5SConrad Meyer ZSTDLIB_API void ZSTD_freeThreadPool (ZSTD_threadPool* pool); 1514*f7cd7fe5SConrad Meyer ZSTDLIB_API size_t ZSTD_CCtx_refThreadPool(ZSTD_CCtx* cctx, ZSTD_threadPool* pool); 1515*f7cd7fe5SConrad Meyer 1516*f7cd7fe5SConrad Meyer /* 1517*f7cd7fe5SConrad Meyer * This API is temporary and is expected to change or disappear in the future! 
1518*f7cd7fe5SConrad Meyer */ 1519*f7cd7fe5SConrad Meyer ZSTDLIB_API ZSTD_CDict* ZSTD_createCDict_advanced2( 1520*f7cd7fe5SConrad Meyer const void* dict, size_t dictSize, 1521*f7cd7fe5SConrad Meyer ZSTD_dictLoadMethod_e dictLoadMethod, 1522*f7cd7fe5SConrad Meyer ZSTD_dictContentType_e dictContentType, 1523*f7cd7fe5SConrad Meyer const ZSTD_CCtx_params* cctxParams, 1524*f7cd7fe5SConrad Meyer ZSTD_customMem customMem); 1525*f7cd7fe5SConrad Meyer 152619fcbaf1SConrad Meyer ZSTDLIB_API ZSTD_DDict* ZSTD_createDDict_advanced(const void* dict, size_t dictSize, 152719fcbaf1SConrad Meyer ZSTD_dictLoadMethod_e dictLoadMethod, 152819fcbaf1SConrad Meyer ZSTD_dictContentType_e dictContentType, 152919fcbaf1SConrad Meyer ZSTD_customMem customMem); 153019fcbaf1SConrad Meyer 15310c16b537SWarner Losh /*************************************** 15320c16b537SWarner Losh * Advanced compression functions 15330c16b537SWarner Losh ***************************************/ 15340c16b537SWarner Losh 15350c16b537SWarner Losh /*! ZSTD_createCDict_byReference() : 15360c16b537SWarner Losh * Create a digested dictionary for compression 1537a0483764SConrad Meyer * Dictionary content is just referenced, not duplicated. 1538a0483764SConrad Meyer * As a consequence, `dictBuffer` **must** outlive CDict, 15399cbefe25SConrad Meyer * and its content must remain unmodified throughout the lifetime of CDict. 15409cbefe25SConrad Meyer * note: equivalent to ZSTD_createCDict_advanced(), with dictLoadMethod==ZSTD_dlm_byRef */ 15410c16b537SWarner Losh ZSTDLIB_API ZSTD_CDict* ZSTD_createCDict_byReference(const void* dictBuffer, size_t dictSize, int compressionLevel); 15420c16b537SWarner Losh 1543*f7cd7fe5SConrad Meyer /*! ZSTD_getDictID_fromCDict() : 1544*f7cd7fe5SConrad Meyer * Provides the dictID of the dictionary loaded into `cdict`. 1545*f7cd7fe5SConrad Meyer * If @return == 0, the dictionary is not conformant to Zstandard specification, or empty. 
1546*f7cd7fe5SConrad Meyer * Non-conformant dictionaries can still be loaded, but as content-only dictionaries. */ 1547*f7cd7fe5SConrad Meyer ZSTDLIB_API unsigned ZSTD_getDictID_fromCDict(const ZSTD_CDict* cdict); 1548*f7cd7fe5SConrad Meyer 15490c16b537SWarner Losh /*! ZSTD_getCParams() : 15500c16b537SWarner Losh * @return ZSTD_compressionParameters structure for a selected compression level and estimated srcSize. 15510c16b537SWarner Losh * `estimatedSrcSize` value is optional, select 0 if not known */ 15520c16b537SWarner Losh ZSTDLIB_API ZSTD_compressionParameters ZSTD_getCParams(int compressionLevel, unsigned long long estimatedSrcSize, size_t dictSize); 15530c16b537SWarner Losh 15540c16b537SWarner Losh /*! ZSTD_getParams() : 15550c16b537SWarner Losh * same as ZSTD_getCParams(), but @return a full `ZSTD_parameters` object instead of sub-component `ZSTD_compressionParameters`. 1556052d3c12SConrad Meyer * All fields of `ZSTD_frameParameters` are set to default : contentSize=1, checksum=0, noDictID=0 */ 15570c16b537SWarner Losh ZSTDLIB_API ZSTD_parameters ZSTD_getParams(int compressionLevel, unsigned long long estimatedSrcSize, size_t dictSize); 15580c16b537SWarner Losh 15590c16b537SWarner Losh /*! ZSTD_checkCParams() : 15602b9c00cbSConrad Meyer * Ensure param values remain within authorized range. 15612b9c00cbSConrad Meyer * @return 0 on success, or an error code (can be checked with ZSTD_isError()) */ 15620c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_checkCParams(ZSTD_compressionParameters params); 15630c16b537SWarner Losh 15640c16b537SWarner Losh /*! ZSTD_adjustCParams() : 15650c16b537SWarner Losh * optimize params for a given `srcSize` and `dictSize`. 15662b9c00cbSConrad Meyer * `srcSize` can be unknown, in which case use ZSTD_CONTENTSIZE_UNKNOWN. 15672b9c00cbSConrad Meyer * `dictSize` must be `0` when there is no dictionary. 15682b9c00cbSConrad Meyer * cPar can be invalid : all parameters will be clamped within valid range in the @return struct. 
15692b9c00cbSConrad Meyer * This function never fails (wide contract) */ 15700c16b537SWarner Losh ZSTDLIB_API ZSTD_compressionParameters ZSTD_adjustCParams(ZSTD_compressionParameters cPar, unsigned long long srcSize, size_t dictSize); 15710c16b537SWarner Losh 15720c16b537SWarner Losh /*! ZSTD_compress_advanced() : 15739cbefe25SConrad Meyer * Note : this function is now DEPRECATED. 15749cbefe25SConrad Meyer * It can be replaced by ZSTD_compress2(), in combination with ZSTD_CCtx_setParameter() and other parameter setters. 15759cbefe25SConrad Meyer * This prototype will be marked as deprecated and generate compilation warning on reaching v1.5.x */ 15760c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_compress_advanced(ZSTD_CCtx* cctx, 15770c16b537SWarner Losh void* dst, size_t dstCapacity, 15780c16b537SWarner Losh const void* src, size_t srcSize, 15790c16b537SWarner Losh const void* dict,size_t dictSize, 15800c16b537SWarner Losh ZSTD_parameters params); 15810c16b537SWarner Losh 15820c16b537SWarner Losh /*! ZSTD_compress_usingCDict_advanced() : 15839cbefe25SConrad Meyer * Note : this function is now REDUNDANT. 15849cbefe25SConrad Meyer * It can be replaced by ZSTD_compress2(), in combination with ZSTD_CCtx_loadDictionary() and other parameter setters. 15859cbefe25SConrad Meyer * This prototype will be marked as deprecated and generate compilation warning in some future version */ 15860c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_compress_usingCDict_advanced(ZSTD_CCtx* cctx, 15870c16b537SWarner Losh void* dst, size_t dstCapacity, 15880c16b537SWarner Losh const void* src, size_t srcSize, 1589a0483764SConrad Meyer const ZSTD_CDict* cdict, 1590a0483764SConrad Meyer ZSTD_frameParameters fParams); 15910c16b537SWarner Losh 15920c16b537SWarner Losh 1593a0483764SConrad Meyer /*! ZSTD_CCtx_loadDictionary_byReference() : 1594a0483764SConrad Meyer * Same as ZSTD_CCtx_loadDictionary(), but dictionary content is referenced, instead of being copied into CCtx. 
1595a0483764SConrad Meyer * It saves some memory, but also requires that `dict` outlives its usage within `cctx` */ 1596a0483764SConrad Meyer ZSTDLIB_API size_t ZSTD_CCtx_loadDictionary_byReference(ZSTD_CCtx* cctx, const void* dict, size_t dictSize); 1597a0483764SConrad Meyer 1598a0483764SConrad Meyer /*! ZSTD_CCtx_loadDictionary_advanced() : 1599a0483764SConrad Meyer * Same as ZSTD_CCtx_loadDictionary(), but gives finer control over 1600a0483764SConrad Meyer * how to load the dictionary (by copy ? by reference ?) 1601a0483764SConrad Meyer * and how to interpret it (automatic ? force raw mode ? full mode only ?) */ 1602a0483764SConrad Meyer ZSTDLIB_API size_t ZSTD_CCtx_loadDictionary_advanced(ZSTD_CCtx* cctx, const void* dict, size_t dictSize, ZSTD_dictLoadMethod_e dictLoadMethod, ZSTD_dictContentType_e dictContentType); 1603a0483764SConrad Meyer 1604a0483764SConrad Meyer /*! ZSTD_CCtx_refPrefix_advanced() : 1605a0483764SConrad Meyer * Same as ZSTD_CCtx_refPrefix(), but gives finer control over 1606a0483764SConrad Meyer * how to interpret prefix content (automatic ? force raw mode (default) ? full mode only ?) */ 1607a0483764SConrad Meyer ZSTDLIB_API size_t ZSTD_CCtx_refPrefix_advanced(ZSTD_CCtx* cctx, const void* prefix, size_t prefixSize, ZSTD_dictContentType_e dictContentType); 1608a0483764SConrad Meyer 1609a0483764SConrad Meyer /* === experimental parameters === */ 1610a0483764SConrad Meyer /* these parameters can be used with ZSTD_CCtx_setParameter() 1611a0483764SConrad Meyer * they are not guaranteed to remain supported in the future */ 1612a0483764SConrad Meyer 1613a0483764SConrad Meyer /* Enables rsyncable mode, 1614a0483764SConrad Meyer * which makes compressed files more rsync friendly 1615a0483764SConrad Meyer * by adding periodic synchronization points to the compressed data. 1616a0483764SConrad Meyer * The target average block size is ZSTD_c_jobSize / 2. 
1617a0483764SConrad Meyer * It's possible to modify the job size to increase or decrease 1618a0483764SConrad Meyer * the granularity of the synchronization point. 1619a0483764SConrad Meyer * Once the jobSize is smaller than the window size, 1620a0483764SConrad Meyer * it will result in compression ratio degradation. 1621a0483764SConrad Meyer * NOTE 1: rsyncable mode only works when multithreading is enabled. 1622a0483764SConrad Meyer * NOTE 2: rsyncable performs poorly in combination with long range mode, 1623a0483764SConrad Meyer * since it will decrease the effectiveness of synchronization points, 1624a0483764SConrad Meyer * though mileage may vary. 1625a0483764SConrad Meyer * NOTE 3: Rsyncable mode limits maximum compression speed to ~400 MB/s. 1626a0483764SConrad Meyer * If the selected compression level is already running significantly slower, 1627a0483764SConrad Meyer * the overall speed won't be significantly impacted. 1628a0483764SConrad Meyer */ 1629a0483764SConrad Meyer #define ZSTD_c_rsyncable ZSTD_c_experimentalParam1 1630a0483764SConrad Meyer 1631a0483764SConrad Meyer /* Select a compression format. 1632a0483764SConrad Meyer * The value must be of type ZSTD_format_e. 1633a0483764SConrad Meyer * See ZSTD_format_e enum definition for details */ 1634a0483764SConrad Meyer #define ZSTD_c_format ZSTD_c_experimentalParam2 1635a0483764SConrad Meyer 1636a0483764SConrad Meyer /* Force back-reference distances to remain < windowSize, 1637a0483764SConrad Meyer * even when referencing into Dictionary content (default:0) */ 1638a0483764SConrad Meyer #define ZSTD_c_forceMaxWindow ZSTD_c_experimentalParam3 1639a0483764SConrad Meyer 1640a0483764SConrad Meyer /* Controls whether the contents of a CDict 1641a0483764SConrad Meyer * are used in place, or copied into the working context. 1642a0483764SConrad Meyer * Accepts values from the ZSTD_dictAttachPref_e enum. 1643a0483764SConrad Meyer * See the comments on that enum for an explanation of the feature. 
*/ 1644a0483764SConrad Meyer #define ZSTD_c_forceAttachDict ZSTD_c_experimentalParam4 1645a0483764SConrad Meyer 16462b9c00cbSConrad Meyer /* Controls how the literals are compressed (default is auto). 16472b9c00cbSConrad Meyer * The value must be of type ZSTD_literalCompressionMode_e. 16482b9c00cbSConrad Meyer * See ZSTD_literalCompressionMode_e enum definition for details. 16492b9c00cbSConrad Meyer */ 16502b9c00cbSConrad Meyer #define ZSTD_c_literalCompressionMode ZSTD_c_experimentalParam5 16512b9c00cbSConrad Meyer 16524d3f1eafSConrad Meyer /* Tries to fit compressed block size to be around targetCBlockSize. 16534d3f1eafSConrad Meyer * No target when targetCBlockSize == 0. 16544d3f1eafSConrad Meyer * There is no guarantee on compressed block size (default:0) */ 16554d3f1eafSConrad Meyer #define ZSTD_c_targetCBlockSize ZSTD_c_experimentalParam6 16564d3f1eafSConrad Meyer 16579cbefe25SConrad Meyer /* User's best guess of source size. 16589cbefe25SConrad Meyer * Hint is not valid when srcSizeHint == 0. 16599cbefe25SConrad Meyer * There is no guarantee that hint is close to actual source size, 16609cbefe25SConrad Meyer * but compression ratio may regress significantly if guess considerably underestimates */ 16619cbefe25SConrad Meyer #define ZSTD_c_srcSizeHint ZSTD_c_experimentalParam7 16629cbefe25SConrad Meyer 1663*f7cd7fe5SConrad Meyer /* Controls whether the new and experimental "dedicated dictionary search 1664*f7cd7fe5SConrad Meyer * structure" can be used. This feature is still rough around the edges, be 1665*f7cd7fe5SConrad Meyer * prepared for surprising behavior! 1666*f7cd7fe5SConrad Meyer * 1667*f7cd7fe5SConrad Meyer * How to use it: 1668*f7cd7fe5SConrad Meyer * 1669*f7cd7fe5SConrad Meyer * When using a CDict, whether to use this feature or not is controlled at 1670*f7cd7fe5SConrad Meyer * CDict creation, and it must be set in a CCtxParams set passed into that 1671*f7cd7fe5SConrad Meyer * construction (via ZSTD_createCDict_advanced2()). 
A compression will then 1672*f7cd7fe5SConrad Meyer * use the feature or not based on how the CDict was constructed; the value of 1673*f7cd7fe5SConrad Meyer * this param, set in the CCtx, will have no effect. 1674*f7cd7fe5SConrad Meyer * 1675*f7cd7fe5SConrad Meyer * However, when a dictionary buffer is passed into a CCtx, such as via 1676*f7cd7fe5SConrad Meyer * ZSTD_CCtx_loadDictionary(), this param can be set on the CCtx to control 1677*f7cd7fe5SConrad Meyer * whether the CDict that is created internally can use the feature or not. 1678*f7cd7fe5SConrad Meyer * 1679*f7cd7fe5SConrad Meyer * What it does: 1680*f7cd7fe5SConrad Meyer * 1681*f7cd7fe5SConrad Meyer * Normally, the internal data structures of the CDict are analogous to what 1682*f7cd7fe5SConrad Meyer * would be stored in a CCtx after compressing the contents of a dictionary. 1683*f7cd7fe5SConrad Meyer * To an approximation, a compression using a dictionary can then use those 1684*f7cd7fe5SConrad Meyer * data structures to simply continue what is effectively a streaming 1685*f7cd7fe5SConrad Meyer * compression where the simulated compression of the dictionary left off. 1686*f7cd7fe5SConrad Meyer * Which is to say, the search structures in the CDict are normally the same 1687*f7cd7fe5SConrad Meyer * format as in the CCtx. 1688*f7cd7fe5SConrad Meyer * 1689*f7cd7fe5SConrad Meyer * It is possible to do better, since the CDict is not like a CCtx: the search 1690*f7cd7fe5SConrad Meyer * structures are written once during CDict creation, and then are only read 1691*f7cd7fe5SConrad Meyer * after that, while the search structures in the CCtx are both read and 1692*f7cd7fe5SConrad Meyer * written as the compression goes along. This means we can choose a search 1693*f7cd7fe5SConrad Meyer * structure for the dictionary that is read-optimized. 1694*f7cd7fe5SConrad Meyer * 1695*f7cd7fe5SConrad Meyer * This feature enables the use of that different structure. 
1696*f7cd7fe5SConrad Meyer * 1697*f7cd7fe5SConrad Meyer * Note that some of the members of the ZSTD_compressionParameters struct have 1698*f7cd7fe5SConrad Meyer * different semantics and constraints in the dedicated search structure. It is 1699*f7cd7fe5SConrad Meyer * highly recommended that you simply set a compression level in the CCtxParams 1700*f7cd7fe5SConrad Meyer * you pass into the CDict creation call, and avoid messing with the cParams 1701*f7cd7fe5SConrad Meyer * directly. 1702*f7cd7fe5SConrad Meyer * 1703*f7cd7fe5SConrad Meyer * Effects: 1704*f7cd7fe5SConrad Meyer * 1705*f7cd7fe5SConrad Meyer * This will only have any effect when the selected ZSTD_strategy 1706*f7cd7fe5SConrad Meyer * implementation supports this feature. Currently, that's limited to 1707*f7cd7fe5SConrad Meyer * ZSTD_greedy, ZSTD_lazy, and ZSTD_lazy2. 1708*f7cd7fe5SConrad Meyer * 1709*f7cd7fe5SConrad Meyer * Note that this means that the CDict tables can no longer be copied into the 1710*f7cd7fe5SConrad Meyer * CCtx, so the dict attachment mode ZSTD_dictForceCopy will no longer be 1711*f7cd7fe5SConrad Meyer * useable. The dictionary can only be attached or reloaded. 1712*f7cd7fe5SConrad Meyer * 1713*f7cd7fe5SConrad Meyer * In general, you should expect compression to be faster--sometimes very much 1714*f7cd7fe5SConrad Meyer * so--and CDict creation to be slightly slower. Eventually, we will probably 1715*f7cd7fe5SConrad Meyer * make this mode the default. 1716*f7cd7fe5SConrad Meyer */ 1717*f7cd7fe5SConrad Meyer #define ZSTD_c_enableDedicatedDictSearch ZSTD_c_experimentalParam8 1718*f7cd7fe5SConrad Meyer 1719*f7cd7fe5SConrad Meyer /* ZSTD_c_stableInBuffer 1720*f7cd7fe5SConrad Meyer * Experimental parameter. 1721*f7cd7fe5SConrad Meyer * Default is 0 == disabled. Set to 1 to enable. 
1722*f7cd7fe5SConrad Meyer * 1723*f7cd7fe5SConrad Meyer * Tells the compressor that the ZSTD_inBuffer will ALWAYS be the same 1724*f7cd7fe5SConrad Meyer * between calls, except for the modifications that zstd makes to pos (the 1725*f7cd7fe5SConrad Meyer * caller must not modify pos). This is checked by the compressor, and 1726*f7cd7fe5SConrad Meyer * compression will fail if it ever changes. This means the only flush 1727*f7cd7fe5SConrad Meyer * mode that makes sense is ZSTD_e_end, so zstd will error if ZSTD_e_end 1728*f7cd7fe5SConrad Meyer * is not used. The data in the ZSTD_inBuffer in the range [src, src + pos) 1729*f7cd7fe5SConrad Meyer * MUST not be modified during compression or you will get data corruption. 1730*f7cd7fe5SConrad Meyer * 1731*f7cd7fe5SConrad Meyer * When this flag is enabled zstd won't allocate an input window buffer, 1732*f7cd7fe5SConrad Meyer * because the user guarantees it can reference the ZSTD_inBuffer until 1733*f7cd7fe5SConrad Meyer * the frame is complete. But, it will still allocate an output buffer 1734*f7cd7fe5SConrad Meyer * large enough to fit a block (see ZSTD_c_stableOutBuffer). This will also 1735*f7cd7fe5SConrad Meyer * avoid the memcpy() from the input buffer to the input window buffer. 1736*f7cd7fe5SConrad Meyer * 1737*f7cd7fe5SConrad Meyer * NOTE: ZSTD_compressStream2() will error if ZSTD_e_end is not used. 1738*f7cd7fe5SConrad Meyer * That means this flag cannot be used with ZSTD_compressStream(). 1739*f7cd7fe5SConrad Meyer * 1740*f7cd7fe5SConrad Meyer * NOTE: So long as the ZSTD_inBuffer always points to valid memory, using 1741*f7cd7fe5SConrad Meyer * this flag is ALWAYS memory safe, and will never access out-of-bounds 1742*f7cd7fe5SConrad Meyer * memory. However, compression WILL fail if you violate the preconditions. 
1743*f7cd7fe5SConrad Meyer * 1744*f7cd7fe5SConrad Meyer * WARNING: The data in the ZSTD_inBuffer in the range [src, src + pos) MUST 1745*f7cd7fe5SConrad Meyer * not be modified during compression or you will get data corruption. This 1746*f7cd7fe5SConrad Meyer * is because zstd needs to reference data in the ZSTD_inBuffer to find 1747*f7cd7fe5SConrad Meyer * matches. Normally zstd maintains its own window buffer for this purpose, 1748*f7cd7fe5SConrad Meyer * but passing this flag tells zstd to use the user provided buffer. 1749*f7cd7fe5SConrad Meyer */ 1750*f7cd7fe5SConrad Meyer #define ZSTD_c_stableInBuffer ZSTD_c_experimentalParam9 1751*f7cd7fe5SConrad Meyer 1752*f7cd7fe5SConrad Meyer /* ZSTD_c_stableOutBuffer 1753*f7cd7fe5SConrad Meyer * Experimental parameter. 1754*f7cd7fe5SConrad Meyer * Default is 0 == disabled. Set to 1 to enable. 1755*f7cd7fe5SConrad Meyer * 1756*f7cd7fe5SConrad Meyer * Tells the compressor that the ZSTD_outBuffer will not be resized between 1757*f7cd7fe5SConrad Meyer * calls. Specifically: (out.size - out.pos) will never grow. This gives the 1758*f7cd7fe5SConrad Meyer * compressor the freedom to say: If the compressed data doesn't fit in the 1759*f7cd7fe5SConrad Meyer * output buffer then return ZSTD_error_dstSizeTooSmall. This allows us to 1760*f7cd7fe5SConrad Meyer * always compress directly into the output buffer, instead of compressing 1761*f7cd7fe5SConrad Meyer * into an internal buffer and copying to the output buffer. 1762*f7cd7fe5SConrad Meyer * 1763*f7cd7fe5SConrad Meyer * When this flag is enabled zstd won't allocate an output buffer, because 1764*f7cd7fe5SConrad Meyer * it can write directly to the ZSTD_outBuffer. It will still allocate the 1765*f7cd7fe5SConrad Meyer * input window buffer (see ZSTD_c_stableInBuffer). 1766*f7cd7fe5SConrad Meyer * 1767*f7cd7fe5SConrad Meyer * Zstd will check that (out.size - out.pos) never grows and return an error 1768*f7cd7fe5SConrad Meyer * if it does.
While not strictly necessary, this should prevent surprises. 1769*f7cd7fe5SConrad Meyer */ 1770*f7cd7fe5SConrad Meyer #define ZSTD_c_stableOutBuffer ZSTD_c_experimentalParam10 1771*f7cd7fe5SConrad Meyer 1772*f7cd7fe5SConrad Meyer /* ZSTD_c_blockDelimiters 1773*f7cd7fe5SConrad Meyer * Default is 0 == ZSTD_sf_noBlockDelimiters. 1774*f7cd7fe5SConrad Meyer * 1775*f7cd7fe5SConrad Meyer * For use with sequence compression API: ZSTD_compressSequences(). 1776*f7cd7fe5SConrad Meyer * 1777*f7cd7fe5SConrad Meyer * Designates whether or not the given array of ZSTD_Sequence contains block delimiters 1778*f7cd7fe5SConrad Meyer * and last literals, which are defined as sequences with offset == 0 and matchLength == 0. 1779*f7cd7fe5SConrad Meyer * See the definition of ZSTD_Sequence for more specifics. 1780*f7cd7fe5SConrad Meyer */ 1781*f7cd7fe5SConrad Meyer #define ZSTD_c_blockDelimiters ZSTD_c_experimentalParam11 1782*f7cd7fe5SConrad Meyer 1783*f7cd7fe5SConrad Meyer /* ZSTD_c_validateSequences 1784*f7cd7fe5SConrad Meyer * Default is 0 == disabled. Set to 1 to enable sequence validation. 1785*f7cd7fe5SConrad Meyer * 1786*f7cd7fe5SConrad Meyer * For use with sequence compression API: ZSTD_compressSequences(). 1787*f7cd7fe5SConrad Meyer * Designates whether or not we validate sequences provided to ZSTD_compressSequences() 1788*f7cd7fe5SConrad Meyer * during function execution. 1789*f7cd7fe5SConrad Meyer * 1790*f7cd7fe5SConrad Meyer * Without validation, providing a sequence that does not conform to the zstd spec will cause 1791*f7cd7fe5SConrad Meyer * undefined behavior, and may produce a corrupted block. 1792*f7cd7fe5SConrad Meyer * 1793*f7cd7fe5SConrad Meyer * With validation enabled, if a sequence is invalid (see doc/zstd_compression_format.md for 1794*f7cd7fe5SConrad Meyer * specifics regarding offset/matchlength requirements) then the function will bail out and 1795*f7cd7fe5SConrad Meyer * return an error.
1796*f7cd7fe5SConrad Meyer * 1797*f7cd7fe5SConrad Meyer */ 1798*f7cd7fe5SConrad Meyer #define ZSTD_c_validateSequences ZSTD_c_experimentalParam12 1799*f7cd7fe5SConrad Meyer 1800a0483764SConrad Meyer /*! ZSTD_CCtx_getParameter() : 1801a0483764SConrad Meyer * Get the requested compression parameter value, selected by enum ZSTD_cParameter, 1802a0483764SConrad Meyer * and store it into int* value. 1803a0483764SConrad Meyer * @return : 0, or an error code (which can be tested with ZSTD_isError()). 1804a0483764SConrad Meyer */ 1805a0483764SConrad Meyer ZSTDLIB_API size_t ZSTD_CCtx_getParameter(ZSTD_CCtx* cctx, ZSTD_cParameter param, int* value); 1806a0483764SConrad Meyer 1807a0483764SConrad Meyer 1808a0483764SConrad Meyer /*! ZSTD_CCtx_params : 1809a0483764SConrad Meyer * Quick howto : 1810a0483764SConrad Meyer * - ZSTD_createCCtxParams() : Create a ZSTD_CCtx_params structure 18112b9c00cbSConrad Meyer * - ZSTD_CCtxParams_setParameter() : Push parameters one by one into 1812a0483764SConrad Meyer * an existing ZSTD_CCtx_params structure. 1813a0483764SConrad Meyer * This is similar to 1814a0483764SConrad Meyer * ZSTD_CCtx_setParameter(). 1815a0483764SConrad Meyer * - ZSTD_CCtx_setParametersUsingCCtxParams() : Apply parameters to 1816a0483764SConrad Meyer * an existing CCtx. 1817a0483764SConrad Meyer * These parameters will be applied to 1818a0483764SConrad Meyer * all subsequent frames. 1819a0483764SConrad Meyer * - ZSTD_compressStream2() : Do compression using the CCtx. 1820a0483764SConrad Meyer * - ZSTD_freeCCtxParams() : Free the memory. 1821a0483764SConrad Meyer * 1822a0483764SConrad Meyer * This can be used with ZSTD_estimateCCtxSize_advanced_usingCCtxParams() 1823a0483764SConrad Meyer * for static allocation of CCtx for single-threaded compression. 
1824a0483764SConrad Meyer */ 1825a0483764SConrad Meyer ZSTDLIB_API ZSTD_CCtx_params* ZSTD_createCCtxParams(void); 1826a0483764SConrad Meyer ZSTDLIB_API size_t ZSTD_freeCCtxParams(ZSTD_CCtx_params* params); 1827a0483764SConrad Meyer 1828a0483764SConrad Meyer /*! ZSTD_CCtxParams_reset() : 1829a0483764SConrad Meyer * Reset params to default values. 1830a0483764SConrad Meyer */ 1831a0483764SConrad Meyer ZSTDLIB_API size_t ZSTD_CCtxParams_reset(ZSTD_CCtx_params* params); 1832a0483764SConrad Meyer 1833a0483764SConrad Meyer /*! ZSTD_CCtxParams_init() : 1834a0483764SConrad Meyer * Initializes the compression parameters of cctxParams according to 1835a0483764SConrad Meyer * compression level. All other parameters are reset to their default values. 1836a0483764SConrad Meyer */ 1837a0483764SConrad Meyer ZSTDLIB_API size_t ZSTD_CCtxParams_init(ZSTD_CCtx_params* cctxParams, int compressionLevel); 1838a0483764SConrad Meyer 1839a0483764SConrad Meyer /*! ZSTD_CCtxParams_init_advanced() : 1840a0483764SConrad Meyer * Initializes the compression and frame parameters of cctxParams according to 1841a0483764SConrad Meyer * params. All other parameters are reset to their default values. 1842a0483764SConrad Meyer */ 1843a0483764SConrad Meyer ZSTDLIB_API size_t ZSTD_CCtxParams_init_advanced(ZSTD_CCtx_params* cctxParams, ZSTD_parameters params); 1844a0483764SConrad Meyer 18452b9c00cbSConrad Meyer /*! ZSTD_CCtxParams_setParameter() : 1846a0483764SConrad Meyer * Similar to ZSTD_CCtx_setParameter. 1847a0483764SConrad Meyer * Set one compression parameter, selected by enum ZSTD_cParameter. 1848*f7cd7fe5SConrad Meyer * Parameters must be applied to a ZSTD_CCtx using 1849*f7cd7fe5SConrad Meyer * ZSTD_CCtx_setParametersUsingCCtxParams(). 1850*f7cd7fe5SConrad Meyer * @result : a code representing success or failure (which can be tested with 1851*f7cd7fe5SConrad Meyer * ZSTD_isError()). 
1852a0483764SConrad Meyer */ 18532b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_CCtxParams_setParameter(ZSTD_CCtx_params* params, ZSTD_cParameter param, int value); 1854a0483764SConrad Meyer 18552b9c00cbSConrad Meyer /*! ZSTD_CCtxParams_getParameter() : 1856a0483764SConrad Meyer * Similar to ZSTD_CCtx_getParameter. 1857a0483764SConrad Meyer * Get the requested value of one compression parameter, selected by enum ZSTD_cParameter. 1858a0483764SConrad Meyer * @result : 0, or an error code (which can be tested with ZSTD_isError()). 1859a0483764SConrad Meyer */ 18602b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_CCtxParams_getParameter(ZSTD_CCtx_params* params, ZSTD_cParameter param, int* value); 1861a0483764SConrad Meyer 1862a0483764SConrad Meyer /*! ZSTD_CCtx_setParametersUsingCCtxParams() : 1863a0483764SConrad Meyer * Apply a set of ZSTD_CCtx_params to the compression context. 1864a0483764SConrad Meyer * This can be done even after compression is started, 1865a0483764SConrad Meyer * if nbWorkers==0, this will have no impact until a new compression is started. 1866a0483764SConrad Meyer * if nbWorkers>=1, new parameters will be picked up at next job, 1867a0483764SConrad Meyer * with a few restrictions (windowLog, pledgedSrcSize, nbWorkers, jobSize, and overlapLog are not updated). 1868a0483764SConrad Meyer */ 1869a0483764SConrad Meyer ZSTDLIB_API size_t ZSTD_CCtx_setParametersUsingCCtxParams( 1870a0483764SConrad Meyer ZSTD_CCtx* cctx, const ZSTD_CCtx_params* params); 1871a0483764SConrad Meyer 1872a0483764SConrad Meyer /*! ZSTD_compressStream2_simpleArgs() : 1873a0483764SConrad Meyer * Same as ZSTD_compressStream2(), 1874a0483764SConrad Meyer * but using only integral types as arguments. 1875a0483764SConrad Meyer * This variant might be helpful for binders from dynamic languages 1876a0483764SConrad Meyer * which have troubles handling structures containing memory pointers. 
1877a0483764SConrad Meyer */ 1878a0483764SConrad Meyer ZSTDLIB_API size_t ZSTD_compressStream2_simpleArgs ( 1879a0483764SConrad Meyer ZSTD_CCtx* cctx, 1880a0483764SConrad Meyer void* dst, size_t dstCapacity, size_t* dstPos, 1881a0483764SConrad Meyer const void* src, size_t srcSize, size_t* srcPos, 1882a0483764SConrad Meyer ZSTD_EndDirective endOp); 1883a0483764SConrad Meyer 1884a0483764SConrad Meyer 1885a0483764SConrad Meyer /*************************************** 1886a0483764SConrad Meyer * Advanced decompression functions 1887a0483764SConrad Meyer ***************************************/ 18880c16b537SWarner Losh 18890c16b537SWarner Losh /*! ZSTD_isFrame() : 18900c16b537SWarner Losh * Tells if the content of `buffer` starts with a valid Frame Identifier. 18910c16b537SWarner Losh * Note : Frame Identifier is 4 bytes. If `size < 4`, @return will always be 0. 18920c16b537SWarner Losh * Note 2 : Legacy Frame Identifiers are considered valid only if Legacy Support is enabled. 18930c16b537SWarner Losh * Note 3 : Skippable Frame Identifiers are considered valid. */ 18940c16b537SWarner Losh ZSTDLIB_API unsigned ZSTD_isFrame(const void* buffer, size_t size); 18950c16b537SWarner Losh 18960c16b537SWarner Losh /*! ZSTD_createDDict_byReference() : 18970c16b537SWarner Losh * Create a digested dictionary, ready to start decompression operation without startup delay. 18980c16b537SWarner Losh * Dictionary content is referenced, and therefore stays in dictBuffer. 18990c16b537SWarner Losh * It is important that dictBuffer outlives DDict, 19000c16b537SWarner Losh * it must remain read accessible throughout the lifetime of DDict */ 19010c16b537SWarner Losh ZSTDLIB_API ZSTD_DDict* ZSTD_createDDict_byReference(const void* dictBuffer, size_t dictSize); 19020c16b537SWarner Losh 1903a0483764SConrad Meyer /*! 
ZSTD_DCtx_loadDictionary_byReference() : 1904a0483764SConrad Meyer * Same as ZSTD_DCtx_loadDictionary(), 1905a0483764SConrad Meyer * but references `dict` content instead of copying it into `dctx`. 1906a0483764SConrad Meyer * This saves memory if `dict` remains around. 1907a0483764SConrad Meyer * However, it's imperative that `dict` remains accessible (and unmodified) while being used, so it must outlive decompression. */ 1908a0483764SConrad Meyer ZSTDLIB_API size_t ZSTD_DCtx_loadDictionary_byReference(ZSTD_DCtx* dctx, const void* dict, size_t dictSize); 1909a0483764SConrad Meyer 1910a0483764SConrad Meyer /*! ZSTD_DCtx_loadDictionary_advanced() : 1911a0483764SConrad Meyer * Same as ZSTD_DCtx_loadDictionary(), 1912a0483764SConrad Meyer * but gives direct control over 1913a0483764SConrad Meyer * how to load the dictionary (by copy ? by reference ?) 1914a0483764SConrad Meyer * and how to interpret it (automatic ? force raw mode ? full mode only ?). */ 1915a0483764SConrad Meyer ZSTDLIB_API size_t ZSTD_DCtx_loadDictionary_advanced(ZSTD_DCtx* dctx, const void* dict, size_t dictSize, ZSTD_dictLoadMethod_e dictLoadMethod, ZSTD_dictContentType_e dictContentType); 1916a0483764SConrad Meyer 1917a0483764SConrad Meyer /*! ZSTD_DCtx_refPrefix_advanced() : 1918a0483764SConrad Meyer * Same as ZSTD_DCtx_refPrefix(), but gives finer control over 1919a0483764SConrad Meyer * how to interpret prefix content (automatic ? force raw mode (default) ? full mode only ?) */ 1920a0483764SConrad Meyer ZSTDLIB_API size_t ZSTD_DCtx_refPrefix_advanced(ZSTD_DCtx* dctx, const void* prefix, size_t prefixSize, ZSTD_dictContentType_e dictContentType); 1921a0483764SConrad Meyer 1922a0483764SConrad Meyer /*! ZSTD_DCtx_setMaxWindowSize() : 1923a0483764SConrad Meyer * Refuses allocating internal buffers for frames requiring a window size larger than provided limit. 1924a0483764SConrad Meyer * This protects a decoder context from reserving too much memory for itself (potential attack scenario).
1925a0483764SConrad Meyer * This parameter is only useful in streaming mode, since no internal buffer is allocated in single-pass mode. 1926a0483764SConrad Meyer * By default, a decompression context accepts all window sizes <= (1 << ZSTD_WINDOWLOG_LIMIT_DEFAULT) 1927a0483764SConrad Meyer * @return : 0, or an error code (which can be tested using ZSTD_isError()). 1928a0483764SConrad Meyer */ 1929a0483764SConrad Meyer ZSTDLIB_API size_t ZSTD_DCtx_setMaxWindowSize(ZSTD_DCtx* dctx, size_t maxWindowSize); 1930a0483764SConrad Meyer 1931*f7cd7fe5SConrad Meyer /*! ZSTD_DCtx_getParameter() : 1932*f7cd7fe5SConrad Meyer * Get the requested decompression parameter value, selected by enum ZSTD_dParameter, 1933*f7cd7fe5SConrad Meyer * and store it into int* value. 1934*f7cd7fe5SConrad Meyer * @return : 0, or an error code (which can be tested with ZSTD_isError()). 1935*f7cd7fe5SConrad Meyer */ 1936*f7cd7fe5SConrad Meyer ZSTDLIB_API size_t ZSTD_DCtx_getParameter(ZSTD_DCtx* dctx, ZSTD_dParameter param, int* value); 1937*f7cd7fe5SConrad Meyer 1938a0483764SConrad Meyer /* ZSTD_d_format 1939a0483764SConrad Meyer * experimental parameter, 1940a0483764SConrad Meyer * allowing selection between ZSTD_format_e input compression formats 1941a0483764SConrad Meyer */ 1942a0483764SConrad Meyer #define ZSTD_d_format ZSTD_d_experimentalParam1 194337f1f268SConrad Meyer /* ZSTD_d_stableOutBuffer 194437f1f268SConrad Meyer * Experimental parameter. 194537f1f268SConrad Meyer * Default is 0 == disabled. Set to 1 to enable. 194637f1f268SConrad Meyer * 194737f1f268SConrad Meyer * Tells the decompressor that the ZSTD_outBuffer will ALWAYS be the same 194837f1f268SConrad Meyer * between calls, except for the modifications that zstd makes to pos (the 194937f1f268SConrad Meyer * caller must not modify pos). This is checked by the decompressor, and 195037f1f268SConrad Meyer * decompression will fail if it ever changes. 
Therefore the ZSTD_outBuffer 195137f1f268SConrad Meyer * MUST be large enough to fit the entire decompressed frame. This will be 195237f1f268SConrad Meyer * checked when the frame content size is known. The data in the ZSTD_outBuffer 195337f1f268SConrad Meyer * in the range [dst, dst + pos) MUST not be modified during decompression 195437f1f268SConrad Meyer * or you will get data corruption. 195537f1f268SConrad Meyer * 195637f1f268SConrad Meyer * When this flag is enabled zstd won't allocate an output buffer, because 195737f1f268SConrad Meyer * it can write directly to the ZSTD_outBuffer, but it will still allocate 195837f1f268SConrad Meyer * an input buffer large enough to fit any compressed block. This will also 195937f1f268SConrad Meyer * avoid the memcpy() from the internal output buffer to the ZSTD_outBuffer. 196037f1f268SConrad Meyer * If you need to avoid the input buffer allocation use the buffer-less 196137f1f268SConrad Meyer * streaming API. 196237f1f268SConrad Meyer * 196337f1f268SConrad Meyer * NOTE: So long as the ZSTD_outBuffer always points to valid memory, using 196437f1f268SConrad Meyer * this flag is ALWAYS memory safe, and will never access out-of-bounds 196537f1f268SConrad Meyer * memory. However, decompression WILL fail if you violate the preconditions. 196637f1f268SConrad Meyer * 196737f1f268SConrad Meyer * WARNING: The data in the ZSTD_outBuffer in the range [dst, dst + pos) MUST 196837f1f268SConrad Meyer * not be modified during decompression or you will get data corruption. This 196937f1f268SConrad Meyer * is because zstd needs to reference data in the ZSTD_outBuffer to regenerate 197037f1f268SConrad Meyer * matches. Normally zstd maintains its own buffer for this purpose, but passing 197137f1f268SConrad Meyer * this flag tells zstd to use the user provided buffer.
197237f1f268SConrad Meyer */ 197337f1f268SConrad Meyer #define ZSTD_d_stableOutBuffer ZSTD_d_experimentalParam2 1974a0483764SConrad Meyer 1975*f7cd7fe5SConrad Meyer /* ZSTD_d_forceIgnoreChecksum 1976*f7cd7fe5SConrad Meyer * Experimental parameter. 1977*f7cd7fe5SConrad Meyer * Default is 0 == disabled. Set to 1 to enable. 1978*f7cd7fe5SConrad Meyer * 1979*f7cd7fe5SConrad Meyer * Tells the decompressor to skip checksum validation during decompression, regardless 1980*f7cd7fe5SConrad Meyer * of whether checksumming was specified during compression. This offers some 1981*f7cd7fe5SConrad Meyer * slight performance benefits, and may be useful for debugging. 1982*f7cd7fe5SConrad Meyer * Param has values of type ZSTD_forceIgnoreChecksum_e 1983*f7cd7fe5SConrad Meyer */ 1984*f7cd7fe5SConrad Meyer #define ZSTD_d_forceIgnoreChecksum ZSTD_d_experimentalParam3 1985*f7cd7fe5SConrad Meyer 1986a0483764SConrad Meyer /*! ZSTD_DCtx_setFormat() : 1987a0483764SConrad Meyer * Instruct the decoder context about what kind of data to decode next. 1988a0483764SConrad Meyer * This instruction is mandatory to decode data without a fully-formed header, 1989a0483764SConrad Meyer * such as ZSTD_f_zstd1_magicless for example. 1990a0483764SConrad Meyer * @return : 0, or an error code (which can be tested using ZSTD_isError()). */ 1991a0483764SConrad Meyer ZSTDLIB_API size_t ZSTD_DCtx_setFormat(ZSTD_DCtx* dctx, ZSTD_format_e format); 1992a0483764SConrad Meyer 1993a0483764SConrad Meyer /*! ZSTD_decompressStream_simpleArgs() : 1994a0483764SConrad Meyer * Same as ZSTD_decompressStream(), 1995a0483764SConrad Meyer * but using only integral types as arguments. 1996a0483764SConrad Meyer * This can be helpful for binders from dynamic languages 1997a0483764SConrad Meyer * which have troubles handling structures containing memory pointers.
1998a0483764SConrad Meyer */ 1999a0483764SConrad Meyer ZSTDLIB_API size_t ZSTD_decompressStream_simpleArgs ( 2000a0483764SConrad Meyer ZSTD_DCtx* dctx, 2001a0483764SConrad Meyer void* dst, size_t dstCapacity, size_t* dstPos, 2002a0483764SConrad Meyer const void* src, size_t srcSize, size_t* srcPos); 2003a0483764SConrad Meyer 20040c16b537SWarner Losh 20050c16b537SWarner Losh /******************************************************************** 20060c16b537SWarner Losh * Advanced streaming functions 2007a0483764SConrad Meyer * Warning : most of these functions are now redundant with the Advanced API. 2008a0483764SConrad Meyer * Once Advanced API reaches "stable" status, 2009a0483764SConrad Meyer * redundant functions will be deprecated, and then at some point removed. 20100c16b537SWarner Losh ********************************************************************/ 20110c16b537SWarner Losh 20120c16b537SWarner Losh /*===== Advanced Streaming compression functions =====*/ 2013*f7cd7fe5SConrad Meyer 2014*f7cd7fe5SConrad Meyer /*! ZSTD_initCStream_srcSize() : 20152b9c00cbSConrad Meyer * This function is deprecated, and equivalent to: 20162b9c00cbSConrad Meyer * ZSTD_CCtx_reset(zcs, ZSTD_reset_session_only); 20172b9c00cbSConrad Meyer * ZSTD_CCtx_refCDict(zcs, NULL); // clear the dictionary (if any) 20182b9c00cbSConrad Meyer * ZSTD_CCtx_setParameter(zcs, ZSTD_c_compressionLevel, compressionLevel); 20192b9c00cbSConrad Meyer * ZSTD_CCtx_setPledgedSrcSize(zcs, pledgedSrcSize); 20202b9c00cbSConrad Meyer * 20212b9c00cbSConrad Meyer * pledgedSrcSize must be correct. If it is not known at init time, use 20222b9c00cbSConrad Meyer * ZSTD_CONTENTSIZE_UNKNOWN. Note that, for compatibility with older programs, 20232b9c00cbSConrad Meyer * "0" also disables frame content size field. It may be enabled in the future. 
20249cbefe25SConrad Meyer * Note : this prototype will be marked as deprecated and generate compilation warnings on reaching v1.5.x 20252b9c00cbSConrad Meyer */ 20269cbefe25SConrad Meyer ZSTDLIB_API size_t 20279cbefe25SConrad Meyer ZSTD_initCStream_srcSize(ZSTD_CStream* zcs, 20289cbefe25SConrad Meyer int compressionLevel, 20299cbefe25SConrad Meyer unsigned long long pledgedSrcSize); 20309cbefe25SConrad Meyer 2031*f7cd7fe5SConrad Meyer /*! ZSTD_initCStream_usingDict() : 20322b9c00cbSConrad Meyer * This function is deprecated, and is equivalent to: 20332b9c00cbSConrad Meyer * ZSTD_CCtx_reset(zcs, ZSTD_reset_session_only); 20342b9c00cbSConrad Meyer * ZSTD_CCtx_setParameter(zcs, ZSTD_c_compressionLevel, compressionLevel); 20352b9c00cbSConrad Meyer * ZSTD_CCtx_loadDictionary(zcs, dict, dictSize); 20362b9c00cbSConrad Meyer * 20372b9c00cbSConrad Meyer * Creates an internal CDict (incompatible with static CCtx), except if 20382b9c00cbSConrad Meyer * dict == NULL or dictSize < 8, in which case no dict is used. 20399cbefe25SConrad Meyer * Note: dict is loaded with ZSTD_dct_auto (treated as a full zstd dictionary if 20402b9c00cbSConrad Meyer * it begins with ZSTD_MAGIC_DICTIONARY, else as raw content) and ZSTD_dlm_byCopy. 20419cbefe25SConrad Meyer * Note : this prototype will be marked as deprecated and generate compilation warnings on reaching v1.5.x 20422b9c00cbSConrad Meyer */ 20439cbefe25SConrad Meyer ZSTDLIB_API size_t 20449cbefe25SConrad Meyer ZSTD_initCStream_usingDict(ZSTD_CStream* zcs, 20459cbefe25SConrad Meyer const void* dict, size_t dictSize, 20469cbefe25SConrad Meyer int compressionLevel); 20479cbefe25SConrad Meyer 2048*f7cd7fe5SConrad Meyer /*! ZSTD_initCStream_advanced() : 20492b9c00cbSConrad Meyer * This function is deprecated, and is approximately equivalent to: 20502b9c00cbSConrad Meyer * ZSTD_CCtx_reset(zcs, ZSTD_reset_session_only); 20519cbefe25SConrad Meyer * // Pseudocode: Set each zstd parameter and leave the rest as-is.
20529cbefe25SConrad Meyer * for ((param, value) : params) { 20539cbefe25SConrad Meyer * ZSTD_CCtx_setParameter(zcs, param, value); 20549cbefe25SConrad Meyer * } 20552b9c00cbSConrad Meyer * ZSTD_CCtx_setPledgedSrcSize(zcs, pledgedSrcSize); 20562b9c00cbSConrad Meyer * ZSTD_CCtx_loadDictionary(zcs, dict, dictSize); 20572b9c00cbSConrad Meyer * 20589cbefe25SConrad Meyer * dict is loaded with ZSTD_dct_auto and ZSTD_dlm_byCopy. 20599cbefe25SConrad Meyer * pledgedSrcSize must be correct. 20609cbefe25SConrad Meyer * If srcSize is not known at init time, use value ZSTD_CONTENTSIZE_UNKNOWN. 20619cbefe25SConrad Meyer * Note : this prototype will be marked as deprecated and generate compilation warnings on reaching v1.5.x 20622b9c00cbSConrad Meyer */ 20639cbefe25SConrad Meyer ZSTDLIB_API size_t 20649cbefe25SConrad Meyer ZSTD_initCStream_advanced(ZSTD_CStream* zcs, 20659cbefe25SConrad Meyer const void* dict, size_t dictSize, 20669cbefe25SConrad Meyer ZSTD_parameters params, 20679cbefe25SConrad Meyer unsigned long long pledgedSrcSize); 20689cbefe25SConrad Meyer 2069*f7cd7fe5SConrad Meyer /*! ZSTD_initCStream_usingCDict() : 20702b9c00cbSConrad Meyer * This function is deprecated, and equivalent to: 20712b9c00cbSConrad Meyer * ZSTD_CCtx_reset(zcs, ZSTD_reset_session_only); 20722b9c00cbSConrad Meyer * ZSTD_CCtx_refCDict(zcs, cdict); 20732b9c00cbSConrad Meyer * 20742b9c00cbSConrad Meyer * note : cdict will just be referenced, and must outlive compression session 20759cbefe25SConrad Meyer * Note : this prototype will be marked as deprecated and generate compilation warnings on reaching v1.5.x 20762b9c00cbSConrad Meyer */ 20772b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_initCStream_usingCDict(ZSTD_CStream* zcs, const ZSTD_CDict* cdict); 20789cbefe25SConrad Meyer 2079*f7cd7fe5SConrad Meyer /*! 
ZSTD_initCStream_usingCDict_advanced() : 20809cbefe25SConrad Meyer * This function is DEPRECATED, and is approximately equivalent to: 20812b9c00cbSConrad Meyer * ZSTD_CCtx_reset(zcs, ZSTD_reset_session_only); 20829cbefe25SConrad Meyer * // Pseudocode: Set each zstd frame parameter and leave the rest as-is. 20839cbefe25SConrad Meyer * for ((fParam, value) : fParams) { 20849cbefe25SConrad Meyer * ZSTD_CCtx_setParameter(zcs, fParam, value); 20859cbefe25SConrad Meyer * } 20862b9c00cbSConrad Meyer * ZSTD_CCtx_setPledgedSrcSize(zcs, pledgedSrcSize); 20872b9c00cbSConrad Meyer * ZSTD_CCtx_refCDict(zcs, cdict); 20882b9c00cbSConrad Meyer * 20892b9c00cbSConrad Meyer * same as ZSTD_initCStream_usingCDict(), with control over frame parameters. 20902b9c00cbSConrad Meyer * pledgedSrcSize must be correct. If srcSize is not known at init time, use 20912b9c00cbSConrad Meyer * value ZSTD_CONTENTSIZE_UNKNOWN. 20929cbefe25SConrad Meyer * Note : this prototype will be marked as deprecated and generate compilation warnings on reaching v1.5.x 20932b9c00cbSConrad Meyer */ 20949cbefe25SConrad Meyer ZSTDLIB_API size_t 20959cbefe25SConrad Meyer ZSTD_initCStream_usingCDict_advanced(ZSTD_CStream* zcs, 20969cbefe25SConrad Meyer const ZSTD_CDict* cdict, 20979cbefe25SConrad Meyer ZSTD_frameParameters fParams, 20989cbefe25SConrad Meyer unsigned long long pledgedSrcSize); 20990c16b537SWarner Losh 21000c16b537SWarner Losh /*! ZSTD_resetCStream() : 21012b9c00cbSConrad Meyer * This function is deprecated, and is equivalent to: 21022b9c00cbSConrad Meyer * ZSTD_CCtx_reset(zcs, ZSTD_reset_session_only); 21032b9c00cbSConrad Meyer * ZSTD_CCtx_setPledgedSrcSize(zcs, pledgedSrcSize); 21042b9c00cbSConrad Meyer * 2105a0483764SConrad Meyer * start a new frame, using same parameters from previous frame. 21060f743729SConrad Meyer * This is typically useful to skip dictionary loading stage, since it will re-use it in-place. 
21070c16b537SWarner Losh * Note that zcs must be init at least once before using ZSTD_resetCStream(). 2108052d3c12SConrad Meyer * If pledgedSrcSize is not known at reset time, use macro ZSTD_CONTENTSIZE_UNKNOWN. 21090c16b537SWarner Losh * If pledgedSrcSize > 0, its value must be correct, as it will be written in header, and controlled at the end. 2110052d3c12SConrad Meyer * For the time being, pledgedSrcSize==0 is interpreted as "srcSize unknown" for compatibility with older programs, 211119fcbaf1SConrad Meyer * but it will change to mean "empty" in future version, so use macro ZSTD_CONTENTSIZE_UNKNOWN instead. 21120f743729SConrad Meyer * @return : 0, or an error code (which can be tested using ZSTD_isError()) 21139cbefe25SConrad Meyer * Note : this prototype will be marked as deprecated and generate compilation warnings on reaching v1.5.x 21140f743729SConrad Meyer */ 21150c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_resetCStream(ZSTD_CStream* zcs, unsigned long long pledgedSrcSize); 21160c16b537SWarner Losh 21170c16b537SWarner Losh 211819fcbaf1SConrad Meyer typedef struct { 21190f743729SConrad Meyer unsigned long long ingested; /* nb input bytes read and buffered */ 21200f743729SConrad Meyer unsigned long long consumed; /* nb input bytes actually compressed */ 21210f743729SConrad Meyer unsigned long long produced; /* nb of compressed bytes generated and buffered */ 21220f743729SConrad Meyer unsigned long long flushed; /* nb of compressed bytes flushed : not provided; can be tracked from caller side */ 21230f743729SConrad Meyer unsigned currentJobID; /* MT only : latest started job nb */ 21240f743729SConrad Meyer unsigned nbActiveWorkers; /* MT only : nb of workers actively compressing at probe time */ 212519fcbaf1SConrad Meyer } ZSTD_frameProgression; 212619fcbaf1SConrad Meyer 212719fcbaf1SConrad Meyer /* ZSTD_getFrameProgression() : 212819fcbaf1SConrad Meyer * tells how much data has been ingested (read from input) 212919fcbaf1SConrad Meyer * consumed (input 
actually compressed) and produced (output) for current frame. 21300f743729SConrad Meyer * Note : (ingested - consumed) is amount of input data buffered internally, not yet compressed. 21310f743729SConrad Meyer * Aggregates progression inside active worker threads. 213219fcbaf1SConrad Meyer */ 21330f743729SConrad Meyer ZSTDLIB_API ZSTD_frameProgression ZSTD_getFrameProgression(const ZSTD_CCtx* cctx); 21340f743729SConrad Meyer 21350f743729SConrad Meyer /*! ZSTD_toFlushNow() : 21360f743729SConrad Meyer * Tell how many bytes are ready to be flushed immediately. 21370f743729SConrad Meyer * Useful for multithreading scenarios (nbWorkers >= 1). 21380f743729SConrad Meyer * Probe the oldest active job, defined as oldest job not yet entirely flushed, 21390f743729SConrad Meyer * and check its output buffer. 21400f743729SConrad Meyer * @return : amount of data stored in oldest job and ready to be flushed immediately. 21410f743729SConrad Meyer * if @return == 0, it means either : 21420f743729SConrad Meyer * + there is no active job (could be checked with ZSTD_getFrameProgression()), or 21430f743729SConrad Meyer * + oldest job is still actively compressing data, 21440f743729SConrad Meyer * but everything it has produced has also been flushed so far, 2145a0483764SConrad Meyer * therefore flush speed is limited by production speed of oldest job 2146a0483764SConrad Meyer * irrespective of the speed of concurrent (and newer) jobs. 21470f743729SConrad Meyer */ 21480f743729SConrad Meyer ZSTDLIB_API size_t ZSTD_toFlushNow(ZSTD_CCtx* cctx); 214919fcbaf1SConrad Meyer 215019fcbaf1SConrad Meyer 21510c16b537SWarner Losh /*===== Advanced Streaming decompression functions =====*/ 2152*f7cd7fe5SConrad Meyer 2153*f7cd7fe5SConrad Meyer /*!
21542b9c00cbSConrad Meyer * This function is deprecated, and is equivalent to: 21552b9c00cbSConrad Meyer * 21562b9c00cbSConrad Meyer * ZSTD_DCtx_reset(zds, ZSTD_reset_session_only); 21572b9c00cbSConrad Meyer * ZSTD_DCtx_loadDictionary(zds, dict, dictSize); 21582b9c00cbSConrad Meyer * 21592b9c00cbSConrad Meyer * note: no dictionary will be used if dict == NULL or dictSize < 8 21609cbefe25SConrad Meyer * Note : this prototype will be marked as deprecated and generate compilation warnings on reaching v1.5.x 21612b9c00cbSConrad Meyer */ 21622b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_initDStream_usingDict(ZSTD_DStream* zds, const void* dict, size_t dictSize); 21639cbefe25SConrad Meyer 2164*f7cd7fe5SConrad Meyer /*! 21652b9c00cbSConrad Meyer * This function is deprecated, and is equivalent to: 21662b9c00cbSConrad Meyer * 21672b9c00cbSConrad Meyer * ZSTD_DCtx_reset(zds, ZSTD_reset_session_only); 21682b9c00cbSConrad Meyer * ZSTD_DCtx_refDDict(zds, ddict); 21692b9c00cbSConrad Meyer * 21702b9c00cbSConrad Meyer * note : ddict is referenced, it must outlive decompression session 21719cbefe25SConrad Meyer * Note : this prototype will be marked as deprecated and generate compilation warnings on reaching v1.5.x 21722b9c00cbSConrad Meyer */ 21732b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_initDStream_usingDDict(ZSTD_DStream* zds, const ZSTD_DDict* ddict); 21749cbefe25SConrad Meyer 2175*f7cd7fe5SConrad Meyer /*! 
21762b9c00cbSConrad Meyer * This function is deprecated, and is equivalent to: 21772b9c00cbSConrad Meyer * 21782b9c00cbSConrad Meyer * ZSTD_DCtx_reset(zds, ZSTD_reset_session_only); 21792b9c00cbSConrad Meyer * 21802b9c00cbSConrad Meyer * re-use decompression parameters from previous init; saves dictionary loading 21819cbefe25SConrad Meyer * Note : this prototype will be marked as deprecated and generate compilation warnings on reaching v1.5.x 21822b9c00cbSConrad Meyer */ 21832b9c00cbSConrad Meyer ZSTDLIB_API size_t ZSTD_resetDStream(ZSTD_DStream* zds); 21840c16b537SWarner Losh 21850c16b537SWarner Losh 21860c16b537SWarner Losh /********************************************************************* 21870c16b537SWarner Losh * Buffer-less and synchronous inner streaming functions 21880c16b537SWarner Losh * 21890c16b537SWarner Losh * This is an advanced API, giving full control over buffer management, for users which need direct control over memory. 21900c16b537SWarner Losh * But it's also a complex one, with several restrictions, documented below. 21910c16b537SWarner Losh * Prefer normal streaming API for an easier experience. 21920c16b537SWarner Losh ********************************************************************* */ 21930c16b537SWarner Losh 21940c16b537SWarner Losh /** 21950c16b537SWarner Losh Buffer-less streaming compression (synchronous mode) 21960c16b537SWarner Losh 21970c16b537SWarner Losh A ZSTD_CCtx object is required to track streaming operations. 21980c16b537SWarner Losh Use ZSTD_createCCtx() / ZSTD_freeCCtx() to manage resource. 21990c16b537SWarner Losh ZSTD_CCtx object can be re-used multiple times within successive compression operations. 22000c16b537SWarner Losh 22010c16b537SWarner Losh Start by initializing a context. 22020c16b537SWarner Losh Use ZSTD_compressBegin(), or ZSTD_compressBegin_usingDict() for dictionary compression, 22030c16b537SWarner Losh or ZSTD_compressBegin_advanced(), for finer parameter control. 
22040c16b537SWarner Losh It's also possible to duplicate a reference context which has already been initialized, using ZSTD_copyCCtx() 22050c16b537SWarner Losh 22060c16b537SWarner Losh Then, consume your input using ZSTD_compressContinue(). 22070c16b537SWarner Losh There are some important considerations to keep in mind when using this advanced function : 22080c16b537SWarner Losh - ZSTD_compressContinue() has no internal buffer. It uses externally provided buffers only. 22090c16b537SWarner Losh - Interface is synchronous : input is consumed entirely and produces 1+ compressed blocks. 22100c16b537SWarner Losh - Caller must ensure there is enough space in `dst` to store compressed data under worst case scenario. 22110c16b537SWarner Losh Worst case evaluation is provided by ZSTD_compressBound(). 22120c16b537SWarner Losh ZSTD_compressContinue() doesn't guarantee recovery after a failed compression. 22130c16b537SWarner Losh - ZSTD_compressContinue() presumes prior input ***is still accessible and unmodified*** (up to maximum distance size, see WindowLog). 22140c16b537SWarner Losh It remembers all previous contiguous blocks, plus one separated memory segment (which can itself consist of multiple contiguous blocks) 22150c16b537SWarner Losh - ZSTD_compressContinue() detects that prior input has been overwritten when `src` buffer overlaps. 22160c16b537SWarner Losh In which case, it will "discard" the relevant memory section from its history. 22170c16b537SWarner Losh 22180c16b537SWarner Losh Finish a frame with ZSTD_compressEnd(), which will write the last block(s) and optional checksum. 22190c16b537SWarner Losh It's possible to use srcSize==0, in which case, it will write a final empty block to end the frame. 22200c16b537SWarner Losh Without last block mark, frames are considered unfinished (hence corrupted) by compliant decoders. 22210c16b537SWarner Losh 22220c16b537SWarner Losh `ZSTD_CCtx` object can be re-used (ZSTD_compressBegin()) to compress again. 
22230c16b537SWarner Losh */ 22240c16b537SWarner Losh 22250c16b537SWarner Losh /*===== Buffer-less streaming compression functions =====*/ 22260c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_compressBegin(ZSTD_CCtx* cctx, int compressionLevel); 22270c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_compressBegin_usingDict(ZSTD_CCtx* cctx, const void* dict, size_t dictSize, int compressionLevel); 2228052d3c12SConrad Meyer ZSTDLIB_API size_t ZSTD_compressBegin_advanced(ZSTD_CCtx* cctx, const void* dict, size_t dictSize, ZSTD_parameters params, unsigned long long pledgedSrcSize); /**< pledgedSrcSize : If srcSize is not known at init time, use ZSTD_CONTENTSIZE_UNKNOWN */ 22290c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_compressBegin_usingCDict(ZSTD_CCtx* cctx, const ZSTD_CDict* cdict); /**< note: fails if cdict==NULL */ 2230052d3c12SConrad Meyer ZSTDLIB_API size_t ZSTD_compressBegin_usingCDict_advanced(ZSTD_CCtx* const cctx, const ZSTD_CDict* const cdict, ZSTD_frameParameters const fParams, unsigned long long const pledgedSrcSize); /* compression parameters are already set within cdict. pledgedSrcSize must be correct. If srcSize is not known, use macro ZSTD_CONTENTSIZE_UNKNOWN */ 2231052d3c12SConrad Meyer ZSTDLIB_API size_t ZSTD_copyCCtx(ZSTD_CCtx* cctx, const ZSTD_CCtx* preparedCCtx, unsigned long long pledgedSrcSize); /**< note: if pledgedSrcSize is not known, use ZSTD_CONTENTSIZE_UNKNOWN */ 22320c16b537SWarner Losh 22330c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_compressContinue(ZSTD_CCtx* cctx, void* dst, size_t dstCapacity, const void* src, size_t srcSize); 22340c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_compressEnd(ZSTD_CCtx* cctx, void* dst, size_t dstCapacity, const void* src, size_t srcSize); 22350c16b537SWarner Losh 22360c16b537SWarner Losh 2237*f7cd7fe5SConrad Meyer /** 22380c16b537SWarner Losh Buffer-less streaming decompression (synchronous mode) 22390c16b537SWarner Losh 22400c16b537SWarner Losh A ZSTD_DCtx object is required to track streaming operations. 
22410c16b537SWarner Losh Use ZSTD_createDCtx() / ZSTD_freeDCtx() to manage it. 22420c16b537SWarner Losh A ZSTD_DCtx object can be re-used multiple times. 22430c16b537SWarner Losh 22440c16b537SWarner Losh First typical operation is to retrieve frame parameters, using ZSTD_getFrameHeader(). 22450c16b537SWarner Losh Frame header is extracted from the beginning of compressed frame, so providing only the frame's beginning is enough. 22460c16b537SWarner Losh Data fragment must be large enough to ensure successful decoding. 22470c16b537SWarner Losh `ZSTD_frameHeaderSize_max` bytes is guaranteed to always be large enough. 22480c16b537SWarner Losh @result : 0 : successful decoding, the `ZSTD_frameHeader` structure is correctly filled. 22490c16b537SWarner Losh >0 : `srcSize` is too small, please provide at least @result bytes on next attempt. 22500c16b537SWarner Losh errorCode, which can be tested using ZSTD_isError(). 22510c16b537SWarner Losh 22520c16b537SWarner Losh It fills a ZSTD_frameHeader structure with important information to correctly decode the frame, 22530c16b537SWarner Losh such as the dictionary ID, content size, or maximum back-reference distance (`windowSize`). 22540c16b537SWarner Losh Note that these values could be wrong, either because of data corruption, or because a 3rd party deliberately spoofs false information. 22550c16b537SWarner Losh As a consequence, check that values remain within valid application range. 22560c16b537SWarner Losh For example, do not allocate memory blindly, check that `windowSize` is within expectation. 22570c16b537SWarner Losh Each application can set its own limits, depending on local restrictions. 22580c16b537SWarner Losh For extended interoperability, it is recommended to support `windowSize` of at least 8 MB. 22590c16b537SWarner Losh 22600c16b537SWarner Losh ZSTD_decompressContinue() needs previous data blocks during decompression, up to `windowSize` bytes. 
22610c16b537SWarner Losh ZSTD_decompressContinue() is very sensitive to contiguity, 22620c16b537SWarner Losh if 2 blocks don't follow each other, make sure that either the compressor breaks contiguity at the same place, 22630c16b537SWarner Losh or that previous contiguous segment is large enough to properly handle maximum back-reference distance. 22640c16b537SWarner Losh There are multiple ways to guarantee this condition. 22650c16b537SWarner Losh 22660c16b537SWarner Losh The most memory efficient way is to use a round buffer of sufficient size. 22670c16b537SWarner Losh Sufficient size is determined by invoking ZSTD_decodingBufferSize_min(), 22680c16b537SWarner Losh which can @return an error code if required value is too large for current system (in 32-bits mode). 22690c16b537SWarner Losh In a round buffer methodology, ZSTD_decompressContinue() decompresses each block next to previous one, 22700c16b537SWarner Losh up to the moment there is not enough room left in the buffer to guarantee decoding another full block, 22710c16b537SWarner Losh whose maximum size is provided in `ZSTD_frameHeader` structure, field `blockSizeMax`. 22720c16b537SWarner Losh At which point, decoding can resume from the beginning of the buffer. 22730c16b537SWarner Losh Note that already decoded data stored in the buffer should be flushed before being overwritten. 22740c16b537SWarner Losh 22750c16b537SWarner Losh There are alternatives possible, for example using two or more buffers of size `windowSize` each, though they consume more memory. 22760c16b537SWarner Losh 22770c16b537SWarner Losh Finally, if you control the compression process, you can also ignore all buffer size rules, 22780c16b537SWarner Losh as long as the encoder and decoder progress in "lock-step", 22790c16b537SWarner Losh aka use exactly the same buffer sizes, break contiguity at the same place, etc. 22800c16b537SWarner Losh 22810c16b537SWarner Losh Once buffers are set up, start decompression, with ZSTD_decompressBegin(). 
22820c16b537SWarner Losh If decompression requires a dictionary, use ZSTD_decompressBegin_usingDict() or ZSTD_decompressBegin_usingDDict(). 22830c16b537SWarner Losh 22840c16b537SWarner Losh Then use ZSTD_nextSrcSizeToDecompress() and ZSTD_decompressContinue() alternately. 22850c16b537SWarner Losh ZSTD_nextSrcSizeToDecompress() tells how many bytes to provide as 'srcSize' to ZSTD_decompressContinue(). 22860c16b537SWarner Losh ZSTD_decompressContinue() requires this _exact_ amount of bytes, or it will fail. 22870c16b537SWarner Losh 22880c16b537SWarner Losh @result of ZSTD_decompressContinue() is the number of bytes regenerated within 'dst' (necessarily <= dstCapacity). 22890c16b537SWarner Losh It can be zero : it just means ZSTD_decompressContinue() has decoded some metadata item. 22900c16b537SWarner Losh It can also be an error code, which can be tested with ZSTD_isError(). 22910c16b537SWarner Losh 22920c16b537SWarner Losh A frame is fully decoded when ZSTD_nextSrcSizeToDecompress() returns zero. 22930c16b537SWarner Losh Context can then be reset to start a new decompression. 22940c16b537SWarner Losh 22950c16b537SWarner Losh Note : it's possible to know if next input to present is a header or a block, using ZSTD_nextInputType(). 22960c16b537SWarner Losh This information is not required to properly decode a frame. 22970c16b537SWarner Losh 22980c16b537SWarner Losh == Special case : skippable frames == 22990c16b537SWarner Losh 23000c16b537SWarner Losh Skippable frames allow integration of user-defined data into a flow of concatenated frames. 23010c16b537SWarner Losh Skippable frames will be ignored (skipped) by decompressor. 
23020c16b537SWarner Losh The format of skippable frames is as follows : 23030c16b537SWarner Losh a) Skippable frame ID - 4 Bytes, Little endian format, any value from 0x184D2A50 to 0x184D2A5F 23040c16b537SWarner Losh b) Frame Size - 4 Bytes, Little endian format, unsigned 32-bits 23050c16b537SWarner Losh c) Frame Content - any content (User Data) of length equal to Frame Size 23060c16b537SWarner Losh For skippable frames ZSTD_getFrameHeader() returns zfhPtr->frameType==ZSTD_skippableFrame. 23070c16b537SWarner Losh For skippable frames ZSTD_decompressContinue() always returns 0 : it only skips the content. 23080c16b537SWarner Losh */ 23090c16b537SWarner Losh 23100c16b537SWarner Losh /*===== Buffer-less streaming decompression functions =====*/ 23110c16b537SWarner Losh typedef enum { ZSTD_frame, ZSTD_skippableFrame } ZSTD_frameType_e; 23120c16b537SWarner Losh typedef struct { 23130c16b537SWarner Losh unsigned long long frameContentSize; /* if == ZSTD_CONTENTSIZE_UNKNOWN, it means this field is not available. 0 means "empty" */ 23140c16b537SWarner Losh unsigned long long windowSize; /* can be very large, up to <= frameContentSize */ 23150c16b537SWarner Losh unsigned blockSizeMax; 23160c16b537SWarner Losh ZSTD_frameType_e frameType; /* if == ZSTD_skippableFrame, frameContentSize is the size of skippable content */ 23170c16b537SWarner Losh unsigned headerSize; 23180c16b537SWarner Losh unsigned dictID; 23190c16b537SWarner Losh unsigned checksumFlag; 23200c16b537SWarner Losh } ZSTD_frameHeader; 2321a0483764SConrad Meyer 23224d3f1eafSConrad Meyer /*! ZSTD_getFrameHeader() : 23230f743729SConrad Meyer * decode Frame Header, or requires larger `srcSize`. 
23240f743729SConrad Meyer * @return : 0, `zfhPtr` is correctly filled, 23250f743729SConrad Meyer * >0, `srcSize` is too small, value is wanted `srcSize` amount, 23260f743729SConrad Meyer * or an error code, which can be tested using ZSTD_isError() */ 23270c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_getFrameHeader(ZSTD_frameHeader* zfhPtr, const void* src, size_t srcSize); /**< doesn't consume input */ 2328a0483764SConrad Meyer /*! ZSTD_getFrameHeader_advanced() : 2329a0483764SConrad Meyer * same as ZSTD_getFrameHeader(), 2330a0483764SConrad Meyer * with added capability to select a format (like ZSTD_f_zstd1_magicless) */ 2331a0483764SConrad Meyer ZSTDLIB_API size_t ZSTD_getFrameHeader_advanced(ZSTD_frameHeader* zfhPtr, const void* src, size_t srcSize, ZSTD_format_e format); 23320c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_decodingBufferSize_min(unsigned long long windowSize, unsigned long long frameContentSize); /**< when frame content size is not known, pass in frameContentSize == ZSTD_CONTENTSIZE_UNKNOWN */ 23330c16b537SWarner Losh 23340c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_decompressBegin(ZSTD_DCtx* dctx); 23350c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_decompressBegin_usingDict(ZSTD_DCtx* dctx, const void* dict, size_t dictSize); 23360c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_decompressBegin_usingDDict(ZSTD_DCtx* dctx, const ZSTD_DDict* ddict); 23370c16b537SWarner Losh 23380c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_nextSrcSizeToDecompress(ZSTD_DCtx* dctx); 23390c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_decompressContinue(ZSTD_DCtx* dctx, void* dst, size_t dstCapacity, const void* src, size_t srcSize); 23400c16b537SWarner Losh 23410c16b537SWarner Losh /* misc */ 23420c16b537SWarner Losh ZSTDLIB_API void ZSTD_copyDCtx(ZSTD_DCtx* dctx, const ZSTD_DCtx* preparedDCtx); 23430c16b537SWarner Losh typedef enum { ZSTDnit_frameHeader, ZSTDnit_blockHeader, ZSTDnit_block, ZSTDnit_lastBlock, ZSTDnit_checksum, ZSTDnit_skippableFrame } ZSTD_nextInputType_e; 
23440c16b537SWarner Losh ZSTDLIB_API ZSTD_nextInputType_e ZSTD_nextInputType(ZSTD_DCtx* dctx); 23450c16b537SWarner Losh 23460c16b537SWarner Losh 23470c16b537SWarner Losh 23480c16b537SWarner Losh 23490c16b537SWarner Losh /* ============================ */ 23500c16b537SWarner Losh /** Block level API */ 23510c16b537SWarner Losh /* ============================ */ 23520c16b537SWarner Losh 23530c16b537SWarner Losh /*! 23540c16b537SWarner Losh Block functions produce and decode raw zstd blocks, without frame metadata. 23559cbefe25SConrad Meyer Frame metadata cost is typically ~12 bytes, which can be non-negligible for very small blocks (< 100 bytes). 23569cbefe25SConrad Meyer But users will have to take charge of the metadata needed to regenerate data, such as compressed and content sizes. 23570c16b537SWarner Losh 23580c16b537SWarner Losh A few rules to respect : 23590c16b537SWarner Losh - Compressing and decompressing require a context structure 23600c16b537SWarner Losh + Use ZSTD_createCCtx() and ZSTD_createDCtx() 23610c16b537SWarner Losh - It is necessary to init context before starting 23620c16b537SWarner Losh + compression : any ZSTD_compressBegin*() variant, including with dictionary 23630c16b537SWarner Losh + decompression : any ZSTD_decompressBegin*() variant, including with dictionary 23640c16b537SWarner Losh + copyCCtx() and copyDCtx() can be used too 23650c16b537SWarner Losh - Block size is limited, it must be <= ZSTD_getBlockSize() <= ZSTD_BLOCKSIZE_MAX == 128 KB 23660c16b537SWarner Losh + If input is larger than a block size, it's necessary to split input data into multiple blocks 23679cbefe25SConrad Meyer + For inputs larger than a single block, consider using regular ZSTD_compress() instead. 23689cbefe25SConrad Meyer Frame metadata is not that costly, and quickly becomes negligible as source size grows larger than a block. 23699cbefe25SConrad Meyer - When a block is considered not compressible enough, ZSTD_compressBlock() result will be 0 (zero) ! 
23709cbefe25SConrad Meyer ===> In which case, nothing is produced into `dst` ! 23719cbefe25SConrad Meyer + User __must__ test for such outcome and deal directly with uncompressed data 23729cbefe25SConrad Meyer + A block cannot be declared incompressible if ZSTD_compressBlock() return value was != 0. 23739cbefe25SConrad Meyer Doing so would mess up the statistics history, leading to potential data corruption. 23749cbefe25SConrad Meyer + ZSTD_decompressBlock() _doesn't accept uncompressed data as input_ !! 23750c16b537SWarner Losh + In case of multiple successive blocks, should some of them be uncompressed, 23760c16b537SWarner Losh decoder must be informed of their existence in order to follow proper history. 23770c16b537SWarner Losh Use ZSTD_insertBlock() for such a case. 23780c16b537SWarner Losh */ 23790c16b537SWarner Losh 23800c16b537SWarner Losh /*===== Raw zstd block functions =====*/ 23810c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_getBlockSize (const ZSTD_CCtx* cctx); 23820c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_compressBlock (ZSTD_CCtx* cctx, void* dst, size_t dstCapacity, const void* src, size_t srcSize); 23830c16b537SWarner Losh ZSTDLIB_API size_t ZSTD_decompressBlock(ZSTD_DCtx* dctx, void* dst, size_t dstCapacity, const void* src, size_t srcSize); 238419fcbaf1SConrad Meyer ZSTDLIB_API size_t ZSTD_insertBlock (ZSTD_DCtx* dctx, const void* blockStart, size_t blockSize); /**< insert uncompressed block into `dctx` history. Useful for multi-blocks decompression. */ 23850c16b537SWarner Losh 23860c16b537SWarner Losh 23870c16b537SWarner Losh #endif /* ZSTD_H_ZSTD_STATIC_LINKING_ONLY */ 23880c16b537SWarner Losh 23890c16b537SWarner Losh #if defined (__cplusplus) 23900c16b537SWarner Losh } 23910c16b537SWarner Losh #endif 2392