xref: /freebsd/sys/contrib/zstd/lib/compress/zstd_cwksp.h (revision f7cd7fe51c4140960ebea00410ed62894f5625d1)
19cbefe25SConrad Meyer /*
237f1f268SConrad Meyer  * Copyright (c) 2016-2020, Yann Collet, Facebook, Inc.
39cbefe25SConrad Meyer  * All rights reserved.
49cbefe25SConrad Meyer  *
59cbefe25SConrad Meyer  * This source code is licensed under both the BSD-style license (found in the
69cbefe25SConrad Meyer  * LICENSE file in the root directory of this source tree) and the GPLv2 (found
79cbefe25SConrad Meyer  * in the COPYING file in the root directory of this source tree).
89cbefe25SConrad Meyer  * You may select, at your option, one of the above-listed licenses.
99cbefe25SConrad Meyer  */
109cbefe25SConrad Meyer 
119cbefe25SConrad Meyer #ifndef ZSTD_CWKSP_H
129cbefe25SConrad Meyer #define ZSTD_CWKSP_H
139cbefe25SConrad Meyer 
149cbefe25SConrad Meyer /*-*************************************
159cbefe25SConrad Meyer *  Dependencies
169cbefe25SConrad Meyer ***************************************/
1737f1f268SConrad Meyer #include "../common/zstd_internal.h"
189cbefe25SConrad Meyer 
199cbefe25SConrad Meyer #if defined (__cplusplus)
209cbefe25SConrad Meyer extern "C" {
219cbefe25SConrad Meyer #endif
229cbefe25SConrad Meyer 
239cbefe25SConrad Meyer /*-*************************************
249cbefe25SConrad Meyer *  Constants
259cbefe25SConrad Meyer ***************************************/
269cbefe25SConrad Meyer 
/* The workspace acts as a small arena allocator of its own. When running
 * under ASAN, each internal element carved out of the workspace is therefore
 * surrounded by redzones, so that ASAN can catch overruns that leave an
 * object but still land inside the workspace.
 *
 * This is the size, in bytes, of one such redzone. It may be overridden by
 * defining the macro before this point.
 */
#if !defined(ZSTD_CWKSP_ASAN_REDZONE_SIZE)
#  define ZSTD_CWKSP_ASAN_REDZONE_SIZE 128
#endif
379cbefe25SConrad Meyer 
389cbefe25SConrad Meyer /*-*************************************
399cbefe25SConrad Meyer *  Structures
409cbefe25SConrad Meyer ***************************************/
/**
 * Allocation phases of a workspace, listed in the order in which they are
 * entered. While allocating, the phase only ever moves forward.
 */
typedef enum {
    ZSTD_cwksp_alloc_objects = 0,  /* objects, reserved from the bottom of the workspace */
    ZSTD_cwksp_alloc_buffers = 1,  /* unaligned buffers, reserved from the top */
    ZSTD_cwksp_alloc_aligned = 2   /* aligned allocations and tables */
} ZSTD_cwksp_alloc_phase_e;
469cbefe25SConrad Meyer 
/**
 * Describes how the memory backing a workspace was obtained: either it is
 * statically allocated (and will not necessarily ever be freed), or it is
 * dynamically allocated and a well-formed caller can be expected to free it.
 */
typedef enum {
    ZSTD_cwksp_dynamic_alloc = 0,  /* dynamically allocated; expected to be freed */
    ZSTD_cwksp_static_alloc  = 1   /* statically allocated; may never be freed */
} ZSTD_cwksp_static_alloc_e;
56*f7cd7fe5SConrad Meyer 
57*f7cd7fe5SConrad Meyer /**
 * Zstd fits all its internal datastructures into a single contiguous buffer,
599cbefe25SConrad Meyer  * so that it only needs to perform a single OS allocation (or so that a buffer
609cbefe25SConrad Meyer  * can be provided to it and it can perform no allocations at all). This buffer
619cbefe25SConrad Meyer  * is called the workspace.
629cbefe25SConrad Meyer  *
639cbefe25SConrad Meyer  * Several optimizations complicate that process of allocating memory ranges
649cbefe25SConrad Meyer  * from this workspace for each internal datastructure:
659cbefe25SConrad Meyer  *
669cbefe25SConrad Meyer  * - These different internal datastructures have different setup requirements:
679cbefe25SConrad Meyer  *
689cbefe25SConrad Meyer  *   - The static objects need to be cleared once and can then be trivially
699cbefe25SConrad Meyer  *     reused for each compression.
709cbefe25SConrad Meyer  *
719cbefe25SConrad Meyer  *   - Various buffers don't need to be initialized at all--they are always
729cbefe25SConrad Meyer  *     written into before they're read.
739cbefe25SConrad Meyer  *
749cbefe25SConrad Meyer  *   - The matchstate tables have a unique requirement that they don't need
759cbefe25SConrad Meyer  *     their memory to be totally cleared, but they do need the memory to have
 *     some bound, i.e., a guarantee that all values in the memory they've been
 *     allocated are less than some maximum value (which is the starting value
789cbefe25SConrad Meyer  *     for the indices that they will then use for compression). When this
799cbefe25SConrad Meyer  *     guarantee is provided to them, they can use the memory without any setup
809cbefe25SConrad Meyer  *     work. When it can't, they have to clear the area.
819cbefe25SConrad Meyer  *
829cbefe25SConrad Meyer  * - These buffers also have different alignment requirements.
839cbefe25SConrad Meyer  *
849cbefe25SConrad Meyer  * - We would like to reuse the objects in the workspace for multiple
859cbefe25SConrad Meyer  *   compressions without having to perform any expensive reallocation or
869cbefe25SConrad Meyer  *   reinitialization work.
879cbefe25SConrad Meyer  *
889cbefe25SConrad Meyer  * - We would like to be able to efficiently reuse the workspace across
899cbefe25SConrad Meyer  *   multiple compressions **even when the compression parameters change** and
909cbefe25SConrad Meyer  *   we need to resize some of the objects (where possible).
919cbefe25SConrad Meyer  *
929cbefe25SConrad Meyer  * To attempt to manage this buffer, given these constraints, the ZSTD_cwksp
939cbefe25SConrad Meyer  * abstraction was created. It works as follows:
949cbefe25SConrad Meyer  *
959cbefe25SConrad Meyer  * Workspace Layout:
969cbefe25SConrad Meyer  *
979cbefe25SConrad Meyer  * [                        ... workspace ...                         ]
989cbefe25SConrad Meyer  * [objects][tables ... ->] free space [<- ... aligned][<- ... buffers]
999cbefe25SConrad Meyer  *
1009cbefe25SConrad Meyer  * The various objects that live in the workspace are divided into the
1019cbefe25SConrad Meyer  * following categories, and are allocated separately:
1029cbefe25SConrad Meyer  *
1039cbefe25SConrad Meyer  * - Static objects: this is optionally the enclosing ZSTD_CCtx or ZSTD_CDict,
1049cbefe25SConrad Meyer  *   so that literally everything fits in a single buffer. Note: if present,
105*f7cd7fe5SConrad Meyer  *   this must be the first object in the workspace, since ZSTD_customFree{CCtx,
1069cbefe25SConrad Meyer  *   CDict}() rely on a pointer comparison to see whether one or two frees are
1079cbefe25SConrad Meyer  *   required.
1089cbefe25SConrad Meyer  *
1099cbefe25SConrad Meyer  * - Fixed size objects: these are fixed-size, fixed-count objects that are
1109cbefe25SConrad Meyer  *   nonetheless "dynamically" allocated in the workspace so that we can
1119cbefe25SConrad Meyer  *   control how they're initialized separately from the broader ZSTD_CCtx.
1129cbefe25SConrad Meyer  *   Examples:
1139cbefe25SConrad Meyer  *   - Entropy Workspace
1149cbefe25SConrad Meyer  *   - 2 x ZSTD_compressedBlockState_t
1159cbefe25SConrad Meyer  *   - CDict dictionary contents
1169cbefe25SConrad Meyer  *
1179cbefe25SConrad Meyer  * - Tables: these are any of several different datastructures (hash tables,
1189cbefe25SConrad Meyer  *   chain tables, binary trees) that all respect a common format: they are
1199cbefe25SConrad Meyer  *   uint32_t arrays, all of whose values are between 0 and (nextSrc - base).
1209cbefe25SConrad Meyer  *   Their sizes depend on the cparams.
1219cbefe25SConrad Meyer  *
1229cbefe25SConrad Meyer  * - Aligned: these buffers are used for various purposes that require 4 byte
1239cbefe25SConrad Meyer  *   alignment, but don't require any initialization before they're used.
1249cbefe25SConrad Meyer  *
1259cbefe25SConrad Meyer  * - Buffers: these buffers are used for various purposes that don't require
1269cbefe25SConrad Meyer  *   any alignment or initialization before they're used. This means they can
1279cbefe25SConrad Meyer  *   be moved around at no cost for a new compression.
1289cbefe25SConrad Meyer  *
1299cbefe25SConrad Meyer  * Allocating Memory:
1309cbefe25SConrad Meyer  *
1319cbefe25SConrad Meyer  * The various types of objects must be allocated in order, so they can be
1329cbefe25SConrad Meyer  * correctly packed into the workspace buffer. That order is:
1339cbefe25SConrad Meyer  *
1349cbefe25SConrad Meyer  * 1. Objects
1359cbefe25SConrad Meyer  * 2. Buffers
1369cbefe25SConrad Meyer  * 3. Aligned
1379cbefe25SConrad Meyer  * 4. Tables
1389cbefe25SConrad Meyer  *
1399cbefe25SConrad Meyer  * Attempts to reserve objects of different types out of order will fail.
1409cbefe25SConrad Meyer  */
1419cbefe25SConrad Meyer typedef struct {
1429cbefe25SConrad Meyer     void* workspace;
1439cbefe25SConrad Meyer     void* workspaceEnd;
1449cbefe25SConrad Meyer 
1459cbefe25SConrad Meyer     void* objectEnd;
1469cbefe25SConrad Meyer     void* tableEnd;
1479cbefe25SConrad Meyer     void* tableValidEnd;
1489cbefe25SConrad Meyer     void* allocStart;
1499cbefe25SConrad Meyer 
150*f7cd7fe5SConrad Meyer     BYTE allocFailed;
1519cbefe25SConrad Meyer     int workspaceOversizedDuration;
1529cbefe25SConrad Meyer     ZSTD_cwksp_alloc_phase_e phase;
153*f7cd7fe5SConrad Meyer     ZSTD_cwksp_static_alloc_e isStatic;
1549cbefe25SConrad Meyer } ZSTD_cwksp;
1559cbefe25SConrad Meyer 
1569cbefe25SConrad Meyer /*-*************************************
1579cbefe25SConrad Meyer *  Functions
1589cbefe25SConrad Meyer ***************************************/
1599cbefe25SConrad Meyer 
1609cbefe25SConrad Meyer MEM_STATIC size_t ZSTD_cwksp_available_space(ZSTD_cwksp* ws);
1619cbefe25SConrad Meyer 
1629cbefe25SConrad Meyer MEM_STATIC void ZSTD_cwksp_assert_internal_consistency(ZSTD_cwksp* ws) {
1639cbefe25SConrad Meyer     (void)ws;
1649cbefe25SConrad Meyer     assert(ws->workspace <= ws->objectEnd);
1659cbefe25SConrad Meyer     assert(ws->objectEnd <= ws->tableEnd);
1669cbefe25SConrad Meyer     assert(ws->objectEnd <= ws->tableValidEnd);
1679cbefe25SConrad Meyer     assert(ws->tableEnd <= ws->allocStart);
1689cbefe25SConrad Meyer     assert(ws->tableValidEnd <= ws->allocStart);
1699cbefe25SConrad Meyer     assert(ws->allocStart <= ws->workspaceEnd);
1709cbefe25SConrad Meyer }
1719cbefe25SConrad Meyer 
1729cbefe25SConrad Meyer /**
1739cbefe25SConrad Meyer  * Align must be a power of 2.
1749cbefe25SConrad Meyer  */
1759cbefe25SConrad Meyer MEM_STATIC size_t ZSTD_cwksp_align(size_t size, size_t const align) {
1769cbefe25SConrad Meyer     size_t const mask = align - 1;
1779cbefe25SConrad Meyer     assert((align & mask) == 0);
1789cbefe25SConrad Meyer     return (size + mask) & ~mask;
1799cbefe25SConrad Meyer }
1809cbefe25SConrad Meyer 
1819cbefe25SConrad Meyer /**
1829cbefe25SConrad Meyer  * Use this to determine how much space in the workspace we will consume to
1839cbefe25SConrad Meyer  * allocate this object. (Normally it should be exactly the size of the object,
1849cbefe25SConrad Meyer  * but under special conditions, like ASAN, where we pad each object, it might
1859cbefe25SConrad Meyer  * be larger.)
1869cbefe25SConrad Meyer  *
1879cbefe25SConrad Meyer  * Since tables aren't currently redzoned, you don't need to call through this
1889cbefe25SConrad Meyer  * to figure out how much space you need for the matchState tables. Everything
1899cbefe25SConrad Meyer  * else is though.
1909cbefe25SConrad Meyer  */
1919cbefe25SConrad Meyer MEM_STATIC size_t ZSTD_cwksp_alloc_size(size_t size) {
192*f7cd7fe5SConrad Meyer     if (size == 0)
193*f7cd7fe5SConrad Meyer         return 0;
194*f7cd7fe5SConrad Meyer #if ZSTD_ADDRESS_SANITIZER && !defined (ZSTD_ASAN_DONT_POISON_WORKSPACE)
1959cbefe25SConrad Meyer     return size + 2 * ZSTD_CWKSP_ASAN_REDZONE_SIZE;
1969cbefe25SConrad Meyer #else
1979cbefe25SConrad Meyer     return size;
1989cbefe25SConrad Meyer #endif
1999cbefe25SConrad Meyer }
2009cbefe25SConrad Meyer 
2019cbefe25SConrad Meyer MEM_STATIC void ZSTD_cwksp_internal_advance_phase(
2029cbefe25SConrad Meyer         ZSTD_cwksp* ws, ZSTD_cwksp_alloc_phase_e phase) {
2039cbefe25SConrad Meyer     assert(phase >= ws->phase);
2049cbefe25SConrad Meyer     if (phase > ws->phase) {
2059cbefe25SConrad Meyer         if (ws->phase < ZSTD_cwksp_alloc_buffers &&
2069cbefe25SConrad Meyer                 phase >= ZSTD_cwksp_alloc_buffers) {
2079cbefe25SConrad Meyer             ws->tableValidEnd = ws->objectEnd;
2089cbefe25SConrad Meyer         }
2099cbefe25SConrad Meyer         if (ws->phase < ZSTD_cwksp_alloc_aligned &&
2109cbefe25SConrad Meyer                 phase >= ZSTD_cwksp_alloc_aligned) {
2119cbefe25SConrad Meyer             /* If unaligned allocations down from a too-large top have left us
2129cbefe25SConrad Meyer              * unaligned, we need to realign our alloc ptr. Technically, this
2139cbefe25SConrad Meyer              * can consume space that is unaccounted for in the neededSpace
2149cbefe25SConrad Meyer              * calculation. However, I believe this can only happen when the
2159cbefe25SConrad Meyer              * workspace is too large, and specifically when it is too large
2169cbefe25SConrad Meyer              * by a larger margin than the space that will be consumed. */
2179cbefe25SConrad Meyer             /* TODO: cleaner, compiler warning friendly way to do this??? */
2189cbefe25SConrad Meyer             ws->allocStart = (BYTE*)ws->allocStart - ((size_t)ws->allocStart & (sizeof(U32)-1));
2199cbefe25SConrad Meyer             if (ws->allocStart < ws->tableValidEnd) {
2209cbefe25SConrad Meyer                 ws->tableValidEnd = ws->allocStart;
2219cbefe25SConrad Meyer             }
2229cbefe25SConrad Meyer         }
2239cbefe25SConrad Meyer         ws->phase = phase;
2249cbefe25SConrad Meyer     }
2259cbefe25SConrad Meyer }
2269cbefe25SConrad Meyer 
2279cbefe25SConrad Meyer /**
2289cbefe25SConrad Meyer  * Returns whether this object/buffer/etc was allocated in this workspace.
2299cbefe25SConrad Meyer  */
2309cbefe25SConrad Meyer MEM_STATIC int ZSTD_cwksp_owns_buffer(const ZSTD_cwksp* ws, const void* ptr) {
2319cbefe25SConrad Meyer     return (ptr != NULL) && (ws->workspace <= ptr) && (ptr <= ws->workspaceEnd);
2329cbefe25SConrad Meyer }
2339cbefe25SConrad Meyer 
2349cbefe25SConrad Meyer /**
2359cbefe25SConrad Meyer  * Internal function. Do not use directly.
2369cbefe25SConrad Meyer  */
2379cbefe25SConrad Meyer MEM_STATIC void* ZSTD_cwksp_reserve_internal(
2389cbefe25SConrad Meyer         ZSTD_cwksp* ws, size_t bytes, ZSTD_cwksp_alloc_phase_e phase) {
2399cbefe25SConrad Meyer     void* alloc;
2409cbefe25SConrad Meyer     void* bottom = ws->tableEnd;
2419cbefe25SConrad Meyer     ZSTD_cwksp_internal_advance_phase(ws, phase);
2429cbefe25SConrad Meyer     alloc = (BYTE *)ws->allocStart - bytes;
2439cbefe25SConrad Meyer 
244*f7cd7fe5SConrad Meyer     if (bytes == 0)
245*f7cd7fe5SConrad Meyer         return NULL;
246*f7cd7fe5SConrad Meyer 
247*f7cd7fe5SConrad Meyer #if ZSTD_ADDRESS_SANITIZER && !defined (ZSTD_ASAN_DONT_POISON_WORKSPACE)
2489cbefe25SConrad Meyer     /* over-reserve space */
2499cbefe25SConrad Meyer     alloc = (BYTE *)alloc - 2 * ZSTD_CWKSP_ASAN_REDZONE_SIZE;
2509cbefe25SConrad Meyer #endif
2519cbefe25SConrad Meyer 
2529cbefe25SConrad Meyer     DEBUGLOG(5, "cwksp: reserving %p %zd bytes, %zd bytes remaining",
2539cbefe25SConrad Meyer         alloc, bytes, ZSTD_cwksp_available_space(ws) - bytes);
2549cbefe25SConrad Meyer     ZSTD_cwksp_assert_internal_consistency(ws);
2559cbefe25SConrad Meyer     assert(alloc >= bottom);
2569cbefe25SConrad Meyer     if (alloc < bottom) {
2579cbefe25SConrad Meyer         DEBUGLOG(4, "cwksp: alloc failed!");
2589cbefe25SConrad Meyer         ws->allocFailed = 1;
2599cbefe25SConrad Meyer         return NULL;
2609cbefe25SConrad Meyer     }
2619cbefe25SConrad Meyer     if (alloc < ws->tableValidEnd) {
2629cbefe25SConrad Meyer         ws->tableValidEnd = alloc;
2639cbefe25SConrad Meyer     }
2649cbefe25SConrad Meyer     ws->allocStart = alloc;
2659cbefe25SConrad Meyer 
266*f7cd7fe5SConrad Meyer #if ZSTD_ADDRESS_SANITIZER && !defined (ZSTD_ASAN_DONT_POISON_WORKSPACE)
2679cbefe25SConrad Meyer     /* Move alloc so there's ZSTD_CWKSP_ASAN_REDZONE_SIZE unused space on
2689cbefe25SConrad Meyer      * either size. */
2699cbefe25SConrad Meyer     alloc = (BYTE *)alloc + ZSTD_CWKSP_ASAN_REDZONE_SIZE;
270*f7cd7fe5SConrad Meyer     if (ws->isStatic == ZSTD_cwksp_dynamic_alloc) {
2719cbefe25SConrad Meyer         __asan_unpoison_memory_region(alloc, bytes);
272*f7cd7fe5SConrad Meyer     }
2739cbefe25SConrad Meyer #endif
2749cbefe25SConrad Meyer 
2759cbefe25SConrad Meyer     return alloc;
2769cbefe25SConrad Meyer }
2779cbefe25SConrad Meyer 
2789cbefe25SConrad Meyer /**
2799cbefe25SConrad Meyer  * Reserves and returns unaligned memory.
2809cbefe25SConrad Meyer  */
2819cbefe25SConrad Meyer MEM_STATIC BYTE* ZSTD_cwksp_reserve_buffer(ZSTD_cwksp* ws, size_t bytes) {
2829cbefe25SConrad Meyer     return (BYTE*)ZSTD_cwksp_reserve_internal(ws, bytes, ZSTD_cwksp_alloc_buffers);
2839cbefe25SConrad Meyer }
2849cbefe25SConrad Meyer 
2859cbefe25SConrad Meyer /**
2869cbefe25SConrad Meyer  * Reserves and returns memory sized on and aligned on sizeof(unsigned).
2879cbefe25SConrad Meyer  */
2889cbefe25SConrad Meyer MEM_STATIC void* ZSTD_cwksp_reserve_aligned(ZSTD_cwksp* ws, size_t bytes) {
2899cbefe25SConrad Meyer     assert((bytes & (sizeof(U32)-1)) == 0);
2909cbefe25SConrad Meyer     return ZSTD_cwksp_reserve_internal(ws, ZSTD_cwksp_align(bytes, sizeof(U32)), ZSTD_cwksp_alloc_aligned);
2919cbefe25SConrad Meyer }
2929cbefe25SConrad Meyer 
2939cbefe25SConrad Meyer /**
2949cbefe25SConrad Meyer  * Aligned on sizeof(unsigned). These buffers have the special property that
2959cbefe25SConrad Meyer  * their values remain constrained, allowing us to re-use them without
2969cbefe25SConrad Meyer  * memset()-ing them.
2979cbefe25SConrad Meyer  */
2989cbefe25SConrad Meyer MEM_STATIC void* ZSTD_cwksp_reserve_table(ZSTD_cwksp* ws, size_t bytes) {
2999cbefe25SConrad Meyer     const ZSTD_cwksp_alloc_phase_e phase = ZSTD_cwksp_alloc_aligned;
3009cbefe25SConrad Meyer     void* alloc = ws->tableEnd;
3019cbefe25SConrad Meyer     void* end = (BYTE *)alloc + bytes;
3029cbefe25SConrad Meyer     void* top = ws->allocStart;
3039cbefe25SConrad Meyer 
3049cbefe25SConrad Meyer     DEBUGLOG(5, "cwksp: reserving %p table %zd bytes, %zd bytes remaining",
3059cbefe25SConrad Meyer         alloc, bytes, ZSTD_cwksp_available_space(ws) - bytes);
3069cbefe25SConrad Meyer     assert((bytes & (sizeof(U32)-1)) == 0);
3079cbefe25SConrad Meyer     ZSTD_cwksp_internal_advance_phase(ws, phase);
3089cbefe25SConrad Meyer     ZSTD_cwksp_assert_internal_consistency(ws);
3099cbefe25SConrad Meyer     assert(end <= top);
3109cbefe25SConrad Meyer     if (end > top) {
3119cbefe25SConrad Meyer         DEBUGLOG(4, "cwksp: table alloc failed!");
3129cbefe25SConrad Meyer         ws->allocFailed = 1;
3139cbefe25SConrad Meyer         return NULL;
3149cbefe25SConrad Meyer     }
3159cbefe25SConrad Meyer     ws->tableEnd = end;
3169cbefe25SConrad Meyer 
317*f7cd7fe5SConrad Meyer #if ZSTD_ADDRESS_SANITIZER && !defined (ZSTD_ASAN_DONT_POISON_WORKSPACE)
318*f7cd7fe5SConrad Meyer     if (ws->isStatic == ZSTD_cwksp_dynamic_alloc) {
3199cbefe25SConrad Meyer         __asan_unpoison_memory_region(alloc, bytes);
320*f7cd7fe5SConrad Meyer     }
3219cbefe25SConrad Meyer #endif
3229cbefe25SConrad Meyer 
3239cbefe25SConrad Meyer     return alloc;
3249cbefe25SConrad Meyer }
3259cbefe25SConrad Meyer 
3269cbefe25SConrad Meyer /**
3279cbefe25SConrad Meyer  * Aligned on sizeof(void*).
3289cbefe25SConrad Meyer  */
3299cbefe25SConrad Meyer MEM_STATIC void* ZSTD_cwksp_reserve_object(ZSTD_cwksp* ws, size_t bytes) {
3309cbefe25SConrad Meyer     size_t roundedBytes = ZSTD_cwksp_align(bytes, sizeof(void*));
3319cbefe25SConrad Meyer     void* alloc = ws->objectEnd;
3329cbefe25SConrad Meyer     void* end = (BYTE*)alloc + roundedBytes;
3339cbefe25SConrad Meyer 
334*f7cd7fe5SConrad Meyer #if ZSTD_ADDRESS_SANITIZER && !defined (ZSTD_ASAN_DONT_POISON_WORKSPACE)
3359cbefe25SConrad Meyer     /* over-reserve space */
3369cbefe25SConrad Meyer     end = (BYTE *)end + 2 * ZSTD_CWKSP_ASAN_REDZONE_SIZE;
3379cbefe25SConrad Meyer #endif
3389cbefe25SConrad Meyer 
3399cbefe25SConrad Meyer     DEBUGLOG(5,
3409cbefe25SConrad Meyer         "cwksp: reserving %p object %zd bytes (rounded to %zd), %zd bytes remaining",
3419cbefe25SConrad Meyer         alloc, bytes, roundedBytes, ZSTD_cwksp_available_space(ws) - roundedBytes);
3429cbefe25SConrad Meyer     assert(((size_t)alloc & (sizeof(void*)-1)) == 0);
3439cbefe25SConrad Meyer     assert((bytes & (sizeof(void*)-1)) == 0);
3449cbefe25SConrad Meyer     ZSTD_cwksp_assert_internal_consistency(ws);
3459cbefe25SConrad Meyer     /* we must be in the first phase, no advance is possible */
3469cbefe25SConrad Meyer     if (ws->phase != ZSTD_cwksp_alloc_objects || end > ws->workspaceEnd) {
3479cbefe25SConrad Meyer         DEBUGLOG(4, "cwksp: object alloc failed!");
3489cbefe25SConrad Meyer         ws->allocFailed = 1;
3499cbefe25SConrad Meyer         return NULL;
3509cbefe25SConrad Meyer     }
3519cbefe25SConrad Meyer     ws->objectEnd = end;
3529cbefe25SConrad Meyer     ws->tableEnd = end;
3539cbefe25SConrad Meyer     ws->tableValidEnd = end;
3549cbefe25SConrad Meyer 
355*f7cd7fe5SConrad Meyer #if ZSTD_ADDRESS_SANITIZER && !defined (ZSTD_ASAN_DONT_POISON_WORKSPACE)
3569cbefe25SConrad Meyer     /* Move alloc so there's ZSTD_CWKSP_ASAN_REDZONE_SIZE unused space on
3579cbefe25SConrad Meyer      * either size. */
3589cbefe25SConrad Meyer     alloc = (BYTE *)alloc + ZSTD_CWKSP_ASAN_REDZONE_SIZE;
359*f7cd7fe5SConrad Meyer     if (ws->isStatic == ZSTD_cwksp_dynamic_alloc) {
3609cbefe25SConrad Meyer         __asan_unpoison_memory_region(alloc, bytes);
361*f7cd7fe5SConrad Meyer     }
3629cbefe25SConrad Meyer #endif
3639cbefe25SConrad Meyer 
3649cbefe25SConrad Meyer     return alloc;
3659cbefe25SConrad Meyer }
3669cbefe25SConrad Meyer 
3679cbefe25SConrad Meyer MEM_STATIC void ZSTD_cwksp_mark_tables_dirty(ZSTD_cwksp* ws) {
3689cbefe25SConrad Meyer     DEBUGLOG(4, "cwksp: ZSTD_cwksp_mark_tables_dirty");
3699cbefe25SConrad Meyer 
370*f7cd7fe5SConrad Meyer #if ZSTD_MEMORY_SANITIZER && !defined (ZSTD_MSAN_DONT_POISON_WORKSPACE)
3719cbefe25SConrad Meyer     /* To validate that the table re-use logic is sound, and that we don't
3729cbefe25SConrad Meyer      * access table space that we haven't cleaned, we re-"poison" the table
3739cbefe25SConrad Meyer      * space every time we mark it dirty. */
3749cbefe25SConrad Meyer     {
3759cbefe25SConrad Meyer         size_t size = (BYTE*)ws->tableValidEnd - (BYTE*)ws->objectEnd;
3769cbefe25SConrad Meyer         assert(__msan_test_shadow(ws->objectEnd, size) == -1);
3779cbefe25SConrad Meyer         __msan_poison(ws->objectEnd, size);
3789cbefe25SConrad Meyer     }
3799cbefe25SConrad Meyer #endif
3809cbefe25SConrad Meyer 
3819cbefe25SConrad Meyer     assert(ws->tableValidEnd >= ws->objectEnd);
3829cbefe25SConrad Meyer     assert(ws->tableValidEnd <= ws->allocStart);
3839cbefe25SConrad Meyer     ws->tableValidEnd = ws->objectEnd;
3849cbefe25SConrad Meyer     ZSTD_cwksp_assert_internal_consistency(ws);
3859cbefe25SConrad Meyer }
3869cbefe25SConrad Meyer 
3879cbefe25SConrad Meyer MEM_STATIC void ZSTD_cwksp_mark_tables_clean(ZSTD_cwksp* ws) {
3889cbefe25SConrad Meyer     DEBUGLOG(4, "cwksp: ZSTD_cwksp_mark_tables_clean");
3899cbefe25SConrad Meyer     assert(ws->tableValidEnd >= ws->objectEnd);
3909cbefe25SConrad Meyer     assert(ws->tableValidEnd <= ws->allocStart);
3919cbefe25SConrad Meyer     if (ws->tableValidEnd < ws->tableEnd) {
3929cbefe25SConrad Meyer         ws->tableValidEnd = ws->tableEnd;
3939cbefe25SConrad Meyer     }
3949cbefe25SConrad Meyer     ZSTD_cwksp_assert_internal_consistency(ws);
3959cbefe25SConrad Meyer }
3969cbefe25SConrad Meyer 
3979cbefe25SConrad Meyer /**
3989cbefe25SConrad Meyer  * Zero the part of the allocated tables not already marked clean.
3999cbefe25SConrad Meyer  */
4009cbefe25SConrad Meyer MEM_STATIC void ZSTD_cwksp_clean_tables(ZSTD_cwksp* ws) {
4019cbefe25SConrad Meyer     DEBUGLOG(4, "cwksp: ZSTD_cwksp_clean_tables");
4029cbefe25SConrad Meyer     assert(ws->tableValidEnd >= ws->objectEnd);
4039cbefe25SConrad Meyer     assert(ws->tableValidEnd <= ws->allocStart);
4049cbefe25SConrad Meyer     if (ws->tableValidEnd < ws->tableEnd) {
405*f7cd7fe5SConrad Meyer         ZSTD_memset(ws->tableValidEnd, 0, (BYTE*)ws->tableEnd - (BYTE*)ws->tableValidEnd);
4069cbefe25SConrad Meyer     }
4079cbefe25SConrad Meyer     ZSTD_cwksp_mark_tables_clean(ws);
4089cbefe25SConrad Meyer }
4099cbefe25SConrad Meyer 
4109cbefe25SConrad Meyer /**
4119cbefe25SConrad Meyer  * Invalidates table allocations.
4129cbefe25SConrad Meyer  * All other allocations remain valid.
4139cbefe25SConrad Meyer  */
4149cbefe25SConrad Meyer MEM_STATIC void ZSTD_cwksp_clear_tables(ZSTD_cwksp* ws) {
4159cbefe25SConrad Meyer     DEBUGLOG(4, "cwksp: clearing tables!");
4169cbefe25SConrad Meyer 
417*f7cd7fe5SConrad Meyer #if ZSTD_ADDRESS_SANITIZER && !defined (ZSTD_ASAN_DONT_POISON_WORKSPACE)
418*f7cd7fe5SConrad Meyer     /* We don't do this when the workspace is statically allocated, because
419*f7cd7fe5SConrad Meyer      * when that is the case, we have no capability to hook into the end of the
420*f7cd7fe5SConrad Meyer      * workspace's lifecycle to unpoison the memory.
421*f7cd7fe5SConrad Meyer      */
422*f7cd7fe5SConrad Meyer     if (ws->isStatic == ZSTD_cwksp_dynamic_alloc) {
4239cbefe25SConrad Meyer         size_t size = (BYTE*)ws->tableValidEnd - (BYTE*)ws->objectEnd;
4249cbefe25SConrad Meyer         __asan_poison_memory_region(ws->objectEnd, size);
4259cbefe25SConrad Meyer     }
4269cbefe25SConrad Meyer #endif
4279cbefe25SConrad Meyer 
4289cbefe25SConrad Meyer     ws->tableEnd = ws->objectEnd;
4299cbefe25SConrad Meyer     ZSTD_cwksp_assert_internal_consistency(ws);
4309cbefe25SConrad Meyer }
4319cbefe25SConrad Meyer 
4329cbefe25SConrad Meyer /**
4339cbefe25SConrad Meyer  * Invalidates all buffer, aligned, and table allocations.
4349cbefe25SConrad Meyer  * Object allocations remain valid.
4359cbefe25SConrad Meyer  */
4369cbefe25SConrad Meyer MEM_STATIC void ZSTD_cwksp_clear(ZSTD_cwksp* ws) {
4379cbefe25SConrad Meyer     DEBUGLOG(4, "cwksp: clearing!");
4389cbefe25SConrad Meyer 
439*f7cd7fe5SConrad Meyer #if ZSTD_MEMORY_SANITIZER && !defined (ZSTD_MSAN_DONT_POISON_WORKSPACE)
4409cbefe25SConrad Meyer     /* To validate that the context re-use logic is sound, and that we don't
4419cbefe25SConrad Meyer      * access stuff that this compression hasn't initialized, we re-"poison"
4429cbefe25SConrad Meyer      * the workspace (or at least the non-static, non-table parts of it)
4439cbefe25SConrad Meyer      * every time we start a new compression. */
4449cbefe25SConrad Meyer     {
4459cbefe25SConrad Meyer         size_t size = (BYTE*)ws->workspaceEnd - (BYTE*)ws->tableValidEnd;
4469cbefe25SConrad Meyer         __msan_poison(ws->tableValidEnd, size);
4479cbefe25SConrad Meyer     }
4489cbefe25SConrad Meyer #endif
4499cbefe25SConrad Meyer 
450*f7cd7fe5SConrad Meyer #if ZSTD_ADDRESS_SANITIZER && !defined (ZSTD_ASAN_DONT_POISON_WORKSPACE)
451*f7cd7fe5SConrad Meyer     /* We don't do this when the workspace is statically allocated, because
452*f7cd7fe5SConrad Meyer      * when that is the case, we have no capability to hook into the end of the
453*f7cd7fe5SConrad Meyer      * workspace's lifecycle to unpoison the memory.
454*f7cd7fe5SConrad Meyer      */
455*f7cd7fe5SConrad Meyer     if (ws->isStatic == ZSTD_cwksp_dynamic_alloc) {
4569cbefe25SConrad Meyer         size_t size = (BYTE*)ws->workspaceEnd - (BYTE*)ws->objectEnd;
4579cbefe25SConrad Meyer         __asan_poison_memory_region(ws->objectEnd, size);
4589cbefe25SConrad Meyer     }
4599cbefe25SConrad Meyer #endif
4609cbefe25SConrad Meyer 
4619cbefe25SConrad Meyer     ws->tableEnd = ws->objectEnd;
4629cbefe25SConrad Meyer     ws->allocStart = ws->workspaceEnd;
4639cbefe25SConrad Meyer     ws->allocFailed = 0;
4649cbefe25SConrad Meyer     if (ws->phase > ZSTD_cwksp_alloc_buffers) {
4659cbefe25SConrad Meyer         ws->phase = ZSTD_cwksp_alloc_buffers;
4669cbefe25SConrad Meyer     }
4679cbefe25SConrad Meyer     ZSTD_cwksp_assert_internal_consistency(ws);
4689cbefe25SConrad Meyer }
4699cbefe25SConrad Meyer 
4709cbefe25SConrad Meyer /**
4719cbefe25SConrad Meyer  * The provided workspace takes ownership of the buffer [start, start+size).
4729cbefe25SConrad Meyer  * Any existing values in the workspace are ignored (the previously managed
4739cbefe25SConrad Meyer  * buffer, if present, must be separately freed).
4749cbefe25SConrad Meyer  */
475*f7cd7fe5SConrad Meyer MEM_STATIC void ZSTD_cwksp_init(ZSTD_cwksp* ws, void* start, size_t size, ZSTD_cwksp_static_alloc_e isStatic) {
4769cbefe25SConrad Meyer     DEBUGLOG(4, "cwksp: init'ing workspace with %zd bytes", size);
4779cbefe25SConrad Meyer     assert(((size_t)start & (sizeof(void*)-1)) == 0); /* ensure correct alignment */
4789cbefe25SConrad Meyer     ws->workspace = start;
4799cbefe25SConrad Meyer     ws->workspaceEnd = (BYTE*)start + size;
4809cbefe25SConrad Meyer     ws->objectEnd = ws->workspace;
4819cbefe25SConrad Meyer     ws->tableValidEnd = ws->objectEnd;
4829cbefe25SConrad Meyer     ws->phase = ZSTD_cwksp_alloc_objects;
483*f7cd7fe5SConrad Meyer     ws->isStatic = isStatic;
4849cbefe25SConrad Meyer     ZSTD_cwksp_clear(ws);
4859cbefe25SConrad Meyer     ws->workspaceOversizedDuration = 0;
4869cbefe25SConrad Meyer     ZSTD_cwksp_assert_internal_consistency(ws);
4879cbefe25SConrad Meyer }
4889cbefe25SConrad Meyer 
4899cbefe25SConrad Meyer MEM_STATIC size_t ZSTD_cwksp_create(ZSTD_cwksp* ws, size_t size, ZSTD_customMem customMem) {
490*f7cd7fe5SConrad Meyer     void* workspace = ZSTD_customMalloc(size, customMem);
4919cbefe25SConrad Meyer     DEBUGLOG(4, "cwksp: creating new workspace with %zd bytes", size);
49237f1f268SConrad Meyer     RETURN_ERROR_IF(workspace == NULL, memory_allocation, "NULL pointer!");
493*f7cd7fe5SConrad Meyer     ZSTD_cwksp_init(ws, workspace, size, ZSTD_cwksp_dynamic_alloc);
4949cbefe25SConrad Meyer     return 0;
4959cbefe25SConrad Meyer }
4969cbefe25SConrad Meyer 
4979cbefe25SConrad Meyer MEM_STATIC void ZSTD_cwksp_free(ZSTD_cwksp* ws, ZSTD_customMem customMem) {
4989cbefe25SConrad Meyer     void *ptr = ws->workspace;
4999cbefe25SConrad Meyer     DEBUGLOG(4, "cwksp: freeing workspace");
500*f7cd7fe5SConrad Meyer     ZSTD_memset(ws, 0, sizeof(ZSTD_cwksp));
501*f7cd7fe5SConrad Meyer     ZSTD_customFree(ptr, customMem);
5029cbefe25SConrad Meyer }
5039cbefe25SConrad Meyer 
5049cbefe25SConrad Meyer /**
5059cbefe25SConrad Meyer  * Moves the management of a workspace from one cwksp to another. The src cwksp
5069cbefe25SConrad Meyer  * is left in an invalid state (src must be re-init()'ed before its used again).
5079cbefe25SConrad Meyer  */
5089cbefe25SConrad Meyer MEM_STATIC void ZSTD_cwksp_move(ZSTD_cwksp* dst, ZSTD_cwksp* src) {
5099cbefe25SConrad Meyer     *dst = *src;
510*f7cd7fe5SConrad Meyer     ZSTD_memset(src, 0, sizeof(ZSTD_cwksp));
5119cbefe25SConrad Meyer }
5129cbefe25SConrad Meyer 
5139cbefe25SConrad Meyer MEM_STATIC size_t ZSTD_cwksp_sizeof(const ZSTD_cwksp* ws) {
5149cbefe25SConrad Meyer     return (size_t)((BYTE*)ws->workspaceEnd - (BYTE*)ws->workspace);
5159cbefe25SConrad Meyer }
5169cbefe25SConrad Meyer 
517*f7cd7fe5SConrad Meyer MEM_STATIC size_t ZSTD_cwksp_used(const ZSTD_cwksp* ws) {
518*f7cd7fe5SConrad Meyer     return (size_t)((BYTE*)ws->tableEnd - (BYTE*)ws->workspace)
519*f7cd7fe5SConrad Meyer          + (size_t)((BYTE*)ws->workspaceEnd - (BYTE*)ws->allocStart);
520*f7cd7fe5SConrad Meyer }
521*f7cd7fe5SConrad Meyer 
5229cbefe25SConrad Meyer MEM_STATIC int ZSTD_cwksp_reserve_failed(const ZSTD_cwksp* ws) {
5239cbefe25SConrad Meyer     return ws->allocFailed;
5249cbefe25SConrad Meyer }
5259cbefe25SConrad Meyer 
5269cbefe25SConrad Meyer /*-*************************************
5279cbefe25SConrad Meyer *  Functions Checking Free Space
5289cbefe25SConrad Meyer ***************************************/
5299cbefe25SConrad Meyer 
5309cbefe25SConrad Meyer MEM_STATIC size_t ZSTD_cwksp_available_space(ZSTD_cwksp* ws) {
5319cbefe25SConrad Meyer     return (size_t)((BYTE*)ws->allocStart - (BYTE*)ws->tableEnd);
5329cbefe25SConrad Meyer }
5339cbefe25SConrad Meyer 
5349cbefe25SConrad Meyer MEM_STATIC int ZSTD_cwksp_check_available(ZSTD_cwksp* ws, size_t additionalNeededSpace) {
5359cbefe25SConrad Meyer     return ZSTD_cwksp_available_space(ws) >= additionalNeededSpace;
5369cbefe25SConrad Meyer }
5379cbefe25SConrad Meyer 
5389cbefe25SConrad Meyer MEM_STATIC int ZSTD_cwksp_check_too_large(ZSTD_cwksp* ws, size_t additionalNeededSpace) {
5399cbefe25SConrad Meyer     return ZSTD_cwksp_check_available(
5409cbefe25SConrad Meyer         ws, additionalNeededSpace * ZSTD_WORKSPACETOOLARGE_FACTOR);
5419cbefe25SConrad Meyer }
5429cbefe25SConrad Meyer 
5439cbefe25SConrad Meyer MEM_STATIC int ZSTD_cwksp_check_wasteful(ZSTD_cwksp* ws, size_t additionalNeededSpace) {
5449cbefe25SConrad Meyer     return ZSTD_cwksp_check_too_large(ws, additionalNeededSpace)
5459cbefe25SConrad Meyer         && ws->workspaceOversizedDuration > ZSTD_WORKSPACETOOLARGE_MAXDURATION;
5469cbefe25SConrad Meyer }
5479cbefe25SConrad Meyer 
5489cbefe25SConrad Meyer MEM_STATIC void ZSTD_cwksp_bump_oversized_duration(
5499cbefe25SConrad Meyer         ZSTD_cwksp* ws, size_t additionalNeededSpace) {
5509cbefe25SConrad Meyer     if (ZSTD_cwksp_check_too_large(ws, additionalNeededSpace)) {
5519cbefe25SConrad Meyer         ws->workspaceOversizedDuration++;
5529cbefe25SConrad Meyer     } else {
5539cbefe25SConrad Meyer         ws->workspaceOversizedDuration = 0;
5549cbefe25SConrad Meyer     }
5559cbefe25SConrad Meyer }
5569cbefe25SConrad Meyer 
5579cbefe25SConrad Meyer #if defined (__cplusplus)
5589cbefe25SConrad Meyer }
5599cbefe25SConrad Meyer #endif
5609cbefe25SConrad Meyer 
5619cbefe25SConrad Meyer #endif /* ZSTD_CWKSP_H */
562