162306a36Sopenharmony_ci/*
262306a36Sopenharmony_ci * Copyright (c) Yann Collet, Facebook, Inc.
362306a36Sopenharmony_ci * All rights reserved.
462306a36Sopenharmony_ci *
562306a36Sopenharmony_ci * This source code is licensed under both the BSD-style license (found in the
662306a36Sopenharmony_ci * LICENSE file in the root directory of this source tree) and the GPLv2 (found
762306a36Sopenharmony_ci * in the COPYING file in the root directory of this source tree).
862306a36Sopenharmony_ci * You may select, at your option, one of the above-listed licenses.
962306a36Sopenharmony_ci */
1062306a36Sopenharmony_ci
1162306a36Sopenharmony_ci#ifndef ZSTD_CWKSP_H
1262306a36Sopenharmony_ci#define ZSTD_CWKSP_H
1362306a36Sopenharmony_ci
1462306a36Sopenharmony_ci/*-*************************************
1562306a36Sopenharmony_ci*  Dependencies
1662306a36Sopenharmony_ci***************************************/
1762306a36Sopenharmony_ci#include "../common/zstd_internal.h"
1862306a36Sopenharmony_ci
1962306a36Sopenharmony_ci
2062306a36Sopenharmony_ci/*-*************************************
2162306a36Sopenharmony_ci*  Constants
2262306a36Sopenharmony_ci***************************************/
2362306a36Sopenharmony_ci
/* The workspace is effectively a small arena allocator of its own. When
 * running under ASAN, redzones should therefore be inserted between the
 * individual elements carved out of it, so that ASAN also catches overruns
 * that leave an object but stay inside the workspace.
 *
 * ZSTD_CWKSP_ASAN_REDZONE_SIZE is the size of such a redzone. It can be
 * overridden by defining the macro before this header is included.
 */
#ifndef ZSTD_CWKSP_ASAN_REDZONE_SIZE
#define ZSTD_CWKSP_ASAN_REDZONE_SIZE 128
#endif


/* Alignment, in bytes, applied to tables and "aligned" allocations. */
#define ZSTD_CWKSP_ALIGNMENT_BYTES 64
3862306a36Sopenharmony_ci
3962306a36Sopenharmony_ci/*-*************************************
4062306a36Sopenharmony_ci*  Structures
4162306a36Sopenharmony_ci***************************************/
/* Allocation phase of a workspace. The numeric order is significant: the
 * workspace code compares phases with relational operators. */
typedef enum {
    ZSTD_cwksp_alloc_objects = 0,   /* reserving objects */
    ZSTD_cwksp_alloc_buffers = 1,   /* reserving unaligned buffers */
    ZSTD_cwksp_alloc_aligned = 2    /* reserving aligned buffers and tables */
} ZSTD_cwksp_alloc_phase_e;
4762306a36Sopenharmony_ci
/*
 * Tells how the memory behind a workspace was obtained: either it is
 * statically allocated (and will not necessarily ever be freed), or it is
 * dynamically allocated and a well-formed caller is expected to free it.
 */
typedef enum {
    ZSTD_cwksp_dynamic_alloc = 0,
    ZSTD_cwksp_static_alloc = 1
} ZSTD_cwksp_static_alloc_e;
5762306a36Sopenharmony_ci
5862306a36Sopenharmony_ci/*
 * Zstd fits all its internal datastructures into a single contiguous buffer,
6062306a36Sopenharmony_ci * so that it only needs to perform a single OS allocation (or so that a buffer
6162306a36Sopenharmony_ci * can be provided to it and it can perform no allocations at all). This buffer
6262306a36Sopenharmony_ci * is called the workspace.
6362306a36Sopenharmony_ci *
6462306a36Sopenharmony_ci * Several optimizations complicate that process of allocating memory ranges
6562306a36Sopenharmony_ci * from this workspace for each internal datastructure:
6662306a36Sopenharmony_ci *
6762306a36Sopenharmony_ci * - These different internal datastructures have different setup requirements:
6862306a36Sopenharmony_ci *
6962306a36Sopenharmony_ci *   - The static objects need to be cleared once and can then be trivially
7062306a36Sopenharmony_ci *     reused for each compression.
7162306a36Sopenharmony_ci *
7262306a36Sopenharmony_ci *   - Various buffers don't need to be initialized at all--they are always
7362306a36Sopenharmony_ci *     written into before they're read.
7462306a36Sopenharmony_ci *
7562306a36Sopenharmony_ci *   - The matchstate tables have a unique requirement that they don't need
7662306a36Sopenharmony_ci *     their memory to be totally cleared, but they do need the memory to have
7762306a36Sopenharmony_ci *     some bound, i.e., a guarantee that all values in the memory they've been
 *     allocated are less than some maximum value (which is the starting value
7962306a36Sopenharmony_ci *     for the indices that they will then use for compression). When this
8062306a36Sopenharmony_ci *     guarantee is provided to them, they can use the memory without any setup
8162306a36Sopenharmony_ci *     work. When it can't, they have to clear the area.
8262306a36Sopenharmony_ci *
8362306a36Sopenharmony_ci * - These buffers also have different alignment requirements.
8462306a36Sopenharmony_ci *
8562306a36Sopenharmony_ci * - We would like to reuse the objects in the workspace for multiple
8662306a36Sopenharmony_ci *   compressions without having to perform any expensive reallocation or
8762306a36Sopenharmony_ci *   reinitialization work.
8862306a36Sopenharmony_ci *
8962306a36Sopenharmony_ci * - We would like to be able to efficiently reuse the workspace across
9062306a36Sopenharmony_ci *   multiple compressions **even when the compression parameters change** and
9162306a36Sopenharmony_ci *   we need to resize some of the objects (where possible).
9262306a36Sopenharmony_ci *
9362306a36Sopenharmony_ci * To attempt to manage this buffer, given these constraints, the ZSTD_cwksp
9462306a36Sopenharmony_ci * abstraction was created. It works as follows:
9562306a36Sopenharmony_ci *
9662306a36Sopenharmony_ci * Workspace Layout:
9762306a36Sopenharmony_ci *
9862306a36Sopenharmony_ci * [                        ... workspace ...                         ]
9962306a36Sopenharmony_ci * [objects][tables ... ->] free space [<- ... aligned][<- ... buffers]
10062306a36Sopenharmony_ci *
10162306a36Sopenharmony_ci * The various objects that live in the workspace are divided into the
10262306a36Sopenharmony_ci * following categories, and are allocated separately:
10362306a36Sopenharmony_ci *
10462306a36Sopenharmony_ci * - Static objects: this is optionally the enclosing ZSTD_CCtx or ZSTD_CDict,
10562306a36Sopenharmony_ci *   so that literally everything fits in a single buffer. Note: if present,
10662306a36Sopenharmony_ci *   this must be the first object in the workspace, since ZSTD_customFree{CCtx,
10762306a36Sopenharmony_ci *   CDict}() rely on a pointer comparison to see whether one or two frees are
10862306a36Sopenharmony_ci *   required.
10962306a36Sopenharmony_ci *
11062306a36Sopenharmony_ci * - Fixed size objects: these are fixed-size, fixed-count objects that are
11162306a36Sopenharmony_ci *   nonetheless "dynamically" allocated in the workspace so that we can
11262306a36Sopenharmony_ci *   control how they're initialized separately from the broader ZSTD_CCtx.
11362306a36Sopenharmony_ci *   Examples:
11462306a36Sopenharmony_ci *   - Entropy Workspace
11562306a36Sopenharmony_ci *   - 2 x ZSTD_compressedBlockState_t
11662306a36Sopenharmony_ci *   - CDict dictionary contents
11762306a36Sopenharmony_ci *
11862306a36Sopenharmony_ci * - Tables: these are any of several different datastructures (hash tables,
11962306a36Sopenharmony_ci *   chain tables, binary trees) that all respect a common format: they are
12062306a36Sopenharmony_ci *   uint32_t arrays, all of whose values are between 0 and (nextSrc - base).
12162306a36Sopenharmony_ci *   Their sizes depend on the cparams. These tables are 64-byte aligned.
12262306a36Sopenharmony_ci *
12362306a36Sopenharmony_ci * - Aligned: these buffers are used for various purposes that require 4 byte
12462306a36Sopenharmony_ci *   alignment, but don't require any initialization before they're used. These
12562306a36Sopenharmony_ci *   buffers are each aligned to 64 bytes.
12662306a36Sopenharmony_ci *
12762306a36Sopenharmony_ci * - Buffers: these buffers are used for various purposes that don't require
12862306a36Sopenharmony_ci *   any alignment or initialization before they're used. This means they can
12962306a36Sopenharmony_ci *   be moved around at no cost for a new compression.
13062306a36Sopenharmony_ci *
13162306a36Sopenharmony_ci * Allocating Memory:
13262306a36Sopenharmony_ci *
13362306a36Sopenharmony_ci * The various types of objects must be allocated in order, so they can be
13462306a36Sopenharmony_ci * correctly packed into the workspace buffer. That order is:
13562306a36Sopenharmony_ci *
13662306a36Sopenharmony_ci * 1. Objects
13762306a36Sopenharmony_ci * 2. Buffers
13862306a36Sopenharmony_ci * 3. Aligned/Tables
13962306a36Sopenharmony_ci *
14062306a36Sopenharmony_ci * Attempts to reserve objects of different types out of order will fail.
14162306a36Sopenharmony_ci */
14262306a36Sopenharmony_citypedef struct {
14362306a36Sopenharmony_ci    void* workspace;
14462306a36Sopenharmony_ci    void* workspaceEnd;
14562306a36Sopenharmony_ci
14662306a36Sopenharmony_ci    void* objectEnd;
14762306a36Sopenharmony_ci    void* tableEnd;
14862306a36Sopenharmony_ci    void* tableValidEnd;
14962306a36Sopenharmony_ci    void* allocStart;
15062306a36Sopenharmony_ci
15162306a36Sopenharmony_ci    BYTE allocFailed;
15262306a36Sopenharmony_ci    int workspaceOversizedDuration;
15362306a36Sopenharmony_ci    ZSTD_cwksp_alloc_phase_e phase;
15462306a36Sopenharmony_ci    ZSTD_cwksp_static_alloc_e isStatic;
15562306a36Sopenharmony_ci} ZSTD_cwksp;
15662306a36Sopenharmony_ci
15762306a36Sopenharmony_ci/*-*************************************
15862306a36Sopenharmony_ci*  Functions
15962306a36Sopenharmony_ci***************************************/
16062306a36Sopenharmony_ci
16162306a36Sopenharmony_ciMEM_STATIC size_t ZSTD_cwksp_available_space(ZSTD_cwksp* ws);
16262306a36Sopenharmony_ci
16362306a36Sopenharmony_ciMEM_STATIC void ZSTD_cwksp_assert_internal_consistency(ZSTD_cwksp* ws) {
16462306a36Sopenharmony_ci    (void)ws;
16562306a36Sopenharmony_ci    assert(ws->workspace <= ws->objectEnd);
16662306a36Sopenharmony_ci    assert(ws->objectEnd <= ws->tableEnd);
16762306a36Sopenharmony_ci    assert(ws->objectEnd <= ws->tableValidEnd);
16862306a36Sopenharmony_ci    assert(ws->tableEnd <= ws->allocStart);
16962306a36Sopenharmony_ci    assert(ws->tableValidEnd <= ws->allocStart);
17062306a36Sopenharmony_ci    assert(ws->allocStart <= ws->workspaceEnd);
17162306a36Sopenharmony_ci}
17262306a36Sopenharmony_ci
17362306a36Sopenharmony_ci/*
17462306a36Sopenharmony_ci * Align must be a power of 2.
17562306a36Sopenharmony_ci */
17662306a36Sopenharmony_ciMEM_STATIC size_t ZSTD_cwksp_align(size_t size, size_t const align) {
17762306a36Sopenharmony_ci    size_t const mask = align - 1;
17862306a36Sopenharmony_ci    assert((align & mask) == 0);
17962306a36Sopenharmony_ci    return (size + mask) & ~mask;
18062306a36Sopenharmony_ci}
18162306a36Sopenharmony_ci
18262306a36Sopenharmony_ci/*
18362306a36Sopenharmony_ci * Use this to determine how much space in the workspace we will consume to
18462306a36Sopenharmony_ci * allocate this object. (Normally it should be exactly the size of the object,
18562306a36Sopenharmony_ci * but under special conditions, like ASAN, where we pad each object, it might
18662306a36Sopenharmony_ci * be larger.)
18762306a36Sopenharmony_ci *
18862306a36Sopenharmony_ci * Since tables aren't currently redzoned, you don't need to call through this
18962306a36Sopenharmony_ci * to figure out how much space you need for the matchState tables. Everything
19062306a36Sopenharmony_ci * else is though.
19162306a36Sopenharmony_ci *
19262306a36Sopenharmony_ci * Do not use for sizing aligned buffers. Instead, use ZSTD_cwksp_aligned_alloc_size().
19362306a36Sopenharmony_ci */
19462306a36Sopenharmony_ciMEM_STATIC size_t ZSTD_cwksp_alloc_size(size_t size) {
19562306a36Sopenharmony_ci    if (size == 0)
19662306a36Sopenharmony_ci        return 0;
19762306a36Sopenharmony_ci    return size;
19862306a36Sopenharmony_ci}
19962306a36Sopenharmony_ci
20062306a36Sopenharmony_ci/*
20162306a36Sopenharmony_ci * Returns an adjusted alloc size that is the nearest larger multiple of 64 bytes.
20262306a36Sopenharmony_ci * Used to determine the number of bytes required for a given "aligned".
20362306a36Sopenharmony_ci */
20462306a36Sopenharmony_ciMEM_STATIC size_t ZSTD_cwksp_aligned_alloc_size(size_t size) {
20562306a36Sopenharmony_ci    return ZSTD_cwksp_alloc_size(ZSTD_cwksp_align(size, ZSTD_CWKSP_ALIGNMENT_BYTES));
20662306a36Sopenharmony_ci}
20762306a36Sopenharmony_ci
20862306a36Sopenharmony_ci/*
20962306a36Sopenharmony_ci * Returns the amount of additional space the cwksp must allocate
21062306a36Sopenharmony_ci * for internal purposes (currently only alignment).
21162306a36Sopenharmony_ci */
21262306a36Sopenharmony_ciMEM_STATIC size_t ZSTD_cwksp_slack_space_required(void) {
21362306a36Sopenharmony_ci    /* For alignment, the wksp will always allocate an additional n_1=[1, 64] bytes
21462306a36Sopenharmony_ci     * to align the beginning of tables section, as well as another n_2=[0, 63] bytes
21562306a36Sopenharmony_ci     * to align the beginning of the aligned section.
21662306a36Sopenharmony_ci     *
21762306a36Sopenharmony_ci     * n_1 + n_2 == 64 bytes if the cwksp is freshly allocated, due to tables and
21862306a36Sopenharmony_ci     * aligneds being sized in multiples of 64 bytes.
21962306a36Sopenharmony_ci     */
22062306a36Sopenharmony_ci    size_t const slackSpace = ZSTD_CWKSP_ALIGNMENT_BYTES;
22162306a36Sopenharmony_ci    return slackSpace;
22262306a36Sopenharmony_ci}
22362306a36Sopenharmony_ci
22462306a36Sopenharmony_ci
22562306a36Sopenharmony_ci/*
22662306a36Sopenharmony_ci * Return the number of additional bytes required to align a pointer to the given number of bytes.
22762306a36Sopenharmony_ci * alignBytes must be a power of two.
22862306a36Sopenharmony_ci */
22962306a36Sopenharmony_ciMEM_STATIC size_t ZSTD_cwksp_bytes_to_align_ptr(void* ptr, const size_t alignBytes) {
23062306a36Sopenharmony_ci    size_t const alignBytesMask = alignBytes - 1;
23162306a36Sopenharmony_ci    size_t const bytes = (alignBytes - ((size_t)ptr & (alignBytesMask))) & alignBytesMask;
23262306a36Sopenharmony_ci    assert((alignBytes & alignBytesMask) == 0);
23362306a36Sopenharmony_ci    assert(bytes != ZSTD_CWKSP_ALIGNMENT_BYTES);
23462306a36Sopenharmony_ci    return bytes;
23562306a36Sopenharmony_ci}
23662306a36Sopenharmony_ci
23762306a36Sopenharmony_ci/*
23862306a36Sopenharmony_ci * Internal function. Do not use directly.
23962306a36Sopenharmony_ci * Reserves the given number of bytes within the aligned/buffer segment of the wksp,
24062306a36Sopenharmony_ci * which counts from the end of the wksp (as opposed to the object/table segment).
24162306a36Sopenharmony_ci *
24262306a36Sopenharmony_ci * Returns a pointer to the beginning of that space.
24362306a36Sopenharmony_ci */
24462306a36Sopenharmony_ciMEM_STATIC void*
24562306a36Sopenharmony_ciZSTD_cwksp_reserve_internal_buffer_space(ZSTD_cwksp* ws, size_t const bytes)
24662306a36Sopenharmony_ci{
24762306a36Sopenharmony_ci    void* const alloc = (BYTE*)ws->allocStart - bytes;
24862306a36Sopenharmony_ci    void* const bottom = ws->tableEnd;
24962306a36Sopenharmony_ci    DEBUGLOG(5, "cwksp: reserving %p %zd bytes, %zd bytes remaining",
25062306a36Sopenharmony_ci        alloc, bytes, ZSTD_cwksp_available_space(ws) - bytes);
25162306a36Sopenharmony_ci    ZSTD_cwksp_assert_internal_consistency(ws);
25262306a36Sopenharmony_ci    assert(alloc >= bottom);
25362306a36Sopenharmony_ci    if (alloc < bottom) {
25462306a36Sopenharmony_ci        DEBUGLOG(4, "cwksp: alloc failed!");
25562306a36Sopenharmony_ci        ws->allocFailed = 1;
25662306a36Sopenharmony_ci        return NULL;
25762306a36Sopenharmony_ci    }
25862306a36Sopenharmony_ci    /* the area is reserved from the end of wksp.
25962306a36Sopenharmony_ci     * If it overlaps with tableValidEnd, it voids guarantees on values' range */
26062306a36Sopenharmony_ci    if (alloc < ws->tableValidEnd) {
26162306a36Sopenharmony_ci        ws->tableValidEnd = alloc;
26262306a36Sopenharmony_ci    }
26362306a36Sopenharmony_ci    ws->allocStart = alloc;
26462306a36Sopenharmony_ci    return alloc;
26562306a36Sopenharmony_ci}
26662306a36Sopenharmony_ci
26762306a36Sopenharmony_ci/*
26862306a36Sopenharmony_ci * Moves the cwksp to the next phase, and does any necessary allocations.
26962306a36Sopenharmony_ci * cwksp initialization must necessarily go through each phase in order.
27062306a36Sopenharmony_ci * Returns a 0 on success, or zstd error
27162306a36Sopenharmony_ci */
27262306a36Sopenharmony_ciMEM_STATIC size_t
27362306a36Sopenharmony_ciZSTD_cwksp_internal_advance_phase(ZSTD_cwksp* ws, ZSTD_cwksp_alloc_phase_e phase)
27462306a36Sopenharmony_ci{
27562306a36Sopenharmony_ci    assert(phase >= ws->phase);
27662306a36Sopenharmony_ci    if (phase > ws->phase) {
27762306a36Sopenharmony_ci        /* Going from allocating objects to allocating buffers */
27862306a36Sopenharmony_ci        if (ws->phase < ZSTD_cwksp_alloc_buffers &&
27962306a36Sopenharmony_ci                phase >= ZSTD_cwksp_alloc_buffers) {
28062306a36Sopenharmony_ci            ws->tableValidEnd = ws->objectEnd;
28162306a36Sopenharmony_ci        }
28262306a36Sopenharmony_ci
28362306a36Sopenharmony_ci        /* Going from allocating buffers to allocating aligneds/tables */
28462306a36Sopenharmony_ci        if (ws->phase < ZSTD_cwksp_alloc_aligned &&
28562306a36Sopenharmony_ci                phase >= ZSTD_cwksp_alloc_aligned) {
28662306a36Sopenharmony_ci            {   /* Align the start of the "aligned" to 64 bytes. Use [1, 64] bytes. */
28762306a36Sopenharmony_ci                size_t const bytesToAlign =
28862306a36Sopenharmony_ci                    ZSTD_CWKSP_ALIGNMENT_BYTES - ZSTD_cwksp_bytes_to_align_ptr(ws->allocStart, ZSTD_CWKSP_ALIGNMENT_BYTES);
28962306a36Sopenharmony_ci                DEBUGLOG(5, "reserving aligned alignment addtl space: %zu", bytesToAlign);
29062306a36Sopenharmony_ci                ZSTD_STATIC_ASSERT((ZSTD_CWKSP_ALIGNMENT_BYTES & (ZSTD_CWKSP_ALIGNMENT_BYTES - 1)) == 0); /* power of 2 */
29162306a36Sopenharmony_ci                RETURN_ERROR_IF(!ZSTD_cwksp_reserve_internal_buffer_space(ws, bytesToAlign),
29262306a36Sopenharmony_ci                                memory_allocation, "aligned phase - alignment initial allocation failed!");
29362306a36Sopenharmony_ci            }
29462306a36Sopenharmony_ci            {   /* Align the start of the tables to 64 bytes. Use [0, 63] bytes */
29562306a36Sopenharmony_ci                void* const alloc = ws->objectEnd;
29662306a36Sopenharmony_ci                size_t const bytesToAlign = ZSTD_cwksp_bytes_to_align_ptr(alloc, ZSTD_CWKSP_ALIGNMENT_BYTES);
29762306a36Sopenharmony_ci                void* const objectEnd = (BYTE*)alloc + bytesToAlign;
29862306a36Sopenharmony_ci                DEBUGLOG(5, "reserving table alignment addtl space: %zu", bytesToAlign);
29962306a36Sopenharmony_ci                RETURN_ERROR_IF(objectEnd > ws->workspaceEnd, memory_allocation,
30062306a36Sopenharmony_ci                                "table phase - alignment initial allocation failed!");
30162306a36Sopenharmony_ci                ws->objectEnd = objectEnd;
30262306a36Sopenharmony_ci                ws->tableEnd = objectEnd;  /* table area starts being empty */
30362306a36Sopenharmony_ci                if (ws->tableValidEnd < ws->tableEnd) {
30462306a36Sopenharmony_ci                    ws->tableValidEnd = ws->tableEnd;
30562306a36Sopenharmony_ci        }   }   }
30662306a36Sopenharmony_ci        ws->phase = phase;
30762306a36Sopenharmony_ci        ZSTD_cwksp_assert_internal_consistency(ws);
30862306a36Sopenharmony_ci    }
30962306a36Sopenharmony_ci    return 0;
31062306a36Sopenharmony_ci}
31162306a36Sopenharmony_ci
31262306a36Sopenharmony_ci/*
31362306a36Sopenharmony_ci * Returns whether this object/buffer/etc was allocated in this workspace.
31462306a36Sopenharmony_ci */
31562306a36Sopenharmony_ciMEM_STATIC int ZSTD_cwksp_owns_buffer(const ZSTD_cwksp* ws, const void* ptr)
31662306a36Sopenharmony_ci{
31762306a36Sopenharmony_ci    return (ptr != NULL) && (ws->workspace <= ptr) && (ptr <= ws->workspaceEnd);
31862306a36Sopenharmony_ci}
31962306a36Sopenharmony_ci
32062306a36Sopenharmony_ci/*
32162306a36Sopenharmony_ci * Internal function. Do not use directly.
32262306a36Sopenharmony_ci */
32362306a36Sopenharmony_ciMEM_STATIC void*
32462306a36Sopenharmony_ciZSTD_cwksp_reserve_internal(ZSTD_cwksp* ws, size_t bytes, ZSTD_cwksp_alloc_phase_e phase)
32562306a36Sopenharmony_ci{
32662306a36Sopenharmony_ci    void* alloc;
32762306a36Sopenharmony_ci    if (ZSTD_isError(ZSTD_cwksp_internal_advance_phase(ws, phase)) || bytes == 0) {
32862306a36Sopenharmony_ci        return NULL;
32962306a36Sopenharmony_ci    }
33062306a36Sopenharmony_ci
33162306a36Sopenharmony_ci
33262306a36Sopenharmony_ci    alloc = ZSTD_cwksp_reserve_internal_buffer_space(ws, bytes);
33362306a36Sopenharmony_ci
33462306a36Sopenharmony_ci
33562306a36Sopenharmony_ci    return alloc;
33662306a36Sopenharmony_ci}
33762306a36Sopenharmony_ci
33862306a36Sopenharmony_ci/*
33962306a36Sopenharmony_ci * Reserves and returns unaligned memory.
34062306a36Sopenharmony_ci */
34162306a36Sopenharmony_ciMEM_STATIC BYTE* ZSTD_cwksp_reserve_buffer(ZSTD_cwksp* ws, size_t bytes)
34262306a36Sopenharmony_ci{
34362306a36Sopenharmony_ci    return (BYTE*)ZSTD_cwksp_reserve_internal(ws, bytes, ZSTD_cwksp_alloc_buffers);
34462306a36Sopenharmony_ci}
34562306a36Sopenharmony_ci
34662306a36Sopenharmony_ci/*
34762306a36Sopenharmony_ci * Reserves and returns memory sized on and aligned on ZSTD_CWKSP_ALIGNMENT_BYTES (64 bytes).
34862306a36Sopenharmony_ci */
34962306a36Sopenharmony_ciMEM_STATIC void* ZSTD_cwksp_reserve_aligned(ZSTD_cwksp* ws, size_t bytes)
35062306a36Sopenharmony_ci{
35162306a36Sopenharmony_ci    void* ptr = ZSTD_cwksp_reserve_internal(ws, ZSTD_cwksp_align(bytes, ZSTD_CWKSP_ALIGNMENT_BYTES),
35262306a36Sopenharmony_ci                                            ZSTD_cwksp_alloc_aligned);
35362306a36Sopenharmony_ci    assert(((size_t)ptr & (ZSTD_CWKSP_ALIGNMENT_BYTES-1))== 0);
35462306a36Sopenharmony_ci    return ptr;
35562306a36Sopenharmony_ci}
35662306a36Sopenharmony_ci
35762306a36Sopenharmony_ci/*
35862306a36Sopenharmony_ci * Aligned on 64 bytes. These buffers have the special property that
35962306a36Sopenharmony_ci * their values remain constrained, allowing us to re-use them without
36062306a36Sopenharmony_ci * memset()-ing them.
36162306a36Sopenharmony_ci */
36262306a36Sopenharmony_ciMEM_STATIC void* ZSTD_cwksp_reserve_table(ZSTD_cwksp* ws, size_t bytes)
36362306a36Sopenharmony_ci{
36462306a36Sopenharmony_ci    const ZSTD_cwksp_alloc_phase_e phase = ZSTD_cwksp_alloc_aligned;
36562306a36Sopenharmony_ci    void* alloc;
36662306a36Sopenharmony_ci    void* end;
36762306a36Sopenharmony_ci    void* top;
36862306a36Sopenharmony_ci
36962306a36Sopenharmony_ci    if (ZSTD_isError(ZSTD_cwksp_internal_advance_phase(ws, phase))) {
37062306a36Sopenharmony_ci        return NULL;
37162306a36Sopenharmony_ci    }
37262306a36Sopenharmony_ci    alloc = ws->tableEnd;
37362306a36Sopenharmony_ci    end = (BYTE *)alloc + bytes;
37462306a36Sopenharmony_ci    top = ws->allocStart;
37562306a36Sopenharmony_ci
37662306a36Sopenharmony_ci    DEBUGLOG(5, "cwksp: reserving %p table %zd bytes, %zd bytes remaining",
37762306a36Sopenharmony_ci        alloc, bytes, ZSTD_cwksp_available_space(ws) - bytes);
37862306a36Sopenharmony_ci    assert((bytes & (sizeof(U32)-1)) == 0);
37962306a36Sopenharmony_ci    ZSTD_cwksp_assert_internal_consistency(ws);
38062306a36Sopenharmony_ci    assert(end <= top);
38162306a36Sopenharmony_ci    if (end > top) {
38262306a36Sopenharmony_ci        DEBUGLOG(4, "cwksp: table alloc failed!");
38362306a36Sopenharmony_ci        ws->allocFailed = 1;
38462306a36Sopenharmony_ci        return NULL;
38562306a36Sopenharmony_ci    }
38662306a36Sopenharmony_ci    ws->tableEnd = end;
38762306a36Sopenharmony_ci
38862306a36Sopenharmony_ci
38962306a36Sopenharmony_ci    assert((bytes & (ZSTD_CWKSP_ALIGNMENT_BYTES-1)) == 0);
39062306a36Sopenharmony_ci    assert(((size_t)alloc & (ZSTD_CWKSP_ALIGNMENT_BYTES-1))== 0);
39162306a36Sopenharmony_ci    return alloc;
39262306a36Sopenharmony_ci}
39362306a36Sopenharmony_ci
39462306a36Sopenharmony_ci/*
39562306a36Sopenharmony_ci * Aligned on sizeof(void*).
39662306a36Sopenharmony_ci * Note : should happen only once, at workspace first initialization
39762306a36Sopenharmony_ci */
39862306a36Sopenharmony_ciMEM_STATIC void* ZSTD_cwksp_reserve_object(ZSTD_cwksp* ws, size_t bytes)
39962306a36Sopenharmony_ci{
40062306a36Sopenharmony_ci    size_t const roundedBytes = ZSTD_cwksp_align(bytes, sizeof(void*));
40162306a36Sopenharmony_ci    void* alloc = ws->objectEnd;
40262306a36Sopenharmony_ci    void* end = (BYTE*)alloc + roundedBytes;
40362306a36Sopenharmony_ci
40462306a36Sopenharmony_ci
40562306a36Sopenharmony_ci    DEBUGLOG(4,
40662306a36Sopenharmony_ci        "cwksp: reserving %p object %zd bytes (rounded to %zd), %zd bytes remaining",
40762306a36Sopenharmony_ci        alloc, bytes, roundedBytes, ZSTD_cwksp_available_space(ws) - roundedBytes);
40862306a36Sopenharmony_ci    assert((size_t)alloc % ZSTD_ALIGNOF(void*) == 0);
40962306a36Sopenharmony_ci    assert(bytes % ZSTD_ALIGNOF(void*) == 0);
41062306a36Sopenharmony_ci    ZSTD_cwksp_assert_internal_consistency(ws);
41162306a36Sopenharmony_ci    /* we must be in the first phase, no advance is possible */
41262306a36Sopenharmony_ci    if (ws->phase != ZSTD_cwksp_alloc_objects || end > ws->workspaceEnd) {
41362306a36Sopenharmony_ci        DEBUGLOG(3, "cwksp: object alloc failed!");
41462306a36Sopenharmony_ci        ws->allocFailed = 1;
41562306a36Sopenharmony_ci        return NULL;
41662306a36Sopenharmony_ci    }
41762306a36Sopenharmony_ci    ws->objectEnd = end;
41862306a36Sopenharmony_ci    ws->tableEnd = end;
41962306a36Sopenharmony_ci    ws->tableValidEnd = end;
42062306a36Sopenharmony_ci
42162306a36Sopenharmony_ci
42262306a36Sopenharmony_ci    return alloc;
42362306a36Sopenharmony_ci}
42462306a36Sopenharmony_ci
42562306a36Sopenharmony_ciMEM_STATIC void ZSTD_cwksp_mark_tables_dirty(ZSTD_cwksp* ws)
42662306a36Sopenharmony_ci{
42762306a36Sopenharmony_ci    DEBUGLOG(4, "cwksp: ZSTD_cwksp_mark_tables_dirty");
42862306a36Sopenharmony_ci
42962306a36Sopenharmony_ci
43062306a36Sopenharmony_ci    assert(ws->tableValidEnd >= ws->objectEnd);
43162306a36Sopenharmony_ci    assert(ws->tableValidEnd <= ws->allocStart);
43262306a36Sopenharmony_ci    ws->tableValidEnd = ws->objectEnd;
43362306a36Sopenharmony_ci    ZSTD_cwksp_assert_internal_consistency(ws);
43462306a36Sopenharmony_ci}
43562306a36Sopenharmony_ci
43662306a36Sopenharmony_ciMEM_STATIC void ZSTD_cwksp_mark_tables_clean(ZSTD_cwksp* ws) {
43762306a36Sopenharmony_ci    DEBUGLOG(4, "cwksp: ZSTD_cwksp_mark_tables_clean");
43862306a36Sopenharmony_ci    assert(ws->tableValidEnd >= ws->objectEnd);
43962306a36Sopenharmony_ci    assert(ws->tableValidEnd <= ws->allocStart);
44062306a36Sopenharmony_ci    if (ws->tableValidEnd < ws->tableEnd) {
44162306a36Sopenharmony_ci        ws->tableValidEnd = ws->tableEnd;
44262306a36Sopenharmony_ci    }
44362306a36Sopenharmony_ci    ZSTD_cwksp_assert_internal_consistency(ws);
44462306a36Sopenharmony_ci}
44562306a36Sopenharmony_ci
44662306a36Sopenharmony_ci/*
44762306a36Sopenharmony_ci * Zero the part of the allocated tables not already marked clean.
44862306a36Sopenharmony_ci */
44962306a36Sopenharmony_ciMEM_STATIC void ZSTD_cwksp_clean_tables(ZSTD_cwksp* ws) {
45062306a36Sopenharmony_ci    DEBUGLOG(4, "cwksp: ZSTD_cwksp_clean_tables");
45162306a36Sopenharmony_ci    assert(ws->tableValidEnd >= ws->objectEnd);
45262306a36Sopenharmony_ci    assert(ws->tableValidEnd <= ws->allocStart);
45362306a36Sopenharmony_ci    if (ws->tableValidEnd < ws->tableEnd) {
45462306a36Sopenharmony_ci        ZSTD_memset(ws->tableValidEnd, 0, (BYTE*)ws->tableEnd - (BYTE*)ws->tableValidEnd);
45562306a36Sopenharmony_ci    }
45662306a36Sopenharmony_ci    ZSTD_cwksp_mark_tables_clean(ws);
45762306a36Sopenharmony_ci}
45862306a36Sopenharmony_ci
45962306a36Sopenharmony_ci/*
46062306a36Sopenharmony_ci * Invalidates table allocations.
46162306a36Sopenharmony_ci * All other allocations remain valid.
46262306a36Sopenharmony_ci */
46362306a36Sopenharmony_ciMEM_STATIC void ZSTD_cwksp_clear_tables(ZSTD_cwksp* ws) {
46462306a36Sopenharmony_ci    DEBUGLOG(4, "cwksp: clearing tables!");
46562306a36Sopenharmony_ci
46662306a36Sopenharmony_ci
46762306a36Sopenharmony_ci    ws->tableEnd = ws->objectEnd;
46862306a36Sopenharmony_ci    ZSTD_cwksp_assert_internal_consistency(ws);
46962306a36Sopenharmony_ci}
47062306a36Sopenharmony_ci
47162306a36Sopenharmony_ci/*
47262306a36Sopenharmony_ci * Invalidates all buffer, aligned, and table allocations.
47362306a36Sopenharmony_ci * Object allocations remain valid.
47462306a36Sopenharmony_ci */
47562306a36Sopenharmony_ciMEM_STATIC void ZSTD_cwksp_clear(ZSTD_cwksp* ws) {
47662306a36Sopenharmony_ci    DEBUGLOG(4, "cwksp: clearing!");
47762306a36Sopenharmony_ci
47862306a36Sopenharmony_ci
47962306a36Sopenharmony_ci
48062306a36Sopenharmony_ci    ws->tableEnd = ws->objectEnd;
48162306a36Sopenharmony_ci    ws->allocStart = ws->workspaceEnd;
48262306a36Sopenharmony_ci    ws->allocFailed = 0;
48362306a36Sopenharmony_ci    if (ws->phase > ZSTD_cwksp_alloc_buffers) {
48462306a36Sopenharmony_ci        ws->phase = ZSTD_cwksp_alloc_buffers;
48562306a36Sopenharmony_ci    }
48662306a36Sopenharmony_ci    ZSTD_cwksp_assert_internal_consistency(ws);
48762306a36Sopenharmony_ci}
48862306a36Sopenharmony_ci
48962306a36Sopenharmony_ci/*
49062306a36Sopenharmony_ci * The provided workspace takes ownership of the buffer [start, start+size).
49162306a36Sopenharmony_ci * Any existing values in the workspace are ignored (the previously managed
49262306a36Sopenharmony_ci * buffer, if present, must be separately freed).
49362306a36Sopenharmony_ci */
49462306a36Sopenharmony_ciMEM_STATIC void ZSTD_cwksp_init(ZSTD_cwksp* ws, void* start, size_t size, ZSTD_cwksp_static_alloc_e isStatic) {
49562306a36Sopenharmony_ci    DEBUGLOG(4, "cwksp: init'ing workspace with %zd bytes", size);
49662306a36Sopenharmony_ci    assert(((size_t)start & (sizeof(void*)-1)) == 0); /* ensure correct alignment */
49762306a36Sopenharmony_ci    ws->workspace = start;
49862306a36Sopenharmony_ci    ws->workspaceEnd = (BYTE*)start + size;
49962306a36Sopenharmony_ci    ws->objectEnd = ws->workspace;
50062306a36Sopenharmony_ci    ws->tableValidEnd = ws->objectEnd;
50162306a36Sopenharmony_ci    ws->phase = ZSTD_cwksp_alloc_objects;
50262306a36Sopenharmony_ci    ws->isStatic = isStatic;
50362306a36Sopenharmony_ci    ZSTD_cwksp_clear(ws);
50462306a36Sopenharmony_ci    ws->workspaceOversizedDuration = 0;
50562306a36Sopenharmony_ci    ZSTD_cwksp_assert_internal_consistency(ws);
50662306a36Sopenharmony_ci}
50762306a36Sopenharmony_ci
50862306a36Sopenharmony_ciMEM_STATIC size_t ZSTD_cwksp_create(ZSTD_cwksp* ws, size_t size, ZSTD_customMem customMem) {
50962306a36Sopenharmony_ci    void* workspace = ZSTD_customMalloc(size, customMem);
51062306a36Sopenharmony_ci    DEBUGLOG(4, "cwksp: creating new workspace with %zd bytes", size);
51162306a36Sopenharmony_ci    RETURN_ERROR_IF(workspace == NULL, memory_allocation, "NULL pointer!");
51262306a36Sopenharmony_ci    ZSTD_cwksp_init(ws, workspace, size, ZSTD_cwksp_dynamic_alloc);
51362306a36Sopenharmony_ci    return 0;
51462306a36Sopenharmony_ci}
51562306a36Sopenharmony_ci
51662306a36Sopenharmony_ciMEM_STATIC void ZSTD_cwksp_free(ZSTD_cwksp* ws, ZSTD_customMem customMem) {
51762306a36Sopenharmony_ci    void *ptr = ws->workspace;
51862306a36Sopenharmony_ci    DEBUGLOG(4, "cwksp: freeing workspace");
51962306a36Sopenharmony_ci    ZSTD_memset(ws, 0, sizeof(ZSTD_cwksp));
52062306a36Sopenharmony_ci    ZSTD_customFree(ptr, customMem);
52162306a36Sopenharmony_ci}
52262306a36Sopenharmony_ci
52362306a36Sopenharmony_ci/*
52462306a36Sopenharmony_ci * Moves the management of a workspace from one cwksp to another. The src cwksp
52562306a36Sopenharmony_ci * is left in an invalid state (src must be re-init()'ed before it's used again).
52662306a36Sopenharmony_ci */
52762306a36Sopenharmony_ciMEM_STATIC void ZSTD_cwksp_move(ZSTD_cwksp* dst, ZSTD_cwksp* src) {
52862306a36Sopenharmony_ci    *dst = *src;
52962306a36Sopenharmony_ci    ZSTD_memset(src, 0, sizeof(ZSTD_cwksp));
53062306a36Sopenharmony_ci}
53162306a36Sopenharmony_ci
53262306a36Sopenharmony_ciMEM_STATIC size_t ZSTD_cwksp_sizeof(const ZSTD_cwksp* ws) {
53362306a36Sopenharmony_ci    return (size_t)((BYTE*)ws->workspaceEnd - (BYTE*)ws->workspace);
53462306a36Sopenharmony_ci}
53562306a36Sopenharmony_ci
53662306a36Sopenharmony_ciMEM_STATIC size_t ZSTD_cwksp_used(const ZSTD_cwksp* ws) {
53762306a36Sopenharmony_ci    return (size_t)((BYTE*)ws->tableEnd - (BYTE*)ws->workspace)
53862306a36Sopenharmony_ci         + (size_t)((BYTE*)ws->workspaceEnd - (BYTE*)ws->allocStart);
53962306a36Sopenharmony_ci}
54062306a36Sopenharmony_ci
54162306a36Sopenharmony_ciMEM_STATIC int ZSTD_cwksp_reserve_failed(const ZSTD_cwksp* ws) {
54262306a36Sopenharmony_ci    return ws->allocFailed;
54362306a36Sopenharmony_ci}
54462306a36Sopenharmony_ci
54562306a36Sopenharmony_ci/*-*************************************
54662306a36Sopenharmony_ci*  Functions Checking Free Space
54762306a36Sopenharmony_ci***************************************/
54862306a36Sopenharmony_ci
54962306a36Sopenharmony_ci/* ZSTD_alignmentSpaceWithinBounds() :
55062306a36Sopenharmony_ci * Returns if the estimated space needed for a wksp is within an acceptable limit of the
55162306a36Sopenharmony_ci * actual amount of space used.
55262306a36Sopenharmony_ci */
55362306a36Sopenharmony_ciMEM_STATIC int ZSTD_cwksp_estimated_space_within_bounds(const ZSTD_cwksp* const ws,
55462306a36Sopenharmony_ci                                                        size_t const estimatedSpace, int resizedWorkspace) {
55562306a36Sopenharmony_ci    if (resizedWorkspace) {
55662306a36Sopenharmony_ci        /* Resized/newly allocated wksp should have exact bounds */
55762306a36Sopenharmony_ci        return ZSTD_cwksp_used(ws) == estimatedSpace;
55862306a36Sopenharmony_ci    } else {
55962306a36Sopenharmony_ci        /* Due to alignment, when reusing a workspace, we can actually consume 63 fewer or more bytes
56062306a36Sopenharmony_ci         * than estimatedSpace. See the comments in zstd_cwksp.h for details.
56162306a36Sopenharmony_ci         */
56262306a36Sopenharmony_ci        return (ZSTD_cwksp_used(ws) >= estimatedSpace - 63) && (ZSTD_cwksp_used(ws) <= estimatedSpace + 63);
56362306a36Sopenharmony_ci    }
56462306a36Sopenharmony_ci}
56562306a36Sopenharmony_ci
56662306a36Sopenharmony_ci
56762306a36Sopenharmony_ciMEM_STATIC size_t ZSTD_cwksp_available_space(ZSTD_cwksp* ws) {
56862306a36Sopenharmony_ci    return (size_t)((BYTE*)ws->allocStart - (BYTE*)ws->tableEnd);
56962306a36Sopenharmony_ci}
57062306a36Sopenharmony_ci
57162306a36Sopenharmony_ciMEM_STATIC int ZSTD_cwksp_check_available(ZSTD_cwksp* ws, size_t additionalNeededSpace) {
57262306a36Sopenharmony_ci    return ZSTD_cwksp_available_space(ws) >= additionalNeededSpace;
57362306a36Sopenharmony_ci}
57462306a36Sopenharmony_ci
57562306a36Sopenharmony_ciMEM_STATIC int ZSTD_cwksp_check_too_large(ZSTD_cwksp* ws, size_t additionalNeededSpace) {
57662306a36Sopenharmony_ci    return ZSTD_cwksp_check_available(
57762306a36Sopenharmony_ci        ws, additionalNeededSpace * ZSTD_WORKSPACETOOLARGE_FACTOR);
57862306a36Sopenharmony_ci}
57962306a36Sopenharmony_ci
58062306a36Sopenharmony_ciMEM_STATIC int ZSTD_cwksp_check_wasteful(ZSTD_cwksp* ws, size_t additionalNeededSpace) {
58162306a36Sopenharmony_ci    return ZSTD_cwksp_check_too_large(ws, additionalNeededSpace)
58262306a36Sopenharmony_ci        && ws->workspaceOversizedDuration > ZSTD_WORKSPACETOOLARGE_MAXDURATION;
58362306a36Sopenharmony_ci}
58462306a36Sopenharmony_ci
58562306a36Sopenharmony_ciMEM_STATIC void ZSTD_cwksp_bump_oversized_duration(
58662306a36Sopenharmony_ci        ZSTD_cwksp* ws, size_t additionalNeededSpace) {
58762306a36Sopenharmony_ci    if (ZSTD_cwksp_check_too_large(ws, additionalNeededSpace)) {
58862306a36Sopenharmony_ci        ws->workspaceOversizedDuration++;
58962306a36Sopenharmony_ci    } else {
59062306a36Sopenharmony_ci        ws->workspaceOversizedDuration = 0;
59162306a36Sopenharmony_ci    }
59262306a36Sopenharmony_ci}
59362306a36Sopenharmony_ci
59462306a36Sopenharmony_ci
59562306a36Sopenharmony_ci#endif /* ZSTD_CWKSP_H */
596