Add `ZSTD_cwksp_alloc_size()` to Help Calculate Needed Workspace Size
parent
da88c35d41
commit
19a0955ec9
|
@ -1078,9 +1078,16 @@ ZSTD_sizeof_matchState(const ZSTD_compressionParameters* const cParams,
|
||||||
size_t const hSize = ((size_t)1) << cParams->hashLog;
|
size_t const hSize = ((size_t)1) << cParams->hashLog;
|
||||||
U32 const hashLog3 = (forCCtx && cParams->minMatch==3) ? MIN(ZSTD_HASHLOG3_MAX, cParams->windowLog) : 0;
|
U32 const hashLog3 = (forCCtx && cParams->minMatch==3) ? MIN(ZSTD_HASHLOG3_MAX, cParams->windowLog) : 0;
|
||||||
size_t const h3Size = ((size_t)1) << hashLog3;
|
size_t const h3Size = ((size_t)1) << hashLog3;
|
||||||
size_t const tableSpace = (chainSize + hSize + h3Size) * sizeof(U32);
|
size_t const tableSpace = ZSTD_cwksp_alloc_size(chainSize * sizeof(U32))
|
||||||
size_t const optPotentialSpace = ((MaxML+1) + (MaxLL+1) + (MaxOff+1) + (1<<Litbits)) * sizeof(U32)
|
+ ZSTD_cwksp_alloc_size(hSize * sizeof(U32))
|
||||||
+ (ZSTD_OPT_NUM+1) * (sizeof(ZSTD_match_t)+sizeof(ZSTD_optimal_t));
|
+ ZSTD_cwksp_alloc_size(h3Size * sizeof(U32));
|
||||||
|
size_t const optPotentialSpace =
|
||||||
|
ZSTD_cwksp_alloc_size((MaxML+1) * sizeof(U32))
|
||||||
|
+ ZSTD_cwksp_alloc_size((MaxLL+1) * sizeof(U32))
|
||||||
|
+ ZSTD_cwksp_alloc_size((MaxOff+1) * sizeof(U32))
|
||||||
|
+ ZSTD_cwksp_alloc_size((1<<Litbits) * sizeof(U32))
|
||||||
|
+ ZSTD_cwksp_alloc_size((ZSTD_OPT_NUM+1) * sizeof(ZSTD_match_t))
|
||||||
|
+ ZSTD_cwksp_alloc_size((ZSTD_OPT_NUM+1) * sizeof(ZSTD_optimal_t));
|
||||||
size_t const optSpace = (forCCtx && (cParams->strategy >= ZSTD_btopt))
|
size_t const optSpace = (forCCtx && (cParams->strategy >= ZSTD_btopt))
|
||||||
? optPotentialSpace
|
? optPotentialSpace
|
||||||
: 0;
|
: 0;
|
||||||
|
@ -1097,20 +1104,21 @@ size_t ZSTD_estimateCCtxSize_usingCCtxParams(const ZSTD_CCtx_params* params)
|
||||||
size_t const blockSize = MIN(ZSTD_BLOCKSIZE_MAX, (size_t)1 << cParams.windowLog);
|
size_t const blockSize = MIN(ZSTD_BLOCKSIZE_MAX, (size_t)1 << cParams.windowLog);
|
||||||
U32 const divider = (cParams.minMatch==3) ? 3 : 4;
|
U32 const divider = (cParams.minMatch==3) ? 3 : 4;
|
||||||
size_t const maxNbSeq = blockSize / divider;
|
size_t const maxNbSeq = blockSize / divider;
|
||||||
size_t const tokenSpace = WILDCOPY_OVERLENGTH + blockSize + 11*maxNbSeq;
|
size_t const tokenSpace = ZSTD_cwksp_alloc_size(WILDCOPY_OVERLENGTH + blockSize + 11*maxNbSeq);
|
||||||
size_t const entropySpace = HUF_WORKSPACE_SIZE;
|
size_t const entropySpace = ZSTD_cwksp_alloc_size(HUF_WORKSPACE_SIZE);
|
||||||
size_t const blockStateSpace = 2 * sizeof(ZSTD_compressedBlockState_t);
|
size_t const blockStateSpace = 2 * ZSTD_cwksp_alloc_size(sizeof(ZSTD_compressedBlockState_t));
|
||||||
size_t const matchStateSize = ZSTD_sizeof_matchState(&cParams, /* forCCtx */ 1);
|
size_t const matchStateSize = ZSTD_sizeof_matchState(&cParams, /* forCCtx */ 1);
|
||||||
|
|
||||||
size_t const ldmSpace = ZSTD_ldm_getTableSize(params->ldmParams);
|
size_t const ldmSpace = ZSTD_ldm_getTableSize(params->ldmParams);
|
||||||
size_t const ldmSeqSpace = ZSTD_ldm_getMaxNbSeq(params->ldmParams, blockSize) * sizeof(rawSeq);
|
size_t const ldmSeqSpace = ZSTD_cwksp_alloc_size(ZSTD_ldm_getMaxNbSeq(params->ldmParams, blockSize) * sizeof(rawSeq));
|
||||||
|
|
||||||
size_t const neededSpace = entropySpace + blockStateSpace + tokenSpace +
|
size_t const neededSpace = entropySpace + blockStateSpace + tokenSpace +
|
||||||
matchStateSize + ldmSpace + ldmSeqSpace;
|
matchStateSize + ldmSpace + ldmSeqSpace;
|
||||||
|
size_t const cctxSpace = ZSTD_cwksp_alloc_size(sizeof(ZSTD_CCtx));
|
||||||
|
|
||||||
DEBUGLOG(5, "sizeof(ZSTD_CCtx) : %u", (U32)sizeof(ZSTD_CCtx));
|
DEBUGLOG(5, "sizeof(ZSTD_CCtx) : %u", (U32)cctxSpace);
|
||||||
DEBUGLOG(5, "estimate workspace : %u", (U32)neededSpace);
|
DEBUGLOG(5, "estimate workspace : %u", (U32)neededSpace);
|
||||||
return sizeof(ZSTD_CCtx) + neededSpace;
|
return cctxSpace + neededSpace;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -1393,7 +1401,7 @@ static size_t ZSTD_resetCCtx_internal(ZSTD_CCtx* zc,
|
||||||
size_t const blockSize = MIN(ZSTD_BLOCKSIZE_MAX, windowSize);
|
size_t const blockSize = MIN(ZSTD_BLOCKSIZE_MAX, windowSize);
|
||||||
U32 const divider = (params.cParams.minMatch==3) ? 3 : 4;
|
U32 const divider = (params.cParams.minMatch==3) ? 3 : 4;
|
||||||
size_t const maxNbSeq = blockSize / divider;
|
size_t const maxNbSeq = blockSize / divider;
|
||||||
size_t const tokenSpace = WILDCOPY_OVERLENGTH + blockSize + 11*maxNbSeq;
|
size_t const tokenSpace = ZSTD_cwksp_alloc_size(WILDCOPY_OVERLENGTH + blockSize + 11*maxNbSeq);
|
||||||
size_t const buffOutSize = (zbuff==ZSTDb_buffered) ? ZSTD_compressBound(blockSize)+1 : 0;
|
size_t const buffOutSize = (zbuff==ZSTDb_buffered) ? ZSTD_compressBound(blockSize)+1 : 0;
|
||||||
size_t const buffInSize = (zbuff==ZSTDb_buffered) ? windowSize + blockSize : 0;
|
size_t const buffInSize = (zbuff==ZSTDb_buffered) ? windowSize + blockSize : 0;
|
||||||
size_t const matchStateSize = ZSTD_sizeof_matchState(¶ms.cParams, /* forCCtx */ 1);
|
size_t const matchStateSize = ZSTD_sizeof_matchState(¶ms.cParams, /* forCCtx */ 1);
|
||||||
|
@ -1408,12 +1416,12 @@ static size_t ZSTD_resetCCtx_internal(ZSTD_CCtx* zc,
|
||||||
ZSTD_cwksp_bump_oversized_duration(ws, 0);
|
ZSTD_cwksp_bump_oversized_duration(ws, 0);
|
||||||
|
|
||||||
/* Check if workspace is large enough, alloc a new one if needed */
|
/* Check if workspace is large enough, alloc a new one if needed */
|
||||||
{ size_t const cctxSpace = zc->staticSize ? sizeof(ZSTD_CCtx) : 0;
|
{ size_t const cctxSpace = zc->staticSize ? ZSTD_cwksp_alloc_size(sizeof(ZSTD_CCtx)) : 0;
|
||||||
size_t const entropySpace = HUF_WORKSPACE_SIZE;
|
size_t const entropySpace = ZSTD_cwksp_alloc_size(HUF_WORKSPACE_SIZE);
|
||||||
size_t const blockStateSpace = 2 * sizeof(ZSTD_compressedBlockState_t);
|
size_t const blockStateSpace = 2 * ZSTD_cwksp_alloc_size(sizeof(ZSTD_compressedBlockState_t));
|
||||||
size_t const bufferSpace = buffInSize + buffOutSize;
|
size_t const bufferSpace = ZSTD_cwksp_alloc_size(buffInSize) + ZSTD_cwksp_alloc_size(buffOutSize);
|
||||||
size_t const ldmSpace = ZSTD_ldm_getTableSize(params.ldmParams);
|
size_t const ldmSpace = ZSTD_ldm_getTableSize(params.ldmParams);
|
||||||
size_t const ldmSeqSpace = maxNbLdmSeq * sizeof(rawSeq);
|
size_t const ldmSeqSpace = ZSTD_cwksp_alloc_size(maxNbLdmSeq * sizeof(rawSeq));
|
||||||
|
|
||||||
size_t const neededSpace =
|
size_t const neededSpace =
|
||||||
cctxSpace +
|
cctxSpace +
|
||||||
|
@ -3060,8 +3068,11 @@ size_t ZSTD_estimateCDictSize_advanced(
|
||||||
ZSTD_dictLoadMethod_e dictLoadMethod)
|
ZSTD_dictLoadMethod_e dictLoadMethod)
|
||||||
{
|
{
|
||||||
DEBUGLOG(5, "sizeof(ZSTD_CDict) : %u", (unsigned)sizeof(ZSTD_CDict));
|
DEBUGLOG(5, "sizeof(ZSTD_CDict) : %u", (unsigned)sizeof(ZSTD_CDict));
|
||||||
return sizeof(ZSTD_CDict) + HUF_WORKSPACE_SIZE + ZSTD_sizeof_matchState(&cParams, /* forCCtx */ 0)
|
return ZSTD_cwksp_alloc_size(sizeof(ZSTD_CDict))
|
||||||
+ (dictLoadMethod == ZSTD_dlm_byRef ? 0 : ZSTD_cwksp_align(dictSize, sizeof(void *)));
|
+ ZSTD_cwksp_alloc_size(HUF_WORKSPACE_SIZE)
|
||||||
|
+ ZSTD_sizeof_matchState(&cParams, /* forCCtx */ 0)
|
||||||
|
+ (dictLoadMethod == ZSTD_dlm_byRef ? 0
|
||||||
|
: ZSTD_cwksp_alloc_size(ZSTD_cwksp_align(dictSize, sizeof(void *))));
|
||||||
}
|
}
|
||||||
|
|
||||||
size_t ZSTD_estimateCDictSize(size_t dictSize, int compressionLevel)
|
size_t ZSTD_estimateCDictSize(size_t dictSize, int compressionLevel)
|
||||||
|
@ -3141,11 +3152,11 @@ ZSTD_CDict* ZSTD_createCDict_advanced(const void* dictBuffer, size_t dictSize,
|
||||||
if (!customMem.customAlloc ^ !customMem.customFree) return NULL;
|
if (!customMem.customAlloc ^ !customMem.customFree) return NULL;
|
||||||
|
|
||||||
{ size_t const workspaceSize =
|
{ size_t const workspaceSize =
|
||||||
sizeof(ZSTD_CDict) +
|
ZSTD_cwksp_alloc_size(sizeof(ZSTD_CDict)) +
|
||||||
HUF_WORKSPACE_SIZE +
|
ZSTD_cwksp_alloc_size(HUF_WORKSPACE_SIZE) +
|
||||||
ZSTD_sizeof_matchState(&cParams, /* forCCtx */ 0) +
|
ZSTD_sizeof_matchState(&cParams, /* forCCtx */ 0) +
|
||||||
(dictLoadMethod == ZSTD_dlm_byRef ? 0
|
(dictLoadMethod == ZSTD_dlm_byRef ? 0
|
||||||
: ZSTD_cwksp_align(dictSize, sizeof(void*)));
|
: ZSTD_cwksp_alloc_size(ZSTD_cwksp_align(dictSize, sizeof(void*))));
|
||||||
void* const workspace = ZSTD_malloc(workspaceSize, customMem);
|
void* const workspace = ZSTD_malloc(workspaceSize, customMem);
|
||||||
ZSTD_cwksp ws;
|
ZSTD_cwksp ws;
|
||||||
ZSTD_CDict* cdict;
|
ZSTD_CDict* cdict;
|
||||||
|
@ -3224,8 +3235,11 @@ const ZSTD_CDict* ZSTD_initStaticCDict(
|
||||||
ZSTD_compressionParameters cParams)
|
ZSTD_compressionParameters cParams)
|
||||||
{
|
{
|
||||||
size_t const matchStateSize = ZSTD_sizeof_matchState(&cParams, /* forCCtx */ 0);
|
size_t const matchStateSize = ZSTD_sizeof_matchState(&cParams, /* forCCtx */ 0);
|
||||||
size_t const neededSize = sizeof(ZSTD_CDict) + (dictLoadMethod == ZSTD_dlm_byRef ? 0 : ZSTD_cwksp_align(dictSize, sizeof(void*)))
|
size_t const neededSize = ZSTD_cwksp_alloc_size(sizeof(ZSTD_CDict))
|
||||||
+ HUF_WORKSPACE_SIZE + matchStateSize;
|
+ (dictLoadMethod == ZSTD_dlm_byRef ? 0
|
||||||
|
: ZSTD_cwksp_alloc_size(ZSTD_cwksp_align(dictSize, sizeof(void*))))
|
||||||
|
+ ZSTD_cwksp_alloc_size(HUF_WORKSPACE_SIZE)
|
||||||
|
+ matchStateSize;
|
||||||
ZSTD_CDict* cdict;
|
ZSTD_CDict* cdict;
|
||||||
|
|
||||||
if ((size_t)workspace & 7) return NULL; /* 8-aligned */
|
if ((size_t)workspace & 7) return NULL; /* 8-aligned */
|
||||||
|
|
|
@ -34,6 +34,17 @@ extern "C" {
|
||||||
* In which case, resize it down to free some memory */
|
* In which case, resize it down to free some memory */
|
||||||
#define ZSTD_WORKSPACETOOLARGE_MAXDURATION 128
|
#define ZSTD_WORKSPACETOOLARGE_MAXDURATION 128
|
||||||
|
|
||||||
|
/* Since the workspace is effectively its own little malloc implementation /
|
||||||
|
* arena, when we run under ASAN, we should similarly insert redzones between
|
||||||
|
* each internal element of the workspace, so ASAN will catch overruns that
|
||||||
|
* reach outside an object but that stay inside the workspace.
|
||||||
|
*
|
||||||
|
* This defines the size of that redzone.
|
||||||
|
*/
|
||||||
|
#ifndef ZSTD_CWKSP_ASAN_REDZONE_SIZE
|
||||||
|
#define ZSTD_CWKSP_ASAN_REDZONE_SIZE 8
|
||||||
|
#endif
|
||||||
|
|
||||||
/*-*************************************
|
/*-*************************************
|
||||||
* Structures
|
* Structures
|
||||||
***************************************/
|
***************************************/
|
||||||
|
@ -166,6 +177,20 @@ MEM_STATIC size_t ZSTD_cwksp_align(size_t size, size_t const align) {
|
||||||
return (size + mask) & ~mask;
|
return (size + mask) & ~mask;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Use this to determine how much space in the workspace we will consume to
|
||||||
|
* allocate this object. (Normally it should be exactly the size of the object,
|
||||||
|
* but under special conditions, like ASAN, where we pad each object, it might
|
||||||
|
* be larger.)
|
||||||
|
*/
|
||||||
|
MEM_STATIC size_t ZSTD_cwksp_alloc_size(size_t size) {
|
||||||
|
#if defined (ADDRESS_SANITIZER) && !defined (ZSTD_ASAN_DONT_POISON_WORKSPACE)
|
||||||
|
return size + 2 * ZSTD_CWKSP_ASAN_REDZONE_SIZE;
|
||||||
|
#else
|
||||||
|
return size;
|
||||||
|
#endif
|
||||||
|
}
|
||||||
|
|
||||||
MEM_STATIC void ZSTD_cwksp_internal_advance_phase(
|
MEM_STATIC void ZSTD_cwksp_internal_advance_phase(
|
||||||
ZSTD_cwksp* ws, ZSTD_cwksp_alloc_phase_e phase) {
|
ZSTD_cwksp* ws, ZSTD_cwksp_alloc_phase_e phase) {
|
||||||
assert(phase >= ws->phase);
|
assert(phase >= ws->phase);
|
||||||
|
|
|
@ -49,9 +49,9 @@ size_t ZSTD_ldm_getTableSize(ldmParams_t params)
|
||||||
{
|
{
|
||||||
size_t const ldmHSize = ((size_t)1) << params.hashLog;
|
size_t const ldmHSize = ((size_t)1) << params.hashLog;
|
||||||
size_t const ldmBucketSizeLog = MIN(params.bucketSizeLog, params.hashLog);
|
size_t const ldmBucketSizeLog = MIN(params.bucketSizeLog, params.hashLog);
|
||||||
size_t const ldmBucketSize =
|
size_t const ldmBucketSize = ((size_t)1) << (params.hashLog - ldmBucketSizeLog);
|
||||||
((size_t)1) << (params.hashLog - ldmBucketSizeLog);
|
size_t const totalSize = ZSTD_cwksp_alloc_size(ldmBucketSize)
|
||||||
size_t const totalSize = ldmBucketSize + ldmHSize * sizeof(ldmEntry_t);
|
+ ZSTD_cwksp_alloc_size(ldmHSize * sizeof(ldmEntry_t));
|
||||||
return params.enableLdm ? totalSize : 0;
|
return params.enableLdm ? totalSize : 0;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
Loading…
Reference in New Issue