1*a28cd43dSSascha Wildner /*
2*a28cd43dSSascha Wildner * Copyright (c) 2016-2020, Yann Collet, Facebook, Inc.
3*a28cd43dSSascha Wildner * All rights reserved.
4*a28cd43dSSascha Wildner *
5*a28cd43dSSascha Wildner * This source code is licensed under both the BSD-style license (found in the
6*a28cd43dSSascha Wildner * LICENSE file in the root directory of this source tree) and the GPLv2 (found
7*a28cd43dSSascha Wildner * in the COPYING file in the root directory of this source tree).
8*a28cd43dSSascha Wildner * You may select, at your option, one of the above-listed licenses.
9*a28cd43dSSascha Wildner */
10*a28cd43dSSascha Wildner
11*a28cd43dSSascha Wildner /*-*************************************
12*a28cd43dSSascha Wildner * Dependencies
13*a28cd43dSSascha Wildner ***************************************/
14*a28cd43dSSascha Wildner #include "../common/zstd_deps.h" /* INT_MAX, ZSTD_memset, ZSTD_memcpy */
15*a28cd43dSSascha Wildner #include "../common/cpu.h"
16*a28cd43dSSascha Wildner #include "../common/mem.h"
17*a28cd43dSSascha Wildner #include "hist.h" /* HIST_countFast_wksp */
18*a28cd43dSSascha Wildner #define FSE_STATIC_LINKING_ONLY /* FSE_encodeSymbol */
19*a28cd43dSSascha Wildner #include "../common/fse.h"
20*a28cd43dSSascha Wildner #define HUF_STATIC_LINKING_ONLY
21*a28cd43dSSascha Wildner #include "../common/huf.h"
22*a28cd43dSSascha Wildner #include "zstd_compress_internal.h"
23*a28cd43dSSascha Wildner #include "zstd_compress_sequences.h"
24*a28cd43dSSascha Wildner #include "zstd_compress_literals.h"
25*a28cd43dSSascha Wildner #include "zstd_fast.h"
26*a28cd43dSSascha Wildner #include "zstd_double_fast.h"
27*a28cd43dSSascha Wildner #include "zstd_lazy.h"
28*a28cd43dSSascha Wildner #include "zstd_opt.h"
29*a28cd43dSSascha Wildner #include "zstd_ldm.h"
30*a28cd43dSSascha Wildner #include "zstd_compress_superblock.h"
31*a28cd43dSSascha Wildner
32*a28cd43dSSascha Wildner /* ***************************************************************
33*a28cd43dSSascha Wildner * Tuning parameters
34*a28cd43dSSascha Wildner *****************************************************************/
/*!
 * COMPRESS_HEAPMODE :
 * Select how default compression function ZSTD_compress() allocates its context,
 * on stack (0, default), or into heap (1).
 * Note that functions with explicit context such as ZSTD_compressCCtx() are unaffected.
 */
41*a28cd43dSSascha Wildner #ifndef ZSTD_COMPRESS_HEAPMODE
42*a28cd43dSSascha Wildner # define ZSTD_COMPRESS_HEAPMODE 0
43*a28cd43dSSascha Wildner #endif
44*a28cd43dSSascha Wildner
45*a28cd43dSSascha Wildner
46*a28cd43dSSascha Wildner /*-*************************************
47*a28cd43dSSascha Wildner * Helper functions
48*a28cd43dSSascha Wildner ***************************************/
/* ZSTD_compressBound() :
 * Function form of the ZSTD_COMPRESSBOUND() macro.
 * The returned value is only meaningful for the "normal" full-block strategy.
 * In streaming mode, frequent flushes create many small blocks, and the
 * accumulated header overhead can make the compressed data larger than
 * the value returned here.
 */
size_t ZSTD_compressBound(size_t srcSize)
{
    size_t const bound = ZSTD_COMPRESSBOUND(srcSize);
    return bound;
}
59*a28cd43dSSascha Wildner
60*a28cd43dSSascha Wildner
61*a28cd43dSSascha Wildner /*-*************************************
62*a28cd43dSSascha Wildner * Context memory management
63*a28cd43dSSascha Wildner ***************************************/
64*a28cd43dSSascha Wildner struct ZSTD_CDict_s {
65*a28cd43dSSascha Wildner const void* dictContent;
66*a28cd43dSSascha Wildner size_t dictContentSize;
67*a28cd43dSSascha Wildner ZSTD_dictContentType_e dictContentType; /* The dictContentType the CDict was created with */
68*a28cd43dSSascha Wildner U32* entropyWorkspace; /* entropy workspace of HUF_WORKSPACE_SIZE bytes */
69*a28cd43dSSascha Wildner ZSTD_cwksp workspace;
70*a28cd43dSSascha Wildner ZSTD_matchState_t matchState;
71*a28cd43dSSascha Wildner ZSTD_compressedBlockState_t cBlockState;
72*a28cd43dSSascha Wildner ZSTD_customMem customMem;
73*a28cd43dSSascha Wildner U32 dictID;
74*a28cd43dSSascha Wildner int compressionLevel; /* 0 indicates that advanced API was used to select CDict params */
75*a28cd43dSSascha Wildner }; /* typedef'd to ZSTD_CDict within "zstd.h" */
76*a28cd43dSSascha Wildner
ZSTD_createCCtx(void)77*a28cd43dSSascha Wildner ZSTD_CCtx* ZSTD_createCCtx(void)
78*a28cd43dSSascha Wildner {
79*a28cd43dSSascha Wildner return ZSTD_createCCtx_advanced(ZSTD_defaultCMem);
80*a28cd43dSSascha Wildner }
81*a28cd43dSSascha Wildner
/* ZSTD_initCCtx() :
 * Zeroes the whole context, records the allocator, caches the BMI2 cpuid
 * result, then resets parameters through ZSTD_CCtx_reset().
 * @cctx must not be NULL (asserted).
 */
static void ZSTD_initCCtx(ZSTD_CCtx* cctx, ZSTD_customMem memManager)
{
    size_t resetResult;

    assert(cctx != NULL);
    ZSTD_memset(cctx, 0, sizeof(*cctx));
    cctx->customMem = memManager;
    cctx->bmi2 = ZSTD_cpuid_bmi2(ZSTD_cpuid());

    /* the reset is expected to succeed; this is only checked in assert-enabled builds */
    resetResult = ZSTD_CCtx_reset(cctx, ZSTD_reset_parameters);
    assert(!ZSTD_isError(resetResult));
    (void)resetResult;   /* silences "unused" warnings when asserts are compiled out */
}
93*a28cd43dSSascha Wildner
ZSTD_createCCtx_advanced(ZSTD_customMem customMem)94*a28cd43dSSascha Wildner ZSTD_CCtx* ZSTD_createCCtx_advanced(ZSTD_customMem customMem)
95*a28cd43dSSascha Wildner {
96*a28cd43dSSascha Wildner ZSTD_STATIC_ASSERT(zcss_init==0);
97*a28cd43dSSascha Wildner ZSTD_STATIC_ASSERT(ZSTD_CONTENTSIZE_UNKNOWN==(0ULL - 1));
98*a28cd43dSSascha Wildner if ((!customMem.customAlloc) ^ (!customMem.customFree)) return NULL;
99*a28cd43dSSascha Wildner { ZSTD_CCtx* const cctx = (ZSTD_CCtx*)ZSTD_customMalloc(sizeof(ZSTD_CCtx), customMem);
100*a28cd43dSSascha Wildner if (!cctx) return NULL;
101*a28cd43dSSascha Wildner ZSTD_initCCtx(cctx, customMem);
102*a28cd43dSSascha Wildner return cctx;
103*a28cd43dSSascha Wildner }
104*a28cd43dSSascha Wildner }
105*a28cd43dSSascha Wildner
ZSTD_initStaticCCtx(void * workspace,size_t workspaceSize)106*a28cd43dSSascha Wildner ZSTD_CCtx* ZSTD_initStaticCCtx(void* workspace, size_t workspaceSize)
107*a28cd43dSSascha Wildner {
108*a28cd43dSSascha Wildner ZSTD_cwksp ws;
109*a28cd43dSSascha Wildner ZSTD_CCtx* cctx;
110*a28cd43dSSascha Wildner if (workspaceSize <= sizeof(ZSTD_CCtx)) return NULL; /* minimum size */
111*a28cd43dSSascha Wildner if ((size_t)workspace & 7) return NULL; /* must be 8-aligned */
112*a28cd43dSSascha Wildner ZSTD_cwksp_init(&ws, workspace, workspaceSize, ZSTD_cwksp_static_alloc);
113*a28cd43dSSascha Wildner
114*a28cd43dSSascha Wildner cctx = (ZSTD_CCtx*)ZSTD_cwksp_reserve_object(&ws, sizeof(ZSTD_CCtx));
115*a28cd43dSSascha Wildner if (cctx == NULL) return NULL;
116*a28cd43dSSascha Wildner
117*a28cd43dSSascha Wildner ZSTD_memset(cctx, 0, sizeof(ZSTD_CCtx));
118*a28cd43dSSascha Wildner ZSTD_cwksp_move(&cctx->workspace, &ws);
119*a28cd43dSSascha Wildner cctx->staticSize = workspaceSize;
120*a28cd43dSSascha Wildner
121*a28cd43dSSascha Wildner /* statically sized space. entropyWorkspace never moves (but prev/next block swap places) */
122*a28cd43dSSascha Wildner if (!ZSTD_cwksp_check_available(&cctx->workspace, ENTROPY_WORKSPACE_SIZE + 2 * sizeof(ZSTD_compressedBlockState_t))) return NULL;
123*a28cd43dSSascha Wildner cctx->blockState.prevCBlock = (ZSTD_compressedBlockState_t*)ZSTD_cwksp_reserve_object(&cctx->workspace, sizeof(ZSTD_compressedBlockState_t));
124*a28cd43dSSascha Wildner cctx->blockState.nextCBlock = (ZSTD_compressedBlockState_t*)ZSTD_cwksp_reserve_object(&cctx->workspace, sizeof(ZSTD_compressedBlockState_t));
125*a28cd43dSSascha Wildner cctx->entropyWorkspace = (U32*)ZSTD_cwksp_reserve_object(&cctx->workspace, ENTROPY_WORKSPACE_SIZE);
126*a28cd43dSSascha Wildner cctx->bmi2 = ZSTD_cpuid_bmi2(ZSTD_cpuid());
127*a28cd43dSSascha Wildner return cctx;
128*a28cd43dSSascha Wildner }
129*a28cd43dSSascha Wildner
130*a28cd43dSSascha Wildner /**
131*a28cd43dSSascha Wildner * Clears and frees all of the dictionaries in the CCtx.
132*a28cd43dSSascha Wildner */
ZSTD_clearAllDicts(ZSTD_CCtx * cctx)133*a28cd43dSSascha Wildner static void ZSTD_clearAllDicts(ZSTD_CCtx* cctx)
134*a28cd43dSSascha Wildner {
135*a28cd43dSSascha Wildner ZSTD_customFree(cctx->localDict.dictBuffer, cctx->customMem);
136*a28cd43dSSascha Wildner ZSTD_freeCDict(cctx->localDict.cdict);
137*a28cd43dSSascha Wildner ZSTD_memset(&cctx->localDict, 0, sizeof(cctx->localDict));
138*a28cd43dSSascha Wildner ZSTD_memset(&cctx->prefixDict, 0, sizeof(cctx->prefixDict));
139*a28cd43dSSascha Wildner cctx->cdict = NULL;
140*a28cd43dSSascha Wildner }
141*a28cd43dSSascha Wildner
/* ZSTD_sizeof_localDict() :
 * @return : size of the local CDict, plus dictSize when a dictBuffer is present.
 */
static size_t ZSTD_sizeof_localDict(ZSTD_localDict dict)
{
    size_t total = ZSTD_sizeof_CDict(dict.cdict);
    if (dict.dictBuffer != NULL) {
        total += dict.dictSize;
    }
    return total;
}
148*a28cd43dSSascha Wildner
/* ZSTD_freeCCtxContent() :
 * Releases everything held by the context : dictionaries, the multithreading
 * context (when built with ZSTD_MULTITHREAD) and the workspace.
 * Does not free the ZSTD_CCtx object itself.
 * @cctx must be non-NULL and must not be a static context (both asserted).
 */
static void ZSTD_freeCCtxContent(ZSTD_CCtx* cctx)
{
    assert(cctx != NULL);
    assert(cctx->staticSize == 0);

    ZSTD_clearAllDicts(cctx);
#ifdef ZSTD_MULTITHREAD
    ZSTDMT_freeCCtx(cctx->mtctx);
    cctx->mtctx = NULL;
#endif
    ZSTD_cwksp_free(&cctx->workspace, cctx->customMem);
}
159*a28cd43dSSascha Wildner
/* ZSTD_freeCCtx() :
 * Frees a context and its content. Accepts NULL.
 * @return : 0 on success, or a memory_allocation error when @cctx is a
 *           static context.
 */
size_t ZSTD_freeCCtx(ZSTD_CCtx* cctx)
{
    int livesInWorkspace;

    if (cctx == NULL) return 0;   /* support free on NULL */
    RETURN_ERROR_IF(cctx->staticSize, memory_allocation,
                    "not compatible with static CCtx");

    /* Ownership is queried before the workspace is released. */
    livesInWorkspace = ZSTD_cwksp_owns_buffer(&cctx->workspace, cctx);
    ZSTD_freeCCtxContent(cctx);
    if (livesInWorkspace) return 0;   /* the context is not freed separately in this case */

    ZSTD_customFree(cctx, cctx->customMem);
    return 0;
}
174*a28cd43dSSascha Wildner
175*a28cd43dSSascha Wildner
/* ZSTD_sizeof_mtctx() :
 * @return : size of the multithreading context when built with
 *           ZSTD_MULTITHREAD, 0 otherwise.
 */
static size_t ZSTD_sizeof_mtctx(const ZSTD_CCtx* cctx)
{
    size_t mtSize = 0;
#ifdef ZSTD_MULTITHREAD
    mtSize = ZSTDMT_sizeof_CCtx(cctx->mtctx);
#else
    (void)cctx;
#endif
    return mtSize;
}
185*a28cd43dSSascha Wildner
186*a28cd43dSSascha Wildner
ZSTD_sizeof_CCtx(const ZSTD_CCtx * cctx)187*a28cd43dSSascha Wildner size_t ZSTD_sizeof_CCtx(const ZSTD_CCtx* cctx)
188*a28cd43dSSascha Wildner {
189*a28cd43dSSascha Wildner if (cctx==NULL) return 0; /* support sizeof on NULL */
190*a28cd43dSSascha Wildner /* cctx may be in the workspace */
191*a28cd43dSSascha Wildner return (cctx->workspace.workspace == cctx ? 0 : sizeof(*cctx))
192*a28cd43dSSascha Wildner + ZSTD_cwksp_sizeof(&cctx->workspace)
193*a28cd43dSSascha Wildner + ZSTD_sizeof_localDict(cctx->localDict)
194*a28cd43dSSascha Wildner + ZSTD_sizeof_mtctx(cctx);
195*a28cd43dSSascha Wildner }
196*a28cd43dSSascha Wildner
/* ZSTD_sizeof_CStream() :
 * The stream argument is passed straight to ZSTD_sizeof_CCtx().
 */
size_t ZSTD_sizeof_CStream(const ZSTD_CStream* zcs)
{
    size_t const streamSize = ZSTD_sizeof_CCtx(zcs);   /* same object */
    return streamSize;
}
201*a28cd43dSSascha Wildner
202*a28cd43dSSascha Wildner /* private API call, for dictBuilder only */
ZSTD_getSeqStore(const ZSTD_CCtx * ctx)203*a28cd43dSSascha Wildner const seqStore_t* ZSTD_getSeqStore(const ZSTD_CCtx* ctx) { return &(ctx->seqStore); }
204*a28cd43dSSascha Wildner
205*a28cd43dSSascha Wildner /* Returns 1 if compression parameters are such that we should
206*a28cd43dSSascha Wildner * enable long distance matching (wlog >= 27, strategy >= btopt).
207*a28cd43dSSascha Wildner * Returns 0 otherwise.
208*a28cd43dSSascha Wildner */
ZSTD_CParams_shouldEnableLdm(const ZSTD_compressionParameters * const cParams)209*a28cd43dSSascha Wildner static U32 ZSTD_CParams_shouldEnableLdm(const ZSTD_compressionParameters* const cParams) {
210*a28cd43dSSascha Wildner return cParams->strategy >= ZSTD_btopt && cParams->windowLog >= 27;
211*a28cd43dSSascha Wildner }
212*a28cd43dSSascha Wildner
ZSTD_makeCCtxParamsFromCParams(ZSTD_compressionParameters cParams)213*a28cd43dSSascha Wildner static ZSTD_CCtx_params ZSTD_makeCCtxParamsFromCParams(
214*a28cd43dSSascha Wildner ZSTD_compressionParameters cParams)
215*a28cd43dSSascha Wildner {
216*a28cd43dSSascha Wildner ZSTD_CCtx_params cctxParams;
217*a28cd43dSSascha Wildner /* should not matter, as all cParams are presumed properly defined */
218*a28cd43dSSascha Wildner ZSTD_CCtxParams_init(&cctxParams, ZSTD_CLEVEL_DEFAULT);
219*a28cd43dSSascha Wildner cctxParams.cParams = cParams;
220*a28cd43dSSascha Wildner
221*a28cd43dSSascha Wildner if (ZSTD_CParams_shouldEnableLdm(&cParams)) {
222*a28cd43dSSascha Wildner DEBUGLOG(4, "ZSTD_makeCCtxParamsFromCParams(): Including LDM into cctx params");
223*a28cd43dSSascha Wildner cctxParams.ldmParams.enableLdm = 1;
224*a28cd43dSSascha Wildner /* LDM is enabled by default for optimal parser and window size >= 128MB */
225*a28cd43dSSascha Wildner ZSTD_ldm_adjustParameters(&cctxParams.ldmParams, &cParams);
226*a28cd43dSSascha Wildner assert(cctxParams.ldmParams.hashLog >= cctxParams.ldmParams.bucketSizeLog);
227*a28cd43dSSascha Wildner assert(cctxParams.ldmParams.hashRateLog < 32);
228*a28cd43dSSascha Wildner }
229*a28cd43dSSascha Wildner
230*a28cd43dSSascha Wildner assert(!ZSTD_checkCParams(cParams));
231*a28cd43dSSascha Wildner return cctxParams;
232*a28cd43dSSascha Wildner }
233*a28cd43dSSascha Wildner
ZSTD_createCCtxParams_advanced(ZSTD_customMem customMem)234*a28cd43dSSascha Wildner static ZSTD_CCtx_params* ZSTD_createCCtxParams_advanced(
235*a28cd43dSSascha Wildner ZSTD_customMem customMem)
236*a28cd43dSSascha Wildner {
237*a28cd43dSSascha Wildner ZSTD_CCtx_params* params;
238*a28cd43dSSascha Wildner if ((!customMem.customAlloc) ^ (!customMem.customFree)) return NULL;
239*a28cd43dSSascha Wildner params = (ZSTD_CCtx_params*)ZSTD_customCalloc(
240*a28cd43dSSascha Wildner sizeof(ZSTD_CCtx_params), customMem);
241*a28cd43dSSascha Wildner if (!params) { return NULL; }
242*a28cd43dSSascha Wildner ZSTD_CCtxParams_init(params, ZSTD_CLEVEL_DEFAULT);
243*a28cd43dSSascha Wildner params->customMem = customMem;
244*a28cd43dSSascha Wildner return params;
245*a28cd43dSSascha Wildner }
246*a28cd43dSSascha Wildner
ZSTD_createCCtxParams(void)247*a28cd43dSSascha Wildner ZSTD_CCtx_params* ZSTD_createCCtxParams(void)
248*a28cd43dSSascha Wildner {
249*a28cd43dSSascha Wildner return ZSTD_createCCtxParams_advanced(ZSTD_defaultCMem);
250*a28cd43dSSascha Wildner }
251*a28cd43dSSascha Wildner
/* ZSTD_freeCCtxParams() :
 * Releases @params with the allocator stored inside it. Accepts NULL.
 * @return : always 0.
 */
size_t ZSTD_freeCCtxParams(ZSTD_CCtx_params* params)
{
    if (params != NULL) {
        ZSTD_customFree(params, params->customMem);
    }
    return 0;
}
258*a28cd43dSSascha Wildner
/* ZSTD_CCtxParams_reset() :
 * Re-initializes @params at ZSTD_CLEVEL_DEFAULT.
 * @return : the result of ZSTD_CCtxParams_init().
 */
size_t ZSTD_CCtxParams_reset(ZSTD_CCtx_params* params)
{
    size_t const initResult = ZSTD_CCtxParams_init(params, ZSTD_CLEVEL_DEFAULT);
    return initResult;
}
263*a28cd43dSSascha Wildner
/* ZSTD_CCtxParams_init() :
 * Zeroes @cctxParams, then sets the compression level and turns the
 * content-size flag on.
 * @return : 0 on success, a GENERIC error when @cctxParams is NULL.
 */
size_t ZSTD_CCtxParams_init(ZSTD_CCtx_params* cctxParams, int compressionLevel)
{
    RETURN_ERROR_IF(!cctxParams, GENERIC, "NULL pointer!");

    ZSTD_memset(cctxParams, 0, sizeof(*cctxParams));
    cctxParams->fParams.contentSizeFlag = 1;
    cctxParams->compressionLevel = compressionLevel;
    return 0;
}
271*a28cd43dSSascha Wildner
/* ZSTD_CCtxParams_init_advanced() :
 * Zeroes @cctxParams, then copies the compression and frame parameters
 * from @params.
 * @return : 0 on success, a GENERIC error when @cctxParams is NULL,
 *           or the error reported by ZSTD_checkCParams().
 */
size_t ZSTD_CCtxParams_init_advanced(ZSTD_CCtx_params* cctxParams, ZSTD_parameters params)
{
    RETURN_ERROR_IF(!cctxParams, GENERIC, "NULL pointer!");
    FORWARD_IF_ERROR( ZSTD_checkCParams(params.cParams) , "");
    assert(!ZSTD_checkCParams(params.cParams));

    ZSTD_memset(cctxParams, 0, sizeof(*cctxParams));
    /* the level should not matter, as all cParams are presumed properly defined */
    cctxParams->compressionLevel = ZSTD_CLEVEL_DEFAULT;
    cctxParams->fParams = params.fParams;
    cctxParams->cParams = params.cParams;
    return 0;
}
283*a28cd43dSSascha Wildner
284*a28cd43dSSascha Wildner /* ZSTD_assignParamsToCCtxParams() :
285*a28cd43dSSascha Wildner * params is presumed valid at this stage */
ZSTD_assignParamsToCCtxParams(const ZSTD_CCtx_params * cctxParams,const ZSTD_parameters * params)286*a28cd43dSSascha Wildner static ZSTD_CCtx_params ZSTD_assignParamsToCCtxParams(
287*a28cd43dSSascha Wildner const ZSTD_CCtx_params* cctxParams, const ZSTD_parameters* params)
288*a28cd43dSSascha Wildner {
289*a28cd43dSSascha Wildner ZSTD_CCtx_params ret = *cctxParams;
290*a28cd43dSSascha Wildner assert(!ZSTD_checkCParams(params->cParams));
291*a28cd43dSSascha Wildner ret.cParams = params->cParams;
292*a28cd43dSSascha Wildner ret.fParams = params->fParams;
293*a28cd43dSSascha Wildner ret.compressionLevel = ZSTD_CLEVEL_DEFAULT; /* should not matter, as all cParams are presumed properly defined */
294*a28cd43dSSascha Wildner return ret;
295*a28cd43dSSascha Wildner }
296*a28cd43dSSascha Wildner
ZSTD_cParam_getBounds(ZSTD_cParameter param)297*a28cd43dSSascha Wildner ZSTD_bounds ZSTD_cParam_getBounds(ZSTD_cParameter param)
298*a28cd43dSSascha Wildner {
299*a28cd43dSSascha Wildner ZSTD_bounds bounds = { 0, 0, 0 };
300*a28cd43dSSascha Wildner
301*a28cd43dSSascha Wildner switch(param)
302*a28cd43dSSascha Wildner {
303*a28cd43dSSascha Wildner case ZSTD_c_compressionLevel:
304*a28cd43dSSascha Wildner bounds.lowerBound = ZSTD_minCLevel();
305*a28cd43dSSascha Wildner bounds.upperBound = ZSTD_maxCLevel();
306*a28cd43dSSascha Wildner return bounds;
307*a28cd43dSSascha Wildner
308*a28cd43dSSascha Wildner case ZSTD_c_windowLog:
309*a28cd43dSSascha Wildner bounds.lowerBound = ZSTD_WINDOWLOG_MIN;
310*a28cd43dSSascha Wildner bounds.upperBound = ZSTD_WINDOWLOG_MAX;
311*a28cd43dSSascha Wildner return bounds;
312*a28cd43dSSascha Wildner
313*a28cd43dSSascha Wildner case ZSTD_c_hashLog:
314*a28cd43dSSascha Wildner bounds.lowerBound = ZSTD_HASHLOG_MIN;
315*a28cd43dSSascha Wildner bounds.upperBound = ZSTD_HASHLOG_MAX;
316*a28cd43dSSascha Wildner return bounds;
317*a28cd43dSSascha Wildner
318*a28cd43dSSascha Wildner case ZSTD_c_chainLog:
319*a28cd43dSSascha Wildner bounds.lowerBound = ZSTD_CHAINLOG_MIN;
320*a28cd43dSSascha Wildner bounds.upperBound = ZSTD_CHAINLOG_MAX;
321*a28cd43dSSascha Wildner return bounds;
322*a28cd43dSSascha Wildner
323*a28cd43dSSascha Wildner case ZSTD_c_searchLog:
324*a28cd43dSSascha Wildner bounds.lowerBound = ZSTD_SEARCHLOG_MIN;
325*a28cd43dSSascha Wildner bounds.upperBound = ZSTD_SEARCHLOG_MAX;
326*a28cd43dSSascha Wildner return bounds;
327*a28cd43dSSascha Wildner
328*a28cd43dSSascha Wildner case ZSTD_c_minMatch:
329*a28cd43dSSascha Wildner bounds.lowerBound = ZSTD_MINMATCH_MIN;
330*a28cd43dSSascha Wildner bounds.upperBound = ZSTD_MINMATCH_MAX;
331*a28cd43dSSascha Wildner return bounds;
332*a28cd43dSSascha Wildner
333*a28cd43dSSascha Wildner case ZSTD_c_targetLength:
334*a28cd43dSSascha Wildner bounds.lowerBound = ZSTD_TARGETLENGTH_MIN;
335*a28cd43dSSascha Wildner bounds.upperBound = ZSTD_TARGETLENGTH_MAX;
336*a28cd43dSSascha Wildner return bounds;
337*a28cd43dSSascha Wildner
338*a28cd43dSSascha Wildner case ZSTD_c_strategy:
339*a28cd43dSSascha Wildner bounds.lowerBound = ZSTD_STRATEGY_MIN;
340*a28cd43dSSascha Wildner bounds.upperBound = ZSTD_STRATEGY_MAX;
341*a28cd43dSSascha Wildner return bounds;
342*a28cd43dSSascha Wildner
343*a28cd43dSSascha Wildner case ZSTD_c_contentSizeFlag:
344*a28cd43dSSascha Wildner bounds.lowerBound = 0;
345*a28cd43dSSascha Wildner bounds.upperBound = 1;
346*a28cd43dSSascha Wildner return bounds;
347*a28cd43dSSascha Wildner
348*a28cd43dSSascha Wildner case ZSTD_c_checksumFlag:
349*a28cd43dSSascha Wildner bounds.lowerBound = 0;
350*a28cd43dSSascha Wildner bounds.upperBound = 1;
351*a28cd43dSSascha Wildner return bounds;
352*a28cd43dSSascha Wildner
353*a28cd43dSSascha Wildner case ZSTD_c_dictIDFlag:
354*a28cd43dSSascha Wildner bounds.lowerBound = 0;
355*a28cd43dSSascha Wildner bounds.upperBound = 1;
356*a28cd43dSSascha Wildner return bounds;
357*a28cd43dSSascha Wildner
358*a28cd43dSSascha Wildner case ZSTD_c_nbWorkers:
359*a28cd43dSSascha Wildner bounds.lowerBound = 0;
360*a28cd43dSSascha Wildner #ifdef ZSTD_MULTITHREAD
361*a28cd43dSSascha Wildner bounds.upperBound = ZSTDMT_NBWORKERS_MAX;
362*a28cd43dSSascha Wildner #else
363*a28cd43dSSascha Wildner bounds.upperBound = 0;
364*a28cd43dSSascha Wildner #endif
365*a28cd43dSSascha Wildner return bounds;
366*a28cd43dSSascha Wildner
367*a28cd43dSSascha Wildner case ZSTD_c_jobSize:
368*a28cd43dSSascha Wildner bounds.lowerBound = 0;
369*a28cd43dSSascha Wildner #ifdef ZSTD_MULTITHREAD
370*a28cd43dSSascha Wildner bounds.upperBound = ZSTDMT_JOBSIZE_MAX;
371*a28cd43dSSascha Wildner #else
372*a28cd43dSSascha Wildner bounds.upperBound = 0;
373*a28cd43dSSascha Wildner #endif
374*a28cd43dSSascha Wildner return bounds;
375*a28cd43dSSascha Wildner
376*a28cd43dSSascha Wildner case ZSTD_c_overlapLog:
377*a28cd43dSSascha Wildner #ifdef ZSTD_MULTITHREAD
378*a28cd43dSSascha Wildner bounds.lowerBound = ZSTD_OVERLAPLOG_MIN;
379*a28cd43dSSascha Wildner bounds.upperBound = ZSTD_OVERLAPLOG_MAX;
380*a28cd43dSSascha Wildner #else
381*a28cd43dSSascha Wildner bounds.lowerBound = 0;
382*a28cd43dSSascha Wildner bounds.upperBound = 0;
383*a28cd43dSSascha Wildner #endif
384*a28cd43dSSascha Wildner return bounds;
385*a28cd43dSSascha Wildner
386*a28cd43dSSascha Wildner case ZSTD_c_enableDedicatedDictSearch:
387*a28cd43dSSascha Wildner bounds.lowerBound = 0;
388*a28cd43dSSascha Wildner bounds.upperBound = 1;
389*a28cd43dSSascha Wildner return bounds;
390*a28cd43dSSascha Wildner
391*a28cd43dSSascha Wildner case ZSTD_c_enableLongDistanceMatching:
392*a28cd43dSSascha Wildner bounds.lowerBound = 0;
393*a28cd43dSSascha Wildner bounds.upperBound = 1;
394*a28cd43dSSascha Wildner return bounds;
395*a28cd43dSSascha Wildner
396*a28cd43dSSascha Wildner case ZSTD_c_ldmHashLog:
397*a28cd43dSSascha Wildner bounds.lowerBound = ZSTD_LDM_HASHLOG_MIN;
398*a28cd43dSSascha Wildner bounds.upperBound = ZSTD_LDM_HASHLOG_MAX;
399*a28cd43dSSascha Wildner return bounds;
400*a28cd43dSSascha Wildner
401*a28cd43dSSascha Wildner case ZSTD_c_ldmMinMatch:
402*a28cd43dSSascha Wildner bounds.lowerBound = ZSTD_LDM_MINMATCH_MIN;
403*a28cd43dSSascha Wildner bounds.upperBound = ZSTD_LDM_MINMATCH_MAX;
404*a28cd43dSSascha Wildner return bounds;
405*a28cd43dSSascha Wildner
406*a28cd43dSSascha Wildner case ZSTD_c_ldmBucketSizeLog:
407*a28cd43dSSascha Wildner bounds.lowerBound = ZSTD_LDM_BUCKETSIZELOG_MIN;
408*a28cd43dSSascha Wildner bounds.upperBound = ZSTD_LDM_BUCKETSIZELOG_MAX;
409*a28cd43dSSascha Wildner return bounds;
410*a28cd43dSSascha Wildner
411*a28cd43dSSascha Wildner case ZSTD_c_ldmHashRateLog:
412*a28cd43dSSascha Wildner bounds.lowerBound = ZSTD_LDM_HASHRATELOG_MIN;
413*a28cd43dSSascha Wildner bounds.upperBound = ZSTD_LDM_HASHRATELOG_MAX;
414*a28cd43dSSascha Wildner return bounds;
415*a28cd43dSSascha Wildner
416*a28cd43dSSascha Wildner /* experimental parameters */
417*a28cd43dSSascha Wildner case ZSTD_c_rsyncable:
418*a28cd43dSSascha Wildner bounds.lowerBound = 0;
419*a28cd43dSSascha Wildner bounds.upperBound = 1;
420*a28cd43dSSascha Wildner return bounds;
421*a28cd43dSSascha Wildner
422*a28cd43dSSascha Wildner case ZSTD_c_forceMaxWindow :
423*a28cd43dSSascha Wildner bounds.lowerBound = 0;
424*a28cd43dSSascha Wildner bounds.upperBound = 1;
425*a28cd43dSSascha Wildner return bounds;
426*a28cd43dSSascha Wildner
427*a28cd43dSSascha Wildner case ZSTD_c_format:
428*a28cd43dSSascha Wildner ZSTD_STATIC_ASSERT(ZSTD_f_zstd1 < ZSTD_f_zstd1_magicless);
429*a28cd43dSSascha Wildner bounds.lowerBound = ZSTD_f_zstd1;
430*a28cd43dSSascha Wildner bounds.upperBound = ZSTD_f_zstd1_magicless; /* note : how to ensure at compile time that this is the highest value enum ? */
431*a28cd43dSSascha Wildner return bounds;
432*a28cd43dSSascha Wildner
433*a28cd43dSSascha Wildner case ZSTD_c_forceAttachDict:
434*a28cd43dSSascha Wildner ZSTD_STATIC_ASSERT(ZSTD_dictDefaultAttach < ZSTD_dictForceLoad);
435*a28cd43dSSascha Wildner bounds.lowerBound = ZSTD_dictDefaultAttach;
436*a28cd43dSSascha Wildner bounds.upperBound = ZSTD_dictForceLoad; /* note : how to ensure at compile time that this is the highest value enum ? */
437*a28cd43dSSascha Wildner return bounds;
438*a28cd43dSSascha Wildner
439*a28cd43dSSascha Wildner case ZSTD_c_literalCompressionMode:
440*a28cd43dSSascha Wildner ZSTD_STATIC_ASSERT(ZSTD_lcm_auto < ZSTD_lcm_huffman && ZSTD_lcm_huffman < ZSTD_lcm_uncompressed);
441*a28cd43dSSascha Wildner bounds.lowerBound = ZSTD_lcm_auto;
442*a28cd43dSSascha Wildner bounds.upperBound = ZSTD_lcm_uncompressed;
443*a28cd43dSSascha Wildner return bounds;
444*a28cd43dSSascha Wildner
445*a28cd43dSSascha Wildner case ZSTD_c_targetCBlockSize:
446*a28cd43dSSascha Wildner bounds.lowerBound = ZSTD_TARGETCBLOCKSIZE_MIN;
447*a28cd43dSSascha Wildner bounds.upperBound = ZSTD_TARGETCBLOCKSIZE_MAX;
448*a28cd43dSSascha Wildner return bounds;
449*a28cd43dSSascha Wildner
450*a28cd43dSSascha Wildner case ZSTD_c_srcSizeHint:
451*a28cd43dSSascha Wildner bounds.lowerBound = ZSTD_SRCSIZEHINT_MIN;
452*a28cd43dSSascha Wildner bounds.upperBound = ZSTD_SRCSIZEHINT_MAX;
453*a28cd43dSSascha Wildner return bounds;
454*a28cd43dSSascha Wildner
455*a28cd43dSSascha Wildner case ZSTD_c_stableInBuffer:
456*a28cd43dSSascha Wildner case ZSTD_c_stableOutBuffer:
457*a28cd43dSSascha Wildner bounds.lowerBound = (int)ZSTD_bm_buffered;
458*a28cd43dSSascha Wildner bounds.upperBound = (int)ZSTD_bm_stable;
459*a28cd43dSSascha Wildner return bounds;
460*a28cd43dSSascha Wildner
461*a28cd43dSSascha Wildner case ZSTD_c_blockDelimiters:
462*a28cd43dSSascha Wildner bounds.lowerBound = (int)ZSTD_sf_noBlockDelimiters;
463*a28cd43dSSascha Wildner bounds.upperBound = (int)ZSTD_sf_explicitBlockDelimiters;
464*a28cd43dSSascha Wildner return bounds;
465*a28cd43dSSascha Wildner
466*a28cd43dSSascha Wildner case ZSTD_c_validateSequences:
467*a28cd43dSSascha Wildner bounds.lowerBound = 0;
468*a28cd43dSSascha Wildner bounds.upperBound = 1;
469*a28cd43dSSascha Wildner return bounds;
470*a28cd43dSSascha Wildner
471*a28cd43dSSascha Wildner default:
472*a28cd43dSSascha Wildner bounds.error = ERROR(parameter_unsupported);
473*a28cd43dSSascha Wildner return bounds;
474*a28cd43dSSascha Wildner }
475*a28cd43dSSascha Wildner }
476*a28cd43dSSascha Wildner
477*a28cd43dSSascha Wildner /* ZSTD_cParam_clampBounds:
478*a28cd43dSSascha Wildner * Clamps the value into the bounded range.
479*a28cd43dSSascha Wildner */
ZSTD_cParam_clampBounds(ZSTD_cParameter cParam,int * value)480*a28cd43dSSascha Wildner static size_t ZSTD_cParam_clampBounds(ZSTD_cParameter cParam, int* value)
481*a28cd43dSSascha Wildner {
482*a28cd43dSSascha Wildner ZSTD_bounds const bounds = ZSTD_cParam_getBounds(cParam);
483*a28cd43dSSascha Wildner if (ZSTD_isError(bounds.error)) return bounds.error;
484*a28cd43dSSascha Wildner if (*value < bounds.lowerBound) *value = bounds.lowerBound;
485*a28cd43dSSascha Wildner if (*value > bounds.upperBound) *value = bounds.upperBound;
486*a28cd43dSSascha Wildner return 0;
487*a28cd43dSSascha Wildner }
488*a28cd43dSSascha Wildner
/* BOUNDCHECK() :
 * Returns a parameter_outOfBound error from the enclosing function
 * when `val` is rejected by ZSTD_cParam_withinBounds() for `cParam`. */
#define BOUNDCHECK(cParam, val) {                                  \
    RETURN_ERROR_IF(!ZSTD_cParam_withinBounds(cParam,val),         \
                    parameter_outOfBound, "Param out of bounds");  \
}
493*a28cd43dSSascha Wildner
494*a28cd43dSSascha Wildner
/* ZSTD_isUpdateAuthorized() :
 * @return : 1 for the compression level and the compression parameters
 *           listed in the first group below, 0 for every other parameter.
 */
static int ZSTD_isUpdateAuthorized(ZSTD_cParameter param)
{
    int authorized = 0;

    switch(param)
    {
    /* authorized parameters */
    case ZSTD_c_compressionLevel:
    case ZSTD_c_hashLog:
    case ZSTD_c_chainLog:
    case ZSTD_c_searchLog:
    case ZSTD_c_minMatch:
    case ZSTD_c_targetLength:
    case ZSTD_c_strategy:
        authorized = 1;
        break;

    /* everything else, spelled out explicitly */
    case ZSTD_c_format:
    case ZSTD_c_windowLog:
    case ZSTD_c_contentSizeFlag:
    case ZSTD_c_checksumFlag:
    case ZSTD_c_dictIDFlag:
    case ZSTD_c_forceMaxWindow :
    case ZSTD_c_nbWorkers:
    case ZSTD_c_jobSize:
    case ZSTD_c_overlapLog:
    case ZSTD_c_rsyncable:
    case ZSTD_c_enableDedicatedDictSearch:
    case ZSTD_c_enableLongDistanceMatching:
    case ZSTD_c_ldmHashLog:
    case ZSTD_c_ldmMinMatch:
    case ZSTD_c_ldmBucketSizeLog:
    case ZSTD_c_ldmHashRateLog:
    case ZSTD_c_forceAttachDict:
    case ZSTD_c_literalCompressionMode:
    case ZSTD_c_targetCBlockSize:
    case ZSTD_c_srcSizeHint:
    case ZSTD_c_stableInBuffer:
    case ZSTD_c_stableOutBuffer:
    case ZSTD_c_blockDelimiters:
    case ZSTD_c_validateSequences:
    default:
        break;
    }
    return authorized;
}
536*a28cd43dSSascha Wildner
/*! ZSTD_CCtx_setParameter() :
 *  Checks that `param` may be set on `cctx` in its current stage, then
 *  forwards (param, value) to ZSTD_CCtxParams_setParameter() on
 *  cctx->requestedParams.
 *  When the context is no longer in zcss_init stage, only parameters accepted
 *  by ZSTD_isUpdateAuthorized() go through, and cctx->cParamsChanged is raised.
 * @return : result of ZSTD_CCtxParams_setParameter(), or an error code
 *           (stage_wrong, parameter_unsupported). */
size_t ZSTD_CCtx_setParameter(ZSTD_CCtx* cctx, ZSTD_cParameter param, int value)
{
    DEBUGLOG(4, "ZSTD_CCtx_setParameter (%i, %i)", (int)param, value);

    if (cctx->streamStage != zcss_init) {
        /* not in init stage : only "authorized" parameters can still change */
        if (!ZSTD_isUpdateAuthorized(param)) {
            RETURN_ERROR(stage_wrong, "can only set params in ctx init stage");
        }
        cctx->cParamsChanged = 1;
    }

    switch(param)
    {
    default:
        RETURN_ERROR(parameter_unsupported, "unknown parameter");

    case ZSTD_c_nbWorkers:
        /* a non-zero worker count is refused when cctx->staticSize is set */
        RETURN_ERROR_IF((value!=0) && cctx->staticSize, parameter_unsupported,
                        "MT not compatible with static alloc");
        break;

    /* compression parameters */
    case ZSTD_c_compressionLevel:
    case ZSTD_c_windowLog:
    case ZSTD_c_hashLog:
    case ZSTD_c_chainLog:
    case ZSTD_c_searchLog:
    case ZSTD_c_minMatch:
    case ZSTD_c_targetLength:
    case ZSTD_c_strategy:
    /* long distance matching */
    case ZSTD_c_enableLongDistanceMatching:
    case ZSTD_c_ldmHashLog:
    case ZSTD_c_ldmMinMatch:
    case ZSTD_c_ldmBucketSizeLog:
    case ZSTD_c_ldmHashRateLog:
    /* frame parameters */
    case ZSTD_c_format:
    case ZSTD_c_contentSizeFlag:
    case ZSTD_c_checksumFlag:
    case ZSTD_c_dictIDFlag:
    /* multi-threading (other than nbWorkers) */
    case ZSTD_c_jobSize:
    case ZSTD_c_overlapLog:
    case ZSTD_c_rsyncable:
    /* remaining parameters */
    case ZSTD_c_forceMaxWindow:
    case ZSTD_c_forceAttachDict:
    case ZSTD_c_literalCompressionMode:
    case ZSTD_c_enableDedicatedDictSearch:
    case ZSTD_c_targetCBlockSize:
    case ZSTD_c_srcSizeHint:
    case ZSTD_c_stableInBuffer:
    case ZSTD_c_stableOutBuffer:
    case ZSTD_c_blockDelimiters:
    case ZSTD_c_validateSequences:
        /* known parameter, nothing context-specific to verify */
        break;
    }

    return ZSTD_CCtxParams_setParameter(&cctx->requestedParams, param, value);
}
590*a28cd43dSSascha Wildner
/*! ZSTD_CCtxParams_setParameter() :
 *  Validates `value` for `param`, then stores it into `CCtxParams`.
 *  Depending on the parameter, `value` is either verified with BOUNDCHECK()
 *  or adjusted in place through ZSTD_cParam_clampBounds() before being stored.
 *  For several parameters, 0 is stored without any bounds check
 *  (it stands for "default" / "auto", see per-case comments).
 *  When ZSTD_MULTITHREAD is not defined, the multi-threading parameters
 *  only accept 0.
 * @return : the value stored in `CCtxParams` (0 for a negative compression
 *           level, which size_t cannot represent), or an error code. */
size_t ZSTD_CCtxParams_setParameter(ZSTD_CCtx_params* CCtxParams,
                                    ZSTD_cParameter param, int value)
{
    DEBUGLOG(4, "ZSTD_CCtxParams_setParameter (%i, %i)", (int)param, value);
    switch(param)
    {
    case ZSTD_c_format :
        BOUNDCHECK(ZSTD_c_format, value);
        CCtxParams->format = (ZSTD_format_e)value;
        return (size_t)CCtxParams->format;

    case ZSTD_c_compressionLevel : {
        FORWARD_IF_ERROR(ZSTD_cParam_clampBounds(param, &value), "");
        if (value == 0)
            CCtxParams->compressionLevel = ZSTD_CLEVEL_DEFAULT; /* 0 == default */
        else
            CCtxParams->compressionLevel = value;
        if (CCtxParams->compressionLevel >= 0) return (size_t)CCtxParams->compressionLevel;
        return 0;   /* return type (size_t) cannot represent negative values */
    }

    case ZSTD_c_windowLog :
        if (value!=0)   /* 0 => use default */
            BOUNDCHECK(ZSTD_c_windowLog, value);
        CCtxParams->cParams.windowLog = (U32)value;
        return CCtxParams->cParams.windowLog;

    case ZSTD_c_hashLog :
        if (value!=0)   /* 0 => use default */
            BOUNDCHECK(ZSTD_c_hashLog, value);
        CCtxParams->cParams.hashLog = (U32)value;
        return CCtxParams->cParams.hashLog;

    case ZSTD_c_chainLog :
        if (value!=0)   /* 0 => use default */
            BOUNDCHECK(ZSTD_c_chainLog, value);
        CCtxParams->cParams.chainLog = (U32)value;
        return CCtxParams->cParams.chainLog;

    case ZSTD_c_searchLog :
        if (value!=0)   /* 0 => use default */
            BOUNDCHECK(ZSTD_c_searchLog, value);
        CCtxParams->cParams.searchLog = (U32)value;
        return (size_t)value;

    case ZSTD_c_minMatch :
        if (value!=0)   /* 0 => use default */
            BOUNDCHECK(ZSTD_c_minMatch, value);
        CCtxParams->cParams.minMatch = value;
        return CCtxParams->cParams.minMatch;

    case ZSTD_c_targetLength :
        BOUNDCHECK(ZSTD_c_targetLength, value);
        CCtxParams->cParams.targetLength = value;
        return CCtxParams->cParams.targetLength;

    case ZSTD_c_strategy :
        if (value!=0)   /* 0 => use default */
            BOUNDCHECK(ZSTD_c_strategy, value);
        CCtxParams->cParams.strategy = (ZSTD_strategy)value;
        return (size_t)CCtxParams->cParams.strategy;

    case ZSTD_c_contentSizeFlag :
        /* Content size written in frame header _when known_ (default:1) */
        DEBUGLOG(4, "set content size flag = %u", (value!=0));
        CCtxParams->fParams.contentSizeFlag = value != 0;
        return CCtxParams->fParams.contentSizeFlag;

    case ZSTD_c_checksumFlag :
        /* A 32-bits content checksum will be calculated and written at end of frame (default:0) */
        CCtxParams->fParams.checksumFlag = value != 0;
        return CCtxParams->fParams.checksumFlag;

    case ZSTD_c_dictIDFlag : /* When applicable, dictionary's dictID is provided in frame header (default:1) */
        DEBUGLOG(4, "set dictIDFlag = %u", (value!=0));
        /* stored inverted : the field records the _absence_ of dictID */
        CCtxParams->fParams.noDictIDFlag = !value;
        return !CCtxParams->fParams.noDictIDFlag;

    case ZSTD_c_forceMaxWindow :
        CCtxParams->forceWindow = (value != 0);
        return CCtxParams->forceWindow;

    case ZSTD_c_forceAttachDict : {
        const ZSTD_dictAttachPref_e pref = (ZSTD_dictAttachPref_e)value;
        BOUNDCHECK(ZSTD_c_forceAttachDict, pref);
        CCtxParams->attachDictPref = pref;
        return CCtxParams->attachDictPref;
    }

    case ZSTD_c_literalCompressionMode : {
        const ZSTD_literalCompressionMode_e lcm = (ZSTD_literalCompressionMode_e)value;
        BOUNDCHECK(ZSTD_c_literalCompressionMode, lcm);
        CCtxParams->literalCompressionMode = lcm;
        return CCtxParams->literalCompressionMode;
    }

    case ZSTD_c_nbWorkers :
#ifndef ZSTD_MULTITHREAD
        RETURN_ERROR_IF(value!=0, parameter_unsupported, "not compiled with multithreading");
        return 0;
#else
        FORWARD_IF_ERROR(ZSTD_cParam_clampBounds(param, &value), "");
        CCtxParams->nbWorkers = value;
        return CCtxParams->nbWorkers;
#endif

    case ZSTD_c_jobSize :
#ifndef ZSTD_MULTITHREAD
        RETURN_ERROR_IF(value!=0, parameter_unsupported, "not compiled with multithreading");
        return 0;
#else
        /* Adjust to the minimum non-default value. */
        if (value != 0 && value < ZSTDMT_JOBSIZE_MIN)
            value = ZSTDMT_JOBSIZE_MIN;
        FORWARD_IF_ERROR(ZSTD_cParam_clampBounds(param, &value), "");
        assert(value >= 0);
        CCtxParams->jobSize = value;
        return CCtxParams->jobSize;
#endif

    case ZSTD_c_overlapLog :
#ifndef ZSTD_MULTITHREAD
        RETURN_ERROR_IF(value!=0, parameter_unsupported, "not compiled with multithreading");
        return 0;
#else
        FORWARD_IF_ERROR(ZSTD_cParam_clampBounds(ZSTD_c_overlapLog, &value), "");
        CCtxParams->overlapLog = value;
        return CCtxParams->overlapLog;
#endif

    case ZSTD_c_rsyncable :
#ifndef ZSTD_MULTITHREAD
        RETURN_ERROR_IF(value!=0, parameter_unsupported, "not compiled with multithreading");
        return 0;
#else
        /* clamp against rsyncable's own bounds
         * (this used to clamp against ZSTD_c_overlapLog's bounds by mistake) */
        FORWARD_IF_ERROR(ZSTD_cParam_clampBounds(ZSTD_c_rsyncable, &value), "");
        CCtxParams->rsyncable = value;
        return CCtxParams->rsyncable;
#endif

    case ZSTD_c_enableDedicatedDictSearch :
        CCtxParams->enableDedicatedDictSearch = (value!=0);
        return CCtxParams->enableDedicatedDictSearch;

    case ZSTD_c_enableLongDistanceMatching :
        CCtxParams->ldmParams.enableLdm = (value!=0);
        return CCtxParams->ldmParams.enableLdm;

    case ZSTD_c_ldmHashLog :
        if (value!=0)   /* 0 ==> auto */
            BOUNDCHECK(ZSTD_c_ldmHashLog, value);
        CCtxParams->ldmParams.hashLog = value;
        return CCtxParams->ldmParams.hashLog;

    case ZSTD_c_ldmMinMatch :
        if (value!=0)   /* 0 ==> default */
            BOUNDCHECK(ZSTD_c_ldmMinMatch, value);
        CCtxParams->ldmParams.minMatchLength = value;
        return CCtxParams->ldmParams.minMatchLength;

    case ZSTD_c_ldmBucketSizeLog :
        if (value!=0)   /* 0 ==> default */
            BOUNDCHECK(ZSTD_c_ldmBucketSizeLog, value);
        CCtxParams->ldmParams.bucketSizeLog = value;
        return CCtxParams->ldmParams.bucketSizeLog;

    case ZSTD_c_ldmHashRateLog :
        /* also reject negative values : they passed the upper-limit test
         * and were then stored as-is into hashRateLog */
        RETURN_ERROR_IF(value < 0 || value > ZSTD_WINDOWLOG_MAX - ZSTD_HASHLOG_MIN,
                        parameter_outOfBound, "Param out of bounds!");
        CCtxParams->ldmParams.hashRateLog = value;
        return CCtxParams->ldmParams.hashRateLog;

    case ZSTD_c_targetCBlockSize :
        if (value!=0)   /* 0 ==> default */
            BOUNDCHECK(ZSTD_c_targetCBlockSize, value);
        CCtxParams->targetCBlockSize = value;
        return CCtxParams->targetCBlockSize;

    case ZSTD_c_srcSizeHint :
        if (value!=0)    /* 0 ==> default */
            BOUNDCHECK(ZSTD_c_srcSizeHint, value);
        CCtxParams->srcSizeHint = value;
        return CCtxParams->srcSizeHint;

    case ZSTD_c_stableInBuffer:
        BOUNDCHECK(ZSTD_c_stableInBuffer, value);
        CCtxParams->inBufferMode = (ZSTD_bufferMode_e)value;
        return CCtxParams->inBufferMode;

    case ZSTD_c_stableOutBuffer:
        BOUNDCHECK(ZSTD_c_stableOutBuffer, value);
        CCtxParams->outBufferMode = (ZSTD_bufferMode_e)value;
        return CCtxParams->outBufferMode;

    case ZSTD_c_blockDelimiters:
        BOUNDCHECK(ZSTD_c_blockDelimiters, value);
        CCtxParams->blockDelimiters = (ZSTD_sequenceFormat_e)value;
        return CCtxParams->blockDelimiters;

    case ZSTD_c_validateSequences:
        BOUNDCHECK(ZSTD_c_validateSequences, value);
        CCtxParams->validateSequences = value;
        return CCtxParams->validateSequences;

    default: RETURN_ERROR(parameter_unsupported, "unknown parameter");
    }
}
798*a28cd43dSSascha Wildner
/*! ZSTD_CCtx_getParameter() :
 *  Reads `param` from the parameters requested on `cctx`
 *  (cctx->requestedParams) into `*value`.
 * @return : whatever ZSTD_CCtxParams_getParameter() returns. */
size_t ZSTD_CCtx_getParameter(ZSTD_CCtx* cctx, ZSTD_cParameter param, int* value)
{
    ZSTD_CCtx_params* const requested = &cctx->requestedParams;
    return ZSTD_CCtxParams_getParameter(requested, param, value);
}
803*a28cd43dSSascha Wildner
/*! ZSTD_CCtxParams_getParameter() :
 *  Copies the field of `CCtxParams` associated with `param` into `*value`.
 *  `*value` is only written on success.
 *  When ZSTD_MULTITHREAD is not defined, ZSTD_c_jobSize, ZSTD_c_overlapLog
 *  and ZSTD_c_rsyncable are reported as unsupported.
 * @return : 0, or an error code (parameter_unsupported). */
size_t ZSTD_CCtxParams_getParameter(
        ZSTD_CCtx_params* CCtxParams, ZSTD_cParameter param, int* value)
{
    int result;   /* set by every case which does not return an error */

    switch(param)
    {
    /* --- frame format & compression level --- */
    case ZSTD_c_format :
        result = CCtxParams->format;
        break;
    case ZSTD_c_compressionLevel :
        result = CCtxParams->compressionLevel;
        break;

    /* --- compression parameters --- */
    case ZSTD_c_windowLog :
        result = (int)CCtxParams->cParams.windowLog;
        break;
    case ZSTD_c_hashLog :
        result = (int)CCtxParams->cParams.hashLog;
        break;
    case ZSTD_c_chainLog :
        result = (int)CCtxParams->cParams.chainLog;
        break;
    case ZSTD_c_searchLog :
        result = CCtxParams->cParams.searchLog;
        break;
    case ZSTD_c_minMatch :
        result = CCtxParams->cParams.minMatch;
        break;
    case ZSTD_c_targetLength :
        result = CCtxParams->cParams.targetLength;
        break;
    case ZSTD_c_strategy :
        result = (unsigned)CCtxParams->cParams.strategy;
        break;

    /* --- frame parameters --- */
    case ZSTD_c_contentSizeFlag :
        result = CCtxParams->fParams.contentSizeFlag;
        break;
    case ZSTD_c_checksumFlag :
        result = CCtxParams->fParams.checksumFlag;
        break;
    case ZSTD_c_dictIDFlag :
        /* the field stores the negated flag */
        result = !CCtxParams->fParams.noDictIDFlag;
        break;

    /* --- dictionary / window / literals preferences --- */
    case ZSTD_c_forceMaxWindow :
        result = CCtxParams->forceWindow;
        break;
    case ZSTD_c_forceAttachDict :
        result = CCtxParams->attachDictPref;
        break;
    case ZSTD_c_literalCompressionMode :
        result = CCtxParams->literalCompressionMode;
        break;

    /* --- multi-threading --- */
    case ZSTD_c_nbWorkers :
#ifndef ZSTD_MULTITHREAD
        assert(CCtxParams->nbWorkers == 0);
#endif
        result = CCtxParams->nbWorkers;
        break;
    case ZSTD_c_jobSize :
#ifndef ZSTD_MULTITHREAD
        RETURN_ERROR(parameter_unsupported, "not compiled with multithreading");
#else
        assert(CCtxParams->jobSize <= INT_MAX);
        result = (int)CCtxParams->jobSize;
        break;
#endif
    case ZSTD_c_overlapLog :
#ifndef ZSTD_MULTITHREAD
        RETURN_ERROR(parameter_unsupported, "not compiled with multithreading");
#else
        result = CCtxParams->overlapLog;
        break;
#endif
    case ZSTD_c_rsyncable :
#ifndef ZSTD_MULTITHREAD
        RETURN_ERROR(parameter_unsupported, "not compiled with multithreading");
#else
        result = CCtxParams->rsyncable;
        break;
#endif

    /* --- dedicated dict search & long distance matching --- */
    case ZSTD_c_enableDedicatedDictSearch :
        result = CCtxParams->enableDedicatedDictSearch;
        break;
    case ZSTD_c_enableLongDistanceMatching :
        result = CCtxParams->ldmParams.enableLdm;
        break;
    case ZSTD_c_ldmHashLog :
        result = CCtxParams->ldmParams.hashLog;
        break;
    case ZSTD_c_ldmMinMatch :
        result = CCtxParams->ldmParams.minMatchLength;
        break;
    case ZSTD_c_ldmBucketSizeLog :
        result = CCtxParams->ldmParams.bucketSizeLog;
        break;
    case ZSTD_c_ldmHashRateLog :
        result = CCtxParams->ldmParams.hashRateLog;
        break;

    /* --- remaining parameters --- */
    case ZSTD_c_targetCBlockSize :
        result = (int)CCtxParams->targetCBlockSize;
        break;
    case ZSTD_c_srcSizeHint :
        result = (int)CCtxParams->srcSizeHint;
        break;
    case ZSTD_c_stableInBuffer :
        result = (int)CCtxParams->inBufferMode;
        break;
    case ZSTD_c_stableOutBuffer :
        result = (int)CCtxParams->outBufferMode;
        break;
    case ZSTD_c_blockDelimiters :
        result = (int)CCtxParams->blockDelimiters;
        break;
    case ZSTD_c_validateSequences :
        result = (int)CCtxParams->validateSequences;
        break;

    default: RETURN_ERROR(parameter_unsupported, "unknown parameter");
    }

    *value = result;
    return 0;
}
922*a28cd43dSSascha Wildner
923*a28cd43dSSascha Wildner /** ZSTD_CCtx_setParametersUsingCCtxParams() :
924*a28cd43dSSascha Wildner * just applies `params` into `cctx`
925*a28cd43dSSascha Wildner * no action is performed, parameters are merely stored.
926*a28cd43dSSascha Wildner * If ZSTDMT is enabled, parameters are pushed to cctx->mtctx.
927*a28cd43dSSascha Wildner * This is possible even if a compression is ongoing.
928*a28cd43dSSascha Wildner * In which case, new parameters will be applied on the fly, starting with next compression job.
929*a28cd43dSSascha Wildner */
ZSTD_CCtx_setParametersUsingCCtxParams(ZSTD_CCtx * cctx,const ZSTD_CCtx_params * params)930*a28cd43dSSascha Wildner size_t ZSTD_CCtx_setParametersUsingCCtxParams(
931*a28cd43dSSascha Wildner ZSTD_CCtx* cctx, const ZSTD_CCtx_params* params)
932*a28cd43dSSascha Wildner {
933*a28cd43dSSascha Wildner DEBUGLOG(4, "ZSTD_CCtx_setParametersUsingCCtxParams");
934*a28cd43dSSascha Wildner RETURN_ERROR_IF(cctx->streamStage != zcss_init, stage_wrong,
935*a28cd43dSSascha Wildner "The context is in the wrong stage!");
936*a28cd43dSSascha Wildner RETURN_ERROR_IF(cctx->cdict, stage_wrong,
937*a28cd43dSSascha Wildner "Can't override parameters with cdict attached (some must "
938*a28cd43dSSascha Wildner "be inherited from the cdict).");
939*a28cd43dSSascha Wildner
940*a28cd43dSSascha Wildner cctx->requestedParams = *params;
941*a28cd43dSSascha Wildner return 0;
942*a28cd43dSSascha Wildner }
943*a28cd43dSSascha Wildner
ZSTD_CCtx_setPledgedSrcSize(ZSTD_CCtx * cctx,unsigned long long pledgedSrcSize)944*a28cd43dSSascha Wildner ZSTDLIB_API size_t ZSTD_CCtx_setPledgedSrcSize(ZSTD_CCtx* cctx, unsigned long long pledgedSrcSize)
945*a28cd43dSSascha Wildner {
946*a28cd43dSSascha Wildner DEBUGLOG(4, "ZSTD_CCtx_setPledgedSrcSize to %u bytes", (U32)pledgedSrcSize);
947*a28cd43dSSascha Wildner RETURN_ERROR_IF(cctx->streamStage != zcss_init, stage_wrong,
948*a28cd43dSSascha Wildner "Can't set pledgedSrcSize when not in init stage.");
949*a28cd43dSSascha Wildner cctx->pledgedSrcSizePlusOne = pledgedSrcSize+1;
950*a28cd43dSSascha Wildner return 0;
951*a28cd43dSSascha Wildner }
952*a28cd43dSSascha Wildner
953*a28cd43dSSascha Wildner static ZSTD_compressionParameters ZSTD_dedicatedDictSearch_getCParams(
954*a28cd43dSSascha Wildner int const compressionLevel,
955*a28cd43dSSascha Wildner size_t const dictSize);
956*a28cd43dSSascha Wildner static int ZSTD_dedicatedDictSearch_isSupported(
957*a28cd43dSSascha Wildner const ZSTD_compressionParameters* cParams);
958*a28cd43dSSascha Wildner static void ZSTD_dedicatedDictSearch_revertCParams(
959*a28cd43dSSascha Wildner ZSTD_compressionParameters* cParams);
960*a28cd43dSSascha Wildner
961*a28cd43dSSascha Wildner /**
962*a28cd43dSSascha Wildner * Initializes the local dict using the requested parameters.
963*a28cd43dSSascha Wildner * NOTE: This does not use the pledged src size, because it may be used for more
964*a28cd43dSSascha Wildner * than one compression.
965*a28cd43dSSascha Wildner */
ZSTD_initLocalDict(ZSTD_CCtx * cctx)966*a28cd43dSSascha Wildner static size_t ZSTD_initLocalDict(ZSTD_CCtx* cctx)
967*a28cd43dSSascha Wildner {
968*a28cd43dSSascha Wildner ZSTD_localDict* const dl = &cctx->localDict;
969*a28cd43dSSascha Wildner if (dl->dict == NULL) {
970*a28cd43dSSascha Wildner /* No local dictionary. */
971*a28cd43dSSascha Wildner assert(dl->dictBuffer == NULL);
972*a28cd43dSSascha Wildner assert(dl->cdict == NULL);
973*a28cd43dSSascha Wildner assert(dl->dictSize == 0);
974*a28cd43dSSascha Wildner return 0;
975*a28cd43dSSascha Wildner }
976*a28cd43dSSascha Wildner if (dl->cdict != NULL) {
977*a28cd43dSSascha Wildner assert(cctx->cdict == dl->cdict);
978*a28cd43dSSascha Wildner /* Local dictionary already initialized. */
979*a28cd43dSSascha Wildner return 0;
980*a28cd43dSSascha Wildner }
981*a28cd43dSSascha Wildner assert(dl->dictSize > 0);
982*a28cd43dSSascha Wildner assert(cctx->cdict == NULL);
983*a28cd43dSSascha Wildner assert(cctx->prefixDict.dict == NULL);
984*a28cd43dSSascha Wildner
985*a28cd43dSSascha Wildner dl->cdict = ZSTD_createCDict_advanced2(
986*a28cd43dSSascha Wildner dl->dict,
987*a28cd43dSSascha Wildner dl->dictSize,
988*a28cd43dSSascha Wildner ZSTD_dlm_byRef,
989*a28cd43dSSascha Wildner dl->dictContentType,
990*a28cd43dSSascha Wildner &cctx->requestedParams,
991*a28cd43dSSascha Wildner cctx->customMem);
992*a28cd43dSSascha Wildner RETURN_ERROR_IF(!dl->cdict, memory_allocation, "ZSTD_createCDict_advanced failed");
993*a28cd43dSSascha Wildner cctx->cdict = dl->cdict;
994*a28cd43dSSascha Wildner return 0;
995*a28cd43dSSascha Wildner }
996*a28cd43dSSascha Wildner
/*! ZSTD_CCtx_loadDictionary_advanced() :
 *  Registers `dict` as the local dictionary of `cctx`, after dropping any
 *  dictionary previously attached (ZSTD_clearAllDicts()).
 *  With ZSTD_dlm_byRef, only the pointer is kept; otherwise the content is
 *  duplicated into a buffer allocated with cctx->customMem, which is refused
 *  when cctx->staticSize is set.
 *  A NULL `dict` or a zero `dictSize` leaves the context without dictionary.
 *  Only accepted while `cctx` is in zcss_init stage.
 * @return : 0, or an error code (stage_wrong, memory_allocation). */
size_t ZSTD_CCtx_loadDictionary_advanced(
        ZSTD_CCtx* cctx, const void* dict, size_t dictSize,
        ZSTD_dictLoadMethod_e dictLoadMethod, ZSTD_dictContentType_e dictContentType)
{
    const void* dictContent = dict;   /* replaced by the private copy when not loading by reference */

    RETURN_ERROR_IF(cctx->streamStage != zcss_init, stage_wrong,
                    "Can't load a dictionary when ctx is not in init stage.");
    DEBUGLOG(4, "ZSTD_CCtx_loadDictionary_advanced (size: %u)", (U32)dictSize);

    ZSTD_clearAllDicts(cctx);   /* in case one already exists */
    if (dict == NULL || dictSize == 0) {
        /* no dictionary mode */
        return 0;
    }

    if (dictLoadMethod != ZSTD_dlm_byRef) {
        void* dictBuffer;
        RETURN_ERROR_IF(cctx->staticSize, memory_allocation,
                        "no malloc for static CCtx");
        dictBuffer = ZSTD_customMalloc(dictSize, cctx->customMem);
        RETURN_ERROR_IF(!dictBuffer, memory_allocation, "NULL pointer!");
        ZSTD_memcpy(dictBuffer, dict, dictSize);
        cctx->localDict.dictBuffer = dictBuffer;
        dictContent = dictBuffer;
    }

    cctx->localDict.dict = dictContent;
    cctx->localDict.dictSize = dictSize;
    cctx->localDict.dictContentType = dictContentType;
    return 0;
}
1023*a28cd43dSSascha Wildner
ZSTD_CCtx_loadDictionary_byReference(ZSTD_CCtx * cctx,const void * dict,size_t dictSize)1024*a28cd43dSSascha Wildner ZSTDLIB_API size_t ZSTD_CCtx_loadDictionary_byReference(
1025*a28cd43dSSascha Wildner ZSTD_CCtx* cctx, const void* dict, size_t dictSize)
1026*a28cd43dSSascha Wildner {
1027*a28cd43dSSascha Wildner return ZSTD_CCtx_loadDictionary_advanced(
1028*a28cd43dSSascha Wildner cctx, dict, dictSize, ZSTD_dlm_byRef, ZSTD_dct_auto);
1029*a28cd43dSSascha Wildner }
1030*a28cd43dSSascha Wildner
ZSTD_CCtx_loadDictionary(ZSTD_CCtx * cctx,const void * dict,size_t dictSize)1031*a28cd43dSSascha Wildner ZSTDLIB_API size_t ZSTD_CCtx_loadDictionary(ZSTD_CCtx* cctx, const void* dict, size_t dictSize)
1032*a28cd43dSSascha Wildner {
1033*a28cd43dSSascha Wildner return ZSTD_CCtx_loadDictionary_advanced(
1034*a28cd43dSSascha Wildner cctx, dict, dictSize, ZSTD_dlm_byCopy, ZSTD_dct_auto);
1035*a28cd43dSSascha Wildner }
1036*a28cd43dSSascha Wildner
1037*a28cd43dSSascha Wildner
/*! ZSTD_CCtx_refCDict() :
 *  Makes `cdict` the active cdict of `cctx`, after dropping any dictionary
 *  previously attached (ZSTD_clearAllDicts()).
 *  Only accepted while `cctx` is in zcss_init stage.
 * @return : 0, or an error code (stage_wrong). */
size_t ZSTD_CCtx_refCDict(ZSTD_CCtx* cctx, const ZSTD_CDict* cdict)
{
    RETURN_ERROR_IF(cctx->streamStage != zcss_init, stage_wrong,
                    "Can't ref a dict when ctx not in init stage.");

    ZSTD_clearAllDicts(cctx);   /* Free the existing local cdict (if any) to save memory. */
    cctx->cdict = cdict;

    return 0;
}
1047*a28cd43dSSascha Wildner
/*! ZSTD_CCtx_refThreadPool() :
 *  Stores `pool` into cctx->pool.
 *  Only accepted while `cctx` is in zcss_init stage.
 * @return : 0, or an error code (stage_wrong). */
size_t ZSTD_CCtx_refThreadPool(ZSTD_CCtx* cctx, ZSTD_threadPool* pool)
{
    RETURN_ERROR_IF(cctx->streamStage != zcss_init, stage_wrong,
                    "Can't ref a pool when ctx not in init stage.");

    cctx->pool = pool;   /* pointer is only recorded here */

    return 0;
}
1055*a28cd43dSSascha Wildner
/*! ZSTD_CCtx_refPrefix() :
 *  Same as ZSTD_CCtx_refPrefix_advanced(),
 *  with content type ZSTD_dct_rawContent. */
size_t ZSTD_CCtx_refPrefix(ZSTD_CCtx* cctx, const void* prefix, size_t prefixSize)
{
    ZSTD_dictContentType_e const contentType = ZSTD_dct_rawContent;
    return ZSTD_CCtx_refPrefix_advanced(cctx, prefix, prefixSize, contentType);
}
1060*a28cd43dSSascha Wildner
/*! ZSTD_CCtx_refPrefix_advanced() :
 *  Records `prefix` (pointer, size and content type) as the prefix dictionary
 *  of `cctx`, after dropping any dictionary previously attached
 *  (ZSTD_clearAllDicts()).
 *  A NULL `prefix` or a zero `prefixSize` records nothing.
 *  Only accepted while `cctx` is in zcss_init stage.
 * @return : 0, or an error code (stage_wrong). */
size_t ZSTD_CCtx_refPrefix_advanced(
        ZSTD_CCtx* cctx, const void* prefix, size_t prefixSize, ZSTD_dictContentType_e dictContentType)
{
    RETURN_ERROR_IF(cctx->streamStage != zcss_init, stage_wrong,
                    "Can't ref a prefix when ctx not in init stage.");

    ZSTD_clearAllDicts(cctx);
    if (prefix == NULL || prefixSize == 0) {
        /* nothing to reference */
        return 0;
    }

    cctx->prefixDict.dict = prefix;
    cctx->prefixDict.dictSize = prefixSize;
    cctx->prefixDict.dictContentType = dictContentType;
    return 0;
}
1074*a28cd43dSSascha Wildner
1075*a28cd43dSSascha Wildner /*! ZSTD_CCtx_reset() :
1076*a28cd43dSSascha Wildner * Also dumps dictionary */
ZSTD_CCtx_reset(ZSTD_CCtx * cctx,ZSTD_ResetDirective reset)1077*a28cd43dSSascha Wildner size_t ZSTD_CCtx_reset(ZSTD_CCtx* cctx, ZSTD_ResetDirective reset)
1078*a28cd43dSSascha Wildner {
1079*a28cd43dSSascha Wildner if ( (reset == ZSTD_reset_session_only)
1080*a28cd43dSSascha Wildner || (reset == ZSTD_reset_session_and_parameters) ) {
1081*a28cd43dSSascha Wildner cctx->streamStage = zcss_init;
1082*a28cd43dSSascha Wildner cctx->pledgedSrcSizePlusOne = 0;
1083*a28cd43dSSascha Wildner }
1084*a28cd43dSSascha Wildner if ( (reset == ZSTD_reset_parameters)
1085*a28cd43dSSascha Wildner || (reset == ZSTD_reset_session_and_parameters) ) {
1086*a28cd43dSSascha Wildner RETURN_ERROR_IF(cctx->streamStage != zcss_init, stage_wrong,
1087*a28cd43dSSascha Wildner "Can't reset parameters only when not in init stage.");
1088*a28cd43dSSascha Wildner ZSTD_clearAllDicts(cctx);
1089*a28cd43dSSascha Wildner return ZSTD_CCtxParams_reset(&cctx->requestedParams);
1090*a28cd43dSSascha Wildner }
1091*a28cd43dSSascha Wildner return 0;
1092*a28cd43dSSascha Wildner }
1093*a28cd43dSSascha Wildner
1094*a28cd43dSSascha Wildner
1095*a28cd43dSSascha Wildner /** ZSTD_checkCParams() :
1096*a28cd43dSSascha Wildner control CParam values remain within authorized range.
1097*a28cd43dSSascha Wildner @return : 0, or an error code if one value is beyond authorized range */
ZSTD_checkCParams(ZSTD_compressionParameters cParams)1098*a28cd43dSSascha Wildner size_t ZSTD_checkCParams(ZSTD_compressionParameters cParams)
1099*a28cd43dSSascha Wildner {
1100*a28cd43dSSascha Wildner BOUNDCHECK(ZSTD_c_windowLog, (int)cParams.windowLog);
1101*a28cd43dSSascha Wildner BOUNDCHECK(ZSTD_c_chainLog, (int)cParams.chainLog);
1102*a28cd43dSSascha Wildner BOUNDCHECK(ZSTD_c_hashLog, (int)cParams.hashLog);
1103*a28cd43dSSascha Wildner BOUNDCHECK(ZSTD_c_searchLog, (int)cParams.searchLog);
1104*a28cd43dSSascha Wildner BOUNDCHECK(ZSTD_c_minMatch, (int)cParams.minMatch);
1105*a28cd43dSSascha Wildner BOUNDCHECK(ZSTD_c_targetLength,(int)cParams.targetLength);
1106*a28cd43dSSascha Wildner BOUNDCHECK(ZSTD_c_strategy, cParams.strategy);
1107*a28cd43dSSascha Wildner return 0;
1108*a28cd43dSSascha Wildner }
1109*a28cd43dSSascha Wildner
1110*a28cd43dSSascha Wildner /** ZSTD_clampCParams() :
1111*a28cd43dSSascha Wildner * make CParam values within valid range.
1112*a28cd43dSSascha Wildner * @return : valid CParams */
1113*a28cd43dSSascha Wildner static ZSTD_compressionParameters
ZSTD_clampCParams(ZSTD_compressionParameters cParams)1114*a28cd43dSSascha Wildner ZSTD_clampCParams(ZSTD_compressionParameters cParams)
1115*a28cd43dSSascha Wildner {
1116*a28cd43dSSascha Wildner # define CLAMP_TYPE(cParam, val, type) { \
1117*a28cd43dSSascha Wildner ZSTD_bounds const bounds = ZSTD_cParam_getBounds(cParam); \
1118*a28cd43dSSascha Wildner if ((int)val<bounds.lowerBound) val=(type)bounds.lowerBound; \
1119*a28cd43dSSascha Wildner else if ((int)val>bounds.upperBound) val=(type)bounds.upperBound; \
1120*a28cd43dSSascha Wildner }
1121*a28cd43dSSascha Wildner # define CLAMP(cParam, val) CLAMP_TYPE(cParam, val, unsigned)
1122*a28cd43dSSascha Wildner CLAMP(ZSTD_c_windowLog, cParams.windowLog);
1123*a28cd43dSSascha Wildner CLAMP(ZSTD_c_chainLog, cParams.chainLog);
1124*a28cd43dSSascha Wildner CLAMP(ZSTD_c_hashLog, cParams.hashLog);
1125*a28cd43dSSascha Wildner CLAMP(ZSTD_c_searchLog, cParams.searchLog);
1126*a28cd43dSSascha Wildner CLAMP(ZSTD_c_minMatch, cParams.minMatch);
1127*a28cd43dSSascha Wildner CLAMP(ZSTD_c_targetLength,cParams.targetLength);
1128*a28cd43dSSascha Wildner CLAMP_TYPE(ZSTD_c_strategy,cParams.strategy, ZSTD_strategy);
1129*a28cd43dSSascha Wildner return cParams;
1130*a28cd43dSSascha Wildner }
1131*a28cd43dSSascha Wildner
1132*a28cd43dSSascha Wildner /** ZSTD_cycleLog() :
1133*a28cd43dSSascha Wildner * condition for correct operation : hashLog > 1 */
ZSTD_cycleLog(U32 hashLog,ZSTD_strategy strat)1134*a28cd43dSSascha Wildner U32 ZSTD_cycleLog(U32 hashLog, ZSTD_strategy strat)
1135*a28cd43dSSascha Wildner {
1136*a28cd43dSSascha Wildner U32 const btScale = ((U32)strat >= (U32)ZSTD_btlazy2);
1137*a28cd43dSSascha Wildner return hashLog - btScale;
1138*a28cd43dSSascha Wildner }
1139*a28cd43dSSascha Wildner
1140*a28cd43dSSascha Wildner /** ZSTD_dictAndWindowLog() :
1141*a28cd43dSSascha Wildner * Returns an adjusted window log that is large enough to fit the source and the dictionary.
1142*a28cd43dSSascha Wildner * The zstd format says that the entire dictionary is valid if one byte of the dictionary
1143*a28cd43dSSascha Wildner * is within the window. So the hashLog and chainLog should be large enough to reference both
1144*a28cd43dSSascha Wildner * the dictionary and the window. So we must use this adjusted dictAndWindowLog when downsizing
1145*a28cd43dSSascha Wildner * the hashLog and windowLog.
1146*a28cd43dSSascha Wildner * NOTE: srcSize must not be ZSTD_CONTENTSIZE_UNKNOWN.
1147*a28cd43dSSascha Wildner */
ZSTD_dictAndWindowLog(U32 windowLog,U64 srcSize,U64 dictSize)1148*a28cd43dSSascha Wildner static U32 ZSTD_dictAndWindowLog(U32 windowLog, U64 srcSize, U64 dictSize)
1149*a28cd43dSSascha Wildner {
1150*a28cd43dSSascha Wildner const U64 maxWindowSize = 1ULL << ZSTD_WINDOWLOG_MAX;
1151*a28cd43dSSascha Wildner /* No dictionary ==> No change */
1152*a28cd43dSSascha Wildner if (dictSize == 0) {
1153*a28cd43dSSascha Wildner return windowLog;
1154*a28cd43dSSascha Wildner }
1155*a28cd43dSSascha Wildner assert(windowLog <= ZSTD_WINDOWLOG_MAX);
1156*a28cd43dSSascha Wildner assert(srcSize != ZSTD_CONTENTSIZE_UNKNOWN); /* Handled in ZSTD_adjustCParams_internal() */
1157*a28cd43dSSascha Wildner {
1158*a28cd43dSSascha Wildner U64 const windowSize = 1ULL << windowLog;
1159*a28cd43dSSascha Wildner U64 const dictAndWindowSize = dictSize + windowSize;
1160*a28cd43dSSascha Wildner /* If the window size is already large enough to fit both the source and the dictionary
1161*a28cd43dSSascha Wildner * then just use the window size. Otherwise adjust so that it fits the dictionary and
1162*a28cd43dSSascha Wildner * the window.
1163*a28cd43dSSascha Wildner */
1164*a28cd43dSSascha Wildner if (windowSize >= dictSize + srcSize) {
1165*a28cd43dSSascha Wildner return windowLog; /* Window size large enough already */
1166*a28cd43dSSascha Wildner } else if (dictAndWindowSize >= maxWindowSize) {
1167*a28cd43dSSascha Wildner return ZSTD_WINDOWLOG_MAX; /* Larger than max window log */
1168*a28cd43dSSascha Wildner } else {
1169*a28cd43dSSascha Wildner return ZSTD_highbit32((U32)dictAndWindowSize - 1) + 1;
1170*a28cd43dSSascha Wildner }
1171*a28cd43dSSascha Wildner }
1172*a28cd43dSSascha Wildner }
1173*a28cd43dSSascha Wildner
1174*a28cd43dSSascha Wildner /** ZSTD_adjustCParams_internal() :
1175*a28cd43dSSascha Wildner * optimize `cPar` for a specified input (`srcSize` and `dictSize`).
1176*a28cd43dSSascha Wildner * mostly downsize to reduce memory consumption and initialization latency.
1177*a28cd43dSSascha Wildner * `srcSize` can be ZSTD_CONTENTSIZE_UNKNOWN when not known.
1178*a28cd43dSSascha Wildner * `mode` is the mode for parameter adjustment. See docs for `ZSTD_cParamMode_e`.
1179*a28cd43dSSascha Wildner * note : `srcSize==0` means 0!
1180*a28cd43dSSascha Wildner * condition : cPar is presumed validated (can be checked using ZSTD_checkCParams()). */
1181*a28cd43dSSascha Wildner static ZSTD_compressionParameters
ZSTD_adjustCParams_internal(ZSTD_compressionParameters cPar,unsigned long long srcSize,size_t dictSize,ZSTD_cParamMode_e mode)1182*a28cd43dSSascha Wildner ZSTD_adjustCParams_internal(ZSTD_compressionParameters cPar,
1183*a28cd43dSSascha Wildner unsigned long long srcSize,
1184*a28cd43dSSascha Wildner size_t dictSize,
1185*a28cd43dSSascha Wildner ZSTD_cParamMode_e mode)
1186*a28cd43dSSascha Wildner {
1187*a28cd43dSSascha Wildner const U64 minSrcSize = 513; /* (1<<9) + 1 */
1188*a28cd43dSSascha Wildner const U64 maxWindowResize = 1ULL << (ZSTD_WINDOWLOG_MAX-1);
1189*a28cd43dSSascha Wildner assert(ZSTD_checkCParams(cPar)==0);
1190*a28cd43dSSascha Wildner
1191*a28cd43dSSascha Wildner if (dictSize && srcSize == ZSTD_CONTENTSIZE_UNKNOWN)
1192*a28cd43dSSascha Wildner srcSize = minSrcSize;
1193*a28cd43dSSascha Wildner
1194*a28cd43dSSascha Wildner switch (mode) {
1195*a28cd43dSSascha Wildner case ZSTD_cpm_noAttachDict:
1196*a28cd43dSSascha Wildner case ZSTD_cpm_unknown:
1197*a28cd43dSSascha Wildner case ZSTD_cpm_createCDict:
1198*a28cd43dSSascha Wildner break;
1199*a28cd43dSSascha Wildner case ZSTD_cpm_attachDict:
1200*a28cd43dSSascha Wildner dictSize = 0;
1201*a28cd43dSSascha Wildner break;
1202*a28cd43dSSascha Wildner default:
1203*a28cd43dSSascha Wildner assert(0);
1204*a28cd43dSSascha Wildner break;
1205*a28cd43dSSascha Wildner }
1206*a28cd43dSSascha Wildner
1207*a28cd43dSSascha Wildner /* resize windowLog if input is small enough, to use less memory */
1208*a28cd43dSSascha Wildner if ( (srcSize < maxWindowResize)
1209*a28cd43dSSascha Wildner && (dictSize < maxWindowResize) ) {
1210*a28cd43dSSascha Wildner U32 const tSize = (U32)(srcSize + dictSize);
1211*a28cd43dSSascha Wildner static U32 const hashSizeMin = 1 << ZSTD_HASHLOG_MIN;
1212*a28cd43dSSascha Wildner U32 const srcLog = (tSize < hashSizeMin) ? ZSTD_HASHLOG_MIN :
1213*a28cd43dSSascha Wildner ZSTD_highbit32(tSize-1) + 1;
1214*a28cd43dSSascha Wildner if (cPar.windowLog > srcLog) cPar.windowLog = srcLog;
1215*a28cd43dSSascha Wildner }
1216*a28cd43dSSascha Wildner { U32 const dictAndWindowLog = ZSTD_dictAndWindowLog(cPar.windowLog, (U64)srcSize, (U64)dictSize);
1217*a28cd43dSSascha Wildner U32 const cycleLog = ZSTD_cycleLog(cPar.chainLog, cPar.strategy);
1218*a28cd43dSSascha Wildner if (cPar.hashLog > dictAndWindowLog+1) cPar.hashLog = dictAndWindowLog+1;
1219*a28cd43dSSascha Wildner if (cycleLog > dictAndWindowLog)
1220*a28cd43dSSascha Wildner cPar.chainLog -= (cycleLog - dictAndWindowLog);
1221*a28cd43dSSascha Wildner }
1222*a28cd43dSSascha Wildner
1223*a28cd43dSSascha Wildner if (cPar.windowLog < ZSTD_WINDOWLOG_ABSOLUTEMIN)
1224*a28cd43dSSascha Wildner cPar.windowLog = ZSTD_WINDOWLOG_ABSOLUTEMIN; /* minimum wlog required for valid frame header */
1225*a28cd43dSSascha Wildner
1226*a28cd43dSSascha Wildner return cPar;
1227*a28cd43dSSascha Wildner }
1228*a28cd43dSSascha Wildner
1229*a28cd43dSSascha Wildner ZSTD_compressionParameters
ZSTD_adjustCParams(ZSTD_compressionParameters cPar,unsigned long long srcSize,size_t dictSize)1230*a28cd43dSSascha Wildner ZSTD_adjustCParams(ZSTD_compressionParameters cPar,
1231*a28cd43dSSascha Wildner unsigned long long srcSize,
1232*a28cd43dSSascha Wildner size_t dictSize)
1233*a28cd43dSSascha Wildner {
1234*a28cd43dSSascha Wildner cPar = ZSTD_clampCParams(cPar); /* resulting cPar is necessarily valid (all parameters within range) */
1235*a28cd43dSSascha Wildner if (srcSize == 0) srcSize = ZSTD_CONTENTSIZE_UNKNOWN;
1236*a28cd43dSSascha Wildner return ZSTD_adjustCParams_internal(cPar, srcSize, dictSize, ZSTD_cpm_unknown);
1237*a28cd43dSSascha Wildner }
1238*a28cd43dSSascha Wildner
1239*a28cd43dSSascha Wildner static ZSTD_compressionParameters ZSTD_getCParams_internal(int compressionLevel, unsigned long long srcSizeHint, size_t dictSize, ZSTD_cParamMode_e mode);
1240*a28cd43dSSascha Wildner static ZSTD_parameters ZSTD_getParams_internal(int compressionLevel, unsigned long long srcSizeHint, size_t dictSize, ZSTD_cParamMode_e mode);
1241*a28cd43dSSascha Wildner
/* ZSTD_overrideCParams() :
 * Copies into `cParams` every field of `overrides` that is non-zero.
 * A zero field in `overrides` leaves the matching `cParams` field untouched. */
static void ZSTD_overrideCParams(
              ZSTD_compressionParameters* cParams,
        const ZSTD_compressionParameters* overrides)
{
    if (overrides->windowLog) {
        cParams->windowLog = overrides->windowLog;
    }
    if (overrides->hashLog) {
        cParams->hashLog = overrides->hashLog;
    }
    if (overrides->chainLog) {
        cParams->chainLog = overrides->chainLog;
    }
    if (overrides->searchLog) {
        cParams->searchLog = overrides->searchLog;
    }
    if (overrides->minMatch) {
        cParams->minMatch = overrides->minMatch;
    }
    if (overrides->targetLength) {
        cParams->targetLength = overrides->targetLength;
    }
    if (overrides->strategy) {
        cParams->strategy = overrides->strategy;
    }
}
1254*a28cd43dSSascha Wildner
ZSTD_getCParamsFromCCtxParams(const ZSTD_CCtx_params * CCtxParams,U64 srcSizeHint,size_t dictSize,ZSTD_cParamMode_e mode)1255*a28cd43dSSascha Wildner ZSTD_compressionParameters ZSTD_getCParamsFromCCtxParams(
1256*a28cd43dSSascha Wildner const ZSTD_CCtx_params* CCtxParams, U64 srcSizeHint, size_t dictSize, ZSTD_cParamMode_e mode)
1257*a28cd43dSSascha Wildner {
1258*a28cd43dSSascha Wildner ZSTD_compressionParameters cParams;
1259*a28cd43dSSascha Wildner if (srcSizeHint == ZSTD_CONTENTSIZE_UNKNOWN && CCtxParams->srcSizeHint > 0) {
1260*a28cd43dSSascha Wildner srcSizeHint = CCtxParams->srcSizeHint;
1261*a28cd43dSSascha Wildner }
1262*a28cd43dSSascha Wildner cParams = ZSTD_getCParams_internal(CCtxParams->compressionLevel, srcSizeHint, dictSize, mode);
1263*a28cd43dSSascha Wildner if (CCtxParams->ldmParams.enableLdm) cParams.windowLog = ZSTD_LDM_DEFAULT_WINDOW_LOG;
1264*a28cd43dSSascha Wildner ZSTD_overrideCParams(&cParams, &CCtxParams->cParams);
1265*a28cd43dSSascha Wildner assert(!ZSTD_checkCParams(cParams));
1266*a28cd43dSSascha Wildner /* srcSizeHint == 0 means 0 */
1267*a28cd43dSSascha Wildner return ZSTD_adjustCParams_internal(cParams, srcSizeHint, dictSize, mode);
1268*a28cd43dSSascha Wildner }
1269*a28cd43dSSascha Wildner
1270*a28cd43dSSascha Wildner static size_t
ZSTD_sizeof_matchState(const ZSTD_compressionParameters * const cParams,const U32 forCCtx)1271*a28cd43dSSascha Wildner ZSTD_sizeof_matchState(const ZSTD_compressionParameters* const cParams,
1272*a28cd43dSSascha Wildner const U32 forCCtx)
1273*a28cd43dSSascha Wildner {
1274*a28cd43dSSascha Wildner size_t const chainSize = (cParams->strategy == ZSTD_fast) ? 0 : ((size_t)1 << cParams->chainLog);
1275*a28cd43dSSascha Wildner size_t const hSize = ((size_t)1) << cParams->hashLog;
1276*a28cd43dSSascha Wildner U32 const hashLog3 = (forCCtx && cParams->minMatch==3) ? MIN(ZSTD_HASHLOG3_MAX, cParams->windowLog) : 0;
1277*a28cd43dSSascha Wildner size_t const h3Size = hashLog3 ? ((size_t)1) << hashLog3 : 0;
1278*a28cd43dSSascha Wildner /* We don't use ZSTD_cwksp_alloc_size() here because the tables aren't
1279*a28cd43dSSascha Wildner * surrounded by redzones in ASAN. */
1280*a28cd43dSSascha Wildner size_t const tableSpace = chainSize * sizeof(U32)
1281*a28cd43dSSascha Wildner + hSize * sizeof(U32)
1282*a28cd43dSSascha Wildner + h3Size * sizeof(U32);
1283*a28cd43dSSascha Wildner size_t const optPotentialSpace =
1284*a28cd43dSSascha Wildner ZSTD_cwksp_alloc_size((MaxML+1) * sizeof(U32))
1285*a28cd43dSSascha Wildner + ZSTD_cwksp_alloc_size((MaxLL+1) * sizeof(U32))
1286*a28cd43dSSascha Wildner + ZSTD_cwksp_alloc_size((MaxOff+1) * sizeof(U32))
1287*a28cd43dSSascha Wildner + ZSTD_cwksp_alloc_size((1<<Litbits) * sizeof(U32))
1288*a28cd43dSSascha Wildner + ZSTD_cwksp_alloc_size((ZSTD_OPT_NUM+1) * sizeof(ZSTD_match_t))
1289*a28cd43dSSascha Wildner + ZSTD_cwksp_alloc_size((ZSTD_OPT_NUM+1) * sizeof(ZSTD_optimal_t));
1290*a28cd43dSSascha Wildner size_t const optSpace = (forCCtx && (cParams->strategy >= ZSTD_btopt))
1291*a28cd43dSSascha Wildner ? optPotentialSpace
1292*a28cd43dSSascha Wildner : 0;
1293*a28cd43dSSascha Wildner DEBUGLOG(4, "chainSize: %u - hSize: %u - h3Size: %u",
1294*a28cd43dSSascha Wildner (U32)chainSize, (U32)hSize, (U32)h3Size);
1295*a28cd43dSSascha Wildner return tableSpace + optSpace;
1296*a28cd43dSSascha Wildner }
1297*a28cd43dSSascha Wildner
ZSTD_estimateCCtxSize_usingCCtxParams_internal(const ZSTD_compressionParameters * cParams,const ldmParams_t * ldmParams,const int isStatic,const size_t buffInSize,const size_t buffOutSize,const U64 pledgedSrcSize)1298*a28cd43dSSascha Wildner static size_t ZSTD_estimateCCtxSize_usingCCtxParams_internal(
1299*a28cd43dSSascha Wildner const ZSTD_compressionParameters* cParams,
1300*a28cd43dSSascha Wildner const ldmParams_t* ldmParams,
1301*a28cd43dSSascha Wildner const int isStatic,
1302*a28cd43dSSascha Wildner const size_t buffInSize,
1303*a28cd43dSSascha Wildner const size_t buffOutSize,
1304*a28cd43dSSascha Wildner const U64 pledgedSrcSize)
1305*a28cd43dSSascha Wildner {
1306*a28cd43dSSascha Wildner size_t const windowSize = MAX(1, (size_t)MIN(((U64)1 << cParams->windowLog), pledgedSrcSize));
1307*a28cd43dSSascha Wildner size_t const blockSize = MIN(ZSTD_BLOCKSIZE_MAX, windowSize);
1308*a28cd43dSSascha Wildner U32 const divider = (cParams->minMatch==3) ? 3 : 4;
1309*a28cd43dSSascha Wildner size_t const maxNbSeq = blockSize / divider;
1310*a28cd43dSSascha Wildner size_t const tokenSpace = ZSTD_cwksp_alloc_size(WILDCOPY_OVERLENGTH + blockSize)
1311*a28cd43dSSascha Wildner + ZSTD_cwksp_alloc_size(maxNbSeq * sizeof(seqDef))
1312*a28cd43dSSascha Wildner + 3 * ZSTD_cwksp_alloc_size(maxNbSeq * sizeof(BYTE));
1313*a28cd43dSSascha Wildner size_t const entropySpace = ZSTD_cwksp_alloc_size(ENTROPY_WORKSPACE_SIZE);
1314*a28cd43dSSascha Wildner size_t const blockStateSpace = 2 * ZSTD_cwksp_alloc_size(sizeof(ZSTD_compressedBlockState_t));
1315*a28cd43dSSascha Wildner size_t const matchStateSize = ZSTD_sizeof_matchState(cParams, /* forCCtx */ 1);
1316*a28cd43dSSascha Wildner
1317*a28cd43dSSascha Wildner size_t const ldmSpace = ZSTD_ldm_getTableSize(*ldmParams);
1318*a28cd43dSSascha Wildner size_t const maxNbLdmSeq = ZSTD_ldm_getMaxNbSeq(*ldmParams, blockSize);
1319*a28cd43dSSascha Wildner size_t const ldmSeqSpace = ldmParams->enableLdm ?
1320*a28cd43dSSascha Wildner ZSTD_cwksp_alloc_size(maxNbLdmSeq * sizeof(rawSeq)) : 0;
1321*a28cd43dSSascha Wildner
1322*a28cd43dSSascha Wildner
1323*a28cd43dSSascha Wildner size_t const bufferSpace = ZSTD_cwksp_alloc_size(buffInSize)
1324*a28cd43dSSascha Wildner + ZSTD_cwksp_alloc_size(buffOutSize);
1325*a28cd43dSSascha Wildner
1326*a28cd43dSSascha Wildner size_t const cctxSpace = isStatic ? ZSTD_cwksp_alloc_size(sizeof(ZSTD_CCtx)) : 0;
1327*a28cd43dSSascha Wildner
1328*a28cd43dSSascha Wildner size_t const neededSpace =
1329*a28cd43dSSascha Wildner cctxSpace +
1330*a28cd43dSSascha Wildner entropySpace +
1331*a28cd43dSSascha Wildner blockStateSpace +
1332*a28cd43dSSascha Wildner ldmSpace +
1333*a28cd43dSSascha Wildner ldmSeqSpace +
1334*a28cd43dSSascha Wildner matchStateSize +
1335*a28cd43dSSascha Wildner tokenSpace +
1336*a28cd43dSSascha Wildner bufferSpace;
1337*a28cd43dSSascha Wildner
1338*a28cd43dSSascha Wildner DEBUGLOG(5, "estimate workspace : %u", (U32)neededSpace);
1339*a28cd43dSSascha Wildner return neededSpace;
1340*a28cd43dSSascha Wildner }
1341*a28cd43dSSascha Wildner
ZSTD_estimateCCtxSize_usingCCtxParams(const ZSTD_CCtx_params * params)1342*a28cd43dSSascha Wildner size_t ZSTD_estimateCCtxSize_usingCCtxParams(const ZSTD_CCtx_params* params)
1343*a28cd43dSSascha Wildner {
1344*a28cd43dSSascha Wildner ZSTD_compressionParameters const cParams =
1345*a28cd43dSSascha Wildner ZSTD_getCParamsFromCCtxParams(params, ZSTD_CONTENTSIZE_UNKNOWN, 0, ZSTD_cpm_noAttachDict);
1346*a28cd43dSSascha Wildner
1347*a28cd43dSSascha Wildner RETURN_ERROR_IF(params->nbWorkers > 0, GENERIC, "Estimate CCtx size is supported for single-threaded compression only.");
1348*a28cd43dSSascha Wildner /* estimateCCtxSize is for one-shot compression. So no buffers should
1349*a28cd43dSSascha Wildner * be needed. However, we still allocate two 0-sized buffers, which can
1350*a28cd43dSSascha Wildner * take space under ASAN. */
1351*a28cd43dSSascha Wildner return ZSTD_estimateCCtxSize_usingCCtxParams_internal(
1352*a28cd43dSSascha Wildner &cParams, ¶ms->ldmParams, 1, 0, 0, ZSTD_CONTENTSIZE_UNKNOWN);
1353*a28cd43dSSascha Wildner }
1354*a28cd43dSSascha Wildner
ZSTD_estimateCCtxSize_usingCParams(ZSTD_compressionParameters cParams)1355*a28cd43dSSascha Wildner size_t ZSTD_estimateCCtxSize_usingCParams(ZSTD_compressionParameters cParams)
1356*a28cd43dSSascha Wildner {
1357*a28cd43dSSascha Wildner ZSTD_CCtx_params const params = ZSTD_makeCCtxParamsFromCParams(cParams);
1358*a28cd43dSSascha Wildner return ZSTD_estimateCCtxSize_usingCCtxParams(¶ms);
1359*a28cd43dSSascha Wildner }
1360*a28cd43dSSascha Wildner
ZSTD_estimateCCtxSize_internal(int compressionLevel)1361*a28cd43dSSascha Wildner static size_t ZSTD_estimateCCtxSize_internal(int compressionLevel)
1362*a28cd43dSSascha Wildner {
1363*a28cd43dSSascha Wildner ZSTD_compressionParameters const cParams = ZSTD_getCParams_internal(compressionLevel, ZSTD_CONTENTSIZE_UNKNOWN, 0, ZSTD_cpm_noAttachDict);
1364*a28cd43dSSascha Wildner return ZSTD_estimateCCtxSize_usingCParams(cParams);
1365*a28cd43dSSascha Wildner }
1366*a28cd43dSSascha Wildner
ZSTD_estimateCCtxSize(int compressionLevel)1367*a28cd43dSSascha Wildner size_t ZSTD_estimateCCtxSize(int compressionLevel)
1368*a28cd43dSSascha Wildner {
1369*a28cd43dSSascha Wildner int level;
1370*a28cd43dSSascha Wildner size_t memBudget = 0;
1371*a28cd43dSSascha Wildner for (level=MIN(compressionLevel, 1); level<=compressionLevel; level++) {
1372*a28cd43dSSascha Wildner size_t const newMB = ZSTD_estimateCCtxSize_internal(level);
1373*a28cd43dSSascha Wildner if (newMB > memBudget) memBudget = newMB;
1374*a28cd43dSSascha Wildner }
1375*a28cd43dSSascha Wildner return memBudget;
1376*a28cd43dSSascha Wildner }
1377*a28cd43dSSascha Wildner
ZSTD_estimateCStreamSize_usingCCtxParams(const ZSTD_CCtx_params * params)1378*a28cd43dSSascha Wildner size_t ZSTD_estimateCStreamSize_usingCCtxParams(const ZSTD_CCtx_params* params)
1379*a28cd43dSSascha Wildner {
1380*a28cd43dSSascha Wildner RETURN_ERROR_IF(params->nbWorkers > 0, GENERIC, "Estimate CCtx size is supported for single-threaded compression only.");
1381*a28cd43dSSascha Wildner { ZSTD_compressionParameters const cParams =
1382*a28cd43dSSascha Wildner ZSTD_getCParamsFromCCtxParams(params, ZSTD_CONTENTSIZE_UNKNOWN, 0, ZSTD_cpm_noAttachDict);
1383*a28cd43dSSascha Wildner size_t const blockSize = MIN(ZSTD_BLOCKSIZE_MAX, (size_t)1 << cParams.windowLog);
1384*a28cd43dSSascha Wildner size_t const inBuffSize = (params->inBufferMode == ZSTD_bm_buffered)
1385*a28cd43dSSascha Wildner ? ((size_t)1 << cParams.windowLog) + blockSize
1386*a28cd43dSSascha Wildner : 0;
1387*a28cd43dSSascha Wildner size_t const outBuffSize = (params->outBufferMode == ZSTD_bm_buffered)
1388*a28cd43dSSascha Wildner ? ZSTD_compressBound(blockSize) + 1
1389*a28cd43dSSascha Wildner : 0;
1390*a28cd43dSSascha Wildner
1391*a28cd43dSSascha Wildner return ZSTD_estimateCCtxSize_usingCCtxParams_internal(
1392*a28cd43dSSascha Wildner &cParams, ¶ms->ldmParams, 1, inBuffSize, outBuffSize,
1393*a28cd43dSSascha Wildner ZSTD_CONTENTSIZE_UNKNOWN);
1394*a28cd43dSSascha Wildner }
1395*a28cd43dSSascha Wildner }
1396*a28cd43dSSascha Wildner
ZSTD_estimateCStreamSize_usingCParams(ZSTD_compressionParameters cParams)1397*a28cd43dSSascha Wildner size_t ZSTD_estimateCStreamSize_usingCParams(ZSTD_compressionParameters cParams)
1398*a28cd43dSSascha Wildner {
1399*a28cd43dSSascha Wildner ZSTD_CCtx_params const params = ZSTD_makeCCtxParamsFromCParams(cParams);
1400*a28cd43dSSascha Wildner return ZSTD_estimateCStreamSize_usingCCtxParams(¶ms);
1401*a28cd43dSSascha Wildner }
1402*a28cd43dSSascha Wildner
ZSTD_estimateCStreamSize_internal(int compressionLevel)1403*a28cd43dSSascha Wildner static size_t ZSTD_estimateCStreamSize_internal(int compressionLevel)
1404*a28cd43dSSascha Wildner {
1405*a28cd43dSSascha Wildner ZSTD_compressionParameters const cParams = ZSTD_getCParams_internal(compressionLevel, ZSTD_CONTENTSIZE_UNKNOWN, 0, ZSTD_cpm_noAttachDict);
1406*a28cd43dSSascha Wildner return ZSTD_estimateCStreamSize_usingCParams(cParams);
1407*a28cd43dSSascha Wildner }
1408*a28cd43dSSascha Wildner
ZSTD_estimateCStreamSize(int compressionLevel)1409*a28cd43dSSascha Wildner size_t ZSTD_estimateCStreamSize(int compressionLevel)
1410*a28cd43dSSascha Wildner {
1411*a28cd43dSSascha Wildner int level;
1412*a28cd43dSSascha Wildner size_t memBudget = 0;
1413*a28cd43dSSascha Wildner for (level=MIN(compressionLevel, 1); level<=compressionLevel; level++) {
1414*a28cd43dSSascha Wildner size_t const newMB = ZSTD_estimateCStreamSize_internal(level);
1415*a28cd43dSSascha Wildner if (newMB > memBudget) memBudget = newMB;
1416*a28cd43dSSascha Wildner }
1417*a28cd43dSSascha Wildner return memBudget;
1418*a28cd43dSSascha Wildner }
1419*a28cd43dSSascha Wildner
1420*a28cd43dSSascha Wildner /* ZSTD_getFrameProgression():
1421*a28cd43dSSascha Wildner * tells how much data has been consumed (input) and produced (output) for current frame.
1422*a28cd43dSSascha Wildner * able to count progression inside worker threads (non-blocking mode).
1423*a28cd43dSSascha Wildner */
ZSTD_getFrameProgression(const ZSTD_CCtx * cctx)1424*a28cd43dSSascha Wildner ZSTD_frameProgression ZSTD_getFrameProgression(const ZSTD_CCtx* cctx)
1425*a28cd43dSSascha Wildner {
1426*a28cd43dSSascha Wildner #ifdef ZSTD_MULTITHREAD
1427*a28cd43dSSascha Wildner if (cctx->appliedParams.nbWorkers > 0) {
1428*a28cd43dSSascha Wildner return ZSTDMT_getFrameProgression(cctx->mtctx);
1429*a28cd43dSSascha Wildner }
1430*a28cd43dSSascha Wildner #endif
1431*a28cd43dSSascha Wildner { ZSTD_frameProgression fp;
1432*a28cd43dSSascha Wildner size_t const buffered = (cctx->inBuff == NULL) ? 0 :
1433*a28cd43dSSascha Wildner cctx->inBuffPos - cctx->inToCompress;
1434*a28cd43dSSascha Wildner if (buffered) assert(cctx->inBuffPos >= cctx->inToCompress);
1435*a28cd43dSSascha Wildner assert(buffered <= ZSTD_BLOCKSIZE_MAX);
1436*a28cd43dSSascha Wildner fp.ingested = cctx->consumedSrcSize + buffered;
1437*a28cd43dSSascha Wildner fp.consumed = cctx->consumedSrcSize;
1438*a28cd43dSSascha Wildner fp.produced = cctx->producedCSize;
1439*a28cd43dSSascha Wildner fp.flushed = cctx->producedCSize; /* simplified; some data might still be left within streaming output buffer */
1440*a28cd43dSSascha Wildner fp.currentJobID = 0;
1441*a28cd43dSSascha Wildner fp.nbActiveWorkers = 0;
1442*a28cd43dSSascha Wildner return fp;
1443*a28cd43dSSascha Wildner } }
1444*a28cd43dSSascha Wildner
1445*a28cd43dSSascha Wildner /*! ZSTD_toFlushNow()
1446*a28cd43dSSascha Wildner * Only useful for multithreading scenarios currently (nbWorkers >= 1).
1447*a28cd43dSSascha Wildner */
ZSTD_toFlushNow(ZSTD_CCtx * cctx)1448*a28cd43dSSascha Wildner size_t ZSTD_toFlushNow(ZSTD_CCtx* cctx)
1449*a28cd43dSSascha Wildner {
1450*a28cd43dSSascha Wildner #ifdef ZSTD_MULTITHREAD
1451*a28cd43dSSascha Wildner if (cctx->appliedParams.nbWorkers > 0) {
1452*a28cd43dSSascha Wildner return ZSTDMT_toFlushNow(cctx->mtctx);
1453*a28cd43dSSascha Wildner }
1454*a28cd43dSSascha Wildner #endif
1455*a28cd43dSSascha Wildner (void)cctx;
1456*a28cd43dSSascha Wildner return 0; /* over-simplification; could also check if context is currently running in streaming mode, and in which case, report how many bytes are left to be flushed within output buffer */
1457*a28cd43dSSascha Wildner }
1458*a28cd43dSSascha Wildner
/* ZSTD_assertEqualCParams() :
 * Debug helper : asserts, field by field, that both parameter sets are identical.
 * Has no effect when assert() is compiled out. */
static void ZSTD_assertEqualCParams(ZSTD_compressionParameters cParams1,
                                    ZSTD_compressionParameters cParams2)
{
    /* silence unused-parameter warnings when assert() expands to nothing */
    (void)cParams1;
    (void)cParams2;

    assert(cParams1.windowLog    == cParams2.windowLog);
    assert(cParams1.chainLog     == cParams2.chainLog);
    assert(cParams1.hashLog      == cParams2.hashLog);
    assert(cParams1.searchLog    == cParams2.searchLog);
    assert(cParams1.minMatch     == cParams2.minMatch);
    assert(cParams1.targetLength == cParams2.targetLength);
    assert(cParams1.strategy     == cParams2.strategy);
}
1472*a28cd43dSSascha Wildner
/* ZSTD_reset_compressedBlockState() :
 * Puts `bs` back to its starting point : repeat offsets are reloaded from
 * repStartValue[], and all entropy repeat modes (Huffman, and the three FSE
 * tables) are set to "none". */
void ZSTD_reset_compressedBlockState(ZSTD_compressedBlockState_t* bs)
{
    int repIdx = 0;
    while (repIdx < ZSTD_REP_NUM) {
        bs->rep[repIdx] = repStartValue[repIdx];
        ++repIdx;
    }

    bs->entropy.huf.repeatMode = HUF_repeat_none;
    bs->entropy.fse.litlength_repeatMode = FSE_repeat_none;
    bs->entropy.fse.offcode_repeatMode = FSE_repeat_none;
    bs->entropy.fse.matchlength_repeatMode = FSE_repeat_none;
}
1483*a28cd43dSSascha Wildner
1484*a28cd43dSSascha Wildner /*! ZSTD_invalidateMatchState()
1485*a28cd43dSSascha Wildner * Invalidate all the matches in the match finder tables.
1486*a28cd43dSSascha Wildner * Requires nextSrc and base to be set (can be NULL).
1487*a28cd43dSSascha Wildner */
ZSTD_invalidateMatchState(ZSTD_matchState_t * ms)1488*a28cd43dSSascha Wildner static void ZSTD_invalidateMatchState(ZSTD_matchState_t* ms)
1489*a28cd43dSSascha Wildner {
1490*a28cd43dSSascha Wildner ZSTD_window_clear(&ms->window);
1491*a28cd43dSSascha Wildner
1492*a28cd43dSSascha Wildner ms->nextToUpdate = ms->window.dictLimit;
1493*a28cd43dSSascha Wildner ms->loadedDictEnd = 0;
1494*a28cd43dSSascha Wildner ms->opt.litLengthSum = 0; /* force reset of btopt stats */
1495*a28cd43dSSascha Wildner ms->dictMatchState = NULL;
1496*a28cd43dSSascha Wildner }
1497*a28cd43dSSascha Wildner
/**
 * Table-cleaning policy for a matchState reset.
 * - ZSTDcrp_makeClean  : the tables must be cleared / prepared for the coming
 *                        compression.
 * - ZSTDcrp_leaveDirty : the tables may be left unclean, because a subsequent
 *                        operation is known to overwrite the table space anyway
 *                        (e.g., copying the matchState contents in from a CDict).
 */
typedef enum {
    ZSTDcrp_makeClean = 0,
    ZSTDcrp_leaveDirty = 1
} ZSTD_compResetPolicy_e;
1509*a28cd43dSSascha Wildner
/**
 * Index policy for a matchState reset.
 * - ZSTDirp_continue : indexing can continue where it left off.
 * - ZSTDirp_reset    : indexing needs to be restarted from zero.
 */
typedef enum {
    ZSTDirp_continue = 0,
    ZSTDirp_reset = 1
} ZSTD_indexResetPolicy_e;
1519*a28cd43dSSascha Wildner
/**
 * Tells ZSTD_reset_matchState() which kind of object owns the matchState
 * being reset : a CDict or a CCtx. Only the CCtx target enables the 3-byte
 * hash table there (and only when minMatch==3).
 */
typedef enum {
    ZSTD_resetTarget_CDict = 0,
    ZSTD_resetTarget_CCtx = 1
} ZSTD_resetTarget_e;
1524*a28cd43dSSascha Wildner
1525*a28cd43dSSascha Wildner static size_t
ZSTD_reset_matchState(ZSTD_matchState_t * ms,ZSTD_cwksp * ws,const ZSTD_compressionParameters * cParams,const ZSTD_compResetPolicy_e crp,const ZSTD_indexResetPolicy_e forceResetIndex,const ZSTD_resetTarget_e forWho)1526*a28cd43dSSascha Wildner ZSTD_reset_matchState(ZSTD_matchState_t* ms,
1527*a28cd43dSSascha Wildner ZSTD_cwksp* ws,
1528*a28cd43dSSascha Wildner const ZSTD_compressionParameters* cParams,
1529*a28cd43dSSascha Wildner const ZSTD_compResetPolicy_e crp,
1530*a28cd43dSSascha Wildner const ZSTD_indexResetPolicy_e forceResetIndex,
1531*a28cd43dSSascha Wildner const ZSTD_resetTarget_e forWho)
1532*a28cd43dSSascha Wildner {
1533*a28cd43dSSascha Wildner size_t const chainSize = (cParams->strategy == ZSTD_fast) ? 0 : ((size_t)1 << cParams->chainLog);
1534*a28cd43dSSascha Wildner size_t const hSize = ((size_t)1) << cParams->hashLog;
1535*a28cd43dSSascha Wildner U32 const hashLog3 = ((forWho == ZSTD_resetTarget_CCtx) && cParams->minMatch==3) ? MIN(ZSTD_HASHLOG3_MAX, cParams->windowLog) : 0;
1536*a28cd43dSSascha Wildner size_t const h3Size = hashLog3 ? ((size_t)1) << hashLog3 : 0;
1537*a28cd43dSSascha Wildner
1538*a28cd43dSSascha Wildner DEBUGLOG(4, "reset indices : %u", forceResetIndex == ZSTDirp_reset);
1539*a28cd43dSSascha Wildner if (forceResetIndex == ZSTDirp_reset) {
1540*a28cd43dSSascha Wildner ZSTD_window_init(&ms->window);
1541*a28cd43dSSascha Wildner ZSTD_cwksp_mark_tables_dirty(ws);
1542*a28cd43dSSascha Wildner }
1543*a28cd43dSSascha Wildner
1544*a28cd43dSSascha Wildner ms->hashLog3 = hashLog3;
1545*a28cd43dSSascha Wildner
1546*a28cd43dSSascha Wildner ZSTD_invalidateMatchState(ms);
1547*a28cd43dSSascha Wildner
1548*a28cd43dSSascha Wildner assert(!ZSTD_cwksp_reserve_failed(ws)); /* check that allocation hasn't already failed */
1549*a28cd43dSSascha Wildner
1550*a28cd43dSSascha Wildner ZSTD_cwksp_clear_tables(ws);
1551*a28cd43dSSascha Wildner
1552*a28cd43dSSascha Wildner DEBUGLOG(5, "reserving table space");
1553*a28cd43dSSascha Wildner /* table Space */
1554*a28cd43dSSascha Wildner ms->hashTable = (U32*)ZSTD_cwksp_reserve_table(ws, hSize * sizeof(U32));
1555*a28cd43dSSascha Wildner ms->chainTable = (U32*)ZSTD_cwksp_reserve_table(ws, chainSize * sizeof(U32));
1556*a28cd43dSSascha Wildner ms->hashTable3 = (U32*)ZSTD_cwksp_reserve_table(ws, h3Size * sizeof(U32));
1557*a28cd43dSSascha Wildner RETURN_ERROR_IF(ZSTD_cwksp_reserve_failed(ws), memory_allocation,
1558*a28cd43dSSascha Wildner "failed a workspace allocation in ZSTD_reset_matchState");
1559*a28cd43dSSascha Wildner
1560*a28cd43dSSascha Wildner DEBUGLOG(4, "reset table : %u", crp!=ZSTDcrp_leaveDirty);
1561*a28cd43dSSascha Wildner if (crp!=ZSTDcrp_leaveDirty) {
1562*a28cd43dSSascha Wildner /* reset tables only */
1563*a28cd43dSSascha Wildner ZSTD_cwksp_clean_tables(ws);
1564*a28cd43dSSascha Wildner }
1565*a28cd43dSSascha Wildner
1566*a28cd43dSSascha Wildner /* opt parser space */
1567*a28cd43dSSascha Wildner if ((forWho == ZSTD_resetTarget_CCtx) && (cParams->strategy >= ZSTD_btopt)) {
1568*a28cd43dSSascha Wildner DEBUGLOG(4, "reserving optimal parser space");
1569*a28cd43dSSascha Wildner ms->opt.litFreq = (unsigned*)ZSTD_cwksp_reserve_aligned(ws, (1<<Litbits) * sizeof(unsigned));
1570*a28cd43dSSascha Wildner ms->opt.litLengthFreq = (unsigned*)ZSTD_cwksp_reserve_aligned(ws, (MaxLL+1) * sizeof(unsigned));
1571*a28cd43dSSascha Wildner ms->opt.matchLengthFreq = (unsigned*)ZSTD_cwksp_reserve_aligned(ws, (MaxML+1) * sizeof(unsigned));
1572*a28cd43dSSascha Wildner ms->opt.offCodeFreq = (unsigned*)ZSTD_cwksp_reserve_aligned(ws, (MaxOff+1) * sizeof(unsigned));
1573*a28cd43dSSascha Wildner ms->opt.matchTable = (ZSTD_match_t*)ZSTD_cwksp_reserve_aligned(ws, (ZSTD_OPT_NUM+1) * sizeof(ZSTD_match_t));
1574*a28cd43dSSascha Wildner ms->opt.priceTable = (ZSTD_optimal_t*)ZSTD_cwksp_reserve_aligned(ws, (ZSTD_OPT_NUM+1) * sizeof(ZSTD_optimal_t));
1575*a28cd43dSSascha Wildner }
1576*a28cd43dSSascha Wildner
1577*a28cd43dSSascha Wildner ms->cParams = *cParams;
1578*a28cd43dSSascha Wildner
1579*a28cd43dSSascha Wildner RETURN_ERROR_IF(ZSTD_cwksp_reserve_failed(ws), memory_allocation,
1580*a28cd43dSSascha Wildner "failed a workspace allocation in ZSTD_reset_matchState");
1581*a28cd43dSSascha Wildner
1582*a28cd43dSSascha Wildner return 0;
1583*a28cd43dSSascha Wildner }
1584*a28cd43dSSascha Wildner
1585*a28cd43dSSascha Wildner /* ZSTD_indexTooCloseToMax() :
1586*a28cd43dSSascha Wildner * minor optimization : prefer memset() rather than reduceIndex()
1587*a28cd43dSSascha Wildner * which is measurably slow in some circumstances (reported for Visual Studio).
1588*a28cd43dSSascha Wildner * Works when re-using a context for a lot of smallish inputs :
1589*a28cd43dSSascha Wildner * if all inputs are smaller than ZSTD_INDEXOVERFLOW_MARGIN,
1590*a28cd43dSSascha Wildner * memset() will be triggered before reduceIndex().
1591*a28cd43dSSascha Wildner */
1592*a28cd43dSSascha Wildner #define ZSTD_INDEXOVERFLOW_MARGIN (16 MB)
ZSTD_indexTooCloseToMax(ZSTD_window_t w)1593*a28cd43dSSascha Wildner static int ZSTD_indexTooCloseToMax(ZSTD_window_t w)
1594*a28cd43dSSascha Wildner {
1595*a28cd43dSSascha Wildner return (size_t)(w.nextSrc - w.base) > (ZSTD_CURRENT_MAX - ZSTD_INDEXOVERFLOW_MARGIN);
1596*a28cd43dSSascha Wildner }
1597*a28cd43dSSascha Wildner
1598*a28cd43dSSascha Wildner /*! ZSTD_resetCCtx_internal() :
1599*a28cd43dSSascha Wildner note : `params` are assumed fully validated at this stage */
ZSTD_resetCCtx_internal(ZSTD_CCtx * zc,ZSTD_CCtx_params params,U64 const pledgedSrcSize,ZSTD_compResetPolicy_e const crp,ZSTD_buffered_policy_e const zbuff)1600*a28cd43dSSascha Wildner static size_t ZSTD_resetCCtx_internal(ZSTD_CCtx* zc,
1601*a28cd43dSSascha Wildner ZSTD_CCtx_params params,
1602*a28cd43dSSascha Wildner U64 const pledgedSrcSize,
1603*a28cd43dSSascha Wildner ZSTD_compResetPolicy_e const crp,
1604*a28cd43dSSascha Wildner ZSTD_buffered_policy_e const zbuff)
1605*a28cd43dSSascha Wildner {
1606*a28cd43dSSascha Wildner ZSTD_cwksp* const ws = &zc->workspace;
1607*a28cd43dSSascha Wildner DEBUGLOG(4, "ZSTD_resetCCtx_internal: pledgedSrcSize=%u, wlog=%u",
1608*a28cd43dSSascha Wildner (U32)pledgedSrcSize, params.cParams.windowLog);
1609*a28cd43dSSascha Wildner assert(!ZSTD_isError(ZSTD_checkCParams(params.cParams)));
1610*a28cd43dSSascha Wildner
1611*a28cd43dSSascha Wildner zc->isFirstBlock = 1;
1612*a28cd43dSSascha Wildner
1613*a28cd43dSSascha Wildner if (params.ldmParams.enableLdm) {
1614*a28cd43dSSascha Wildner /* Adjust long distance matching parameters */
1615*a28cd43dSSascha Wildner ZSTD_ldm_adjustParameters(¶ms.ldmParams, ¶ms.cParams);
1616*a28cd43dSSascha Wildner assert(params.ldmParams.hashLog >= params.ldmParams.bucketSizeLog);
1617*a28cd43dSSascha Wildner assert(params.ldmParams.hashRateLog < 32);
1618*a28cd43dSSascha Wildner zc->ldmState.hashPower = ZSTD_rollingHash_primePower(params.ldmParams.minMatchLength);
1619*a28cd43dSSascha Wildner }
1620*a28cd43dSSascha Wildner
1621*a28cd43dSSascha Wildner { size_t const windowSize = MAX(1, (size_t)MIN(((U64)1 << params.cParams.windowLog), pledgedSrcSize));
1622*a28cd43dSSascha Wildner size_t const blockSize = MIN(ZSTD_BLOCKSIZE_MAX, windowSize);
1623*a28cd43dSSascha Wildner U32 const divider = (params.cParams.minMatch==3) ? 3 : 4;
1624*a28cd43dSSascha Wildner size_t const maxNbSeq = blockSize / divider;
1625*a28cd43dSSascha Wildner size_t const buffOutSize = (zbuff == ZSTDb_buffered && params.outBufferMode == ZSTD_bm_buffered)
1626*a28cd43dSSascha Wildner ? ZSTD_compressBound(blockSize) + 1
1627*a28cd43dSSascha Wildner : 0;
1628*a28cd43dSSascha Wildner size_t const buffInSize = (zbuff == ZSTDb_buffered && params.inBufferMode == ZSTD_bm_buffered)
1629*a28cd43dSSascha Wildner ? windowSize + blockSize
1630*a28cd43dSSascha Wildner : 0;
1631*a28cd43dSSascha Wildner size_t const maxNbLdmSeq = ZSTD_ldm_getMaxNbSeq(params.ldmParams, blockSize);
1632*a28cd43dSSascha Wildner
1633*a28cd43dSSascha Wildner int const indexTooClose = ZSTD_indexTooCloseToMax(zc->blockState.matchState.window);
1634*a28cd43dSSascha Wildner ZSTD_indexResetPolicy_e needsIndexReset =
1635*a28cd43dSSascha Wildner (!indexTooClose && zc->initialized) ? ZSTDirp_continue : ZSTDirp_reset;
1636*a28cd43dSSascha Wildner
1637*a28cd43dSSascha Wildner size_t const neededSpace =
1638*a28cd43dSSascha Wildner ZSTD_estimateCCtxSize_usingCCtxParams_internal(
1639*a28cd43dSSascha Wildner ¶ms.cParams, ¶ms.ldmParams, zc->staticSize != 0,
1640*a28cd43dSSascha Wildner buffInSize, buffOutSize, pledgedSrcSize);
1641*a28cd43dSSascha Wildner FORWARD_IF_ERROR(neededSpace, "cctx size estimate failed!");
1642*a28cd43dSSascha Wildner
1643*a28cd43dSSascha Wildner if (!zc->staticSize) ZSTD_cwksp_bump_oversized_duration(ws, 0);
1644*a28cd43dSSascha Wildner
1645*a28cd43dSSascha Wildner /* Check if workspace is large enough, alloc a new one if needed */
1646*a28cd43dSSascha Wildner {
1647*a28cd43dSSascha Wildner int const workspaceTooSmall = ZSTD_cwksp_sizeof(ws) < neededSpace;
1648*a28cd43dSSascha Wildner int const workspaceWasteful = ZSTD_cwksp_check_wasteful(ws, neededSpace);
1649*a28cd43dSSascha Wildner
1650*a28cd43dSSascha Wildner DEBUGLOG(4, "Need %zu B workspace", neededSpace);
1651*a28cd43dSSascha Wildner DEBUGLOG(4, "windowSize: %zu - blockSize: %zu", windowSize, blockSize);
1652*a28cd43dSSascha Wildner
1653*a28cd43dSSascha Wildner if (workspaceTooSmall || workspaceWasteful) {
1654*a28cd43dSSascha Wildner DEBUGLOG(4, "Resize workspaceSize from %zuKB to %zuKB",
1655*a28cd43dSSascha Wildner ZSTD_cwksp_sizeof(ws) >> 10,
1656*a28cd43dSSascha Wildner neededSpace >> 10);
1657*a28cd43dSSascha Wildner
1658*a28cd43dSSascha Wildner RETURN_ERROR_IF(zc->staticSize, memory_allocation, "static cctx : no resize");
1659*a28cd43dSSascha Wildner
1660*a28cd43dSSascha Wildner needsIndexReset = ZSTDirp_reset;
1661*a28cd43dSSascha Wildner
1662*a28cd43dSSascha Wildner ZSTD_cwksp_free(ws, zc->customMem);
1663*a28cd43dSSascha Wildner FORWARD_IF_ERROR(ZSTD_cwksp_create(ws, neededSpace, zc->customMem), "");
1664*a28cd43dSSascha Wildner
1665*a28cd43dSSascha Wildner DEBUGLOG(5, "reserving object space");
1666*a28cd43dSSascha Wildner /* Statically sized space.
1667*a28cd43dSSascha Wildner * entropyWorkspace never moves,
1668*a28cd43dSSascha Wildner * though prev/next block swap places */
1669*a28cd43dSSascha Wildner assert(ZSTD_cwksp_check_available(ws, 2 * sizeof(ZSTD_compressedBlockState_t)));
1670*a28cd43dSSascha Wildner zc->blockState.prevCBlock = (ZSTD_compressedBlockState_t*) ZSTD_cwksp_reserve_object(ws, sizeof(ZSTD_compressedBlockState_t));
1671*a28cd43dSSascha Wildner RETURN_ERROR_IF(zc->blockState.prevCBlock == NULL, memory_allocation, "couldn't allocate prevCBlock");
1672*a28cd43dSSascha Wildner zc->blockState.nextCBlock = (ZSTD_compressedBlockState_t*) ZSTD_cwksp_reserve_object(ws, sizeof(ZSTD_compressedBlockState_t));
1673*a28cd43dSSascha Wildner RETURN_ERROR_IF(zc->blockState.nextCBlock == NULL, memory_allocation, "couldn't allocate nextCBlock");
1674*a28cd43dSSascha Wildner zc->entropyWorkspace = (U32*) ZSTD_cwksp_reserve_object(ws, ENTROPY_WORKSPACE_SIZE);
1675*a28cd43dSSascha Wildner RETURN_ERROR_IF(zc->blockState.nextCBlock == NULL, memory_allocation, "couldn't allocate entropyWorkspace");
1676*a28cd43dSSascha Wildner } }
1677*a28cd43dSSascha Wildner
1678*a28cd43dSSascha Wildner ZSTD_cwksp_clear(ws);
1679*a28cd43dSSascha Wildner
1680*a28cd43dSSascha Wildner /* init params */
1681*a28cd43dSSascha Wildner zc->appliedParams = params;
1682*a28cd43dSSascha Wildner zc->blockState.matchState.cParams = params.cParams;
1683*a28cd43dSSascha Wildner zc->pledgedSrcSizePlusOne = pledgedSrcSize+1;
1684*a28cd43dSSascha Wildner zc->consumedSrcSize = 0;
1685*a28cd43dSSascha Wildner zc->producedCSize = 0;
1686*a28cd43dSSascha Wildner if (pledgedSrcSize == ZSTD_CONTENTSIZE_UNKNOWN)
1687*a28cd43dSSascha Wildner zc->appliedParams.fParams.contentSizeFlag = 0;
1688*a28cd43dSSascha Wildner DEBUGLOG(4, "pledged content size : %u ; flag : %u",
1689*a28cd43dSSascha Wildner (unsigned)pledgedSrcSize, zc->appliedParams.fParams.contentSizeFlag);
1690*a28cd43dSSascha Wildner zc->blockSize = blockSize;
1691*a28cd43dSSascha Wildner
1692*a28cd43dSSascha Wildner XXH64_reset(&zc->xxhState, 0);
1693*a28cd43dSSascha Wildner zc->stage = ZSTDcs_init;
1694*a28cd43dSSascha Wildner zc->dictID = 0;
1695*a28cd43dSSascha Wildner
1696*a28cd43dSSascha Wildner ZSTD_reset_compressedBlockState(zc->blockState.prevCBlock);
1697*a28cd43dSSascha Wildner
1698*a28cd43dSSascha Wildner /* ZSTD_wildcopy() is used to copy into the literals buffer,
1699*a28cd43dSSascha Wildner * so we have to oversize the buffer by WILDCOPY_OVERLENGTH bytes.
1700*a28cd43dSSascha Wildner */
1701*a28cd43dSSascha Wildner zc->seqStore.litStart = ZSTD_cwksp_reserve_buffer(ws, blockSize + WILDCOPY_OVERLENGTH);
1702*a28cd43dSSascha Wildner zc->seqStore.maxNbLit = blockSize;
1703*a28cd43dSSascha Wildner
1704*a28cd43dSSascha Wildner /* buffers */
1705*a28cd43dSSascha Wildner zc->bufferedPolicy = zbuff;
1706*a28cd43dSSascha Wildner zc->inBuffSize = buffInSize;
1707*a28cd43dSSascha Wildner zc->inBuff = (char*)ZSTD_cwksp_reserve_buffer(ws, buffInSize);
1708*a28cd43dSSascha Wildner zc->outBuffSize = buffOutSize;
1709*a28cd43dSSascha Wildner zc->outBuff = (char*)ZSTD_cwksp_reserve_buffer(ws, buffOutSize);
1710*a28cd43dSSascha Wildner
1711*a28cd43dSSascha Wildner /* ldm bucketOffsets table */
1712*a28cd43dSSascha Wildner if (params.ldmParams.enableLdm) {
1713*a28cd43dSSascha Wildner /* TODO: avoid memset? */
1714*a28cd43dSSascha Wildner size_t const ldmBucketSize =
1715*a28cd43dSSascha Wildner ((size_t)1) << (params.ldmParams.hashLog -
1716*a28cd43dSSascha Wildner params.ldmParams.bucketSizeLog);
1717*a28cd43dSSascha Wildner zc->ldmState.bucketOffsets = ZSTD_cwksp_reserve_buffer(ws, ldmBucketSize);
1718*a28cd43dSSascha Wildner ZSTD_memset(zc->ldmState.bucketOffsets, 0, ldmBucketSize);
1719*a28cd43dSSascha Wildner }
1720*a28cd43dSSascha Wildner
1721*a28cd43dSSascha Wildner /* sequences storage */
1722*a28cd43dSSascha Wildner ZSTD_referenceExternalSequences(zc, NULL, 0);
1723*a28cd43dSSascha Wildner zc->seqStore.maxNbSeq = maxNbSeq;
1724*a28cd43dSSascha Wildner zc->seqStore.llCode = ZSTD_cwksp_reserve_buffer(ws, maxNbSeq * sizeof(BYTE));
1725*a28cd43dSSascha Wildner zc->seqStore.mlCode = ZSTD_cwksp_reserve_buffer(ws, maxNbSeq * sizeof(BYTE));
1726*a28cd43dSSascha Wildner zc->seqStore.ofCode = ZSTD_cwksp_reserve_buffer(ws, maxNbSeq * sizeof(BYTE));
1727*a28cd43dSSascha Wildner zc->seqStore.sequencesStart = (seqDef*)ZSTD_cwksp_reserve_aligned(ws, maxNbSeq * sizeof(seqDef));
1728*a28cd43dSSascha Wildner
1729*a28cd43dSSascha Wildner FORWARD_IF_ERROR(ZSTD_reset_matchState(
1730*a28cd43dSSascha Wildner &zc->blockState.matchState,
1731*a28cd43dSSascha Wildner ws,
1732*a28cd43dSSascha Wildner ¶ms.cParams,
1733*a28cd43dSSascha Wildner crp,
1734*a28cd43dSSascha Wildner needsIndexReset,
1735*a28cd43dSSascha Wildner ZSTD_resetTarget_CCtx), "");
1736*a28cd43dSSascha Wildner
1737*a28cd43dSSascha Wildner /* ldm hash table */
1738*a28cd43dSSascha Wildner if (params.ldmParams.enableLdm) {
1739*a28cd43dSSascha Wildner /* TODO: avoid memset? */
1740*a28cd43dSSascha Wildner size_t const ldmHSize = ((size_t)1) << params.ldmParams.hashLog;
1741*a28cd43dSSascha Wildner zc->ldmState.hashTable = (ldmEntry_t*)ZSTD_cwksp_reserve_aligned(ws, ldmHSize * sizeof(ldmEntry_t));
1742*a28cd43dSSascha Wildner ZSTD_memset(zc->ldmState.hashTable, 0, ldmHSize * sizeof(ldmEntry_t));
1743*a28cd43dSSascha Wildner zc->ldmSequences = (rawSeq*)ZSTD_cwksp_reserve_aligned(ws, maxNbLdmSeq * sizeof(rawSeq));
1744*a28cd43dSSascha Wildner zc->maxNbLdmSequences = maxNbLdmSeq;
1745*a28cd43dSSascha Wildner
1746*a28cd43dSSascha Wildner ZSTD_window_init(&zc->ldmState.window);
1747*a28cd43dSSascha Wildner ZSTD_window_clear(&zc->ldmState.window);
1748*a28cd43dSSascha Wildner zc->ldmState.loadedDictEnd = 0;
1749*a28cd43dSSascha Wildner }
1750*a28cd43dSSascha Wildner
1751*a28cd43dSSascha Wildner /* Due to alignment, when reusing a workspace, we can actually consume
1752*a28cd43dSSascha Wildner * up to 3 extra bytes for alignment. See the comments in zstd_cwksp.h
1753*a28cd43dSSascha Wildner */
1754*a28cd43dSSascha Wildner assert(ZSTD_cwksp_used(ws) >= neededSpace &&
1755*a28cd43dSSascha Wildner ZSTD_cwksp_used(ws) <= neededSpace + 3);
1756*a28cd43dSSascha Wildner
1757*a28cd43dSSascha Wildner DEBUGLOG(3, "wksp: finished allocating, %zd bytes remain available", ZSTD_cwksp_available_space(ws));
1758*a28cd43dSSascha Wildner zc->initialized = 1;
1759*a28cd43dSSascha Wildner
1760*a28cd43dSSascha Wildner return 0;
1761*a28cd43dSSascha Wildner }
1762*a28cd43dSSascha Wildner }
1763*a28cd43dSSascha Wildner
1764*a28cd43dSSascha Wildner /* ZSTD_invalidateRepCodes() :
1765*a28cd43dSSascha Wildner * ensures next compression will not use repcodes from previous block.
1766*a28cd43dSSascha Wildner * Note : only works with regular variant;
1767*a28cd43dSSascha Wildner * do not use with extDict variant ! */
ZSTD_invalidateRepCodes(ZSTD_CCtx * cctx)1768*a28cd43dSSascha Wildner void ZSTD_invalidateRepCodes(ZSTD_CCtx* cctx) {
1769*a28cd43dSSascha Wildner int i;
1770*a28cd43dSSascha Wildner for (i=0; i<ZSTD_REP_NUM; i++) cctx->blockState.prevCBlock->rep[i] = 0;
1771*a28cd43dSSascha Wildner assert(!ZSTD_window_hasExtDict(cctx->blockState.matchState.window));
1772*a28cd43dSSascha Wildner }
1773*a28cd43dSSascha Wildner
1774*a28cd43dSSascha Wildner /* These are the approximate sizes for each strategy past which copying the
1775*a28cd43dSSascha Wildner * dictionary tables into the working context is faster than using them
1776*a28cd43dSSascha Wildner * in-place.
1777*a28cd43dSSascha Wildner */
1778*a28cd43dSSascha Wildner static const size_t attachDictSizeCutoffs[ZSTD_STRATEGY_MAX+1] = {
1779*a28cd43dSSascha Wildner 8 KB, /* unused */
1780*a28cd43dSSascha Wildner 8 KB, /* ZSTD_fast */
1781*a28cd43dSSascha Wildner 16 KB, /* ZSTD_dfast */
1782*a28cd43dSSascha Wildner 32 KB, /* ZSTD_greedy */
1783*a28cd43dSSascha Wildner 32 KB, /* ZSTD_lazy */
1784*a28cd43dSSascha Wildner 32 KB, /* ZSTD_lazy2 */
1785*a28cd43dSSascha Wildner 32 KB, /* ZSTD_btlazy2 */
1786*a28cd43dSSascha Wildner 32 KB, /* ZSTD_btopt */
1787*a28cd43dSSascha Wildner 8 KB, /* ZSTD_btultra */
1788*a28cd43dSSascha Wildner 8 KB /* ZSTD_btultra2 */
1789*a28cd43dSSascha Wildner };
1790*a28cd43dSSascha Wildner
/* ZSTD_shouldAttachDict() :
 * Decides whether `cdict` gets referenced in-place (attached) rather than copied.
 * A cdict using dedicatedDictSearch is always attached.
 * Otherwise, attaching requires that it is neither vetoed by
 * ZSTD_dictForceCopy nor by forceWindow, and that the source is small enough
 * (pledgedSrcSize <= per-strategy cutoff), of unknown size, or that
 * ZSTD_dictForceAttach is requested.
 * @return : 1 to attach, 0 to copy */
static int ZSTD_shouldAttachDict(const ZSTD_CDict* cdict,
                                 const ZSTD_CCtx_params* params,
                                 U64 pledgedSrcSize)
{
    size_t const sizeLimit = attachDictSizeCutoffs[cdict->matchState.cParams.strategy];
    int const usesDDS = cdict->matchState.dedicatedDictSearch;

    if (usesDDS) return 1;

    if (params->attachDictPref == ZSTD_dictForceCopy) return 0;

    /* dictMatchState isn't correctly handled in _enforceMaxDist */
    if (params->forceWindow) return 0;

    if (pledgedSrcSize <= sizeLimit) return 1;
    if (pledgedSrcSize == ZSTD_CONTENTSIZE_UNKNOWN) return 1;
    return params->attachDictPref == ZSTD_dictForceAttach;
}
1805*a28cd43dSSascha Wildner
1806*a28cd43dSSascha Wildner static size_t
ZSTD_resetCCtx_byAttachingCDict(ZSTD_CCtx * cctx,const ZSTD_CDict * cdict,ZSTD_CCtx_params params,U64 pledgedSrcSize,ZSTD_buffered_policy_e zbuff)1807*a28cd43dSSascha Wildner ZSTD_resetCCtx_byAttachingCDict(ZSTD_CCtx* cctx,
1808*a28cd43dSSascha Wildner const ZSTD_CDict* cdict,
1809*a28cd43dSSascha Wildner ZSTD_CCtx_params params,
1810*a28cd43dSSascha Wildner U64 pledgedSrcSize,
1811*a28cd43dSSascha Wildner ZSTD_buffered_policy_e zbuff)
1812*a28cd43dSSascha Wildner {
1813*a28cd43dSSascha Wildner {
1814*a28cd43dSSascha Wildner ZSTD_compressionParameters adjusted_cdict_cParams = cdict->matchState.cParams;
1815*a28cd43dSSascha Wildner unsigned const windowLog = params.cParams.windowLog;
1816*a28cd43dSSascha Wildner assert(windowLog != 0);
1817*a28cd43dSSascha Wildner /* Resize working context table params for input only, since the dict
1818*a28cd43dSSascha Wildner * has its own tables. */
1819*a28cd43dSSascha Wildner /* pledgedSrcSize == 0 means 0! */
1820*a28cd43dSSascha Wildner
1821*a28cd43dSSascha Wildner if (cdict->matchState.dedicatedDictSearch) {
1822*a28cd43dSSascha Wildner ZSTD_dedicatedDictSearch_revertCParams(&adjusted_cdict_cParams);
1823*a28cd43dSSascha Wildner }
1824*a28cd43dSSascha Wildner
1825*a28cd43dSSascha Wildner params.cParams = ZSTD_adjustCParams_internal(adjusted_cdict_cParams, pledgedSrcSize,
1826*a28cd43dSSascha Wildner cdict->dictContentSize, ZSTD_cpm_attachDict);
1827*a28cd43dSSascha Wildner params.cParams.windowLog = windowLog;
1828*a28cd43dSSascha Wildner FORWARD_IF_ERROR(ZSTD_resetCCtx_internal(cctx, params, pledgedSrcSize,
1829*a28cd43dSSascha Wildner ZSTDcrp_makeClean, zbuff), "");
1830*a28cd43dSSascha Wildner assert(cctx->appliedParams.cParams.strategy == adjusted_cdict_cParams.strategy);
1831*a28cd43dSSascha Wildner }
1832*a28cd43dSSascha Wildner
1833*a28cd43dSSascha Wildner { const U32 cdictEnd = (U32)( cdict->matchState.window.nextSrc
1834*a28cd43dSSascha Wildner - cdict->matchState.window.base);
1835*a28cd43dSSascha Wildner const U32 cdictLen = cdictEnd - cdict->matchState.window.dictLimit;
1836*a28cd43dSSascha Wildner if (cdictLen == 0) {
1837*a28cd43dSSascha Wildner /* don't even attach dictionaries with no contents */
1838*a28cd43dSSascha Wildner DEBUGLOG(4, "skipping attaching empty dictionary");
1839*a28cd43dSSascha Wildner } else {
1840*a28cd43dSSascha Wildner DEBUGLOG(4, "attaching dictionary into context");
1841*a28cd43dSSascha Wildner cctx->blockState.matchState.dictMatchState = &cdict->matchState;
1842*a28cd43dSSascha Wildner
1843*a28cd43dSSascha Wildner /* prep working match state so dict matches never have negative indices
1844*a28cd43dSSascha Wildner * when they are translated to the working context's index space. */
1845*a28cd43dSSascha Wildner if (cctx->blockState.matchState.window.dictLimit < cdictEnd) {
1846*a28cd43dSSascha Wildner cctx->blockState.matchState.window.nextSrc =
1847*a28cd43dSSascha Wildner cctx->blockState.matchState.window.base + cdictEnd;
1848*a28cd43dSSascha Wildner ZSTD_window_clear(&cctx->blockState.matchState.window);
1849*a28cd43dSSascha Wildner }
1850*a28cd43dSSascha Wildner /* loadedDictEnd is expressed within the referential of the active context */
1851*a28cd43dSSascha Wildner cctx->blockState.matchState.loadedDictEnd = cctx->blockState.matchState.window.dictLimit;
1852*a28cd43dSSascha Wildner } }
1853*a28cd43dSSascha Wildner
1854*a28cd43dSSascha Wildner cctx->dictID = cdict->dictID;
1855*a28cd43dSSascha Wildner
1856*a28cd43dSSascha Wildner /* copy block state */
1857*a28cd43dSSascha Wildner ZSTD_memcpy(cctx->blockState.prevCBlock, &cdict->cBlockState, sizeof(cdict->cBlockState));
1858*a28cd43dSSascha Wildner
1859*a28cd43dSSascha Wildner return 0;
1860*a28cd43dSSascha Wildner }
1861*a28cd43dSSascha Wildner
/* ZSTD_resetCCtx_byCopyingCDict() :
 * Resets `cctx` with the cdict's compression parameters (keeping the
 * requested windowLog), then duplicates the cdict's hash and chain tables,
 * window, indices, dictID and block state into it. hashTable3 is zeroed.
 * @return : 0, or an error code forwarded from ZSTD_resetCCtx_internal() */
static size_t ZSTD_resetCCtx_byCopyingCDict(ZSTD_CCtx* cctx,
                            const ZSTD_CDict* cdict,
                            ZSTD_CCtx_params params,
                            U64 pledgedSrcSize,
                            ZSTD_buffered_policy_e zbuff)
{
    const ZSTD_matchState_t* const dictMs = &cdict->matchState;
    ZSTD_matchState_t* const ctxMs = &cctx->blockState.matchState;
    const ZSTD_compressionParameters* const dictCParams = &dictMs->cParams;

    assert(!dictMs->dedicatedDictSearch);

    DEBUGLOG(4, "copying dictionary into context");

    /* Compression parameters come from the cdict,
     * except windowLog, which keeps the requested value. */
    {   unsigned const requestedWindowLog = params.cParams.windowLog;
        assert(requestedWindowLog != 0);
        params.cParams = *dictCParams;
        params.cParams.windowLog = requestedWindowLog;
        FORWARD_IF_ERROR(ZSTD_resetCCtx_internal(cctx, params, pledgedSrcSize,
                                                 ZSTDcrp_leaveDirty, zbuff), "");
        assert(cctx->appliedParams.cParams.strategy == dictCParams->strategy);
        assert(cctx->appliedParams.cParams.hashLog == dictCParams->hashLog);
        assert(cctx->appliedParams.cParams.chainLog == dictCParams->chainLog);
    }

    ZSTD_cwksp_mark_tables_dirty(&cctx->workspace);

    /* duplicate hash and chain tables */
    {   size_t const hashEntries = (size_t)1 << dictCParams->hashLog;
        size_t const chainEntries = (dictCParams->strategy == ZSTD_fast)
                                  ? 0
                                  : ((size_t)1 << dictCParams->chainLog);

        ZSTD_memcpy(ctxMs->hashTable, dictMs->hashTable, hashEntries * sizeof(U32));
        ZSTD_memcpy(ctxMs->chainTable, dictMs->chainTable, chainEntries * sizeof(U32));
    }

    /* Zero the hashTable3, since the cdict never fills it */
    {   int const h3log = ctxMs->hashLog3;
        size_t const hash3Entries = h3log ? ((size_t)1 << h3log) : 0;
        assert(dictMs->hashLog3 == 0);
        ZSTD_memset(ctxMs->hashTable3, 0, hash3Entries * sizeof(U32));
    }

    ZSTD_cwksp_mark_tables_clean(&cctx->workspace);

    /* copy dictionary offsets */
    ctxMs->window        = dictMs->window;
    ctxMs->nextToUpdate  = dictMs->nextToUpdate;
    ctxMs->loadedDictEnd = dictMs->loadedDictEnd;

    cctx->dictID = cdict->dictID;

    /* copy block state */
    ZSTD_memcpy(cctx->blockState.prevCBlock, &cdict->cBlockState, sizeof(cdict->cBlockState));

    return 0;
}
1924*a28cd43dSSascha Wildner
1925*a28cd43dSSascha Wildner /* We have a choice between copying the dictionary context into the working
1926*a28cd43dSSascha Wildner * context, or referencing the dictionary context from the working context
1927*a28cd43dSSascha Wildner * in-place. We decide here which strategy to use. */
ZSTD_resetCCtx_usingCDict(ZSTD_CCtx * cctx,const ZSTD_CDict * cdict,const ZSTD_CCtx_params * params,U64 pledgedSrcSize,ZSTD_buffered_policy_e zbuff)1928*a28cd43dSSascha Wildner static size_t ZSTD_resetCCtx_usingCDict(ZSTD_CCtx* cctx,
1929*a28cd43dSSascha Wildner const ZSTD_CDict* cdict,
1930*a28cd43dSSascha Wildner const ZSTD_CCtx_params* params,
1931*a28cd43dSSascha Wildner U64 pledgedSrcSize,
1932*a28cd43dSSascha Wildner ZSTD_buffered_policy_e zbuff)
1933*a28cd43dSSascha Wildner {
1934*a28cd43dSSascha Wildner
1935*a28cd43dSSascha Wildner DEBUGLOG(4, "ZSTD_resetCCtx_usingCDict (pledgedSrcSize=%u)",
1936*a28cd43dSSascha Wildner (unsigned)pledgedSrcSize);
1937*a28cd43dSSascha Wildner
1938*a28cd43dSSascha Wildner if (ZSTD_shouldAttachDict(cdict, params, pledgedSrcSize)) {
1939*a28cd43dSSascha Wildner return ZSTD_resetCCtx_byAttachingCDict(
1940*a28cd43dSSascha Wildner cctx, cdict, *params, pledgedSrcSize, zbuff);
1941*a28cd43dSSascha Wildner } else {
1942*a28cd43dSSascha Wildner return ZSTD_resetCCtx_byCopyingCDict(
1943*a28cd43dSSascha Wildner cctx, cdict, *params, pledgedSrcSize, zbuff);
1944*a28cd43dSSascha Wildner }
1945*a28cd43dSSascha Wildner }
1946*a28cd43dSSascha Wildner
1947*a28cd43dSSascha Wildner /*! ZSTD_copyCCtx_internal() :
1948*a28cd43dSSascha Wildner * Duplicate an existing context `srcCCtx` into another one `dstCCtx`.
1949*a28cd43dSSascha Wildner * Only works during stage ZSTDcs_init (i.e. after creation, but before first call to ZSTD_compressContinue()).
1950*a28cd43dSSascha Wildner * The "context", in this case, refers to the hash and chain tables,
1951*a28cd43dSSascha Wildner * entropy tables, and dictionary references.
1952*a28cd43dSSascha Wildner * `windowLog` value is enforced if != 0, otherwise value is copied from srcCCtx.
1953*a28cd43dSSascha Wildner * @return : 0, or an error code */
ZSTD_copyCCtx_internal(ZSTD_CCtx * dstCCtx,const ZSTD_CCtx * srcCCtx,ZSTD_frameParameters fParams,U64 pledgedSrcSize,ZSTD_buffered_policy_e zbuff)1954*a28cd43dSSascha Wildner static size_t ZSTD_copyCCtx_internal(ZSTD_CCtx* dstCCtx,
1955*a28cd43dSSascha Wildner const ZSTD_CCtx* srcCCtx,
1956*a28cd43dSSascha Wildner ZSTD_frameParameters fParams,
1957*a28cd43dSSascha Wildner U64 pledgedSrcSize,
1958*a28cd43dSSascha Wildner ZSTD_buffered_policy_e zbuff)
1959*a28cd43dSSascha Wildner {
1960*a28cd43dSSascha Wildner DEBUGLOG(5, "ZSTD_copyCCtx_internal");
1961*a28cd43dSSascha Wildner RETURN_ERROR_IF(srcCCtx->stage!=ZSTDcs_init, stage_wrong,
1962*a28cd43dSSascha Wildner "Can't copy a ctx that's not in init stage.");
1963*a28cd43dSSascha Wildner
1964*a28cd43dSSascha Wildner ZSTD_memcpy(&dstCCtx->customMem, &srcCCtx->customMem, sizeof(ZSTD_customMem));
1965*a28cd43dSSascha Wildner { ZSTD_CCtx_params params = dstCCtx->requestedParams;
1966*a28cd43dSSascha Wildner /* Copy only compression parameters related to tables. */
1967*a28cd43dSSascha Wildner params.cParams = srcCCtx->appliedParams.cParams;
1968*a28cd43dSSascha Wildner params.fParams = fParams;
1969*a28cd43dSSascha Wildner ZSTD_resetCCtx_internal(dstCCtx, params, pledgedSrcSize,
1970*a28cd43dSSascha Wildner ZSTDcrp_leaveDirty, zbuff);
1971*a28cd43dSSascha Wildner assert(dstCCtx->appliedParams.cParams.windowLog == srcCCtx->appliedParams.cParams.windowLog);
1972*a28cd43dSSascha Wildner assert(dstCCtx->appliedParams.cParams.strategy == srcCCtx->appliedParams.cParams.strategy);
1973*a28cd43dSSascha Wildner assert(dstCCtx->appliedParams.cParams.hashLog == srcCCtx->appliedParams.cParams.hashLog);
1974*a28cd43dSSascha Wildner assert(dstCCtx->appliedParams.cParams.chainLog == srcCCtx->appliedParams.cParams.chainLog);
1975*a28cd43dSSascha Wildner assert(dstCCtx->blockState.matchState.hashLog3 == srcCCtx->blockState.matchState.hashLog3);
1976*a28cd43dSSascha Wildner }
1977*a28cd43dSSascha Wildner
1978*a28cd43dSSascha Wildner ZSTD_cwksp_mark_tables_dirty(&dstCCtx->workspace);
1979*a28cd43dSSascha Wildner
1980*a28cd43dSSascha Wildner /* copy tables */
1981*a28cd43dSSascha Wildner { size_t const chainSize = (srcCCtx->appliedParams.cParams.strategy == ZSTD_fast) ? 0 : ((size_t)1 << srcCCtx->appliedParams.cParams.chainLog);
1982*a28cd43dSSascha Wildner size_t const hSize = (size_t)1 << srcCCtx->appliedParams.cParams.hashLog;
1983*a28cd43dSSascha Wildner int const h3log = srcCCtx->blockState.matchState.hashLog3;
1984*a28cd43dSSascha Wildner size_t const h3Size = h3log ? ((size_t)1 << h3log) : 0;
1985*a28cd43dSSascha Wildner
1986*a28cd43dSSascha Wildner ZSTD_memcpy(dstCCtx->blockState.matchState.hashTable,
1987*a28cd43dSSascha Wildner srcCCtx->blockState.matchState.hashTable,
1988*a28cd43dSSascha Wildner hSize * sizeof(U32));
1989*a28cd43dSSascha Wildner ZSTD_memcpy(dstCCtx->blockState.matchState.chainTable,
1990*a28cd43dSSascha Wildner srcCCtx->blockState.matchState.chainTable,
1991*a28cd43dSSascha Wildner chainSize * sizeof(U32));
1992*a28cd43dSSascha Wildner ZSTD_memcpy(dstCCtx->blockState.matchState.hashTable3,
1993*a28cd43dSSascha Wildner srcCCtx->blockState.matchState.hashTable3,
1994*a28cd43dSSascha Wildner h3Size * sizeof(U32));
1995*a28cd43dSSascha Wildner }
1996*a28cd43dSSascha Wildner
1997*a28cd43dSSascha Wildner ZSTD_cwksp_mark_tables_clean(&dstCCtx->workspace);
1998*a28cd43dSSascha Wildner
1999*a28cd43dSSascha Wildner /* copy dictionary offsets */
2000*a28cd43dSSascha Wildner {
2001*a28cd43dSSascha Wildner const ZSTD_matchState_t* srcMatchState = &srcCCtx->blockState.matchState;
2002*a28cd43dSSascha Wildner ZSTD_matchState_t* dstMatchState = &dstCCtx->blockState.matchState;
2003*a28cd43dSSascha Wildner dstMatchState->window = srcMatchState->window;
2004*a28cd43dSSascha Wildner dstMatchState->nextToUpdate = srcMatchState->nextToUpdate;
2005*a28cd43dSSascha Wildner dstMatchState->loadedDictEnd= srcMatchState->loadedDictEnd;
2006*a28cd43dSSascha Wildner }
2007*a28cd43dSSascha Wildner dstCCtx->dictID = srcCCtx->dictID;
2008*a28cd43dSSascha Wildner
2009*a28cd43dSSascha Wildner /* copy block state */
2010*a28cd43dSSascha Wildner ZSTD_memcpy(dstCCtx->blockState.prevCBlock, srcCCtx->blockState.prevCBlock, sizeof(*srcCCtx->blockState.prevCBlock));
2011*a28cd43dSSascha Wildner
2012*a28cd43dSSascha Wildner return 0;
2013*a28cd43dSSascha Wildner }
2014*a28cd43dSSascha Wildner
2015*a28cd43dSSascha Wildner /*! ZSTD_copyCCtx() :
2016*a28cd43dSSascha Wildner * Duplicate an existing context `srcCCtx` into another one `dstCCtx`.
2017*a28cd43dSSascha Wildner * Only works during stage ZSTDcs_init (i.e. after creation, but before first call to ZSTD_compressContinue()).
2018*a28cd43dSSascha Wildner * pledgedSrcSize==0 means "unknown".
2019*a28cd43dSSascha Wildner * @return : 0, or an error code */
ZSTD_copyCCtx(ZSTD_CCtx * dstCCtx,const ZSTD_CCtx * srcCCtx,unsigned long long pledgedSrcSize)2020*a28cd43dSSascha Wildner size_t ZSTD_copyCCtx(ZSTD_CCtx* dstCCtx, const ZSTD_CCtx* srcCCtx, unsigned long long pledgedSrcSize)
2021*a28cd43dSSascha Wildner {
2022*a28cd43dSSascha Wildner ZSTD_frameParameters fParams = { 1 /*content*/, 0 /*checksum*/, 0 /*noDictID*/ };
2023*a28cd43dSSascha Wildner ZSTD_buffered_policy_e const zbuff = srcCCtx->bufferedPolicy;
2024*a28cd43dSSascha Wildner ZSTD_STATIC_ASSERT((U32)ZSTDb_buffered==1);
2025*a28cd43dSSascha Wildner if (pledgedSrcSize==0) pledgedSrcSize = ZSTD_CONTENTSIZE_UNKNOWN;
2026*a28cd43dSSascha Wildner fParams.contentSizeFlag = (pledgedSrcSize != ZSTD_CONTENTSIZE_UNKNOWN);
2027*a28cd43dSSascha Wildner
2028*a28cd43dSSascha Wildner return ZSTD_copyCCtx_internal(dstCCtx, srcCCtx,
2029*a28cd43dSSascha Wildner fParams, pledgedSrcSize,
2030*a28cd43dSSascha Wildner zbuff);
2031*a28cd43dSSascha Wildner }
2032*a28cd43dSSascha Wildner
2033*a28cd43dSSascha Wildner
2034*a28cd43dSSascha Wildner #define ZSTD_ROWSIZE 16
2035*a28cd43dSSascha Wildner /*! ZSTD_reduceTable() :
2036*a28cd43dSSascha Wildner * reduce table indexes by `reducerValue`, or squash to zero.
2037*a28cd43dSSascha Wildner * PreserveMark preserves "unsorted mark" for btlazy2 strategy.
2038*a28cd43dSSascha Wildner * It must be set to a clear 0/1 value, to remove branch during inlining.
2039*a28cd43dSSascha Wildner * Presume table size is a multiple of ZSTD_ROWSIZE
2040*a28cd43dSSascha Wildner * to help auto-vectorization */
2041*a28cd43dSSascha Wildner FORCE_INLINE_TEMPLATE void
ZSTD_reduceTable_internal(U32 * const table,U32 const size,U32 const reducerValue,int const preserveMark)2042*a28cd43dSSascha Wildner ZSTD_reduceTable_internal (U32* const table, U32 const size, U32 const reducerValue, int const preserveMark)
2043*a28cd43dSSascha Wildner {
2044*a28cd43dSSascha Wildner int const nbRows = (int)size / ZSTD_ROWSIZE;
2045*a28cd43dSSascha Wildner int cellNb = 0;
2046*a28cd43dSSascha Wildner int rowNb;
2047*a28cd43dSSascha Wildner assert((size & (ZSTD_ROWSIZE-1)) == 0); /* multiple of ZSTD_ROWSIZE */
2048*a28cd43dSSascha Wildner assert(size < (1U<<31)); /* can be casted to int */
2049*a28cd43dSSascha Wildner
2050*a28cd43dSSascha Wildner #if ZSTD_MEMORY_SANITIZER && !defined (ZSTD_MSAN_DONT_POISON_WORKSPACE)
2051*a28cd43dSSascha Wildner /* To validate that the table re-use logic is sound, and that we don't
2052*a28cd43dSSascha Wildner * access table space that we haven't cleaned, we re-"poison" the table
2053*a28cd43dSSascha Wildner * space every time we mark it dirty.
2054*a28cd43dSSascha Wildner *
2055*a28cd43dSSascha Wildner * This function however is intended to operate on those dirty tables and
2056*a28cd43dSSascha Wildner * re-clean them. So when this function is used correctly, we can unpoison
2057*a28cd43dSSascha Wildner * the memory it operated on. This introduces a blind spot though, since
2058*a28cd43dSSascha Wildner * if we now try to operate on __actually__ poisoned memory, we will not
2059*a28cd43dSSascha Wildner * detect that. */
2060*a28cd43dSSascha Wildner __msan_unpoison(table, size * sizeof(U32));
2061*a28cd43dSSascha Wildner #endif
2062*a28cd43dSSascha Wildner
2063*a28cd43dSSascha Wildner for (rowNb=0 ; rowNb < nbRows ; rowNb++) {
2064*a28cd43dSSascha Wildner int column;
2065*a28cd43dSSascha Wildner for (column=0; column<ZSTD_ROWSIZE; column++) {
2066*a28cd43dSSascha Wildner if (preserveMark) {
2067*a28cd43dSSascha Wildner U32 const adder = (table[cellNb] == ZSTD_DUBT_UNSORTED_MARK) ? reducerValue : 0;
2068*a28cd43dSSascha Wildner table[cellNb] += adder;
2069*a28cd43dSSascha Wildner }
2070*a28cd43dSSascha Wildner if (table[cellNb] < reducerValue) table[cellNb] = 0;
2071*a28cd43dSSascha Wildner else table[cellNb] -= reducerValue;
2072*a28cd43dSSascha Wildner cellNb++;
2073*a28cd43dSSascha Wildner } }
2074*a28cd43dSSascha Wildner }
2075*a28cd43dSSascha Wildner
/* ZSTD_reduceTable() :
 * Plain variant of ZSTD_reduceTable_internal() : no mark preservation. */
static void ZSTD_reduceTable(U32* const table, U32 const size, U32 const reducerValue)
{
    ZSTD_reduceTable_internal(table, size, reducerValue, 0 /* preserveMark */);
}
2080*a28cd43dSSascha Wildner
/* ZSTD_reduceTable_btlazy2() :
 * Variant of ZSTD_reduceTable_internal() which keeps
 * ZSTD_DUBT_UNSORTED_MARK entries intact. */
static void ZSTD_reduceTable_btlazy2(U32* const table, U32 const size, U32 const reducerValue)
{
    ZSTD_reduceTable_internal(table, size, reducerValue, 1 /* preserveMark */);
}
2085*a28cd43dSSascha Wildner
2086*a28cd43dSSascha Wildner /*! ZSTD_reduceIndex() :
2087*a28cd43dSSascha Wildner * rescale all indexes to avoid future overflow (indexes are U32) */
ZSTD_reduceIndex(ZSTD_matchState_t * ms,ZSTD_CCtx_params const * params,const U32 reducerValue)2088*a28cd43dSSascha Wildner static void ZSTD_reduceIndex (ZSTD_matchState_t* ms, ZSTD_CCtx_params const* params, const U32 reducerValue)
2089*a28cd43dSSascha Wildner {
2090*a28cd43dSSascha Wildner { U32 const hSize = (U32)1 << params->cParams.hashLog;
2091*a28cd43dSSascha Wildner ZSTD_reduceTable(ms->hashTable, hSize, reducerValue);
2092*a28cd43dSSascha Wildner }
2093*a28cd43dSSascha Wildner
2094*a28cd43dSSascha Wildner if (params->cParams.strategy != ZSTD_fast) {
2095*a28cd43dSSascha Wildner U32 const chainSize = (U32)1 << params->cParams.chainLog;
2096*a28cd43dSSascha Wildner if (params->cParams.strategy == ZSTD_btlazy2)
2097*a28cd43dSSascha Wildner ZSTD_reduceTable_btlazy2(ms->chainTable, chainSize, reducerValue);
2098*a28cd43dSSascha Wildner else
2099*a28cd43dSSascha Wildner ZSTD_reduceTable(ms->chainTable, chainSize, reducerValue);
2100*a28cd43dSSascha Wildner }
2101*a28cd43dSSascha Wildner
2102*a28cd43dSSascha Wildner if (ms->hashLog3) {
2103*a28cd43dSSascha Wildner U32 const h3Size = (U32)1 << ms->hashLog3;
2104*a28cd43dSSascha Wildner ZSTD_reduceTable(ms->hashTable3, h3Size, reducerValue);
2105*a28cd43dSSascha Wildner }
2106*a28cd43dSSascha Wildner }
2107*a28cd43dSSascha Wildner
2108*a28cd43dSSascha Wildner
2109*a28cd43dSSascha Wildner /*-*******************************************************
2110*a28cd43dSSascha Wildner * Block entropic compression
2111*a28cd43dSSascha Wildner *********************************************************/
2112*a28cd43dSSascha Wildner
2113*a28cd43dSSascha Wildner /* See doc/zstd_compression_format.md for detailed format description */
2114*a28cd43dSSascha Wildner
ZSTD_seqToCodes(const seqStore_t * seqStorePtr)2115*a28cd43dSSascha Wildner void ZSTD_seqToCodes(const seqStore_t* seqStorePtr)
2116*a28cd43dSSascha Wildner {
2117*a28cd43dSSascha Wildner const seqDef* const sequences = seqStorePtr->sequencesStart;
2118*a28cd43dSSascha Wildner BYTE* const llCodeTable = seqStorePtr->llCode;
2119*a28cd43dSSascha Wildner BYTE* const ofCodeTable = seqStorePtr->ofCode;
2120*a28cd43dSSascha Wildner BYTE* const mlCodeTable = seqStorePtr->mlCode;
2121*a28cd43dSSascha Wildner U32 const nbSeq = (U32)(seqStorePtr->sequences - seqStorePtr->sequencesStart);
2122*a28cd43dSSascha Wildner U32 u;
2123*a28cd43dSSascha Wildner assert(nbSeq <= seqStorePtr->maxNbSeq);
2124*a28cd43dSSascha Wildner for (u=0; u<nbSeq; u++) {
2125*a28cd43dSSascha Wildner U32 const llv = sequences[u].litLength;
2126*a28cd43dSSascha Wildner U32 const mlv = sequences[u].matchLength;
2127*a28cd43dSSascha Wildner llCodeTable[u] = (BYTE)ZSTD_LLcode(llv);
2128*a28cd43dSSascha Wildner ofCodeTable[u] = (BYTE)ZSTD_highbit32(sequences[u].offset);
2129*a28cd43dSSascha Wildner mlCodeTable[u] = (BYTE)ZSTD_MLcode(mlv);
2130*a28cd43dSSascha Wildner }
2131*a28cd43dSSascha Wildner if (seqStorePtr->longLengthID==1)
2132*a28cd43dSSascha Wildner llCodeTable[seqStorePtr->longLengthPos] = MaxLL;
2133*a28cd43dSSascha Wildner if (seqStorePtr->longLengthID==2)
2134*a28cd43dSSascha Wildner mlCodeTable[seqStorePtr->longLengthPos] = MaxML;
2135*a28cd43dSSascha Wildner }
2136*a28cd43dSSascha Wildner
2137*a28cd43dSSascha Wildner /* ZSTD_useTargetCBlockSize():
2138*a28cd43dSSascha Wildner * Returns if target compressed block size param is being used.
2139*a28cd43dSSascha Wildner * If used, compression will do best effort to make a compressed block size to be around targetCBlockSize.
2140*a28cd43dSSascha Wildner * Returns 1 if true, 0 otherwise. */
ZSTD_useTargetCBlockSize(const ZSTD_CCtx_params * cctxParams)2141*a28cd43dSSascha Wildner static int ZSTD_useTargetCBlockSize(const ZSTD_CCtx_params* cctxParams)
2142*a28cd43dSSascha Wildner {
2143*a28cd43dSSascha Wildner DEBUGLOG(5, "ZSTD_useTargetCBlockSize (targetCBlockSize=%zu)", cctxParams->targetCBlockSize);
2144*a28cd43dSSascha Wildner return (cctxParams->targetCBlockSize != 0);
2145*a28cd43dSSascha Wildner }
2146*a28cd43dSSascha Wildner
2147*a28cd43dSSascha Wildner /* ZSTD_entropyCompressSequences_internal():
2148*a28cd43dSSascha Wildner * actually compresses both literals and sequences */
2149*a28cd43dSSascha Wildner MEM_STATIC size_t
ZSTD_entropyCompressSequences_internal(seqStore_t * seqStorePtr,const ZSTD_entropyCTables_t * prevEntropy,ZSTD_entropyCTables_t * nextEntropy,const ZSTD_CCtx_params * cctxParams,void * dst,size_t dstCapacity,void * entropyWorkspace,size_t entropyWkspSize,const int bmi2)2150*a28cd43dSSascha Wildner ZSTD_entropyCompressSequences_internal(seqStore_t* seqStorePtr,
2151*a28cd43dSSascha Wildner const ZSTD_entropyCTables_t* prevEntropy,
2152*a28cd43dSSascha Wildner ZSTD_entropyCTables_t* nextEntropy,
2153*a28cd43dSSascha Wildner const ZSTD_CCtx_params* cctxParams,
2154*a28cd43dSSascha Wildner void* dst, size_t dstCapacity,
2155*a28cd43dSSascha Wildner void* entropyWorkspace, size_t entropyWkspSize,
2156*a28cd43dSSascha Wildner const int bmi2)
2157*a28cd43dSSascha Wildner {
2158*a28cd43dSSascha Wildner const int longOffsets = cctxParams->cParams.windowLog > STREAM_ACCUMULATOR_MIN;
2159*a28cd43dSSascha Wildner ZSTD_strategy const strategy = cctxParams->cParams.strategy;
2160*a28cd43dSSascha Wildner unsigned* count = (unsigned*)entropyWorkspace;
2161*a28cd43dSSascha Wildner FSE_CTable* CTable_LitLength = nextEntropy->fse.litlengthCTable;
2162*a28cd43dSSascha Wildner FSE_CTable* CTable_OffsetBits = nextEntropy->fse.offcodeCTable;
2163*a28cd43dSSascha Wildner FSE_CTable* CTable_MatchLength = nextEntropy->fse.matchlengthCTable;
2164*a28cd43dSSascha Wildner U32 LLtype, Offtype, MLtype; /* compressed, raw or rle */
2165*a28cd43dSSascha Wildner const seqDef* const sequences = seqStorePtr->sequencesStart;
2166*a28cd43dSSascha Wildner const BYTE* const ofCodeTable = seqStorePtr->ofCode;
2167*a28cd43dSSascha Wildner const BYTE* const llCodeTable = seqStorePtr->llCode;
2168*a28cd43dSSascha Wildner const BYTE* const mlCodeTable = seqStorePtr->mlCode;
2169*a28cd43dSSascha Wildner BYTE* const ostart = (BYTE*)dst;
2170*a28cd43dSSascha Wildner BYTE* const oend = ostart + dstCapacity;
2171*a28cd43dSSascha Wildner BYTE* op = ostart;
2172*a28cd43dSSascha Wildner size_t const nbSeq = (size_t)(seqStorePtr->sequences - seqStorePtr->sequencesStart);
2173*a28cd43dSSascha Wildner BYTE* seqHead;
2174*a28cd43dSSascha Wildner BYTE* lastNCount = NULL;
2175*a28cd43dSSascha Wildner
2176*a28cd43dSSascha Wildner entropyWorkspace = count + (MaxSeq + 1);
2177*a28cd43dSSascha Wildner entropyWkspSize -= (MaxSeq + 1) * sizeof(*count);
2178*a28cd43dSSascha Wildner
2179*a28cd43dSSascha Wildner DEBUGLOG(4, "ZSTD_entropyCompressSequences_internal (nbSeq=%zu)", nbSeq);
2180*a28cd43dSSascha Wildner ZSTD_STATIC_ASSERT(HUF_WORKSPACE_SIZE >= (1<<MAX(MLFSELog,LLFSELog)));
2181*a28cd43dSSascha Wildner assert(entropyWkspSize >= HUF_WORKSPACE_SIZE);
2182*a28cd43dSSascha Wildner
2183*a28cd43dSSascha Wildner /* Compress literals */
2184*a28cd43dSSascha Wildner { const BYTE* const literals = seqStorePtr->litStart;
2185*a28cd43dSSascha Wildner size_t const litSize = (size_t)(seqStorePtr->lit - literals);
2186*a28cd43dSSascha Wildner size_t const cSize = ZSTD_compressLiterals(
2187*a28cd43dSSascha Wildner &prevEntropy->huf, &nextEntropy->huf,
2188*a28cd43dSSascha Wildner cctxParams->cParams.strategy,
2189*a28cd43dSSascha Wildner ZSTD_disableLiteralsCompression(cctxParams),
2190*a28cd43dSSascha Wildner op, dstCapacity,
2191*a28cd43dSSascha Wildner literals, litSize,
2192*a28cd43dSSascha Wildner entropyWorkspace, entropyWkspSize,
2193*a28cd43dSSascha Wildner bmi2);
2194*a28cd43dSSascha Wildner FORWARD_IF_ERROR(cSize, "ZSTD_compressLiterals failed");
2195*a28cd43dSSascha Wildner assert(cSize <= dstCapacity);
2196*a28cd43dSSascha Wildner op += cSize;
2197*a28cd43dSSascha Wildner }
2198*a28cd43dSSascha Wildner
2199*a28cd43dSSascha Wildner /* Sequences Header */
2200*a28cd43dSSascha Wildner RETURN_ERROR_IF((oend-op) < 3 /*max nbSeq Size*/ + 1 /*seqHead*/,
2201*a28cd43dSSascha Wildner dstSize_tooSmall, "Can't fit seq hdr in output buf!");
2202*a28cd43dSSascha Wildner if (nbSeq < 128) {
2203*a28cd43dSSascha Wildner *op++ = (BYTE)nbSeq;
2204*a28cd43dSSascha Wildner } else if (nbSeq < LONGNBSEQ) {
2205*a28cd43dSSascha Wildner op[0] = (BYTE)((nbSeq>>8) + 0x80);
2206*a28cd43dSSascha Wildner op[1] = (BYTE)nbSeq;
2207*a28cd43dSSascha Wildner op+=2;
2208*a28cd43dSSascha Wildner } else {
2209*a28cd43dSSascha Wildner op[0]=0xFF;
2210*a28cd43dSSascha Wildner MEM_writeLE16(op+1, (U16)(nbSeq - LONGNBSEQ));
2211*a28cd43dSSascha Wildner op+=3;
2212*a28cd43dSSascha Wildner }
2213*a28cd43dSSascha Wildner assert(op <= oend);
2214*a28cd43dSSascha Wildner if (nbSeq==0) {
2215*a28cd43dSSascha Wildner /* Copy the old tables over as if we repeated them */
2216*a28cd43dSSascha Wildner ZSTD_memcpy(&nextEntropy->fse, &prevEntropy->fse, sizeof(prevEntropy->fse));
2217*a28cd43dSSascha Wildner return (size_t)(op - ostart);
2218*a28cd43dSSascha Wildner }
2219*a28cd43dSSascha Wildner
2220*a28cd43dSSascha Wildner /* seqHead : flags for FSE encoding type */
2221*a28cd43dSSascha Wildner seqHead = op++;
2222*a28cd43dSSascha Wildner assert(op <= oend);
2223*a28cd43dSSascha Wildner
2224*a28cd43dSSascha Wildner /* convert length/distances into codes */
2225*a28cd43dSSascha Wildner ZSTD_seqToCodes(seqStorePtr);
2226*a28cd43dSSascha Wildner /* build CTable for Literal Lengths */
2227*a28cd43dSSascha Wildner { unsigned max = MaxLL;
2228*a28cd43dSSascha Wildner size_t const mostFrequent = HIST_countFast_wksp(count, &max, llCodeTable, nbSeq, entropyWorkspace, entropyWkspSize); /* can't fail */
2229*a28cd43dSSascha Wildner DEBUGLOG(5, "Building LL table");
2230*a28cd43dSSascha Wildner nextEntropy->fse.litlength_repeatMode = prevEntropy->fse.litlength_repeatMode;
2231*a28cd43dSSascha Wildner LLtype = ZSTD_selectEncodingType(&nextEntropy->fse.litlength_repeatMode,
2232*a28cd43dSSascha Wildner count, max, mostFrequent, nbSeq,
2233*a28cd43dSSascha Wildner LLFSELog, prevEntropy->fse.litlengthCTable,
2234*a28cd43dSSascha Wildner LL_defaultNorm, LL_defaultNormLog,
2235*a28cd43dSSascha Wildner ZSTD_defaultAllowed, strategy);
2236*a28cd43dSSascha Wildner assert(set_basic < set_compressed && set_rle < set_compressed);
2237*a28cd43dSSascha Wildner assert(!(LLtype < set_compressed && nextEntropy->fse.litlength_repeatMode != FSE_repeat_none)); /* We don't copy tables */
2238*a28cd43dSSascha Wildner { size_t const countSize = ZSTD_buildCTable(
2239*a28cd43dSSascha Wildner op, (size_t)(oend - op),
2240*a28cd43dSSascha Wildner CTable_LitLength, LLFSELog, (symbolEncodingType_e)LLtype,
2241*a28cd43dSSascha Wildner count, max, llCodeTable, nbSeq,
2242*a28cd43dSSascha Wildner LL_defaultNorm, LL_defaultNormLog, MaxLL,
2243*a28cd43dSSascha Wildner prevEntropy->fse.litlengthCTable,
2244*a28cd43dSSascha Wildner sizeof(prevEntropy->fse.litlengthCTable),
2245*a28cd43dSSascha Wildner entropyWorkspace, entropyWkspSize);
2246*a28cd43dSSascha Wildner FORWARD_IF_ERROR(countSize, "ZSTD_buildCTable for LitLens failed");
2247*a28cd43dSSascha Wildner if (LLtype == set_compressed)
2248*a28cd43dSSascha Wildner lastNCount = op;
2249*a28cd43dSSascha Wildner op += countSize;
2250*a28cd43dSSascha Wildner assert(op <= oend);
2251*a28cd43dSSascha Wildner } }
2252*a28cd43dSSascha Wildner /* build CTable for Offsets */
2253*a28cd43dSSascha Wildner { unsigned max = MaxOff;
2254*a28cd43dSSascha Wildner size_t const mostFrequent = HIST_countFast_wksp(
2255*a28cd43dSSascha Wildner count, &max, ofCodeTable, nbSeq, entropyWorkspace, entropyWkspSize); /* can't fail */
2256*a28cd43dSSascha Wildner /* We can only use the basic table if max <= DefaultMaxOff, otherwise the offsets are too large */
2257*a28cd43dSSascha Wildner ZSTD_defaultPolicy_e const defaultPolicy = (max <= DefaultMaxOff) ? ZSTD_defaultAllowed : ZSTD_defaultDisallowed;
2258*a28cd43dSSascha Wildner DEBUGLOG(5, "Building OF table");
2259*a28cd43dSSascha Wildner nextEntropy->fse.offcode_repeatMode = prevEntropy->fse.offcode_repeatMode;
2260*a28cd43dSSascha Wildner Offtype = ZSTD_selectEncodingType(&nextEntropy->fse.offcode_repeatMode,
2261*a28cd43dSSascha Wildner count, max, mostFrequent, nbSeq,
2262*a28cd43dSSascha Wildner OffFSELog, prevEntropy->fse.offcodeCTable,
2263*a28cd43dSSascha Wildner OF_defaultNorm, OF_defaultNormLog,
2264*a28cd43dSSascha Wildner defaultPolicy, strategy);
2265*a28cd43dSSascha Wildner assert(!(Offtype < set_compressed && nextEntropy->fse.offcode_repeatMode != FSE_repeat_none)); /* We don't copy tables */
2266*a28cd43dSSascha Wildner { size_t const countSize = ZSTD_buildCTable(
2267*a28cd43dSSascha Wildner op, (size_t)(oend - op),
2268*a28cd43dSSascha Wildner CTable_OffsetBits, OffFSELog, (symbolEncodingType_e)Offtype,
2269*a28cd43dSSascha Wildner count, max, ofCodeTable, nbSeq,
2270*a28cd43dSSascha Wildner OF_defaultNorm, OF_defaultNormLog, DefaultMaxOff,
2271*a28cd43dSSascha Wildner prevEntropy->fse.offcodeCTable,
2272*a28cd43dSSascha Wildner sizeof(prevEntropy->fse.offcodeCTable),
2273*a28cd43dSSascha Wildner entropyWorkspace, entropyWkspSize);
2274*a28cd43dSSascha Wildner FORWARD_IF_ERROR(countSize, "ZSTD_buildCTable for Offsets failed");
2275*a28cd43dSSascha Wildner if (Offtype == set_compressed)
2276*a28cd43dSSascha Wildner lastNCount = op;
2277*a28cd43dSSascha Wildner op += countSize;
2278*a28cd43dSSascha Wildner assert(op <= oend);
2279*a28cd43dSSascha Wildner } }
2280*a28cd43dSSascha Wildner /* build CTable for MatchLengths */
2281*a28cd43dSSascha Wildner { unsigned max = MaxML;
2282*a28cd43dSSascha Wildner size_t const mostFrequent = HIST_countFast_wksp(
2283*a28cd43dSSascha Wildner count, &max, mlCodeTable, nbSeq, entropyWorkspace, entropyWkspSize); /* can't fail */
2284*a28cd43dSSascha Wildner DEBUGLOG(5, "Building ML table (remaining space : %i)", (int)(oend-op));
2285*a28cd43dSSascha Wildner nextEntropy->fse.matchlength_repeatMode = prevEntropy->fse.matchlength_repeatMode;
2286*a28cd43dSSascha Wildner MLtype = ZSTD_selectEncodingType(&nextEntropy->fse.matchlength_repeatMode,
2287*a28cd43dSSascha Wildner count, max, mostFrequent, nbSeq,
2288*a28cd43dSSascha Wildner MLFSELog, prevEntropy->fse.matchlengthCTable,
2289*a28cd43dSSascha Wildner ML_defaultNorm, ML_defaultNormLog,
2290*a28cd43dSSascha Wildner ZSTD_defaultAllowed, strategy);
2291*a28cd43dSSascha Wildner assert(!(MLtype < set_compressed && nextEntropy->fse.matchlength_repeatMode != FSE_repeat_none)); /* We don't copy tables */
2292*a28cd43dSSascha Wildner { size_t const countSize = ZSTD_buildCTable(
2293*a28cd43dSSascha Wildner op, (size_t)(oend - op),
2294*a28cd43dSSascha Wildner CTable_MatchLength, MLFSELog, (symbolEncodingType_e)MLtype,
2295*a28cd43dSSascha Wildner count, max, mlCodeTable, nbSeq,
2296*a28cd43dSSascha Wildner ML_defaultNorm, ML_defaultNormLog, MaxML,
2297*a28cd43dSSascha Wildner prevEntropy->fse.matchlengthCTable,
2298*a28cd43dSSascha Wildner sizeof(prevEntropy->fse.matchlengthCTable),
2299*a28cd43dSSascha Wildner entropyWorkspace, entropyWkspSize);
2300*a28cd43dSSascha Wildner FORWARD_IF_ERROR(countSize, "ZSTD_buildCTable for MatchLengths failed");
2301*a28cd43dSSascha Wildner if (MLtype == set_compressed)
2302*a28cd43dSSascha Wildner lastNCount = op;
2303*a28cd43dSSascha Wildner op += countSize;
2304*a28cd43dSSascha Wildner assert(op <= oend);
2305*a28cd43dSSascha Wildner } }
2306*a28cd43dSSascha Wildner
2307*a28cd43dSSascha Wildner *seqHead = (BYTE)((LLtype<<6) + (Offtype<<4) + (MLtype<<2));
2308*a28cd43dSSascha Wildner
2309*a28cd43dSSascha Wildner { size_t const bitstreamSize = ZSTD_encodeSequences(
2310*a28cd43dSSascha Wildner op, (size_t)(oend - op),
2311*a28cd43dSSascha Wildner CTable_MatchLength, mlCodeTable,
2312*a28cd43dSSascha Wildner CTable_OffsetBits, ofCodeTable,
2313*a28cd43dSSascha Wildner CTable_LitLength, llCodeTable,
2314*a28cd43dSSascha Wildner sequences, nbSeq,
2315*a28cd43dSSascha Wildner longOffsets, bmi2);
2316*a28cd43dSSascha Wildner FORWARD_IF_ERROR(bitstreamSize, "ZSTD_encodeSequences failed");
2317*a28cd43dSSascha Wildner op += bitstreamSize;
2318*a28cd43dSSascha Wildner assert(op <= oend);
2319*a28cd43dSSascha Wildner /* zstd versions <= 1.3.4 mistakenly report corruption when
2320*a28cd43dSSascha Wildner * FSE_readNCount() receives a buffer < 4 bytes.
2321*a28cd43dSSascha Wildner * Fixed by https://github.com/facebook/zstd/pull/1146.
2322*a28cd43dSSascha Wildner * This can happen when the last set_compressed table present is 2
2323*a28cd43dSSascha Wildner * bytes and the bitstream is only one byte.
2324*a28cd43dSSascha Wildner * In this exceedingly rare case, we will simply emit an uncompressed
2325*a28cd43dSSascha Wildner * block, since it isn't worth optimizing.
2326*a28cd43dSSascha Wildner */
2327*a28cd43dSSascha Wildner if (lastNCount && (op - lastNCount) < 4) {
2328*a28cd43dSSascha Wildner /* NCountSize >= 2 && bitstreamSize > 0 ==> lastCountSize == 3 */
2329*a28cd43dSSascha Wildner assert(op - lastNCount == 3);
2330*a28cd43dSSascha Wildner DEBUGLOG(5, "Avoiding bug in zstd decoder in versions <= 1.3.4 by "
2331*a28cd43dSSascha Wildner "emitting an uncompressed block.");
2332*a28cd43dSSascha Wildner return 0;
2333*a28cd43dSSascha Wildner }
2334*a28cd43dSSascha Wildner }
2335*a28cd43dSSascha Wildner
2336*a28cd43dSSascha Wildner DEBUGLOG(5, "compressed block size : %u", (unsigned)(op - ostart));
2337*a28cd43dSSascha Wildner return (size_t)(op - ostart);
2338*a28cd43dSSascha Wildner }
2339*a28cd43dSSascha Wildner
2340*a28cd43dSSascha Wildner MEM_STATIC size_t
ZSTD_entropyCompressSequences(seqStore_t * seqStorePtr,const ZSTD_entropyCTables_t * prevEntropy,ZSTD_entropyCTables_t * nextEntropy,const ZSTD_CCtx_params * cctxParams,void * dst,size_t dstCapacity,size_t srcSize,void * entropyWorkspace,size_t entropyWkspSize,int bmi2)2341*a28cd43dSSascha Wildner ZSTD_entropyCompressSequences(seqStore_t* seqStorePtr,
2342*a28cd43dSSascha Wildner const ZSTD_entropyCTables_t* prevEntropy,
2343*a28cd43dSSascha Wildner ZSTD_entropyCTables_t* nextEntropy,
2344*a28cd43dSSascha Wildner const ZSTD_CCtx_params* cctxParams,
2345*a28cd43dSSascha Wildner void* dst, size_t dstCapacity,
2346*a28cd43dSSascha Wildner size_t srcSize,
2347*a28cd43dSSascha Wildner void* entropyWorkspace, size_t entropyWkspSize,
2348*a28cd43dSSascha Wildner int bmi2)
2349*a28cd43dSSascha Wildner {
2350*a28cd43dSSascha Wildner size_t const cSize = ZSTD_entropyCompressSequences_internal(
2351*a28cd43dSSascha Wildner seqStorePtr, prevEntropy, nextEntropy, cctxParams,
2352*a28cd43dSSascha Wildner dst, dstCapacity,
2353*a28cd43dSSascha Wildner entropyWorkspace, entropyWkspSize, bmi2);
2354*a28cd43dSSascha Wildner if (cSize == 0) return 0;
2355*a28cd43dSSascha Wildner /* When srcSize <= dstCapacity, there is enough space to write a raw uncompressed block.
2356*a28cd43dSSascha Wildner * Since we ran out of space, block must be not compressible, so fall back to raw uncompressed block.
2357*a28cd43dSSascha Wildner */
2358*a28cd43dSSascha Wildner if ((cSize == ERROR(dstSize_tooSmall)) & (srcSize <= dstCapacity))
2359*a28cd43dSSascha Wildner return 0; /* block not compressed */
2360*a28cd43dSSascha Wildner FORWARD_IF_ERROR(cSize, "ZSTD_entropyCompressSequences_internal failed");
2361*a28cd43dSSascha Wildner
2362*a28cd43dSSascha Wildner /* Check compressibility */
2363*a28cd43dSSascha Wildner { size_t const maxCSize = srcSize - ZSTD_minGain(srcSize, cctxParams->cParams.strategy);
2364*a28cd43dSSascha Wildner if (cSize >= maxCSize) return 0; /* block not compressed */
2365*a28cd43dSSascha Wildner }
2366*a28cd43dSSascha Wildner DEBUGLOG(4, "ZSTD_entropyCompressSequences() cSize: %zu\n", cSize);
2367*a28cd43dSSascha Wildner return cSize;
2368*a28cd43dSSascha Wildner }
2369*a28cd43dSSascha Wildner
2370*a28cd43dSSascha Wildner /* ZSTD_selectBlockCompressor() :
2371*a28cd43dSSascha Wildner * Not static, but internal use only (used by long distance matcher)
2372*a28cd43dSSascha Wildner * assumption : strat is a valid strategy */
ZSTD_selectBlockCompressor(ZSTD_strategy strat,ZSTD_dictMode_e dictMode)2373*a28cd43dSSascha Wildner ZSTD_blockCompressor ZSTD_selectBlockCompressor(ZSTD_strategy strat, ZSTD_dictMode_e dictMode)
2374*a28cd43dSSascha Wildner {
2375*a28cd43dSSascha Wildner static const ZSTD_blockCompressor blockCompressor[4][ZSTD_STRATEGY_MAX+1] = {
2376*a28cd43dSSascha Wildner { ZSTD_compressBlock_fast /* default for 0 */,
2377*a28cd43dSSascha Wildner ZSTD_compressBlock_fast,
2378*a28cd43dSSascha Wildner ZSTD_compressBlock_doubleFast,
2379*a28cd43dSSascha Wildner ZSTD_compressBlock_greedy,
2380*a28cd43dSSascha Wildner ZSTD_compressBlock_lazy,
2381*a28cd43dSSascha Wildner ZSTD_compressBlock_lazy2,
2382*a28cd43dSSascha Wildner ZSTD_compressBlock_btlazy2,
2383*a28cd43dSSascha Wildner ZSTD_compressBlock_btopt,
2384*a28cd43dSSascha Wildner ZSTD_compressBlock_btultra,
2385*a28cd43dSSascha Wildner ZSTD_compressBlock_btultra2 },
2386*a28cd43dSSascha Wildner { ZSTD_compressBlock_fast_extDict /* default for 0 */,
2387*a28cd43dSSascha Wildner ZSTD_compressBlock_fast_extDict,
2388*a28cd43dSSascha Wildner ZSTD_compressBlock_doubleFast_extDict,
2389*a28cd43dSSascha Wildner ZSTD_compressBlock_greedy_extDict,
2390*a28cd43dSSascha Wildner ZSTD_compressBlock_lazy_extDict,
2391*a28cd43dSSascha Wildner ZSTD_compressBlock_lazy2_extDict,
2392*a28cd43dSSascha Wildner ZSTD_compressBlock_btlazy2_extDict,
2393*a28cd43dSSascha Wildner ZSTD_compressBlock_btopt_extDict,
2394*a28cd43dSSascha Wildner ZSTD_compressBlock_btultra_extDict,
2395*a28cd43dSSascha Wildner ZSTD_compressBlock_btultra_extDict },
2396*a28cd43dSSascha Wildner { ZSTD_compressBlock_fast_dictMatchState /* default for 0 */,
2397*a28cd43dSSascha Wildner ZSTD_compressBlock_fast_dictMatchState,
2398*a28cd43dSSascha Wildner ZSTD_compressBlock_doubleFast_dictMatchState,
2399*a28cd43dSSascha Wildner ZSTD_compressBlock_greedy_dictMatchState,
2400*a28cd43dSSascha Wildner ZSTD_compressBlock_lazy_dictMatchState,
2401*a28cd43dSSascha Wildner ZSTD_compressBlock_lazy2_dictMatchState,
2402*a28cd43dSSascha Wildner ZSTD_compressBlock_btlazy2_dictMatchState,
2403*a28cd43dSSascha Wildner ZSTD_compressBlock_btopt_dictMatchState,
2404*a28cd43dSSascha Wildner ZSTD_compressBlock_btultra_dictMatchState,
2405*a28cd43dSSascha Wildner ZSTD_compressBlock_btultra_dictMatchState },
2406*a28cd43dSSascha Wildner { NULL /* default for 0 */,
2407*a28cd43dSSascha Wildner NULL,
2408*a28cd43dSSascha Wildner NULL,
2409*a28cd43dSSascha Wildner ZSTD_compressBlock_greedy_dedicatedDictSearch,
2410*a28cd43dSSascha Wildner ZSTD_compressBlock_lazy_dedicatedDictSearch,
2411*a28cd43dSSascha Wildner ZSTD_compressBlock_lazy2_dedicatedDictSearch,
2412*a28cd43dSSascha Wildner NULL,
2413*a28cd43dSSascha Wildner NULL,
2414*a28cd43dSSascha Wildner NULL,
2415*a28cd43dSSascha Wildner NULL }
2416*a28cd43dSSascha Wildner };
2417*a28cd43dSSascha Wildner ZSTD_blockCompressor selectedCompressor;
2418*a28cd43dSSascha Wildner ZSTD_STATIC_ASSERT((unsigned)ZSTD_fast == 1);
2419*a28cd43dSSascha Wildner
2420*a28cd43dSSascha Wildner assert(ZSTD_cParam_withinBounds(ZSTD_c_strategy, strat));
2421*a28cd43dSSascha Wildner selectedCompressor = blockCompressor[(int)dictMode][(int)strat];
2422*a28cd43dSSascha Wildner assert(selectedCompressor != NULL);
2423*a28cd43dSSascha Wildner return selectedCompressor;
2424*a28cd43dSSascha Wildner }
2425*a28cd43dSSascha Wildner
/* ZSTD_storeLastLiterals() :
 * Append `lastLLSize` bytes starting at `anchor` to the literals buffer of
 * `seqStorePtr`, and advance its write position accordingly.
 * No capacity check is performed here. */
static void ZSTD_storeLastLiterals(seqStore_t* seqStorePtr,
                                   const BYTE* anchor, size_t lastLLSize)
{
    BYTE* const writePos = seqStorePtr->lit;
    ZSTD_memcpy(writePos, anchor, lastLLSize);
    seqStorePtr->lit = writePos + lastLLSize;
}
2432*a28cd43dSSascha Wildner
/* ZSTD_resetSeqStore() :
 * Rewind `ssPtr` to an empty state : the sequence and literal write positions
 * go back to their respective start, and the long-length flag is cleared. */
void ZSTD_resetSeqStore(seqStore_t* ssPtr)
{
    ssPtr->longLengthID = 0;
    ssPtr->sequences = ssPtr->sequencesStart;
    ssPtr->lit = ssPtr->litStart;
}
2439*a28cd43dSSascha Wildner
/* Outcome reported by ZSTD_buildSeqStore() */
typedef enum {
    ZSTDbss_compress,    /* presumably : sequences were stored, proceed with compression - confirm against ZSTD_buildSeqStore() */
    ZSTDbss_noCompress   /* compression was not attempted (returned for very small inputs) */
} ZSTD_buildSeqStore_e;
2441*a28cd43dSSascha Wildner
/* ZSTD_buildSeqStore() :
 * Runs sequence selection over one block and stores the result into zc->seqStore.
 * Three sources of sequences are considered, in this order :
 *  - externally provided sequences still pending in zc->externSeqStore,
 *  - long distance matching, when enabled in the applied parameters,
 *  - the regular block compressor selected from the strategy and dict mode.
 * @return : ZSTDbss_noCompress when srcSize is below the minimum for which
 *           compression is attempted (the seqStore is not reset in that case),
 *           ZSTDbss_compress once sequences and last literals are stored,
 *           or an error code forwarded from ZSTD_ldm_generateSequences(). */
static size_t ZSTD_buildSeqStore(ZSTD_CCtx* zc, const void* src, size_t srcSize)
{
    ZSTD_matchState_t* const ms = &zc->blockState.matchState;
    seqStore_t* const seqStore = &zc->seqStore;
    DEBUGLOG(5, "ZSTD_buildSeqStore (srcSize=%zu)", srcSize);
    assert(srcSize <= ZSTD_BLOCKSIZE_MAX);
    /* the match state must carry the same cParams as the ones applied to the context */
    ZSTD_assertEqualCParams(zc->appliedParams.cParams, ms->cParams);

    if (srcSize < MIN_CBLOCK_SIZE+ZSTD_blockHeaderSize+1) {
        /* don't even attempt compression below a certain srcSize,
         * but still move past the external sequences covering this input */
        if (zc->appliedParams.cParams.strategy < ZSTD_btopt) {
            ZSTD_ldm_skipSequences(&zc->externSeqStore, srcSize, zc->appliedParams.cParams.minMatch);
        } else {
            ZSTD_ldm_skipRawSeqStoreBytes(&zc->externSeqStore, srcSize);
        }
        return ZSTDbss_noCompress;
    }

    ZSTD_resetSeqStore(seqStore);
    /* required for optimal parser to read stats from dictionary */
    ms->opt.symbolCosts = &zc->blockState.prevCBlock->entropy;
    /* tell the optimal parser how we expect to compress literals */
    ms->opt.literalCompressionMode = zc->appliedParams.literalCompressionMode;
    /* an attached dict and the current window must remain adjacent :
     * as soon as a gap appears between them, the dict must be unset */
    assert(ms->dictMatchState == NULL || ms->loadedDictEnd == ms->window.dictLimit);

    /* limited update after a very long match */
    {   const BYTE* const base = ms->window.base;
        const BYTE* const istart = (const BYTE*)src;
        const U32 curr = (U32)(istart-base);
        if (sizeof(ptrdiff_t)==8) assert(istart - base < (ptrdiff_t)(U32)(-1));   /* ensure no overflow */
        if (curr > ms->nextToUpdate + 384) {
            U32 const excess = curr - ms->nextToUpdate - 384;
            ms->nextToUpdate = curr - MIN(192, excess);
        }
    }

    /* select and store sequences */
    {   ZSTD_dictMode_e const dictMode = ZSTD_matchState_dictMode(ms);
        ZSTD_compressedBlockState_t* const nextCBlock = zc->blockState.nextCBlock;
        size_t lastLLSize;

        /* the next block starts from the repcodes of the previous one */
        {   int r;
            for (r = 0; r < ZSTD_REP_NUM; ++r)
                nextCBlock->rep[r] = zc->blockState.prevCBlock->rep[r];
        }

        if (zc->externSeqStore.pos < zc->externSeqStore.size) {
            /* externally provided sequences are still pending */
            assert(!zc->appliedParams.ldmParams.enableLdm);
            /* Updates ldmSeqStore.pos */
            lastLLSize = ZSTD_ldm_blockCompress(&zc->externSeqStore,
                                                ms, seqStore,
                                                nextCBlock->rep,
                                                src, srcSize);
            assert(zc->externSeqStore.pos <= zc->externSeqStore.size);
        } else if (zc->appliedParams.ldmParams.enableLdm) {
            rawSeqStore_t ldmSeqStore = kNullRawSeqStore;

            ldmSeqStore.seq = zc->ldmSequences;
            ldmSeqStore.capacity = zc->maxNbLdmSequences;
            /* Updates ldmSeqStore.size */
            FORWARD_IF_ERROR(ZSTD_ldm_generateSequences(&zc->ldmState, &ldmSeqStore,
                                                        &zc->appliedParams.ldmParams,
                                                        src, srcSize), "");
            /* Updates ldmSeqStore.pos */
            lastLLSize = ZSTD_ldm_blockCompress(&ldmSeqStore,
                                                ms, seqStore,
                                                nextCBlock->rep,
                                                src, srcSize);
            assert(ldmSeqStore.pos == ldmSeqStore.size);
        } else {   /* not long range mode */
            ZSTD_blockCompressor const blockCompressor =
                    ZSTD_selectBlockCompressor(zc->appliedParams.cParams.strategy, dictMode);
            ms->ldmSeqStore = NULL;
            lastLLSize = blockCompressor(ms, seqStore, nextCBlock->rep, src, srcSize);
        }

        /* the trailing lastLLSize bytes of the block are stored as last literals */
        ZSTD_storeLastLiterals(seqStore, (const BYTE*)src + srcSize - lastLLSize, lastLLSize);
    }
    return ZSTDbss_compress;
}
2518*a28cd43dSSascha Wildner
/* ZSTD_copyBlockSequences() :
 * Converts the sequences held in the context's seqStore into ZSTD_Sequence
 * entries, written into zc->seqCollector starting at its current seqIndex.
 * Repcodes are resolved into actual offsets, starting from the repcode
 * history of the previous block.
 * One extra entry (offset == matchLength == 0) is appended to carry the
 * last literals of the block; seqIndex is advanced past it. */
static void ZSTD_copyBlockSequences(ZSTD_CCtx* zc)
{
    const seqStore_t* const seqStore = ZSTD_getSeqStore(zc);
    const seqDef* const inSeqs = seqStore->sequencesStart;
    size_t const nbSeqs = seqStore->sequences - inSeqs;
    size_t const nbLiterals = (size_t)(seqStore->lit - seqStore->litStart);
    size_t literalsRead = 0;
    ZSTD_Sequence* const outSeqs = &zc->seqCollector.seqStart[zc->seqCollector.seqIndex];
    repcodes_t updatedRepcodes;
    size_t n;

    assert(zc->seqCollector.seqIndex + 1 < zc->seqCollector.maxSequences);
    /* Ensure we have enough space for last literals "sequence" */
    assert(zc->seqCollector.maxSequences >= nbSeqs + 1);
    ZSTD_memcpy(updatedRepcodes.rep, zc->blockState.prevCBlock->rep, sizeof(repcodes_t));

    for (n = 0; n < nbSeqs; ++n) {
        const seqDef* const in = &inSeqs[n];
        ZSTD_Sequence* const out = &outSeqs[n];
        U32 rawOffset = in->offset - ZSTD_REP_NUM;

        out->litLength = in->litLength;
        out->matchLength = in->matchLength + MINMATCH;
        out->rep = 0;

        /* at most one sequence per block carries a length extended by 0x10000 */
        if (n == seqStore->longLengthPos) {
            switch (seqStore->longLengthID)
            {
            case 1 : out->litLength += 0x10000; break;
            case 2 : out->matchLength += 0x10000; break;
            default: break;
            }
        }

        if (in->offset <= ZSTD_REP_NUM) {
            /* Derive the correct offset corresponding to a repcode */
            out->rep = in->offset;
            if (out->litLength != 0) {
                rawOffset = updatedRepcodes.rep[out->rep - 1];
            } else if (out->rep == 3) {
                rawOffset = updatedRepcodes.rep[0] - 1;
            } else {
                rawOffset = updatedRepcodes.rep[out->rep];
            }
        }
        out->offset = rawOffset;

        /* in->offset == offCode+1, and ZSTD_updateRep() expects offCode,
         * so we provide in->offset - 1 */
        updatedRepcodes = ZSTD_updateRep(updatedRepcodes.rep,
                                         in->offset - 1,
                                         in->litLength == 0);
        literalsRead += out->litLength;
    }

    /* Insert last literals (if any exist) in the block as a sequence with ml == off == 0.
     * If there are no last literals, then we'll emit (of: 0, ml: 0, ll: 0), which is a marker
     * for the block boundary, according to the API.
     */
    assert(nbLiterals >= literalsRead);
    outSeqs[nbSeqs].litLength = (U32)(nbLiterals - literalsRead);
    outSeqs[nbSeqs].rep = 0;
    outSeqs[nbSeqs].offset = 0;
    outSeqs[nbSeqs].matchLength = 0;
    zc->seqCollector.seqIndex += nbSeqs + 1;
}
2582*a28cd43dSSascha Wildner
/* ZSTD_generateSequences() :
 * Collects into `outSeqs` the sequences produced when compressing `src`
 * with ZSTD_compress2() and the parameters currently set in `zc`.
 * A temporary output buffer of ZSTD_compressBound(srcSize) bytes is
 * allocated for the duration of the call and released before returning.
 * @outSeqsSize : capacity of `outSeqs`, in number of ZSTD_Sequence
 * @return : nb of sequences written into `outSeqs`,
 *           or an error code (testable with ZSTD_isError()) when the
 *           temporary buffer cannot be allocated or ZSTD_compress2() fails. */
size_t ZSTD_generateSequences(ZSTD_CCtx* zc, ZSTD_Sequence* outSeqs,
                              size_t outSeqsSize, const void* src, size_t srcSize)
{
    const size_t dstCapacity = ZSTD_compressBound(srcSize);
    void* dst = ZSTD_customMalloc(dstCapacity, ZSTD_defaultCMem);
    SeqCollector seqCollector;

    RETURN_ERROR_IF(dst == NULL, memory_allocation, "NULL pointer!");

    seqCollector.collectSequences = 1;
    seqCollector.seqStart = outSeqs;
    seqCollector.seqIndex = 0;
    seqCollector.maxSequences = outSeqsSize;
    zc->seqCollector = seqCollector;

    /* The compressed output itself is discarded; only the collected sequences matter.
     * The buffer is released before the error check so it never leaks,
     * and a failed compression is reported instead of returning a
     * sequence count that does not describe the whole input. */
    {   size_t const cSize = ZSTD_compress2(zc, dst, dstCapacity, src, srcSize);
        ZSTD_customFree(dst, ZSTD_defaultCMem);
        FORWARD_IF_ERROR(cSize, "ZSTD_compress2 failed");
    }
    return zc->seqCollector.seqIndex;
}
2602*a28cd43dSSascha Wildner
/* ZSTD_mergeBlockDelimiters() :
 * Compacts `sequences` in place by dropping every entry whose offset and
 * matchLength are both 0. The litLength of a dropped entry is added to the
 * entry that follows it; for the very last entry it is simply discarded.
 * @return : nb of entries kept at the front of `sequences` */
size_t ZSTD_mergeBlockDelimiters(ZSTD_Sequence* sequences, size_t seqsSize) {
    size_t kept = 0;
    size_t rd;
    for (rd = 0; rd < seqsSize; ++rd) {
        int const isDelimiter = (sequences[rd].offset == 0)
                             && (sequences[rd].matchLength == 0);
        if (!isDelimiter) {
            sequences[kept] = sequences[rd];
            kept++;
            continue;
        }
        /* delimiter : hand its literals over to the next entry, when there is one */
        if (rd + 1 != seqsSize) {
            sequences[rd+1].litLength += sequences[rd].litLength;
        }
    }
    return kept;
}
2618*a28cd43dSSascha Wildner
2619*a28cd43dSSascha Wildner /* Unrolled loop to read four size_ts of input at a time. Returns 1 if is RLE, 0 if not. */
ZSTD_isRLE(const BYTE * src,size_t length)2620*a28cd43dSSascha Wildner static int ZSTD_isRLE(const BYTE* src, size_t length) {
2621*a28cd43dSSascha Wildner const BYTE* ip = src;
2622*a28cd43dSSascha Wildner const BYTE value = ip[0];
2623*a28cd43dSSascha Wildner const size_t valueST = (size_t)((U64)value * 0x0101010101010101ULL);
2624*a28cd43dSSascha Wildner const size_t unrollSize = sizeof(size_t) * 4;
2625*a28cd43dSSascha Wildner const size_t unrollMask = unrollSize - 1;
2626*a28cd43dSSascha Wildner const size_t prefixLength = length & unrollMask;
2627*a28cd43dSSascha Wildner size_t i;
2628*a28cd43dSSascha Wildner size_t u;
2629*a28cd43dSSascha Wildner if (length == 1) return 1;
2630*a28cd43dSSascha Wildner /* Check if prefix is RLE first before using unrolled loop */
2631*a28cd43dSSascha Wildner if (prefixLength && ZSTD_count(ip+1, ip, ip+prefixLength) != prefixLength-1) {
2632*a28cd43dSSascha Wildner return 0;
2633*a28cd43dSSascha Wildner }
2634*a28cd43dSSascha Wildner for (i = prefixLength; i != length; i += unrollSize) {
2635*a28cd43dSSascha Wildner for (u = 0; u < unrollSize; u += sizeof(size_t)) {
2636*a28cd43dSSascha Wildner if (MEM_readST(ip + i + u) != valueST) {
2637*a28cd43dSSascha Wildner return 0;
2638*a28cd43dSSascha Wildner }
2639*a28cd43dSSascha Wildner }
2640*a28cd43dSSascha Wildner }
2641*a28cd43dSSascha Wildner return 1;
2642*a28cd43dSSascha Wildner }
2643*a28cd43dSSascha Wildner
2644*a28cd43dSSascha Wildner /* Returns true if the given block may be RLE.
2645*a28cd43dSSascha Wildner * This is just a heuristic based on the compressibility.
2646*a28cd43dSSascha Wildner * It may return both false positives and false negatives.
2647*a28cd43dSSascha Wildner */
ZSTD_maybeRLE(seqStore_t const * seqStore)2648*a28cd43dSSascha Wildner static int ZSTD_maybeRLE(seqStore_t const* seqStore)
2649*a28cd43dSSascha Wildner {
2650*a28cd43dSSascha Wildner size_t const nbSeqs = (size_t)(seqStore->sequences - seqStore->sequencesStart);
2651*a28cd43dSSascha Wildner size_t const nbLits = (size_t)(seqStore->lit - seqStore->litStart);
2652*a28cd43dSSascha Wildner
2653*a28cd43dSSascha Wildner return nbSeqs < 4 && nbLits < 10;
2654*a28cd43dSSascha Wildner }
2655*a28cd43dSSascha Wildner
/* ZSTD_confirmRepcodesAndEntropyTables() :
 * Exchanges the prevCBlock and nextCBlock pointers of the block state,
 * so that what was prepared as "next" becomes the new "previous". */
static void ZSTD_confirmRepcodesAndEntropyTables(ZSTD_CCtx* zc)
{
    ZSTD_compressedBlockState_t* const confirmed = zc->blockState.nextCBlock;
    zc->blockState.nextCBlock = zc->blockState.prevCBlock;
    zc->blockState.prevCBlock = confirmed;
}
2662*a28cd43dSSascha Wildner
/* ZSTD_compressBlock_internal() :
 * Builds the sequences of one block, then entropy-compresses them into `dst`.
 * No block header is written here.
 * When zc->seqCollector.collectSequences is set, sequences are only copied
 * into the collector : nothing is entropy-compressed and 0 is returned.
 * @frame : when non-zero, a block made of a single repeated byte may be
 *          reported as RLE (never for the first block).
 * @return : 0 when the block was not compressed (or sequences were collected),
 *           1 when the block is RLE : dst[0] then holds the repeated byte,
 *           otherwise the result of ZSTD_entropyCompressSequences(),
 *           which may be an error code. */
static size_t ZSTD_compressBlock_internal(ZSTD_CCtx* zc,
                                        void* dst, size_t dstCapacity,
                                        const void* src, size_t srcSize, U32 frame)
{
    /* This is the upper bound for the length of an rle block.
     * This isn't the actual upper bound. Finding the real threshold
     * needs further investigation.
     */
    const U32 rleMaxLength = 25;
    size_t cSize;
    const BYTE* ip = (const BYTE*)src;
    BYTE* op = (BYTE*)dst;
    DEBUGLOG(5, "ZSTD_compressBlock_internal (dstCapacity=%u, dictLimit=%u, nextToUpdate=%u)",
                (unsigned)dstCapacity, (unsigned)zc->blockState.matchState.window.dictLimit,
                (unsigned)zc->blockState.matchState.nextToUpdate);

    {   const size_t bss = ZSTD_buildSeqStore(zc, src, srcSize);
        FORWARD_IF_ERROR(bss, "ZSTD_buildSeqStore failed");
        if (bss == ZSTDbss_noCompress) { cSize = 0; goto out; }
    }

    /* Sequence collection mode : export the sequences and stop here.
     * This is the only place where collection happens; no second check
     * is needed after entropy compression since this branch always returns. */
    if (zc->seqCollector.collectSequences) {
        ZSTD_copyBlockSequences(zc);
        ZSTD_confirmRepcodesAndEntropyTables(zc);
        return 0;
    }

    /* encode sequences and literals */
    cSize = ZSTD_entropyCompressSequences(&zc->seqStore,
            &zc->blockState.prevCBlock->entropy, &zc->blockState.nextCBlock->entropy,
            &zc->appliedParams,
            dst, dstCapacity,
            srcSize,
            zc->entropyWorkspace, ENTROPY_WORKSPACE_SIZE /* statically allocated in resetCCtx */,
            zc->bmi2);

    if (frame &&
        /* We don't want to emit our first block as a RLE even if it qualifies because
         * doing so will cause the decoder (cli only) to throw a "should consume all input error."
         * This is only an issue for zstd <= v1.4.3
         */
        !zc->isFirstBlock &&
        cSize < rleMaxLength &&
        ZSTD_isRLE(ip, srcSize))
    {
        cSize = 1;
        op[0] = ip[0];
    }

out:
    /* repcodes and entropy tables are only confirmed for an actual compressed block */
    if (!ZSTD_isError(cSize) && cSize > 1) {
        ZSTD_confirmRepcodesAndEntropyTables(zc);
    }
    /* We check that dictionaries have offset codes available for the first
     * block. After the first block, the offcode table might not have large
     * enough codes to represent the offsets in the data.
     */
    if (zc->blockState.prevCBlock->entropy.fse.offcode_repeatMode == FSE_repeat_valid)
        zc->blockState.prevCBlock->entropy.fse.offcode_repeatMode = FSE_repeat_check;

    return cSize;
}
2731*a28cd43dSSascha Wildner
/* ZSTD_compressBlock_targetCBlockSize_body() :
 * Emits one complete block into `dst`, trying in this order :
 *  1. an RLE block, when the block is not the first one and tests as RLE,
 *  2. superblock compression, when its result is small enough,
 *  3. a raw uncompressed block.
 * Steps 1 and 2 are only attempted when `bss` == ZSTDbss_compress.
 * @return : value returned by whichever emitter was selected,
 *           or an error code */
static size_t ZSTD_compressBlock_targetCBlockSize_body(ZSTD_CCtx* zc,
                               void* dst, size_t dstCapacity,
                               const void* src, size_t srcSize,
                               const size_t bss, U32 lastBlock)
{
    DEBUGLOG(6, "Attempting ZSTD_compressSuperBlock()");
    if (bss == ZSTDbss_compress) {
        /* We don't want to emit our first block as a RLE even if it qualifies because
         * doing so will cause the decoder (cli only) to throw a "should consume all input error."
         * This is only an issue for zstd <= v1.4.3
         */
        int const emitRLE = !zc->isFirstBlock
                         && ZSTD_maybeRLE(&zc->seqStore)
                         && ZSTD_isRLE((BYTE const*)src, srcSize);
        if (emitRLE) {
            return ZSTD_rleCompressBlock(dst, dstCapacity, *(BYTE const*)src, srcSize, lastBlock);
        }

        /* Attempt superblock compression.
         *
         * Note that compressed size of ZSTD_compressSuperBlock() is not bound by the
         * standard ZSTD_compressBound(). This is a problem, because even if we have
         * space now, taking an extra byte now could cause us to run out of space later
         * and violate ZSTD_compressBound().
         *
         * Define blockBound(blockSize) = blockSize + ZSTD_blockHeaderSize.
         *
         * In order to respect ZSTD_compressBound() we must attempt to emit a raw
         * uncompressed block in these cases:
         *   * cSize == 0: Return code for an uncompressed block.
         *   * cSize == dstSize_tooSmall: We may have expanded beyond blockBound(srcSize).
         *     ZSTD_noCompressBlock() will return dstSize_tooSmall if we are really out of
         *     output space.
         *   * cSize >= blockBound(srcSize): We have expanded the block too much so
         *     emit an uncompressed block.
         */
        {   size_t const cSize = ZSTD_compressSuperBlock(zc, dst, dstCapacity, src, srcSize, lastBlock);
            if (cSize != ERROR(dstSize_tooSmall)) {
                size_t const maxCSize = srcSize - ZSTD_minGain(srcSize, zc->appliedParams.cParams.strategy);
                /* any error other than dstSize_tooSmall is fatal */
                FORWARD_IF_ERROR(cSize, "ZSTD_compressSuperBlock failed");
                if (cSize != 0 && cSize < maxCSize + ZSTD_blockHeaderSize) {
                    ZSTD_confirmRepcodesAndEntropyTables(zc);
                    return cSize;
                }
            }
        }
    }

    DEBUGLOG(6, "Resorting to ZSTD_noCompressBlock()");
    /* Superblock compression failed, attempt to emit a single no compress block.
     * The decoder will be able to stream this block since it is uncompressed.
     */
    return ZSTD_noCompressBlock(dst, dstCapacity, src, srcSize, lastBlock);
}
2786*a28cd43dSSascha Wildner
/* ZSTD_compressBlock_targetCBlockSize() :
 * Builds the sequences for one block, then hands over to
 * ZSTD_compressBlock_targetCBlockSize_body() to emit it.
 * Afterwards, an offcode table flagged FSE_repeat_valid
 * is downgraded to FSE_repeat_check.
 * @return : value returned by the body, or an error code */
static size_t ZSTD_compressBlock_targetCBlockSize(ZSTD_CCtx* zc,
                               void* dst, size_t dstCapacity,
                               const void* src, size_t srcSize,
                               U32 lastBlock)
{
    size_t const bss = ZSTD_buildSeqStore(zc, src, srcSize);
    DEBUGLOG(5, "ZSTD_compressBlock_targetCBlockSize (dstCapacity=%u, dictLimit=%u, nextToUpdate=%u, srcSize=%zu)",
                (unsigned)dstCapacity, (unsigned)zc->blockState.matchState.window.dictLimit, (unsigned)zc->blockState.matchState.nextToUpdate, srcSize);
    FORWARD_IF_ERROR(bss, "ZSTD_buildSeqStore failed");

    {   size_t const cSize = ZSTD_compressBlock_targetCBlockSize_body(zc, dst, dstCapacity, src, srcSize, bss, lastBlock);
        FORWARD_IF_ERROR(cSize, "ZSTD_compressBlock_targetCBlockSize_body failed");

        if (zc->blockState.prevCBlock->entropy.fse.offcode_repeatMode == FSE_repeat_valid) {
            zc->blockState.prevCBlock->entropy.fse.offcode_repeatMode = FSE_repeat_check;
        }
        return cSize;
    }
}
2806*a28cd43dSSascha Wildner
/* ZSTD_overflowCorrectIfNeeded() :
 * Does nothing unless ZSTD_window_needOverflowCorrection() reports that
 * processing up to `iend` requires it. Otherwise :
 *  - the window is corrected and table indexes are reduced by the same amount,
 *  - ms->nextToUpdate is lowered by that amount, saturating at 0,
 *  - dictionary references held by `ms` are dropped. */
static void ZSTD_overflowCorrectIfNeeded(ZSTD_matchState_t* ms,
                                         ZSTD_cwksp* ws,
                                         ZSTD_CCtx_params const* params,
                                         void const* ip,
                                         void const* iend)
{
    if (!ZSTD_window_needOverflowCorrection(ms->window, iend)) return;

    {   U32 const maxDist = (U32)1 << params->cParams.windowLog;
        U32 const cycleLog = ZSTD_cycleLog(params->cParams.chainLog, params->cParams.strategy);
        U32 const correction = ZSTD_window_correctOverflow(&ms->window, cycleLog, maxDist, ip);
        ZSTD_STATIC_ASSERT(ZSTD_CHAINLOG_MAX <= 30);
        ZSTD_STATIC_ASSERT(ZSTD_WINDOWLOG_MAX_32 <= 30);
        ZSTD_STATIC_ASSERT(ZSTD_WINDOWLOG_MAX <= 31);

        /* tables are flagged dirty for the duration of the index reduction */
        ZSTD_cwksp_mark_tables_dirty(ws);
        ZSTD_reduceIndex(ms, params, correction);
        ZSTD_cwksp_mark_tables_clean(ws);

        ms->nextToUpdate = (ms->nextToUpdate < correction) ? 0 : ms->nextToUpdate - correction;

        /* invalidate dictionaries on overflow correction */
        ms->loadedDictEnd = 0;
        ms->dictMatchState = NULL;
    }
}
2830*a28cd43dSSascha Wildner
2831*a28cd43dSSascha Wildner /*! ZSTD_compress_frameChunk() :
2832*a28cd43dSSascha Wildner * Compress a chunk of data into one or multiple blocks.
2833*a28cd43dSSascha Wildner * All blocks will be terminated, all input will be consumed.
2834*a28cd43dSSascha Wildner * Function will issue an error if there is not enough `dstCapacity` to hold the compressed content.
2835*a28cd43dSSascha Wildner * Frame is supposed already started (header already produced)
2836*a28cd43dSSascha Wildner * @return : compressed size, or an error code
2837*a28cd43dSSascha Wildner */
ZSTD_compress_frameChunk(ZSTD_CCtx * cctx,void * dst,size_t dstCapacity,const void * src,size_t srcSize,U32 lastFrameChunk)2838*a28cd43dSSascha Wildner static size_t ZSTD_compress_frameChunk (ZSTD_CCtx* cctx,
2839*a28cd43dSSascha Wildner void* dst, size_t dstCapacity,
2840*a28cd43dSSascha Wildner const void* src, size_t srcSize,
2841*a28cd43dSSascha Wildner U32 lastFrameChunk)
2842*a28cd43dSSascha Wildner {
2843*a28cd43dSSascha Wildner size_t blockSize = cctx->blockSize;
2844*a28cd43dSSascha Wildner size_t remaining = srcSize;
2845*a28cd43dSSascha Wildner const BYTE* ip = (const BYTE*)src;
2846*a28cd43dSSascha Wildner BYTE* const ostart = (BYTE*)dst;
2847*a28cd43dSSascha Wildner BYTE* op = ostart;
2848*a28cd43dSSascha Wildner U32 const maxDist = (U32)1 << cctx->appliedParams.cParams.windowLog;
2849*a28cd43dSSascha Wildner
2850*a28cd43dSSascha Wildner assert(cctx->appliedParams.cParams.windowLog <= ZSTD_WINDOWLOG_MAX);
2851*a28cd43dSSascha Wildner
2852*a28cd43dSSascha Wildner DEBUGLOG(4, "ZSTD_compress_frameChunk (blockSize=%u)", (unsigned)blockSize);
2853*a28cd43dSSascha Wildner if (cctx->appliedParams.fParams.checksumFlag && srcSize)
2854*a28cd43dSSascha Wildner XXH64_update(&cctx->xxhState, src, srcSize);
2855*a28cd43dSSascha Wildner
2856*a28cd43dSSascha Wildner while (remaining) {
2857*a28cd43dSSascha Wildner ZSTD_matchState_t* const ms = &cctx->blockState.matchState;
2858*a28cd43dSSascha Wildner U32 const lastBlock = lastFrameChunk & (blockSize >= remaining);
2859*a28cd43dSSascha Wildner
2860*a28cd43dSSascha Wildner RETURN_ERROR_IF(dstCapacity < ZSTD_blockHeaderSize + MIN_CBLOCK_SIZE,
2861*a28cd43dSSascha Wildner dstSize_tooSmall,
2862*a28cd43dSSascha Wildner "not enough space to store compressed block");
2863*a28cd43dSSascha Wildner if (remaining < blockSize) blockSize = remaining;
2864*a28cd43dSSascha Wildner
2865*a28cd43dSSascha Wildner ZSTD_overflowCorrectIfNeeded(
2866*a28cd43dSSascha Wildner ms, &cctx->workspace, &cctx->appliedParams, ip, ip + blockSize);
2867*a28cd43dSSascha Wildner ZSTD_checkDictValidity(&ms->window, ip + blockSize, maxDist, &ms->loadedDictEnd, &ms->dictMatchState);
2868*a28cd43dSSascha Wildner
2869*a28cd43dSSascha Wildner /* Ensure hash/chain table insertion resumes no sooner than lowlimit */
2870*a28cd43dSSascha Wildner if (ms->nextToUpdate < ms->window.lowLimit) ms->nextToUpdate = ms->window.lowLimit;
2871*a28cd43dSSascha Wildner
2872*a28cd43dSSascha Wildner { size_t cSize;
2873*a28cd43dSSascha Wildner if (ZSTD_useTargetCBlockSize(&cctx->appliedParams)) {
2874*a28cd43dSSascha Wildner cSize = ZSTD_compressBlock_targetCBlockSize(cctx, op, dstCapacity, ip, blockSize, lastBlock);
2875*a28cd43dSSascha Wildner FORWARD_IF_ERROR(cSize, "ZSTD_compressBlock_targetCBlockSize failed");
2876*a28cd43dSSascha Wildner assert(cSize > 0);
2877*a28cd43dSSascha Wildner assert(cSize <= blockSize + ZSTD_blockHeaderSize);
2878*a28cd43dSSascha Wildner } else {
2879*a28cd43dSSascha Wildner cSize = ZSTD_compressBlock_internal(cctx,
2880*a28cd43dSSascha Wildner op+ZSTD_blockHeaderSize, dstCapacity-ZSTD_blockHeaderSize,
2881*a28cd43dSSascha Wildner ip, blockSize, 1 /* frame */);
2882*a28cd43dSSascha Wildner FORWARD_IF_ERROR(cSize, "ZSTD_compressBlock_internal failed");
2883*a28cd43dSSascha Wildner
2884*a28cd43dSSascha Wildner if (cSize == 0) { /* block is not compressible */
2885*a28cd43dSSascha Wildner cSize = ZSTD_noCompressBlock(op, dstCapacity, ip, blockSize, lastBlock);
2886*a28cd43dSSascha Wildner FORWARD_IF_ERROR(cSize, "ZSTD_noCompressBlock failed");
2887*a28cd43dSSascha Wildner } else {
2888*a28cd43dSSascha Wildner U32 const cBlockHeader = cSize == 1 ?
2889*a28cd43dSSascha Wildner lastBlock + (((U32)bt_rle)<<1) + (U32)(blockSize << 3) :
2890*a28cd43dSSascha Wildner lastBlock + (((U32)bt_compressed)<<1) + (U32)(cSize << 3);
2891*a28cd43dSSascha Wildner MEM_writeLE24(op, cBlockHeader);
2892*a28cd43dSSascha Wildner cSize += ZSTD_blockHeaderSize;
2893*a28cd43dSSascha Wildner }
2894*a28cd43dSSascha Wildner }
2895*a28cd43dSSascha Wildner
2896*a28cd43dSSascha Wildner
2897*a28cd43dSSascha Wildner ip += blockSize;
2898*a28cd43dSSascha Wildner assert(remaining >= blockSize);
2899*a28cd43dSSascha Wildner remaining -= blockSize;
2900*a28cd43dSSascha Wildner op += cSize;
2901*a28cd43dSSascha Wildner assert(dstCapacity >= cSize);
2902*a28cd43dSSascha Wildner dstCapacity -= cSize;
2903*a28cd43dSSascha Wildner cctx->isFirstBlock = 0;
2904*a28cd43dSSascha Wildner DEBUGLOG(5, "ZSTD_compress_frameChunk: adding a block of size %u",
2905*a28cd43dSSascha Wildner (unsigned)cSize);
2906*a28cd43dSSascha Wildner } }
2907*a28cd43dSSascha Wildner
2908*a28cd43dSSascha Wildner if (lastFrameChunk && (op>ostart)) cctx->stage = ZSTDcs_ending;
2909*a28cd43dSSascha Wildner return (size_t)(op-ostart);
2910*a28cd43dSSascha Wildner }
2911*a28cd43dSSascha Wildner
2912*a28cd43dSSascha Wildner
/* ZSTD_writeFrameHeader() :
 * Writes a frame header into `dst`, in this order :
 *  - the magic number (only when params->format == ZSTD_f_zstd1),
 *  - the frame header descriptor byte,
 *  - the window descriptor byte (skipped for single-segment frames),
 *  - the dictionary ID, on 0, 1, 2 or 4 bytes,
 *  - the frame content size, on 0, 1, 2, 4 or 8 bytes.
 * @return : nb of bytes written into `dst`,
 *           or dstSize_tooSmall when dstCapacity < ZSTD_FRAMEHEADERSIZE_MAX */
static size_t ZSTD_writeFrameHeader(void* dst, size_t dstCapacity,
                                    const ZSTD_CCtx_params* params, U64 pledgedSrcSize, U32 dictID)
{
    BYTE* const op = (BYTE*)dst;
    U32   const dictIDSizeCodeLength = (dictID>0) + (dictID>=256) + (dictID>=65536);   /* 0-3 */
    U32   const dictIDSizeCode = params->fParams.noDictIDFlag ? 0 : dictIDSizeCodeLength;   /* 0-3 */
    U32   const checksumFlag = params->fParams.checksumFlag>0;
    U32   const windowSize = (U32)1 << params->cParams.windowLog;
    U32   const singleSegment = params->fParams.contentSizeFlag && (windowSize >= pledgedSrcSize);
    BYTE  const windowLogByte = (BYTE)((params->cParams.windowLog - ZSTD_WINDOWLOG_ABSOLUTEMIN) << 3);
    U32   const fcsCode = params->fParams.contentSizeFlag ?
                     (pledgedSrcSize>=256) + (pledgedSrcSize>=65536+256) + (pledgedSrcSize>=0xFFFFFFFFU) : 0;  /* 0-3 */
    BYTE  const frameHeaderDescriptionByte = (BYTE)(dictIDSizeCode + (checksumFlag<<2) + (singleSegment<<5) + (fcsCode<<6) );
    size_t pos = 0;

    assert(!(params->fParams.contentSizeFlag && pledgedSrcSize == ZSTD_CONTENTSIZE_UNKNOWN));
    RETURN_ERROR_IF(dstCapacity < ZSTD_FRAMEHEADERSIZE_MAX, dstSize_tooSmall,
                    "dst buf is too small to fit worst-case frame header size.");
    DEBUGLOG(4, "ZSTD_writeFrameHeader : dictIDFlag : %u ; dictID : %u ; dictIDSizeCode : %u",
                !params->fParams.noDictIDFlag, (unsigned)dictID, (unsigned)dictIDSizeCode);

    if (params->format == ZSTD_f_zstd1) {
        MEM_writeLE32(op, ZSTD_MAGICNUMBER);
        pos = 4;
    }

    op[pos] = frameHeaderDescriptionByte;
    pos++;
    if (!singleSegment) {
        op[pos] = windowLogByte;
        pos++;
    }

    /* dictionary ID */
    switch(dictIDSizeCode)
    {
        case 0 : break;
        case 1 : op[pos++] = (BYTE)(dictID); break;
        case 2 : MEM_writeLE16(op+pos, (U16)dictID); pos+=2; break;
        case 3 : MEM_writeLE32(op+pos, dictID); pos+=4; break;
        default: assert(0); /* impossible */
                 break;
    }

    /* frame content size */
    switch(fcsCode)
    {
        case 0 : if (singleSegment) { op[pos] = (BYTE)(pledgedSrcSize); pos++; }
                 break;
        case 1 : MEM_writeLE16(op+pos, (U16)(pledgedSrcSize-256)); pos+=2; break;
        case 2 : MEM_writeLE32(op+pos, (U32)(pledgedSrcSize)); pos+=4; break;
        case 3 : MEM_writeLE64(op+pos, (U64)(pledgedSrcSize)); pos+=8; break;
        default: assert(0); /* impossible */
                 break;
    }
    return pos;
}
2956*a28cd43dSSascha Wildner
2957*a28cd43dSSascha Wildner /* ZSTD_writeLastEmptyBlock() :
2958*a28cd43dSSascha Wildner * output an empty Block with end-of-frame mark to complete a frame
2959*a28cd43dSSascha Wildner * @return : size of data written into `dst` (== ZSTD_blockHeaderSize (defined in zstd_internal.h))
2960*a28cd43dSSascha Wildner * or an error code if `dstCapacity` is too small (<ZSTD_blockHeaderSize)
2961*a28cd43dSSascha Wildner */
ZSTD_writeLastEmptyBlock(void * dst,size_t dstCapacity)2962*a28cd43dSSascha Wildner size_t ZSTD_writeLastEmptyBlock(void* dst, size_t dstCapacity)
2963*a28cd43dSSascha Wildner {
2964*a28cd43dSSascha Wildner RETURN_ERROR_IF(dstCapacity < ZSTD_blockHeaderSize, dstSize_tooSmall,
2965*a28cd43dSSascha Wildner "dst buf is too small to write frame trailer empty block.");
2966*a28cd43dSSascha Wildner { U32 const cBlockHeader24 = 1 /*lastBlock*/ + (((U32)bt_raw)<<1); /* 0 size */
2967*a28cd43dSSascha Wildner MEM_writeLE24(dst, cBlockHeader24);
2968*a28cd43dSSascha Wildner return ZSTD_blockHeaderSize;
2969*a28cd43dSSascha Wildner }
2970*a28cd43dSSascha Wildner }
2971*a28cd43dSSascha Wildner
/* ZSTD_referenceExternalSequences() :
 * Installs `seq` (`nbSeq` entries) as the external sequence store of `cctx`.
 * The array is referenced, not copied, and reading restarts from its first entry.
 * Rejected unless cctx->stage == ZSTDcs_init, and rejected when LDM is enabled
 * in the applied parameters.
 * @return : 0, or an error code (stage_wrong, parameter_unsupported)
 */
size_t ZSTD_referenceExternalSequences(ZSTD_CCtx* cctx, rawSeq* seq, size_t nbSeq)
{
    RETURN_ERROR_IF(cctx->stage != ZSTDcs_init, stage_wrong,
                    "wrong cctx stage");
    RETURN_ERROR_IF(cctx->appliedParams.ldmParams.enableLdm,
                    parameter_unsupported,
                    "incompatible with ldm");

    /* rewind read position */
    cctx->externSeqStore.pos = 0;
    cctx->externSeqStore.posInSequence = 0;
    /* the store is exactly as large as the provided array */
    cctx->externSeqStore.size = nbSeq;
    cctx->externSeqStore.capacity = nbSeq;
    cctx->externSeqStore.seq = seq;
    return 0;
}
2986*a28cd43dSSascha Wildner
2987*a28cd43dSSascha Wildner
/* ZSTD_compressContinue_internal() :
 * Shared implementation of frame-mode and block-mode incremental compression.
 * `frame` != 0 : on the first call after init, a frame header is written first
 *                and the stage moves to ZSTDcs_ongoing; input goes through
 *                ZSTD_compress_frameChunk().
 * `frame` == 0 : block mode; input goes through ZSTD_compressBlock_internal().
 * With srcSize == 0, nothing is compressed : only the header size (possibly 0) is returned.
 * When a source size was pledged, consuming more than pledged is an error (srcSize_wrong).
 * @return : nb of bytes written into `dst` (frame header included), or an error code
 */
static size_t ZSTD_compressContinue_internal (ZSTD_CCtx* cctx,
                                              void* dst, size_t dstCapacity,
                                        const void* src, size_t srcSize,
                                              U32 frame, U32 lastFrameChunk)
{
    ZSTD_matchState_t* const matchState = &cctx->blockState.matchState;
    size_t headerSize = 0;

    DEBUGLOG(5, "ZSTD_compressContinue_internal, stage: %u, srcSize: %u",
                cctx->stage, (unsigned)srcSize);
    RETURN_ERROR_IF(cctx->stage==ZSTDcs_created, stage_wrong,
                    "missing init (ZSTD_compressBegin)");

    if (frame && (cctx->stage==ZSTDcs_init)) {
        /* first chunk of a frame : emit the header, then shrink the output window accordingly */
        headerSize = ZSTD_writeFrameHeader(dst, dstCapacity, &cctx->appliedParams,
                                           cctx->pledgedSrcSizePlusOne-1, cctx->dictID);
        FORWARD_IF_ERROR(headerSize, "ZSTD_writeFrameHeader failed");
        assert(headerSize <= dstCapacity);
        dst = (char*)dst + headerSize;
        dstCapacity -= headerSize;
        cctx->stage = ZSTDcs_ongoing;
    }

    if (srcSize == 0) {
        return headerSize;  /* do not generate an empty block if no input */
    }

    if (!ZSTD_window_update(&matchState->window, src, srcSize)) {
        matchState->nextToUpdate = matchState->window.dictLimit;
    }
    if (cctx->appliedParams.ldmParams.enableLdm) {
        ZSTD_window_update(&cctx->ldmState.window, src, srcSize);
    }

    if (!frame) {
        /* overflow check and correction for block mode */
        ZSTD_overflowCorrectIfNeeded(
            matchState, &cctx->workspace, &cctx->appliedParams,
            src, (BYTE const*)src + srcSize);
    }

    DEBUGLOG(5, "ZSTD_compressContinue_internal (blockSize=%u)", (unsigned)cctx->blockSize);
    {   size_t cSize;
        if (frame) {
            cSize = ZSTD_compress_frameChunk (cctx, dst, dstCapacity, src, srcSize, lastFrameChunk);
        } else {
            cSize = ZSTD_compressBlock_internal (cctx, dst, dstCapacity, src, srcSize, 0 /* frame */);
        }
        FORWARD_IF_ERROR(cSize, "%s", frame ? "ZSTD_compress_frameChunk failed" : "ZSTD_compressBlock_internal failed");

        cctx->consumedSrcSize += srcSize;
        cctx->producedCSize += (cSize + headerSize);
        assert(!(cctx->appliedParams.fParams.contentSizeFlag && cctx->pledgedSrcSizePlusOne == 0));
        if (cctx->pledgedSrcSizePlusOne != 0) {  /* control src size */
            ZSTD_STATIC_ASSERT(ZSTD_CONTENTSIZE_UNKNOWN == (unsigned long long)-1);
            RETURN_ERROR_IF(
                cctx->consumedSrcSize+1 > cctx->pledgedSrcSizePlusOne,
                srcSize_wrong,
                "error : pledgedSrcSize = %u, while realSrcSize >= %u",
                (unsigned)cctx->pledgedSrcSizePlusOne-1,
                (unsigned)cctx->consumedSrcSize);
        }
        return cSize + headerSize;
    }
}
3047*a28cd43dSSascha Wildner
/* ZSTD_compressContinue() :
 * Frame-mode entry point : forwards to ZSTD_compressContinue_internal()
 * with frame mode enabled and the chunk not flagged as last.
 * @return : value returned by ZSTD_compressContinue_internal()
 */
size_t ZSTD_compressContinue (ZSTD_CCtx* cctx,
                              void* dst, size_t dstCapacity,
                        const void* src, size_t srcSize)
{
    U32 const frameMode = 1;
    U32 const lastChunk = 0;
    DEBUGLOG(5, "ZSTD_compressContinue (srcSize=%u)", (unsigned)srcSize);
    return ZSTD_compressContinue_internal(cctx, dst, dstCapacity, src, srcSize, frameMode, lastChunk);
}
3055*a28cd43dSSascha Wildner
3056*a28cd43dSSascha Wildner
ZSTD_getBlockSize(const ZSTD_CCtx * cctx)3057*a28cd43dSSascha Wildner size_t ZSTD_getBlockSize(const ZSTD_CCtx* cctx)
3058*a28cd43dSSascha Wildner {
3059*a28cd43dSSascha Wildner ZSTD_compressionParameters const cParams = cctx->appliedParams.cParams;
3060*a28cd43dSSascha Wildner assert(!ZSTD_checkCParams(cParams));
3061*a28cd43dSSascha Wildner return MIN (ZSTD_BLOCKSIZE_MAX, (U32)1 << cParams.windowLog);
3062*a28cd43dSSascha Wildner }
3063*a28cd43dSSascha Wildner
/* ZSTD_compressBlock() :
 * Block-mode entry point : compresses `src` through ZSTD_compressContinue_internal()
 * with frame mode disabled.
 * `srcSize` must not exceed ZSTD_getBlockSize(cctx).
 * @return : value returned by ZSTD_compressContinue_internal(),
 *           or an error code (srcSize_wrong) if the input is larger than a block
 */
size_t ZSTD_compressBlock(ZSTD_CCtx* cctx, void* dst, size_t dstCapacity, const void* src, size_t srcSize)
{
    size_t maxBlockSize;
    DEBUGLOG(5, "ZSTD_compressBlock: srcSize = %u", (unsigned)srcSize);
    maxBlockSize = ZSTD_getBlockSize(cctx);
    RETURN_ERROR_IF(srcSize > maxBlockSize, srcSize_wrong, "input is larger than a block");

    return ZSTD_compressContinue_internal(cctx, dst, dstCapacity, src, srcSize, 0 /* frame mode */, 0 /* last chunk */);
}
3072*a28cd43dSSascha Wildner
3073*a28cd43dSSascha Wildner /*! ZSTD_loadDictionaryContent() :
3074*a28cd43dSSascha Wildner * @return : 0, or an error code
3075*a28cd43dSSascha Wildner */
ZSTD_loadDictionaryContent(ZSTD_matchState_t * ms,ldmState_t * ls,ZSTD_cwksp * ws,ZSTD_CCtx_params const * params,const void * src,size_t srcSize,ZSTD_dictTableLoadMethod_e dtlm)3076*a28cd43dSSascha Wildner static size_t ZSTD_loadDictionaryContent(ZSTD_matchState_t* ms,
3077*a28cd43dSSascha Wildner ldmState_t* ls,
3078*a28cd43dSSascha Wildner ZSTD_cwksp* ws,
3079*a28cd43dSSascha Wildner ZSTD_CCtx_params const* params,
3080*a28cd43dSSascha Wildner const void* src, size_t srcSize,
3081*a28cd43dSSascha Wildner ZSTD_dictTableLoadMethod_e dtlm)
3082*a28cd43dSSascha Wildner {
3083*a28cd43dSSascha Wildner const BYTE* ip = (const BYTE*) src;
3084*a28cd43dSSascha Wildner const BYTE* const iend = ip + srcSize;
3085*a28cd43dSSascha Wildner
3086*a28cd43dSSascha Wildner ZSTD_window_update(&ms->window, src, srcSize);
3087*a28cd43dSSascha Wildner ms->loadedDictEnd = params->forceWindow ? 0 : (U32)(iend - ms->window.base);
3088*a28cd43dSSascha Wildner
3089*a28cd43dSSascha Wildner if (params->ldmParams.enableLdm && ls != NULL) {
3090*a28cd43dSSascha Wildner ZSTD_window_update(&ls->window, src, srcSize);
3091*a28cd43dSSascha Wildner ls->loadedDictEnd = params->forceWindow ? 0 : (U32)(iend - ls->window.base);
3092*a28cd43dSSascha Wildner }
3093*a28cd43dSSascha Wildner
3094*a28cd43dSSascha Wildner /* Assert that we the ms params match the params we're being given */
3095*a28cd43dSSascha Wildner ZSTD_assertEqualCParams(params->cParams, ms->cParams);
3096*a28cd43dSSascha Wildner
3097*a28cd43dSSascha Wildner if (srcSize <= HASH_READ_SIZE) return 0;
3098*a28cd43dSSascha Wildner
3099*a28cd43dSSascha Wildner while (iend - ip > HASH_READ_SIZE) {
3100*a28cd43dSSascha Wildner size_t const remaining = (size_t)(iend - ip);
3101*a28cd43dSSascha Wildner size_t const chunk = MIN(remaining, ZSTD_CHUNKSIZE_MAX);
3102*a28cd43dSSascha Wildner const BYTE* const ichunk = ip + chunk;
3103*a28cd43dSSascha Wildner
3104*a28cd43dSSascha Wildner ZSTD_overflowCorrectIfNeeded(ms, ws, params, ip, ichunk);
3105*a28cd43dSSascha Wildner
3106*a28cd43dSSascha Wildner if (params->ldmParams.enableLdm && ls != NULL)
3107*a28cd43dSSascha Wildner ZSTD_ldm_fillHashTable(ls, (const BYTE*)src, (const BYTE*)src + srcSize, ¶ms->ldmParams);
3108*a28cd43dSSascha Wildner
3109*a28cd43dSSascha Wildner switch(params->cParams.strategy)
3110*a28cd43dSSascha Wildner {
3111*a28cd43dSSascha Wildner case ZSTD_fast:
3112*a28cd43dSSascha Wildner ZSTD_fillHashTable(ms, ichunk, dtlm);
3113*a28cd43dSSascha Wildner break;
3114*a28cd43dSSascha Wildner case ZSTD_dfast:
3115*a28cd43dSSascha Wildner ZSTD_fillDoubleHashTable(ms, ichunk, dtlm);
3116*a28cd43dSSascha Wildner break;
3117*a28cd43dSSascha Wildner
3118*a28cd43dSSascha Wildner case ZSTD_greedy:
3119*a28cd43dSSascha Wildner case ZSTD_lazy:
3120*a28cd43dSSascha Wildner case ZSTD_lazy2:
3121*a28cd43dSSascha Wildner if (chunk >= HASH_READ_SIZE && ms->dedicatedDictSearch) {
3122*a28cd43dSSascha Wildner assert(chunk == remaining); /* must load everything in one go */
3123*a28cd43dSSascha Wildner ZSTD_dedicatedDictSearch_lazy_loadDictionary(ms, ichunk-HASH_READ_SIZE);
3124*a28cd43dSSascha Wildner } else if (chunk >= HASH_READ_SIZE) {
3125*a28cd43dSSascha Wildner ZSTD_insertAndFindFirstIndex(ms, ichunk-HASH_READ_SIZE);
3126*a28cd43dSSascha Wildner }
3127*a28cd43dSSascha Wildner break;
3128*a28cd43dSSascha Wildner
3129*a28cd43dSSascha Wildner case ZSTD_btlazy2: /* we want the dictionary table fully sorted */
3130*a28cd43dSSascha Wildner case ZSTD_btopt:
3131*a28cd43dSSascha Wildner case ZSTD_btultra:
3132*a28cd43dSSascha Wildner case ZSTD_btultra2:
3133*a28cd43dSSascha Wildner if (chunk >= HASH_READ_SIZE)
3134*a28cd43dSSascha Wildner ZSTD_updateTree(ms, ichunk-HASH_READ_SIZE, ichunk);
3135*a28cd43dSSascha Wildner break;
3136*a28cd43dSSascha Wildner
3137*a28cd43dSSascha Wildner default:
3138*a28cd43dSSascha Wildner assert(0); /* not possible : not a valid strategy id */
3139*a28cd43dSSascha Wildner }
3140*a28cd43dSSascha Wildner
3141*a28cd43dSSascha Wildner ip = ichunk;
3142*a28cd43dSSascha Wildner }
3143*a28cd43dSSascha Wildner
3144*a28cd43dSSascha Wildner ms->nextToUpdate = (U32)(iend - ms->window.base);
3145*a28cd43dSSascha Wildner return 0;
3146*a28cd43dSSascha Wildner }
3147*a28cd43dSSascha Wildner
3148*a28cd43dSSascha Wildner
3149*a28cd43dSSascha Wildner /* Dictionaries that assign zero probability to symbols that show up causes problems
3150*a28cd43dSSascha Wildner * when FSE encoding. Mark dictionaries with zero probability symbols as FSE_repeat_check
3151*a28cd43dSSascha Wildner * and only dictionaries with 100% valid symbols can be assumed valid.
3152*a28cd43dSSascha Wildner */
ZSTD_dictNCountRepeat(short * normalizedCounter,unsigned dictMaxSymbolValue,unsigned maxSymbolValue)3153*a28cd43dSSascha Wildner static FSE_repeat ZSTD_dictNCountRepeat(short* normalizedCounter, unsigned dictMaxSymbolValue, unsigned maxSymbolValue)
3154*a28cd43dSSascha Wildner {
3155*a28cd43dSSascha Wildner U32 s;
3156*a28cd43dSSascha Wildner if (dictMaxSymbolValue < maxSymbolValue) {
3157*a28cd43dSSascha Wildner return FSE_repeat_check;
3158*a28cd43dSSascha Wildner }
3159*a28cd43dSSascha Wildner for (s = 0; s <= maxSymbolValue; ++s) {
3160*a28cd43dSSascha Wildner if (normalizedCounter[s] == 0) {
3161*a28cd43dSSascha Wildner return FSE_repeat_check;
3162*a28cd43dSSascha Wildner }
3163*a28cd43dSSascha Wildner }
3164*a28cd43dSSascha Wildner return FSE_repeat_valid;
3165*a28cd43dSSascha Wildner }
3166*a28cd43dSSascha Wildner
/* ZSTD_loadCEntropy() :
 * Parses the entropy section of a dictionary and loads it into `bs` :
 * Huffman literals table, then offset-code, match-length and literal-length FSE tables,
 * then the 3 repeat offsets.
 * The first 8 bytes of `dict` (magic number and dict ID) are skipped unconditionally :
 * they are not validated here, and `dictSize` >= 8 is not checked by this function.
 * `workspace` is handed to FSE_buildCTable_wksp() with a size of HUF_WORKSPACE_SIZE.
 * @return : nb of bytes of `dict` consumed, i.e. the position where dictionary content starts,
 *           or an error code (dictionary_corrupted)
 */
size_t ZSTD_loadCEntropy(ZSTD_compressedBlockState_t* bs, void* workspace,
                         const void* const dict, size_t dictSize)
{
    short offcodeNCount[MaxOff+1];
    unsigned offcodeMaxValue = MaxOff;
    const BYTE* dictPtr = (const BYTE*)dict;
    const BYTE* const dictEnd = dictPtr + dictSize;

    dictPtr += 8;   /* skip magic num and dict ID */
    bs->entropy.huf.repeatMode = HUF_repeat_check;

    /* Huffman table for literals */
    {   unsigned maxSymbolValue = 255;
        unsigned hasZeroWeights = 1;
        size_t const hufHeaderSize = HUF_readCTable((HUF_CElt*)bs->entropy.huf.CTable, &maxSymbolValue, dictPtr,
            dictEnd-dictPtr, &hasZeroWeights);

        /* We only set the loaded table as valid if it contains all non-zero
         * weights. Otherwise, we set it to check */
        if (!hasZeroWeights) {
            bs->entropy.huf.repeatMode = HUF_repeat_valid;
        }

        RETURN_ERROR_IF(HUF_isError(hufHeaderSize), dictionary_corrupted, "");
        RETURN_ERROR_IF(maxSymbolValue < 255, dictionary_corrupted, "");
        dictPtr += hufHeaderSize;
    }

    /* FSE table for offset codes */
    {   unsigned offcodeLog;
        size_t const offcodeHeaderSize = FSE_readNCount(offcodeNCount, &offcodeMaxValue, &offcodeLog, dictPtr, dictEnd-dictPtr);
        RETURN_ERROR_IF(FSE_isError(offcodeHeaderSize), dictionary_corrupted, "");
        RETURN_ERROR_IF(offcodeLog > OffFSELog, dictionary_corrupted, "");
        /* fill all offset symbols to avoid garbage at end of table */
        RETURN_ERROR_IF(FSE_isError(FSE_buildCTable_wksp(
                bs->entropy.fse.offcodeCTable,
                offcodeNCount, MaxOff, offcodeLog,
                workspace, HUF_WORKSPACE_SIZE)),
            dictionary_corrupted, "");
        /* Defer checking offcodeMaxValue because we need to know the size of the dictionary content */
        dictPtr += offcodeHeaderSize;
    }

    /* FSE table for match lengths */
    {   short matchlengthNCount[MaxML+1];
        unsigned matchlengthMaxValue = MaxML, matchlengthLog;
        size_t const matchlengthHeaderSize = FSE_readNCount(matchlengthNCount, &matchlengthMaxValue, &matchlengthLog, dictPtr, dictEnd-dictPtr);
        RETURN_ERROR_IF(FSE_isError(matchlengthHeaderSize), dictionary_corrupted, "");
        RETURN_ERROR_IF(matchlengthLog > MLFSELog, dictionary_corrupted, "");
        RETURN_ERROR_IF(FSE_isError(FSE_buildCTable_wksp(
                bs->entropy.fse.matchlengthCTable,
                matchlengthNCount, matchlengthMaxValue, matchlengthLog,
                workspace, HUF_WORKSPACE_SIZE)),
            dictionary_corrupted, "");
        bs->entropy.fse.matchlength_repeatMode = ZSTD_dictNCountRepeat(matchlengthNCount, matchlengthMaxValue, MaxML);
        dictPtr += matchlengthHeaderSize;
    }

    /* FSE table for literal lengths */
    {   short litlengthNCount[MaxLL+1];
        unsigned litlengthMaxValue = MaxLL, litlengthLog;
        size_t const litlengthHeaderSize = FSE_readNCount(litlengthNCount, &litlengthMaxValue, &litlengthLog, dictPtr, dictEnd-dictPtr);
        RETURN_ERROR_IF(FSE_isError(litlengthHeaderSize), dictionary_corrupted, "");
        RETURN_ERROR_IF(litlengthLog > LLFSELog, dictionary_corrupted, "");
        RETURN_ERROR_IF(FSE_isError(FSE_buildCTable_wksp(
                bs->entropy.fse.litlengthCTable,
                litlengthNCount, litlengthMaxValue, litlengthLog,
                workspace, HUF_WORKSPACE_SIZE)),
            dictionary_corrupted, "");
        bs->entropy.fse.litlength_repeatMode = ZSTD_dictNCountRepeat(litlengthNCount, litlengthMaxValue, MaxLL);
        dictPtr += litlengthHeaderSize;
    }

    /* 3 repeat offsets, 4 bytes each, little-endian */
    RETURN_ERROR_IF(dictPtr+12 > dictEnd, dictionary_corrupted, "");
    bs->rep[0] = MEM_readLE32(dictPtr+0);
    bs->rep[1] = MEM_readLE32(dictPtr+4);
    bs->rep[2] = MEM_readLE32(dictPtr+8);
    dictPtr += 12;

    /* checks which depend on the size of the dictionary content */
    {   size_t const dictContentSize = (size_t)(dictEnd - dictPtr);
        U32 offcodeMax = MaxOff;
        if (dictContentSize <= ((U32)-1) - 128 KB) {
            U32 const maxOffset = (U32)dictContentSize + 128 KB; /* The maximum offset that must be supported */
            offcodeMax = ZSTD_highbit32(maxOffset); /* Calculate minimum offset code required to represent maxOffset */
        }
        /* All offset values <= dictContentSize + 128 KB must be representable for a valid table */
        bs->entropy.fse.offcode_repeatMode = ZSTD_dictNCountRepeat(offcodeNCount, offcodeMaxValue, MIN(offcodeMax, MaxOff));

        /* All repCodes must be <= dictContentSize and != 0 */
        {   U32 r;
            for (r=0; r<3; r++) {
                RETURN_ERROR_IF(bs->rep[r] == 0, dictionary_corrupted, "");
                RETURN_ERROR_IF(bs->rep[r] > dictContentSize, dictionary_corrupted, "");
            }
        }
    }

    return dictPtr - (const BYTE*)dict;
}
3258*a28cd43dSSascha Wildner
3259*a28cd43dSSascha Wildner /* Dictionary format :
3260*a28cd43dSSascha Wildner * See :
3261*a28cd43dSSascha Wildner * https://github.com/facebook/zstd/blob/release/doc/zstd_compression_format.md#dictionary-format
3262*a28cd43dSSascha Wildner */
3263*a28cd43dSSascha Wildner /*! ZSTD_loadZstdDictionary() :
3264*a28cd43dSSascha Wildner * @return : dictID, or an error code
3265*a28cd43dSSascha Wildner * assumptions : magic number supposed already checked
3266*a28cd43dSSascha Wildner * dictSize supposed >= 8
3267*a28cd43dSSascha Wildner */
ZSTD_loadZstdDictionary(ZSTD_compressedBlockState_t * bs,ZSTD_matchState_t * ms,ZSTD_cwksp * ws,ZSTD_CCtx_params const * params,const void * dict,size_t dictSize,ZSTD_dictTableLoadMethod_e dtlm,void * workspace)3268*a28cd43dSSascha Wildner static size_t ZSTD_loadZstdDictionary(ZSTD_compressedBlockState_t* bs,
3269*a28cd43dSSascha Wildner ZSTD_matchState_t* ms,
3270*a28cd43dSSascha Wildner ZSTD_cwksp* ws,
3271*a28cd43dSSascha Wildner ZSTD_CCtx_params const* params,
3272*a28cd43dSSascha Wildner const void* dict, size_t dictSize,
3273*a28cd43dSSascha Wildner ZSTD_dictTableLoadMethod_e dtlm,
3274*a28cd43dSSascha Wildner void* workspace)
3275*a28cd43dSSascha Wildner {
3276*a28cd43dSSascha Wildner const BYTE* dictPtr = (const BYTE*)dict;
3277*a28cd43dSSascha Wildner const BYTE* const dictEnd = dictPtr + dictSize;
3278*a28cd43dSSascha Wildner size_t dictID;
3279*a28cd43dSSascha Wildner size_t eSize;
3280*a28cd43dSSascha Wildner
3281*a28cd43dSSascha Wildner ZSTD_STATIC_ASSERT(HUF_WORKSPACE_SIZE >= (1<<MAX(MLFSELog,LLFSELog)));
3282*a28cd43dSSascha Wildner assert(dictSize >= 8);
3283*a28cd43dSSascha Wildner assert(MEM_readLE32(dictPtr) == ZSTD_MAGIC_DICTIONARY);
3284*a28cd43dSSascha Wildner
3285*a28cd43dSSascha Wildner dictID = params->fParams.noDictIDFlag ? 0 : MEM_readLE32(dictPtr + 4 /* skip magic number */ );
3286*a28cd43dSSascha Wildner eSize = ZSTD_loadCEntropy(bs, workspace, dict, dictSize);
3287*a28cd43dSSascha Wildner FORWARD_IF_ERROR(eSize, "ZSTD_loadCEntropy failed");
3288*a28cd43dSSascha Wildner dictPtr += eSize;
3289*a28cd43dSSascha Wildner
3290*a28cd43dSSascha Wildner {
3291*a28cd43dSSascha Wildner size_t const dictContentSize = (size_t)(dictEnd - dictPtr);
3292*a28cd43dSSascha Wildner FORWARD_IF_ERROR(ZSTD_loadDictionaryContent(
3293*a28cd43dSSascha Wildner ms, NULL, ws, params, dictPtr, dictContentSize, dtlm), "");
3294*a28cd43dSSascha Wildner }
3295*a28cd43dSSascha Wildner return dictID;
3296*a28cd43dSSascha Wildner }
3297*a28cd43dSSascha Wildner
3298*a28cd43dSSascha Wildner /** ZSTD_compress_insertDictionary() :
3299*a28cd43dSSascha Wildner * @return : dictID, or an error code */
3300*a28cd43dSSascha Wildner static size_t
ZSTD_compress_insertDictionary(ZSTD_compressedBlockState_t * bs,ZSTD_matchState_t * ms,ldmState_t * ls,ZSTD_cwksp * ws,const ZSTD_CCtx_params * params,const void * dict,size_t dictSize,ZSTD_dictContentType_e dictContentType,ZSTD_dictTableLoadMethod_e dtlm,void * workspace)3301*a28cd43dSSascha Wildner ZSTD_compress_insertDictionary(ZSTD_compressedBlockState_t* bs,
3302*a28cd43dSSascha Wildner ZSTD_matchState_t* ms,
3303*a28cd43dSSascha Wildner ldmState_t* ls,
3304*a28cd43dSSascha Wildner ZSTD_cwksp* ws,
3305*a28cd43dSSascha Wildner const ZSTD_CCtx_params* params,
3306*a28cd43dSSascha Wildner const void* dict, size_t dictSize,
3307*a28cd43dSSascha Wildner ZSTD_dictContentType_e dictContentType,
3308*a28cd43dSSascha Wildner ZSTD_dictTableLoadMethod_e dtlm,
3309*a28cd43dSSascha Wildner void* workspace)
3310*a28cd43dSSascha Wildner {
3311*a28cd43dSSascha Wildner DEBUGLOG(4, "ZSTD_compress_insertDictionary (dictSize=%u)", (U32)dictSize);
3312*a28cd43dSSascha Wildner if ((dict==NULL) || (dictSize<8)) {
3313*a28cd43dSSascha Wildner RETURN_ERROR_IF(dictContentType == ZSTD_dct_fullDict, dictionary_wrong, "");
3314*a28cd43dSSascha Wildner return 0;
3315*a28cd43dSSascha Wildner }
3316*a28cd43dSSascha Wildner
3317*a28cd43dSSascha Wildner ZSTD_reset_compressedBlockState(bs);
3318*a28cd43dSSascha Wildner
3319*a28cd43dSSascha Wildner /* dict restricted modes */
3320*a28cd43dSSascha Wildner if (dictContentType == ZSTD_dct_rawContent)
3321*a28cd43dSSascha Wildner return ZSTD_loadDictionaryContent(ms, ls, ws, params, dict, dictSize, dtlm);
3322*a28cd43dSSascha Wildner
3323*a28cd43dSSascha Wildner if (MEM_readLE32(dict) != ZSTD_MAGIC_DICTIONARY) {
3324*a28cd43dSSascha Wildner if (dictContentType == ZSTD_dct_auto) {
3325*a28cd43dSSascha Wildner DEBUGLOG(4, "raw content dictionary detected");
3326*a28cd43dSSascha Wildner return ZSTD_loadDictionaryContent(
3327*a28cd43dSSascha Wildner ms, ls, ws, params, dict, dictSize, dtlm);
3328*a28cd43dSSascha Wildner }
3329*a28cd43dSSascha Wildner RETURN_ERROR_IF(dictContentType == ZSTD_dct_fullDict, dictionary_wrong, "");
3330*a28cd43dSSascha Wildner assert(0); /* impossible */
3331*a28cd43dSSascha Wildner }
3332*a28cd43dSSascha Wildner
3333*a28cd43dSSascha Wildner /* dict as full zstd dictionary */
3334*a28cd43dSSascha Wildner return ZSTD_loadZstdDictionary(
3335*a28cd43dSSascha Wildner bs, ms, ws, params, dict, dictSize, dtlm, workspace);
3336*a28cd43dSSascha Wildner }
3337*a28cd43dSSascha Wildner
3338*a28cd43dSSascha Wildner #define ZSTD_USE_CDICT_PARAMS_SRCSIZE_CUTOFF (128 KB)
3339*a28cd43dSSascha Wildner #define ZSTD_USE_CDICT_PARAMS_DICTSIZE_MULTIPLIER (6ULL)
3340*a28cd43dSSascha Wildner
3341*a28cd43dSSascha Wildner /*! ZSTD_compressBegin_internal() :
3342*a28cd43dSSascha Wildner * @return : 0, or an error code */
ZSTD_compressBegin_internal(ZSTD_CCtx * cctx,const void * dict,size_t dictSize,ZSTD_dictContentType_e dictContentType,ZSTD_dictTableLoadMethod_e dtlm,const ZSTD_CDict * cdict,const ZSTD_CCtx_params * params,U64 pledgedSrcSize,ZSTD_buffered_policy_e zbuff)3343*a28cd43dSSascha Wildner static size_t ZSTD_compressBegin_internal(ZSTD_CCtx* cctx,
3344*a28cd43dSSascha Wildner const void* dict, size_t dictSize,
3345*a28cd43dSSascha Wildner ZSTD_dictContentType_e dictContentType,
3346*a28cd43dSSascha Wildner ZSTD_dictTableLoadMethod_e dtlm,
3347*a28cd43dSSascha Wildner const ZSTD_CDict* cdict,
3348*a28cd43dSSascha Wildner const ZSTD_CCtx_params* params, U64 pledgedSrcSize,
3349*a28cd43dSSascha Wildner ZSTD_buffered_policy_e zbuff)
3350*a28cd43dSSascha Wildner {
3351*a28cd43dSSascha Wildner DEBUGLOG(4, "ZSTD_compressBegin_internal: wlog=%u", params->cParams.windowLog);
3352*a28cd43dSSascha Wildner /* params are supposed to be fully validated at this point */
3353*a28cd43dSSascha Wildner assert(!ZSTD_isError(ZSTD_checkCParams(params->cParams)));
3354*a28cd43dSSascha Wildner assert(!((dict) && (cdict))); /* either dict or cdict, not both */
3355*a28cd43dSSascha Wildner if ( (cdict)
3356*a28cd43dSSascha Wildner && (cdict->dictContentSize > 0)
3357*a28cd43dSSascha Wildner && ( pledgedSrcSize < ZSTD_USE_CDICT_PARAMS_SRCSIZE_CUTOFF
3358*a28cd43dSSascha Wildner || pledgedSrcSize < cdict->dictContentSize * ZSTD_USE_CDICT_PARAMS_DICTSIZE_MULTIPLIER
3359*a28cd43dSSascha Wildner || pledgedSrcSize == ZSTD_CONTENTSIZE_UNKNOWN
3360*a28cd43dSSascha Wildner || cdict->compressionLevel == 0)
3361*a28cd43dSSascha Wildner && (params->attachDictPref != ZSTD_dictForceLoad) ) {
3362*a28cd43dSSascha Wildner return ZSTD_resetCCtx_usingCDict(cctx, cdict, params, pledgedSrcSize, zbuff);
3363*a28cd43dSSascha Wildner }
3364*a28cd43dSSascha Wildner
3365*a28cd43dSSascha Wildner FORWARD_IF_ERROR( ZSTD_resetCCtx_internal(cctx, *params, pledgedSrcSize,
3366*a28cd43dSSascha Wildner ZSTDcrp_makeClean, zbuff) , "");
3367*a28cd43dSSascha Wildner { size_t const dictID = cdict ?
3368*a28cd43dSSascha Wildner ZSTD_compress_insertDictionary(
3369*a28cd43dSSascha Wildner cctx->blockState.prevCBlock, &cctx->blockState.matchState,
3370*a28cd43dSSascha Wildner &cctx->ldmState, &cctx->workspace, &cctx->appliedParams, cdict->dictContent,
3371*a28cd43dSSascha Wildner cdict->dictContentSize, cdict->dictContentType, dtlm,
3372*a28cd43dSSascha Wildner cctx->entropyWorkspace)
3373*a28cd43dSSascha Wildner : ZSTD_compress_insertDictionary(
3374*a28cd43dSSascha Wildner cctx->blockState.prevCBlock, &cctx->blockState.matchState,
3375*a28cd43dSSascha Wildner &cctx->ldmState, &cctx->workspace, &cctx->appliedParams, dict, dictSize,
3376*a28cd43dSSascha Wildner dictContentType, dtlm, cctx->entropyWorkspace);
3377*a28cd43dSSascha Wildner FORWARD_IF_ERROR(dictID, "ZSTD_compress_insertDictionary failed");
3378*a28cd43dSSascha Wildner assert(dictID <= UINT_MAX);
3379*a28cd43dSSascha Wildner cctx->dictID = (U32)dictID;
3380*a28cd43dSSascha Wildner }
3381*a28cd43dSSascha Wildner return 0;
3382*a28cd43dSSascha Wildner }
3383*a28cd43dSSascha Wildner
/* ZSTD_compressBegin_advanced_internal() :
 * Validates params->cParams with ZSTD_checkCParams(), then starts compression
 * through ZSTD_compressBegin_internal() in non-buffered mode.
 * @return : 0, or an error code */
size_t ZSTD_compressBegin_advanced_internal(ZSTD_CCtx* cctx,
                                    const void* dict, size_t dictSize,
                                    ZSTD_dictContentType_e dictContentType,
                                    ZSTD_dictTableLoadMethod_e dtlm,
                                    const ZSTD_CDict* cdict,
                                    const ZSTD_CCtx_params* params,
                                    unsigned long long pledgedSrcSize)
{
    DEBUGLOG(4, "ZSTD_compressBegin_advanced_internal: wlog=%u", params->cParams.windowLog);

    /* compression parameters verification and optimization */
    FORWARD_IF_ERROR( ZSTD_checkCParams(params->cParams) , "");

    return ZSTD_compressBegin_internal(cctx,
                                       dict, dictSize, dictContentType, dtlm,
                                       cdict,
                                       params, pledgedSrcSize,
                                       ZSTDb_not_buffered);
}
3401*a28cd43dSSascha Wildner
3402*a28cd43dSSascha Wildner /*! ZSTD_compressBegin_advanced() :
3403*a28cd43dSSascha Wildner * @return : 0, or an error code */
ZSTD_compressBegin_advanced(ZSTD_CCtx * cctx,const void * dict,size_t dictSize,ZSTD_parameters params,unsigned long long pledgedSrcSize)3404*a28cd43dSSascha Wildner size_t ZSTD_compressBegin_advanced(ZSTD_CCtx* cctx,
3405*a28cd43dSSascha Wildner const void* dict, size_t dictSize,
3406*a28cd43dSSascha Wildner ZSTD_parameters params, unsigned long long pledgedSrcSize)
3407*a28cd43dSSascha Wildner {
3408*a28cd43dSSascha Wildner ZSTD_CCtx_params const cctxParams =
3409*a28cd43dSSascha Wildner ZSTD_assignParamsToCCtxParams(&cctx->requestedParams, ¶ms);
3410*a28cd43dSSascha Wildner return ZSTD_compressBegin_advanced_internal(cctx,
3411*a28cd43dSSascha Wildner dict, dictSize, ZSTD_dct_auto, ZSTD_dtlm_fast,
3412*a28cd43dSSascha Wildner NULL /*cdict*/,
3413*a28cd43dSSascha Wildner &cctxParams, pledgedSrcSize);
3414*a28cd43dSSascha Wildner }
3415*a28cd43dSSascha Wildner
/*! ZSTD_compressBegin_usingDict() :
 *  Derives parameters from `compressionLevel` and `dictSize` (source size
 *  unknown), then starts a frame with ZSTD_compressBegin_internal(), passing
 *  `dict` as ZSTD_dct_auto / ZSTD_dtlm_fast, no CDict, and
 *  ZSTD_CONTENTSIZE_UNKNOWN as pledged source size.
 * @return : the result of ZSTD_compressBegin_internal() */
size_t ZSTD_compressBegin_usingDict(ZSTD_CCtx* cctx, const void* dict, size_t dictSize, int compressionLevel)
{
    ZSTD_parameters const levelParams =
            ZSTD_getParams_internal(compressionLevel,
                                    ZSTD_CONTENTSIZE_UNKNOWN,
                                    dictSize,
                                    ZSTD_cpm_noAttachDict);
    ZSTD_CCtx_params const frameParams =
            ZSTD_assignParamsToCCtxParams(&cctx->requestedParams, &levelParams);

    DEBUGLOG(4, "ZSTD_compressBegin_usingDict (dictSize=%u)", (unsigned)dictSize);

    return ZSTD_compressBegin_internal(cctx,
                                       dict, dictSize,
                                       ZSTD_dct_auto, ZSTD_dtlm_fast,
                                       NULL /* cdict */,
                                       &frameParams,
                                       ZSTD_CONTENTSIZE_UNKNOWN,
                                       ZSTDb_not_buffered);
}
3425*a28cd43dSSascha Wildner
/*! ZSTD_compressBegin() :
 *  Same as ZSTD_compressBegin_usingDict(), called with a NULL dictionary of size 0.
 * @return : the result of ZSTD_compressBegin_usingDict() */
size_t ZSTD_compressBegin(ZSTD_CCtx* cctx, int compressionLevel)
{
    const void* const noDict = NULL;
    size_t const noDictSize = 0;
    return ZSTD_compressBegin_usingDict(cctx, noDict, noDictSize, compressionLevel);
}
3430*a28cd43dSSascha Wildner
3431*a28cd43dSSascha Wildner
3432*a28cd43dSSascha Wildner /*! ZSTD_writeEpilogue() :
3433*a28cd43dSSascha Wildner * Ends a frame.
3434*a28cd43dSSascha Wildner * @return : nb of bytes written into dst (or an error code) */
ZSTD_writeEpilogue(ZSTD_CCtx * cctx,void * dst,size_t dstCapacity)3435*a28cd43dSSascha Wildner static size_t ZSTD_writeEpilogue(ZSTD_CCtx* cctx, void* dst, size_t dstCapacity)
3436*a28cd43dSSascha Wildner {
3437*a28cd43dSSascha Wildner BYTE* const ostart = (BYTE*)dst;
3438*a28cd43dSSascha Wildner BYTE* op = ostart;
3439*a28cd43dSSascha Wildner size_t fhSize = 0;
3440*a28cd43dSSascha Wildner
3441*a28cd43dSSascha Wildner DEBUGLOG(4, "ZSTD_writeEpilogue");
3442*a28cd43dSSascha Wildner RETURN_ERROR_IF(cctx->stage == ZSTDcs_created, stage_wrong, "init missing");
3443*a28cd43dSSascha Wildner
3444*a28cd43dSSascha Wildner /* special case : empty frame */
3445*a28cd43dSSascha Wildner if (cctx->stage == ZSTDcs_init) {
3446*a28cd43dSSascha Wildner fhSize = ZSTD_writeFrameHeader(dst, dstCapacity, &cctx->appliedParams, 0, 0);
3447*a28cd43dSSascha Wildner FORWARD_IF_ERROR(fhSize, "ZSTD_writeFrameHeader failed");
3448*a28cd43dSSascha Wildner dstCapacity -= fhSize;
3449*a28cd43dSSascha Wildner op += fhSize;
3450*a28cd43dSSascha Wildner cctx->stage = ZSTDcs_ongoing;
3451*a28cd43dSSascha Wildner }
3452*a28cd43dSSascha Wildner
3453*a28cd43dSSascha Wildner if (cctx->stage != ZSTDcs_ending) {
3454*a28cd43dSSascha Wildner /* write one last empty block, make it the "last" block */
3455*a28cd43dSSascha Wildner U32 const cBlockHeader24 = 1 /* last block */ + (((U32)bt_raw)<<1) + 0;
3456*a28cd43dSSascha Wildner RETURN_ERROR_IF(dstCapacity<4, dstSize_tooSmall, "no room for epilogue");
3457*a28cd43dSSascha Wildner MEM_writeLE32(op, cBlockHeader24);
3458*a28cd43dSSascha Wildner op += ZSTD_blockHeaderSize;
3459*a28cd43dSSascha Wildner dstCapacity -= ZSTD_blockHeaderSize;
3460*a28cd43dSSascha Wildner }
3461*a28cd43dSSascha Wildner
3462*a28cd43dSSascha Wildner if (cctx->appliedParams.fParams.checksumFlag) {
3463*a28cd43dSSascha Wildner U32 const checksum = (U32) XXH64_digest(&cctx->xxhState);
3464*a28cd43dSSascha Wildner RETURN_ERROR_IF(dstCapacity<4, dstSize_tooSmall, "no room for checksum");
3465*a28cd43dSSascha Wildner DEBUGLOG(4, "ZSTD_writeEpilogue: write checksum : %08X", (unsigned)checksum);
3466*a28cd43dSSascha Wildner MEM_writeLE32(op, checksum);
3467*a28cd43dSSascha Wildner op += 4;
3468*a28cd43dSSascha Wildner }
3469*a28cd43dSSascha Wildner
3470*a28cd43dSSascha Wildner cctx->stage = ZSTDcs_created; /* return to "created but no init" status */
3471*a28cd43dSSascha Wildner return op-ostart;
3472*a28cd43dSSascha Wildner }
3473*a28cd43dSSascha Wildner
/*! ZSTD_compressEnd() :
 *  Compresses `src` as the last chunk of the current frame, then appends the
 *  epilogue produced by ZSTD_writeEpilogue().
 *  When a source size was pledged (cctx->pledgedSrcSizePlusOne != 0), it is
 *  compared against the amount consumed; a mismatch yields srcSize_wrong.
 *  Note : this comparison takes place after the epilogue has been written.
 * @return : nb of bytes written into dst (last chunk + epilogue),
 *           or an error code */
size_t ZSTD_compressEnd (ZSTD_CCtx* cctx,
                         void* dst, size_t dstCapacity,
                   const void* src, size_t srcSize)
{
    size_t const cSize = ZSTD_compressContinue_internal(cctx,
                                dst, dstCapacity,
                                src, srcSize,
                                1 /* frame mode */, 1 /* last chunk */);
    FORWARD_IF_ERROR(cSize, "ZSTD_compressContinue_internal failed");

    {   size_t const endResult = ZSTD_writeEpilogue(cctx, (char*)dst + cSize, dstCapacity-cSize);
        FORWARD_IF_ERROR(endResult, "ZSTD_writeEpilogue failed");

        assert(!(cctx->appliedParams.fParams.contentSizeFlag && cctx->pledgedSrcSizePlusOne == 0));

        /* nothing pledged : no size to control */
        if (cctx->pledgedSrcSizePlusOne == 0) {
            return cSize + endResult;
        }

        /* control src size */
        ZSTD_STATIC_ASSERT(ZSTD_CONTENTSIZE_UNKNOWN == (unsigned long long)-1);
        DEBUGLOG(4, "end of frame : controlling src size");
        RETURN_ERROR_IF(
            cctx->pledgedSrcSizePlusOne != cctx->consumedSrcSize+1,
            srcSize_wrong,
            "error : pledgedSrcSize = %u, while realSrcSize = %u",
            (unsigned)cctx->pledgedSrcSizePlusOne-1,
            (unsigned)cctx->consumedSrcSize);

        return cSize + endResult;
    }
}
3498*a28cd43dSSascha Wildner
/* ZSTD_compress_internal() :
 * Combines `params` with cctx->requestedParams through
 * ZSTD_assignParamsToCCtxParams(), then hands the resulting ZSTD_CCtx_params
 * to ZSTD_compress_advanced_internal().
 * @return : the result of ZSTD_compress_advanced_internal() */
static size_t ZSTD_compress_internal (ZSTD_CCtx* cctx,
                                      void* dst, size_t dstCapacity,
                                const void* src, size_t srcSize,
                                const void* dict,size_t dictSize,
                                const ZSTD_parameters* params)
{
    ZSTD_CCtx_params const mergedParams =
            ZSTD_assignParamsToCCtxParams(&cctx->requestedParams, params);

    DEBUGLOG(4, "ZSTD_compress_internal");

    return ZSTD_compress_advanced_internal(cctx,
                                           dst, dstCapacity,
                                           src, srcSize,
                                           dict, dictSize,
                                           &mergedParams);
}
3514*a28cd43dSSascha Wildner
/*! ZSTD_compress_advanced() :
 *  Validates `params.cParams` with ZSTD_checkCParams(), then compresses
 *  through ZSTD_compress_internal() using the caller-provided parameters.
 * @return : the result of ZSTD_compress_internal(),
 *           or the error code reported by ZSTD_checkCParams() */
size_t ZSTD_compress_advanced (ZSTD_CCtx* cctx,
                               void* dst, size_t dstCapacity,
                         const void* src, size_t srcSize,
                         const void* dict,size_t dictSize,
                               ZSTD_parameters params)
{
    DEBUGLOG(4, "ZSTD_compress_advanced");

    /* invalid compression parameters are reported before any work starts */
    FORWARD_IF_ERROR(ZSTD_checkCParams(params.cParams), "");

    {   const ZSTD_parameters* const checkedParams = &params;
        return ZSTD_compress_internal(cctx,
                                      dst, dstCapacity,
                                      src, srcSize,
                                      dict, dictSize,
                                      checkedParams);
    }
}
3529*a28cd43dSSascha Wildner
3530*a28cd43dSSascha Wildner /* Internal */
ZSTD_compress_advanced_internal(ZSTD_CCtx * cctx,void * dst,size_t dstCapacity,const void * src,size_t srcSize,const void * dict,size_t dictSize,const ZSTD_CCtx_params * params)3531*a28cd43dSSascha Wildner size_t ZSTD_compress_advanced_internal(
3532*a28cd43dSSascha Wildner ZSTD_CCtx* cctx,
3533*a28cd43dSSascha Wildner void* dst, size_t dstCapacity,
3534*a28cd43dSSascha Wildner const void* src, size_t srcSize,
3535*a28cd43dSSascha Wildner const void* dict,size_t dictSize,
3536*a28cd43dSSascha Wildner const ZSTD_CCtx_params* params)
3537*a28cd43dSSascha Wildner {
3538*a28cd43dSSascha Wildner DEBUGLOG(4, "ZSTD_compress_advanced_internal (srcSize:%u)", (unsigned)srcSize);
3539*a28cd43dSSascha Wildner FORWARD_IF_ERROR( ZSTD_compressBegin_internal(cctx,
3540*a28cd43dSSascha Wildner dict, dictSize, ZSTD_dct_auto, ZSTD_dtlm_fast, NULL,
3541*a28cd43dSSascha Wildner params, srcSize, ZSTDb_not_buffered) , "");
3542*a28cd43dSSascha Wildner return ZSTD_compressEnd(cctx, dst, dstCapacity, src, srcSize);
3543*a28cd43dSSascha Wildner }
3544*a28cd43dSSascha Wildner
/*! ZSTD_compress_usingDict() :
 *  Derives parameters from `compressionLevel`, `srcSize` and the dictionary
 *  size (counted as 0 when `dict` is NULL), then compresses through
 *  ZSTD_compress_advanced_internal().
 *  Note : `dictSize` itself is forwarded unchanged to the compression call.
 * @return : the result of ZSTD_compress_advanced_internal() */
size_t ZSTD_compress_usingDict(ZSTD_CCtx* cctx,
                               void* dst, size_t dstCapacity,
                         const void* src, size_t srcSize,
                         const void* dict, size_t dictSize,
                               int compressionLevel)
{
    /* a NULL dictionary contributes no size to parameter selection */
    size_t const tuningDictSize = dict ? dictSize : 0;
    ZSTD_parameters const params =
            ZSTD_getParams_internal(compressionLevel, srcSize, tuningDictSize, ZSTD_cpm_noAttachDict);
    ZSTD_CCtx_params const cctxParams =
            ZSTD_assignParamsToCCtxParams(&cctx->requestedParams, &params);

    DEBUGLOG(4, "ZSTD_compress_usingDict (srcSize=%u)", (unsigned)srcSize);
    assert(params.fParams.contentSizeFlag == 1);

    return ZSTD_compress_advanced_internal(cctx,
                                           dst, dstCapacity,
                                           src, srcSize,
                                           dict, dictSize,
                                           &cctxParams);
}
3557*a28cd43dSSascha Wildner
/*! ZSTD_compressCCtx() :
 *  Same as ZSTD_compress_usingDict(), called with a NULL dictionary of size 0.
 *  `cctx` must not be NULL (asserted).
 * @return : the result of ZSTD_compress_usingDict() */
size_t ZSTD_compressCCtx(ZSTD_CCtx* cctx,
                         void* dst, size_t dstCapacity,
                   const void* src, size_t srcSize,
                         int compressionLevel)
{
    const void* const noDict = NULL;
    size_t const noDictSize = 0;

    DEBUGLOG(4, "ZSTD_compressCCtx (srcSize=%u)", (unsigned)srcSize);
    assert(cctx != NULL);

    return ZSTD_compress_usingDict(cctx,
                                   dst, dstCapacity,
                                   src, srcSize,
                                   noDict, noDictSize,
                                   compressionLevel);
}
3567*a28cd43dSSascha Wildner
ZSTD_compress(void * dst,size_t dstCapacity,const void * src,size_t srcSize,int compressionLevel)3568*a28cd43dSSascha Wildner size_t ZSTD_compress(void* dst, size_t dstCapacity,
3569*a28cd43dSSascha Wildner const void* src, size_t srcSize,
3570*a28cd43dSSascha Wildner int compressionLevel)
3571*a28cd43dSSascha Wildner {
3572*a28cd43dSSascha Wildner size_t result;
3573*a28cd43dSSascha Wildner #if ZSTD_COMPRESS_HEAPMODE
3574*a28cd43dSSascha Wildner ZSTD_CCtx* cctx = ZSTD_createCCtx();
3575*a28cd43dSSascha Wildner RETURN_ERROR_IF(!cctx, memory_allocation, "ZSTD_createCCtx failed");
3576*a28cd43dSSascha Wildner result = ZSTD_compressCCtx(cctx, dst, dstCapacity, src, srcSize, compressionLevel);
3577*a28cd43dSSascha Wildner ZSTD_freeCCtx(cctx);
3578*a28cd43dSSascha Wildner #else
3579*a28cd43dSSascha Wildner ZSTD_CCtx ctxBody;
3580*a28cd43dSSascha Wildner ZSTD_initCCtx(&ctxBody, ZSTD_defaultCMem);
3581*a28cd43dSSascha Wildner result = ZSTD_compressCCtx(&ctxBody, dst, dstCapacity, src, srcSize, compressionLevel);
3582*a28cd43dSSascha Wildner ZSTD_freeCCtxContent(&ctxBody); /* can't free ctxBody itself, as it's on stack; free only heap content */
3583*a28cd43dSSascha Wildner #endif
3584*a28cd43dSSascha Wildner return result;
3585*a28cd43dSSascha Wildner }
3586*a28cd43dSSascha Wildner
3587*a28cd43dSSascha Wildner
3588*a28cd43dSSascha Wildner /* ===== Dictionary API ===== */
3589*a28cd43dSSascha Wildner
3590*a28cd43dSSascha Wildner /*! ZSTD_estimateCDictSize_advanced() :
3591*a28cd43dSSascha Wildner * Estimate amount of memory that will be needed to create a dictionary with following arguments */
ZSTD_estimateCDictSize_advanced(size_t dictSize,ZSTD_compressionParameters cParams,ZSTD_dictLoadMethod_e dictLoadMethod)3592*a28cd43dSSascha Wildner size_t ZSTD_estimateCDictSize_advanced(
3593*a28cd43dSSascha Wildner size_t dictSize, ZSTD_compressionParameters cParams,
3594*a28cd43dSSascha Wildner ZSTD_dictLoadMethod_e dictLoadMethod)
3595*a28cd43dSSascha Wildner {
3596*a28cd43dSSascha Wildner DEBUGLOG(5, "sizeof(ZSTD_CDict) : %u", (unsigned)sizeof(ZSTD_CDict));
3597*a28cd43dSSascha Wildner return ZSTD_cwksp_alloc_size(sizeof(ZSTD_CDict))
3598*a28cd43dSSascha Wildner + ZSTD_cwksp_alloc_size(HUF_WORKSPACE_SIZE)
3599*a28cd43dSSascha Wildner + ZSTD_sizeof_matchState(&cParams, /* forCCtx */ 0)
3600*a28cd43dSSascha Wildner + (dictLoadMethod == ZSTD_dlm_byRef ? 0
3601*a28cd43dSSascha Wildner : ZSTD_cwksp_alloc_size(ZSTD_cwksp_align(dictSize, sizeof(void *))));
3602*a28cd43dSSascha Wildner }
3603*a28cd43dSSascha Wildner
ZSTD_estimateCDictSize(size_t dictSize,int compressionLevel)3604*a28cd43dSSascha Wildner size_t ZSTD_estimateCDictSize(size_t dictSize, int compressionLevel)
3605*a28cd43dSSascha Wildner {
3606*a28cd43dSSascha Wildner ZSTD_compressionParameters const cParams = ZSTD_getCParams_internal(compressionLevel, ZSTD_CONTENTSIZE_UNKNOWN, dictSize, ZSTD_cpm_createCDict);
3607*a28cd43dSSascha Wildner return ZSTD_estimateCDictSize_advanced(dictSize, cParams, ZSTD_dlm_byCopy);
3608*a28cd43dSSascha Wildner }
3609*a28cd43dSSascha Wildner
ZSTD_sizeof_CDict(const ZSTD_CDict * cdict)3610*a28cd43dSSascha Wildner size_t ZSTD_sizeof_CDict(const ZSTD_CDict* cdict)
3611*a28cd43dSSascha Wildner {
3612*a28cd43dSSascha Wildner if (cdict==NULL) return 0; /* support sizeof on NULL */
3613*a28cd43dSSascha Wildner DEBUGLOG(5, "sizeof(*cdict) : %u", (unsigned)sizeof(*cdict));
3614*a28cd43dSSascha Wildner /* cdict may be in the workspace */
3615*a28cd43dSSascha Wildner return (cdict->workspace.workspace == cdict ? 0 : sizeof(*cdict))
3616*a28cd43dSSascha Wildner + ZSTD_cwksp_sizeof(&cdict->workspace);
3617*a28cd43dSSascha Wildner }
3618*a28cd43dSSascha Wildner
/* ZSTD_initCDict_internal() :
 * Fills an existing `cdict` (whose workspace is already set up) :
 * - records cParams and the dedicated-dict-search setting into the match state
 *   (the latter is cleared when dictSize > ZSTD_CHUNKSIZE_MAX);
 * - references `dictBuffer`, or copies it into the workspace when
 *   `dictLoadMethod` is not ZSTD_dlm_byRef and the buffer is non-NULL and non-empty;
 * - reserves the entropy workspace, resets block state and match state;
 * - loads the dictionary through ZSTD_compress_insertDictionary() and stores
 *   the resulting dictID.
 * Workspace reservations are performed in a fixed order : dictionary copy,
 * entropy workspace, then match state.
 * @return : 0, or an error code */
static size_t ZSTD_initCDict_internal(
                    ZSTD_CDict* cdict,
              const void* dictBuffer, size_t dictSize,
                    ZSTD_dictLoadMethod_e dictLoadMethod,
                    ZSTD_dictContentType_e dictContentType,
                    ZSTD_CCtx_params params)
{
    DEBUGLOG(3, "ZSTD_initCDict_internal (dictContentType:%u)", (unsigned)dictContentType);
    assert(!ZSTD_checkCParams(params.cParams));

    cdict->matchState.cParams = params.cParams;
    /* dedicated dict search is switched off for dictionaries above ZSTD_CHUNKSIZE_MAX */
    cdict->matchState.dedicatedDictSearch =
            (dictSize > ZSTD_CHUNKSIZE_MAX) ? 0 : params.enableDedicatedDictSearch;

    {   int const copyContent = (dictLoadMethod != ZSTD_dlm_byRef)
                             && (dictBuffer != NULL)
                             && (dictSize != 0);
        if (copyContent) {
            void* const internalBuffer = ZSTD_cwksp_reserve_object(
                    &cdict->workspace, ZSTD_cwksp_align(dictSize, sizeof(void*)));
            RETURN_ERROR_IF(!internalBuffer, memory_allocation, "NULL pointer!");
            ZSTD_memcpy(internalBuffer, dictBuffer, dictSize);
            cdict->dictContent = internalBuffer;
        } else {
            /* by reference, or nothing to copy : keep the caller's pointer */
            cdict->dictContent = dictBuffer;
        }
    }
    cdict->dictContentSize = dictSize;
    cdict->dictContentType = dictContentType;

    cdict->entropyWorkspace =
            (U32*)ZSTD_cwksp_reserve_object(&cdict->workspace, HUF_WORKSPACE_SIZE);

    /* Reset the state to no dictionary */
    ZSTD_reset_compressedBlockState(&cdict->cBlockState);
    FORWARD_IF_ERROR(ZSTD_reset_matchState(
        &cdict->matchState,
        &cdict->workspace,
        &params.cParams,
        ZSTDcrp_makeClean,
        ZSTDirp_reset,
        ZSTD_resetTarget_CDict), "");

    /* (Maybe) load the dictionary
     * Skips loading the dictionary if it is < 8 bytes.
     */
    params.compressionLevel = ZSTD_CLEVEL_DEFAULT;
    params.fParams.contentSizeFlag = 1;
    {   size_t const dictID = ZSTD_compress_insertDictionary(
                &cdict->cBlockState, &cdict->matchState, NULL, &cdict->workspace,
                &params, cdict->dictContent, cdict->dictContentSize,
                dictContentType, ZSTD_dtlm_full, cdict->entropyWorkspace);
        FORWARD_IF_ERROR(dictID, "ZSTD_compress_insertDictionary failed");
        assert(dictID <= (size_t)(U32)-1);
        cdict->dictID = (U32)dictID;
    }

    return 0;
}
3673*a28cd43dSSascha Wildner
ZSTD_createCDict_advanced_internal(size_t dictSize,ZSTD_dictLoadMethod_e dictLoadMethod,ZSTD_compressionParameters cParams,ZSTD_customMem customMem)3674*a28cd43dSSascha Wildner static ZSTD_CDict* ZSTD_createCDict_advanced_internal(size_t dictSize,
3675*a28cd43dSSascha Wildner ZSTD_dictLoadMethod_e dictLoadMethod,
3676*a28cd43dSSascha Wildner ZSTD_compressionParameters cParams, ZSTD_customMem customMem)
3677*a28cd43dSSascha Wildner {
3678*a28cd43dSSascha Wildner if ((!customMem.customAlloc) ^ (!customMem.customFree)) return NULL;
3679*a28cd43dSSascha Wildner
3680*a28cd43dSSascha Wildner { size_t const workspaceSize =
3681*a28cd43dSSascha Wildner ZSTD_cwksp_alloc_size(sizeof(ZSTD_CDict)) +
3682*a28cd43dSSascha Wildner ZSTD_cwksp_alloc_size(HUF_WORKSPACE_SIZE) +
3683*a28cd43dSSascha Wildner ZSTD_sizeof_matchState(&cParams, /* forCCtx */ 0) +
3684*a28cd43dSSascha Wildner (dictLoadMethod == ZSTD_dlm_byRef ? 0
3685*a28cd43dSSascha Wildner : ZSTD_cwksp_alloc_size(ZSTD_cwksp_align(dictSize, sizeof(void*))));
3686*a28cd43dSSascha Wildner void* const workspace = ZSTD_customMalloc(workspaceSize, customMem);
3687*a28cd43dSSascha Wildner ZSTD_cwksp ws;
3688*a28cd43dSSascha Wildner ZSTD_CDict* cdict;
3689*a28cd43dSSascha Wildner
3690*a28cd43dSSascha Wildner if (!workspace) {
3691*a28cd43dSSascha Wildner ZSTD_customFree(workspace, customMem);
3692*a28cd43dSSascha Wildner return NULL;
3693*a28cd43dSSascha Wildner }
3694*a28cd43dSSascha Wildner
3695*a28cd43dSSascha Wildner ZSTD_cwksp_init(&ws, workspace, workspaceSize, ZSTD_cwksp_dynamic_alloc);
3696*a28cd43dSSascha Wildner
3697*a28cd43dSSascha Wildner cdict = (ZSTD_CDict*)ZSTD_cwksp_reserve_object(&ws, sizeof(ZSTD_CDict));
3698*a28cd43dSSascha Wildner assert(cdict != NULL);
3699*a28cd43dSSascha Wildner ZSTD_cwksp_move(&cdict->workspace, &ws);
3700*a28cd43dSSascha Wildner cdict->customMem = customMem;
3701*a28cd43dSSascha Wildner cdict->compressionLevel = 0; /* signals advanced API usage */
3702*a28cd43dSSascha Wildner
3703*a28cd43dSSascha Wildner return cdict;
3704*a28cd43dSSascha Wildner }
3705*a28cd43dSSascha Wildner }
3706*a28cd43dSSascha Wildner
ZSTD_createCDict_advanced(const void * dictBuffer,size_t dictSize,ZSTD_dictLoadMethod_e dictLoadMethod,ZSTD_dictContentType_e dictContentType,ZSTD_compressionParameters cParams,ZSTD_customMem customMem)3707*a28cd43dSSascha Wildner ZSTD_CDict* ZSTD_createCDict_advanced(const void* dictBuffer, size_t dictSize,
3708*a28cd43dSSascha Wildner ZSTD_dictLoadMethod_e dictLoadMethod,
3709*a28cd43dSSascha Wildner ZSTD_dictContentType_e dictContentType,
3710*a28cd43dSSascha Wildner ZSTD_compressionParameters cParams,
3711*a28cd43dSSascha Wildner ZSTD_customMem customMem)
3712*a28cd43dSSascha Wildner {
3713*a28cd43dSSascha Wildner ZSTD_CCtx_params cctxParams;
3714*a28cd43dSSascha Wildner ZSTD_memset(&cctxParams, 0, sizeof(cctxParams));
3715*a28cd43dSSascha Wildner ZSTD_CCtxParams_init(&cctxParams, 0);
3716*a28cd43dSSascha Wildner cctxParams.cParams = cParams;
3717*a28cd43dSSascha Wildner cctxParams.customMem = customMem;
3718*a28cd43dSSascha Wildner return ZSTD_createCDict_advanced2(
3719*a28cd43dSSascha Wildner dictBuffer, dictSize,
3720*a28cd43dSSascha Wildner dictLoadMethod, dictContentType,
3721*a28cd43dSSascha Wildner &cctxParams, customMem);
3722*a28cd43dSSascha Wildner }
3723*a28cd43dSSascha Wildner
ZSTD_createCDict_advanced2(const void * dict,size_t dictSize,ZSTD_dictLoadMethod_e dictLoadMethod,ZSTD_dictContentType_e dictContentType,const ZSTD_CCtx_params * originalCctxParams,ZSTD_customMem customMem)3724*a28cd43dSSascha Wildner ZSTDLIB_API ZSTD_CDict* ZSTD_createCDict_advanced2(
3725*a28cd43dSSascha Wildner const void* dict, size_t dictSize,
3726*a28cd43dSSascha Wildner ZSTD_dictLoadMethod_e dictLoadMethod,
3727*a28cd43dSSascha Wildner ZSTD_dictContentType_e dictContentType,
3728*a28cd43dSSascha Wildner const ZSTD_CCtx_params* originalCctxParams,
3729*a28cd43dSSascha Wildner ZSTD_customMem customMem)
3730*a28cd43dSSascha Wildner {
3731*a28cd43dSSascha Wildner ZSTD_CCtx_params cctxParams = *originalCctxParams;
3732*a28cd43dSSascha Wildner ZSTD_compressionParameters cParams;
3733*a28cd43dSSascha Wildner ZSTD_CDict* cdict;
3734*a28cd43dSSascha Wildner
3735*a28cd43dSSascha Wildner DEBUGLOG(3, "ZSTD_createCDict_advanced2, mode %u", (unsigned)dictContentType);
3736*a28cd43dSSascha Wildner if (!customMem.customAlloc ^ !customMem.customFree) return NULL;
3737*a28cd43dSSascha Wildner
3738*a28cd43dSSascha Wildner if (cctxParams.enableDedicatedDictSearch) {
3739*a28cd43dSSascha Wildner cParams = ZSTD_dedicatedDictSearch_getCParams(
3740*a28cd43dSSascha Wildner cctxParams.compressionLevel, dictSize);
3741*a28cd43dSSascha Wildner ZSTD_overrideCParams(&cParams, &cctxParams.cParams);
3742*a28cd43dSSascha Wildner } else {
3743*a28cd43dSSascha Wildner cParams = ZSTD_getCParamsFromCCtxParams(
3744*a28cd43dSSascha Wildner &cctxParams, ZSTD_CONTENTSIZE_UNKNOWN, dictSize, ZSTD_cpm_createCDict);
3745*a28cd43dSSascha Wildner }
3746*a28cd43dSSascha Wildner
3747*a28cd43dSSascha Wildner if (!ZSTD_dedicatedDictSearch_isSupported(&cParams)) {
3748*a28cd43dSSascha Wildner /* Fall back to non-DDSS params */
3749*a28cd43dSSascha Wildner cctxParams.enableDedicatedDictSearch = 0;
3750*a28cd43dSSascha Wildner cParams = ZSTD_getCParamsFromCCtxParams(
3751*a28cd43dSSascha Wildner &cctxParams, ZSTD_CONTENTSIZE_UNKNOWN, dictSize, ZSTD_cpm_createCDict);
3752*a28cd43dSSascha Wildner }
3753*a28cd43dSSascha Wildner
3754*a28cd43dSSascha Wildner cctxParams.cParams = cParams;
3755*a28cd43dSSascha Wildner
3756*a28cd43dSSascha Wildner cdict = ZSTD_createCDict_advanced_internal(dictSize,
3757*a28cd43dSSascha Wildner dictLoadMethod, cctxParams.cParams,
3758*a28cd43dSSascha Wildner customMem);
3759*a28cd43dSSascha Wildner
3760*a28cd43dSSascha Wildner if (ZSTD_isError( ZSTD_initCDict_internal(cdict,
3761*a28cd43dSSascha Wildner dict, dictSize,
3762*a28cd43dSSascha Wildner dictLoadMethod, dictContentType,
3763*a28cd43dSSascha Wildner cctxParams) )) {
3764*a28cd43dSSascha Wildner ZSTD_freeCDict(cdict);
3765*a28cd43dSSascha Wildner return NULL;
3766*a28cd43dSSascha Wildner }
3767*a28cd43dSSascha Wildner
3768*a28cd43dSSascha Wildner return cdict;
3769*a28cd43dSSascha Wildner }
3770*a28cd43dSSascha Wildner
ZSTD_createCDict(const void * dict,size_t dictSize,int compressionLevel)3771*a28cd43dSSascha Wildner ZSTD_CDict* ZSTD_createCDict(const void* dict, size_t dictSize, int compressionLevel)
3772*a28cd43dSSascha Wildner {
3773*a28cd43dSSascha Wildner ZSTD_compressionParameters cParams = ZSTD_getCParams_internal(compressionLevel, ZSTD_CONTENTSIZE_UNKNOWN, dictSize, ZSTD_cpm_createCDict);
3774*a28cd43dSSascha Wildner ZSTD_CDict* const cdict = ZSTD_createCDict_advanced(dict, dictSize,
3775*a28cd43dSSascha Wildner ZSTD_dlm_byCopy, ZSTD_dct_auto,
3776*a28cd43dSSascha Wildner cParams, ZSTD_defaultCMem);
3777*a28cd43dSSascha Wildner if (cdict)
3778*a28cd43dSSascha Wildner cdict->compressionLevel = (compressionLevel == 0) ? ZSTD_CLEVEL_DEFAULT : compressionLevel;
3779*a28cd43dSSascha Wildner return cdict;
3780*a28cd43dSSascha Wildner }
3781*a28cd43dSSascha Wildner
ZSTD_createCDict_byReference(const void * dict,size_t dictSize,int compressionLevel)3782*a28cd43dSSascha Wildner ZSTD_CDict* ZSTD_createCDict_byReference(const void* dict, size_t dictSize, int compressionLevel)
3783*a28cd43dSSascha Wildner {
3784*a28cd43dSSascha Wildner ZSTD_compressionParameters cParams = ZSTD_getCParams_internal(compressionLevel, ZSTD_CONTENTSIZE_UNKNOWN, dictSize, ZSTD_cpm_createCDict);
3785*a28cd43dSSascha Wildner ZSTD_CDict* const cdict = ZSTD_createCDict_advanced(dict, dictSize,
3786*a28cd43dSSascha Wildner ZSTD_dlm_byRef, ZSTD_dct_auto,
3787*a28cd43dSSascha Wildner cParams, ZSTD_defaultCMem);
3788*a28cd43dSSascha Wildner if (cdict)
3789*a28cd43dSSascha Wildner cdict->compressionLevel = (compressionLevel == 0) ? ZSTD_CLEVEL_DEFAULT : compressionLevel;
3790*a28cd43dSSascha Wildner return cdict;
3791*a28cd43dSSascha Wildner }
3792*a28cd43dSSascha Wildner
/*! ZSTD_freeCDict() :
 *  Releases the cdict's workspace and, when the ZSTD_CDict structure is not
 *  itself stored inside that workspace, the structure as well.
 *  Accepts NULL.
 * @return : 0 */
size_t ZSTD_freeCDict(ZSTD_CDict* cdict)
{
    ZSTD_customMem cMem;
    int cdictInWorkspace;

    if (cdict==NULL) return 0;   /* support free on NULL */

    /* Both values are read before the workspace is freed,
     * since cdict may be located inside that workspace. */
    cMem = cdict->customMem;
    cdictInWorkspace = ZSTD_cwksp_owns_buffer(&cdict->workspace, cdict);

    ZSTD_cwksp_free(&cdict->workspace, cMem);
    if (!cdictInWorkspace) {
        ZSTD_customFree(cdict, cMem);
    }
    return 0;
}
3805*a28cd43dSSascha Wildner
3806*a28cd43dSSascha Wildner /*! ZSTD_initStaticCDict_advanced() :
3807*a28cd43dSSascha Wildner * Generate a digested dictionary in provided memory area.
3808*a28cd43dSSascha Wildner * workspace: The memory area to emplace the dictionary into.
3809*a28cd43dSSascha Wildner * Provided pointer must 8-bytes aligned.
3810*a28cd43dSSascha Wildner * It must outlive dictionary usage.
3811*a28cd43dSSascha Wildner * workspaceSize: Use ZSTD_estimateCDictSize()
3812*a28cd43dSSascha Wildner * to determine how large workspace must be.
3813*a28cd43dSSascha Wildner * cParams : use ZSTD_getCParams() to transform a compression level
3814*a28cd43dSSascha Wildner * into its relevants cParams.
3815*a28cd43dSSascha Wildner * @return : pointer to ZSTD_CDict*, or NULL if error (size too small)
3816*a28cd43dSSascha Wildner * Note : there is no corresponding "free" function.
3817*a28cd43dSSascha Wildner * Since workspace was allocated externally, it must be freed externally.
3818*a28cd43dSSascha Wildner */
ZSTD_initStaticCDict(void * workspace,size_t workspaceSize,const void * dict,size_t dictSize,ZSTD_dictLoadMethod_e dictLoadMethod,ZSTD_dictContentType_e dictContentType,ZSTD_compressionParameters cParams)3819*a28cd43dSSascha Wildner const ZSTD_CDict* ZSTD_initStaticCDict(
3820*a28cd43dSSascha Wildner void* workspace, size_t workspaceSize,
3821*a28cd43dSSascha Wildner const void* dict, size_t dictSize,
3822*a28cd43dSSascha Wildner ZSTD_dictLoadMethod_e dictLoadMethod,
3823*a28cd43dSSascha Wildner ZSTD_dictContentType_e dictContentType,
3824*a28cd43dSSascha Wildner ZSTD_compressionParameters cParams)
3825*a28cd43dSSascha Wildner {
3826*a28cd43dSSascha Wildner size_t const matchStateSize = ZSTD_sizeof_matchState(&cParams, /* forCCtx */ 0);
3827*a28cd43dSSascha Wildner size_t const neededSize = ZSTD_cwksp_alloc_size(sizeof(ZSTD_CDict))
3828*a28cd43dSSascha Wildner + (dictLoadMethod == ZSTD_dlm_byRef ? 0
3829*a28cd43dSSascha Wildner : ZSTD_cwksp_alloc_size(ZSTD_cwksp_align(dictSize, sizeof(void*))))
3830*a28cd43dSSascha Wildner + ZSTD_cwksp_alloc_size(HUF_WORKSPACE_SIZE)
3831*a28cd43dSSascha Wildner + matchStateSize;
3832*a28cd43dSSascha Wildner ZSTD_CDict* cdict;
3833*a28cd43dSSascha Wildner ZSTD_CCtx_params params;
3834*a28cd43dSSascha Wildner
3835*a28cd43dSSascha Wildner if ((size_t)workspace & 7) return NULL; /* 8-aligned */
3836*a28cd43dSSascha Wildner
3837*a28cd43dSSascha Wildner {
3838*a28cd43dSSascha Wildner ZSTD_cwksp ws;
3839*a28cd43dSSascha Wildner ZSTD_cwksp_init(&ws, workspace, workspaceSize, ZSTD_cwksp_static_alloc);
3840*a28cd43dSSascha Wildner cdict = (ZSTD_CDict*)ZSTD_cwksp_reserve_object(&ws, sizeof(ZSTD_CDict));
3841*a28cd43dSSascha Wildner if (cdict == NULL) return NULL;
3842*a28cd43dSSascha Wildner ZSTD_cwksp_move(&cdict->workspace, &ws);
3843*a28cd43dSSascha Wildner }
3844*a28cd43dSSascha Wildner
3845*a28cd43dSSascha Wildner DEBUGLOG(4, "(workspaceSize < neededSize) : (%u < %u) => %u",
3846*a28cd43dSSascha Wildner (unsigned)workspaceSize, (unsigned)neededSize, (unsigned)(workspaceSize < neededSize));
3847*a28cd43dSSascha Wildner if (workspaceSize < neededSize) return NULL;
3848*a28cd43dSSascha Wildner
3849*a28cd43dSSascha Wildner ZSTD_CCtxParams_init(¶ms, 0);
3850*a28cd43dSSascha Wildner params.cParams = cParams;
3851*a28cd43dSSascha Wildner
3852*a28cd43dSSascha Wildner if (ZSTD_isError( ZSTD_initCDict_internal(cdict,
3853*a28cd43dSSascha Wildner dict, dictSize,
3854*a28cd43dSSascha Wildner dictLoadMethod, dictContentType,
3855*a28cd43dSSascha Wildner params) ))
3856*a28cd43dSSascha Wildner return NULL;
3857*a28cd43dSSascha Wildner
3858*a28cd43dSSascha Wildner return cdict;
3859*a28cd43dSSascha Wildner }
3860*a28cd43dSSascha Wildner
ZSTD_getCParamsFromCDict(const ZSTD_CDict * cdict)3861*a28cd43dSSascha Wildner ZSTD_compressionParameters ZSTD_getCParamsFromCDict(const ZSTD_CDict* cdict)
3862*a28cd43dSSascha Wildner {
3863*a28cd43dSSascha Wildner assert(cdict != NULL);
3864*a28cd43dSSascha Wildner return cdict->matchState.cParams;
3865*a28cd43dSSascha Wildner }
3866*a28cd43dSSascha Wildner
3867*a28cd43dSSascha Wildner /*! ZSTD_getDictID_fromCDict() :
3868*a28cd43dSSascha Wildner * Provides the dictID of the dictionary loaded into `cdict`.
3869*a28cd43dSSascha Wildner * If @return == 0, the dictionary is not conformant to Zstandard specification, or empty.
3870*a28cd43dSSascha Wildner * Non-conformant dictionaries can still be loaded, but as content-only dictionaries. */
ZSTD_getDictID_fromCDict(const ZSTD_CDict * cdict)3871*a28cd43dSSascha Wildner unsigned ZSTD_getDictID_fromCDict(const ZSTD_CDict* cdict)
3872*a28cd43dSSascha Wildner {
3873*a28cd43dSSascha Wildner if (cdict==NULL) return 0;
3874*a28cd43dSSascha Wildner return cdict->dictID;
3875*a28cd43dSSascha Wildner }
3876*a28cd43dSSascha Wildner
3877*a28cd43dSSascha Wildner
3878*a28cd43dSSascha Wildner /* ZSTD_compressBegin_usingCDict_advanced() :
3879*a28cd43dSSascha Wildner * cdict must be != NULL */
ZSTD_compressBegin_usingCDict_advanced(ZSTD_CCtx * const cctx,const ZSTD_CDict * const cdict,ZSTD_frameParameters const fParams,unsigned long long const pledgedSrcSize)3880*a28cd43dSSascha Wildner size_t ZSTD_compressBegin_usingCDict_advanced(
3881*a28cd43dSSascha Wildner ZSTD_CCtx* const cctx, const ZSTD_CDict* const cdict,
3882*a28cd43dSSascha Wildner ZSTD_frameParameters const fParams, unsigned long long const pledgedSrcSize)
3883*a28cd43dSSascha Wildner {
3884*a28cd43dSSascha Wildner DEBUGLOG(4, "ZSTD_compressBegin_usingCDict_advanced");
3885*a28cd43dSSascha Wildner RETURN_ERROR_IF(cdict==NULL, dictionary_wrong, "NULL pointer!");
3886*a28cd43dSSascha Wildner { ZSTD_CCtx_params params = cctx->requestedParams;
3887*a28cd43dSSascha Wildner params.cParams = ( pledgedSrcSize < ZSTD_USE_CDICT_PARAMS_SRCSIZE_CUTOFF
3888*a28cd43dSSascha Wildner || pledgedSrcSize < cdict->dictContentSize * ZSTD_USE_CDICT_PARAMS_DICTSIZE_MULTIPLIER
3889*a28cd43dSSascha Wildner || pledgedSrcSize == ZSTD_CONTENTSIZE_UNKNOWN
3890*a28cd43dSSascha Wildner || cdict->compressionLevel == 0 )
3891*a28cd43dSSascha Wildner && (params.attachDictPref != ZSTD_dictForceLoad) ?
3892*a28cd43dSSascha Wildner ZSTD_getCParamsFromCDict(cdict)
3893*a28cd43dSSascha Wildner : ZSTD_getCParams(cdict->compressionLevel,
3894*a28cd43dSSascha Wildner pledgedSrcSize,
3895*a28cd43dSSascha Wildner cdict->dictContentSize);
3896*a28cd43dSSascha Wildner /* Increase window log to fit the entire dictionary and source if the
3897*a28cd43dSSascha Wildner * source size is known. Limit the increase to 19, which is the
3898*a28cd43dSSascha Wildner * window log for compression level 1 with the largest source size.
3899*a28cd43dSSascha Wildner */
3900*a28cd43dSSascha Wildner if (pledgedSrcSize != ZSTD_CONTENTSIZE_UNKNOWN) {
3901*a28cd43dSSascha Wildner U32 const limitedSrcSize = (U32)MIN(pledgedSrcSize, 1U << 19);
3902*a28cd43dSSascha Wildner U32 const limitedSrcLog = limitedSrcSize > 1 ? ZSTD_highbit32(limitedSrcSize - 1) + 1 : 1;
3903*a28cd43dSSascha Wildner params.cParams.windowLog = MAX(params.cParams.windowLog, limitedSrcLog);
3904*a28cd43dSSascha Wildner }
3905*a28cd43dSSascha Wildner params.fParams = fParams;
3906*a28cd43dSSascha Wildner return ZSTD_compressBegin_internal(cctx,
3907*a28cd43dSSascha Wildner NULL, 0, ZSTD_dct_auto, ZSTD_dtlm_fast,
3908*a28cd43dSSascha Wildner cdict,
3909*a28cd43dSSascha Wildner ¶ms, pledgedSrcSize,
3910*a28cd43dSSascha Wildner ZSTDb_not_buffered);
3911*a28cd43dSSascha Wildner }
3912*a28cd43dSSascha Wildner }
3913*a28cd43dSSascha Wildner
3914*a28cd43dSSascha Wildner /* ZSTD_compressBegin_usingCDict() :
3915*a28cd43dSSascha Wildner * pledgedSrcSize=0 means "unknown"
3916*a28cd43dSSascha Wildner * if pledgedSrcSize>0, it will enable contentSizeFlag */
ZSTD_compressBegin_usingCDict(ZSTD_CCtx * cctx,const ZSTD_CDict * cdict)3917*a28cd43dSSascha Wildner size_t ZSTD_compressBegin_usingCDict(ZSTD_CCtx* cctx, const ZSTD_CDict* cdict)
3918*a28cd43dSSascha Wildner {
3919*a28cd43dSSascha Wildner ZSTD_frameParameters const fParams = { 0 /*content*/, 0 /*checksum*/, 0 /*noDictID*/ };
3920*a28cd43dSSascha Wildner DEBUGLOG(4, "ZSTD_compressBegin_usingCDict : dictIDFlag == %u", !fParams.noDictIDFlag);
3921*a28cd43dSSascha Wildner return ZSTD_compressBegin_usingCDict_advanced(cctx, cdict, fParams, ZSTD_CONTENTSIZE_UNKNOWN);
3922*a28cd43dSSascha Wildner }
3923*a28cd43dSSascha Wildner
/* ZSTD_compress_usingCDict_advanced() :
 * One-shot compression of `src` into `dst` using `cdict` and explicit frame parameters.
 * The session is started with srcSize as the pledged size, then completed in one call.
 * @return : result of ZSTD_compressEnd(), or the error produced while starting the session. */
size_t ZSTD_compress_usingCDict_advanced(ZSTD_CCtx* cctx,
                                void* dst, size_t dstCapacity,
                                const void* src, size_t srcSize,
                                const ZSTD_CDict* cdict, ZSTD_frameParameters fParams)
{
    /* the begin function checks that cdict != NULL */
    size_t const beginStatus = ZSTD_compressBegin_usingCDict_advanced(cctx, cdict, fParams, srcSize);
    FORWARD_IF_ERROR(beginStatus, "");
    return ZSTD_compressEnd(cctx, dst, dstCapacity, src, srcSize);
}
3932*a28cd43dSSascha Wildner
3933*a28cd43dSSascha Wildner /*! ZSTD_compress_usingCDict() :
3934*a28cd43dSSascha Wildner * Compression using a digested Dictionary.
3935*a28cd43dSSascha Wildner * Faster startup than ZSTD_compress_usingDict(), recommended when same dictionary is used multiple times.
3936*a28cd43dSSascha Wildner * Note that compression parameters are decided at CDict creation time
3937*a28cd43dSSascha Wildner * while frame parameters are hardcoded */
ZSTD_compress_usingCDict(ZSTD_CCtx * cctx,void * dst,size_t dstCapacity,const void * src,size_t srcSize,const ZSTD_CDict * cdict)3938*a28cd43dSSascha Wildner size_t ZSTD_compress_usingCDict(ZSTD_CCtx* cctx,
3939*a28cd43dSSascha Wildner void* dst, size_t dstCapacity,
3940*a28cd43dSSascha Wildner const void* src, size_t srcSize,
3941*a28cd43dSSascha Wildner const ZSTD_CDict* cdict)
3942*a28cd43dSSascha Wildner {
3943*a28cd43dSSascha Wildner ZSTD_frameParameters const fParams = { 1 /*content*/, 0 /*checksum*/, 0 /*noDictID*/ };
3944*a28cd43dSSascha Wildner return ZSTD_compress_usingCDict_advanced(cctx, dst, dstCapacity, src, srcSize, cdict, fParams);
3945*a28cd43dSSascha Wildner }
3946*a28cd43dSSascha Wildner
3947*a28cd43dSSascha Wildner
3948*a28cd43dSSascha Wildner
3949*a28cd43dSSascha Wildner /* ******************************************************************
3950*a28cd43dSSascha Wildner * Streaming
3951*a28cd43dSSascha Wildner ********************************************************************/
3952*a28cd43dSSascha Wildner
ZSTD_createCStream(void)3953*a28cd43dSSascha Wildner ZSTD_CStream* ZSTD_createCStream(void)
3954*a28cd43dSSascha Wildner {
3955*a28cd43dSSascha Wildner DEBUGLOG(3, "ZSTD_createCStream");
3956*a28cd43dSSascha Wildner return ZSTD_createCStream_advanced(ZSTD_defaultCMem);
3957*a28cd43dSSascha Wildner }
3958*a28cd43dSSascha Wildner
ZSTD_initStaticCStream(void * workspace,size_t workspaceSize)3959*a28cd43dSSascha Wildner ZSTD_CStream* ZSTD_initStaticCStream(void *workspace, size_t workspaceSize)
3960*a28cd43dSSascha Wildner {
3961*a28cd43dSSascha Wildner return ZSTD_initStaticCCtx(workspace, workspaceSize);
3962*a28cd43dSSascha Wildner }
3963*a28cd43dSSascha Wildner
ZSTD_createCStream_advanced(ZSTD_customMem customMem)3964*a28cd43dSSascha Wildner ZSTD_CStream* ZSTD_createCStream_advanced(ZSTD_customMem customMem)
3965*a28cd43dSSascha Wildner { /* CStream and CCtx are now same object */
3966*a28cd43dSSascha Wildner return ZSTD_createCCtx_advanced(customMem);
3967*a28cd43dSSascha Wildner }
3968*a28cd43dSSascha Wildner
/* ZSTD_freeCStream() :
 * A CStream is the same object as a CCtx : release it through ZSTD_freeCCtx().
 * @return : result of ZSTD_freeCCtx(). */
size_t ZSTD_freeCStream(ZSTD_CStream* zcs)
{
    size_t const freeResult = ZSTD_freeCCtx(zcs);
    return freeResult;
}
3973*a28cd43dSSascha Wildner
3974*a28cd43dSSascha Wildner
3975*a28cd43dSSascha Wildner
3976*a28cd43dSSascha Wildner /*====== Initialization ======*/
3977*a28cd43dSSascha Wildner
ZSTD_CStreamInSize(void)3978*a28cd43dSSascha Wildner size_t ZSTD_CStreamInSize(void) { return ZSTD_BLOCKSIZE_MAX; }
3979*a28cd43dSSascha Wildner
ZSTD_CStreamOutSize(void)3980*a28cd43dSSascha Wildner size_t ZSTD_CStreamOutSize(void)
3981*a28cd43dSSascha Wildner {
3982*a28cd43dSSascha Wildner return ZSTD_compressBound(ZSTD_BLOCKSIZE_MAX) + ZSTD_blockHeaderSize + 4 /* 32-bits hash */ ;
3983*a28cd43dSSascha Wildner }
3984*a28cd43dSSascha Wildner
ZSTD_getCParamMode(ZSTD_CDict const * cdict,ZSTD_CCtx_params const * params,U64 pledgedSrcSize)3985*a28cd43dSSascha Wildner static ZSTD_cParamMode_e ZSTD_getCParamMode(ZSTD_CDict const* cdict, ZSTD_CCtx_params const* params, U64 pledgedSrcSize)
3986*a28cd43dSSascha Wildner {
3987*a28cd43dSSascha Wildner if (cdict != NULL && ZSTD_shouldAttachDict(cdict, params, pledgedSrcSize))
3988*a28cd43dSSascha Wildner return ZSTD_cpm_attachDict;
3989*a28cd43dSSascha Wildner else
3990*a28cd43dSSascha Wildner return ZSTD_cpm_noAttachDict;
3991*a28cd43dSSascha Wildner }
3992*a28cd43dSSascha Wildner
3993*a28cd43dSSascha Wildner /* ZSTD_resetCStream():
3994*a28cd43dSSascha Wildner * pledgedSrcSize == 0 means "unknown" */
ZSTD_resetCStream(ZSTD_CStream * zcs,unsigned long long pss)3995*a28cd43dSSascha Wildner size_t ZSTD_resetCStream(ZSTD_CStream* zcs, unsigned long long pss)
3996*a28cd43dSSascha Wildner {
3997*a28cd43dSSascha Wildner /* temporary : 0 interpreted as "unknown" during transition period.
3998*a28cd43dSSascha Wildner * Users willing to specify "unknown" **must** use ZSTD_CONTENTSIZE_UNKNOWN.
3999*a28cd43dSSascha Wildner * 0 will be interpreted as "empty" in the future.
4000*a28cd43dSSascha Wildner */
4001*a28cd43dSSascha Wildner U64 const pledgedSrcSize = (pss==0) ? ZSTD_CONTENTSIZE_UNKNOWN : pss;
4002*a28cd43dSSascha Wildner DEBUGLOG(4, "ZSTD_resetCStream: pledgedSrcSize = %u", (unsigned)pledgedSrcSize);
4003*a28cd43dSSascha Wildner FORWARD_IF_ERROR( ZSTD_CCtx_reset(zcs, ZSTD_reset_session_only) , "");
4004*a28cd43dSSascha Wildner FORWARD_IF_ERROR( ZSTD_CCtx_setPledgedSrcSize(zcs, pledgedSrcSize) , "");
4005*a28cd43dSSascha Wildner return 0;
4006*a28cd43dSSascha Wildner }
4007*a28cd43dSSascha Wildner
4008*a28cd43dSSascha Wildner /*! ZSTD_initCStream_internal() :
4009*a28cd43dSSascha Wildner * Note : for lib/compress only. Used by zstdmt_compress.c.
4010*a28cd43dSSascha Wildner * Assumption 1 : params are valid
4011*a28cd43dSSascha Wildner * Assumption 2 : either dict, or cdict, is defined, not both */
ZSTD_initCStream_internal(ZSTD_CStream * zcs,const void * dict,size_t dictSize,const ZSTD_CDict * cdict,const ZSTD_CCtx_params * params,unsigned long long pledgedSrcSize)4012*a28cd43dSSascha Wildner size_t ZSTD_initCStream_internal(ZSTD_CStream* zcs,
4013*a28cd43dSSascha Wildner const void* dict, size_t dictSize, const ZSTD_CDict* cdict,
4014*a28cd43dSSascha Wildner const ZSTD_CCtx_params* params,
4015*a28cd43dSSascha Wildner unsigned long long pledgedSrcSize)
4016*a28cd43dSSascha Wildner {
4017*a28cd43dSSascha Wildner DEBUGLOG(4, "ZSTD_initCStream_internal");
4018*a28cd43dSSascha Wildner FORWARD_IF_ERROR( ZSTD_CCtx_reset(zcs, ZSTD_reset_session_only) , "");
4019*a28cd43dSSascha Wildner FORWARD_IF_ERROR( ZSTD_CCtx_setPledgedSrcSize(zcs, pledgedSrcSize) , "");
4020*a28cd43dSSascha Wildner assert(!ZSTD_isError(ZSTD_checkCParams(params->cParams)));
4021*a28cd43dSSascha Wildner zcs->requestedParams = *params;
4022*a28cd43dSSascha Wildner assert(!((dict) && (cdict))); /* either dict or cdict, not both */
4023*a28cd43dSSascha Wildner if (dict) {
4024*a28cd43dSSascha Wildner FORWARD_IF_ERROR( ZSTD_CCtx_loadDictionary(zcs, dict, dictSize) , "");
4025*a28cd43dSSascha Wildner } else {
4026*a28cd43dSSascha Wildner /* Dictionary is cleared if !cdict */
4027*a28cd43dSSascha Wildner FORWARD_IF_ERROR( ZSTD_CCtx_refCDict(zcs, cdict) , "");
4028*a28cd43dSSascha Wildner }
4029*a28cd43dSSascha Wildner return 0;
4030*a28cd43dSSascha Wildner }
4031*a28cd43dSSascha Wildner
4032*a28cd43dSSascha Wildner /* ZSTD_initCStream_usingCDict_advanced() :
4033*a28cd43dSSascha Wildner * same as ZSTD_initCStream_usingCDict(), with control over frame parameters */
ZSTD_initCStream_usingCDict_advanced(ZSTD_CStream * zcs,const ZSTD_CDict * cdict,ZSTD_frameParameters fParams,unsigned long long pledgedSrcSize)4034*a28cd43dSSascha Wildner size_t ZSTD_initCStream_usingCDict_advanced(ZSTD_CStream* zcs,
4035*a28cd43dSSascha Wildner const ZSTD_CDict* cdict,
4036*a28cd43dSSascha Wildner ZSTD_frameParameters fParams,
4037*a28cd43dSSascha Wildner unsigned long long pledgedSrcSize)
4038*a28cd43dSSascha Wildner {
4039*a28cd43dSSascha Wildner DEBUGLOG(4, "ZSTD_initCStream_usingCDict_advanced");
4040*a28cd43dSSascha Wildner FORWARD_IF_ERROR( ZSTD_CCtx_reset(zcs, ZSTD_reset_session_only) , "");
4041*a28cd43dSSascha Wildner FORWARD_IF_ERROR( ZSTD_CCtx_setPledgedSrcSize(zcs, pledgedSrcSize) , "");
4042*a28cd43dSSascha Wildner zcs->requestedParams.fParams = fParams;
4043*a28cd43dSSascha Wildner FORWARD_IF_ERROR( ZSTD_CCtx_refCDict(zcs, cdict) , "");
4044*a28cd43dSSascha Wildner return 0;
4045*a28cd43dSSascha Wildner }
4046*a28cd43dSSascha Wildner
4047*a28cd43dSSascha Wildner /* note : cdict must outlive compression session */
ZSTD_initCStream_usingCDict(ZSTD_CStream * zcs,const ZSTD_CDict * cdict)4048*a28cd43dSSascha Wildner size_t ZSTD_initCStream_usingCDict(ZSTD_CStream* zcs, const ZSTD_CDict* cdict)
4049*a28cd43dSSascha Wildner {
4050*a28cd43dSSascha Wildner DEBUGLOG(4, "ZSTD_initCStream_usingCDict");
4051*a28cd43dSSascha Wildner FORWARD_IF_ERROR( ZSTD_CCtx_reset(zcs, ZSTD_reset_session_only) , "");
4052*a28cd43dSSascha Wildner FORWARD_IF_ERROR( ZSTD_CCtx_refCDict(zcs, cdict) , "");
4053*a28cd43dSSascha Wildner return 0;
4054*a28cd43dSSascha Wildner }
4055*a28cd43dSSascha Wildner
4056*a28cd43dSSascha Wildner
4057*a28cd43dSSascha Wildner /* ZSTD_initCStream_advanced() :
4058*a28cd43dSSascha Wildner * pledgedSrcSize must be exact.
4059*a28cd43dSSascha Wildner * if srcSize is not known at init time, use value ZSTD_CONTENTSIZE_UNKNOWN.
4060*a28cd43dSSascha Wildner * dict is loaded with default parameters ZSTD_dct_auto and ZSTD_dlm_byCopy. */
ZSTD_initCStream_advanced(ZSTD_CStream * zcs,const void * dict,size_t dictSize,ZSTD_parameters params,unsigned long long pss)4061*a28cd43dSSascha Wildner size_t ZSTD_initCStream_advanced(ZSTD_CStream* zcs,
4062*a28cd43dSSascha Wildner const void* dict, size_t dictSize,
4063*a28cd43dSSascha Wildner ZSTD_parameters params, unsigned long long pss)
4064*a28cd43dSSascha Wildner {
4065*a28cd43dSSascha Wildner /* for compatibility with older programs relying on this behavior.
4066*a28cd43dSSascha Wildner * Users should now specify ZSTD_CONTENTSIZE_UNKNOWN.
4067*a28cd43dSSascha Wildner * This line will be removed in the future.
4068*a28cd43dSSascha Wildner */
4069*a28cd43dSSascha Wildner U64 const pledgedSrcSize = (pss==0 && params.fParams.contentSizeFlag==0) ? ZSTD_CONTENTSIZE_UNKNOWN : pss;
4070*a28cd43dSSascha Wildner DEBUGLOG(4, "ZSTD_initCStream_advanced");
4071*a28cd43dSSascha Wildner FORWARD_IF_ERROR( ZSTD_CCtx_reset(zcs, ZSTD_reset_session_only) , "");
4072*a28cd43dSSascha Wildner FORWARD_IF_ERROR( ZSTD_CCtx_setPledgedSrcSize(zcs, pledgedSrcSize) , "");
4073*a28cd43dSSascha Wildner FORWARD_IF_ERROR( ZSTD_checkCParams(params.cParams) , "");
4074*a28cd43dSSascha Wildner zcs->requestedParams = ZSTD_assignParamsToCCtxParams(&zcs->requestedParams, ¶ms);
4075*a28cd43dSSascha Wildner FORWARD_IF_ERROR( ZSTD_CCtx_loadDictionary(zcs, dict, dictSize) , "");
4076*a28cd43dSSascha Wildner return 0;
4077*a28cd43dSSascha Wildner }
4078*a28cd43dSSascha Wildner
/* ZSTD_initCStream_usingDict() :
 * Resets the session of `zcs`, sets the compression level, then loads `dict`.
 * @return : 0, or an error code forwarded from one of the steps. */
size_t ZSTD_initCStream_usingDict(ZSTD_CStream* zcs, const void* dict, size_t dictSize, int compressionLevel)
{
    DEBUGLOG(4, "ZSTD_initCStream_usingDict");
    {   size_t const resetStatus = ZSTD_CCtx_reset(zcs, ZSTD_reset_session_only);
        FORWARD_IF_ERROR(resetStatus, "");
    }
    {   size_t const levelStatus = ZSTD_CCtx_setParameter(zcs, ZSTD_c_compressionLevel, compressionLevel);
        FORWARD_IF_ERROR(levelStatus, "");
    }
    {   size_t const loadStatus = ZSTD_CCtx_loadDictionary(zcs, dict, dictSize);
        FORWARD_IF_ERROR(loadStatus, "");
    }
    return 0;
}
4087*a28cd43dSSascha Wildner
/* ZSTD_initCStream_srcSize() :
 * Resets the session of `zcs`, drops any referenced cdict, sets the compression
 * level, then records the pledged source size (pss == 0 means "unknown").
 * @return : 0, or an error code forwarded from one of the steps. */
size_t ZSTD_initCStream_srcSize(ZSTD_CStream* zcs, int compressionLevel, unsigned long long pss)
{
    /* temporary : 0 interpreted as "unknown" during transition period.
     * Users willing to specify "unknown" **must** use ZSTD_CONTENTSIZE_UNKNOWN.
     * 0 will be interpreted as "empty" in the future.
     */
    U64 const pledgedSrcSize = (pss != 0) ? pss : ZSTD_CONTENTSIZE_UNKNOWN;
    DEBUGLOG(4, "ZSTD_initCStream_srcSize");
    {   size_t const resetStatus = ZSTD_CCtx_reset(zcs, ZSTD_reset_session_only);
        FORWARD_IF_ERROR(resetStatus, "");
    }
    {   size_t const unrefStatus = ZSTD_CCtx_refCDict(zcs, NULL);
        FORWARD_IF_ERROR(unrefStatus, "");
    }
    {   size_t const levelStatus = ZSTD_CCtx_setParameter(zcs, ZSTD_c_compressionLevel, compressionLevel);
        FORWARD_IF_ERROR(levelStatus, "");
    }
    {   size_t const pledgeStatus = ZSTD_CCtx_setPledgedSrcSize(zcs, pledgedSrcSize);
        FORWARD_IF_ERROR(pledgeStatus, "");
    }
    return 0;
}
4102*a28cd43dSSascha Wildner
/* ZSTD_initCStream() :
 * Resets the session of `zcs`, drops any referenced cdict, then sets the compression level.
 * @return : 0, or an error code forwarded from one of the steps. */
size_t ZSTD_initCStream(ZSTD_CStream* zcs, int compressionLevel)
{
    DEBUGLOG(4, "ZSTD_initCStream");
    {   size_t const resetStatus = ZSTD_CCtx_reset(zcs, ZSTD_reset_session_only);
        FORWARD_IF_ERROR(resetStatus, "");
    }
    {   size_t const unrefStatus = ZSTD_CCtx_refCDict(zcs, NULL);
        FORWARD_IF_ERROR(unrefStatus, "");
    }
    {   size_t const levelStatus = ZSTD_CCtx_setParameter(zcs, ZSTD_c_compressionLevel, compressionLevel);
        FORWARD_IF_ERROR(levelStatus, "");
    }
    return 0;
}
4111*a28cd43dSSascha Wildner
4112*a28cd43dSSascha Wildner /*====== Compression ======*/
4113*a28cd43dSSascha Wildner
ZSTD_nextInputSizeHint(const ZSTD_CCtx * cctx)4114*a28cd43dSSascha Wildner static size_t ZSTD_nextInputSizeHint(const ZSTD_CCtx* cctx)
4115*a28cd43dSSascha Wildner {
4116*a28cd43dSSascha Wildner size_t hintInSize = cctx->inBuffTarget - cctx->inBuffPos;
4117*a28cd43dSSascha Wildner if (hintInSize==0) hintInSize = cctx->blockSize;
4118*a28cd43dSSascha Wildner return hintInSize;
4119*a28cd43dSSascha Wildner }
4120*a28cd43dSSascha Wildner
4121*a28cd43dSSascha Wildner /** ZSTD_compressStream_generic():
4122*a28cd43dSSascha Wildner * internal function for all *compressStream*() variants
4123*a28cd43dSSascha Wildner * non-static, because can be called from zstdmt_compress.c
4124*a28cd43dSSascha Wildner * @return : hint size for next input */
ZSTD_compressStream_generic(ZSTD_CStream * zcs,ZSTD_outBuffer * output,ZSTD_inBuffer * input,ZSTD_EndDirective const flushMode)4125*a28cd43dSSascha Wildner static size_t ZSTD_compressStream_generic(ZSTD_CStream* zcs,
4126*a28cd43dSSascha Wildner ZSTD_outBuffer* output,
4127*a28cd43dSSascha Wildner ZSTD_inBuffer* input,
4128*a28cd43dSSascha Wildner ZSTD_EndDirective const flushMode)
4129*a28cd43dSSascha Wildner {
4130*a28cd43dSSascha Wildner const char* const istart = (const char*)input->src;
4131*a28cd43dSSascha Wildner const char* const iend = input->size != 0 ? istart + input->size : istart;
4132*a28cd43dSSascha Wildner const char* ip = input->pos != 0 ? istart + input->pos : istart;
4133*a28cd43dSSascha Wildner char* const ostart = (char*)output->dst;
4134*a28cd43dSSascha Wildner char* const oend = output->size != 0 ? ostart + output->size : ostart;
4135*a28cd43dSSascha Wildner char* op = output->pos != 0 ? ostart + output->pos : ostart;
4136*a28cd43dSSascha Wildner U32 someMoreWork = 1;
4137*a28cd43dSSascha Wildner
4138*a28cd43dSSascha Wildner /* check expectations */
4139*a28cd43dSSascha Wildner DEBUGLOG(5, "ZSTD_compressStream_generic, flush=%u", (unsigned)flushMode);
4140*a28cd43dSSascha Wildner if (zcs->appliedParams.inBufferMode == ZSTD_bm_buffered) {
4141*a28cd43dSSascha Wildner assert(zcs->inBuff != NULL);
4142*a28cd43dSSascha Wildner assert(zcs->inBuffSize > 0);
4143*a28cd43dSSascha Wildner }
4144*a28cd43dSSascha Wildner if (zcs->appliedParams.outBufferMode == ZSTD_bm_buffered) {
4145*a28cd43dSSascha Wildner assert(zcs->outBuff != NULL);
4146*a28cd43dSSascha Wildner assert(zcs->outBuffSize > 0);
4147*a28cd43dSSascha Wildner }
4148*a28cd43dSSascha Wildner assert(output->pos <= output->size);
4149*a28cd43dSSascha Wildner assert(input->pos <= input->size);
4150*a28cd43dSSascha Wildner assert((U32)flushMode <= (U32)ZSTD_e_end);
4151*a28cd43dSSascha Wildner
4152*a28cd43dSSascha Wildner while (someMoreWork) {
4153*a28cd43dSSascha Wildner switch(zcs->streamStage)
4154*a28cd43dSSascha Wildner {
4155*a28cd43dSSascha Wildner case zcss_init:
4156*a28cd43dSSascha Wildner RETURN_ERROR(init_missing, "call ZSTD_initCStream() first!");
4157*a28cd43dSSascha Wildner
4158*a28cd43dSSascha Wildner case zcss_load:
4159*a28cd43dSSascha Wildner if ( (flushMode == ZSTD_e_end)
4160*a28cd43dSSascha Wildner && ( (size_t)(oend-op) >= ZSTD_compressBound(iend-ip) /* Enough output space */
4161*a28cd43dSSascha Wildner || zcs->appliedParams.outBufferMode == ZSTD_bm_stable) /* OR we are allowed to return dstSizeTooSmall */
4162*a28cd43dSSascha Wildner && (zcs->inBuffPos == 0) ) {
4163*a28cd43dSSascha Wildner /* shortcut to compression pass directly into output buffer */
4164*a28cd43dSSascha Wildner size_t const cSize = ZSTD_compressEnd(zcs,
4165*a28cd43dSSascha Wildner op, oend-op, ip, iend-ip);
4166*a28cd43dSSascha Wildner DEBUGLOG(4, "ZSTD_compressEnd : cSize=%u", (unsigned)cSize);
4167*a28cd43dSSascha Wildner FORWARD_IF_ERROR(cSize, "ZSTD_compressEnd failed");
4168*a28cd43dSSascha Wildner ip = iend;
4169*a28cd43dSSascha Wildner op += cSize;
4170*a28cd43dSSascha Wildner zcs->frameEnded = 1;
4171*a28cd43dSSascha Wildner ZSTD_CCtx_reset(zcs, ZSTD_reset_session_only);
4172*a28cd43dSSascha Wildner someMoreWork = 0; break;
4173*a28cd43dSSascha Wildner }
4174*a28cd43dSSascha Wildner /* complete loading into inBuffer in buffered mode */
4175*a28cd43dSSascha Wildner if (zcs->appliedParams.inBufferMode == ZSTD_bm_buffered) {
4176*a28cd43dSSascha Wildner size_t const toLoad = zcs->inBuffTarget - zcs->inBuffPos;
4177*a28cd43dSSascha Wildner size_t const loaded = ZSTD_limitCopy(
4178*a28cd43dSSascha Wildner zcs->inBuff + zcs->inBuffPos, toLoad,
4179*a28cd43dSSascha Wildner ip, iend-ip);
4180*a28cd43dSSascha Wildner zcs->inBuffPos += loaded;
4181*a28cd43dSSascha Wildner if (loaded != 0)
4182*a28cd43dSSascha Wildner ip += loaded;
4183*a28cd43dSSascha Wildner if ( (flushMode == ZSTD_e_continue)
4184*a28cd43dSSascha Wildner && (zcs->inBuffPos < zcs->inBuffTarget) ) {
4185*a28cd43dSSascha Wildner /* not enough input to fill full block : stop here */
4186*a28cd43dSSascha Wildner someMoreWork = 0; break;
4187*a28cd43dSSascha Wildner }
4188*a28cd43dSSascha Wildner if ( (flushMode == ZSTD_e_flush)
4189*a28cd43dSSascha Wildner && (zcs->inBuffPos == zcs->inToCompress) ) {
4190*a28cd43dSSascha Wildner /* empty */
4191*a28cd43dSSascha Wildner someMoreWork = 0; break;
4192*a28cd43dSSascha Wildner }
4193*a28cd43dSSascha Wildner }
4194*a28cd43dSSascha Wildner /* compress current block (note : this stage cannot be stopped in the middle) */
4195*a28cd43dSSascha Wildner DEBUGLOG(5, "stream compression stage (flushMode==%u)", flushMode);
4196*a28cd43dSSascha Wildner { int const inputBuffered = (zcs->appliedParams.inBufferMode == ZSTD_bm_buffered);
4197*a28cd43dSSascha Wildner void* cDst;
4198*a28cd43dSSascha Wildner size_t cSize;
4199*a28cd43dSSascha Wildner size_t oSize = oend-op;
4200*a28cd43dSSascha Wildner size_t const iSize = inputBuffered
4201*a28cd43dSSascha Wildner ? zcs->inBuffPos - zcs->inToCompress
4202*a28cd43dSSascha Wildner : MIN((size_t)(iend - ip), zcs->blockSize);
4203*a28cd43dSSascha Wildner if (oSize >= ZSTD_compressBound(iSize) || zcs->appliedParams.outBufferMode == ZSTD_bm_stable)
4204*a28cd43dSSascha Wildner cDst = op; /* compress into output buffer, to skip flush stage */
4205*a28cd43dSSascha Wildner else
4206*a28cd43dSSascha Wildner cDst = zcs->outBuff, oSize = zcs->outBuffSize;
4207*a28cd43dSSascha Wildner if (inputBuffered) {
4208*a28cd43dSSascha Wildner unsigned const lastBlock = (flushMode == ZSTD_e_end) && (ip==iend);
4209*a28cd43dSSascha Wildner cSize = lastBlock ?
4210*a28cd43dSSascha Wildner ZSTD_compressEnd(zcs, cDst, oSize,
4211*a28cd43dSSascha Wildner zcs->inBuff + zcs->inToCompress, iSize) :
4212*a28cd43dSSascha Wildner ZSTD_compressContinue(zcs, cDst, oSize,
4213*a28cd43dSSascha Wildner zcs->inBuff + zcs->inToCompress, iSize);
4214*a28cd43dSSascha Wildner FORWARD_IF_ERROR(cSize, "%s", lastBlock ? "ZSTD_compressEnd failed" : "ZSTD_compressContinue failed");
4215*a28cd43dSSascha Wildner zcs->frameEnded = lastBlock;
4216*a28cd43dSSascha Wildner /* prepare next block */
4217*a28cd43dSSascha Wildner zcs->inBuffTarget = zcs->inBuffPos + zcs->blockSize;
4218*a28cd43dSSascha Wildner if (zcs->inBuffTarget > zcs->inBuffSize)
4219*a28cd43dSSascha Wildner zcs->inBuffPos = 0, zcs->inBuffTarget = zcs->blockSize;
4220*a28cd43dSSascha Wildner DEBUGLOG(5, "inBuffTarget:%u / inBuffSize:%u",
4221*a28cd43dSSascha Wildner (unsigned)zcs->inBuffTarget, (unsigned)zcs->inBuffSize);
4222*a28cd43dSSascha Wildner if (!lastBlock)
4223*a28cd43dSSascha Wildner assert(zcs->inBuffTarget <= zcs->inBuffSize);
4224*a28cd43dSSascha Wildner zcs->inToCompress = zcs->inBuffPos;
4225*a28cd43dSSascha Wildner } else {
4226*a28cd43dSSascha Wildner unsigned const lastBlock = (ip + iSize == iend);
4227*a28cd43dSSascha Wildner assert(flushMode == ZSTD_e_end /* Already validated */);
4228*a28cd43dSSascha Wildner cSize = lastBlock ?
4229*a28cd43dSSascha Wildner ZSTD_compressEnd(zcs, cDst, oSize, ip, iSize) :
4230*a28cd43dSSascha Wildner ZSTD_compressContinue(zcs, cDst, oSize, ip, iSize);
4231*a28cd43dSSascha Wildner /* Consume the input prior to error checking to mirror buffered mode. */
4232*a28cd43dSSascha Wildner if (iSize > 0)
4233*a28cd43dSSascha Wildner ip += iSize;
4234*a28cd43dSSascha Wildner FORWARD_IF_ERROR(cSize, "%s", lastBlock ? "ZSTD_compressEnd failed" : "ZSTD_compressContinue failed");
4235*a28cd43dSSascha Wildner zcs->frameEnded = lastBlock;
4236*a28cd43dSSascha Wildner if (lastBlock)
4237*a28cd43dSSascha Wildner assert(ip == iend);
4238*a28cd43dSSascha Wildner }
4239*a28cd43dSSascha Wildner if (cDst == op) { /* no need to flush */
4240*a28cd43dSSascha Wildner op += cSize;
4241*a28cd43dSSascha Wildner if (zcs->frameEnded) {
4242*a28cd43dSSascha Wildner DEBUGLOG(5, "Frame completed directly in outBuffer");
4243*a28cd43dSSascha Wildner someMoreWork = 0;
4244*a28cd43dSSascha Wildner ZSTD_CCtx_reset(zcs, ZSTD_reset_session_only);
4245*a28cd43dSSascha Wildner }
4246*a28cd43dSSascha Wildner break;
4247*a28cd43dSSascha Wildner }
4248*a28cd43dSSascha Wildner zcs->outBuffContentSize = cSize;
4249*a28cd43dSSascha Wildner zcs->outBuffFlushedSize = 0;
4250*a28cd43dSSascha Wildner zcs->streamStage = zcss_flush; /* pass-through to flush stage */
4251*a28cd43dSSascha Wildner }
4252*a28cd43dSSascha Wildner /* fall-through */
4253*a28cd43dSSascha Wildner case zcss_flush:
4254*a28cd43dSSascha Wildner DEBUGLOG(5, "flush stage");
4255*a28cd43dSSascha Wildner assert(zcs->appliedParams.outBufferMode == ZSTD_bm_buffered);
4256*a28cd43dSSascha Wildner { size_t const toFlush = zcs->outBuffContentSize - zcs->outBuffFlushedSize;
4257*a28cd43dSSascha Wildner size_t const flushed = ZSTD_limitCopy(op, (size_t)(oend-op),
4258*a28cd43dSSascha Wildner zcs->outBuff + zcs->outBuffFlushedSize, toFlush);
4259*a28cd43dSSascha Wildner DEBUGLOG(5, "toFlush: %u into %u ==> flushed: %u",
4260*a28cd43dSSascha Wildner (unsigned)toFlush, (unsigned)(oend-op), (unsigned)flushed);
4261*a28cd43dSSascha Wildner if (flushed)
4262*a28cd43dSSascha Wildner op += flushed;
4263*a28cd43dSSascha Wildner zcs->outBuffFlushedSize += flushed;
4264*a28cd43dSSascha Wildner if (toFlush!=flushed) {
4265*a28cd43dSSascha Wildner /* flush not fully completed, presumably because dst is too small */
4266*a28cd43dSSascha Wildner assert(op==oend);
4267*a28cd43dSSascha Wildner someMoreWork = 0;
4268*a28cd43dSSascha Wildner break;
4269*a28cd43dSSascha Wildner }
4270*a28cd43dSSascha Wildner zcs->outBuffContentSize = zcs->outBuffFlushedSize = 0;
4271*a28cd43dSSascha Wildner if (zcs->frameEnded) {
4272*a28cd43dSSascha Wildner DEBUGLOG(5, "Frame completed on flush");
4273*a28cd43dSSascha Wildner someMoreWork = 0;
4274*a28cd43dSSascha Wildner ZSTD_CCtx_reset(zcs, ZSTD_reset_session_only);
4275*a28cd43dSSascha Wildner break;
4276*a28cd43dSSascha Wildner }
4277*a28cd43dSSascha Wildner zcs->streamStage = zcss_load;
4278*a28cd43dSSascha Wildner break;
4279*a28cd43dSSascha Wildner }
4280*a28cd43dSSascha Wildner
4281*a28cd43dSSascha Wildner default: /* impossible */
4282*a28cd43dSSascha Wildner assert(0);
4283*a28cd43dSSascha Wildner }
4284*a28cd43dSSascha Wildner }
4285*a28cd43dSSascha Wildner
4286*a28cd43dSSascha Wildner input->pos = ip - istart;
4287*a28cd43dSSascha Wildner output->pos = op - ostart;
4288*a28cd43dSSascha Wildner if (zcs->frameEnded) return 0;
4289*a28cd43dSSascha Wildner return ZSTD_nextInputSizeHint(zcs);
4290*a28cd43dSSascha Wildner }
4291*a28cd43dSSascha Wildner
/* ZSTD_nextInputSizeHint_MTorST() :
 * When built with ZSTD_MULTITHREAD and at least one worker is in use,
 * the hint comes from ZSTDMT_nextInputSizeHint();
 * otherwise it comes from ZSTD_nextInputSizeHint(). */
static size_t ZSTD_nextInputSizeHint_MTorST(const ZSTD_CCtx* cctx)
{
#ifdef ZSTD_MULTITHREAD
    {   int const hasWorkers = (cctx->appliedParams.nbWorkers >= 1);
        if (hasWorkers) {
            assert(cctx->mtctx != NULL);
            return ZSTDMT_nextInputSizeHint(cctx->mtctx);
        }
    }
#endif
    return ZSTD_nextInputSizeHint(cctx);
}
4303*a28cd43dSSascha Wildner
/* ZSTD_compressStream() :
 * Runs ZSTD_compressStream2() with the ZSTD_e_continue directive.
 * @return : hint size for next input (from ZSTD_nextInputSizeHint_MTorST()),
 *           or the error code returned by ZSTD_compressStream2(). */
size_t ZSTD_compressStream(ZSTD_CStream* zcs, ZSTD_outBuffer* output, ZSTD_inBuffer* input)
{
    size_t const streamStatus = ZSTD_compressStream2(zcs, output, input, ZSTD_e_continue);
    FORWARD_IF_ERROR(streamStatus, "");
    return ZSTD_nextInputSizeHint_MTorST(zcs);
}
4309*a28cd43dSSascha Wildner
4310*a28cd43dSSascha Wildner /* After a compression call set the expected input/output buffer.
4311*a28cd43dSSascha Wildner * This is validated at the start of the next compression call.
4312*a28cd43dSSascha Wildner */
ZSTD_setBufferExpectations(ZSTD_CCtx * cctx,ZSTD_outBuffer const * output,ZSTD_inBuffer const * input)4313*a28cd43dSSascha Wildner static void ZSTD_setBufferExpectations(ZSTD_CCtx* cctx, ZSTD_outBuffer const* output, ZSTD_inBuffer const* input)
4314*a28cd43dSSascha Wildner {
4315*a28cd43dSSascha Wildner if (cctx->appliedParams.inBufferMode == ZSTD_bm_stable) {
4316*a28cd43dSSascha Wildner cctx->expectedInBuffer = *input;
4317*a28cd43dSSascha Wildner }
4318*a28cd43dSSascha Wildner if (cctx->appliedParams.outBufferMode == ZSTD_bm_stable) {
4319*a28cd43dSSascha Wildner cctx->expectedOutBufferSize = output->size - output->pos;
4320*a28cd43dSSascha Wildner }
4321*a28cd43dSSascha Wildner }
4322*a28cd43dSSascha Wildner
4323*a28cd43dSSascha Wildner /* Validate that the input/output buffers match the expectations set by
4324*a28cd43dSSascha Wildner * ZSTD_setBufferExpectations.
4325*a28cd43dSSascha Wildner */
ZSTD_checkBufferStability(ZSTD_CCtx const * cctx,ZSTD_outBuffer const * output,ZSTD_inBuffer const * input,ZSTD_EndDirective endOp)4326*a28cd43dSSascha Wildner static size_t ZSTD_checkBufferStability(ZSTD_CCtx const* cctx,
4327*a28cd43dSSascha Wildner ZSTD_outBuffer const* output,
4328*a28cd43dSSascha Wildner ZSTD_inBuffer const* input,
4329*a28cd43dSSascha Wildner ZSTD_EndDirective endOp)
4330*a28cd43dSSascha Wildner {
4331*a28cd43dSSascha Wildner if (cctx->appliedParams.inBufferMode == ZSTD_bm_stable) {
4332*a28cd43dSSascha Wildner ZSTD_inBuffer const expect = cctx->expectedInBuffer;
4333*a28cd43dSSascha Wildner if (expect.src != input->src || expect.pos != input->pos || expect.size != input->size)
4334*a28cd43dSSascha Wildner RETURN_ERROR(srcBuffer_wrong, "ZSTD_c_stableInBuffer enabled but input differs!");
4335*a28cd43dSSascha Wildner if (endOp != ZSTD_e_end)
4336*a28cd43dSSascha Wildner RETURN_ERROR(srcBuffer_wrong, "ZSTD_c_stableInBuffer can only be used with ZSTD_e_end!");
4337*a28cd43dSSascha Wildner }
4338*a28cd43dSSascha Wildner if (cctx->appliedParams.outBufferMode == ZSTD_bm_stable) {
4339*a28cd43dSSascha Wildner size_t const outBufferSize = output->size - output->pos;
4340*a28cd43dSSascha Wildner if (cctx->expectedOutBufferSize != outBufferSize)
4341*a28cd43dSSascha Wildner RETURN_ERROR(dstBuffer_wrong, "ZSTD_c_stableOutBuffer enabled but output size differs!");
4342*a28cd43dSSascha Wildner }
4343*a28cd43dSSascha Wildner return 0;
4344*a28cd43dSSascha Wildner }
4345*a28cd43dSSascha Wildner
/* ZSTD_CCtx_init_compressStream2() :
 * Transparent initialization stage of ZSTD_compressStream2().
 * Works on a local copy of cctx->requestedParams, consumes the (single-use)
 * prefix dictionary, derives the compression parameters, then starts either
 * a multi-threaded or a single-threaded session.
 * @endOp  : when equal to ZSTD_e_end, the pledged source size is overwritten
 *           with @inSize.
 * @inSize : size of the input buffer passed to the current streaming call.
 * @return : 0 on success, or an error code forwarded from the helpers.
 * On success, cctx->streamStage is zcss_load.
 */
static size_t ZSTD_CCtx_init_compressStream2(ZSTD_CCtx* cctx,
                                             ZSTD_EndDirective endOp,
                                             size_t inSize) {
    ZSTD_CCtx_params params = cctx->requestedParams;
    ZSTD_prefixDict const prefixDict = cctx->prefixDict;
    FORWARD_IF_ERROR( ZSTD_initLocalDict(cctx) , ""); /* Init the local dict if present. */
    ZSTD_memset(&cctx->prefixDict, 0, sizeof(cctx->prefixDict));   /* single usage */
    assert(prefixDict.dict==NULL || cctx->cdict==NULL);    /* only one can be set */
    if (cctx->cdict)
        params.compressionLevel = cctx->cdict->compressionLevel; /* let cdict take priority in terms of compression level */
    DEBUGLOG(4, "ZSTD_compressStream2 : transparent init stage");
    if (endOp == ZSTD_e_end) cctx->pledgedSrcSizePlusOne = inSize + 1;  /* auto-fix pledgedSrcSize */
    {
        /* Dictionary size used for parameter selection: prefix first, then cdict, else none */
        size_t const dictSize = prefixDict.dict
                ? prefixDict.dictSize
                : (cctx->cdict ? cctx->cdict->dictContentSize : 0);
        ZSTD_cParamMode_e const mode = ZSTD_getCParamMode(cctx->cdict, &params, cctx->pledgedSrcSizePlusOne - 1);
        params.cParams = ZSTD_getCParamsFromCCtxParams(
                &params, cctx->pledgedSrcSizePlusOne-1,
                dictSize, mode);
    }

    if (ZSTD_CParams_shouldEnableLdm(&params.cParams)) {
        /* Enable LDM by default for optimal parser and window size >= 128MB */
        DEBUGLOG(4, "LDM enabled by default (window size >= 128MB, strategy >= btopt)");
        params.ldmParams.enableLdm = 1;
    }

#ifdef ZSTD_MULTITHREAD
    if ((cctx->pledgedSrcSizePlusOne-1) <= ZSTDMT_JOBSIZE_MIN) {
        params.nbWorkers = 0; /* do not invoke multi-threading when src size is too small */
    }
    if (params.nbWorkers > 0) {
        /* mt context creation */
        if (cctx->mtctx == NULL) {
            DEBUGLOG(4, "ZSTD_compressStream2: creating new mtctx for nbWorkers=%u",
                        params.nbWorkers);
            cctx->mtctx = ZSTDMT_createCCtx_advanced((U32)params.nbWorkers, cctx->customMem, cctx->pool);
            RETURN_ERROR_IF(cctx->mtctx == NULL, memory_allocation, "NULL pointer!");
        }
        /* mt compression */
        DEBUGLOG(4, "call ZSTDMT_initCStream_internal as nbWorkers=%u", params.nbWorkers);
        FORWARD_IF_ERROR( ZSTDMT_initCStream_internal(
                    cctx->mtctx,
                    prefixDict.dict, prefixDict.dictSize, prefixDict.dictContentType,
                    cctx->cdict, params, cctx->pledgedSrcSizePlusOne-1) , "");
        cctx->streamStage = zcss_load;
        cctx->appliedParams = params;
    } else
#endif
    {   U64 const pledgedSrcSize = cctx->pledgedSrcSizePlusOne - 1;
        assert(!ZSTD_isError(ZSTD_checkCParams(params.cParams)));
        FORWARD_IF_ERROR( ZSTD_compressBegin_internal(cctx,
                prefixDict.dict, prefixDict.dictSize, prefixDict.dictContentType, ZSTD_dtlm_fast,
                cctx->cdict,
                &params, pledgedSrcSize,
                ZSTDb_buffered) , "");
        assert(cctx->appliedParams.nbWorkers == 0);
        cctx->inToCompress = 0;
        cctx->inBuffPos = 0;
        if (cctx->appliedParams.inBufferMode == ZSTD_bm_buffered) {
            /* for small input: avoid automatic flush on reaching end of block, since
             * it would require to add a 3-bytes null block to end frame
             */
            cctx->inBuffTarget = cctx->blockSize + (cctx->blockSize == pledgedSrcSize);
        } else {
            cctx->inBuffTarget = 0;
        }
        cctx->outBuffContentSize = cctx->outBuffFlushedSize = 0;
        cctx->streamStage = zcss_load;
        cctx->frameEnded = 0;
    }
    return 0;
}
4420*a28cd43dSSascha Wildner
/* ZSTD_compressStream2() :
 * Validate the caller's buffers and directive, run the transparent
 * initialization when the context is still in stage zcss_init, check buffer
 * stability, then compress through either the multi-threaded or the
 * single-threaded path.
 * @return : in the multi-threaded path, the value reported by
 *           ZSTDMT_compressStream_generic(); in the single-threaded path,
 *           the number of bytes still held in the internal output buffer;
 *           or an error code.
 */
size_t ZSTD_compressStream2( ZSTD_CCtx* cctx,
                             ZSTD_outBuffer* output,
                             ZSTD_inBuffer* input,
                             ZSTD_EndDirective endOp)
{
    DEBUGLOG(5, "ZSTD_compressStream2, endOp=%u ", (unsigned)endOp);
    /* argument sanity checks */
    RETURN_ERROR_IF(output->pos > output->size, dstSize_tooSmall, "invalid output buffer");
    RETURN_ERROR_IF(input->pos > input->size, srcSize_wrong, "invalid input buffer");
    RETURN_ERROR_IF((U32)endOp > (U32)ZSTD_e_end, parameter_outOfBound, "invalid endDirective");
    assert(cctx != NULL);

    /* transparent initialization stage */
    if (cctx->streamStage == zcss_init) {
        size_t const initStatus = ZSTD_CCtx_init_compressStream2(cctx, endOp, input->size);
        FORWARD_IF_ERROR(initStatus, "CompressStream2 initialization failed");
        /* first expectations are only meaningful once initialization is done */
        ZSTD_setBufferExpectations(cctx, output, input);
    }

    FORWARD_IF_ERROR(ZSTD_checkBufferStability(cctx, output, input, endOp), "invalid buffers");

    /* compression stage */
#ifdef ZSTD_MULTITHREAD
    if (cctx->appliedParams.nbWorkers > 0) {
        size_t toFlush;
        int done = 0;
        if (cctx->cParamsChanged) {
            ZSTDMT_updateCParams_whileCompressing(cctx->mtctx, &cctx->requestedParams);
            cctx->cParamsChanged = 0;
        }
        do {
            size_t const inPosBefore = input->pos;
            size_t const outPosBefore = output->pos;
            toFlush = ZSTDMT_compressStream_generic(cctx->mtctx, output, input, endOp);
            /* reset the session on failure, or once the frame is fully written */
            if ( ZSTD_isError(toFlush)
              || (endOp == ZSTD_e_end && toFlush == 0) ) {
                ZSTD_CCtx_reset(cctx, ZSTD_reset_session_only);
            }
            FORWARD_IF_ERROR(toFlush, "ZSTDMT_compressStream_generic failed");

            if (endOp == ZSTD_e_continue) {
                /* Any progress is enough here: stop as soon as bytes were
                 * consumed or produced, or when either buffer is exhausted. */
                done = (input->pos != inPosBefore)
                    || (output->pos != outPosBefore)
                    || (input->pos == input->size)
                    || (output->pos == output->size);
            } else {
                assert(endOp == ZSTD_e_flush || endOp == ZSTD_e_end);
                /* Maximal progress required: stop only when the flush is
                 * complete or the output buffer is full. */
                done = (toFlush == 0) || (output->pos == output->size);
            }
        } while (!done);
        DEBUGLOG(5, "completed ZSTD_compressStream2 delegating to ZSTDMT_compressStream_generic");
        /* At this point: no maximal progress was required, or the flush is
         * finished, or the output buffer is full. */
        assert(endOp == ZSTD_e_continue || toFlush == 0 || output->pos == output->size);
        ZSTD_setBufferExpectations(cctx, output, input);
        return toFlush;
    }
#endif
    FORWARD_IF_ERROR( ZSTD_compressStream_generic(cctx, output, input, endOp) , "");
    DEBUGLOG(5, "completed ZSTD_compressStream2");
    ZSTD_setBufferExpectations(cctx, output, input);
    return cctx->outBuffContentSize - cctx->outBuffFlushedSize; /* remaining to flush */
}
4489*a28cd43dSSascha Wildner
/* ZSTD_compressStream2_simpleArgs() :
 * Variant of ZSTD_compressStream2() taking plain pointers, sizes and
 * positions instead of buffer structures. *dstPos and *srcPos are read on
 * entry and always written back on exit, including when an error is returned.
 * @return : whatever ZSTD_compressStream2() returns.
 */
size_t ZSTD_compressStream2_simpleArgs (
                            ZSTD_CCtx* cctx,
                            void* dst, size_t dstCapacity, size_t* dstPos,
                      const void* src, size_t srcSize, size_t* srcPos,
                            ZSTD_EndDirective endOp)
{
    ZSTD_outBuffer outBuf = { dst, dstCapacity, *dstPos };
    ZSTD_inBuffer  inBuf  = { src, srcSize, *srcPos };
    /* validity of the positions is checked inside ZSTD_compressStream2() */
    size_t const status = ZSTD_compressStream2(cctx, &outBuf, &inBuf, endOp);
    *dstPos = outBuf.pos;
    *srcPos = inBuf.pos;
    return status;
}
4504*a28cd43dSSascha Wildner
/* ZSTD_compress2() :
 * One-shot compression built on the streaming API. The session is reset,
 * stable input/output buffer modes are forced for the duration of the call,
 * and the caller's requested buffer modes are restored afterwards.
 * @return : number of bytes written into dst, or an error code
 *           (dstSize_tooSmall when the frame could not be completed).
 */
size_t ZSTD_compress2(ZSTD_CCtx* cctx,
                      void* dst, size_t dstCapacity,
                      const void* src, size_t srcSize)
{
    ZSTD_bufferMode_e const savedInMode  = cctx->requestedParams.inBufferMode;
    ZSTD_bufferMode_e const savedOutMode = cctx->requestedParams.outBufferMode;
    size_t dstUsed = 0;
    size_t srcUsed = 0;
    size_t remaining;

    DEBUGLOG(4, "ZSTD_compress2 (srcSize=%u)", (unsigned)srcSize);
    ZSTD_CCtx_reset(cctx, ZSTD_reset_session_only);

    /* Force stable buffers for this single call. */
    cctx->requestedParams.inBufferMode = ZSTD_bm_stable;
    cctx->requestedParams.outBufferMode = ZSTD_bm_stable;

    remaining = ZSTD_compressStream2_simpleArgs(cctx,
                                                dst, dstCapacity, &dstUsed,
                                                src, srcSize, &srcUsed,
                                                ZSTD_e_end);

    /* Restore the caller's settings before any early return. */
    cctx->requestedParams.inBufferMode = savedInMode;
    cctx->requestedParams.outBufferMode = savedOutMode;

    FORWARD_IF_ERROR(remaining, "ZSTD_compressStream2_simpleArgs failed");
    if (remaining != 0) {  /* compression not completed, due to lack of output space */
        assert(dstUsed == dstCapacity);
        RETURN_ERROR(dstSize_tooSmall, "");
    }
    assert(srcUsed == srcSize);   /* all input is expected consumed */
    return dstUsed;
}
4534*a28cd43dSSascha Wildner
4535*a28cd43dSSascha Wildner typedef struct {
4536*a28cd43dSSascha Wildner U32 idx; /* Index in array of ZSTD_Sequence */
4537*a28cd43dSSascha Wildner U32 posInSequence; /* Position within sequence at idx */
4538*a28cd43dSSascha Wildner size_t posInSrc; /* Number of bytes given by sequences provided so far */
4539*a28cd43dSSascha Wildner } ZSTD_sequencePosition;
4540*a28cd43dSSascha Wildner
4541*a28cd43dSSascha Wildner /* Returns a ZSTD error code if sequence is not valid */
ZSTD_validateSequence(U32 offCode,U32 matchLength,size_t posInSrc,U32 windowLog,size_t dictSize,U32 minMatch)4542*a28cd43dSSascha Wildner static size_t ZSTD_validateSequence(U32 offCode, U32 matchLength,
4543*a28cd43dSSascha Wildner size_t posInSrc, U32 windowLog, size_t dictSize, U32 minMatch) {
4544*a28cd43dSSascha Wildner size_t offsetBound;
4545*a28cd43dSSascha Wildner U32 windowSize = 1 << windowLog;
4546*a28cd43dSSascha Wildner /* posInSrc represents the amount of data the the decoder would decode up to this point.
4547*a28cd43dSSascha Wildner * As long as the amount of data decoded is less than or equal to window size, offsets may be
4548*a28cd43dSSascha Wildner * larger than the total length of output decoded in order to reference the dict, even larger than
4549*a28cd43dSSascha Wildner * window size. After output surpasses windowSize, we're limited to windowSize offsets again.
4550*a28cd43dSSascha Wildner */
4551*a28cd43dSSascha Wildner offsetBound = posInSrc > windowSize ? (size_t)windowSize : posInSrc + (size_t)dictSize;
4552*a28cd43dSSascha Wildner RETURN_ERROR_IF(offCode > offsetBound + ZSTD_REP_MOVE, corruption_detected, "Offset too large!");
4553*a28cd43dSSascha Wildner RETURN_ERROR_IF(matchLength < minMatch, corruption_detected, "Matchlength too small");
4554*a28cd43dSSascha Wildner return 0;
4555*a28cd43dSSascha Wildner }
4556*a28cd43dSSascha Wildner
4557*a28cd43dSSascha Wildner /* Returns an offset code, given a sequence's raw offset, the ongoing repcode array, and whether litLength == 0 */
ZSTD_finalizeOffCode(U32 rawOffset,const U32 rep[ZSTD_REP_NUM],U32 ll0)4558*a28cd43dSSascha Wildner static U32 ZSTD_finalizeOffCode(U32 rawOffset, const U32 rep[ZSTD_REP_NUM], U32 ll0) {
4559*a28cd43dSSascha Wildner U32 offCode = rawOffset + ZSTD_REP_MOVE;
4560*a28cd43dSSascha Wildner U32 repCode = 0;
4561*a28cd43dSSascha Wildner
4562*a28cd43dSSascha Wildner if (!ll0 && rawOffset == rep[0]) {
4563*a28cd43dSSascha Wildner repCode = 1;
4564*a28cd43dSSascha Wildner } else if (rawOffset == rep[1]) {
4565*a28cd43dSSascha Wildner repCode = 2 - ll0;
4566*a28cd43dSSascha Wildner } else if (rawOffset == rep[2]) {
4567*a28cd43dSSascha Wildner repCode = 3 - ll0;
4568*a28cd43dSSascha Wildner } else if (ll0 && rawOffset == rep[0] - 1) {
4569*a28cd43dSSascha Wildner repCode = 3;
4570*a28cd43dSSascha Wildner }
4571*a28cd43dSSascha Wildner if (repCode) {
4572*a28cd43dSSascha Wildner /* ZSTD_storeSeq expects a number in the range [0, 2] to represent a repcode */
4573*a28cd43dSSascha Wildner offCode = repCode - 1;
4574*a28cd43dSSascha Wildner }
4575*a28cd43dSSascha Wildner return offCode;
4576*a28cd43dSSascha Wildner }
4577*a28cd43dSSascha Wildner
4578*a28cd43dSSascha Wildner /* Returns 0 on success, and a ZSTD_error otherwise. This function scans through an array of
4579*a28cd43dSSascha Wildner * ZSTD_Sequence, storing the sequences it finds, until it reaches a block delimiter.
4580*a28cd43dSSascha Wildner */
ZSTD_copySequencesToSeqStoreExplicitBlockDelim(ZSTD_CCtx * cctx,ZSTD_sequencePosition * seqPos,const ZSTD_Sequence * const inSeqs,size_t inSeqsSize,const void * src,size_t blockSize)4581*a28cd43dSSascha Wildner static size_t ZSTD_copySequencesToSeqStoreExplicitBlockDelim(ZSTD_CCtx* cctx, ZSTD_sequencePosition* seqPos,
4582*a28cd43dSSascha Wildner const ZSTD_Sequence* const inSeqs, size_t inSeqsSize,
4583*a28cd43dSSascha Wildner const void* src, size_t blockSize) {
4584*a28cd43dSSascha Wildner U32 idx = seqPos->idx;
4585*a28cd43dSSascha Wildner BYTE const* ip = (BYTE const*)(src);
4586*a28cd43dSSascha Wildner const BYTE* const iend = ip + blockSize;
4587*a28cd43dSSascha Wildner repcodes_t updatedRepcodes;
4588*a28cd43dSSascha Wildner U32 dictSize;
4589*a28cd43dSSascha Wildner U32 litLength;
4590*a28cd43dSSascha Wildner U32 matchLength;
4591*a28cd43dSSascha Wildner U32 ll0;
4592*a28cd43dSSascha Wildner U32 offCode;
4593*a28cd43dSSascha Wildner
4594*a28cd43dSSascha Wildner if (cctx->cdict) {
4595*a28cd43dSSascha Wildner dictSize = (U32)cctx->cdict->dictContentSize;
4596*a28cd43dSSascha Wildner } else if (cctx->prefixDict.dict) {
4597*a28cd43dSSascha Wildner dictSize = (U32)cctx->prefixDict.dictSize;
4598*a28cd43dSSascha Wildner } else {
4599*a28cd43dSSascha Wildner dictSize = 0;
4600*a28cd43dSSascha Wildner }
4601*a28cd43dSSascha Wildner ZSTD_memcpy(updatedRepcodes.rep, cctx->blockState.prevCBlock->rep, sizeof(repcodes_t));
4602*a28cd43dSSascha Wildner for (; (inSeqs[idx].matchLength != 0 || inSeqs[idx].offset != 0) && idx < inSeqsSize; ++idx) {
4603*a28cd43dSSascha Wildner litLength = inSeqs[idx].litLength;
4604*a28cd43dSSascha Wildner matchLength = inSeqs[idx].matchLength;
4605*a28cd43dSSascha Wildner ll0 = litLength == 0;
4606*a28cd43dSSascha Wildner offCode = ZSTD_finalizeOffCode(inSeqs[idx].offset, updatedRepcodes.rep, ll0);
4607*a28cd43dSSascha Wildner updatedRepcodes = ZSTD_updateRep(updatedRepcodes.rep, offCode, ll0);
4608*a28cd43dSSascha Wildner
4609*a28cd43dSSascha Wildner DEBUGLOG(6, "Storing sequence: (of: %u, ml: %u, ll: %u)", offCode, matchLength, litLength);
4610*a28cd43dSSascha Wildner if (cctx->appliedParams.validateSequences) {
4611*a28cd43dSSascha Wildner seqPos->posInSrc += litLength + matchLength;
4612*a28cd43dSSascha Wildner FORWARD_IF_ERROR(ZSTD_validateSequence(offCode, matchLength, seqPos->posInSrc,
4613*a28cd43dSSascha Wildner cctx->appliedParams.cParams.windowLog, dictSize,
4614*a28cd43dSSascha Wildner cctx->appliedParams.cParams.minMatch),
4615*a28cd43dSSascha Wildner "Sequence validation failed");
4616*a28cd43dSSascha Wildner }
4617*a28cd43dSSascha Wildner RETURN_ERROR_IF(idx - seqPos->idx > cctx->seqStore.maxNbSeq, memory_allocation,
4618*a28cd43dSSascha Wildner "Not enough memory allocated. Try adjusting ZSTD_c_minMatch.");
4619*a28cd43dSSascha Wildner ZSTD_storeSeq(&cctx->seqStore, litLength, ip, iend, offCode, matchLength - MINMATCH);
4620*a28cd43dSSascha Wildner ip += matchLength + litLength;
4621*a28cd43dSSascha Wildner }
4622*a28cd43dSSascha Wildner ZSTD_memcpy(cctx->blockState.nextCBlock->rep, updatedRepcodes.rep, sizeof(repcodes_t));
4623*a28cd43dSSascha Wildner
4624*a28cd43dSSascha Wildner if (inSeqs[idx].litLength) {
4625*a28cd43dSSascha Wildner DEBUGLOG(6, "Storing last literals of size: %u", inSeqs[idx].litLength);
4626*a28cd43dSSascha Wildner ZSTD_storeLastLiterals(&cctx->seqStore, ip, inSeqs[idx].litLength);
4627*a28cd43dSSascha Wildner ip += inSeqs[idx].litLength;
4628*a28cd43dSSascha Wildner seqPos->posInSrc += inSeqs[idx].litLength;
4629*a28cd43dSSascha Wildner }
4630*a28cd43dSSascha Wildner RETURN_ERROR_IF(ip != iend, corruption_detected, "Blocksize doesn't agree with block delimiter!");
4631*a28cd43dSSascha Wildner seqPos->idx = idx+1;
4632*a28cd43dSSascha Wildner return 0;
4633*a28cd43dSSascha Wildner }
4634*a28cd43dSSascha Wildner
4635*a28cd43dSSascha Wildner /* Returns the number of bytes to move the current read position back by. Only non-zero
4636*a28cd43dSSascha Wildner * if we ended up splitting a sequence. Otherwise, it may return a ZSTD error if something
4637*a28cd43dSSascha Wildner * went wrong.
4638*a28cd43dSSascha Wildner *
4639*a28cd43dSSascha Wildner * This function will attempt to scan through blockSize bytes represented by the sequences
4640*a28cd43dSSascha Wildner * in inSeqs, storing any (partial) sequences.
4641*a28cd43dSSascha Wildner *
4642*a28cd43dSSascha Wildner * Occasionally, we may want to change the actual number of bytes we consumed from inSeqs to
4643*a28cd43dSSascha Wildner * avoid splitting a match, or to avoid splitting a match such that it would produce a match
4644*a28cd43dSSascha Wildner * smaller than MINMATCH. In this case, we return the number of bytes that we didn't read from this block.
4645*a28cd43dSSascha Wildner */
ZSTD_copySequencesToSeqStoreNoBlockDelim(ZSTD_CCtx * cctx,ZSTD_sequencePosition * seqPos,const ZSTD_Sequence * const inSeqs,size_t inSeqsSize,const void * src,size_t blockSize)4646*a28cd43dSSascha Wildner static size_t ZSTD_copySequencesToSeqStoreNoBlockDelim(ZSTD_CCtx* cctx, ZSTD_sequencePosition* seqPos,
4647*a28cd43dSSascha Wildner const ZSTD_Sequence* const inSeqs, size_t inSeqsSize,
4648*a28cd43dSSascha Wildner const void* src, size_t blockSize) {
4649*a28cd43dSSascha Wildner U32 idx = seqPos->idx;
4650*a28cd43dSSascha Wildner U32 startPosInSequence = seqPos->posInSequence;
4651*a28cd43dSSascha Wildner U32 endPosInSequence = seqPos->posInSequence + (U32)blockSize;
4652*a28cd43dSSascha Wildner size_t dictSize;
4653*a28cd43dSSascha Wildner BYTE const* ip = (BYTE const*)(src);
4654*a28cd43dSSascha Wildner BYTE const* iend = ip + blockSize; /* May be adjusted if we decide to process fewer than blockSize bytes */
4655*a28cd43dSSascha Wildner repcodes_t updatedRepcodes;
4656*a28cd43dSSascha Wildner U32 bytesAdjustment = 0;
4657*a28cd43dSSascha Wildner U32 finalMatchSplit = 0;
4658*a28cd43dSSascha Wildner U32 litLength;
4659*a28cd43dSSascha Wildner U32 matchLength;
4660*a28cd43dSSascha Wildner U32 rawOffset;
4661*a28cd43dSSascha Wildner U32 offCode;
4662*a28cd43dSSascha Wildner
4663*a28cd43dSSascha Wildner if (cctx->cdict) {
4664*a28cd43dSSascha Wildner dictSize = cctx->cdict->dictContentSize;
4665*a28cd43dSSascha Wildner } else if (cctx->prefixDict.dict) {
4666*a28cd43dSSascha Wildner dictSize = cctx->prefixDict.dictSize;
4667*a28cd43dSSascha Wildner } else {
4668*a28cd43dSSascha Wildner dictSize = 0;
4669*a28cd43dSSascha Wildner }
4670*a28cd43dSSascha Wildner DEBUGLOG(5, "ZSTD_copySequencesToSeqStore: idx: %u PIS: %u blockSize: %zu", idx, startPosInSequence, blockSize);
4671*a28cd43dSSascha Wildner DEBUGLOG(5, "Start seq: idx: %u (of: %u ml: %u ll: %u)", idx, inSeqs[idx].offset, inSeqs[idx].matchLength, inSeqs[idx].litLength);
4672*a28cd43dSSascha Wildner ZSTD_memcpy(updatedRepcodes.rep, cctx->blockState.prevCBlock->rep, sizeof(repcodes_t));
4673*a28cd43dSSascha Wildner while (endPosInSequence && idx < inSeqsSize && !finalMatchSplit) {
4674*a28cd43dSSascha Wildner const ZSTD_Sequence currSeq = inSeqs[idx];
4675*a28cd43dSSascha Wildner litLength = currSeq.litLength;
4676*a28cd43dSSascha Wildner matchLength = currSeq.matchLength;
4677*a28cd43dSSascha Wildner rawOffset = currSeq.offset;
4678*a28cd43dSSascha Wildner
4679*a28cd43dSSascha Wildner /* Modify the sequence depending on where endPosInSequence lies */
4680*a28cd43dSSascha Wildner if (endPosInSequence >= currSeq.litLength + currSeq.matchLength) {
4681*a28cd43dSSascha Wildner if (startPosInSequence >= litLength) {
4682*a28cd43dSSascha Wildner startPosInSequence -= litLength;
4683*a28cd43dSSascha Wildner litLength = 0;
4684*a28cd43dSSascha Wildner matchLength -= startPosInSequence;
4685*a28cd43dSSascha Wildner } else {
4686*a28cd43dSSascha Wildner litLength -= startPosInSequence;
4687*a28cd43dSSascha Wildner }
4688*a28cd43dSSascha Wildner /* Move to the next sequence */
4689*a28cd43dSSascha Wildner endPosInSequence -= currSeq.litLength + currSeq.matchLength;
4690*a28cd43dSSascha Wildner startPosInSequence = 0;
4691*a28cd43dSSascha Wildner idx++;
4692*a28cd43dSSascha Wildner } else {
4693*a28cd43dSSascha Wildner /* This is the final (partial) sequence we're adding from inSeqs, and endPosInSequence
4694*a28cd43dSSascha Wildner does not reach the end of the match. So, we have to split the sequence */
4695*a28cd43dSSascha Wildner DEBUGLOG(6, "Require a split: diff: %u, idx: %u PIS: %u",
4696*a28cd43dSSascha Wildner currSeq.litLength + currSeq.matchLength - endPosInSequence, idx, endPosInSequence);
4697*a28cd43dSSascha Wildner if (endPosInSequence > litLength) {
4698*a28cd43dSSascha Wildner U32 firstHalfMatchLength;
4699*a28cd43dSSascha Wildner litLength = startPosInSequence >= litLength ? 0 : litLength - startPosInSequence;
4700*a28cd43dSSascha Wildner firstHalfMatchLength = endPosInSequence - startPosInSequence - litLength;
4701*a28cd43dSSascha Wildner if (matchLength > blockSize && firstHalfMatchLength >= cctx->appliedParams.cParams.minMatch) {
4702*a28cd43dSSascha Wildner /* Only ever split the match if it is larger than the block size */
4703*a28cd43dSSascha Wildner U32 secondHalfMatchLength = currSeq.matchLength + currSeq.litLength - endPosInSequence;
4704*a28cd43dSSascha Wildner if (secondHalfMatchLength < cctx->appliedParams.cParams.minMatch) {
4705*a28cd43dSSascha Wildner /* Move the endPosInSequence backward so that it creates match of minMatch length */
4706*a28cd43dSSascha Wildner endPosInSequence -= cctx->appliedParams.cParams.minMatch - secondHalfMatchLength;
4707*a28cd43dSSascha Wildner bytesAdjustment = cctx->appliedParams.cParams.minMatch - secondHalfMatchLength;
4708*a28cd43dSSascha Wildner firstHalfMatchLength -= bytesAdjustment;
4709*a28cd43dSSascha Wildner }
4710*a28cd43dSSascha Wildner matchLength = firstHalfMatchLength;
4711*a28cd43dSSascha Wildner /* Flag that we split the last match - after storing the sequence, exit the loop,
4712*a28cd43dSSascha Wildner but keep the value of endPosInSequence */
4713*a28cd43dSSascha Wildner finalMatchSplit = 1;
4714*a28cd43dSSascha Wildner } else {
4715*a28cd43dSSascha Wildner /* Move the position in sequence backwards so that we don't split match, and break to store
4716*a28cd43dSSascha Wildner * the last literals. We use the original currSeq.litLength as a marker for where endPosInSequence
4717*a28cd43dSSascha Wildner * should go. We prefer to do this whenever it is not necessary to split the match, or if doing so
4718*a28cd43dSSascha Wildner * would cause the first half of the match to be too small
4719*a28cd43dSSascha Wildner */
4720*a28cd43dSSascha Wildner bytesAdjustment = endPosInSequence - currSeq.litLength;
4721*a28cd43dSSascha Wildner endPosInSequence = currSeq.litLength;
4722*a28cd43dSSascha Wildner break;
4723*a28cd43dSSascha Wildner }
4724*a28cd43dSSascha Wildner } else {
4725*a28cd43dSSascha Wildner /* This sequence ends inside the literals, break to store the last literals */
4726*a28cd43dSSascha Wildner break;
4727*a28cd43dSSascha Wildner }
4728*a28cd43dSSascha Wildner }
4729*a28cd43dSSascha Wildner /* Check if this offset can be represented with a repcode */
4730*a28cd43dSSascha Wildner { U32 ll0 = (litLength == 0);
4731*a28cd43dSSascha Wildner offCode = ZSTD_finalizeOffCode(rawOffset, updatedRepcodes.rep, ll0);
4732*a28cd43dSSascha Wildner updatedRepcodes = ZSTD_updateRep(updatedRepcodes.rep, offCode, ll0);
4733*a28cd43dSSascha Wildner }
4734*a28cd43dSSascha Wildner
4735*a28cd43dSSascha Wildner if (cctx->appliedParams.validateSequences) {
4736*a28cd43dSSascha Wildner seqPos->posInSrc += litLength + matchLength;
4737*a28cd43dSSascha Wildner FORWARD_IF_ERROR(ZSTD_validateSequence(offCode, matchLength, seqPos->posInSrc,
4738*a28cd43dSSascha Wildner cctx->appliedParams.cParams.windowLog, dictSize,
4739*a28cd43dSSascha Wildner cctx->appliedParams.cParams.minMatch),
4740*a28cd43dSSascha Wildner "Sequence validation failed");
4741*a28cd43dSSascha Wildner }
4742*a28cd43dSSascha Wildner DEBUGLOG(6, "Storing sequence: (of: %u, ml: %u, ll: %u)", offCode, matchLength, litLength);
4743*a28cd43dSSascha Wildner RETURN_ERROR_IF(idx - seqPos->idx > cctx->seqStore.maxNbSeq, memory_allocation,
4744*a28cd43dSSascha Wildner "Not enough memory allocated. Try adjusting ZSTD_c_minMatch.");
4745*a28cd43dSSascha Wildner ZSTD_storeSeq(&cctx->seqStore, litLength, ip, iend, offCode, matchLength - MINMATCH);
4746*a28cd43dSSascha Wildner ip += matchLength + litLength;
4747*a28cd43dSSascha Wildner }
4748*a28cd43dSSascha Wildner DEBUGLOG(5, "Ending seq: idx: %u (of: %u ml: %u ll: %u)", idx, inSeqs[idx].offset, inSeqs[idx].matchLength, inSeqs[idx].litLength);
4749*a28cd43dSSascha Wildner assert(idx == inSeqsSize || endPosInSequence <= inSeqs[idx].litLength + inSeqs[idx].matchLength);
4750*a28cd43dSSascha Wildner seqPos->idx = idx;
4751*a28cd43dSSascha Wildner seqPos->posInSequence = endPosInSequence;
4752*a28cd43dSSascha Wildner ZSTD_memcpy(cctx->blockState.nextCBlock->rep, updatedRepcodes.rep, sizeof(repcodes_t));
4753*a28cd43dSSascha Wildner
4754*a28cd43dSSascha Wildner iend -= bytesAdjustment;
4755*a28cd43dSSascha Wildner if (ip != iend) {
4756*a28cd43dSSascha Wildner /* Store any last literals */
4757*a28cd43dSSascha Wildner U32 lastLLSize = (U32)(iend - ip);
4758*a28cd43dSSascha Wildner assert(ip <= iend);
4759*a28cd43dSSascha Wildner DEBUGLOG(6, "Storing last literals of size: %u", lastLLSize);
4760*a28cd43dSSascha Wildner ZSTD_storeLastLiterals(&cctx->seqStore, ip, lastLLSize);
4761*a28cd43dSSascha Wildner seqPos->posInSrc += lastLLSize;
4762*a28cd43dSSascha Wildner }
4763*a28cd43dSSascha Wildner
4764*a28cd43dSSascha Wildner return bytesAdjustment;
4765*a28cd43dSSascha Wildner }
4766*a28cd43dSSascha Wildner
4767*a28cd43dSSascha Wildner typedef size_t (*ZSTD_sequenceCopier) (ZSTD_CCtx* cctx, ZSTD_sequencePosition* seqPos,
4768*a28cd43dSSascha Wildner const ZSTD_Sequence* const inSeqs, size_t inSeqsSize,
4769*a28cd43dSSascha Wildner const void* src, size_t blockSize);
ZSTD_selectSequenceCopier(ZSTD_sequenceFormat_e mode)4770*a28cd43dSSascha Wildner static ZSTD_sequenceCopier ZSTD_selectSequenceCopier(ZSTD_sequenceFormat_e mode) {
4771*a28cd43dSSascha Wildner ZSTD_sequenceCopier sequenceCopier = NULL;
4772*a28cd43dSSascha Wildner assert(ZSTD_cParam_withinBounds(ZSTD_c_blockDelimiters, mode));
4773*a28cd43dSSascha Wildner if (mode == ZSTD_sf_explicitBlockDelimiters) {
4774*a28cd43dSSascha Wildner return ZSTD_copySequencesToSeqStoreExplicitBlockDelim;
4775*a28cd43dSSascha Wildner } else if (mode == ZSTD_sf_noBlockDelimiters) {
4776*a28cd43dSSascha Wildner return ZSTD_copySequencesToSeqStoreNoBlockDelim;
4777*a28cd43dSSascha Wildner }
4778*a28cd43dSSascha Wildner assert(sequenceCopier != NULL);
4779*a28cd43dSSascha Wildner return sequenceCopier;
4780*a28cd43dSSascha Wildner }
4781*a28cd43dSSascha Wildner
4782*a28cd43dSSascha Wildner /* Compress, block-by-block, all of the sequences given.
4783*a28cd43dSSascha Wildner *
4784*a28cd43dSSascha Wildner * Returns the cumulative size of all compressed blocks (including their headers), otherwise a ZSTD error.
4785*a28cd43dSSascha Wildner */
ZSTD_compressSequences_internal(ZSTD_CCtx * cctx,void * dst,size_t dstCapacity,const ZSTD_Sequence * inSeqs,size_t inSeqsSize,const void * src,size_t srcSize)4786*a28cd43dSSascha Wildner static size_t ZSTD_compressSequences_internal(ZSTD_CCtx* cctx,
4787*a28cd43dSSascha Wildner void* dst, size_t dstCapacity,
4788*a28cd43dSSascha Wildner const ZSTD_Sequence* inSeqs, size_t inSeqsSize,
4789*a28cd43dSSascha Wildner const void* src, size_t srcSize) {
4790*a28cd43dSSascha Wildner size_t cSize = 0;
4791*a28cd43dSSascha Wildner U32 lastBlock;
4792*a28cd43dSSascha Wildner size_t blockSize;
4793*a28cd43dSSascha Wildner size_t compressedSeqsSize;
4794*a28cd43dSSascha Wildner size_t remaining = srcSize;
4795*a28cd43dSSascha Wildner ZSTD_sequencePosition seqPos = {0, 0, 0};
4796*a28cd43dSSascha Wildner
4797*a28cd43dSSascha Wildner BYTE const* ip = (BYTE const*)src;
4798*a28cd43dSSascha Wildner BYTE* op = (BYTE*)dst;
4799*a28cd43dSSascha Wildner ZSTD_sequenceCopier sequenceCopier = ZSTD_selectSequenceCopier(cctx->appliedParams.blockDelimiters);
4800*a28cd43dSSascha Wildner
4801*a28cd43dSSascha Wildner DEBUGLOG(4, "ZSTD_compressSequences_internal srcSize: %zu, inSeqsSize: %zu", srcSize, inSeqsSize);
4802*a28cd43dSSascha Wildner /* Special case: empty frame */
4803*a28cd43dSSascha Wildner if (remaining == 0) {
4804*a28cd43dSSascha Wildner U32 const cBlockHeader24 = 1 /* last block */ + (((U32)bt_raw)<<1);
4805*a28cd43dSSascha Wildner RETURN_ERROR_IF(dstCapacity<4, dstSize_tooSmall, "No room for empty frame block header");
4806*a28cd43dSSascha Wildner MEM_writeLE32(op, cBlockHeader24);
4807*a28cd43dSSascha Wildner op += ZSTD_blockHeaderSize;
4808*a28cd43dSSascha Wildner dstCapacity -= ZSTD_blockHeaderSize;
4809*a28cd43dSSascha Wildner cSize += ZSTD_blockHeaderSize;
4810*a28cd43dSSascha Wildner }
4811*a28cd43dSSascha Wildner
4812*a28cd43dSSascha Wildner while (remaining) {
4813*a28cd43dSSascha Wildner size_t cBlockSize;
4814*a28cd43dSSascha Wildner size_t additionalByteAdjustment;
4815*a28cd43dSSascha Wildner lastBlock = remaining <= cctx->blockSize;
4816*a28cd43dSSascha Wildner blockSize = lastBlock ? (U32)remaining : (U32)cctx->blockSize;
4817*a28cd43dSSascha Wildner ZSTD_resetSeqStore(&cctx->seqStore);
4818*a28cd43dSSascha Wildner DEBUGLOG(4, "Working on new block. Blocksize: %zu", blockSize);
4819*a28cd43dSSascha Wildner
4820*a28cd43dSSascha Wildner additionalByteAdjustment = sequenceCopier(cctx, &seqPos, inSeqs, inSeqsSize, ip, blockSize);
4821*a28cd43dSSascha Wildner FORWARD_IF_ERROR(additionalByteAdjustment, "Bad sequence copy");
4822*a28cd43dSSascha Wildner blockSize -= additionalByteAdjustment;
4823*a28cd43dSSascha Wildner
4824*a28cd43dSSascha Wildner /* If blocks are too small, emit as a nocompress block */
4825*a28cd43dSSascha Wildner if (blockSize < MIN_CBLOCK_SIZE+ZSTD_blockHeaderSize+1) {
4826*a28cd43dSSascha Wildner cBlockSize = ZSTD_noCompressBlock(op, dstCapacity, ip, blockSize, lastBlock);
4827*a28cd43dSSascha Wildner FORWARD_IF_ERROR(cBlockSize, "Nocompress block failed");
4828*a28cd43dSSascha Wildner DEBUGLOG(4, "Block too small, writing out nocompress block: cSize: %zu", cBlockSize);
4829*a28cd43dSSascha Wildner cSize += cBlockSize;
4830*a28cd43dSSascha Wildner ip += blockSize;
4831*a28cd43dSSascha Wildner op += cBlockSize;
4832*a28cd43dSSascha Wildner remaining -= blockSize;
4833*a28cd43dSSascha Wildner dstCapacity -= cBlockSize;
4834*a28cd43dSSascha Wildner continue;
4835*a28cd43dSSascha Wildner }
4836*a28cd43dSSascha Wildner
4837*a28cd43dSSascha Wildner compressedSeqsSize = ZSTD_entropyCompressSequences(&cctx->seqStore,
4838*a28cd43dSSascha Wildner &cctx->blockState.prevCBlock->entropy, &cctx->blockState.nextCBlock->entropy,
4839*a28cd43dSSascha Wildner &cctx->appliedParams,
4840*a28cd43dSSascha Wildner op + ZSTD_blockHeaderSize /* Leave space for block header */, dstCapacity - ZSTD_blockHeaderSize,
4841*a28cd43dSSascha Wildner blockSize,
4842*a28cd43dSSascha Wildner cctx->entropyWorkspace, ENTROPY_WORKSPACE_SIZE /* statically allocated in resetCCtx */,
4843*a28cd43dSSascha Wildner cctx->bmi2);
4844*a28cd43dSSascha Wildner FORWARD_IF_ERROR(compressedSeqsSize, "Compressing sequences of block failed");
4845*a28cd43dSSascha Wildner DEBUGLOG(4, "Compressed sequences size: %zu", compressedSeqsSize);
4846*a28cd43dSSascha Wildner
4847*a28cd43dSSascha Wildner if (!cctx->isFirstBlock &&
4848*a28cd43dSSascha Wildner ZSTD_maybeRLE(&cctx->seqStore) &&
4849*a28cd43dSSascha Wildner ZSTD_isRLE((BYTE const*)src, srcSize)) {
4850*a28cd43dSSascha Wildner /* We don't want to emit our first block as a RLE even if it qualifies because
4851*a28cd43dSSascha Wildner * doing so will cause the decoder (cli only) to throw a "should consume all input error."
4852*a28cd43dSSascha Wildner * This is only an issue for zstd <= v1.4.3
4853*a28cd43dSSascha Wildner */
4854*a28cd43dSSascha Wildner compressedSeqsSize = 1;
4855*a28cd43dSSascha Wildner }
4856*a28cd43dSSascha Wildner
4857*a28cd43dSSascha Wildner if (compressedSeqsSize == 0) {
4858*a28cd43dSSascha Wildner /* ZSTD_noCompressBlock writes the block header as well */
4859*a28cd43dSSascha Wildner cBlockSize = ZSTD_noCompressBlock(op, dstCapacity, ip, blockSize, lastBlock);
4860*a28cd43dSSascha Wildner FORWARD_IF_ERROR(cBlockSize, "Nocompress block failed");
4861*a28cd43dSSascha Wildner DEBUGLOG(4, "Writing out nocompress block, size: %zu", cBlockSize);
4862*a28cd43dSSascha Wildner } else if (compressedSeqsSize == 1) {
4863*a28cd43dSSascha Wildner cBlockSize = ZSTD_rleCompressBlock(op, dstCapacity, *ip, blockSize, lastBlock);
4864*a28cd43dSSascha Wildner FORWARD_IF_ERROR(cBlockSize, "RLE compress block failed");
4865*a28cd43dSSascha Wildner DEBUGLOG(4, "Writing out RLE block, size: %zu", cBlockSize);
4866*a28cd43dSSascha Wildner } else {
4867*a28cd43dSSascha Wildner U32 cBlockHeader;
4868*a28cd43dSSascha Wildner /* Error checking and repcodes update */
4869*a28cd43dSSascha Wildner ZSTD_confirmRepcodesAndEntropyTables(cctx);
4870*a28cd43dSSascha Wildner if (cctx->blockState.prevCBlock->entropy.fse.offcode_repeatMode == FSE_repeat_valid)
4871*a28cd43dSSascha Wildner cctx->blockState.prevCBlock->entropy.fse.offcode_repeatMode = FSE_repeat_check;
4872*a28cd43dSSascha Wildner
4873*a28cd43dSSascha Wildner /* Write block header into beginning of block*/
4874*a28cd43dSSascha Wildner cBlockHeader = lastBlock + (((U32)bt_compressed)<<1) + (U32)(compressedSeqsSize << 3);
4875*a28cd43dSSascha Wildner MEM_writeLE24(op, cBlockHeader);
4876*a28cd43dSSascha Wildner cBlockSize = ZSTD_blockHeaderSize + compressedSeqsSize;
4877*a28cd43dSSascha Wildner DEBUGLOG(4, "Writing out compressed block, size: %zu", cBlockSize);
4878*a28cd43dSSascha Wildner }
4879*a28cd43dSSascha Wildner
4880*a28cd43dSSascha Wildner cSize += cBlockSize;
4881*a28cd43dSSascha Wildner DEBUGLOG(4, "cSize running total: %zu", cSize);
4882*a28cd43dSSascha Wildner
4883*a28cd43dSSascha Wildner if (lastBlock) {
4884*a28cd43dSSascha Wildner break;
4885*a28cd43dSSascha Wildner } else {
4886*a28cd43dSSascha Wildner ip += blockSize;
4887*a28cd43dSSascha Wildner op += cBlockSize;
4888*a28cd43dSSascha Wildner remaining -= blockSize;
4889*a28cd43dSSascha Wildner dstCapacity -= cBlockSize;
4890*a28cd43dSSascha Wildner cctx->isFirstBlock = 0;
4891*a28cd43dSSascha Wildner }
4892*a28cd43dSSascha Wildner }
4893*a28cd43dSSascha Wildner
4894*a28cd43dSSascha Wildner return cSize;
4895*a28cd43dSSascha Wildner }
4896*a28cd43dSSascha Wildner
/*! ZSTD_compressSequences() :
 *  Produces a frame from `src` and the caller-provided sequences `inSeqs`:
 *  initializes the cctx the same way ZSTD_compressStream2() does (ZSTD_e_end, srcSize),
 *  writes the frame header, then all blocks, then the checksum when
 *  appliedParams.fParams.checksumFlag is set.
 * @return : total number of bytes written into `dst`, or a ZSTD error code
 *           (initialization failure, frame header failure, block compression failure,
 *            or dstSize_tooSmall when the checksum does not fit). */
size_t ZSTD_compressSequences(ZSTD_CCtx* const cctx, void* dst, size_t dstCapacity,
                              const ZSTD_Sequence* inSeqs, size_t inSeqsSize,
                              const void* src, size_t srcSize) {
    BYTE* op = (BYTE*)dst;
    size_t cSize = 0;
    size_t compressedBlocksSize = 0;
    size_t frameHeaderSize = 0;

    /* Transparent initialization stage, same as compressStream2() */
    DEBUGLOG(3, "ZSTD_compressSequences()");
    assert(cctx != NULL);
    FORWARD_IF_ERROR(ZSTD_CCtx_init_compressStream2(cctx, ZSTD_e_end, srcSize), "CCtx initialization failed");
    /* Begin writing output, starting with frame header */
    frameHeaderSize = ZSTD_writeFrameHeader(op, dstCapacity, &cctx->appliedParams, srcSize, cctx->dictID);
    /* An error code must not be mistaken for a byte count: it would corrupt op, dstCapacity and cSize */
    FORWARD_IF_ERROR(frameHeaderSize, "ZSTD_writeFrameHeader failed");
    op += frameHeaderSize;
    dstCapacity -= frameHeaderSize;
    cSize += frameHeaderSize;
    if (cctx->appliedParams.fParams.checksumFlag && srcSize) {
        XXH64_update(&cctx->xxhState, src, srcSize);
    }
    /* cSize includes block header size and compressed sequences size */
    compressedBlocksSize = ZSTD_compressSequences_internal(cctx,
                                                           op, dstCapacity,
                                                           inSeqs, inSeqsSize,
                                                           src, srcSize);
    FORWARD_IF_ERROR(compressedBlocksSize, "Compressing blocks failed!");
    cSize += compressedBlocksSize;
    dstCapacity -= compressedBlocksSize;

    if (cctx->appliedParams.fParams.checksumFlag) {
        /* Only the low 32 bits of the XXH64 digest are stored */
        U32 const checksum = (U32) XXH64_digest(&cctx->xxhState);
        RETURN_ERROR_IF(dstCapacity<4, dstSize_tooSmall, "no room for checksum");
        DEBUGLOG(4, "Write checksum : %08X", (unsigned)checksum);
        MEM_writeLE32((char*)dst + cSize, checksum);
        cSize += 4;
    }

    DEBUGLOG(3, "Final compressed size: %zu", cSize);
    return cSize;
}
4937*a28cd43dSSascha Wildner
4938*a28cd43dSSascha Wildner /*====== Finalize ======*/
4939*a28cd43dSSascha Wildner
4940*a28cd43dSSascha Wildner /*! ZSTD_flushStream() :
4941*a28cd43dSSascha Wildner * @return : amount of data remaining to flush */
ZSTD_flushStream(ZSTD_CStream * zcs,ZSTD_outBuffer * output)4942*a28cd43dSSascha Wildner size_t ZSTD_flushStream(ZSTD_CStream* zcs, ZSTD_outBuffer* output)
4943*a28cd43dSSascha Wildner {
4944*a28cd43dSSascha Wildner ZSTD_inBuffer input = { NULL, 0, 0 };
4945*a28cd43dSSascha Wildner return ZSTD_compressStream2(zcs, output, &input, ZSTD_e_flush);
4946*a28cd43dSSascha Wildner }
4947*a28cd43dSSascha Wildner
4948*a28cd43dSSascha Wildner
/*! ZSTD_endStream() :
 *  Invokes ZSTD_compressStream2() with an empty input and the ZSTD_e_end directive.
 * @return : an estimate of the bytes still to be flushed, or an error code.
 *           With nbWorkers > 0 the value from ZSTD_compressStream2() is returned as is;
 *           otherwise, while the frame is not ended yet, the size of the last block header
 *           and of the checksum (if enabled) are added on top. */
size_t ZSTD_endStream(ZSTD_CStream* zcs, ZSTD_outBuffer* output)
{
    ZSTD_inBuffer emptyInput = { NULL, 0, 0 };
    size_t const remainingToFlush = ZSTD_compressStream2(zcs, output, &emptyInput, ZSTD_e_end);
    size_t toFlush;

    FORWARD_IF_ERROR( remainingToFlush , "ZSTD_compressStream2 failed");

    /* multi-thread mode : minimal estimation */
    if (zcs->appliedParams.nbWorkers > 0) {
        return remainingToFlush;
    }

    /* single thread mode : attempt to calculate remaining to flush more precisely */
    toFlush = remainingToFlush;
    if (!zcs->frameEnded) {
        toFlush += ZSTD_BLOCKHEADERSIZE;                                     /* last block header */
        toFlush += (size_t)(zcs->appliedParams.fParams.checksumFlag * 4);    /* optional checksum */
    }
    DEBUGLOG(4, "ZSTD_endStream : remaining to flush : %u", (unsigned)toFlush);
    return toFlush;
}
4963*a28cd43dSSascha Wildner
4964*a28cd43dSSascha Wildner
4965*a28cd43dSSascha Wildner /*-===== Pre-defined compression levels =====-*/
4966*a28cd43dSSascha Wildner
#define ZSTD_MAX_CLEVEL     22

/* ZSTD_maxCLevel() :
 * @return : the highest compression level, ZSTD_MAX_CLEVEL */
int ZSTD_maxCLevel(void)
{
    return ZSTD_MAX_CLEVEL;
}
ZSTD_minCLevel(void)4969*a28cd43dSSascha Wildner int ZSTD_minCLevel(void) { return (int)-ZSTD_TARGETLENGTH_MAX; }
4970*a28cd43dSSascha Wildner
/* ZSTD_defaultCParameters :
 * Pre-defined compression parameters, looked up by ZSTD_getCParams_internal()
 * as ZSTD_defaultCParameters[tableID][row].
 *  - tableID = (rSize <= 256 KB) + (rSize <= 128 KB) + (rSize <= 16 KB),
 *    so table 0 serves the largest inputs and table 3 the smallest ones.
 *  - row is the compression level (1..ZSTD_MAX_CLEVEL); row 0 is the base entry
 *    used for negative levels, whose targetLength is overridden by the caller.
 * Column legend : W, C, H, S, L, TL, strat
 *  - presumably the ZSTD_compressionParameters fields in declaration order
 *    (windowLog, chainLog, hashLog, searchLog, minMatch, targetLength, strategy)
 *    -- TODO confirm against zstd.h */
4971*a28cd43dSSascha Wildner static const ZSTD_compressionParameters ZSTD_defaultCParameters[4][ZSTD_MAX_CLEVEL+1] = {
4972*a28cd43dSSascha Wildner { /* "default" - for any srcSize > 256 KB */
4973*a28cd43dSSascha Wildner /* W, C, H, S, L, TL, strat */
4974*a28cd43dSSascha Wildner { 19, 12, 13, 1, 6, 1, ZSTD_fast }, /* base for negative levels */
4975*a28cd43dSSascha Wildner { 19, 13, 14, 1, 7, 0, ZSTD_fast }, /* level 1 */
4976*a28cd43dSSascha Wildner { 20, 15, 16, 1, 6, 0, ZSTD_fast }, /* level 2 */
4977*a28cd43dSSascha Wildner { 21, 16, 17, 1, 5, 0, ZSTD_dfast }, /* level 3 */
4978*a28cd43dSSascha Wildner { 21, 18, 18, 1, 5, 0, ZSTD_dfast }, /* level 4 */
4979*a28cd43dSSascha Wildner { 21, 18, 19, 2, 5, 2, ZSTD_greedy }, /* level 5 */
4980*a28cd43dSSascha Wildner { 21, 19, 19, 3, 5, 4, ZSTD_greedy }, /* level 6 */
4981*a28cd43dSSascha Wildner { 21, 19, 19, 3, 5, 8, ZSTD_lazy }, /* level 7 */
4982*a28cd43dSSascha Wildner { 21, 19, 19, 3, 5, 16, ZSTD_lazy2 }, /* level 8 */
4983*a28cd43dSSascha Wildner { 21, 19, 20, 4, 5, 16, ZSTD_lazy2 }, /* level 9 */
4984*a28cd43dSSascha Wildner { 22, 20, 21, 4, 5, 16, ZSTD_lazy2 }, /* level 10 */
4985*a28cd43dSSascha Wildner { 22, 21, 22, 4, 5, 16, ZSTD_lazy2 }, /* level 11 */
4986*a28cd43dSSascha Wildner { 22, 21, 22, 5, 5, 16, ZSTD_lazy2 }, /* level 12 */
4987*a28cd43dSSascha Wildner { 22, 21, 22, 5, 5, 32, ZSTD_btlazy2 }, /* level 13 */
4988*a28cd43dSSascha Wildner { 22, 22, 23, 5, 5, 32, ZSTD_btlazy2 }, /* level 14 */
4989*a28cd43dSSascha Wildner { 22, 23, 23, 6, 5, 32, ZSTD_btlazy2 }, /* level 15 */
4990*a28cd43dSSascha Wildner { 22, 22, 22, 5, 5, 48, ZSTD_btopt }, /* level 16 */
4991*a28cd43dSSascha Wildner { 23, 23, 22, 5, 4, 64, ZSTD_btopt }, /* level 17 */
4992*a28cd43dSSascha Wildner { 23, 23, 22, 6, 3, 64, ZSTD_btultra }, /* level 18 */
4993*a28cd43dSSascha Wildner { 23, 24, 22, 7, 3,256, ZSTD_btultra2}, /* level 19 */
4994*a28cd43dSSascha Wildner { 25, 25, 23, 7, 3,256, ZSTD_btultra2}, /* level 20 */
4995*a28cd43dSSascha Wildner { 26, 26, 24, 7, 3,512, ZSTD_btultra2}, /* level 21 */
4996*a28cd43dSSascha Wildner { 27, 27, 25, 9, 3,999, ZSTD_btultra2}, /* level 22 */
4997*a28cd43dSSascha Wildner },
4998*a28cd43dSSascha Wildner { /* for srcSize <= 256 KB */
4999*a28cd43dSSascha Wildner /* W, C, H, S, L, TL, strat */
5000*a28cd43dSSascha Wildner { 18, 12, 13, 1, 5, 1, ZSTD_fast }, /* base for negative levels */
5001*a28cd43dSSascha Wildner { 18, 13, 14, 1, 6, 0, ZSTD_fast }, /* level 1 */
5002*a28cd43dSSascha Wildner { 18, 14, 14, 1, 5, 0, ZSTD_dfast }, /* level 2 */
5003*a28cd43dSSascha Wildner { 18, 16, 16, 1, 4, 0, ZSTD_dfast }, /* level 3 */
5004*a28cd43dSSascha Wildner { 18, 16, 17, 2, 5, 2, ZSTD_greedy }, /* level 4.*/
5005*a28cd43dSSascha Wildner { 18, 18, 18, 3, 5, 2, ZSTD_greedy }, /* level 5.*/
5006*a28cd43dSSascha Wildner { 18, 18, 19, 3, 5, 4, ZSTD_lazy }, /* level 6.*/
5007*a28cd43dSSascha Wildner { 18, 18, 19, 4, 4, 4, ZSTD_lazy }, /* level 7 */
5008*a28cd43dSSascha Wildner { 18, 18, 19, 4, 4, 8, ZSTD_lazy2 }, /* level 8 */
5009*a28cd43dSSascha Wildner { 18, 18, 19, 5, 4, 8, ZSTD_lazy2 }, /* level 9 */
5010*a28cd43dSSascha Wildner { 18, 18, 19, 6, 4, 8, ZSTD_lazy2 }, /* level 10 */
5011*a28cd43dSSascha Wildner { 18, 18, 19, 5, 4, 12, ZSTD_btlazy2 }, /* level 11.*/
5012*a28cd43dSSascha Wildner { 18, 19, 19, 7, 4, 12, ZSTD_btlazy2 }, /* level 12.*/
5013*a28cd43dSSascha Wildner { 18, 18, 19, 4, 4, 16, ZSTD_btopt }, /* level 13 */
5014*a28cd43dSSascha Wildner { 18, 18, 19, 4, 3, 32, ZSTD_btopt }, /* level 14.*/
5015*a28cd43dSSascha Wildner { 18, 18, 19, 6, 3,128, ZSTD_btopt }, /* level 15.*/
5016*a28cd43dSSascha Wildner { 18, 19, 19, 6, 3,128, ZSTD_btultra }, /* level 16.*/
5017*a28cd43dSSascha Wildner { 18, 19, 19, 8, 3,256, ZSTD_btultra }, /* level 17.*/
5018*a28cd43dSSascha Wildner { 18, 19, 19, 6, 3,128, ZSTD_btultra2}, /* level 18.*/
5019*a28cd43dSSascha Wildner { 18, 19, 19, 8, 3,256, ZSTD_btultra2}, /* level 19.*/
5020*a28cd43dSSascha Wildner { 18, 19, 19, 10, 3,512, ZSTD_btultra2}, /* level 20.*/
5021*a28cd43dSSascha Wildner { 18, 19, 19, 12, 3,512, ZSTD_btultra2}, /* level 21.*/
5022*a28cd43dSSascha Wildner { 18, 19, 19, 13, 3,999, ZSTD_btultra2}, /* level 22.*/
5023*a28cd43dSSascha Wildner },
5024*a28cd43dSSascha Wildner { /* for srcSize <= 128 KB */
5025*a28cd43dSSascha Wildner /* W, C, H, S, L, TL, strat */
5026*a28cd43dSSascha Wildner { 17, 12, 12, 1, 5, 1, ZSTD_fast }, /* base for negative levels */
5027*a28cd43dSSascha Wildner { 17, 12, 13, 1, 6, 0, ZSTD_fast }, /* level 1 */
5028*a28cd43dSSascha Wildner { 17, 13, 15, 1, 5, 0, ZSTD_fast }, /* level 2 */
5029*a28cd43dSSascha Wildner { 17, 15, 16, 2, 5, 0, ZSTD_dfast }, /* level 3 */
5030*a28cd43dSSascha Wildner { 17, 17, 17, 2, 4, 0, ZSTD_dfast }, /* level 4 */
5031*a28cd43dSSascha Wildner { 17, 16, 17, 3, 4, 2, ZSTD_greedy }, /* level 5 */
5032*a28cd43dSSascha Wildner { 17, 17, 17, 3, 4, 4, ZSTD_lazy }, /* level 6 */
5033*a28cd43dSSascha Wildner { 17, 17, 17, 3, 4, 8, ZSTD_lazy2 }, /* level 7 */
5034*a28cd43dSSascha Wildner { 17, 17, 17, 4, 4, 8, ZSTD_lazy2 }, /* level 8 */
5035*a28cd43dSSascha Wildner { 17, 17, 17, 5, 4, 8, ZSTD_lazy2 }, /* level 9 */
5036*a28cd43dSSascha Wildner { 17, 17, 17, 6, 4, 8, ZSTD_lazy2 }, /* level 10 */
5037*a28cd43dSSascha Wildner { 17, 17, 17, 5, 4, 8, ZSTD_btlazy2 }, /* level 11 */
5038*a28cd43dSSascha Wildner { 17, 18, 17, 7, 4, 12, ZSTD_btlazy2 }, /* level 12 */
5039*a28cd43dSSascha Wildner { 17, 18, 17, 3, 4, 12, ZSTD_btopt }, /* level 13.*/
5040*a28cd43dSSascha Wildner { 17, 18, 17, 4, 3, 32, ZSTD_btopt }, /* level 14.*/
5041*a28cd43dSSascha Wildner { 17, 18, 17, 6, 3,256, ZSTD_btopt }, /* level 15.*/
5042*a28cd43dSSascha Wildner { 17, 18, 17, 6, 3,128, ZSTD_btultra }, /* level 16.*/
5043*a28cd43dSSascha Wildner { 17, 18, 17, 8, 3,256, ZSTD_btultra }, /* level 17.*/
5044*a28cd43dSSascha Wildner { 17, 18, 17, 10, 3,512, ZSTD_btultra }, /* level 18.*/
5045*a28cd43dSSascha Wildner { 17, 18, 17, 5, 3,256, ZSTD_btultra2}, /* level 19.*/
5046*a28cd43dSSascha Wildner { 17, 18, 17, 7, 3,512, ZSTD_btultra2}, /* level 20.*/
5047*a28cd43dSSascha Wildner { 17, 18, 17, 9, 3,512, ZSTD_btultra2}, /* level 21.*/
5048*a28cd43dSSascha Wildner { 17, 18, 17, 11, 3,999, ZSTD_btultra2}, /* level 22.*/
5049*a28cd43dSSascha Wildner },
5050*a28cd43dSSascha Wildner { /* for srcSize <= 16 KB */
5051*a28cd43dSSascha Wildner /* W, C, H, S, L, TL, strat */
5052*a28cd43dSSascha Wildner { 14, 12, 13, 1, 5, 1, ZSTD_fast }, /* base for negative levels */
5053*a28cd43dSSascha Wildner { 14, 14, 15, 1, 5, 0, ZSTD_fast }, /* level 1 */
5054*a28cd43dSSascha Wildner { 14, 14, 15, 1, 4, 0, ZSTD_fast }, /* level 2 */
5055*a28cd43dSSascha Wildner { 14, 14, 15, 2, 4, 0, ZSTD_dfast }, /* level 3 */
5056*a28cd43dSSascha Wildner { 14, 14, 14, 4, 4, 2, ZSTD_greedy }, /* level 4 */
5057*a28cd43dSSascha Wildner { 14, 14, 14, 3, 4, 4, ZSTD_lazy }, /* level 5.*/
5058*a28cd43dSSascha Wildner { 14, 14, 14, 4, 4, 8, ZSTD_lazy2 }, /* level 6 */
5059*a28cd43dSSascha Wildner { 14, 14, 14, 6, 4, 8, ZSTD_lazy2 }, /* level 7 */
5060*a28cd43dSSascha Wildner { 14, 14, 14, 8, 4, 8, ZSTD_lazy2 }, /* level 8.*/
5061*a28cd43dSSascha Wildner { 14, 15, 14, 5, 4, 8, ZSTD_btlazy2 }, /* level 9.*/
5062*a28cd43dSSascha Wildner { 14, 15, 14, 9, 4, 8, ZSTD_btlazy2 }, /* level 10.*/
5063*a28cd43dSSascha Wildner { 14, 15, 14, 3, 4, 12, ZSTD_btopt }, /* level 11.*/
5064*a28cd43dSSascha Wildner { 14, 15, 14, 4, 3, 24, ZSTD_btopt }, /* level 12.*/
5065*a28cd43dSSascha Wildner { 14, 15, 14, 5, 3, 32, ZSTD_btultra }, /* level 13.*/
5066*a28cd43dSSascha Wildner { 14, 15, 15, 6, 3, 64, ZSTD_btultra }, /* level 14.*/
5067*a28cd43dSSascha Wildner { 14, 15, 15, 7, 3,256, ZSTD_btultra }, /* level 15.*/
5068*a28cd43dSSascha Wildner { 14, 15, 15, 5, 3, 48, ZSTD_btultra2}, /* level 16.*/
5069*a28cd43dSSascha Wildner { 14, 15, 15, 6, 3,128, ZSTD_btultra2}, /* level 17.*/
5070*a28cd43dSSascha Wildner { 14, 15, 15, 7, 3,256, ZSTD_btultra2}, /* level 18.*/
5071*a28cd43dSSascha Wildner { 14, 15, 15, 8, 3,256, ZSTD_btultra2}, /* level 19.*/
5072*a28cd43dSSascha Wildner { 14, 15, 15, 8, 3,512, ZSTD_btultra2}, /* level 20.*/
5073*a28cd43dSSascha Wildner { 14, 15, 15, 9, 3,512, ZSTD_btultra2}, /* level 21.*/
5074*a28cd43dSSascha Wildner { 14, 15, 15, 10, 3,999, ZSTD_btultra2}, /* level 22.*/
5075*a28cd43dSSascha Wildner },
5076*a28cd43dSSascha Wildner };
5077*a28cd43dSSascha Wildner
ZSTD_dedicatedDictSearch_getCParams(int const compressionLevel,size_t const dictSize)5078*a28cd43dSSascha Wildner static ZSTD_compressionParameters ZSTD_dedicatedDictSearch_getCParams(int const compressionLevel, size_t const dictSize)
5079*a28cd43dSSascha Wildner {
5080*a28cd43dSSascha Wildner ZSTD_compressionParameters cParams = ZSTD_getCParams_internal(compressionLevel, 0, dictSize, ZSTD_cpm_createCDict);
5081*a28cd43dSSascha Wildner switch (cParams.strategy) {
5082*a28cd43dSSascha Wildner case ZSTD_fast:
5083*a28cd43dSSascha Wildner case ZSTD_dfast:
5084*a28cd43dSSascha Wildner break;
5085*a28cd43dSSascha Wildner case ZSTD_greedy:
5086*a28cd43dSSascha Wildner case ZSTD_lazy:
5087*a28cd43dSSascha Wildner case ZSTD_lazy2:
5088*a28cd43dSSascha Wildner cParams.hashLog += ZSTD_LAZY_DDSS_BUCKET_LOG;
5089*a28cd43dSSascha Wildner break;
5090*a28cd43dSSascha Wildner case ZSTD_btlazy2:
5091*a28cd43dSSascha Wildner case ZSTD_btopt:
5092*a28cd43dSSascha Wildner case ZSTD_btultra:
5093*a28cd43dSSascha Wildner case ZSTD_btultra2:
5094*a28cd43dSSascha Wildner break;
5095*a28cd43dSSascha Wildner }
5096*a28cd43dSSascha Wildner return cParams;
5097*a28cd43dSSascha Wildner }
5098*a28cd43dSSascha Wildner
/* ZSTD_dedicatedDictSearch_isSupported() :
 * @return : 1 when cParams->strategy lies within [ZSTD_greedy, ZSTD_lazy2], 0 otherwise */
static int ZSTD_dedicatedDictSearch_isSupported(
        ZSTD_compressionParameters const* cParams)
{
    if (cParams->strategy < ZSTD_greedy) return 0;
    if (cParams->strategy > ZSTD_lazy2) return 0;
    return 1;
}
5104*a28cd43dSSascha Wildner
5105*a28cd43dSSascha Wildner /**
5106*a28cd43dSSascha Wildner * Reverses the adjustment applied to cparams when enabling dedicated dict
5107*a28cd43dSSascha Wildner * search. This is used to recover the params set to be used in the working
5108*a28cd43dSSascha Wildner * context. (Otherwise, those tables would also grow.)
5109*a28cd43dSSascha Wildner */
ZSTD_dedicatedDictSearch_revertCParams(ZSTD_compressionParameters * cParams)5110*a28cd43dSSascha Wildner static void ZSTD_dedicatedDictSearch_revertCParams(
5111*a28cd43dSSascha Wildner ZSTD_compressionParameters* cParams) {
5112*a28cd43dSSascha Wildner switch (cParams->strategy) {
5113*a28cd43dSSascha Wildner case ZSTD_fast:
5114*a28cd43dSSascha Wildner case ZSTD_dfast:
5115*a28cd43dSSascha Wildner break;
5116*a28cd43dSSascha Wildner case ZSTD_greedy:
5117*a28cd43dSSascha Wildner case ZSTD_lazy:
5118*a28cd43dSSascha Wildner case ZSTD_lazy2:
5119*a28cd43dSSascha Wildner cParams->hashLog -= ZSTD_LAZY_DDSS_BUCKET_LOG;
5120*a28cd43dSSascha Wildner break;
5121*a28cd43dSSascha Wildner case ZSTD_btlazy2:
5122*a28cd43dSSascha Wildner case ZSTD_btopt:
5123*a28cd43dSSascha Wildner case ZSTD_btultra:
5124*a28cd43dSSascha Wildner case ZSTD_btultra2:
5125*a28cd43dSSascha Wildner break;
5126*a28cd43dSSascha Wildner }
5127*a28cd43dSSascha Wildner }
5128*a28cd43dSSascha Wildner
/* ZSTD_getCParamRowSize() :
 * Computes the size used to pick a table in ZSTD_defaultCParameters.
 * In ZSTD_cpm_attachDict mode the dictionary size is ignored (treated as 0).
 * @return : ZSTD_CONTENTSIZE_UNKNOWN when the source size is unknown and no dictionary
 *           size counts; otherwise srcSizeHint + dictSize, plus 500 when the source size
 *           is unknown but a dictionary size is present. */
static U64 ZSTD_getCParamRowSize(U64 srcSizeHint, size_t dictSize, ZSTD_cParamMode_e mode)
{
    if (mode == ZSTD_cpm_attachDict) {
        dictSize = 0;
    } else {
        /* the remaining known modes keep dictSize as provided */
        assert(mode == ZSTD_cpm_unknown
            || mode == ZSTD_cpm_noAttachDict
            || mode == ZSTD_cpm_createCDict);
    }

    if (srcSizeHint != ZSTD_CONTENTSIZE_UNKNOWN) {
        return srcSizeHint + dictSize;
    }
    if (dictSize == 0) {
        return ZSTD_CONTENTSIZE_UNKNOWN;
    }
    /* NOTE(review): srcSizeHint is ZSTD_CONTENTSIZE_UNKNOWN here; assuming that constant is
     * the all-ones value, this unsigned sum wraps around to dictSize + 499 -- confirm */
    return srcSizeHint + dictSize + (size_t)500;
}
5148*a28cd43dSSascha Wildner
5149*a28cd43dSSascha Wildner /*! ZSTD_getCParams_internal() :
5150*a28cd43dSSascha Wildner * @return ZSTD_compressionParameters structure for a selected compression level, srcSize and dictSize.
5151*a28cd43dSSascha Wildner * Note: srcSizeHint 0 means 0, use ZSTD_CONTENTSIZE_UNKNOWN for unknown.
5152*a28cd43dSSascha Wildner * Use dictSize == 0 for unknown or unused.
5153*a28cd43dSSascha Wildner * Note: `mode` controls how we treat the `dictSize`. See docs for `ZSTD_cParamMode_e`. */
ZSTD_getCParams_internal(int compressionLevel,unsigned long long srcSizeHint,size_t dictSize,ZSTD_cParamMode_e mode)5154*a28cd43dSSascha Wildner static ZSTD_compressionParameters ZSTD_getCParams_internal(int compressionLevel, unsigned long long srcSizeHint, size_t dictSize, ZSTD_cParamMode_e mode)
5155*a28cd43dSSascha Wildner {
5156*a28cd43dSSascha Wildner U64 const rSize = ZSTD_getCParamRowSize(srcSizeHint, dictSize, mode);
5157*a28cd43dSSascha Wildner U32 const tableID = (rSize <= 256 KB) + (rSize <= 128 KB) + (rSize <= 16 KB);
5158*a28cd43dSSascha Wildner int row;
5159*a28cd43dSSascha Wildner DEBUGLOG(5, "ZSTD_getCParams_internal (cLevel=%i)", compressionLevel);
5160*a28cd43dSSascha Wildner
5161*a28cd43dSSascha Wildner /* row */
5162*a28cd43dSSascha Wildner if (compressionLevel == 0) row = ZSTD_CLEVEL_DEFAULT; /* 0 == default */
5163*a28cd43dSSascha Wildner else if (compressionLevel < 0) row = 0; /* entry 0 is baseline for fast mode */
5164*a28cd43dSSascha Wildner else if (compressionLevel > ZSTD_MAX_CLEVEL) row = ZSTD_MAX_CLEVEL;
5165*a28cd43dSSascha Wildner else row = compressionLevel;
5166*a28cd43dSSascha Wildner
5167*a28cd43dSSascha Wildner { ZSTD_compressionParameters cp = ZSTD_defaultCParameters[tableID][row];
5168*a28cd43dSSascha Wildner /* acceleration factor */
5169*a28cd43dSSascha Wildner if (compressionLevel < 0) {
5170*a28cd43dSSascha Wildner int const clampedCompressionLevel = MAX(ZSTD_minCLevel(), compressionLevel);
5171*a28cd43dSSascha Wildner cp.targetLength = (unsigned)(-clampedCompressionLevel);
5172*a28cd43dSSascha Wildner }
5173*a28cd43dSSascha Wildner /* refine parameters based on srcSize & dictSize */
5174*a28cd43dSSascha Wildner return ZSTD_adjustCParams_internal(cp, srcSizeHint, dictSize, mode);
5175*a28cd43dSSascha Wildner }
5176*a28cd43dSSascha Wildner }
5177*a28cd43dSSascha Wildner
5178*a28cd43dSSascha Wildner /*! ZSTD_getCParams() :
5179*a28cd43dSSascha Wildner * @return ZSTD_compressionParameters structure for a selected compression level, srcSize and dictSize.
5180*a28cd43dSSascha Wildner * Size values are optional, provide 0 if not known or unused */
ZSTD_getCParams(int compressionLevel,unsigned long long srcSizeHint,size_t dictSize)5181*a28cd43dSSascha Wildner ZSTD_compressionParameters ZSTD_getCParams(int compressionLevel, unsigned long long srcSizeHint, size_t dictSize)
5182*a28cd43dSSascha Wildner {
5183*a28cd43dSSascha Wildner if (srcSizeHint == 0) srcSizeHint = ZSTD_CONTENTSIZE_UNKNOWN;
5184*a28cd43dSSascha Wildner return ZSTD_getCParams_internal(compressionLevel, srcSizeHint, dictSize, ZSTD_cpm_unknown);
5185*a28cd43dSSascha Wildner }
5186*a28cd43dSSascha Wildner
5187*a28cd43dSSascha Wildner /*! ZSTD_getParams() :
5188*a28cd43dSSascha Wildner * same idea as ZSTD_getCParams()
5189*a28cd43dSSascha Wildner * @return a `ZSTD_parameters` structure (instead of `ZSTD_compressionParameters`).
5190*a28cd43dSSascha Wildner * Fields of `ZSTD_frameParameters` are set to default values */
ZSTD_getParams_internal(int compressionLevel,unsigned long long srcSizeHint,size_t dictSize,ZSTD_cParamMode_e mode)5191*a28cd43dSSascha Wildner static ZSTD_parameters ZSTD_getParams_internal(int compressionLevel, unsigned long long srcSizeHint, size_t dictSize, ZSTD_cParamMode_e mode) {
5192*a28cd43dSSascha Wildner ZSTD_parameters params;
5193*a28cd43dSSascha Wildner ZSTD_compressionParameters const cParams = ZSTD_getCParams_internal(compressionLevel, srcSizeHint, dictSize, mode);
5194*a28cd43dSSascha Wildner DEBUGLOG(5, "ZSTD_getParams (cLevel=%i)", compressionLevel);
5195*a28cd43dSSascha Wildner ZSTD_memset(¶ms, 0, sizeof(params));
5196*a28cd43dSSascha Wildner params.cParams = cParams;
5197*a28cd43dSSascha Wildner params.fParams.contentSizeFlag = 1;
5198*a28cd43dSSascha Wildner return params;
5199*a28cd43dSSascha Wildner }
5200*a28cd43dSSascha Wildner
5201*a28cd43dSSascha Wildner /*! ZSTD_getParams() :
5202*a28cd43dSSascha Wildner * same idea as ZSTD_getCParams()
5203*a28cd43dSSascha Wildner * @return a `ZSTD_parameters` structure (instead of `ZSTD_compressionParameters`).
5204*a28cd43dSSascha Wildner * Fields of `ZSTD_frameParameters` are set to default values */
ZSTD_getParams(int compressionLevel,unsigned long long srcSizeHint,size_t dictSize)5205*a28cd43dSSascha Wildner ZSTD_parameters ZSTD_getParams(int compressionLevel, unsigned long long srcSizeHint, size_t dictSize) {
5206*a28cd43dSSascha Wildner if (srcSizeHint == 0) srcSizeHint = ZSTD_CONTENTSIZE_UNKNOWN;
5207*a28cd43dSSascha Wildner return ZSTD_getParams_internal(compressionLevel, srcSizeHint, dictSize, ZSTD_cpm_unknown);
5208*a28cd43dSSascha Wildner }
5209