xref: /freebsd-src/sys/contrib/openzfs/module/zstd/lib/compress/zstd_compress.c (revision c03c5b1c80914ec656fbee84539355d1fad68bf9)
1*c03c5b1cSMartin Matuska /*
2*c03c5b1cSMartin Matuska  * Copyright (c) 2016-2020, Yann Collet, Facebook, Inc.
3*c03c5b1cSMartin Matuska  * All rights reserved.
4*c03c5b1cSMartin Matuska  *
5*c03c5b1cSMartin Matuska  * This source code is licensed under both the BSD-style license (found in the
6*c03c5b1cSMartin Matuska  * LICENSE file in the root directory of this source tree) and the GPLv2 (found
7*c03c5b1cSMartin Matuska  * in the COPYING file in the root directory of this source tree).
8*c03c5b1cSMartin Matuska  * You may select, at your option, one of the above-listed licenses.
9*c03c5b1cSMartin Matuska  */
10*c03c5b1cSMartin Matuska 
11*c03c5b1cSMartin Matuska /*-*************************************
12*c03c5b1cSMartin Matuska *  Dependencies
13*c03c5b1cSMartin Matuska ***************************************/
14*c03c5b1cSMartin Matuska #include <limits.h>         /* INT_MAX */
15*c03c5b1cSMartin Matuska #include <string.h>         /* memset */
16*c03c5b1cSMartin Matuska #include "../common/cpu.h"
17*c03c5b1cSMartin Matuska #include "../common/mem.h"
18*c03c5b1cSMartin Matuska #include "hist.h"           /* HIST_countFast_wksp */
19*c03c5b1cSMartin Matuska #define FSE_STATIC_LINKING_ONLY   /* FSE_encodeSymbol */
20*c03c5b1cSMartin Matuska #include "../common/fse.h"
21*c03c5b1cSMartin Matuska #define HUF_STATIC_LINKING_ONLY
22*c03c5b1cSMartin Matuska #include "../common/huf.h"
23*c03c5b1cSMartin Matuska #include "zstd_compress_internal.h"
24*c03c5b1cSMartin Matuska #include "zstd_compress_sequences.h"
25*c03c5b1cSMartin Matuska #include "zstd_compress_literals.h"
26*c03c5b1cSMartin Matuska #include "zstd_fast.h"
27*c03c5b1cSMartin Matuska #include "zstd_double_fast.h"
28*c03c5b1cSMartin Matuska #include "zstd_lazy.h"
29*c03c5b1cSMartin Matuska #include "zstd_opt.h"
30*c03c5b1cSMartin Matuska #include "zstd_ldm.h"
31*c03c5b1cSMartin Matuska #include "zstd_compress_superblock.h"
32*c03c5b1cSMartin Matuska 
33*c03c5b1cSMartin Matuska 
34*c03c5b1cSMartin Matuska /*-*************************************
35*c03c5b1cSMartin Matuska *  Helper functions
36*c03c5b1cSMartin Matuska ***************************************/
/* ZSTD_compressBound() :
 * Function form of the ZSTD_COMPRESSBOUND() macro, evaluated for `srcSize`.
 * Note : the returned value is only meaningful for the "normal" full-block
 * strategy. In streaming mode, frequent flushes produce many small blocks,
 * and the accumulated header overhead can make the compressed output larger
 * than the value returned here.
 */
size_t ZSTD_compressBound(size_t srcSize)
{
    size_t const bound = ZSTD_COMPRESSBOUND(srcSize);
    return bound;
}
47*c03c5b1cSMartin Matuska 
48*c03c5b1cSMartin Matuska 
49*c03c5b1cSMartin Matuska /*-*************************************
50*c03c5b1cSMartin Matuska *  Context memory management
51*c03c5b1cSMartin Matuska ***************************************/
52*c03c5b1cSMartin Matuska struct ZSTD_CDict_s {
53*c03c5b1cSMartin Matuska     const void* dictContent;
54*c03c5b1cSMartin Matuska     size_t dictContentSize;
55*c03c5b1cSMartin Matuska     U32* entropyWorkspace; /* entropy workspace of HUF_WORKSPACE_SIZE bytes */
56*c03c5b1cSMartin Matuska     ZSTD_cwksp workspace;
57*c03c5b1cSMartin Matuska     ZSTD_matchState_t matchState;
58*c03c5b1cSMartin Matuska     ZSTD_compressedBlockState_t cBlockState;
59*c03c5b1cSMartin Matuska     ZSTD_customMem customMem;
60*c03c5b1cSMartin Matuska     U32 dictID;
61*c03c5b1cSMartin Matuska     int compressionLevel; /* 0 indicates that advanced API was used to select CDict params */
62*c03c5b1cSMartin Matuska };  /* typedef'd to ZSTD_CDict within "zstd.h" */
63*c03c5b1cSMartin Matuska 
ZSTD_createCCtx(void)64*c03c5b1cSMartin Matuska ZSTD_CCtx* ZSTD_createCCtx(void)
65*c03c5b1cSMartin Matuska {
66*c03c5b1cSMartin Matuska     return ZSTD_createCCtx_advanced(ZSTD_defaultCMem);
67*c03c5b1cSMartin Matuska }
68*c03c5b1cSMartin Matuska 
/* ZSTD_initCCtx() :
 * Puts a freshly allocated context into its initial state :
 * zeroes the whole structure, records the memory manager, caches the
 * BMI2 cpuid result, then resets the parameters.
 * `cctx` must not be NULL. */
static void ZSTD_initCCtx(ZSTD_CCtx* cctx, ZSTD_customMem memManager)
{
    size_t resetResult;

    assert(cctx != NULL);
    memset(cctx, 0, sizeof(*cctx));
    cctx->customMem = memManager;
    cctx->bmi2 = ZSTD_cpuid_bmi2(ZSTD_cpuid());

    /* the reset is only checked through assert() */
    resetResult = ZSTD_CCtx_reset(cctx, ZSTD_reset_parameters);
    assert(!ZSTD_isError(resetResult));
    (void)resetResult;   /* silences the unused warning when assert() is compiled out */
}
80*c03c5b1cSMartin Matuska 
ZSTD_createCCtx_advanced(ZSTD_customMem customMem)81*c03c5b1cSMartin Matuska ZSTD_CCtx* ZSTD_createCCtx_advanced(ZSTD_customMem customMem)
82*c03c5b1cSMartin Matuska {
83*c03c5b1cSMartin Matuska     ZSTD_STATIC_ASSERT(zcss_init==0);
84*c03c5b1cSMartin Matuska     ZSTD_STATIC_ASSERT(ZSTD_CONTENTSIZE_UNKNOWN==(0ULL - 1));
85*c03c5b1cSMartin Matuska     if (!customMem.customAlloc ^ !customMem.customFree) return NULL;
86*c03c5b1cSMartin Matuska     {   ZSTD_CCtx* const cctx = (ZSTD_CCtx*)ZSTD_malloc(sizeof(ZSTD_CCtx), customMem);
87*c03c5b1cSMartin Matuska         if (!cctx) return NULL;
88*c03c5b1cSMartin Matuska         ZSTD_initCCtx(cctx, customMem);
89*c03c5b1cSMartin Matuska         return cctx;
90*c03c5b1cSMartin Matuska     }
91*c03c5b1cSMartin Matuska }
92*c03c5b1cSMartin Matuska 
ZSTD_initStaticCCtx(void * workspace,size_t workspaceSize)93*c03c5b1cSMartin Matuska ZSTD_CCtx* ZSTD_initStaticCCtx(void* workspace, size_t workspaceSize)
94*c03c5b1cSMartin Matuska {
95*c03c5b1cSMartin Matuska     ZSTD_cwksp ws;
96*c03c5b1cSMartin Matuska     ZSTD_CCtx* cctx;
97*c03c5b1cSMartin Matuska     if (workspaceSize <= sizeof(ZSTD_CCtx)) return NULL;  /* minimum size */
98*c03c5b1cSMartin Matuska     if ((size_t)workspace & 7) return NULL;  /* must be 8-aligned */
99*c03c5b1cSMartin Matuska     ZSTD_cwksp_init(&ws, workspace, workspaceSize);
100*c03c5b1cSMartin Matuska 
101*c03c5b1cSMartin Matuska     cctx = (ZSTD_CCtx*)ZSTD_cwksp_reserve_object(&ws, sizeof(ZSTD_CCtx));
102*c03c5b1cSMartin Matuska     if (cctx == NULL) return NULL;
103*c03c5b1cSMartin Matuska 
104*c03c5b1cSMartin Matuska     memset(cctx, 0, sizeof(ZSTD_CCtx));
105*c03c5b1cSMartin Matuska     ZSTD_cwksp_move(&cctx->workspace, &ws);
106*c03c5b1cSMartin Matuska     cctx->staticSize = workspaceSize;
107*c03c5b1cSMartin Matuska 
108*c03c5b1cSMartin Matuska     /* statically sized space. entropyWorkspace never moves (but prev/next block swap places) */
109*c03c5b1cSMartin Matuska     if (!ZSTD_cwksp_check_available(&cctx->workspace, HUF_WORKSPACE_SIZE + 2 * sizeof(ZSTD_compressedBlockState_t))) return NULL;
110*c03c5b1cSMartin Matuska     cctx->blockState.prevCBlock = (ZSTD_compressedBlockState_t*)ZSTD_cwksp_reserve_object(&cctx->workspace, sizeof(ZSTD_compressedBlockState_t));
111*c03c5b1cSMartin Matuska     cctx->blockState.nextCBlock = (ZSTD_compressedBlockState_t*)ZSTD_cwksp_reserve_object(&cctx->workspace, sizeof(ZSTD_compressedBlockState_t));
112*c03c5b1cSMartin Matuska     cctx->entropyWorkspace = (U32*)ZSTD_cwksp_reserve_object(&cctx->workspace, HUF_WORKSPACE_SIZE);
113*c03c5b1cSMartin Matuska     cctx->bmi2 = ZSTD_cpuid_bmi2(ZSTD_cpuid());
114*c03c5b1cSMartin Matuska     return cctx;
115*c03c5b1cSMartin Matuska }
116*c03c5b1cSMartin Matuska 
117*c03c5b1cSMartin Matuska /**
118*c03c5b1cSMartin Matuska  * Clears and frees all of the dictionaries in the CCtx.
119*c03c5b1cSMartin Matuska  */
ZSTD_clearAllDicts(ZSTD_CCtx * cctx)120*c03c5b1cSMartin Matuska static void ZSTD_clearAllDicts(ZSTD_CCtx* cctx)
121*c03c5b1cSMartin Matuska {
122*c03c5b1cSMartin Matuska     ZSTD_free(cctx->localDict.dictBuffer, cctx->customMem);
123*c03c5b1cSMartin Matuska     ZSTD_freeCDict(cctx->localDict.cdict);
124*c03c5b1cSMartin Matuska     memset(&cctx->localDict, 0, sizeof(cctx->localDict));
125*c03c5b1cSMartin Matuska     memset(&cctx->prefixDict, 0, sizeof(cctx->prefixDict));
126*c03c5b1cSMartin Matuska     cctx->cdict = NULL;
127*c03c5b1cSMartin Matuska }
128*c03c5b1cSMartin Matuska 
/* ZSTD_sizeof_localDict() :
 * @return : ZSTD_sizeof_CDict(dict.cdict), plus dict.dictSize when
 *           dict.dictBuffer is set. */
static size_t ZSTD_sizeof_localDict(ZSTD_localDict dict)
{
    size_t total = ZSTD_sizeof_CDict(dict.cdict);
    if (dict.dictBuffer != NULL) {
        total += dict.dictSize;
    }
    return total;
}
135*c03c5b1cSMartin Matuska 
/* ZSTD_freeCCtxContent() :
 * Releases what a CCtx references : its dictionaries, its multi-threading
 * context (ZSTD_MULTITHREAD builds only) and its workspace.
 * `cctx` must be non-NULL and must not be a static context (staticSize == 0). */
static void ZSTD_freeCCtxContent(ZSTD_CCtx* cctx)
{
    assert(cctx != NULL);
    assert(cctx->staticSize == 0);

    ZSTD_clearAllDicts(cctx);
#ifdef ZSTD_MULTITHREAD
    ZSTDMT_freeCCtx(cctx->mtctx);
    cctx->mtctx = NULL;
#endif
    ZSTD_cwksp_free(&cctx->workspace, cctx->customMem);
}
146*c03c5b1cSMartin Matuska 
/* ZSTD_freeCCtx() :
 * Frees a compression context and everything it references.
 * Accepts NULL (no-op).
 * @return : 0, or a memory_allocation error when `cctx` is a static context. */
size_t ZSTD_freeCCtx(ZSTD_CCtx* cctx)
{
    int ownedByWorkspace;

    if (cctx == NULL) return 0;   /* support free on NULL */
    RETURN_ERROR_IF(cctx->staticSize, memory_allocation,
                    "not compatible with static CCtx");

    /* ownership is queried before the content (including the workspace) is released */
    ownedByWorkspace = ZSTD_cwksp_owns_buffer(&cctx->workspace, cctx);
    ZSTD_freeCCtxContent(cctx);
    if (ownedByWorkspace) return 0;   /* the cctx itself is not freed separately in this case */

    ZSTD_free(cctx, cctx->customMem);
    return 0;
}
161*c03c5b1cSMartin Matuska 
162*c03c5b1cSMartin Matuska 
/* ZSTD_sizeof_mtctx() :
 * @return : ZSTDMT_sizeof_CCtx(cctx->mtctx) in ZSTD_MULTITHREAD builds,
 *           0 otherwise. */
static size_t ZSTD_sizeof_mtctx(const ZSTD_CCtx* cctx)
{
#ifndef ZSTD_MULTITHREAD
    (void)cctx;
    return 0;
#else
    return ZSTDMT_sizeof_CCtx(cctx->mtctx);
#endif
}
172*c03c5b1cSMartin Matuska 
173*c03c5b1cSMartin Matuska 
ZSTD_sizeof_CCtx(const ZSTD_CCtx * cctx)174*c03c5b1cSMartin Matuska size_t ZSTD_sizeof_CCtx(const ZSTD_CCtx* cctx)
175*c03c5b1cSMartin Matuska {
176*c03c5b1cSMartin Matuska     if (cctx==NULL) return 0;   /* support sizeof on NULL */
177*c03c5b1cSMartin Matuska     /* cctx may be in the workspace */
178*c03c5b1cSMartin Matuska     return (cctx->workspace.workspace == cctx ? 0 : sizeof(*cctx))
179*c03c5b1cSMartin Matuska            + ZSTD_cwksp_sizeof(&cctx->workspace)
180*c03c5b1cSMartin Matuska            + ZSTD_sizeof_localDict(cctx->localDict)
181*c03c5b1cSMartin Matuska            + ZSTD_sizeof_mtctx(cctx);
182*c03c5b1cSMartin Matuska }
183*c03c5b1cSMartin Matuska 
/* ZSTD_sizeof_CStream() :
 * A CStream and a CCtx are the same object, so this simply forwards to
 * ZSTD_sizeof_CCtx(). */
size_t ZSTD_sizeof_CStream(const ZSTD_CStream* zcs)
{
    size_t const total = ZSTD_sizeof_CCtx(zcs);
    return total;
}
188*c03c5b1cSMartin Matuska 
189*c03c5b1cSMartin Matuska /* private API call, for dictBuilder only */
ZSTD_getSeqStore(const ZSTD_CCtx * ctx)190*c03c5b1cSMartin Matuska const seqStore_t* ZSTD_getSeqStore(const ZSTD_CCtx* ctx) { return &(ctx->seqStore); }
191*c03c5b1cSMartin Matuska 
ZSTD_makeCCtxParamsFromCParams(ZSTD_compressionParameters cParams)192*c03c5b1cSMartin Matuska static ZSTD_CCtx_params ZSTD_makeCCtxParamsFromCParams(
193*c03c5b1cSMartin Matuska         ZSTD_compressionParameters cParams)
194*c03c5b1cSMartin Matuska {
195*c03c5b1cSMartin Matuska     ZSTD_CCtx_params cctxParams;
196*c03c5b1cSMartin Matuska     memset(&cctxParams, 0, sizeof(cctxParams));
197*c03c5b1cSMartin Matuska     cctxParams.cParams = cParams;
198*c03c5b1cSMartin Matuska     cctxParams.compressionLevel = ZSTD_CLEVEL_DEFAULT;  /* should not matter, as all cParams are presumed properly defined */
199*c03c5b1cSMartin Matuska     assert(!ZSTD_checkCParams(cParams));
200*c03c5b1cSMartin Matuska     cctxParams.fParams.contentSizeFlag = 1;
201*c03c5b1cSMartin Matuska     return cctxParams;
202*c03c5b1cSMartin Matuska }
203*c03c5b1cSMartin Matuska 
ZSTD_createCCtxParams_advanced(ZSTD_customMem customMem)204*c03c5b1cSMartin Matuska static ZSTD_CCtx_params* ZSTD_createCCtxParams_advanced(
205*c03c5b1cSMartin Matuska         ZSTD_customMem customMem)
206*c03c5b1cSMartin Matuska {
207*c03c5b1cSMartin Matuska     ZSTD_CCtx_params* params;
208*c03c5b1cSMartin Matuska     if (!customMem.customAlloc ^ !customMem.customFree) return NULL;
209*c03c5b1cSMartin Matuska     params = (ZSTD_CCtx_params*)ZSTD_calloc(
210*c03c5b1cSMartin Matuska             sizeof(ZSTD_CCtx_params), customMem);
211*c03c5b1cSMartin Matuska     if (!params) { return NULL; }
212*c03c5b1cSMartin Matuska     params->customMem = customMem;
213*c03c5b1cSMartin Matuska     params->compressionLevel = ZSTD_CLEVEL_DEFAULT;
214*c03c5b1cSMartin Matuska     params->fParams.contentSizeFlag = 1;
215*c03c5b1cSMartin Matuska     return params;
216*c03c5b1cSMartin Matuska }
217*c03c5b1cSMartin Matuska 
ZSTD_createCCtxParams(void)218*c03c5b1cSMartin Matuska ZSTD_CCtx_params* ZSTD_createCCtxParams(void)
219*c03c5b1cSMartin Matuska {
220*c03c5b1cSMartin Matuska     return ZSTD_createCCtxParams_advanced(ZSTD_defaultCMem);
221*c03c5b1cSMartin Matuska }
222*c03c5b1cSMartin Matuska 
/* ZSTD_freeCCtxParams() :
 * Frees `params` with the memory manager stored inside it.
 * Accepts NULL (no-op).
 * @return : always 0. */
size_t ZSTD_freeCCtxParams(ZSTD_CCtx_params* params)
{
    if (params != NULL) {
        ZSTD_free(params, params->customMem);
    }
    return 0;
}
229*c03c5b1cSMartin Matuska 
/* ZSTD_CCtxParams_reset() :
 * Re-initializes `params` with the default compression level.
 * @return : result of ZSTD_CCtxParams_init(). */
size_t ZSTD_CCtxParams_reset(ZSTD_CCtx_params* params)
{
    size_t const initResult = ZSTD_CCtxParams_init(params, ZSTD_CLEVEL_DEFAULT);
    return initResult;
}
234*c03c5b1cSMartin Matuska 
/* ZSTD_CCtxParams_init() :
 * Zeroes `cctxParams` entirely, then stores `compressionLevel`
 * and enables contentSizeFlag.
 * @return : 0, or a GENERIC error when `cctxParams` is NULL. */
size_t ZSTD_CCtxParams_init(ZSTD_CCtx_params* cctxParams, int compressionLevel)
{
    RETURN_ERROR_IF(!cctxParams, GENERIC, "NULL pointer!");

    memset(cctxParams, 0, sizeof(*cctxParams));
    cctxParams->fParams.contentSizeFlag = 1;
    cctxParams->compressionLevel = compressionLevel;
    return 0;
}
242*c03c5b1cSMartin Matuska 
/* ZSTD_CCtxParams_init_advanced() :
 * Zeroes `cctxParams`, then copies the compression and frame parameters
 * from `params` and sets the default compression level.
 * `cctxParams` is left untouched when an error is returned.
 * @return : 0, a GENERIC error when `cctxParams` is NULL,
 *           or the error reported by ZSTD_checkCParams(). */
size_t ZSTD_CCtxParams_init_advanced(ZSTD_CCtx_params* cctxParams, ZSTD_parameters params)
{
    RETURN_ERROR_IF(!cctxParams, GENERIC, "NULL pointer!");
    FORWARD_IF_ERROR( ZSTD_checkCParams(params.cParams) , "");

    memset(cctxParams, 0, sizeof(*cctxParams));
    assert(!ZSTD_checkCParams(params.cParams));
    /* the level should not matter, as all cParams are presumed properly defined */
    cctxParams->compressionLevel = ZSTD_CLEVEL_DEFAULT;
    cctxParams->fParams = params.fParams;
    cctxParams->cParams = params.cParams;
    return 0;
}
254*c03c5b1cSMartin Matuska 
255*c03c5b1cSMartin Matuska /* ZSTD_assignParamsToCCtxParams() :
256*c03c5b1cSMartin Matuska  * params is presumed valid at this stage */
ZSTD_assignParamsToCCtxParams(const ZSTD_CCtx_params * cctxParams,const ZSTD_parameters * params)257*c03c5b1cSMartin Matuska static ZSTD_CCtx_params ZSTD_assignParamsToCCtxParams(
258*c03c5b1cSMartin Matuska         const ZSTD_CCtx_params* cctxParams, const ZSTD_parameters* params)
259*c03c5b1cSMartin Matuska {
260*c03c5b1cSMartin Matuska     ZSTD_CCtx_params ret = *cctxParams;
261*c03c5b1cSMartin Matuska     assert(!ZSTD_checkCParams(params->cParams));
262*c03c5b1cSMartin Matuska     ret.cParams = params->cParams;
263*c03c5b1cSMartin Matuska     ret.fParams = params->fParams;
264*c03c5b1cSMartin Matuska     ret.compressionLevel = ZSTD_CLEVEL_DEFAULT;   /* should not matter, as all cParams are presumed properly defined */
265*c03c5b1cSMartin Matuska     return ret;
266*c03c5b1cSMartin Matuska }
267*c03c5b1cSMartin Matuska 
ZSTD_cParam_getBounds(ZSTD_cParameter param)268*c03c5b1cSMartin Matuska ZSTD_bounds ZSTD_cParam_getBounds(ZSTD_cParameter param)
269*c03c5b1cSMartin Matuska {
270*c03c5b1cSMartin Matuska     ZSTD_bounds bounds = { 0, 0, 0 };
271*c03c5b1cSMartin Matuska 
272*c03c5b1cSMartin Matuska     switch(param)
273*c03c5b1cSMartin Matuska     {
274*c03c5b1cSMartin Matuska     case ZSTD_c_compressionLevel:
275*c03c5b1cSMartin Matuska         bounds.lowerBound = ZSTD_minCLevel();
276*c03c5b1cSMartin Matuska         bounds.upperBound = ZSTD_maxCLevel();
277*c03c5b1cSMartin Matuska         return bounds;
278*c03c5b1cSMartin Matuska 
279*c03c5b1cSMartin Matuska     case ZSTD_c_windowLog:
280*c03c5b1cSMartin Matuska         bounds.lowerBound = ZSTD_WINDOWLOG_MIN;
281*c03c5b1cSMartin Matuska         bounds.upperBound = ZSTD_WINDOWLOG_MAX;
282*c03c5b1cSMartin Matuska         return bounds;
283*c03c5b1cSMartin Matuska 
284*c03c5b1cSMartin Matuska     case ZSTD_c_hashLog:
285*c03c5b1cSMartin Matuska         bounds.lowerBound = ZSTD_HASHLOG_MIN;
286*c03c5b1cSMartin Matuska         bounds.upperBound = ZSTD_HASHLOG_MAX;
287*c03c5b1cSMartin Matuska         return bounds;
288*c03c5b1cSMartin Matuska 
289*c03c5b1cSMartin Matuska     case ZSTD_c_chainLog:
290*c03c5b1cSMartin Matuska         bounds.lowerBound = ZSTD_CHAINLOG_MIN;
291*c03c5b1cSMartin Matuska         bounds.upperBound = ZSTD_CHAINLOG_MAX;
292*c03c5b1cSMartin Matuska         return bounds;
293*c03c5b1cSMartin Matuska 
294*c03c5b1cSMartin Matuska     case ZSTD_c_searchLog:
295*c03c5b1cSMartin Matuska         bounds.lowerBound = ZSTD_SEARCHLOG_MIN;
296*c03c5b1cSMartin Matuska         bounds.upperBound = ZSTD_SEARCHLOG_MAX;
297*c03c5b1cSMartin Matuska         return bounds;
298*c03c5b1cSMartin Matuska 
299*c03c5b1cSMartin Matuska     case ZSTD_c_minMatch:
300*c03c5b1cSMartin Matuska         bounds.lowerBound = ZSTD_MINMATCH_MIN;
301*c03c5b1cSMartin Matuska         bounds.upperBound = ZSTD_MINMATCH_MAX;
302*c03c5b1cSMartin Matuska         return bounds;
303*c03c5b1cSMartin Matuska 
304*c03c5b1cSMartin Matuska     case ZSTD_c_targetLength:
305*c03c5b1cSMartin Matuska         bounds.lowerBound = ZSTD_TARGETLENGTH_MIN;
306*c03c5b1cSMartin Matuska         bounds.upperBound = ZSTD_TARGETLENGTH_MAX;
307*c03c5b1cSMartin Matuska         return bounds;
308*c03c5b1cSMartin Matuska 
309*c03c5b1cSMartin Matuska     case ZSTD_c_strategy:
310*c03c5b1cSMartin Matuska         bounds.lowerBound = ZSTD_STRATEGY_MIN;
311*c03c5b1cSMartin Matuska         bounds.upperBound = ZSTD_STRATEGY_MAX;
312*c03c5b1cSMartin Matuska         return bounds;
313*c03c5b1cSMartin Matuska 
314*c03c5b1cSMartin Matuska     case ZSTD_c_contentSizeFlag:
315*c03c5b1cSMartin Matuska         bounds.lowerBound = 0;
316*c03c5b1cSMartin Matuska         bounds.upperBound = 1;
317*c03c5b1cSMartin Matuska         return bounds;
318*c03c5b1cSMartin Matuska 
319*c03c5b1cSMartin Matuska     case ZSTD_c_checksumFlag:
320*c03c5b1cSMartin Matuska         bounds.lowerBound = 0;
321*c03c5b1cSMartin Matuska         bounds.upperBound = 1;
322*c03c5b1cSMartin Matuska         return bounds;
323*c03c5b1cSMartin Matuska 
324*c03c5b1cSMartin Matuska     case ZSTD_c_dictIDFlag:
325*c03c5b1cSMartin Matuska         bounds.lowerBound = 0;
326*c03c5b1cSMartin Matuska         bounds.upperBound = 1;
327*c03c5b1cSMartin Matuska         return bounds;
328*c03c5b1cSMartin Matuska 
329*c03c5b1cSMartin Matuska     case ZSTD_c_nbWorkers:
330*c03c5b1cSMartin Matuska         bounds.lowerBound = 0;
331*c03c5b1cSMartin Matuska #ifdef ZSTD_MULTITHREAD
332*c03c5b1cSMartin Matuska         bounds.upperBound = ZSTDMT_NBWORKERS_MAX;
333*c03c5b1cSMartin Matuska #else
334*c03c5b1cSMartin Matuska         bounds.upperBound = 0;
335*c03c5b1cSMartin Matuska #endif
336*c03c5b1cSMartin Matuska         return bounds;
337*c03c5b1cSMartin Matuska 
338*c03c5b1cSMartin Matuska     case ZSTD_c_jobSize:
339*c03c5b1cSMartin Matuska         bounds.lowerBound = 0;
340*c03c5b1cSMartin Matuska #ifdef ZSTD_MULTITHREAD
341*c03c5b1cSMartin Matuska         bounds.upperBound = ZSTDMT_JOBSIZE_MAX;
342*c03c5b1cSMartin Matuska #else
343*c03c5b1cSMartin Matuska         bounds.upperBound = 0;
344*c03c5b1cSMartin Matuska #endif
345*c03c5b1cSMartin Matuska         return bounds;
346*c03c5b1cSMartin Matuska 
347*c03c5b1cSMartin Matuska     case ZSTD_c_overlapLog:
348*c03c5b1cSMartin Matuska #ifdef ZSTD_MULTITHREAD
349*c03c5b1cSMartin Matuska         bounds.lowerBound = ZSTD_OVERLAPLOG_MIN;
350*c03c5b1cSMartin Matuska         bounds.upperBound = ZSTD_OVERLAPLOG_MAX;
351*c03c5b1cSMartin Matuska #else
352*c03c5b1cSMartin Matuska         bounds.lowerBound = 0;
353*c03c5b1cSMartin Matuska         bounds.upperBound = 0;
354*c03c5b1cSMartin Matuska #endif
355*c03c5b1cSMartin Matuska         return bounds;
356*c03c5b1cSMartin Matuska 
357*c03c5b1cSMartin Matuska     case ZSTD_c_enableLongDistanceMatching:
358*c03c5b1cSMartin Matuska         bounds.lowerBound = 0;
359*c03c5b1cSMartin Matuska         bounds.upperBound = 1;
360*c03c5b1cSMartin Matuska         return bounds;
361*c03c5b1cSMartin Matuska 
362*c03c5b1cSMartin Matuska     case ZSTD_c_ldmHashLog:
363*c03c5b1cSMartin Matuska         bounds.lowerBound = ZSTD_LDM_HASHLOG_MIN;
364*c03c5b1cSMartin Matuska         bounds.upperBound = ZSTD_LDM_HASHLOG_MAX;
365*c03c5b1cSMartin Matuska         return bounds;
366*c03c5b1cSMartin Matuska 
367*c03c5b1cSMartin Matuska     case ZSTD_c_ldmMinMatch:
368*c03c5b1cSMartin Matuska         bounds.lowerBound = ZSTD_LDM_MINMATCH_MIN;
369*c03c5b1cSMartin Matuska         bounds.upperBound = ZSTD_LDM_MINMATCH_MAX;
370*c03c5b1cSMartin Matuska         return bounds;
371*c03c5b1cSMartin Matuska 
372*c03c5b1cSMartin Matuska     case ZSTD_c_ldmBucketSizeLog:
373*c03c5b1cSMartin Matuska         bounds.lowerBound = ZSTD_LDM_BUCKETSIZELOG_MIN;
374*c03c5b1cSMartin Matuska         bounds.upperBound = ZSTD_LDM_BUCKETSIZELOG_MAX;
375*c03c5b1cSMartin Matuska         return bounds;
376*c03c5b1cSMartin Matuska 
377*c03c5b1cSMartin Matuska     case ZSTD_c_ldmHashRateLog:
378*c03c5b1cSMartin Matuska         bounds.lowerBound = ZSTD_LDM_HASHRATELOG_MIN;
379*c03c5b1cSMartin Matuska         bounds.upperBound = ZSTD_LDM_HASHRATELOG_MAX;
380*c03c5b1cSMartin Matuska         return bounds;
381*c03c5b1cSMartin Matuska 
382*c03c5b1cSMartin Matuska     /* experimental parameters */
383*c03c5b1cSMartin Matuska     case ZSTD_c_rsyncable:
384*c03c5b1cSMartin Matuska         bounds.lowerBound = 0;
385*c03c5b1cSMartin Matuska         bounds.upperBound = 1;
386*c03c5b1cSMartin Matuska         return bounds;
387*c03c5b1cSMartin Matuska 
388*c03c5b1cSMartin Matuska     case ZSTD_c_forceMaxWindow :
389*c03c5b1cSMartin Matuska         bounds.lowerBound = 0;
390*c03c5b1cSMartin Matuska         bounds.upperBound = 1;
391*c03c5b1cSMartin Matuska         return bounds;
392*c03c5b1cSMartin Matuska 
393*c03c5b1cSMartin Matuska     case ZSTD_c_format:
394*c03c5b1cSMartin Matuska         ZSTD_STATIC_ASSERT(ZSTD_f_zstd1 < ZSTD_f_zstd1_magicless);
395*c03c5b1cSMartin Matuska         bounds.lowerBound = ZSTD_f_zstd1;
396*c03c5b1cSMartin Matuska         bounds.upperBound = ZSTD_f_zstd1_magicless;   /* note : how to ensure at compile time that this is the highest value enum ? */
397*c03c5b1cSMartin Matuska         return bounds;
398*c03c5b1cSMartin Matuska 
399*c03c5b1cSMartin Matuska     case ZSTD_c_forceAttachDict:
400*c03c5b1cSMartin Matuska         ZSTD_STATIC_ASSERT(ZSTD_dictDefaultAttach < ZSTD_dictForceCopy);
401*c03c5b1cSMartin Matuska         bounds.lowerBound = ZSTD_dictDefaultAttach;
402*c03c5b1cSMartin Matuska         bounds.upperBound = ZSTD_dictForceLoad;       /* note : how to ensure at compile time that this is the highest value enum ? */
403*c03c5b1cSMartin Matuska         return bounds;
404*c03c5b1cSMartin Matuska 
405*c03c5b1cSMartin Matuska     case ZSTD_c_literalCompressionMode:
406*c03c5b1cSMartin Matuska         ZSTD_STATIC_ASSERT(ZSTD_lcm_auto < ZSTD_lcm_huffman && ZSTD_lcm_huffman < ZSTD_lcm_uncompressed);
407*c03c5b1cSMartin Matuska         bounds.lowerBound = ZSTD_lcm_auto;
408*c03c5b1cSMartin Matuska         bounds.upperBound = ZSTD_lcm_uncompressed;
409*c03c5b1cSMartin Matuska         return bounds;
410*c03c5b1cSMartin Matuska 
411*c03c5b1cSMartin Matuska     case ZSTD_c_targetCBlockSize:
412*c03c5b1cSMartin Matuska         bounds.lowerBound = ZSTD_TARGETCBLOCKSIZE_MIN;
413*c03c5b1cSMartin Matuska         bounds.upperBound = ZSTD_TARGETCBLOCKSIZE_MAX;
414*c03c5b1cSMartin Matuska         return bounds;
415*c03c5b1cSMartin Matuska 
416*c03c5b1cSMartin Matuska     case ZSTD_c_srcSizeHint:
417*c03c5b1cSMartin Matuska         bounds.lowerBound = ZSTD_SRCSIZEHINT_MIN;
418*c03c5b1cSMartin Matuska         bounds.upperBound = ZSTD_SRCSIZEHINT_MAX;
419*c03c5b1cSMartin Matuska         return bounds;
420*c03c5b1cSMartin Matuska 
421*c03c5b1cSMartin Matuska     default:
422*c03c5b1cSMartin Matuska         bounds.error = ERROR(parameter_unsupported);
423*c03c5b1cSMartin Matuska         return bounds;
424*c03c5b1cSMartin Matuska     }
425*c03c5b1cSMartin Matuska }
426*c03c5b1cSMartin Matuska 
427*c03c5b1cSMartin Matuska /* ZSTD_cParam_clampBounds:
428*c03c5b1cSMartin Matuska  * Clamps the value into the bounded range.
429*c03c5b1cSMartin Matuska  */
ZSTD_cParam_clampBounds(ZSTD_cParameter cParam,int * value)430*c03c5b1cSMartin Matuska static size_t ZSTD_cParam_clampBounds(ZSTD_cParameter cParam, int* value)
431*c03c5b1cSMartin Matuska {
432*c03c5b1cSMartin Matuska     ZSTD_bounds const bounds = ZSTD_cParam_getBounds(cParam);
433*c03c5b1cSMartin Matuska     if (ZSTD_isError(bounds.error)) return bounds.error;
434*c03c5b1cSMartin Matuska     if (*value < bounds.lowerBound) *value = bounds.lowerBound;
435*c03c5b1cSMartin Matuska     if (*value > bounds.upperBound) *value = bounds.upperBound;
436*c03c5b1cSMartin Matuska     return 0;
437*c03c5b1cSMartin Matuska }
438*c03c5b1cSMartin Matuska 
/* BOUNDCHECK() :
 * Makes the enclosing function return a parameter_outOfBound error
 * (through RETURN_ERROR_IF) when ZSTD_cParam_withinBounds() rejects `val`
 * for `cParam`.
 * The body is wrapped in do { } while (0) so that the expansion followed by
 * the caller's ';' forms exactly one statement, which keeps the macro safe
 * inside an unbraced if / else. Every use must be terminated with ';'. */
#define BOUNDCHECK(cParam, val) do { \
    RETURN_ERROR_IF(!ZSTD_cParam_withinBounds(cParam,val), \
                    parameter_outOfBound, "Param out of bounds"); \
} while (0)
443*c03c5b1cSMartin Matuska 
444*c03c5b1cSMartin Matuska 
/* ZSTD_isUpdateAuthorized() :
 * Tells whether `param` belongs to the set of parameters flagged as updatable.
 * ZSTD_CCtx_setParameter() consults it once the stream stage is no longer
 * the init stage.
 * @return : 1 for the compression level and the listed match-finder
 *           parameters, 0 for everything else (unknown parameters included). */
static int ZSTD_isUpdateAuthorized(ZSTD_cParameter param)
{
    int authorized = 0;

    switch(param)
    {
    /* parameters which may be updated */
    case ZSTD_c_compressionLevel:
    case ZSTD_c_hashLog:
    case ZSTD_c_chainLog:
    case ZSTD_c_searchLog:
    case ZSTD_c_minMatch:
    case ZSTD_c_targetLength:
    case ZSTD_c_strategy:
        authorized = 1;
        break;

    /* listed explicitly for documentation : none of these may be updated */
    case ZSTD_c_format:
    case ZSTD_c_windowLog:
    case ZSTD_c_contentSizeFlag:
    case ZSTD_c_checksumFlag:
    case ZSTD_c_dictIDFlag:
    case ZSTD_c_forceMaxWindow :
    case ZSTD_c_nbWorkers:
    case ZSTD_c_jobSize:
    case ZSTD_c_overlapLog:
    case ZSTD_c_rsyncable:
    case ZSTD_c_enableLongDistanceMatching:
    case ZSTD_c_ldmHashLog:
    case ZSTD_c_ldmMinMatch:
    case ZSTD_c_ldmBucketSizeLog:
    case ZSTD_c_ldmHashRateLog:
    case ZSTD_c_forceAttachDict:
    case ZSTD_c_literalCompressionMode:
    case ZSTD_c_targetCBlockSize:
    case ZSTD_c_srcSizeHint:
    default:
        break;
    }

    return authorized;
}
481*c03c5b1cSMartin Matuska 
/* ZSTD_CCtx_setParameter() :
 * Validates that `param` may be set on `cctx` right now, then stores it into
 * cctx->requestedParams through ZSTD_CCtxParams_setParameter().
 * - Outside of the init stage, only parameters accepted by
 *   ZSTD_isUpdateAuthorized() can be set (and cParamsChanged gets flagged);
 *   any other parameter yields a stage_wrong error.
 * - A non-zero nbWorkers is refused on a static context.
 * - A parameter not listed below yields parameter_unsupported.
 * @return : result of ZSTD_CCtxParams_setParameter(), or one of the errors above.
 * `cctx` is dereferenced without NULL check. */
size_t ZSTD_CCtx_setParameter(ZSTD_CCtx* cctx, ZSTD_cParameter param, int value)
{
    DEBUGLOG(4, "ZSTD_CCtx_setParameter (%i, %i)", (int)param, value);

    if (cctx->streamStage != zcss_init) {
        if (!ZSTD_isUpdateAuthorized(param)) {
            RETURN_ERROR(stage_wrong, "can only set params in ctx init stage");
        }
        cctx->cParamsChanged = 1;
    }

    switch(param)
    {
    /* known parameters, with nothing to check at this level */
    case ZSTD_c_compressionLevel:
    case ZSTD_c_windowLog:
    case ZSTD_c_hashLog:
    case ZSTD_c_chainLog:
    case ZSTD_c_searchLog:
    case ZSTD_c_minMatch:
    case ZSTD_c_targetLength:
    case ZSTD_c_strategy:
    case ZSTD_c_ldmHashRateLog:
    case ZSTD_c_format:
    case ZSTD_c_contentSizeFlag:
    case ZSTD_c_checksumFlag:
    case ZSTD_c_dictIDFlag:
    case ZSTD_c_forceMaxWindow:
    case ZSTD_c_forceAttachDict:
    case ZSTD_c_literalCompressionMode:
    case ZSTD_c_jobSize:
    case ZSTD_c_overlapLog:
    case ZSTD_c_rsyncable:
    case ZSTD_c_enableLongDistanceMatching:
    case ZSTD_c_ldmHashLog:
    case ZSTD_c_ldmMinMatch:
    case ZSTD_c_ldmBucketSizeLog:
    case ZSTD_c_targetCBlockSize:
    case ZSTD_c_srcSizeHint:
        break;

    case ZSTD_c_nbWorkers:
        RETURN_ERROR_IF((value!=0) && cctx->staticSize, parameter_unsupported,
                        "MT not compatible with static alloc");
        break;

    default:
        RETURN_ERROR(parameter_unsupported, "unknown parameter");
    }

    return ZSTD_CCtxParams_setParameter(&cctx->requestedParams, param, value);
}
530*c03c5b1cSMartin Matuska 
/*! ZSTD_CCtxParams_setParameter() :
 *  Stores `value` for `param` into `CCtxParams`.
 *  Depending on the parameter, `value` is either :
 *  - bounds-checked with BOUNDCHECK() (out-of-range is an error),
 *  - clamped into range with ZSTD_cParam_clampBounds(),
 *  - or reduced to a 0/1 flag.
 *  For parameters marked "0 => use default", 0 skips the bounds check
 *  and is stored as-is.
 * @return : the resulting setting (0 when the stored compression level is
 *           negative, since size_t cannot represent it), or an error code. */
size_t ZSTD_CCtxParams_setParameter(ZSTD_CCtx_params* CCtxParams,
                                    ZSTD_cParameter param, int value)
{
    DEBUGLOG(4, "ZSTD_CCtxParams_setParameter (%i, %i)", (int)param, value);
    switch(param)
    {
    case ZSTD_c_format :
        BOUNDCHECK(ZSTD_c_format, value);
        CCtxParams->format = (ZSTD_format_e)value;
        return (size_t)CCtxParams->format;

    case ZSTD_c_compressionLevel : {
        FORWARD_IF_ERROR(ZSTD_cParam_clampBounds(param, &value), "");
        if (value) {  /* 0 : does not change current level */
            CCtxParams->compressionLevel = value;
        }
        if (CCtxParams->compressionLevel >= 0) return (size_t)CCtxParams->compressionLevel;
        return 0;  /* return type (size_t) cannot represent negative values */
    }

    case ZSTD_c_windowLog :
        if (value!=0)   /* 0 => use default */
            BOUNDCHECK(ZSTD_c_windowLog, value);
        CCtxParams->cParams.windowLog = (U32)value;
        return CCtxParams->cParams.windowLog;

    case ZSTD_c_hashLog :
        if (value!=0)   /* 0 => use default */
            BOUNDCHECK(ZSTD_c_hashLog, value);
        CCtxParams->cParams.hashLog = (U32)value;
        return CCtxParams->cParams.hashLog;

    case ZSTD_c_chainLog :
        if (value!=0)   /* 0 => use default */
            BOUNDCHECK(ZSTD_c_chainLog, value);
        CCtxParams->cParams.chainLog = (U32)value;
        return CCtxParams->cParams.chainLog;

    case ZSTD_c_searchLog :
        if (value!=0)   /* 0 => use default */
            BOUNDCHECK(ZSTD_c_searchLog, value);
        CCtxParams->cParams.searchLog = (U32)value;
        /* report the stored field, like the neighbouring cases */
        return CCtxParams->cParams.searchLog;

    case ZSTD_c_minMatch :
        if (value!=0)   /* 0 => use default */
            BOUNDCHECK(ZSTD_c_minMatch, value);
        CCtxParams->cParams.minMatch = value;
        return CCtxParams->cParams.minMatch;

    case ZSTD_c_targetLength :
        BOUNDCHECK(ZSTD_c_targetLength, value);
        CCtxParams->cParams.targetLength = value;
        return CCtxParams->cParams.targetLength;

    case ZSTD_c_strategy :
        if (value!=0)   /* 0 => use default */
            BOUNDCHECK(ZSTD_c_strategy, value);
        CCtxParams->cParams.strategy = (ZSTD_strategy)value;
        return (size_t)CCtxParams->cParams.strategy;

    case ZSTD_c_contentSizeFlag :
        /* Content size written in frame header _when known_ (default:1) */
        DEBUGLOG(4, "set content size flag = %u", (value!=0));
        CCtxParams->fParams.contentSizeFlag = value != 0;
        return CCtxParams->fParams.contentSizeFlag;

    case ZSTD_c_checksumFlag :
        /* A 32-bits content checksum will be calculated and written at end of frame (default:0) */
        CCtxParams->fParams.checksumFlag = value != 0;
        return CCtxParams->fParams.checksumFlag;

    case ZSTD_c_dictIDFlag : /* When applicable, dictionary's dictID is provided in frame header (default:1) */
        DEBUGLOG(4, "set dictIDFlag = %u", (value!=0));
        /* stored inverted : the field is a "no dictID" flag */
        CCtxParams->fParams.noDictIDFlag = !value;
        return !CCtxParams->fParams.noDictIDFlag;

    case ZSTD_c_forceMaxWindow :
        CCtxParams->forceWindow = (value != 0);
        return CCtxParams->forceWindow;

    case ZSTD_c_forceAttachDict : {
        const ZSTD_dictAttachPref_e pref = (ZSTD_dictAttachPref_e)value;
        BOUNDCHECK(ZSTD_c_forceAttachDict, pref);
        CCtxParams->attachDictPref = pref;
        return CCtxParams->attachDictPref;
    }

    case ZSTD_c_literalCompressionMode : {
        const ZSTD_literalCompressionMode_e lcm = (ZSTD_literalCompressionMode_e)value;
        BOUNDCHECK(ZSTD_c_literalCompressionMode, lcm);
        CCtxParams->literalCompressionMode = lcm;
        return CCtxParams->literalCompressionMode;
    }

    case ZSTD_c_nbWorkers :
#ifndef ZSTD_MULTITHREAD
        RETURN_ERROR_IF(value!=0, parameter_unsupported, "not compiled with multithreading");
        return 0;
#else
        FORWARD_IF_ERROR(ZSTD_cParam_clampBounds(param, &value), "");
        CCtxParams->nbWorkers = value;
        return CCtxParams->nbWorkers;
#endif

    case ZSTD_c_jobSize :
#ifndef ZSTD_MULTITHREAD
        RETURN_ERROR_IF(value!=0, parameter_unsupported, "not compiled with multithreading");
        return 0;
#else
        /* Adjust to the minimum non-default value. */
        if (value != 0 && value < ZSTDMT_JOBSIZE_MIN)
            value = ZSTDMT_JOBSIZE_MIN;
        FORWARD_IF_ERROR(ZSTD_cParam_clampBounds(param, &value), "");
        assert(value >= 0);
        CCtxParams->jobSize = value;
        return CCtxParams->jobSize;
#endif

    case ZSTD_c_overlapLog :
#ifndef ZSTD_MULTITHREAD
        RETURN_ERROR_IF(value!=0, parameter_unsupported, "not compiled with multithreading");
        return 0;
#else
        FORWARD_IF_ERROR(ZSTD_cParam_clampBounds(ZSTD_c_overlapLog, &value), "");
        CCtxParams->overlapLog = value;
        return CCtxParams->overlapLog;
#endif

    case ZSTD_c_rsyncable :
#ifndef ZSTD_MULTITHREAD
        RETURN_ERROR_IF(value!=0, parameter_unsupported, "not compiled with multithreading");
        return 0;
#else
        /* clamp against this parameter's own bounds
         * (was clamped against the bounds of ZSTD_c_overlapLog) */
        FORWARD_IF_ERROR(ZSTD_cParam_clampBounds(ZSTD_c_rsyncable, &value), "");
        CCtxParams->rsyncable = value;
        return CCtxParams->rsyncable;
#endif

    case ZSTD_c_enableLongDistanceMatching :
        CCtxParams->ldmParams.enableLdm = (value!=0);
        return CCtxParams->ldmParams.enableLdm;

    case ZSTD_c_ldmHashLog :
        if (value!=0)   /* 0 ==> auto */
            BOUNDCHECK(ZSTD_c_ldmHashLog, value);
        CCtxParams->ldmParams.hashLog = value;
        return CCtxParams->ldmParams.hashLog;

    case ZSTD_c_ldmMinMatch :
        if (value!=0)   /* 0 ==> default */
            BOUNDCHECK(ZSTD_c_ldmMinMatch, value);
        CCtxParams->ldmParams.minMatchLength = value;
        return CCtxParams->ldmParams.minMatchLength;

    case ZSTD_c_ldmBucketSizeLog :
        if (value!=0)   /* 0 ==> default */
            BOUNDCHECK(ZSTD_c_ldmBucketSizeLog, value);
        CCtxParams->ldmParams.bucketSizeLog = value;
        return CCtxParams->ldmParams.bucketSizeLog;

    case ZSTD_c_ldmHashRateLog :
        /* negative values are rejected too :
         * previously only the upper bound was enforced,
         * letting a negative `value` be stored unchecked */
        RETURN_ERROR_IF(value < 0 || value > ZSTD_WINDOWLOG_MAX - ZSTD_HASHLOG_MIN,
                        parameter_outOfBound, "Param out of bounds!");
        CCtxParams->ldmParams.hashRateLog = value;
        return CCtxParams->ldmParams.hashRateLog;

    case ZSTD_c_targetCBlockSize :
        if (value!=0)   /* 0 ==> default */
            BOUNDCHECK(ZSTD_c_targetCBlockSize, value);
        CCtxParams->targetCBlockSize = value;
        return CCtxParams->targetCBlockSize;

    case ZSTD_c_srcSizeHint :
        if (value!=0)    /* 0 ==> default */
            BOUNDCHECK(ZSTD_c_srcSizeHint, value);
        CCtxParams->srcSizeHint = value;
        return CCtxParams->srcSizeHint;

    default: RETURN_ERROR(parameter_unsupported, "unknown parameter");
    }
}
713*c03c5b1cSMartin Matuska 
/*! ZSTD_CCtx_getParameter() :
 *  Reads `param` from the parameters requested on `cctx`
 *  (cctx->requestedParams) and writes it into `*value`.
 * @return : the result of ZSTD_CCtxParams_getParameter(). */
size_t ZSTD_CCtx_getParameter(ZSTD_CCtx* cctx, ZSTD_cParameter param, int* value)
{
    ZSTD_CCtx_params* const requested = &cctx->requestedParams;
    return ZSTD_CCtxParams_getParameter(requested, param, value);
}
718*c03c5b1cSMartin Matuska 
/*! ZSTD_CCtxParams_getParameter() :
 *  Writes the setting stored in `CCtxParams` for `param` into `*value`.
 *  Without ZSTD_MULTITHREAD, ZSTD_c_jobSize, ZSTD_c_overlapLog and
 *  ZSTD_c_rsyncable report parameter_unsupported.
 * @return : 0 on success, or an error code
 *           (parameter_unsupported for an unknown `param`). */
size_t ZSTD_CCtxParams_getParameter(
        ZSTD_CCtx_params* CCtxParams, ZSTD_cParameter param, int* value)
{
    switch(param)
    {
    case ZSTD_c_format :
        *value = CCtxParams->format;
        return 0;

    case ZSTD_c_compressionLevel :
        *value = CCtxParams->compressionLevel;
        return 0;

    case ZSTD_c_windowLog :
        *value = (int)CCtxParams->cParams.windowLog;
        return 0;

    case ZSTD_c_hashLog :
        *value = (int)CCtxParams->cParams.hashLog;
        return 0;

    case ZSTD_c_chainLog :
        *value = (int)CCtxParams->cParams.chainLog;
        return 0;

    case ZSTD_c_searchLog :
        *value = CCtxParams->cParams.searchLog;
        return 0;

    case ZSTD_c_minMatch :
        *value = CCtxParams->cParams.minMatch;
        return 0;

    case ZSTD_c_targetLength :
        *value = CCtxParams->cParams.targetLength;
        return 0;

    case ZSTD_c_strategy :
        *value = (unsigned)CCtxParams->cParams.strategy;
        return 0;

    case ZSTD_c_contentSizeFlag :
        *value = CCtxParams->fParams.contentSizeFlag;
        return 0;

    case ZSTD_c_checksumFlag :
        *value = CCtxParams->fParams.checksumFlag;
        return 0;

    case ZSTD_c_dictIDFlag :
        /* the field is a "no dictID" flag : report its negation */
        *value = !CCtxParams->fParams.noDictIDFlag;
        return 0;

    case ZSTD_c_forceMaxWindow :
        *value = CCtxParams->forceWindow;
        return 0;

    case ZSTD_c_forceAttachDict :
        *value = CCtxParams->attachDictPref;
        return 0;

    case ZSTD_c_literalCompressionMode :
        *value = CCtxParams->literalCompressionMode;
        return 0;

    case ZSTD_c_nbWorkers :
#ifndef ZSTD_MULTITHREAD
        assert(CCtxParams->nbWorkers == 0);
#endif
        *value = CCtxParams->nbWorkers;
        return 0;

    case ZSTD_c_jobSize :
#ifndef ZSTD_MULTITHREAD
        RETURN_ERROR(parameter_unsupported, "not compiled with multithreading");
#else
        assert(CCtxParams->jobSize <= INT_MAX);
        *value = (int)CCtxParams->jobSize;
        return 0;
#endif

    case ZSTD_c_overlapLog :
#ifndef ZSTD_MULTITHREAD
        RETURN_ERROR(parameter_unsupported, "not compiled with multithreading");
#else
        *value = CCtxParams->overlapLog;
        return 0;
#endif

    case ZSTD_c_rsyncable :
#ifndef ZSTD_MULTITHREAD
        RETURN_ERROR(parameter_unsupported, "not compiled with multithreading");
#else
        *value = CCtxParams->rsyncable;
        return 0;
#endif

    case ZSTD_c_enableLongDistanceMatching :
        *value = CCtxParams->ldmParams.enableLdm;
        return 0;

    case ZSTD_c_ldmHashLog :
        *value = CCtxParams->ldmParams.hashLog;
        return 0;

    case ZSTD_c_ldmMinMatch :
        *value = CCtxParams->ldmParams.minMatchLength;
        return 0;

    case ZSTD_c_ldmBucketSizeLog :
        *value = CCtxParams->ldmParams.bucketSizeLog;
        return 0;

    case ZSTD_c_ldmHashRateLog :
        *value = CCtxParams->ldmParams.hashRateLog;
        return 0;

    case ZSTD_c_targetCBlockSize :
        *value = (int)CCtxParams->targetCBlockSize;
        return 0;

    case ZSTD_c_srcSizeHint :
        *value = (int)CCtxParams->srcSizeHint;
        return 0;

    default: RETURN_ERROR(parameter_unsupported, "unknown parameter");
    }
}
822*c03c5b1cSMartin Matuska 
823*c03c5b1cSMartin Matuska /** ZSTD_CCtx_setParametersUsingCCtxParams() :
824*c03c5b1cSMartin Matuska  *  just applies `params` into `cctx`
825*c03c5b1cSMartin Matuska  *  no action is performed, parameters are merely stored.
826*c03c5b1cSMartin Matuska  *  If ZSTDMT is enabled, parameters are pushed to cctx->mtctx.
827*c03c5b1cSMartin Matuska  *    This is possible even if a compression is ongoing.
828*c03c5b1cSMartin Matuska  *    In which case, new parameters will be applied on the fly, starting with next compression job.
829*c03c5b1cSMartin Matuska  */
ZSTD_CCtx_setParametersUsingCCtxParams(ZSTD_CCtx * cctx,const ZSTD_CCtx_params * params)830*c03c5b1cSMartin Matuska size_t ZSTD_CCtx_setParametersUsingCCtxParams(
831*c03c5b1cSMartin Matuska         ZSTD_CCtx* cctx, const ZSTD_CCtx_params* params)
832*c03c5b1cSMartin Matuska {
833*c03c5b1cSMartin Matuska     DEBUGLOG(4, "ZSTD_CCtx_setParametersUsingCCtxParams");
834*c03c5b1cSMartin Matuska     RETURN_ERROR_IF(cctx->streamStage != zcss_init, stage_wrong,
835*c03c5b1cSMartin Matuska                     "The context is in the wrong stage!");
836*c03c5b1cSMartin Matuska     RETURN_ERROR_IF(cctx->cdict, stage_wrong,
837*c03c5b1cSMartin Matuska                     "Can't override parameters with cdict attached (some must "
838*c03c5b1cSMartin Matuska                     "be inherited from the cdict).");
839*c03c5b1cSMartin Matuska 
840*c03c5b1cSMartin Matuska     cctx->requestedParams = *params;
841*c03c5b1cSMartin Matuska     return 0;
842*c03c5b1cSMartin Matuska }
843*c03c5b1cSMartin Matuska 
ZSTD_CCtx_setPledgedSrcSize(ZSTD_CCtx * cctx,unsigned long long pledgedSrcSize)844*c03c5b1cSMartin Matuska ZSTDLIB_API size_t ZSTD_CCtx_setPledgedSrcSize(ZSTD_CCtx* cctx, unsigned long long pledgedSrcSize)
845*c03c5b1cSMartin Matuska {
846*c03c5b1cSMartin Matuska     DEBUGLOG(4, "ZSTD_CCtx_setPledgedSrcSize to %u bytes", (U32)pledgedSrcSize);
847*c03c5b1cSMartin Matuska     RETURN_ERROR_IF(cctx->streamStage != zcss_init, stage_wrong,
848*c03c5b1cSMartin Matuska                     "Can't set pledgedSrcSize when not in init stage.");
849*c03c5b1cSMartin Matuska     cctx->pledgedSrcSizePlusOne = pledgedSrcSize+1;
850*c03c5b1cSMartin Matuska     return 0;
851*c03c5b1cSMartin Matuska }
852*c03c5b1cSMartin Matuska 
853*c03c5b1cSMartin Matuska /**
854*c03c5b1cSMartin Matuska  * Initializes the local dict using the requested parameters.
855*c03c5b1cSMartin Matuska  * NOTE: This does not use the pledged src size, because it may be used for more
856*c03c5b1cSMartin Matuska  * than one compression.
857*c03c5b1cSMartin Matuska  */
ZSTD_initLocalDict(ZSTD_CCtx * cctx)858*c03c5b1cSMartin Matuska static size_t ZSTD_initLocalDict(ZSTD_CCtx* cctx)
859*c03c5b1cSMartin Matuska {
860*c03c5b1cSMartin Matuska     ZSTD_localDict* const dl = &cctx->localDict;
861*c03c5b1cSMartin Matuska     ZSTD_compressionParameters const cParams = ZSTD_getCParamsFromCCtxParams(
862*c03c5b1cSMartin Matuska             &cctx->requestedParams, ZSTD_CONTENTSIZE_UNKNOWN, dl->dictSize);
863*c03c5b1cSMartin Matuska     if (dl->dict == NULL) {
864*c03c5b1cSMartin Matuska         /* No local dictionary. */
865*c03c5b1cSMartin Matuska         assert(dl->dictBuffer == NULL);
866*c03c5b1cSMartin Matuska         assert(dl->cdict == NULL);
867*c03c5b1cSMartin Matuska         assert(dl->dictSize == 0);
868*c03c5b1cSMartin Matuska         return 0;
869*c03c5b1cSMartin Matuska     }
870*c03c5b1cSMartin Matuska     if (dl->cdict != NULL) {
871*c03c5b1cSMartin Matuska         assert(cctx->cdict == dl->cdict);
872*c03c5b1cSMartin Matuska         /* Local dictionary already initialized. */
873*c03c5b1cSMartin Matuska         return 0;
874*c03c5b1cSMartin Matuska     }
875*c03c5b1cSMartin Matuska     assert(dl->dictSize > 0);
876*c03c5b1cSMartin Matuska     assert(cctx->cdict == NULL);
877*c03c5b1cSMartin Matuska     assert(cctx->prefixDict.dict == NULL);
878*c03c5b1cSMartin Matuska 
879*c03c5b1cSMartin Matuska     dl->cdict = ZSTD_createCDict_advanced(
880*c03c5b1cSMartin Matuska             dl->dict,
881*c03c5b1cSMartin Matuska             dl->dictSize,
882*c03c5b1cSMartin Matuska             ZSTD_dlm_byRef,
883*c03c5b1cSMartin Matuska             dl->dictContentType,
884*c03c5b1cSMartin Matuska             cParams,
885*c03c5b1cSMartin Matuska             cctx->customMem);
886*c03c5b1cSMartin Matuska     RETURN_ERROR_IF(!dl->cdict, memory_allocation, "ZSTD_createCDict_advanced failed");
887*c03c5b1cSMartin Matuska     cctx->cdict = dl->cdict;
888*c03c5b1cSMartin Matuska     return 0;
889*c03c5b1cSMartin Matuska }
890*c03c5b1cSMartin Matuska 
/*! ZSTD_CCtx_loadDictionary_advanced() :
 *  Registers `dict` as the local dictionary of `cctx`,
 *  after clearing any dictionary already set on the context.
 *  With ZSTD_dlm_byRef, only the pointer is recorded; with any other
 *  load method, the content is copied into a buffer allocated with
 *  cctx->customMem.
 *  A NULL `dict` or a zero `dictSize` leaves `cctx` without dictionary.
 *  No CDict is created here : only the dictionary content, size and
 *  content type are recorded.
 *  Fails if `cctx` is not in init stage (stage_wrong), or if
 *  cctx->staticSize is set or the copy buffer cannot be allocated
 *  (memory_allocation).
 * @return : 0, or an error code. */
size_t ZSTD_CCtx_loadDictionary_advanced(
        ZSTD_CCtx* cctx, const void* dict, size_t dictSize,
        ZSTD_dictLoadMethod_e dictLoadMethod, ZSTD_dictContentType_e dictContentType)
{
    RETURN_ERROR_IF(cctx->streamStage != zcss_init, stage_wrong,
                    "Can't load a dictionary when ctx is not in init stage.");
    RETURN_ERROR_IF(cctx->staticSize, memory_allocation,
                    "no malloc for static CCtx");
    DEBUGLOG(4, "ZSTD_CCtx_loadDictionary_advanced (size: %u)", (U32)dictSize);

    ZSTD_clearAllDicts(cctx);  /* in case one already exists */
    if (dict == NULL || dictSize == 0) {
        return 0;   /* no dictionary mode */
    }

    if (dictLoadMethod != ZSTD_dlm_byRef) {
        /* private copy : from now on, reference the copy */
        void* dictBuffer = ZSTD_malloc(dictSize, cctx->customMem);
        RETURN_ERROR_IF(!dictBuffer, memory_allocation, "NULL pointer!");
        memcpy(dictBuffer, dict, dictSize);
        cctx->localDict.dictBuffer = dictBuffer;
        dict = dictBuffer;
    }

    cctx->localDict.dict = dict;
    cctx->localDict.dictSize = dictSize;
    cctx->localDict.dictContentType = dictContentType;
    return 0;
}
916*c03c5b1cSMartin Matuska 
ZSTD_CCtx_loadDictionary_byReference(ZSTD_CCtx * cctx,const void * dict,size_t dictSize)917*c03c5b1cSMartin Matuska ZSTDLIB_API size_t ZSTD_CCtx_loadDictionary_byReference(
918*c03c5b1cSMartin Matuska       ZSTD_CCtx* cctx, const void* dict, size_t dictSize)
919*c03c5b1cSMartin Matuska {
920*c03c5b1cSMartin Matuska     return ZSTD_CCtx_loadDictionary_advanced(
921*c03c5b1cSMartin Matuska             cctx, dict, dictSize, ZSTD_dlm_byRef, ZSTD_dct_auto);
922*c03c5b1cSMartin Matuska }
923*c03c5b1cSMartin Matuska 
ZSTD_CCtx_loadDictionary(ZSTD_CCtx * cctx,const void * dict,size_t dictSize)924*c03c5b1cSMartin Matuska ZSTDLIB_API size_t ZSTD_CCtx_loadDictionary(ZSTD_CCtx* cctx, const void* dict, size_t dictSize)
925*c03c5b1cSMartin Matuska {
926*c03c5b1cSMartin Matuska     return ZSTD_CCtx_loadDictionary_advanced(
927*c03c5b1cSMartin Matuska             cctx, dict, dictSize, ZSTD_dlm_byCopy, ZSTD_dct_auto);
928*c03c5b1cSMartin Matuska }
929*c03c5b1cSMartin Matuska 
930*c03c5b1cSMartin Matuska 
/*! ZSTD_CCtx_refCDict() :
 *  Makes `cctx` reference `cdict`, after clearing any dictionary
 *  previously set on the context. `cdict` is stored as provided.
 *  Only allowed while `cctx` is in init stage.
 * @return : 0, or stage_wrong. */
size_t ZSTD_CCtx_refCDict(ZSTD_CCtx* cctx, const ZSTD_CDict* cdict)
{
    RETURN_ERROR_IF(cctx->streamStage != zcss_init, stage_wrong,
                    "Can't ref a dict when ctx not in init stage.");

    /* Free the existing local cdict (if any) to save memory. */
    ZSTD_clearAllDicts(cctx);

    cctx->cdict = cdict;
    return 0;
}
940*c03c5b1cSMartin Matuska 
/*! ZSTD_CCtx_refPrefix() :
 *  Same as ZSTD_CCtx_refPrefix_advanced(), using ZSTD_dct_rawContent. */
size_t ZSTD_CCtx_refPrefix(ZSTD_CCtx* cctx, const void* prefix, size_t prefixSize)
{
    ZSTD_dictContentType_e const contentType = ZSTD_dct_rawContent;
    return ZSTD_CCtx_refPrefix_advanced(cctx, prefix, prefixSize, contentType);
}
945*c03c5b1cSMartin Matuska 
/*! ZSTD_CCtx_refPrefix_advanced() :
 *  Records `prefix` as the prefix dictionary of `cctx`,
 *  after clearing any dictionary previously set on the context.
 *  Only the pointer, size and content type are stored.
 *  A NULL `prefix` or a zero `prefixSize` leaves `cctx` without prefix.
 *  Only allowed while `cctx` is in init stage.
 * @return : 0, or stage_wrong. */
size_t ZSTD_CCtx_refPrefix_advanced(
        ZSTD_CCtx* cctx, const void* prefix, size_t prefixSize, ZSTD_dictContentType_e dictContentType)
{
    RETURN_ERROR_IF(cctx->streamStage != zcss_init, stage_wrong,
                    "Can't ref a prefix when ctx not in init stage.");

    ZSTD_clearAllDicts(cctx);
    if (prefix == NULL || prefixSize == 0) {
        return 0;   /* nothing to reference */
    }

    cctx->prefixDict.dict = prefix;
    cctx->prefixDict.dictSize = prefixSize;
    cctx->prefixDict.dictContentType = dictContentType;
    return 0;
}
959*c03c5b1cSMartin Matuska 
960*c03c5b1cSMartin Matuska /*! ZSTD_CCtx_reset() :
961*c03c5b1cSMartin Matuska  *  Also dumps dictionary */
ZSTD_CCtx_reset(ZSTD_CCtx * cctx,ZSTD_ResetDirective reset)962*c03c5b1cSMartin Matuska size_t ZSTD_CCtx_reset(ZSTD_CCtx* cctx, ZSTD_ResetDirective reset)
963*c03c5b1cSMartin Matuska {
964*c03c5b1cSMartin Matuska     if ( (reset == ZSTD_reset_session_only)
965*c03c5b1cSMartin Matuska       || (reset == ZSTD_reset_session_and_parameters) ) {
966*c03c5b1cSMartin Matuska         cctx->streamStage = zcss_init;
967*c03c5b1cSMartin Matuska         cctx->pledgedSrcSizePlusOne = 0;
968*c03c5b1cSMartin Matuska     }
969*c03c5b1cSMartin Matuska     if ( (reset == ZSTD_reset_parameters)
970*c03c5b1cSMartin Matuska       || (reset == ZSTD_reset_session_and_parameters) ) {
971*c03c5b1cSMartin Matuska         RETURN_ERROR_IF(cctx->streamStage != zcss_init, stage_wrong,
972*c03c5b1cSMartin Matuska                         "Can't reset parameters only when not in init stage.");
973*c03c5b1cSMartin Matuska         ZSTD_clearAllDicts(cctx);
974*c03c5b1cSMartin Matuska         return ZSTD_CCtxParams_reset(&cctx->requestedParams);
975*c03c5b1cSMartin Matuska     }
976*c03c5b1cSMartin Matuska     return 0;
977*c03c5b1cSMartin Matuska }
978*c03c5b1cSMartin Matuska 
979*c03c5b1cSMartin Matuska 
980*c03c5b1cSMartin Matuska /** ZSTD_checkCParams() :
981*c03c5b1cSMartin Matuska     control CParam values remain within authorized range.
982*c03c5b1cSMartin Matuska     @return : 0, or an error code if one value is beyond authorized range */
ZSTD_checkCParams(ZSTD_compressionParameters cParams)983*c03c5b1cSMartin Matuska size_t ZSTD_checkCParams(ZSTD_compressionParameters cParams)
984*c03c5b1cSMartin Matuska {
985*c03c5b1cSMartin Matuska     BOUNDCHECK(ZSTD_c_windowLog, (int)cParams.windowLog);
986*c03c5b1cSMartin Matuska     BOUNDCHECK(ZSTD_c_chainLog,  (int)cParams.chainLog);
987*c03c5b1cSMartin Matuska     BOUNDCHECK(ZSTD_c_hashLog,   (int)cParams.hashLog);
988*c03c5b1cSMartin Matuska     BOUNDCHECK(ZSTD_c_searchLog, (int)cParams.searchLog);
989*c03c5b1cSMartin Matuska     BOUNDCHECK(ZSTD_c_minMatch,  (int)cParams.minMatch);
990*c03c5b1cSMartin Matuska     BOUNDCHECK(ZSTD_c_targetLength,(int)cParams.targetLength);
991*c03c5b1cSMartin Matuska     BOUNDCHECK(ZSTD_c_strategy,  cParams.strategy);
992*c03c5b1cSMartin Matuska     return 0;
993*c03c5b1cSMartin Matuska }
994*c03c5b1cSMartin Matuska 
995*c03c5b1cSMartin Matuska /** ZSTD_clampCParams() :
996*c03c5b1cSMartin Matuska  *  make CParam values within valid range.
997*c03c5b1cSMartin Matuska  *  @return : valid CParams */
998*c03c5b1cSMartin Matuska static ZSTD_compressionParameters
ZSTD_clampCParams(ZSTD_compressionParameters cParams)999*c03c5b1cSMartin Matuska ZSTD_clampCParams(ZSTD_compressionParameters cParams)
1000*c03c5b1cSMartin Matuska {
1001*c03c5b1cSMartin Matuska #   define CLAMP_TYPE(cParam, val, type) {                                \
1002*c03c5b1cSMartin Matuska         ZSTD_bounds const bounds = ZSTD_cParam_getBounds(cParam);         \
1003*c03c5b1cSMartin Matuska         if ((int)val<bounds.lowerBound) val=(type)bounds.lowerBound;      \
1004*c03c5b1cSMartin Matuska         else if ((int)val>bounds.upperBound) val=(type)bounds.upperBound; \
1005*c03c5b1cSMartin Matuska     }
1006*c03c5b1cSMartin Matuska #   define CLAMP(cParam, val) CLAMP_TYPE(cParam, val, unsigned)
1007*c03c5b1cSMartin Matuska     CLAMP(ZSTD_c_windowLog, cParams.windowLog);
1008*c03c5b1cSMartin Matuska     CLAMP(ZSTD_c_chainLog,  cParams.chainLog);
1009*c03c5b1cSMartin Matuska     CLAMP(ZSTD_c_hashLog,   cParams.hashLog);
1010*c03c5b1cSMartin Matuska     CLAMP(ZSTD_c_searchLog, cParams.searchLog);
1011*c03c5b1cSMartin Matuska     CLAMP(ZSTD_c_minMatch,  cParams.minMatch);
1012*c03c5b1cSMartin Matuska     CLAMP(ZSTD_c_targetLength,cParams.targetLength);
1013*c03c5b1cSMartin Matuska     CLAMP_TYPE(ZSTD_c_strategy,cParams.strategy, ZSTD_strategy);
1014*c03c5b1cSMartin Matuska     return cParams;
1015*c03c5b1cSMartin Matuska }
1016*c03c5b1cSMartin Matuska 
1017*c03c5b1cSMartin Matuska /** ZSTD_cycleLog() :
1018*c03c5b1cSMartin Matuska  *  condition for correct operation : hashLog > 1 */
ZSTD_cycleLog(U32 hashLog,ZSTD_strategy strat)1019*c03c5b1cSMartin Matuska U32 ZSTD_cycleLog(U32 hashLog, ZSTD_strategy strat)
1020*c03c5b1cSMartin Matuska {
1021*c03c5b1cSMartin Matuska     U32 const btScale = ((U32)strat >= (U32)ZSTD_btlazy2);
1022*c03c5b1cSMartin Matuska     return hashLog - btScale;
1023*c03c5b1cSMartin Matuska }
1024*c03c5b1cSMartin Matuska 
1025*c03c5b1cSMartin Matuska /** ZSTD_adjustCParams_internal() :
1026*c03c5b1cSMartin Matuska  *  optimize `cPar` for a specified input (`srcSize` and `dictSize`).
1027*c03c5b1cSMartin Matuska  *  mostly downsize to reduce memory consumption and initialization latency.
1028*c03c5b1cSMartin Matuska  * `srcSize` can be ZSTD_CONTENTSIZE_UNKNOWN when not known.
1029*c03c5b1cSMartin Matuska  *  note : `srcSize==0` means 0!
1030*c03c5b1cSMartin Matuska  *  condition : cPar is presumed validated (can be checked using ZSTD_checkCParams()). */
1031*c03c5b1cSMartin Matuska static ZSTD_compressionParameters
ZSTD_adjustCParams_internal(ZSTD_compressionParameters cPar,unsigned long long srcSize,size_t dictSize)1032*c03c5b1cSMartin Matuska ZSTD_adjustCParams_internal(ZSTD_compressionParameters cPar,
1033*c03c5b1cSMartin Matuska                             unsigned long long srcSize,
1034*c03c5b1cSMartin Matuska                             size_t dictSize)
1035*c03c5b1cSMartin Matuska {
1036*c03c5b1cSMartin Matuska     static const U64 minSrcSize = 513; /* (1<<9) + 1 */
1037*c03c5b1cSMartin Matuska     static const U64 maxWindowResize = 1ULL << (ZSTD_WINDOWLOG_MAX-1);
1038*c03c5b1cSMartin Matuska     assert(ZSTD_checkCParams(cPar)==0);
1039*c03c5b1cSMartin Matuska 
1040*c03c5b1cSMartin Matuska     if (dictSize && srcSize == ZSTD_CONTENTSIZE_UNKNOWN)
1041*c03c5b1cSMartin Matuska         srcSize = minSrcSize;
1042*c03c5b1cSMartin Matuska 
1043*c03c5b1cSMartin Matuska     /* resize windowLog if input is small enough, to use less memory */
1044*c03c5b1cSMartin Matuska     if ( (srcSize < maxWindowResize)
1045*c03c5b1cSMartin Matuska       && (dictSize < maxWindowResize) )  {
1046*c03c5b1cSMartin Matuska         U32 const tSize = (U32)(srcSize + dictSize);
1047*c03c5b1cSMartin Matuska         static U32 const hashSizeMin = 1 << ZSTD_HASHLOG_MIN;
1048*c03c5b1cSMartin Matuska         U32 const srcLog = (tSize < hashSizeMin) ? ZSTD_HASHLOG_MIN :
1049*c03c5b1cSMartin Matuska                             ZSTD_highbit32(tSize-1) + 1;
1050*c03c5b1cSMartin Matuska         if (cPar.windowLog > srcLog) cPar.windowLog = srcLog;
1051*c03c5b1cSMartin Matuska     }
1052*c03c5b1cSMartin Matuska     if (cPar.hashLog > cPar.windowLog+1) cPar.hashLog = cPar.windowLog+1;
1053*c03c5b1cSMartin Matuska     {   U32 const cycleLog = ZSTD_cycleLog(cPar.chainLog, cPar.strategy);
1054*c03c5b1cSMartin Matuska         if (cycleLog > cPar.windowLog)
1055*c03c5b1cSMartin Matuska             cPar.chainLog -= (cycleLog - cPar.windowLog);
1056*c03c5b1cSMartin Matuska     }
1057*c03c5b1cSMartin Matuska 
1058*c03c5b1cSMartin Matuska     if (cPar.windowLog < ZSTD_WINDOWLOG_ABSOLUTEMIN)
1059*c03c5b1cSMartin Matuska         cPar.windowLog = ZSTD_WINDOWLOG_ABSOLUTEMIN;  /* minimum wlog required for valid frame header */
1060*c03c5b1cSMartin Matuska 
1061*c03c5b1cSMartin Matuska     return cPar;
1062*c03c5b1cSMartin Matuska }
1063*c03c5b1cSMartin Matuska 
1064*c03c5b1cSMartin Matuska ZSTD_compressionParameters
ZSTD_adjustCParams(ZSTD_compressionParameters cPar,unsigned long long srcSize,size_t dictSize)1065*c03c5b1cSMartin Matuska ZSTD_adjustCParams(ZSTD_compressionParameters cPar,
1066*c03c5b1cSMartin Matuska                    unsigned long long srcSize,
1067*c03c5b1cSMartin Matuska                    size_t dictSize)
1068*c03c5b1cSMartin Matuska {
1069*c03c5b1cSMartin Matuska     cPar = ZSTD_clampCParams(cPar);   /* resulting cPar is necessarily valid (all parameters within range) */
1070*c03c5b1cSMartin Matuska     if (srcSize == 0) srcSize = ZSTD_CONTENTSIZE_UNKNOWN;
1071*c03c5b1cSMartin Matuska     return ZSTD_adjustCParams_internal(cPar, srcSize, dictSize);
1072*c03c5b1cSMartin Matuska }
1073*c03c5b1cSMartin Matuska 
1074*c03c5b1cSMartin Matuska static ZSTD_compressionParameters ZSTD_getCParams_internal(int compressionLevel, unsigned long long srcSizeHint, size_t dictSize);
1075*c03c5b1cSMartin Matuska static ZSTD_parameters ZSTD_getParams_internal(int compressionLevel, unsigned long long srcSizeHint, size_t dictSize);
1076*c03c5b1cSMartin Matuska 
ZSTD_getCParamsFromCCtxParams(const ZSTD_CCtx_params * CCtxParams,U64 srcSizeHint,size_t dictSize)1077*c03c5b1cSMartin Matuska ZSTD_compressionParameters ZSTD_getCParamsFromCCtxParams(
1078*c03c5b1cSMartin Matuska         const ZSTD_CCtx_params* CCtxParams, U64 srcSizeHint, size_t dictSize)
1079*c03c5b1cSMartin Matuska {
1080*c03c5b1cSMartin Matuska     ZSTD_compressionParameters cParams;
1081*c03c5b1cSMartin Matuska     if (srcSizeHint == ZSTD_CONTENTSIZE_UNKNOWN && CCtxParams->srcSizeHint > 0) {
1082*c03c5b1cSMartin Matuska       srcSizeHint = CCtxParams->srcSizeHint;
1083*c03c5b1cSMartin Matuska     }
1084*c03c5b1cSMartin Matuska     cParams = ZSTD_getCParams_internal(CCtxParams->compressionLevel, srcSizeHint, dictSize);
1085*c03c5b1cSMartin Matuska     if (CCtxParams->ldmParams.enableLdm) cParams.windowLog = ZSTD_LDM_DEFAULT_WINDOW_LOG;
1086*c03c5b1cSMartin Matuska     if (CCtxParams->cParams.windowLog) cParams.windowLog = CCtxParams->cParams.windowLog;
1087*c03c5b1cSMartin Matuska     if (CCtxParams->cParams.hashLog) cParams.hashLog = CCtxParams->cParams.hashLog;
1088*c03c5b1cSMartin Matuska     if (CCtxParams->cParams.chainLog) cParams.chainLog = CCtxParams->cParams.chainLog;
1089*c03c5b1cSMartin Matuska     if (CCtxParams->cParams.searchLog) cParams.searchLog = CCtxParams->cParams.searchLog;
1090*c03c5b1cSMartin Matuska     if (CCtxParams->cParams.minMatch) cParams.minMatch = CCtxParams->cParams.minMatch;
1091*c03c5b1cSMartin Matuska     if (CCtxParams->cParams.targetLength) cParams.targetLength = CCtxParams->cParams.targetLength;
1092*c03c5b1cSMartin Matuska     if (CCtxParams->cParams.strategy) cParams.strategy = CCtxParams->cParams.strategy;
1093*c03c5b1cSMartin Matuska     assert(!ZSTD_checkCParams(cParams));
1094*c03c5b1cSMartin Matuska     /* srcSizeHint == 0 means 0 */
1095*c03c5b1cSMartin Matuska     return ZSTD_adjustCParams_internal(cParams, srcSizeHint, dictSize);
1096*c03c5b1cSMartin Matuska }
1097*c03c5b1cSMartin Matuska 
1098*c03c5b1cSMartin Matuska static size_t
ZSTD_sizeof_matchState(const ZSTD_compressionParameters * const cParams,const U32 forCCtx)1099*c03c5b1cSMartin Matuska ZSTD_sizeof_matchState(const ZSTD_compressionParameters* const cParams,
1100*c03c5b1cSMartin Matuska                        const U32 forCCtx)
1101*c03c5b1cSMartin Matuska {
1102*c03c5b1cSMartin Matuska     size_t const chainSize = (cParams->strategy == ZSTD_fast) ? 0 : ((size_t)1 << cParams->chainLog);
1103*c03c5b1cSMartin Matuska     size_t const hSize = ((size_t)1) << cParams->hashLog;
1104*c03c5b1cSMartin Matuska     U32    const hashLog3 = (forCCtx && cParams->minMatch==3) ? MIN(ZSTD_HASHLOG3_MAX, cParams->windowLog) : 0;
1105*c03c5b1cSMartin Matuska     size_t const h3Size = hashLog3 ? ((size_t)1) << hashLog3 : 0;
1106*c03c5b1cSMartin Matuska     /* We don't use ZSTD_cwksp_alloc_size() here because the tables aren't
1107*c03c5b1cSMartin Matuska      * surrounded by redzones in ASAN. */
1108*c03c5b1cSMartin Matuska     size_t const tableSpace = chainSize * sizeof(U32)
1109*c03c5b1cSMartin Matuska                             + hSize * sizeof(U32)
1110*c03c5b1cSMartin Matuska                             + h3Size * sizeof(U32);
1111*c03c5b1cSMartin Matuska     size_t const optPotentialSpace =
1112*c03c5b1cSMartin Matuska         ZSTD_cwksp_alloc_size((MaxML+1) * sizeof(U32))
1113*c03c5b1cSMartin Matuska       + ZSTD_cwksp_alloc_size((MaxLL+1) * sizeof(U32))
1114*c03c5b1cSMartin Matuska       + ZSTD_cwksp_alloc_size((MaxOff+1) * sizeof(U32))
1115*c03c5b1cSMartin Matuska       + ZSTD_cwksp_alloc_size((1<<Litbits) * sizeof(U32))
1116*c03c5b1cSMartin Matuska       + ZSTD_cwksp_alloc_size((ZSTD_OPT_NUM+1) * sizeof(ZSTD_match_t))
1117*c03c5b1cSMartin Matuska       + ZSTD_cwksp_alloc_size((ZSTD_OPT_NUM+1) * sizeof(ZSTD_optimal_t));
1118*c03c5b1cSMartin Matuska     size_t const optSpace = (forCCtx && (cParams->strategy >= ZSTD_btopt))
1119*c03c5b1cSMartin Matuska                                 ? optPotentialSpace
1120*c03c5b1cSMartin Matuska                                 : 0;
1121*c03c5b1cSMartin Matuska     DEBUGLOG(4, "chainSize: %u - hSize: %u - h3Size: %u",
1122*c03c5b1cSMartin Matuska                 (U32)chainSize, (U32)hSize, (U32)h3Size);
1123*c03c5b1cSMartin Matuska     return tableSpace + optSpace;
1124*c03c5b1cSMartin Matuska }
1125*c03c5b1cSMartin Matuska 
ZSTD_estimateCCtxSize_usingCCtxParams(const ZSTD_CCtx_params * params)1126*c03c5b1cSMartin Matuska size_t ZSTD_estimateCCtxSize_usingCCtxParams(const ZSTD_CCtx_params* params)
1127*c03c5b1cSMartin Matuska {
1128*c03c5b1cSMartin Matuska     RETURN_ERROR_IF(params->nbWorkers > 0, GENERIC, "Estimate CCtx size is supported for single-threaded compression only.");
1129*c03c5b1cSMartin Matuska     {   ZSTD_compressionParameters const cParams =
1130*c03c5b1cSMartin Matuska                 ZSTD_getCParamsFromCCtxParams(params, ZSTD_CONTENTSIZE_UNKNOWN, 0);
1131*c03c5b1cSMartin Matuska         size_t const blockSize = MIN(ZSTD_BLOCKSIZE_MAX, (size_t)1 << cParams.windowLog);
1132*c03c5b1cSMartin Matuska         U32    const divider = (cParams.minMatch==3) ? 3 : 4;
1133*c03c5b1cSMartin Matuska         size_t const maxNbSeq = blockSize / divider;
1134*c03c5b1cSMartin Matuska         size_t const tokenSpace = ZSTD_cwksp_alloc_size(WILDCOPY_OVERLENGTH + blockSize)
1135*c03c5b1cSMartin Matuska                                 + ZSTD_cwksp_alloc_size(maxNbSeq * sizeof(seqDef))
1136*c03c5b1cSMartin Matuska                                 + 3 * ZSTD_cwksp_alloc_size(maxNbSeq * sizeof(BYTE));
1137*c03c5b1cSMartin Matuska         size_t const entropySpace = ZSTD_cwksp_alloc_size(HUF_WORKSPACE_SIZE);
1138*c03c5b1cSMartin Matuska         size_t const blockStateSpace = 2 * ZSTD_cwksp_alloc_size(sizeof(ZSTD_compressedBlockState_t));
1139*c03c5b1cSMartin Matuska         size_t const matchStateSize = ZSTD_sizeof_matchState(&cParams, /* forCCtx */ 1);
1140*c03c5b1cSMartin Matuska 
1141*c03c5b1cSMartin Matuska         size_t const ldmSpace = ZSTD_ldm_getTableSize(params->ldmParams);
1142*c03c5b1cSMartin Matuska         size_t const ldmSeqSpace = ZSTD_cwksp_alloc_size(ZSTD_ldm_getMaxNbSeq(params->ldmParams, blockSize) * sizeof(rawSeq));
1143*c03c5b1cSMartin Matuska 
1144*c03c5b1cSMartin Matuska         /* estimateCCtxSize is for one-shot compression. So no buffers should
1145*c03c5b1cSMartin Matuska          * be needed. However, we still allocate two 0-sized buffers, which can
1146*c03c5b1cSMartin Matuska          * take space under ASAN. */
1147*c03c5b1cSMartin Matuska         size_t const bufferSpace = ZSTD_cwksp_alloc_size(0)
1148*c03c5b1cSMartin Matuska                                  + ZSTD_cwksp_alloc_size(0);
1149*c03c5b1cSMartin Matuska 
1150*c03c5b1cSMartin Matuska         size_t const cctxSpace = ZSTD_cwksp_alloc_size(sizeof(ZSTD_CCtx));
1151*c03c5b1cSMartin Matuska 
1152*c03c5b1cSMartin Matuska         size_t const neededSpace =
1153*c03c5b1cSMartin Matuska             cctxSpace +
1154*c03c5b1cSMartin Matuska             entropySpace +
1155*c03c5b1cSMartin Matuska             blockStateSpace +
1156*c03c5b1cSMartin Matuska             ldmSpace +
1157*c03c5b1cSMartin Matuska             ldmSeqSpace +
1158*c03c5b1cSMartin Matuska             matchStateSize +
1159*c03c5b1cSMartin Matuska             tokenSpace +
1160*c03c5b1cSMartin Matuska             bufferSpace;
1161*c03c5b1cSMartin Matuska 
1162*c03c5b1cSMartin Matuska         DEBUGLOG(5, "estimate workspace : %u", (U32)neededSpace);
1163*c03c5b1cSMartin Matuska         return neededSpace;
1164*c03c5b1cSMartin Matuska     }
1165*c03c5b1cSMartin Matuska }
1166*c03c5b1cSMartin Matuska 
/* ZSTD_estimateCCtxSize_usingCParams() :
 * Wraps `cParams` into a ZSTD_CCtx_params (ZSTD_makeCCtxParamsFromCParams())
 * and returns the estimate of ZSTD_estimateCCtxSize_usingCCtxParams() for it. */
size_t ZSTD_estimateCCtxSize_usingCParams(ZSTD_compressionParameters cParams)
{
    ZSTD_CCtx_params const cctxParams = ZSTD_makeCCtxParamsFromCParams(cParams);
    return ZSTD_estimateCCtxSize_usingCCtxParams(&cctxParams);
}
1172*c03c5b1cSMartin Matuska 
ZSTD_estimateCCtxSize_internal(int compressionLevel)1173*c03c5b1cSMartin Matuska static size_t ZSTD_estimateCCtxSize_internal(int compressionLevel)
1174*c03c5b1cSMartin Matuska {
1175*c03c5b1cSMartin Matuska     ZSTD_compressionParameters const cParams = ZSTD_getCParams_internal(compressionLevel, ZSTD_CONTENTSIZE_UNKNOWN, 0);
1176*c03c5b1cSMartin Matuska     return ZSTD_estimateCCtxSize_usingCParams(cParams);
1177*c03c5b1cSMartin Matuska }
1178*c03c5b1cSMartin Matuska 
/* ZSTD_estimateCCtxSize() :
 * Scans every level from MIN(compressionLevel, 1) up to `compressionLevel`
 * (inclusive) and keeps the largest per-level estimate.
 * @return : the largest ZSTD_estimateCCtxSize_internal() value over that range */
size_t ZSTD_estimateCCtxSize(int compressionLevel)
{
    size_t largest = 0;
    int level = MIN(compressionLevel, 1);
    while (level <= compressionLevel) {
        size_t const estimate = ZSTD_estimateCCtxSize_internal(level);
        if (largest < estimate) largest = estimate;
        level++;
    }
    return largest;
}
1189*c03c5b1cSMartin Matuska 
ZSTD_estimateCStreamSize_usingCCtxParams(const ZSTD_CCtx_params * params)1190*c03c5b1cSMartin Matuska size_t ZSTD_estimateCStreamSize_usingCCtxParams(const ZSTD_CCtx_params* params)
1191*c03c5b1cSMartin Matuska {
1192*c03c5b1cSMartin Matuska     RETURN_ERROR_IF(params->nbWorkers > 0, GENERIC, "Estimate CCtx size is supported for single-threaded compression only.");
1193*c03c5b1cSMartin Matuska     {   ZSTD_compressionParameters const cParams =
1194*c03c5b1cSMartin Matuska                 ZSTD_getCParamsFromCCtxParams(params, ZSTD_CONTENTSIZE_UNKNOWN, 0);
1195*c03c5b1cSMartin Matuska         size_t const CCtxSize = ZSTD_estimateCCtxSize_usingCCtxParams(params);
1196*c03c5b1cSMartin Matuska         size_t const blockSize = MIN(ZSTD_BLOCKSIZE_MAX, (size_t)1 << cParams.windowLog);
1197*c03c5b1cSMartin Matuska         size_t const inBuffSize = ((size_t)1 << cParams.windowLog) + blockSize;
1198*c03c5b1cSMartin Matuska         size_t const outBuffSize = ZSTD_compressBound(blockSize) + 1;
1199*c03c5b1cSMartin Matuska         size_t const streamingSize = ZSTD_cwksp_alloc_size(inBuffSize)
1200*c03c5b1cSMartin Matuska                                    + ZSTD_cwksp_alloc_size(outBuffSize);
1201*c03c5b1cSMartin Matuska 
1202*c03c5b1cSMartin Matuska         return CCtxSize + streamingSize;
1203*c03c5b1cSMartin Matuska     }
1204*c03c5b1cSMartin Matuska }
1205*c03c5b1cSMartin Matuska 
/* ZSTD_estimateCStreamSize_usingCParams() :
 * Wraps `cParams` into a ZSTD_CCtx_params (ZSTD_makeCCtxParamsFromCParams())
 * and returns the estimate of ZSTD_estimateCStreamSize_usingCCtxParams() for it. */
size_t ZSTD_estimateCStreamSize_usingCParams(ZSTD_compressionParameters cParams)
{
    ZSTD_CCtx_params const cctxParams = ZSTD_makeCCtxParamsFromCParams(cParams);
    return ZSTD_estimateCStreamSize_usingCCtxParams(&cctxParams);
}
1211*c03c5b1cSMartin Matuska 
ZSTD_estimateCStreamSize_internal(int compressionLevel)1212*c03c5b1cSMartin Matuska static size_t ZSTD_estimateCStreamSize_internal(int compressionLevel)
1213*c03c5b1cSMartin Matuska {
1214*c03c5b1cSMartin Matuska     ZSTD_compressionParameters const cParams = ZSTD_getCParams_internal(compressionLevel, ZSTD_CONTENTSIZE_UNKNOWN, 0);
1215*c03c5b1cSMartin Matuska     return ZSTD_estimateCStreamSize_usingCParams(cParams);
1216*c03c5b1cSMartin Matuska }
1217*c03c5b1cSMartin Matuska 
/* ZSTD_estimateCStreamSize() :
 * Scans every level from MIN(compressionLevel, 1) up to `compressionLevel`
 * (inclusive) and keeps the largest per-level estimate.
 * @return : the largest ZSTD_estimateCStreamSize_internal() value over that range */
size_t ZSTD_estimateCStreamSize(int compressionLevel)
{
    size_t largest = 0;
    int level = MIN(compressionLevel, 1);
    while (level <= compressionLevel) {
        size_t const estimate = ZSTD_estimateCStreamSize_internal(level);
        if (largest < estimate) largest = estimate;
        level++;
    }
    return largest;
}
1228*c03c5b1cSMartin Matuska 
1229*c03c5b1cSMartin Matuska /* ZSTD_getFrameProgression():
1230*c03c5b1cSMartin Matuska  * tells how much data has been consumed (input) and produced (output) for current frame.
1231*c03c5b1cSMartin Matuska  * able to count progression inside worker threads (non-blocking mode).
1232*c03c5b1cSMartin Matuska  */
ZSTD_getFrameProgression(const ZSTD_CCtx * cctx)1233*c03c5b1cSMartin Matuska ZSTD_frameProgression ZSTD_getFrameProgression(const ZSTD_CCtx* cctx)
1234*c03c5b1cSMartin Matuska {
1235*c03c5b1cSMartin Matuska #ifdef ZSTD_MULTITHREAD
1236*c03c5b1cSMartin Matuska     if (cctx->appliedParams.nbWorkers > 0) {
1237*c03c5b1cSMartin Matuska         return ZSTDMT_getFrameProgression(cctx->mtctx);
1238*c03c5b1cSMartin Matuska     }
1239*c03c5b1cSMartin Matuska #endif
1240*c03c5b1cSMartin Matuska     {   ZSTD_frameProgression fp;
1241*c03c5b1cSMartin Matuska         size_t const buffered = (cctx->inBuff == NULL) ? 0 :
1242*c03c5b1cSMartin Matuska                                 cctx->inBuffPos - cctx->inToCompress;
1243*c03c5b1cSMartin Matuska         if (buffered) assert(cctx->inBuffPos >= cctx->inToCompress);
1244*c03c5b1cSMartin Matuska         assert(buffered <= ZSTD_BLOCKSIZE_MAX);
1245*c03c5b1cSMartin Matuska         fp.ingested = cctx->consumedSrcSize + buffered;
1246*c03c5b1cSMartin Matuska         fp.consumed = cctx->consumedSrcSize;
1247*c03c5b1cSMartin Matuska         fp.produced = cctx->producedCSize;
1248*c03c5b1cSMartin Matuska         fp.flushed  = cctx->producedCSize;   /* simplified; some data might still be left within streaming output buffer */
1249*c03c5b1cSMartin Matuska         fp.currentJobID = 0;
1250*c03c5b1cSMartin Matuska         fp.nbActiveWorkers = 0;
1251*c03c5b1cSMartin Matuska         return fp;
1252*c03c5b1cSMartin Matuska }   }
1253*c03c5b1cSMartin Matuska 
1254*c03c5b1cSMartin Matuska /*! ZSTD_toFlushNow()
1255*c03c5b1cSMartin Matuska  *  Only useful for multithreading scenarios currently (nbWorkers >= 1).
1256*c03c5b1cSMartin Matuska  */
ZSTD_toFlushNow(ZSTD_CCtx * cctx)1257*c03c5b1cSMartin Matuska size_t ZSTD_toFlushNow(ZSTD_CCtx* cctx)
1258*c03c5b1cSMartin Matuska {
1259*c03c5b1cSMartin Matuska #ifdef ZSTD_MULTITHREAD
1260*c03c5b1cSMartin Matuska     if (cctx->appliedParams.nbWorkers > 0) {
1261*c03c5b1cSMartin Matuska         return ZSTDMT_toFlushNow(cctx->mtctx);
1262*c03c5b1cSMartin Matuska     }
1263*c03c5b1cSMartin Matuska #endif
1264*c03c5b1cSMartin Matuska     (void)cctx;
1265*c03c5b1cSMartin Matuska     return 0;   /* over-simplification; could also check if context is currently running in streaming mode, and in which case, report how many bytes are left to be flushed within output buffer */
1266*c03c5b1cSMartin Matuska }
1267*c03c5b1cSMartin Matuska 
/* ZSTD_assertEqualCParams() :
 * Debug helper : asserts, field by field, that both parameter sets are equal.
 * Has no effect when assert() is compiled out. */
static void ZSTD_assertEqualCParams(ZSTD_compressionParameters cParams1,
                                    ZSTD_compressionParameters cParams2)
{
    /* keep both arguments "used" even when assert() expands to nothing */
    (void)cParams1;
    (void)cParams2;

    assert(cParams1.windowLog    == cParams2.windowLog);
    assert(cParams1.chainLog     == cParams2.chainLog);
    assert(cParams1.hashLog      == cParams2.hashLog);
    assert(cParams1.searchLog    == cParams2.searchLog);
    assert(cParams1.minMatch     == cParams2.minMatch);
    assert(cParams1.targetLength == cParams2.targetLength);
    assert(cParams1.strategy     == cParams2.strategy);
}
1281*c03c5b1cSMartin Matuska 
/* ZSTD_reset_compressedBlockState() :
 * Puts `bs` back into its starting state : the Huffman and the three FSE
 * repeat modes are set to "none", and the repeat offsets are reloaded from
 * repStartValue[]. */
void ZSTD_reset_compressedBlockState(ZSTD_compressedBlockState_t* bs)
{
    int n = 0;

    bs->entropy.huf.repeatMode = HUF_repeat_none;
    bs->entropy.fse.litlength_repeatMode = FSE_repeat_none;
    bs->entropy.fse.matchlength_repeatMode = FSE_repeat_none;
    bs->entropy.fse.offcode_repeatMode = FSE_repeat_none;

    while (n < ZSTD_REP_NUM) {
        bs->rep[n] = repStartValue[n];
        n++;
    }
}
1292*c03c5b1cSMartin Matuska 
1293*c03c5b1cSMartin Matuska /*! ZSTD_invalidateMatchState()
1294*c03c5b1cSMartin Matuska  *  Invalidate all the matches in the match finder tables.
1295*c03c5b1cSMartin Matuska  *  Requires nextSrc and base to be set (can be NULL).
1296*c03c5b1cSMartin Matuska  */
ZSTD_invalidateMatchState(ZSTD_matchState_t * ms)1297*c03c5b1cSMartin Matuska static void ZSTD_invalidateMatchState(ZSTD_matchState_t* ms)
1298*c03c5b1cSMartin Matuska {
1299*c03c5b1cSMartin Matuska     ZSTD_window_clear(&ms->window);
1300*c03c5b1cSMartin Matuska 
1301*c03c5b1cSMartin Matuska     ms->nextToUpdate = ms->window.dictLimit;
1302*c03c5b1cSMartin Matuska     ms->loadedDictEnd = 0;
1303*c03c5b1cSMartin Matuska     ms->opt.litLengthSum = 0;  /* force reset of btopt stats */
1304*c03c5b1cSMartin Matuska     ms->dictMatchState = NULL;
1305*c03c5b1cSMartin Matuska }
1306*c03c5b1cSMartin Matuska 
/**
 * Tells whether a compression goes straight from the user-provided source
 * buffer to the user-provided destination buffer (ZSTDb_not_buffered), or
 * whether the context has to buffer input/output itself (ZSTDb_buffered).
 */
typedef enum {
    ZSTDb_not_buffered = 0,
    ZSTDb_buffered = 1
} ZSTD_buffered_policy_e;
1316*c03c5b1cSMartin Matuska 
/**
 * Selects, for a matchState reset, what happens to the table contents :
 * - ZSTDcrp_makeClean  : tables are cleared / prepared for the coming
 *                        compression.
 * - ZSTDcrp_leaveDirty : tables may be left unclean, because a subsequent
 *                        operation is known to overwrite the table space
 *                        anyways (e.g., copying the matchState contents in
 *                        from a CDict).
 */
typedef enum {
    ZSTDcrp_makeClean = 0,
    ZSTDcrp_leaveDirty = 1
} ZSTD_compResetPolicy_e;
1328*c03c5b1cSMartin Matuska 
/**
 * Selects, for a matchState reset, how indexing proceeds :
 * - ZSTDirp_continue : indexing carries on from where it left off.
 * - ZSTDirp_reset    : indexing is restarted from zero.
 */
typedef enum {
    ZSTDirp_continue = 0,
    ZSTDirp_reset = 1
} ZSTD_indexResetPolicy_e;
1338*c03c5b1cSMartin Matuska 
/**
 * Names the owner of the matchState being reset. ZSTD_reset_matchState()
 * sets up the 3-byte hash table and the optimal parser space only for
 * ZSTD_resetTarget_CCtx.
 */
typedef enum {
    ZSTD_resetTarget_CDict = 0,
    ZSTD_resetTarget_CCtx = 1
} ZSTD_resetTarget_e;
1343*c03c5b1cSMartin Matuska 
1344*c03c5b1cSMartin Matuska static size_t
ZSTD_reset_matchState(ZSTD_matchState_t * ms,ZSTD_cwksp * ws,const ZSTD_compressionParameters * cParams,const ZSTD_compResetPolicy_e crp,const ZSTD_indexResetPolicy_e forceResetIndex,const ZSTD_resetTarget_e forWho)1345*c03c5b1cSMartin Matuska ZSTD_reset_matchState(ZSTD_matchState_t* ms,
1346*c03c5b1cSMartin Matuska                       ZSTD_cwksp* ws,
1347*c03c5b1cSMartin Matuska                 const ZSTD_compressionParameters* cParams,
1348*c03c5b1cSMartin Matuska                 const ZSTD_compResetPolicy_e crp,
1349*c03c5b1cSMartin Matuska                 const ZSTD_indexResetPolicy_e forceResetIndex,
1350*c03c5b1cSMartin Matuska                 const ZSTD_resetTarget_e forWho)
1351*c03c5b1cSMartin Matuska {
1352*c03c5b1cSMartin Matuska     size_t const chainSize = (cParams->strategy == ZSTD_fast) ? 0 : ((size_t)1 << cParams->chainLog);
1353*c03c5b1cSMartin Matuska     size_t const hSize = ((size_t)1) << cParams->hashLog;
1354*c03c5b1cSMartin Matuska     U32    const hashLog3 = ((forWho == ZSTD_resetTarget_CCtx) && cParams->minMatch==3) ? MIN(ZSTD_HASHLOG3_MAX, cParams->windowLog) : 0;
1355*c03c5b1cSMartin Matuska     size_t const h3Size = hashLog3 ? ((size_t)1) << hashLog3 : 0;
1356*c03c5b1cSMartin Matuska 
1357*c03c5b1cSMartin Matuska     DEBUGLOG(4, "reset indices : %u", forceResetIndex == ZSTDirp_reset);
1358*c03c5b1cSMartin Matuska     if (forceResetIndex == ZSTDirp_reset) {
1359*c03c5b1cSMartin Matuska         ZSTD_window_init(&ms->window);
1360*c03c5b1cSMartin Matuska         ZSTD_cwksp_mark_tables_dirty(ws);
1361*c03c5b1cSMartin Matuska     }
1362*c03c5b1cSMartin Matuska 
1363*c03c5b1cSMartin Matuska     ms->hashLog3 = hashLog3;
1364*c03c5b1cSMartin Matuska 
1365*c03c5b1cSMartin Matuska     ZSTD_invalidateMatchState(ms);
1366*c03c5b1cSMartin Matuska 
1367*c03c5b1cSMartin Matuska     assert(!ZSTD_cwksp_reserve_failed(ws)); /* check that allocation hasn't already failed */
1368*c03c5b1cSMartin Matuska 
1369*c03c5b1cSMartin Matuska     ZSTD_cwksp_clear_tables(ws);
1370*c03c5b1cSMartin Matuska 
1371*c03c5b1cSMartin Matuska     DEBUGLOG(5, "reserving table space");
1372*c03c5b1cSMartin Matuska     /* table Space */
1373*c03c5b1cSMartin Matuska     ms->hashTable = (U32*)ZSTD_cwksp_reserve_table(ws, hSize * sizeof(U32));
1374*c03c5b1cSMartin Matuska     ms->chainTable = (U32*)ZSTD_cwksp_reserve_table(ws, chainSize * sizeof(U32));
1375*c03c5b1cSMartin Matuska     ms->hashTable3 = (U32*)ZSTD_cwksp_reserve_table(ws, h3Size * sizeof(U32));
1376*c03c5b1cSMartin Matuska     RETURN_ERROR_IF(ZSTD_cwksp_reserve_failed(ws), memory_allocation,
1377*c03c5b1cSMartin Matuska                     "failed a workspace allocation in ZSTD_reset_matchState");
1378*c03c5b1cSMartin Matuska 
1379*c03c5b1cSMartin Matuska     DEBUGLOG(4, "reset table : %u", crp!=ZSTDcrp_leaveDirty);
1380*c03c5b1cSMartin Matuska     if (crp!=ZSTDcrp_leaveDirty) {
1381*c03c5b1cSMartin Matuska         /* reset tables only */
1382*c03c5b1cSMartin Matuska         ZSTD_cwksp_clean_tables(ws);
1383*c03c5b1cSMartin Matuska     }
1384*c03c5b1cSMartin Matuska 
1385*c03c5b1cSMartin Matuska     /* opt parser space */
1386*c03c5b1cSMartin Matuska     if ((forWho == ZSTD_resetTarget_CCtx) && (cParams->strategy >= ZSTD_btopt)) {
1387*c03c5b1cSMartin Matuska         DEBUGLOG(4, "reserving optimal parser space");
1388*c03c5b1cSMartin Matuska         ms->opt.litFreq = (unsigned*)ZSTD_cwksp_reserve_aligned(ws, (1<<Litbits) * sizeof(unsigned));
1389*c03c5b1cSMartin Matuska         ms->opt.litLengthFreq = (unsigned*)ZSTD_cwksp_reserve_aligned(ws, (MaxLL+1) * sizeof(unsigned));
1390*c03c5b1cSMartin Matuska         ms->opt.matchLengthFreq = (unsigned*)ZSTD_cwksp_reserve_aligned(ws, (MaxML+1) * sizeof(unsigned));
1391*c03c5b1cSMartin Matuska         ms->opt.offCodeFreq = (unsigned*)ZSTD_cwksp_reserve_aligned(ws, (MaxOff+1) * sizeof(unsigned));
1392*c03c5b1cSMartin Matuska         ms->opt.matchTable = (ZSTD_match_t*)ZSTD_cwksp_reserve_aligned(ws, (ZSTD_OPT_NUM+1) * sizeof(ZSTD_match_t));
1393*c03c5b1cSMartin Matuska         ms->opt.priceTable = (ZSTD_optimal_t*)ZSTD_cwksp_reserve_aligned(ws, (ZSTD_OPT_NUM+1) * sizeof(ZSTD_optimal_t));
1394*c03c5b1cSMartin Matuska     }
1395*c03c5b1cSMartin Matuska 
1396*c03c5b1cSMartin Matuska     ms->cParams = *cParams;
1397*c03c5b1cSMartin Matuska 
1398*c03c5b1cSMartin Matuska     RETURN_ERROR_IF(ZSTD_cwksp_reserve_failed(ws), memory_allocation,
1399*c03c5b1cSMartin Matuska                     "failed a workspace allocation in ZSTD_reset_matchState");
1400*c03c5b1cSMartin Matuska 
1401*c03c5b1cSMartin Matuska     return 0;
1402*c03c5b1cSMartin Matuska }
1403*c03c5b1cSMartin Matuska 
1404*c03c5b1cSMartin Matuska /* ZSTD_indexTooCloseToMax() :
1405*c03c5b1cSMartin Matuska  * minor optimization : prefer memset() rather than reduceIndex()
1406*c03c5b1cSMartin Matuska  * which is measurably slow in some circumstances (reported for Visual Studio).
1407*c03c5b1cSMartin Matuska  * Works when re-using a context for a lot of smallish inputs :
1408*c03c5b1cSMartin Matuska  * if all inputs are smaller than ZSTD_INDEXOVERFLOW_MARGIN,
1409*c03c5b1cSMartin Matuska  * memset() will be triggered before reduceIndex().
1410*c03c5b1cSMartin Matuska  */
1411*c03c5b1cSMartin Matuska #define ZSTD_INDEXOVERFLOW_MARGIN (16 MB)
ZSTD_indexTooCloseToMax(ZSTD_window_t w)1412*c03c5b1cSMartin Matuska static int ZSTD_indexTooCloseToMax(ZSTD_window_t w)
1413*c03c5b1cSMartin Matuska {
1414*c03c5b1cSMartin Matuska     return (size_t)(w.nextSrc - w.base) > (ZSTD_CURRENT_MAX - ZSTD_INDEXOVERFLOW_MARGIN);
1415*c03c5b1cSMartin Matuska }
1416*c03c5b1cSMartin Matuska 
1417*c03c5b1cSMartin Matuska /*! ZSTD_resetCCtx_internal() :
1418*c03c5b1cSMartin Matuska     note : `params` are assumed fully validated at this stage */
ZSTD_resetCCtx_internal(ZSTD_CCtx * zc,ZSTD_CCtx_params params,U64 const pledgedSrcSize,ZSTD_compResetPolicy_e const crp,ZSTD_buffered_policy_e const zbuff)1419*c03c5b1cSMartin Matuska static size_t ZSTD_resetCCtx_internal(ZSTD_CCtx* zc,
1420*c03c5b1cSMartin Matuska                                       ZSTD_CCtx_params params,
1421*c03c5b1cSMartin Matuska                                       U64 const pledgedSrcSize,
1422*c03c5b1cSMartin Matuska                                       ZSTD_compResetPolicy_e const crp,
1423*c03c5b1cSMartin Matuska                                       ZSTD_buffered_policy_e const zbuff)
1424*c03c5b1cSMartin Matuska {
1425*c03c5b1cSMartin Matuska     ZSTD_cwksp* const ws = &zc->workspace;
1426*c03c5b1cSMartin Matuska     DEBUGLOG(4, "ZSTD_resetCCtx_internal: pledgedSrcSize=%u, wlog=%u",
1427*c03c5b1cSMartin Matuska                 (U32)pledgedSrcSize, params.cParams.windowLog);
1428*c03c5b1cSMartin Matuska     assert(!ZSTD_isError(ZSTD_checkCParams(params.cParams)));
1429*c03c5b1cSMartin Matuska 
1430*c03c5b1cSMartin Matuska     zc->isFirstBlock = 1;
1431*c03c5b1cSMartin Matuska 
1432*c03c5b1cSMartin Matuska     if (params.ldmParams.enableLdm) {
1433*c03c5b1cSMartin Matuska         /* Adjust long distance matching parameters */
1434*c03c5b1cSMartin Matuska         ZSTD_ldm_adjustParameters(&params.ldmParams, &params.cParams);
1435*c03c5b1cSMartin Matuska         assert(params.ldmParams.hashLog >= params.ldmParams.bucketSizeLog);
1436*c03c5b1cSMartin Matuska         assert(params.ldmParams.hashRateLog < 32);
1437*c03c5b1cSMartin Matuska         zc->ldmState.hashPower = ZSTD_rollingHash_primePower(params.ldmParams.minMatchLength);
1438*c03c5b1cSMartin Matuska     }
1439*c03c5b1cSMartin Matuska 
1440*c03c5b1cSMartin Matuska     {   size_t const windowSize = MAX(1, (size_t)MIN(((U64)1 << params.cParams.windowLog), pledgedSrcSize));
1441*c03c5b1cSMartin Matuska         size_t const blockSize = MIN(ZSTD_BLOCKSIZE_MAX, windowSize);
1442*c03c5b1cSMartin Matuska         U32    const divider = (params.cParams.minMatch==3) ? 3 : 4;
1443*c03c5b1cSMartin Matuska         size_t const maxNbSeq = blockSize / divider;
1444*c03c5b1cSMartin Matuska         size_t const tokenSpace = ZSTD_cwksp_alloc_size(WILDCOPY_OVERLENGTH + blockSize)
1445*c03c5b1cSMartin Matuska                                 + ZSTD_cwksp_alloc_size(maxNbSeq * sizeof(seqDef))
1446*c03c5b1cSMartin Matuska                                 + 3 * ZSTD_cwksp_alloc_size(maxNbSeq * sizeof(BYTE));
1447*c03c5b1cSMartin Matuska         size_t const buffOutSize = (zbuff==ZSTDb_buffered) ? ZSTD_compressBound(blockSize)+1 : 0;
1448*c03c5b1cSMartin Matuska         size_t const buffInSize = (zbuff==ZSTDb_buffered) ? windowSize + blockSize : 0;
1449*c03c5b1cSMartin Matuska         size_t const matchStateSize = ZSTD_sizeof_matchState(&params.cParams, /* forCCtx */ 1);
1450*c03c5b1cSMartin Matuska         size_t const maxNbLdmSeq = ZSTD_ldm_getMaxNbSeq(params.ldmParams, blockSize);
1451*c03c5b1cSMartin Matuska 
1452*c03c5b1cSMartin Matuska         ZSTD_indexResetPolicy_e needsIndexReset = zc->initialized ? ZSTDirp_continue : ZSTDirp_reset;
1453*c03c5b1cSMartin Matuska 
1454*c03c5b1cSMartin Matuska         if (ZSTD_indexTooCloseToMax(zc->blockState.matchState.window)) {
1455*c03c5b1cSMartin Matuska             needsIndexReset = ZSTDirp_reset;
1456*c03c5b1cSMartin Matuska         }
1457*c03c5b1cSMartin Matuska 
1458*c03c5b1cSMartin Matuska         if (!zc->staticSize) ZSTD_cwksp_bump_oversized_duration(ws, 0);
1459*c03c5b1cSMartin Matuska 
1460*c03c5b1cSMartin Matuska         /* Check if workspace is large enough, alloc a new one if needed */
1461*c03c5b1cSMartin Matuska         {   size_t const cctxSpace = zc->staticSize ? ZSTD_cwksp_alloc_size(sizeof(ZSTD_CCtx)) : 0;
1462*c03c5b1cSMartin Matuska             size_t const entropySpace = ZSTD_cwksp_alloc_size(HUF_WORKSPACE_SIZE);
1463*c03c5b1cSMartin Matuska             size_t const blockStateSpace = 2 * ZSTD_cwksp_alloc_size(sizeof(ZSTD_compressedBlockState_t));
1464*c03c5b1cSMartin Matuska             size_t const bufferSpace = ZSTD_cwksp_alloc_size(buffInSize) + ZSTD_cwksp_alloc_size(buffOutSize);
1465*c03c5b1cSMartin Matuska             size_t const ldmSpace = ZSTD_ldm_getTableSize(params.ldmParams);
1466*c03c5b1cSMartin Matuska             size_t const ldmSeqSpace = ZSTD_cwksp_alloc_size(maxNbLdmSeq * sizeof(rawSeq));
1467*c03c5b1cSMartin Matuska 
1468*c03c5b1cSMartin Matuska             size_t const neededSpace =
1469*c03c5b1cSMartin Matuska                 cctxSpace +
1470*c03c5b1cSMartin Matuska                 entropySpace +
1471*c03c5b1cSMartin Matuska                 blockStateSpace +
1472*c03c5b1cSMartin Matuska                 ldmSpace +
1473*c03c5b1cSMartin Matuska                 ldmSeqSpace +
1474*c03c5b1cSMartin Matuska                 matchStateSize +
1475*c03c5b1cSMartin Matuska                 tokenSpace +
1476*c03c5b1cSMartin Matuska                 bufferSpace;
1477*c03c5b1cSMartin Matuska 
1478*c03c5b1cSMartin Matuska             int const workspaceTooSmall = ZSTD_cwksp_sizeof(ws) < neededSpace;
1479*c03c5b1cSMartin Matuska             int const workspaceWasteful = ZSTD_cwksp_check_wasteful(ws, neededSpace);
1480*c03c5b1cSMartin Matuska 
1481*c03c5b1cSMartin Matuska             DEBUGLOG(4, "Need %zuKB workspace, including %zuKB for match state, and %zuKB for buffers",
1482*c03c5b1cSMartin Matuska                         neededSpace>>10, matchStateSize>>10, bufferSpace>>10);
1483*c03c5b1cSMartin Matuska             DEBUGLOG(4, "windowSize: %zu - blockSize: %zu", windowSize, blockSize);
1484*c03c5b1cSMartin Matuska 
1485*c03c5b1cSMartin Matuska             if (workspaceTooSmall || workspaceWasteful) {
1486*c03c5b1cSMartin Matuska                 DEBUGLOG(4, "Resize workspaceSize from %zuKB to %zuKB",
1487*c03c5b1cSMartin Matuska                             ZSTD_cwksp_sizeof(ws) >> 10,
1488*c03c5b1cSMartin Matuska                             neededSpace >> 10);
1489*c03c5b1cSMartin Matuska 
1490*c03c5b1cSMartin Matuska                 RETURN_ERROR_IF(zc->staticSize, memory_allocation, "static cctx : no resize");
1491*c03c5b1cSMartin Matuska 
1492*c03c5b1cSMartin Matuska                 needsIndexReset = ZSTDirp_reset;
1493*c03c5b1cSMartin Matuska 
1494*c03c5b1cSMartin Matuska                 ZSTD_cwksp_free(ws, zc->customMem);
1495*c03c5b1cSMartin Matuska                 FORWARD_IF_ERROR(ZSTD_cwksp_create(ws, neededSpace, zc->customMem), "");
1496*c03c5b1cSMartin Matuska 
1497*c03c5b1cSMartin Matuska                 DEBUGLOG(5, "reserving object space");
1498*c03c5b1cSMartin Matuska                 /* Statically sized space.
1499*c03c5b1cSMartin Matuska                  * entropyWorkspace never moves,
1500*c03c5b1cSMartin Matuska                  * though prev/next block swap places */
1501*c03c5b1cSMartin Matuska                 assert(ZSTD_cwksp_check_available(ws, 2 * sizeof(ZSTD_compressedBlockState_t)));
1502*c03c5b1cSMartin Matuska                 zc->blockState.prevCBlock = (ZSTD_compressedBlockState_t*) ZSTD_cwksp_reserve_object(ws, sizeof(ZSTD_compressedBlockState_t));
1503*c03c5b1cSMartin Matuska                 RETURN_ERROR_IF(zc->blockState.prevCBlock == NULL, memory_allocation, "couldn't allocate prevCBlock");
1504*c03c5b1cSMartin Matuska                 zc->blockState.nextCBlock = (ZSTD_compressedBlockState_t*) ZSTD_cwksp_reserve_object(ws, sizeof(ZSTD_compressedBlockState_t));
1505*c03c5b1cSMartin Matuska                 RETURN_ERROR_IF(zc->blockState.nextCBlock == NULL, memory_allocation, "couldn't allocate nextCBlock");
1506*c03c5b1cSMartin Matuska                 zc->entropyWorkspace = (U32*) ZSTD_cwksp_reserve_object(ws, HUF_WORKSPACE_SIZE);
1507*c03c5b1cSMartin Matuska                 RETURN_ERROR_IF(zc->blockState.nextCBlock == NULL, memory_allocation, "couldn't allocate entropyWorkspace");
1508*c03c5b1cSMartin Matuska         }   }
1509*c03c5b1cSMartin Matuska 
1510*c03c5b1cSMartin Matuska         ZSTD_cwksp_clear(ws);
1511*c03c5b1cSMartin Matuska 
1512*c03c5b1cSMartin Matuska         /* init params */
1513*c03c5b1cSMartin Matuska         zc->appliedParams = params;
1514*c03c5b1cSMartin Matuska         zc->blockState.matchState.cParams = params.cParams;
1515*c03c5b1cSMartin Matuska         zc->pledgedSrcSizePlusOne = pledgedSrcSize+1;
1516*c03c5b1cSMartin Matuska         zc->consumedSrcSize = 0;
1517*c03c5b1cSMartin Matuska         zc->producedCSize = 0;
1518*c03c5b1cSMartin Matuska         if (pledgedSrcSize == ZSTD_CONTENTSIZE_UNKNOWN)
1519*c03c5b1cSMartin Matuska             zc->appliedParams.fParams.contentSizeFlag = 0;
1520*c03c5b1cSMartin Matuska         DEBUGLOG(4, "pledged content size : %u ; flag : %u",
1521*c03c5b1cSMartin Matuska             (unsigned)pledgedSrcSize, zc->appliedParams.fParams.contentSizeFlag);
1522*c03c5b1cSMartin Matuska         zc->blockSize = blockSize;
1523*c03c5b1cSMartin Matuska 
1524*c03c5b1cSMartin Matuska         XXH64_reset(&zc->xxhState, 0);
1525*c03c5b1cSMartin Matuska         zc->stage = ZSTDcs_init;
1526*c03c5b1cSMartin Matuska         zc->dictID = 0;
1527*c03c5b1cSMartin Matuska 
1528*c03c5b1cSMartin Matuska         ZSTD_reset_compressedBlockState(zc->blockState.prevCBlock);
1529*c03c5b1cSMartin Matuska 
1530*c03c5b1cSMartin Matuska         /* ZSTD_wildcopy() is used to copy into the literals buffer,
1531*c03c5b1cSMartin Matuska          * so we have to oversize the buffer by WILDCOPY_OVERLENGTH bytes.
1532*c03c5b1cSMartin Matuska          */
1533*c03c5b1cSMartin Matuska         zc->seqStore.litStart = ZSTD_cwksp_reserve_buffer(ws, blockSize + WILDCOPY_OVERLENGTH);
1534*c03c5b1cSMartin Matuska         zc->seqStore.maxNbLit = blockSize;
1535*c03c5b1cSMartin Matuska 
1536*c03c5b1cSMartin Matuska         /* buffers */
1537*c03c5b1cSMartin Matuska         zc->inBuffSize = buffInSize;
1538*c03c5b1cSMartin Matuska         zc->inBuff = (char*)ZSTD_cwksp_reserve_buffer(ws, buffInSize);
1539*c03c5b1cSMartin Matuska         zc->outBuffSize = buffOutSize;
1540*c03c5b1cSMartin Matuska         zc->outBuff = (char*)ZSTD_cwksp_reserve_buffer(ws, buffOutSize);
1541*c03c5b1cSMartin Matuska 
1542*c03c5b1cSMartin Matuska         /* ldm bucketOffsets table */
1543*c03c5b1cSMartin Matuska         if (params.ldmParams.enableLdm) {
1544*c03c5b1cSMartin Matuska             /* TODO: avoid memset? */
1545*c03c5b1cSMartin Matuska             size_t const ldmBucketSize =
1546*c03c5b1cSMartin Matuska                   ((size_t)1) << (params.ldmParams.hashLog -
1547*c03c5b1cSMartin Matuska                                   params.ldmParams.bucketSizeLog);
1548*c03c5b1cSMartin Matuska             zc->ldmState.bucketOffsets = ZSTD_cwksp_reserve_buffer(ws, ldmBucketSize);
1549*c03c5b1cSMartin Matuska             memset(zc->ldmState.bucketOffsets, 0, ldmBucketSize);
1550*c03c5b1cSMartin Matuska         }
1551*c03c5b1cSMartin Matuska 
1552*c03c5b1cSMartin Matuska         /* sequences storage */
1553*c03c5b1cSMartin Matuska         ZSTD_referenceExternalSequences(zc, NULL, 0);
1554*c03c5b1cSMartin Matuska         zc->seqStore.maxNbSeq = maxNbSeq;
1555*c03c5b1cSMartin Matuska         zc->seqStore.llCode = ZSTD_cwksp_reserve_buffer(ws, maxNbSeq * sizeof(BYTE));
1556*c03c5b1cSMartin Matuska         zc->seqStore.mlCode = ZSTD_cwksp_reserve_buffer(ws, maxNbSeq * sizeof(BYTE));
1557*c03c5b1cSMartin Matuska         zc->seqStore.ofCode = ZSTD_cwksp_reserve_buffer(ws, maxNbSeq * sizeof(BYTE));
1558*c03c5b1cSMartin Matuska         zc->seqStore.sequencesStart = (seqDef*)ZSTD_cwksp_reserve_aligned(ws, maxNbSeq * sizeof(seqDef));
1559*c03c5b1cSMartin Matuska 
1560*c03c5b1cSMartin Matuska         FORWARD_IF_ERROR(ZSTD_reset_matchState(
1561*c03c5b1cSMartin Matuska             &zc->blockState.matchState,
1562*c03c5b1cSMartin Matuska             ws,
1563*c03c5b1cSMartin Matuska             &params.cParams,
1564*c03c5b1cSMartin Matuska             crp,
1565*c03c5b1cSMartin Matuska             needsIndexReset,
1566*c03c5b1cSMartin Matuska             ZSTD_resetTarget_CCtx), "");
1567*c03c5b1cSMartin Matuska 
1568*c03c5b1cSMartin Matuska         /* ldm hash table */
1569*c03c5b1cSMartin Matuska         if (params.ldmParams.enableLdm) {
1570*c03c5b1cSMartin Matuska             /* TODO: avoid memset? */
1571*c03c5b1cSMartin Matuska             size_t const ldmHSize = ((size_t)1) << params.ldmParams.hashLog;
1572*c03c5b1cSMartin Matuska             zc->ldmState.hashTable = (ldmEntry_t*)ZSTD_cwksp_reserve_aligned(ws, ldmHSize * sizeof(ldmEntry_t));
1573*c03c5b1cSMartin Matuska             memset(zc->ldmState.hashTable, 0, ldmHSize * sizeof(ldmEntry_t));
1574*c03c5b1cSMartin Matuska             zc->ldmSequences = (rawSeq*)ZSTD_cwksp_reserve_aligned(ws, maxNbLdmSeq * sizeof(rawSeq));
1575*c03c5b1cSMartin Matuska             zc->maxNbLdmSequences = maxNbLdmSeq;
1576*c03c5b1cSMartin Matuska 
1577*c03c5b1cSMartin Matuska             ZSTD_window_init(&zc->ldmState.window);
1578*c03c5b1cSMartin Matuska             ZSTD_window_clear(&zc->ldmState.window);
1579*c03c5b1cSMartin Matuska             zc->ldmState.loadedDictEnd = 0;
1580*c03c5b1cSMartin Matuska         }
1581*c03c5b1cSMartin Matuska 
1582*c03c5b1cSMartin Matuska         DEBUGLOG(3, "wksp: finished allocating, %zd bytes remain available", ZSTD_cwksp_available_space(ws));
1583*c03c5b1cSMartin Matuska         zc->initialized = 1;
1584*c03c5b1cSMartin Matuska 
1585*c03c5b1cSMartin Matuska         return 0;
1586*c03c5b1cSMartin Matuska     }
1587*c03c5b1cSMartin Matuska }
1588*c03c5b1cSMartin Matuska 
1589*c03c5b1cSMartin Matuska /* ZSTD_invalidateRepCodes() :
1590*c03c5b1cSMartin Matuska  * ensures next compression will not use repcodes from previous block.
1591*c03c5b1cSMartin Matuska  * Note : only works with regular variant;
1592*c03c5b1cSMartin Matuska  *        do not use with extDict variant ! */
ZSTD_invalidateRepCodes(ZSTD_CCtx * cctx)1593*c03c5b1cSMartin Matuska void ZSTD_invalidateRepCodes(ZSTD_CCtx* cctx) {
1594*c03c5b1cSMartin Matuska     int i;
1595*c03c5b1cSMartin Matuska     for (i=0; i<ZSTD_REP_NUM; i++) cctx->blockState.prevCBlock->rep[i] = 0;
1596*c03c5b1cSMartin Matuska     assert(!ZSTD_window_hasExtDict(cctx->blockState.matchState.window));
1597*c03c5b1cSMartin Matuska }
1598*c03c5b1cSMartin Matuska 
1599*c03c5b1cSMartin Matuska /* These are the approximate sizes for each strategy past which copying the
1600*c03c5b1cSMartin Matuska  * dictionary tables into the working context is faster than using them
1601*c03c5b1cSMartin Matuska  * in-place.
1602*c03c5b1cSMartin Matuska  */
1603*c03c5b1cSMartin Matuska static const size_t attachDictSizeCutoffs[ZSTD_STRATEGY_MAX+1] = {
1604*c03c5b1cSMartin Matuska     8 KB,  /* unused */
1605*c03c5b1cSMartin Matuska     8 KB,  /* ZSTD_fast */
1606*c03c5b1cSMartin Matuska     16 KB, /* ZSTD_dfast */
1607*c03c5b1cSMartin Matuska     32 KB, /* ZSTD_greedy */
1608*c03c5b1cSMartin Matuska     32 KB, /* ZSTD_lazy */
1609*c03c5b1cSMartin Matuska     32 KB, /* ZSTD_lazy2 */
1610*c03c5b1cSMartin Matuska     32 KB, /* ZSTD_btlazy2 */
1611*c03c5b1cSMartin Matuska     32 KB, /* ZSTD_btopt */
1612*c03c5b1cSMartin Matuska     8 KB,  /* ZSTD_btultra */
1613*c03c5b1cSMartin Matuska     8 KB   /* ZSTD_btultra2 */
1614*c03c5b1cSMartin Matuska };
1615*c03c5b1cSMartin Matuska 
ZSTD_shouldAttachDict(const ZSTD_CDict * cdict,const ZSTD_CCtx_params * params,U64 pledgedSrcSize)1616*c03c5b1cSMartin Matuska static int ZSTD_shouldAttachDict(const ZSTD_CDict* cdict,
1617*c03c5b1cSMartin Matuska                                  const ZSTD_CCtx_params* params,
1618*c03c5b1cSMartin Matuska                                  U64 pledgedSrcSize)
1619*c03c5b1cSMartin Matuska {
1620*c03c5b1cSMartin Matuska     size_t cutoff = attachDictSizeCutoffs[cdict->matchState.cParams.strategy];
1621*c03c5b1cSMartin Matuska     return ( pledgedSrcSize <= cutoff
1622*c03c5b1cSMartin Matuska           || pledgedSrcSize == ZSTD_CONTENTSIZE_UNKNOWN
1623*c03c5b1cSMartin Matuska           || params->attachDictPref == ZSTD_dictForceAttach )
1624*c03c5b1cSMartin Matuska         && params->attachDictPref != ZSTD_dictForceCopy
1625*c03c5b1cSMartin Matuska         && !params->forceWindow; /* dictMatchState isn't correctly
1626*c03c5b1cSMartin Matuska                                  * handled in _enforceMaxDist */
1627*c03c5b1cSMartin Matuska }
1628*c03c5b1cSMartin Matuska 
1629*c03c5b1cSMartin Matuska static size_t
ZSTD_resetCCtx_byAttachingCDict(ZSTD_CCtx * cctx,const ZSTD_CDict * cdict,ZSTD_CCtx_params params,U64 pledgedSrcSize,ZSTD_buffered_policy_e zbuff)1630*c03c5b1cSMartin Matuska ZSTD_resetCCtx_byAttachingCDict(ZSTD_CCtx* cctx,
1631*c03c5b1cSMartin Matuska                         const ZSTD_CDict* cdict,
1632*c03c5b1cSMartin Matuska                         ZSTD_CCtx_params params,
1633*c03c5b1cSMartin Matuska                         U64 pledgedSrcSize,
1634*c03c5b1cSMartin Matuska                         ZSTD_buffered_policy_e zbuff)
1635*c03c5b1cSMartin Matuska {
1636*c03c5b1cSMartin Matuska     {   const ZSTD_compressionParameters* const cdict_cParams = &cdict->matchState.cParams;
1637*c03c5b1cSMartin Matuska         unsigned const windowLog = params.cParams.windowLog;
1638*c03c5b1cSMartin Matuska         assert(windowLog != 0);
1639*c03c5b1cSMartin Matuska         /* Resize working context table params for input only, since the dict
1640*c03c5b1cSMartin Matuska          * has its own tables. */
1641*c03c5b1cSMartin Matuska         /* pledgeSrcSize == 0 means 0! */
1642*c03c5b1cSMartin Matuska         params.cParams = ZSTD_adjustCParams_internal(*cdict_cParams, pledgedSrcSize, 0);
1643*c03c5b1cSMartin Matuska         params.cParams.windowLog = windowLog;
1644*c03c5b1cSMartin Matuska         FORWARD_IF_ERROR(ZSTD_resetCCtx_internal(cctx, params, pledgedSrcSize,
1645*c03c5b1cSMartin Matuska                                                  ZSTDcrp_makeClean, zbuff), "");
1646*c03c5b1cSMartin Matuska         assert(cctx->appliedParams.cParams.strategy == cdict_cParams->strategy);
1647*c03c5b1cSMartin Matuska     }
1648*c03c5b1cSMartin Matuska 
1649*c03c5b1cSMartin Matuska     {   const U32 cdictEnd = (U32)( cdict->matchState.window.nextSrc
1650*c03c5b1cSMartin Matuska                                   - cdict->matchState.window.base);
1651*c03c5b1cSMartin Matuska         const U32 cdictLen = cdictEnd - cdict->matchState.window.dictLimit;
1652*c03c5b1cSMartin Matuska         if (cdictLen == 0) {
1653*c03c5b1cSMartin Matuska             /* don't even attach dictionaries with no contents */
1654*c03c5b1cSMartin Matuska             DEBUGLOG(4, "skipping attaching empty dictionary");
1655*c03c5b1cSMartin Matuska         } else {
1656*c03c5b1cSMartin Matuska             DEBUGLOG(4, "attaching dictionary into context");
1657*c03c5b1cSMartin Matuska             cctx->blockState.matchState.dictMatchState = &cdict->matchState;
1658*c03c5b1cSMartin Matuska 
1659*c03c5b1cSMartin Matuska             /* prep working match state so dict matches never have negative indices
1660*c03c5b1cSMartin Matuska              * when they are translated to the working context's index space. */
1661*c03c5b1cSMartin Matuska             if (cctx->blockState.matchState.window.dictLimit < cdictEnd) {
1662*c03c5b1cSMartin Matuska                 cctx->blockState.matchState.window.nextSrc =
1663*c03c5b1cSMartin Matuska                     cctx->blockState.matchState.window.base + cdictEnd;
1664*c03c5b1cSMartin Matuska                 ZSTD_window_clear(&cctx->blockState.matchState.window);
1665*c03c5b1cSMartin Matuska             }
1666*c03c5b1cSMartin Matuska             /* loadedDictEnd is expressed within the referential of the active context */
1667*c03c5b1cSMartin Matuska             cctx->blockState.matchState.loadedDictEnd = cctx->blockState.matchState.window.dictLimit;
1668*c03c5b1cSMartin Matuska     }   }
1669*c03c5b1cSMartin Matuska 
1670*c03c5b1cSMartin Matuska     cctx->dictID = cdict->dictID;
1671*c03c5b1cSMartin Matuska 
1672*c03c5b1cSMartin Matuska     /* copy block state */
1673*c03c5b1cSMartin Matuska     memcpy(cctx->blockState.prevCBlock, &cdict->cBlockState, sizeof(cdict->cBlockState));
1674*c03c5b1cSMartin Matuska 
1675*c03c5b1cSMartin Matuska     return 0;
1676*c03c5b1cSMartin Matuska }
1677*c03c5b1cSMartin Matuska 
/* ZSTD_resetCCtx_byCopyingCDict() :
 * Resets `cctx` with the cdict's table parameters (keeping the requested windowLog),
 * then duplicates the cdict's hash and chain tables, window, offsets,
 * dictID and block state into the context.
 * @return : 0, or an error code forwarded from ZSTD_resetCCtx_internal() */
static size_t ZSTD_resetCCtx_byCopyingCDict(ZSTD_CCtx* cctx,
                            const ZSTD_CDict* cdict,
                            ZSTD_CCtx_params params,
                            U64 pledgedSrcSize,
                            ZSTD_buffered_policy_e zbuff)
{
    const ZSTD_matchState_t* const dictMS = &cdict->matchState;
    ZSTD_matchState_t* const workMS = &cctx->blockState.matchState;
    const ZSTD_compressionParameters* const dictCParams = &dictMS->cParams;

    DEBUGLOG(4, "copying dictionary into context");

    {   unsigned const requestedWindowLog = params.cParams.windowLog;
        assert(requestedWindowLog != 0);
        /* Copy only compression parameters related to tables. */
        params.cParams = *dictCParams;
        params.cParams.windowLog = requestedWindowLog;
        FORWARD_IF_ERROR(ZSTD_resetCCtx_internal(cctx, params, pledgedSrcSize,
                                                 ZSTDcrp_leaveDirty, zbuff), "");
        assert(cctx->appliedParams.cParams.strategy == dictCParams->strategy);
        assert(cctx->appliedParams.cParams.hashLog == dictCParams->hashLog);
        assert(cctx->appliedParams.cParams.chainLog == dictCParams->chainLog);
    }

    ZSTD_cwksp_mark_tables_dirty(&cctx->workspace);

    {   /* table sizes, in number of U32 cells */
        size_t const hashCells = (size_t)1 << dictCParams->hashLog;
        size_t chainCells = 0;
        int const h3log = workMS->hashLog3;
        size_t h3Cells = 0;

        /* ZSTD_fast has no chain table to copy */
        if (dictCParams->strategy != ZSTD_fast) chainCells = (size_t)1 << dictCParams->chainLog;
        if (h3log) h3Cells = (size_t)1 << h3log;

        /* copy tables */
        memcpy(workMS->hashTable, dictMS->hashTable, hashCells * sizeof(U32));
        memcpy(workMS->chainTable, dictMS->chainTable, chainCells * sizeof(U32));

        /* Zero the hashTable3, since the cdict never fills it */
        assert(dictMS->hashLog3 == 0);
        memset(workMS->hashTable3, 0, h3Cells * sizeof(U32));
    }

    ZSTD_cwksp_mark_tables_clean(&cctx->workspace);

    /* copy dictionary offsets */
    workMS->window        = dictMS->window;
    workMS->nextToUpdate  = dictMS->nextToUpdate;
    workMS->loadedDictEnd = dictMS->loadedDictEnd;

    cctx->dictID = cdict->dictID;

    /* copy block state */
    memcpy(cctx->blockState.prevCBlock, &cdict->cBlockState, sizeof(cdict->cBlockState));

    return 0;
}
1738*c03c5b1cSMartin Matuska 
1739*c03c5b1cSMartin Matuska /* We have a choice between copying the dictionary context into the working
1740*c03c5b1cSMartin Matuska  * context, or referencing the dictionary context from the working context
1741*c03c5b1cSMartin Matuska  * in-place. We decide here which strategy to use. */
ZSTD_resetCCtx_usingCDict(ZSTD_CCtx * cctx,const ZSTD_CDict * cdict,const ZSTD_CCtx_params * params,U64 pledgedSrcSize,ZSTD_buffered_policy_e zbuff)1742*c03c5b1cSMartin Matuska static size_t ZSTD_resetCCtx_usingCDict(ZSTD_CCtx* cctx,
1743*c03c5b1cSMartin Matuska                             const ZSTD_CDict* cdict,
1744*c03c5b1cSMartin Matuska                             const ZSTD_CCtx_params* params,
1745*c03c5b1cSMartin Matuska                             U64 pledgedSrcSize,
1746*c03c5b1cSMartin Matuska                             ZSTD_buffered_policy_e zbuff)
1747*c03c5b1cSMartin Matuska {
1748*c03c5b1cSMartin Matuska 
1749*c03c5b1cSMartin Matuska     DEBUGLOG(4, "ZSTD_resetCCtx_usingCDict (pledgedSrcSize=%u)",
1750*c03c5b1cSMartin Matuska                 (unsigned)pledgedSrcSize);
1751*c03c5b1cSMartin Matuska 
1752*c03c5b1cSMartin Matuska     if (ZSTD_shouldAttachDict(cdict, params, pledgedSrcSize)) {
1753*c03c5b1cSMartin Matuska         return ZSTD_resetCCtx_byAttachingCDict(
1754*c03c5b1cSMartin Matuska             cctx, cdict, *params, pledgedSrcSize, zbuff);
1755*c03c5b1cSMartin Matuska     } else {
1756*c03c5b1cSMartin Matuska         return ZSTD_resetCCtx_byCopyingCDict(
1757*c03c5b1cSMartin Matuska             cctx, cdict, *params, pledgedSrcSize, zbuff);
1758*c03c5b1cSMartin Matuska     }
1759*c03c5b1cSMartin Matuska }
1760*c03c5b1cSMartin Matuska 
1761*c03c5b1cSMartin Matuska /*! ZSTD_copyCCtx_internal() :
1762*c03c5b1cSMartin Matuska  *  Duplicate an existing context `srcCCtx` into another one `dstCCtx`.
1763*c03c5b1cSMartin Matuska  *  Only works during stage ZSTDcs_init (i.e. after creation, but before first call to ZSTD_compressContinue()).
1764*c03c5b1cSMartin Matuska  *  The "context", in this case, refers to the hash and chain tables,
1765*c03c5b1cSMartin Matuska  *  entropy tables, and dictionary references.
1766*c03c5b1cSMartin Matuska  * `windowLog` value is enforced if != 0, otherwise value is copied from srcCCtx.
1767*c03c5b1cSMartin Matuska  * @return : 0, or an error code */
ZSTD_copyCCtx_internal(ZSTD_CCtx * dstCCtx,const ZSTD_CCtx * srcCCtx,ZSTD_frameParameters fParams,U64 pledgedSrcSize,ZSTD_buffered_policy_e zbuff)1768*c03c5b1cSMartin Matuska static size_t ZSTD_copyCCtx_internal(ZSTD_CCtx* dstCCtx,
1769*c03c5b1cSMartin Matuska                             const ZSTD_CCtx* srcCCtx,
1770*c03c5b1cSMartin Matuska                             ZSTD_frameParameters fParams,
1771*c03c5b1cSMartin Matuska                             U64 pledgedSrcSize,
1772*c03c5b1cSMartin Matuska                             ZSTD_buffered_policy_e zbuff)
1773*c03c5b1cSMartin Matuska {
1774*c03c5b1cSMartin Matuska     DEBUGLOG(5, "ZSTD_copyCCtx_internal");
1775*c03c5b1cSMartin Matuska     RETURN_ERROR_IF(srcCCtx->stage!=ZSTDcs_init, stage_wrong,
1776*c03c5b1cSMartin Matuska                     "Can't copy a ctx that's not in init stage.");
1777*c03c5b1cSMartin Matuska 
1778*c03c5b1cSMartin Matuska     memcpy(&dstCCtx->customMem, &srcCCtx->customMem, sizeof(ZSTD_customMem));
1779*c03c5b1cSMartin Matuska     {   ZSTD_CCtx_params params = dstCCtx->requestedParams;
1780*c03c5b1cSMartin Matuska         /* Copy only compression parameters related to tables. */
1781*c03c5b1cSMartin Matuska         params.cParams = srcCCtx->appliedParams.cParams;
1782*c03c5b1cSMartin Matuska         params.fParams = fParams;
1783*c03c5b1cSMartin Matuska         ZSTD_resetCCtx_internal(dstCCtx, params, pledgedSrcSize,
1784*c03c5b1cSMartin Matuska                                 ZSTDcrp_leaveDirty, zbuff);
1785*c03c5b1cSMartin Matuska         assert(dstCCtx->appliedParams.cParams.windowLog == srcCCtx->appliedParams.cParams.windowLog);
1786*c03c5b1cSMartin Matuska         assert(dstCCtx->appliedParams.cParams.strategy == srcCCtx->appliedParams.cParams.strategy);
1787*c03c5b1cSMartin Matuska         assert(dstCCtx->appliedParams.cParams.hashLog == srcCCtx->appliedParams.cParams.hashLog);
1788*c03c5b1cSMartin Matuska         assert(dstCCtx->appliedParams.cParams.chainLog == srcCCtx->appliedParams.cParams.chainLog);
1789*c03c5b1cSMartin Matuska         assert(dstCCtx->blockState.matchState.hashLog3 == srcCCtx->blockState.matchState.hashLog3);
1790*c03c5b1cSMartin Matuska     }
1791*c03c5b1cSMartin Matuska 
1792*c03c5b1cSMartin Matuska     ZSTD_cwksp_mark_tables_dirty(&dstCCtx->workspace);
1793*c03c5b1cSMartin Matuska 
1794*c03c5b1cSMartin Matuska     /* copy tables */
1795*c03c5b1cSMartin Matuska     {   size_t const chainSize = (srcCCtx->appliedParams.cParams.strategy == ZSTD_fast) ? 0 : ((size_t)1 << srcCCtx->appliedParams.cParams.chainLog);
1796*c03c5b1cSMartin Matuska         size_t const hSize =  (size_t)1 << srcCCtx->appliedParams.cParams.hashLog;
1797*c03c5b1cSMartin Matuska         int const h3log = srcCCtx->blockState.matchState.hashLog3;
1798*c03c5b1cSMartin Matuska         size_t const h3Size = h3log ? ((size_t)1 << h3log) : 0;
1799*c03c5b1cSMartin Matuska 
1800*c03c5b1cSMartin Matuska         memcpy(dstCCtx->blockState.matchState.hashTable,
1801*c03c5b1cSMartin Matuska                srcCCtx->blockState.matchState.hashTable,
1802*c03c5b1cSMartin Matuska                hSize * sizeof(U32));
1803*c03c5b1cSMartin Matuska         memcpy(dstCCtx->blockState.matchState.chainTable,
1804*c03c5b1cSMartin Matuska                srcCCtx->blockState.matchState.chainTable,
1805*c03c5b1cSMartin Matuska                chainSize * sizeof(U32));
1806*c03c5b1cSMartin Matuska         memcpy(dstCCtx->blockState.matchState.hashTable3,
1807*c03c5b1cSMartin Matuska                srcCCtx->blockState.matchState.hashTable3,
1808*c03c5b1cSMartin Matuska                h3Size * sizeof(U32));
1809*c03c5b1cSMartin Matuska     }
1810*c03c5b1cSMartin Matuska 
1811*c03c5b1cSMartin Matuska     ZSTD_cwksp_mark_tables_clean(&dstCCtx->workspace);
1812*c03c5b1cSMartin Matuska 
1813*c03c5b1cSMartin Matuska     /* copy dictionary offsets */
1814*c03c5b1cSMartin Matuska     {
1815*c03c5b1cSMartin Matuska         const ZSTD_matchState_t* srcMatchState = &srcCCtx->blockState.matchState;
1816*c03c5b1cSMartin Matuska         ZSTD_matchState_t* dstMatchState = &dstCCtx->blockState.matchState;
1817*c03c5b1cSMartin Matuska         dstMatchState->window       = srcMatchState->window;
1818*c03c5b1cSMartin Matuska         dstMatchState->nextToUpdate = srcMatchState->nextToUpdate;
1819*c03c5b1cSMartin Matuska         dstMatchState->loadedDictEnd= srcMatchState->loadedDictEnd;
1820*c03c5b1cSMartin Matuska     }
1821*c03c5b1cSMartin Matuska     dstCCtx->dictID = srcCCtx->dictID;
1822*c03c5b1cSMartin Matuska 
1823*c03c5b1cSMartin Matuska     /* copy block state */
1824*c03c5b1cSMartin Matuska     memcpy(dstCCtx->blockState.prevCBlock, srcCCtx->blockState.prevCBlock, sizeof(*srcCCtx->blockState.prevCBlock));
1825*c03c5b1cSMartin Matuska 
1826*c03c5b1cSMartin Matuska     return 0;
1827*c03c5b1cSMartin Matuska }
1828*c03c5b1cSMartin Matuska 
1829*c03c5b1cSMartin Matuska /*! ZSTD_copyCCtx() :
1830*c03c5b1cSMartin Matuska  *  Duplicate an existing context `srcCCtx` into another one `dstCCtx`.
1831*c03c5b1cSMartin Matuska  *  Only works during stage ZSTDcs_init (i.e. after creation, but before first call to ZSTD_compressContinue()).
1832*c03c5b1cSMartin Matuska  *  pledgedSrcSize==0 means "unknown".
1833*c03c5b1cSMartin Matuska *   @return : 0, or an error code */
ZSTD_copyCCtx(ZSTD_CCtx * dstCCtx,const ZSTD_CCtx * srcCCtx,unsigned long long pledgedSrcSize)1834*c03c5b1cSMartin Matuska size_t ZSTD_copyCCtx(ZSTD_CCtx* dstCCtx, const ZSTD_CCtx* srcCCtx, unsigned long long pledgedSrcSize)
1835*c03c5b1cSMartin Matuska {
1836*c03c5b1cSMartin Matuska     ZSTD_frameParameters fParams = { 1 /*content*/, 0 /*checksum*/, 0 /*noDictID*/ };
1837*c03c5b1cSMartin Matuska     ZSTD_buffered_policy_e const zbuff = (ZSTD_buffered_policy_e)(srcCCtx->inBuffSize>0);
1838*c03c5b1cSMartin Matuska     ZSTD_STATIC_ASSERT((U32)ZSTDb_buffered==1);
1839*c03c5b1cSMartin Matuska     if (pledgedSrcSize==0) pledgedSrcSize = ZSTD_CONTENTSIZE_UNKNOWN;
1840*c03c5b1cSMartin Matuska     fParams.contentSizeFlag = (pledgedSrcSize != ZSTD_CONTENTSIZE_UNKNOWN);
1841*c03c5b1cSMartin Matuska 
1842*c03c5b1cSMartin Matuska     return ZSTD_copyCCtx_internal(dstCCtx, srcCCtx,
1843*c03c5b1cSMartin Matuska                                 fParams, pledgedSrcSize,
1844*c03c5b1cSMartin Matuska                                 zbuff);
1845*c03c5b1cSMartin Matuska }
1846*c03c5b1cSMartin Matuska 
1847*c03c5b1cSMartin Matuska 
1848*c03c5b1cSMartin Matuska #define ZSTD_ROWSIZE 16
1849*c03c5b1cSMartin Matuska /*! ZSTD_reduceTable() :
1850*c03c5b1cSMartin Matuska  *  reduce table indexes by `reducerValue`, or squash to zero.
1851*c03c5b1cSMartin Matuska  *  PreserveMark preserves "unsorted mark" for btlazy2 strategy.
1852*c03c5b1cSMartin Matuska  *  It must be set to a clear 0/1 value, to remove branch during inlining.
1853*c03c5b1cSMartin Matuska  *  Presume table size is a multiple of ZSTD_ROWSIZE
1854*c03c5b1cSMartin Matuska  *  to help auto-vectorization */
1855*c03c5b1cSMartin Matuska FORCE_INLINE_TEMPLATE void
ZSTD_reduceTable_internal(U32 * const table,U32 const size,U32 const reducerValue,int const preserveMark)1856*c03c5b1cSMartin Matuska ZSTD_reduceTable_internal (U32* const table, U32 const size, U32 const reducerValue, int const preserveMark)
1857*c03c5b1cSMartin Matuska {
1858*c03c5b1cSMartin Matuska     int const nbRows = (int)size / ZSTD_ROWSIZE;
1859*c03c5b1cSMartin Matuska     int cellNb = 0;
1860*c03c5b1cSMartin Matuska     int rowNb;
1861*c03c5b1cSMartin Matuska     assert((size & (ZSTD_ROWSIZE-1)) == 0);  /* multiple of ZSTD_ROWSIZE */
1862*c03c5b1cSMartin Matuska     assert(size < (1U<<31));   /* can be casted to int */
1863*c03c5b1cSMartin Matuska 
1864*c03c5b1cSMartin Matuska #if defined (MEMORY_SANITIZER) && !defined (ZSTD_MSAN_DONT_POISON_WORKSPACE)
1865*c03c5b1cSMartin Matuska     /* To validate that the table re-use logic is sound, and that we don't
1866*c03c5b1cSMartin Matuska      * access table space that we haven't cleaned, we re-"poison" the table
1867*c03c5b1cSMartin Matuska      * space every time we mark it dirty.
1868*c03c5b1cSMartin Matuska      *
1869*c03c5b1cSMartin Matuska      * This function however is intended to operate on those dirty tables and
1870*c03c5b1cSMartin Matuska      * re-clean them. So when this function is used correctly, we can unpoison
1871*c03c5b1cSMartin Matuska      * the memory it operated on. This introduces a blind spot though, since
1872*c03c5b1cSMartin Matuska      * if we now try to operate on __actually__ poisoned memory, we will not
1873*c03c5b1cSMartin Matuska      * detect that. */
1874*c03c5b1cSMartin Matuska     __msan_unpoison(table, size * sizeof(U32));
1875*c03c5b1cSMartin Matuska #endif
1876*c03c5b1cSMartin Matuska 
1877*c03c5b1cSMartin Matuska     for (rowNb=0 ; rowNb < nbRows ; rowNb++) {
1878*c03c5b1cSMartin Matuska         int column;
1879*c03c5b1cSMartin Matuska         for (column=0; column<ZSTD_ROWSIZE; column++) {
1880*c03c5b1cSMartin Matuska             if (preserveMark) {
1881*c03c5b1cSMartin Matuska                 U32 const adder = (table[cellNb] == ZSTD_DUBT_UNSORTED_MARK) ? reducerValue : 0;
1882*c03c5b1cSMartin Matuska                 table[cellNb] += adder;
1883*c03c5b1cSMartin Matuska             }
1884*c03c5b1cSMartin Matuska             if (table[cellNb] < reducerValue) table[cellNb] = 0;
1885*c03c5b1cSMartin Matuska             else table[cellNb] -= reducerValue;
1886*c03c5b1cSMartin Matuska             cellNb++;
1887*c03c5b1cSMartin Matuska     }   }
1888*c03c5b1cSMartin Matuska }
1889*c03c5b1cSMartin Matuska 
/* ZSTD_reduceTable() :
 * Plain variant of ZSTD_reduceTable_internal() : every cell of `table`
 * (`size` cells) is reduced by `reducerValue`, with no mark preservation. */
static void ZSTD_reduceTable(U32* const table, U32 const size, U32 const reducerValue)
{
    ZSTD_reduceTable_internal(table, size, reducerValue, 0 /* preserveMark */);
}
1894*c03c5b1cSMartin Matuska 
/* ZSTD_reduceTable_btlazy2() :
 * Variant of ZSTD_reduceTable_internal() with mark preservation enabled :
 * cells holding ZSTD_DUBT_UNSORTED_MARK keep their value,
 * all other cells are reduced by `reducerValue`. */
static void ZSTD_reduceTable_btlazy2(U32* const table, U32 const size, U32 const reducerValue)
{
    ZSTD_reduceTable_internal(table, size, reducerValue, 1 /* preserveMark */);
}
1899*c03c5b1cSMartin Matuska 
1900*c03c5b1cSMartin Matuska /*! ZSTD_reduceIndex() :
1901*c03c5b1cSMartin Matuska *   rescale all indexes to avoid future overflow (indexes are U32) */
ZSTD_reduceIndex(ZSTD_matchState_t * ms,ZSTD_CCtx_params const * params,const U32 reducerValue)1902*c03c5b1cSMartin Matuska static void ZSTD_reduceIndex (ZSTD_matchState_t* ms, ZSTD_CCtx_params const* params, const U32 reducerValue)
1903*c03c5b1cSMartin Matuska {
1904*c03c5b1cSMartin Matuska     {   U32 const hSize = (U32)1 << params->cParams.hashLog;
1905*c03c5b1cSMartin Matuska         ZSTD_reduceTable(ms->hashTable, hSize, reducerValue);
1906*c03c5b1cSMartin Matuska     }
1907*c03c5b1cSMartin Matuska 
1908*c03c5b1cSMartin Matuska     if (params->cParams.strategy != ZSTD_fast) {
1909*c03c5b1cSMartin Matuska         U32 const chainSize = (U32)1 << params->cParams.chainLog;
1910*c03c5b1cSMartin Matuska         if (params->cParams.strategy == ZSTD_btlazy2)
1911*c03c5b1cSMartin Matuska             ZSTD_reduceTable_btlazy2(ms->chainTable, chainSize, reducerValue);
1912*c03c5b1cSMartin Matuska         else
1913*c03c5b1cSMartin Matuska             ZSTD_reduceTable(ms->chainTable, chainSize, reducerValue);
1914*c03c5b1cSMartin Matuska     }
1915*c03c5b1cSMartin Matuska 
1916*c03c5b1cSMartin Matuska     if (ms->hashLog3) {
1917*c03c5b1cSMartin Matuska         U32 const h3Size = (U32)1 << ms->hashLog3;
1918*c03c5b1cSMartin Matuska         ZSTD_reduceTable(ms->hashTable3, h3Size, reducerValue);
1919*c03c5b1cSMartin Matuska     }
1920*c03c5b1cSMartin Matuska }
1921*c03c5b1cSMartin Matuska 
1922*c03c5b1cSMartin Matuska 
1923*c03c5b1cSMartin Matuska /*-*******************************************************
1924*c03c5b1cSMartin Matuska *  Block entropic compression
1925*c03c5b1cSMartin Matuska *********************************************************/
1926*c03c5b1cSMartin Matuska 
1927*c03c5b1cSMartin Matuska /* See doc/zstd_compression_format.md for detailed format description */
1928*c03c5b1cSMartin Matuska 
ZSTD_seqToCodes(const seqStore_t * seqStorePtr)1929*c03c5b1cSMartin Matuska void ZSTD_seqToCodes(const seqStore_t* seqStorePtr)
1930*c03c5b1cSMartin Matuska {
1931*c03c5b1cSMartin Matuska     const seqDef* const sequences = seqStorePtr->sequencesStart;
1932*c03c5b1cSMartin Matuska     BYTE* const llCodeTable = seqStorePtr->llCode;
1933*c03c5b1cSMartin Matuska     BYTE* const ofCodeTable = seqStorePtr->ofCode;
1934*c03c5b1cSMartin Matuska     BYTE* const mlCodeTable = seqStorePtr->mlCode;
1935*c03c5b1cSMartin Matuska     U32 const nbSeq = (U32)(seqStorePtr->sequences - seqStorePtr->sequencesStart);
1936*c03c5b1cSMartin Matuska     U32 u;
1937*c03c5b1cSMartin Matuska     assert(nbSeq <= seqStorePtr->maxNbSeq);
1938*c03c5b1cSMartin Matuska     for (u=0; u<nbSeq; u++) {
1939*c03c5b1cSMartin Matuska         U32 const llv = sequences[u].litLength;
1940*c03c5b1cSMartin Matuska         U32 const mlv = sequences[u].matchLength;
1941*c03c5b1cSMartin Matuska         llCodeTable[u] = (BYTE)ZSTD_LLcode(llv);
1942*c03c5b1cSMartin Matuska         ofCodeTable[u] = (BYTE)ZSTD_highbit32(sequences[u].offset);
1943*c03c5b1cSMartin Matuska         mlCodeTable[u] = (BYTE)ZSTD_MLcode(mlv);
1944*c03c5b1cSMartin Matuska     }
1945*c03c5b1cSMartin Matuska     if (seqStorePtr->longLengthID==1)
1946*c03c5b1cSMartin Matuska         llCodeTable[seqStorePtr->longLengthPos] = MaxLL;
1947*c03c5b1cSMartin Matuska     if (seqStorePtr->longLengthID==2)
1948*c03c5b1cSMartin Matuska         mlCodeTable[seqStorePtr->longLengthPos] = MaxML;
1949*c03c5b1cSMartin Matuska }
1950*c03c5b1cSMartin Matuska 
1951*c03c5b1cSMartin Matuska /* ZSTD_useTargetCBlockSize():
1952*c03c5b1cSMartin Matuska  * Returns if target compressed block size param is being used.
1953*c03c5b1cSMartin Matuska  * If used, compression will do best effort to make a compressed block size to be around targetCBlockSize.
1954*c03c5b1cSMartin Matuska  * Returns 1 if true, 0 otherwise. */
ZSTD_useTargetCBlockSize(const ZSTD_CCtx_params * cctxParams)1955*c03c5b1cSMartin Matuska static int ZSTD_useTargetCBlockSize(const ZSTD_CCtx_params* cctxParams)
1956*c03c5b1cSMartin Matuska {
1957*c03c5b1cSMartin Matuska     DEBUGLOG(5, "ZSTD_useTargetCBlockSize (targetCBlockSize=%zu)", cctxParams->targetCBlockSize);
1958*c03c5b1cSMartin Matuska     return (cctxParams->targetCBlockSize != 0);
1959*c03c5b1cSMartin Matuska }
1960*c03c5b1cSMartin Matuska 
1961*c03c5b1cSMartin Matuska /* ZSTD_compressSequences_internal():
1962*c03c5b1cSMartin Matuska  * actually compresses both literals and sequences */
1963*c03c5b1cSMartin Matuska MEM_STATIC size_t
ZSTD_compressSequences_internal(seqStore_t * seqStorePtr,const ZSTD_entropyCTables_t * prevEntropy,ZSTD_entropyCTables_t * nextEntropy,const ZSTD_CCtx_params * cctxParams,void * dst,size_t dstCapacity,void * entropyWorkspace,size_t entropyWkspSize,const int bmi2)1964*c03c5b1cSMartin Matuska ZSTD_compressSequences_internal(seqStore_t* seqStorePtr,
1965*c03c5b1cSMartin Matuska                           const ZSTD_entropyCTables_t* prevEntropy,
1966*c03c5b1cSMartin Matuska                                 ZSTD_entropyCTables_t* nextEntropy,
1967*c03c5b1cSMartin Matuska                           const ZSTD_CCtx_params* cctxParams,
1968*c03c5b1cSMartin Matuska                                 void* dst, size_t dstCapacity,
1969*c03c5b1cSMartin Matuska                                 void* entropyWorkspace, size_t entropyWkspSize,
1970*c03c5b1cSMartin Matuska                           const int bmi2)
1971*c03c5b1cSMartin Matuska {
1972*c03c5b1cSMartin Matuska     const int longOffsets = cctxParams->cParams.windowLog > STREAM_ACCUMULATOR_MIN;
1973*c03c5b1cSMartin Matuska     ZSTD_strategy const strategy = cctxParams->cParams.strategy;
1974*c03c5b1cSMartin Matuska     unsigned count[MaxSeq+1];
1975*c03c5b1cSMartin Matuska     FSE_CTable* CTable_LitLength = nextEntropy->fse.litlengthCTable;
1976*c03c5b1cSMartin Matuska     FSE_CTable* CTable_OffsetBits = nextEntropy->fse.offcodeCTable;
1977*c03c5b1cSMartin Matuska     FSE_CTable* CTable_MatchLength = nextEntropy->fse.matchlengthCTable;
1978*c03c5b1cSMartin Matuska     U32 LLtype, Offtype, MLtype;   /* compressed, raw or rle */
1979*c03c5b1cSMartin Matuska     const seqDef* const sequences = seqStorePtr->sequencesStart;
1980*c03c5b1cSMartin Matuska     const BYTE* const ofCodeTable = seqStorePtr->ofCode;
1981*c03c5b1cSMartin Matuska     const BYTE* const llCodeTable = seqStorePtr->llCode;
1982*c03c5b1cSMartin Matuska     const BYTE* const mlCodeTable = seqStorePtr->mlCode;
1983*c03c5b1cSMartin Matuska     BYTE* const ostart = (BYTE*)dst;
1984*c03c5b1cSMartin Matuska     BYTE* const oend = ostart + dstCapacity;
1985*c03c5b1cSMartin Matuska     BYTE* op = ostart;
1986*c03c5b1cSMartin Matuska     size_t const nbSeq = (size_t)(seqStorePtr->sequences - seqStorePtr->sequencesStart);
1987*c03c5b1cSMartin Matuska     BYTE* seqHead;
1988*c03c5b1cSMartin Matuska     BYTE* lastNCount = NULL;
1989*c03c5b1cSMartin Matuska 
1990*c03c5b1cSMartin Matuska     DEBUGLOG(5, "ZSTD_compressSequences_internal (nbSeq=%zu)", nbSeq);
1991*c03c5b1cSMartin Matuska     ZSTD_STATIC_ASSERT(HUF_WORKSPACE_SIZE >= (1<<MAX(MLFSELog,LLFSELog)));
1992*c03c5b1cSMartin Matuska 
1993*c03c5b1cSMartin Matuska     /* Compress literals */
1994*c03c5b1cSMartin Matuska     {   const BYTE* const literals = seqStorePtr->litStart;
1995*c03c5b1cSMartin Matuska         size_t const litSize = (size_t)(seqStorePtr->lit - literals);
1996*c03c5b1cSMartin Matuska         size_t const cSize = ZSTD_compressLiterals(
1997*c03c5b1cSMartin Matuska                                     &prevEntropy->huf, &nextEntropy->huf,
1998*c03c5b1cSMartin Matuska                                     cctxParams->cParams.strategy,
1999*c03c5b1cSMartin Matuska                                     ZSTD_disableLiteralsCompression(cctxParams),
2000*c03c5b1cSMartin Matuska                                     op, dstCapacity,
2001*c03c5b1cSMartin Matuska                                     literals, litSize,
2002*c03c5b1cSMartin Matuska                                     entropyWorkspace, entropyWkspSize,
2003*c03c5b1cSMartin Matuska                                     bmi2);
2004*c03c5b1cSMartin Matuska         FORWARD_IF_ERROR(cSize, "ZSTD_compressLiterals failed");
2005*c03c5b1cSMartin Matuska         assert(cSize <= dstCapacity);
2006*c03c5b1cSMartin Matuska         op += cSize;
2007*c03c5b1cSMartin Matuska     }
2008*c03c5b1cSMartin Matuska 
2009*c03c5b1cSMartin Matuska     /* Sequences Header */
2010*c03c5b1cSMartin Matuska     RETURN_ERROR_IF((oend-op) < 3 /*max nbSeq Size*/ + 1 /*seqHead*/,
2011*c03c5b1cSMartin Matuska                     dstSize_tooSmall, "Can't fit seq hdr in output buf!");
2012*c03c5b1cSMartin Matuska     if (nbSeq < 128) {
2013*c03c5b1cSMartin Matuska         *op++ = (BYTE)nbSeq;
2014*c03c5b1cSMartin Matuska     } else if (nbSeq < LONGNBSEQ) {
2015*c03c5b1cSMartin Matuska         op[0] = (BYTE)((nbSeq>>8) + 0x80);
2016*c03c5b1cSMartin Matuska         op[1] = (BYTE)nbSeq;
2017*c03c5b1cSMartin Matuska         op+=2;
2018*c03c5b1cSMartin Matuska     } else {
2019*c03c5b1cSMartin Matuska         op[0]=0xFF;
2020*c03c5b1cSMartin Matuska         MEM_writeLE16(op+1, (U16)(nbSeq - LONGNBSEQ));
2021*c03c5b1cSMartin Matuska         op+=3;
2022*c03c5b1cSMartin Matuska     }
2023*c03c5b1cSMartin Matuska     assert(op <= oend);
2024*c03c5b1cSMartin Matuska     if (nbSeq==0) {
2025*c03c5b1cSMartin Matuska         /* Copy the old tables over as if we repeated them */
2026*c03c5b1cSMartin Matuska         memcpy(&nextEntropy->fse, &prevEntropy->fse, sizeof(prevEntropy->fse));
2027*c03c5b1cSMartin Matuska         return (size_t)(op - ostart);
2028*c03c5b1cSMartin Matuska     }
2029*c03c5b1cSMartin Matuska 
2030*c03c5b1cSMartin Matuska     /* seqHead : flags for FSE encoding type */
2031*c03c5b1cSMartin Matuska     seqHead = op++;
2032*c03c5b1cSMartin Matuska     assert(op <= oend);
2033*c03c5b1cSMartin Matuska 
2034*c03c5b1cSMartin Matuska     /* convert length/distances into codes */
2035*c03c5b1cSMartin Matuska     ZSTD_seqToCodes(seqStorePtr);
2036*c03c5b1cSMartin Matuska     /* build CTable for Literal Lengths */
2037*c03c5b1cSMartin Matuska     {   unsigned max = MaxLL;
2038*c03c5b1cSMartin Matuska         size_t const mostFrequent = HIST_countFast_wksp(count, &max, llCodeTable, nbSeq, entropyWorkspace, entropyWkspSize);   /* can't fail */
2039*c03c5b1cSMartin Matuska         DEBUGLOG(5, "Building LL table");
2040*c03c5b1cSMartin Matuska         nextEntropy->fse.litlength_repeatMode = prevEntropy->fse.litlength_repeatMode;
2041*c03c5b1cSMartin Matuska         LLtype = ZSTD_selectEncodingType(&nextEntropy->fse.litlength_repeatMode,
2042*c03c5b1cSMartin Matuska                                         count, max, mostFrequent, nbSeq,
2043*c03c5b1cSMartin Matuska                                         LLFSELog, prevEntropy->fse.litlengthCTable,
2044*c03c5b1cSMartin Matuska                                         LL_defaultNorm, LL_defaultNormLog,
2045*c03c5b1cSMartin Matuska                                         ZSTD_defaultAllowed, strategy);
2046*c03c5b1cSMartin Matuska         assert(set_basic < set_compressed && set_rle < set_compressed);
2047*c03c5b1cSMartin Matuska         assert(!(LLtype < set_compressed && nextEntropy->fse.litlength_repeatMode != FSE_repeat_none)); /* We don't copy tables */
2048*c03c5b1cSMartin Matuska         {   size_t const countSize = ZSTD_buildCTable(
2049*c03c5b1cSMartin Matuska                 op, (size_t)(oend - op),
2050*c03c5b1cSMartin Matuska                 CTable_LitLength, LLFSELog, (symbolEncodingType_e)LLtype,
2051*c03c5b1cSMartin Matuska                 count, max, llCodeTable, nbSeq,
2052*c03c5b1cSMartin Matuska                 LL_defaultNorm, LL_defaultNormLog, MaxLL,
2053*c03c5b1cSMartin Matuska                 prevEntropy->fse.litlengthCTable,
2054*c03c5b1cSMartin Matuska                 sizeof(prevEntropy->fse.litlengthCTable),
2055*c03c5b1cSMartin Matuska                 entropyWorkspace, entropyWkspSize);
2056*c03c5b1cSMartin Matuska             FORWARD_IF_ERROR(countSize, "ZSTD_buildCTable for LitLens failed");
2057*c03c5b1cSMartin Matuska             if (LLtype == set_compressed)
2058*c03c5b1cSMartin Matuska                 lastNCount = op;
2059*c03c5b1cSMartin Matuska             op += countSize;
2060*c03c5b1cSMartin Matuska             assert(op <= oend);
2061*c03c5b1cSMartin Matuska     }   }
2062*c03c5b1cSMartin Matuska     /* build CTable for Offsets */
2063*c03c5b1cSMartin Matuska     {   unsigned max = MaxOff;
2064*c03c5b1cSMartin Matuska         size_t const mostFrequent = HIST_countFast_wksp(
2065*c03c5b1cSMartin Matuska             count, &max, ofCodeTable, nbSeq, entropyWorkspace, entropyWkspSize);  /* can't fail */
2066*c03c5b1cSMartin Matuska         /* We can only use the basic table if max <= DefaultMaxOff, otherwise the offsets are too large */
2067*c03c5b1cSMartin Matuska         ZSTD_defaultPolicy_e const defaultPolicy = (max <= DefaultMaxOff) ? ZSTD_defaultAllowed : ZSTD_defaultDisallowed;
2068*c03c5b1cSMartin Matuska         DEBUGLOG(5, "Building OF table");
2069*c03c5b1cSMartin Matuska         nextEntropy->fse.offcode_repeatMode = prevEntropy->fse.offcode_repeatMode;
2070*c03c5b1cSMartin Matuska         Offtype = ZSTD_selectEncodingType(&nextEntropy->fse.offcode_repeatMode,
2071*c03c5b1cSMartin Matuska                                         count, max, mostFrequent, nbSeq,
2072*c03c5b1cSMartin Matuska                                         OffFSELog, prevEntropy->fse.offcodeCTable,
2073*c03c5b1cSMartin Matuska                                         OF_defaultNorm, OF_defaultNormLog,
2074*c03c5b1cSMartin Matuska                                         defaultPolicy, strategy);
2075*c03c5b1cSMartin Matuska         assert(!(Offtype < set_compressed && nextEntropy->fse.offcode_repeatMode != FSE_repeat_none)); /* We don't copy tables */
2076*c03c5b1cSMartin Matuska         {   size_t const countSize = ZSTD_buildCTable(
2077*c03c5b1cSMartin Matuska                 op, (size_t)(oend - op),
2078*c03c5b1cSMartin Matuska                 CTable_OffsetBits, OffFSELog, (symbolEncodingType_e)Offtype,
2079*c03c5b1cSMartin Matuska                 count, max, ofCodeTable, nbSeq,
2080*c03c5b1cSMartin Matuska                 OF_defaultNorm, OF_defaultNormLog, DefaultMaxOff,
2081*c03c5b1cSMartin Matuska                 prevEntropy->fse.offcodeCTable,
2082*c03c5b1cSMartin Matuska                 sizeof(prevEntropy->fse.offcodeCTable),
2083*c03c5b1cSMartin Matuska                 entropyWorkspace, entropyWkspSize);
2084*c03c5b1cSMartin Matuska             FORWARD_IF_ERROR(countSize, "ZSTD_buildCTable for Offsets failed");
2085*c03c5b1cSMartin Matuska             if (Offtype == set_compressed)
2086*c03c5b1cSMartin Matuska                 lastNCount = op;
2087*c03c5b1cSMartin Matuska             op += countSize;
2088*c03c5b1cSMartin Matuska             assert(op <= oend);
2089*c03c5b1cSMartin Matuska     }   }
2090*c03c5b1cSMartin Matuska     /* build CTable for MatchLengths */
2091*c03c5b1cSMartin Matuska     {   unsigned max = MaxML;
2092*c03c5b1cSMartin Matuska         size_t const mostFrequent = HIST_countFast_wksp(
2093*c03c5b1cSMartin Matuska             count, &max, mlCodeTable, nbSeq, entropyWorkspace, entropyWkspSize);   /* can't fail */
2094*c03c5b1cSMartin Matuska         DEBUGLOG(5, "Building ML table (remaining space : %i)", (int)(oend-op));
2095*c03c5b1cSMartin Matuska         nextEntropy->fse.matchlength_repeatMode = prevEntropy->fse.matchlength_repeatMode;
2096*c03c5b1cSMartin Matuska         MLtype = ZSTD_selectEncodingType(&nextEntropy->fse.matchlength_repeatMode,
2097*c03c5b1cSMartin Matuska                                         count, max, mostFrequent, nbSeq,
2098*c03c5b1cSMartin Matuska                                         MLFSELog, prevEntropy->fse.matchlengthCTable,
2099*c03c5b1cSMartin Matuska                                         ML_defaultNorm, ML_defaultNormLog,
2100*c03c5b1cSMartin Matuska                                         ZSTD_defaultAllowed, strategy);
2101*c03c5b1cSMartin Matuska         assert(!(MLtype < set_compressed && nextEntropy->fse.matchlength_repeatMode != FSE_repeat_none)); /* We don't copy tables */
2102*c03c5b1cSMartin Matuska         {   size_t const countSize = ZSTD_buildCTable(
2103*c03c5b1cSMartin Matuska                 op, (size_t)(oend - op),
2104*c03c5b1cSMartin Matuska                 CTable_MatchLength, MLFSELog, (symbolEncodingType_e)MLtype,
2105*c03c5b1cSMartin Matuska                 count, max, mlCodeTable, nbSeq,
2106*c03c5b1cSMartin Matuska                 ML_defaultNorm, ML_defaultNormLog, MaxML,
2107*c03c5b1cSMartin Matuska                 prevEntropy->fse.matchlengthCTable,
2108*c03c5b1cSMartin Matuska                 sizeof(prevEntropy->fse.matchlengthCTable),
2109*c03c5b1cSMartin Matuska                 entropyWorkspace, entropyWkspSize);
2110*c03c5b1cSMartin Matuska             FORWARD_IF_ERROR(countSize, "ZSTD_buildCTable for MatchLengths failed");
2111*c03c5b1cSMartin Matuska             if (MLtype == set_compressed)
2112*c03c5b1cSMartin Matuska                 lastNCount = op;
2113*c03c5b1cSMartin Matuska             op += countSize;
2114*c03c5b1cSMartin Matuska             assert(op <= oend);
2115*c03c5b1cSMartin Matuska     }   }
2116*c03c5b1cSMartin Matuska 
2117*c03c5b1cSMartin Matuska     *seqHead = (BYTE)((LLtype<<6) + (Offtype<<4) + (MLtype<<2));
2118*c03c5b1cSMartin Matuska 
2119*c03c5b1cSMartin Matuska     {   size_t const bitstreamSize = ZSTD_encodeSequences(
2120*c03c5b1cSMartin Matuska                                         op, (size_t)(oend - op),
2121*c03c5b1cSMartin Matuska                                         CTable_MatchLength, mlCodeTable,
2122*c03c5b1cSMartin Matuska                                         CTable_OffsetBits, ofCodeTable,
2123*c03c5b1cSMartin Matuska                                         CTable_LitLength, llCodeTable,
2124*c03c5b1cSMartin Matuska                                         sequences, nbSeq,
2125*c03c5b1cSMartin Matuska                                         longOffsets, bmi2);
2126*c03c5b1cSMartin Matuska         FORWARD_IF_ERROR(bitstreamSize, "ZSTD_encodeSequences failed");
2127*c03c5b1cSMartin Matuska         op += bitstreamSize;
2128*c03c5b1cSMartin Matuska         assert(op <= oend);
2129*c03c5b1cSMartin Matuska         /* zstd versions <= 1.3.4 mistakenly report corruption when
2130*c03c5b1cSMartin Matuska          * FSE_readNCount() receives a buffer < 4 bytes.
2131*c03c5b1cSMartin Matuska          * Fixed by https://github.com/facebook/zstd/pull/1146.
2132*c03c5b1cSMartin Matuska          * This can happen when the last set_compressed table present is 2
2133*c03c5b1cSMartin Matuska          * bytes and the bitstream is only one byte.
2134*c03c5b1cSMartin Matuska          * In this exceedingly rare case, we will simply emit an uncompressed
2135*c03c5b1cSMartin Matuska          * block, since it isn't worth optimizing.
2136*c03c5b1cSMartin Matuska          */
2137*c03c5b1cSMartin Matuska         if (lastNCount && (op - lastNCount) < 4) {
2138*c03c5b1cSMartin Matuska             /* NCountSize >= 2 && bitstreamSize > 0 ==> lastCountSize == 3 */
2139*c03c5b1cSMartin Matuska             assert(op - lastNCount == 3);
2140*c03c5b1cSMartin Matuska             DEBUGLOG(5, "Avoiding bug in zstd decoder in versions <= 1.3.4 by "
2141*c03c5b1cSMartin Matuska                         "emitting an uncompressed block.");
2142*c03c5b1cSMartin Matuska             return 0;
2143*c03c5b1cSMartin Matuska         }
2144*c03c5b1cSMartin Matuska     }
2145*c03c5b1cSMartin Matuska 
2146*c03c5b1cSMartin Matuska     DEBUGLOG(5, "compressed block size : %u", (unsigned)(op - ostart));
2147*c03c5b1cSMartin Matuska     return (size_t)(op - ostart);
2148*c03c5b1cSMartin Matuska }
2149*c03c5b1cSMartin Matuska 
2150*c03c5b1cSMartin Matuska MEM_STATIC size_t
ZSTD_compressSequences(seqStore_t * seqStorePtr,const ZSTD_entropyCTables_t * prevEntropy,ZSTD_entropyCTables_t * nextEntropy,const ZSTD_CCtx_params * cctxParams,void * dst,size_t dstCapacity,size_t srcSize,void * entropyWorkspace,size_t entropyWkspSize,int bmi2)2151*c03c5b1cSMartin Matuska ZSTD_compressSequences(seqStore_t* seqStorePtr,
2152*c03c5b1cSMartin Matuska                        const ZSTD_entropyCTables_t* prevEntropy,
2153*c03c5b1cSMartin Matuska                              ZSTD_entropyCTables_t* nextEntropy,
2154*c03c5b1cSMartin Matuska                        const ZSTD_CCtx_params* cctxParams,
2155*c03c5b1cSMartin Matuska                              void* dst, size_t dstCapacity,
2156*c03c5b1cSMartin Matuska                              size_t srcSize,
2157*c03c5b1cSMartin Matuska                              void* entropyWorkspace, size_t entropyWkspSize,
2158*c03c5b1cSMartin Matuska                              int bmi2)
2159*c03c5b1cSMartin Matuska {
2160*c03c5b1cSMartin Matuska     size_t const cSize = ZSTD_compressSequences_internal(
2161*c03c5b1cSMartin Matuska                             seqStorePtr, prevEntropy, nextEntropy, cctxParams,
2162*c03c5b1cSMartin Matuska                             dst, dstCapacity,
2163*c03c5b1cSMartin Matuska                             entropyWorkspace, entropyWkspSize, bmi2);
2164*c03c5b1cSMartin Matuska     if (cSize == 0) return 0;
2165*c03c5b1cSMartin Matuska     /* When srcSize <= dstCapacity, there is enough space to write a raw uncompressed block.
2166*c03c5b1cSMartin Matuska      * Since we ran out of space, block must be not compressible, so fall back to raw uncompressed block.
2167*c03c5b1cSMartin Matuska      */
2168*c03c5b1cSMartin Matuska     if ((cSize == ERROR(dstSize_tooSmall)) & (srcSize <= dstCapacity))
2169*c03c5b1cSMartin Matuska         return 0;  /* block not compressed */
2170*c03c5b1cSMartin Matuska     FORWARD_IF_ERROR(cSize, "ZSTD_compressSequences_internal failed");
2171*c03c5b1cSMartin Matuska 
2172*c03c5b1cSMartin Matuska     /* Check compressibility */
2173*c03c5b1cSMartin Matuska     {   size_t const maxCSize = srcSize - ZSTD_minGain(srcSize, cctxParams->cParams.strategy);
2174*c03c5b1cSMartin Matuska         if (cSize >= maxCSize) return 0;  /* block not compressed */
2175*c03c5b1cSMartin Matuska     }
2176*c03c5b1cSMartin Matuska 
2177*c03c5b1cSMartin Matuska     return cSize;
2178*c03c5b1cSMartin Matuska }
2179*c03c5b1cSMartin Matuska 
2180*c03c5b1cSMartin Matuska /* ZSTD_selectBlockCompressor() :
2181*c03c5b1cSMartin Matuska  * Not static, but internal use only (used by long distance matcher)
2182*c03c5b1cSMartin Matuska  * assumption : strat is a valid strategy */
ZSTD_selectBlockCompressor(ZSTD_strategy strat,ZSTD_dictMode_e dictMode)2183*c03c5b1cSMartin Matuska ZSTD_blockCompressor ZSTD_selectBlockCompressor(ZSTD_strategy strat, ZSTD_dictMode_e dictMode)
2184*c03c5b1cSMartin Matuska {
2185*c03c5b1cSMartin Matuska     static const ZSTD_blockCompressor blockCompressor[3][ZSTD_STRATEGY_MAX+1] = {
2186*c03c5b1cSMartin Matuska         { ZSTD_compressBlock_fast  /* default for 0 */,
2187*c03c5b1cSMartin Matuska           ZSTD_compressBlock_fast,
2188*c03c5b1cSMartin Matuska           ZSTD_compressBlock_doubleFast,
2189*c03c5b1cSMartin Matuska           ZSTD_compressBlock_greedy,
2190*c03c5b1cSMartin Matuska           ZSTD_compressBlock_lazy,
2191*c03c5b1cSMartin Matuska           ZSTD_compressBlock_lazy2,
2192*c03c5b1cSMartin Matuska           ZSTD_compressBlock_btlazy2,
2193*c03c5b1cSMartin Matuska           ZSTD_compressBlock_btopt,
2194*c03c5b1cSMartin Matuska           ZSTD_compressBlock_btultra,
2195*c03c5b1cSMartin Matuska           ZSTD_compressBlock_btultra2 },
2196*c03c5b1cSMartin Matuska         { ZSTD_compressBlock_fast_extDict  /* default for 0 */,
2197*c03c5b1cSMartin Matuska           ZSTD_compressBlock_fast_extDict,
2198*c03c5b1cSMartin Matuska           ZSTD_compressBlock_doubleFast_extDict,
2199*c03c5b1cSMartin Matuska           ZSTD_compressBlock_greedy_extDict,
2200*c03c5b1cSMartin Matuska           ZSTD_compressBlock_lazy_extDict,
2201*c03c5b1cSMartin Matuska           ZSTD_compressBlock_lazy2_extDict,
2202*c03c5b1cSMartin Matuska           ZSTD_compressBlock_btlazy2_extDict,
2203*c03c5b1cSMartin Matuska           ZSTD_compressBlock_btopt_extDict,
2204*c03c5b1cSMartin Matuska           ZSTD_compressBlock_btultra_extDict,
2205*c03c5b1cSMartin Matuska           ZSTD_compressBlock_btultra_extDict },
2206*c03c5b1cSMartin Matuska         { ZSTD_compressBlock_fast_dictMatchState  /* default for 0 */,
2207*c03c5b1cSMartin Matuska           ZSTD_compressBlock_fast_dictMatchState,
2208*c03c5b1cSMartin Matuska           ZSTD_compressBlock_doubleFast_dictMatchState,
2209*c03c5b1cSMartin Matuska           ZSTD_compressBlock_greedy_dictMatchState,
2210*c03c5b1cSMartin Matuska           ZSTD_compressBlock_lazy_dictMatchState,
2211*c03c5b1cSMartin Matuska           ZSTD_compressBlock_lazy2_dictMatchState,
2212*c03c5b1cSMartin Matuska           ZSTD_compressBlock_btlazy2_dictMatchState,
2213*c03c5b1cSMartin Matuska           ZSTD_compressBlock_btopt_dictMatchState,
2214*c03c5b1cSMartin Matuska           ZSTD_compressBlock_btultra_dictMatchState,
2215*c03c5b1cSMartin Matuska           ZSTD_compressBlock_btultra_dictMatchState }
2216*c03c5b1cSMartin Matuska     };
2217*c03c5b1cSMartin Matuska     ZSTD_blockCompressor selectedCompressor;
2218*c03c5b1cSMartin Matuska     ZSTD_STATIC_ASSERT((unsigned)ZSTD_fast == 1);
2219*c03c5b1cSMartin Matuska 
2220*c03c5b1cSMartin Matuska     assert(ZSTD_cParam_withinBounds(ZSTD_c_strategy, strat));
2221*c03c5b1cSMartin Matuska     selectedCompressor = blockCompressor[(int)dictMode][(int)strat];
2222*c03c5b1cSMartin Matuska     assert(selectedCompressor != NULL);
2223*c03c5b1cSMartin Matuska     return selectedCompressor;
2224*c03c5b1cSMartin Matuska }
2225*c03c5b1cSMartin Matuska 
/* ZSTD_storeLastLiterals() :
 * Append `lastLLSize` bytes, read from `anchor`, at the current write
 * position of the literals buffer (seqStorePtr->lit),
 * then move that position past the copied bytes.
 * No capacity check is performed here. */
static void ZSTD_storeLastLiterals(seqStore_t* seqStorePtr,
                                   const BYTE* anchor, size_t lastLLSize)
{
    BYTE* const litWritePos = seqStorePtr->lit;
    memcpy(litWritePos, anchor, lastLLSize);
    seqStorePtr->lit = litWritePos + lastLLSize;
}
2232*c03c5b1cSMartin Matuska 
/* ZSTD_resetSeqStore() :
 * Empty the sequence store : the sequence and literal write positions
 * go back to the start of their respective buffers,
 * and the long-length marker is cleared.
 * Buffer contents themselves are left untouched. */
void ZSTD_resetSeqStore(seqStore_t* ssPtr)
{
    ssPtr->sequences = ssPtr->sequencesStart;
    ssPtr->lit = ssPtr->litStart;
    ssPtr->longLengthID = 0;   /* no long length recorded */
}
2239*c03c5b1cSMartin Matuska 
/* Outcome reported by ZSTD_buildSeqStore(). */
typedef enum {
    ZSTDbss_compress,     /* presumably : sequences were produced, compression can proceed - confirm against ZSTD_buildSeqStore() */
    ZSTDbss_noCompress    /* compression not attempted (returned when the input is below the minimum size) */
} ZSTD_buildSeqStore_e;
2241*c03c5b1cSMartin Matuska 
ZSTD_buildSeqStore(ZSTD_CCtx * zc,const void * src,size_t srcSize)2242*c03c5b1cSMartin Matuska static size_t ZSTD_buildSeqStore(ZSTD_CCtx* zc, const void* src, size_t srcSize)
2243*c03c5b1cSMartin Matuska {
2244*c03c5b1cSMartin Matuska     ZSTD_matchState_t* const ms = &zc->blockState.matchState;
2245*c03c5b1cSMartin Matuska     DEBUGLOG(5, "ZSTD_buildSeqStore (srcSize=%zu)", srcSize);
2246*c03c5b1cSMartin Matuska     assert(srcSize <= ZSTD_BLOCKSIZE_MAX);
2247*c03c5b1cSMartin Matuska     /* Assert that we have correctly flushed the ctx params into the ms's copy */
2248*c03c5b1cSMartin Matuska     ZSTD_assertEqualCParams(zc->appliedParams.cParams, ms->cParams);
2249*c03c5b1cSMartin Matuska     if (srcSize < MIN_CBLOCK_SIZE+ZSTD_blockHeaderSize+1) {
2250*c03c5b1cSMartin Matuska         ZSTD_ldm_skipSequences(&zc->externSeqStore, srcSize, zc->appliedParams.cParams.minMatch);
2251*c03c5b1cSMartin Matuska         return ZSTDbss_noCompress; /* don't even attempt compression below a certain srcSize */
2252*c03c5b1cSMartin Matuska     }
2253*c03c5b1cSMartin Matuska     ZSTD_resetSeqStore(&(zc->seqStore));
2254*c03c5b1cSMartin Matuska     /* required for optimal parser to read stats from dictionary */
2255*c03c5b1cSMartin Matuska     ms->opt.symbolCosts = &zc->blockState.prevCBlock->entropy;
2256*c03c5b1cSMartin Matuska     /* tell the optimal parser how we expect to compress literals */
2257*c03c5b1cSMartin Matuska     ms->opt.literalCompressionMode = zc->appliedParams.literalCompressionMode;
2258*c03c5b1cSMartin Matuska     /* a gap between an attached dict and the current window is not safe,
2259*c03c5b1cSMartin Matuska      * they must remain adjacent,
2260*c03c5b1cSMartin Matuska      * and when that stops being the case, the dict must be unset */
2261*c03c5b1cSMartin Matuska     assert(ms->dictMatchState == NULL || ms->loadedDictEnd == ms->window.dictLimit);
2262*c03c5b1cSMartin Matuska 
2263*c03c5b1cSMartin Matuska     /* limited update after a very long match */
2264*c03c5b1cSMartin Matuska     {   const BYTE* const base = ms->window.base;
2265*c03c5b1cSMartin Matuska         const BYTE* const istart = (const BYTE*)src;
2266*c03c5b1cSMartin Matuska         const U32 current = (U32)(istart-base);
2267*c03c5b1cSMartin Matuska         if (sizeof(ptrdiff_t)==8) assert(istart - base < (ptrdiff_t)(U32)(-1));   /* ensure no overflow */
2268*c03c5b1cSMartin Matuska         if (current > ms->nextToUpdate + 384)
2269*c03c5b1cSMartin Matuska             ms->nextToUpdate = current - MIN(192, (U32)(current - ms->nextToUpdate - 384));
2270*c03c5b1cSMartin Matuska     }
2271*c03c5b1cSMartin Matuska 
2272*c03c5b1cSMartin Matuska     /* select and store sequences */
2273*c03c5b1cSMartin Matuska     {   ZSTD_dictMode_e const dictMode = ZSTD_matchState_dictMode(ms);
2274*c03c5b1cSMartin Matuska         size_t lastLLSize;
2275*c03c5b1cSMartin Matuska         {   int i;
2276*c03c5b1cSMartin Matuska             for (i = 0; i < ZSTD_REP_NUM; ++i)
2277*c03c5b1cSMartin Matuska                 zc->blockState.nextCBlock->rep[i] = zc->blockState.prevCBlock->rep[i];
2278*c03c5b1cSMartin Matuska         }
2279*c03c5b1cSMartin Matuska         if (zc->externSeqStore.pos < zc->externSeqStore.size) {
2280*c03c5b1cSMartin Matuska             assert(!zc->appliedParams.ldmParams.enableLdm);
2281*c03c5b1cSMartin Matuska             /* Updates ldmSeqStore.pos */
2282*c03c5b1cSMartin Matuska             lastLLSize =
2283*c03c5b1cSMartin Matuska                 ZSTD_ldm_blockCompress(&zc->externSeqStore,
2284*c03c5b1cSMartin Matuska                                        ms, &zc->seqStore,
2285*c03c5b1cSMartin Matuska                                        zc->blockState.nextCBlock->rep,
2286*c03c5b1cSMartin Matuska                                        src, srcSize);
2287*c03c5b1cSMartin Matuska             assert(zc->externSeqStore.pos <= zc->externSeqStore.size);
2288*c03c5b1cSMartin Matuska         } else if (zc->appliedParams.ldmParams.enableLdm) {
2289*c03c5b1cSMartin Matuska             rawSeqStore_t ldmSeqStore = {NULL, 0, 0, 0};
2290*c03c5b1cSMartin Matuska 
2291*c03c5b1cSMartin Matuska             ldmSeqStore.seq = zc->ldmSequences;
2292*c03c5b1cSMartin Matuska             ldmSeqStore.capacity = zc->maxNbLdmSequences;
2293*c03c5b1cSMartin Matuska             /* Updates ldmSeqStore.size */
2294*c03c5b1cSMartin Matuska             FORWARD_IF_ERROR(ZSTD_ldm_generateSequences(&zc->ldmState, &ldmSeqStore,
2295*c03c5b1cSMartin Matuska                                                &zc->appliedParams.ldmParams,
2296*c03c5b1cSMartin Matuska                                                src, srcSize), "");
2297*c03c5b1cSMartin Matuska             /* Updates ldmSeqStore.pos */
2298*c03c5b1cSMartin Matuska             lastLLSize =
2299*c03c5b1cSMartin Matuska                 ZSTD_ldm_blockCompress(&ldmSeqStore,
2300*c03c5b1cSMartin Matuska                                        ms, &zc->seqStore,
2301*c03c5b1cSMartin Matuska                                        zc->blockState.nextCBlock->rep,
2302*c03c5b1cSMartin Matuska                                        src, srcSize);
2303*c03c5b1cSMartin Matuska             assert(ldmSeqStore.pos == ldmSeqStore.size);
2304*c03c5b1cSMartin Matuska         } else {   /* not long range mode */
2305*c03c5b1cSMartin Matuska             ZSTD_blockCompressor const blockCompressor = ZSTD_selectBlockCompressor(zc->appliedParams.cParams.strategy, dictMode);
2306*c03c5b1cSMartin Matuska             lastLLSize = blockCompressor(ms, &zc->seqStore, zc->blockState.nextCBlock->rep, src, srcSize);
2307*c03c5b1cSMartin Matuska         }
2308*c03c5b1cSMartin Matuska         {   const BYTE* const lastLiterals = (const BYTE*)src + srcSize - lastLLSize;
2309*c03c5b1cSMartin Matuska             ZSTD_storeLastLiterals(&zc->seqStore, lastLiterals, lastLLSize);
2310*c03c5b1cSMartin Matuska     }   }
2311*c03c5b1cSMartin Matuska     return ZSTDbss_compress;
2312*c03c5b1cSMartin Matuska }
2313*c03c5b1cSMartin Matuska 
/* ZSTD_copyBlockSequences() :
 * Converts the sequences currently held in the context's sequence store into
 * ZSTD_Sequence entries, appended to the sequence collector's output array
 * starting at seqCollector.seqIndex, then advances seqIndex accordingly.
 *
 * The number of entries written is clamped to the room left in the output
 * array (maxSequences - seqIndex), so an undersized caller buffer gets a
 * truncated result instead of an out-of-bounds write when assert() is
 * compiled out.
 *
 * Notes on the conversion, as performed below :
 * - matchPos is counted from the start of the current block (position restarts at 0).
 * - Stored offsets <= ZSTD_REP_NUM are treated as repcodes and resolved
 *   against earlier entries of this block, falling back to repStartValue[]
 *   when the reference reaches before the first entry of the block. */
static void ZSTD_copyBlockSequences(ZSTD_CCtx* zc)
{
    const seqStore_t* seqStore = ZSTD_getSeqStore(zc);
    const seqDef* seqs = seqStore->sequencesStart;
    size_t seqsSize = (size_t)(seqStore->sequences - seqs);
    size_t const seqIndex = zc->seqCollector.seqIndex;
    size_t const maxSequences = zc->seqCollector.maxSequences;
    /* free entries remaining in the caller-provided array */
    size_t const room = (seqIndex < maxSequences) ? (maxSequences - seqIndex) : 0;

    ZSTD_Sequence* outSeqs = &zc->seqCollector.seqStart[seqIndex];
    size_t i; size_t position; int repIdx;

    assert(zc->seqCollector.seqIndex + 1 < zc->seqCollector.maxSequences);
    /* never write past the end of the output array */
    if (seqsSize > room) seqsSize = room;

    for (i = 0, position = 0; i < seqsSize; ++i) {
        outSeqs[i].offset = seqs[i].offset;
        outSeqs[i].litLength = seqs[i].litLength;
        outSeqs[i].matchLength = seqs[i].matchLength + MINMATCH;

        /* one sequence per block may carry a length extended by 0x10000 */
        if (i == seqStore->longLengthPos) {
            if (seqStore->longLengthID == 1) {
                outSeqs[i].litLength += 0x10000;
            } else if (seqStore->longLengthID == 2) {
                outSeqs[i].matchLength += 0x10000;
            }
        }

        if (outSeqs[i].offset <= ZSTD_REP_NUM) {
            /* repcode : locate the earlier entry whose offset is reused */
            outSeqs[i].rep = outSeqs[i].offset;
            repIdx = (unsigned int)i - outSeqs[i].offset;

            if (outSeqs[i].litLength == 0) {
                /* with no literals, the repcode index is shifted by one */
                if (outSeqs[i].offset < 3) {
                    --repIdx;
                } else {
                    repIdx = (unsigned int)i - 1;
                }
                ++outSeqs[i].rep;
            }
            assert(repIdx >= -3);
            /* negative index : reference precedes this block's first entry */
            outSeqs[i].offset = repIdx >= 0 ? outSeqs[repIdx].offset : repStartValue[-repIdx - 1];
            if (outSeqs[i].rep == 4) {
                --outSeqs[i].offset;
            }
        } else {
            /* regular offset : remove the bias reserved for repcodes */
            outSeqs[i].offset -= ZSTD_REP_NUM;
        }

        position += outSeqs[i].litLength;
        outSeqs[i].matchPos = (unsigned int)position;
        position += outSeqs[i].matchLength;
    }
    zc->seqCollector.seqIndex += seqsSize;
}
2364*c03c5b1cSMartin Matuska 
/* ZSTD_getSequences() :
 * Compresses `src` with `zc` in sequence-collection mode, so that the
 * sequences found for each block are written into `outSeqs`
 * (capacity `outSeqsSize` entries) instead of being kept only internally.
 * The compressed output goes to a temporary buffer which is freed before
 * returning.
 * @return : the number of sequences collected,
 *           or an error code (memory_allocation if the temporary buffer
 *           cannot be allocated, or any error reported by ZSTD_compress2()),
 *           which can be tested with ZSTD_isError(). */
size_t ZSTD_getSequences(ZSTD_CCtx* zc, ZSTD_Sequence* outSeqs,
    size_t outSeqsSize, const void* src, size_t srcSize)
{
    const size_t dstCapacity = ZSTD_compressBound(srcSize);
    void* dst = ZSTD_malloc(dstCapacity, ZSTD_defaultCMem);
    SeqCollector seqCollector;

    RETURN_ERROR_IF(dst == NULL, memory_allocation, "NULL pointer!");

    seqCollector.collectSequences = 1;
    seqCollector.seqStart = outSeqs;
    seqCollector.seqIndex = 0;
    seqCollector.maxSequences = outSeqsSize;
    zc->seqCollector = seqCollector;

    /* release the scratch buffer first, so a compression failure cannot leak it */
    {   size_t const ret = ZSTD_compress2(zc, dst, dstCapacity, src, srcSize);
        ZSTD_free(dst, ZSTD_defaultCMem);
        FORWARD_IF_ERROR(ret, "ZSTD_compress2 failed");
    }
    return zc->seqCollector.seqIndex;
}
2384*c03c5b1cSMartin Matuska 
2385*c03c5b1cSMartin Matuska /* Returns true if the given block is a RLE block */
ZSTD_isRLE(const BYTE * ip,size_t length)2386*c03c5b1cSMartin Matuska static int ZSTD_isRLE(const BYTE *ip, size_t length) {
2387*c03c5b1cSMartin Matuska     size_t i;
2388*c03c5b1cSMartin Matuska     if (length < 2) return 1;
2389*c03c5b1cSMartin Matuska     for (i = 1; i < length; ++i) {
2390*c03c5b1cSMartin Matuska         if (ip[0] != ip[i]) return 0;
2391*c03c5b1cSMartin Matuska     }
2392*c03c5b1cSMartin Matuska     return 1;
2393*c03c5b1cSMartin Matuska }
2394*c03c5b1cSMartin Matuska 
2395*c03c5b1cSMartin Matuska /* Returns true if the given block may be RLE.
2396*c03c5b1cSMartin Matuska  * This is just a heuristic based on the compressibility.
2397*c03c5b1cSMartin Matuska  * It may return both false positives and false negatives.
2398*c03c5b1cSMartin Matuska  */
ZSTD_maybeRLE(seqStore_t const * seqStore)2399*c03c5b1cSMartin Matuska static int ZSTD_maybeRLE(seqStore_t const* seqStore)
2400*c03c5b1cSMartin Matuska {
2401*c03c5b1cSMartin Matuska     size_t const nbSeqs = (size_t)(seqStore->sequences - seqStore->sequencesStart);
2402*c03c5b1cSMartin Matuska     size_t const nbLits = (size_t)(seqStore->lit - seqStore->litStart);
2403*c03c5b1cSMartin Matuska 
2404*c03c5b1cSMartin Matuska     return nbSeqs < 4 && nbLits < 10;
2405*c03c5b1cSMartin Matuska }
2406*c03c5b1cSMartin Matuska 
/* ZSTD_confirmRepcodesAndEntropyTables() :
 * Swaps the `prevCBlock` and `nextCBlock` pointers of the block state,
 * so that the state prepared for the block just produced becomes the
 * "previous" state used by the following block. */
static void ZSTD_confirmRepcodesAndEntropyTables(ZSTD_CCtx* zc)
{
    ZSTD_compressedBlockState_t* const confirmed = zc->blockState.nextCBlock;
    zc->blockState.nextCBlock = zc->blockState.prevCBlock;
    zc->blockState.prevCBlock = confirmed;
}
2413*c03c5b1cSMartin Matuska 
/* ZSTD_compressBlock_internal() :
 * Compresses one block from `src` into `dst`, without writing a block header.
 * @return : 0 when the block should be emitted uncompressed by the caller
 *             (also returned right after collecting sequences when the
 *              sequence collector is active),
 *           1 when the block is RLE (the repeated byte is stored in dst[0];
 *             only attempted when `frame` is set and this is not the first block),
 *           otherwise the compressed size, or an error code. */
static size_t ZSTD_compressBlock_internal(ZSTD_CCtx* zc,
                                        void* dst, size_t dstCapacity,
                                        const void* src, size_t srcSize, U32 frame)
{
    /* Compressed size below which a block is tested for being RLE.
     * This is not the true upper bound : finding the real threshold
     * needs further investigation.
     */
    const U32 rleMaxLength = 25;
    size_t cSize;
    const BYTE* ip = (const BYTE*)src;
    BYTE* op = (BYTE*)dst;
    DEBUGLOG(5, "ZSTD_compressBlock_internal (dstCapacity=%u, dictLimit=%u, nextToUpdate=%u)",
                (unsigned)dstCapacity, (unsigned)zc->blockState.matchState.window.dictLimit,
                (unsigned)zc->blockState.matchState.nextToUpdate);

    {   const size_t bss = ZSTD_buildSeqStore(zc, src, srcSize);
        FORWARD_IF_ERROR(bss, "ZSTD_buildSeqStore failed");

        if (bss == ZSTDbss_noCompress) {
            /* too small to compress : report "not compressed" */
            cSize = 0;
        } else {
            /* sequence collection mode : export the sequences and stop here */
            if (zc->seqCollector.collectSequences) {
                ZSTD_copyBlockSequences(zc);
                return 0;
            }

            /* encode sequences and literals */
            cSize = ZSTD_compressSequences(&zc->seqStore,
                    &zc->blockState.prevCBlock->entropy, &zc->blockState.nextCBlock->entropy,
                    &zc->appliedParams,
                    dst, dstCapacity,
                    srcSize,
                    zc->entropyWorkspace, HUF_WORKSPACE_SIZE /* statically allocated in resetCCtx */,
                    zc->bmi2);

            /* The first block is never emitted as RLE, even if it qualifies :
             * doing so makes the decoder (cli only) of zstd <= v1.4.3 throw
             * a "should consume all input error."
             */
            if (frame && !zc->isFirstBlock) {
                if (cSize < rleMaxLength && ZSTD_isRLE(ip, srcSize)) {
                    cSize = 1;
                    op[0] = ip[0];
                }
            }
        }
    }

    /* only a genuinely compressed block validates the new repcodes and tables */
    if (!ZSTD_isError(cSize) && cSize > 1) {
        ZSTD_confirmRepcodesAndEntropyTables(zc);
    }
    /* Dictionaries are checked to have offset codes available for the first
     * block. After the first block, the offcode table might not have large
     * enough codes to represent the offsets in the data.
     */
    if (zc->blockState.prevCBlock->entropy.fse.offcode_repeatMode == FSE_repeat_valid)
        zc->blockState.prevCBlock->entropy.fse.offcode_repeatMode = FSE_repeat_check;

    return cSize;
}
2475*c03c5b1cSMartin Matuska 
/* ZSTD_compressBlock_targetCBlockSize_body() :
 * Emits one complete block into `dst`, given the outcome `bss` of
 * ZSTD_buildSeqStore() for that block. Tries, in order :
 * an RLE block, superblock compression, then a raw uncompressed block.
 * @return : value returned by whichever block writer was selected,
 *           or an error code. */
static size_t ZSTD_compressBlock_targetCBlockSize_body(ZSTD_CCtx* zc,
                               void* dst, size_t dstCapacity,
                               const void* src, size_t srcSize,
                               const size_t bss, U32 lastBlock)
{
    DEBUGLOG(6, "Attempting ZSTD_compressSuperBlock()");
    if (bss == ZSTDbss_compress) {
        /* The first block is never emitted as RLE, even if it qualifies :
         * doing so makes the decoder (cli only) of zstd <= v1.4.3 throw
         * a "should consume all input error."
         */
        int const emitRLE = !zc->isFirstBlock
                         && ZSTD_maybeRLE(&zc->seqStore)
                         && ZSTD_isRLE((BYTE const*)src, srcSize);
        if (emitRLE) {
            return ZSTD_rleCompressBlock(dst, dstCapacity, *(BYTE const*)src, srcSize, lastBlock);
        }

        /* Superblock compression attempt.
         *
         * The compressed size of ZSTD_compressSuperBlock() is not bound by the
         * standard ZSTD_compressBound(). That matters : even when space is
         * available now, taking an extra byte now could exhaust the output
         * later and violate ZSTD_compressBound().
         *
         * With blockBound(blockSize) = blockSize + ZSTD_blockHeaderSize,
         * respecting ZSTD_compressBound() requires falling back to a raw
         * uncompressed block in these cases :
         *   * cSize == 0 : return code for an uncompressed block.
         *   * cSize == dstSize_tooSmall : the block may have expanded beyond
         *     blockBound(srcSize). ZSTD_noCompressBlock() will itself return
         *     dstSize_tooSmall if output space is really exhausted.
         *   * cSize >= blockBound(srcSize) : the block expanded too much,
         *     so emit an uncompressed block.
         */
        {   size_t const cSize = ZSTD_compressSuperBlock(zc, dst, dstCapacity, src, srcSize, lastBlock);
            if (cSize != ERROR(dstSize_tooSmall)) {
                size_t const maxCSize = srcSize - ZSTD_minGain(srcSize, zc->appliedParams.cParams.strategy);
                FORWARD_IF_ERROR(cSize, "ZSTD_compressSuperBlock failed");
                if (cSize != 0 && cSize < maxCSize + ZSTD_blockHeaderSize) {
                    ZSTD_confirmRepcodesAndEntropyTables(zc);
                    return cSize;
                }
            }
        }
    }

    DEBUGLOG(6, "Resorting to ZSTD_noCompressBlock()");
    /* Superblock compression was not retained : emit a single raw block instead.
     * The decoder will be able to stream this block since it is uncompressed.
     */
    return ZSTD_noCompressBlock(dst, dstCapacity, src, srcSize, lastBlock);
}
2530*c03c5b1cSMartin Matuska 
/* ZSTD_compressBlock_targetCBlockSize() :
 * Builds the sequence store for the block, then emits the block through
 * ZSTD_compressBlock_targetCBlockSize_body().
 * On success, an offcode table marked FSE_repeat_valid in the previous block
 * state is downgraded to FSE_repeat_check.
 * @return : size written into `dst`, or an error code. */
static size_t ZSTD_compressBlock_targetCBlockSize(ZSTD_CCtx* zc,
                               void* dst, size_t dstCapacity,
                               const void* src, size_t srcSize,
                               U32 lastBlock)
{
    const size_t bss = ZSTD_buildSeqStore(zc, src, srcSize);
    DEBUGLOG(5, "ZSTD_compressBlock_targetCBlockSize (dstCapacity=%u, dictLimit=%u, nextToUpdate=%u, srcSize=%zu)",
                (unsigned)dstCapacity, (unsigned)zc->blockState.matchState.window.dictLimit, (unsigned)zc->blockState.matchState.nextToUpdate, srcSize);
    FORWARD_IF_ERROR(bss, "ZSTD_buildSeqStore failed");

    {   size_t const cSize = ZSTD_compressBlock_targetCBlockSize_body(zc, dst, dstCapacity, src, srcSize, bss, lastBlock);
        FORWARD_IF_ERROR(cSize, "ZSTD_compressBlock_targetCBlockSize_body failed");

        /* from now on, the offcode table must be checked before being reused */
        if (zc->blockState.prevCBlock->entropy.fse.offcode_repeatMode == FSE_repeat_valid)
            zc->blockState.prevCBlock->entropy.fse.offcode_repeatMode = FSE_repeat_check;

        return cSize;
    }
}
2550*c03c5b1cSMartin Matuska 
/* ZSTD_overflowCorrectIfNeeded() :
 * When ZSTD_window_needOverflowCorrection() reports that the window needs
 * correcting for input ending at `iend`, applies the correction to the window,
 * reduces the table indexes and `nextToUpdate` by the same amount,
 * and detaches any dictionary from the match state.
 * Does nothing otherwise. */
static void ZSTD_overflowCorrectIfNeeded(ZSTD_matchState_t* ms,
                                         ZSTD_cwksp* ws,
                                         ZSTD_CCtx_params const* params,
                                         void const* ip,
                                         void const* iend)
{
    if (!ZSTD_window_needOverflowCorrection(ms->window, iend)) return;

    {   U32 const maxDist = (U32)1 << params->cParams.windowLog;
        U32 const cycleLog = ZSTD_cycleLog(params->cParams.chainLog, params->cParams.strategy);
        U32 const correction = ZSTD_window_correctOverflow(&ms->window, cycleLog, maxDist, ip);
        ZSTD_STATIC_ASSERT(ZSTD_CHAINLOG_MAX <= 30);
        ZSTD_STATIC_ASSERT(ZSTD_WINDOWLOG_MAX_32 <= 30);
        ZSTD_STATIC_ASSERT(ZSTD_WINDOWLOG_MAX <= 31);

        /* tables are flagged dirty for the duration of the index reduction */
        ZSTD_cwksp_mark_tables_dirty(ws);
        ZSTD_reduceIndex(ms, params, correction);
        ZSTD_cwksp_mark_tables_clean(ws);

        /* shift nextToUpdate by the same amount, saturating at 0 */
        ms->nextToUpdate = (ms->nextToUpdate < correction) ? 0 : ms->nextToUpdate - correction;

        /* invalidate dictionaries on overflow correction */
        ms->loadedDictEnd = 0;
        ms->dictMatchState = NULL;
    }
}
2574*c03c5b1cSMartin Matuska 
2575*c03c5b1cSMartin Matuska /*! ZSTD_compress_frameChunk() :
2576*c03c5b1cSMartin Matuska *   Compress a chunk of data into one or multiple blocks.
2577*c03c5b1cSMartin Matuska *   All blocks will be terminated, all input will be consumed.
2578*c03c5b1cSMartin Matuska *   Function will issue an error if there is not enough `dstCapacity` to hold the compressed content.
2579*c03c5b1cSMartin Matuska *   Frame is supposed already started (header already produced)
2580*c03c5b1cSMartin Matuska *   @return : compressed size, or an error code
2581*c03c5b1cSMartin Matuska */
ZSTD_compress_frameChunk(ZSTD_CCtx * cctx,void * dst,size_t dstCapacity,const void * src,size_t srcSize,U32 lastFrameChunk)2582*c03c5b1cSMartin Matuska static size_t ZSTD_compress_frameChunk (ZSTD_CCtx* cctx,
2583*c03c5b1cSMartin Matuska                                      void* dst, size_t dstCapacity,
2584*c03c5b1cSMartin Matuska                                const void* src, size_t srcSize,
2585*c03c5b1cSMartin Matuska                                      U32 lastFrameChunk)
2586*c03c5b1cSMartin Matuska {
2587*c03c5b1cSMartin Matuska     size_t blockSize = cctx->blockSize;
2588*c03c5b1cSMartin Matuska     size_t remaining = srcSize;
2589*c03c5b1cSMartin Matuska     const BYTE* ip = (const BYTE*)src;
2590*c03c5b1cSMartin Matuska     BYTE* const ostart = (BYTE*)dst;
2591*c03c5b1cSMartin Matuska     BYTE* op = ostart;
2592*c03c5b1cSMartin Matuska     U32 const maxDist = (U32)1 << cctx->appliedParams.cParams.windowLog;
2593*c03c5b1cSMartin Matuska 
2594*c03c5b1cSMartin Matuska     assert(cctx->appliedParams.cParams.windowLog <= ZSTD_WINDOWLOG_MAX);
2595*c03c5b1cSMartin Matuska 
2596*c03c5b1cSMartin Matuska     DEBUGLOG(5, "ZSTD_compress_frameChunk (blockSize=%u)", (unsigned)blockSize);
2597*c03c5b1cSMartin Matuska     if (cctx->appliedParams.fParams.checksumFlag && srcSize)
2598*c03c5b1cSMartin Matuska         XXH64_update(&cctx->xxhState, src, srcSize);
2599*c03c5b1cSMartin Matuska 
2600*c03c5b1cSMartin Matuska     while (remaining) {
2601*c03c5b1cSMartin Matuska         ZSTD_matchState_t* const ms = &cctx->blockState.matchState;
2602*c03c5b1cSMartin Matuska         U32 const lastBlock = lastFrameChunk & (blockSize >= remaining);
2603*c03c5b1cSMartin Matuska 
2604*c03c5b1cSMartin Matuska         RETURN_ERROR_IF(dstCapacity < ZSTD_blockHeaderSize + MIN_CBLOCK_SIZE,
2605*c03c5b1cSMartin Matuska                         dstSize_tooSmall,
2606*c03c5b1cSMartin Matuska                         "not enough space to store compressed block");
2607*c03c5b1cSMartin Matuska         if (remaining < blockSize) blockSize = remaining;
2608*c03c5b1cSMartin Matuska 
2609*c03c5b1cSMartin Matuska         ZSTD_overflowCorrectIfNeeded(
2610*c03c5b1cSMartin Matuska             ms, &cctx->workspace, &cctx->appliedParams, ip, ip + blockSize);
2611*c03c5b1cSMartin Matuska         ZSTD_checkDictValidity(&ms->window, ip + blockSize, maxDist, &ms->loadedDictEnd, &ms->dictMatchState);
2612*c03c5b1cSMartin Matuska 
2613*c03c5b1cSMartin Matuska         /* Ensure hash/chain table insertion resumes no sooner than lowlimit */
2614*c03c5b1cSMartin Matuska         if (ms->nextToUpdate < ms->window.lowLimit) ms->nextToUpdate = ms->window.lowLimit;
2615*c03c5b1cSMartin Matuska 
2616*c03c5b1cSMartin Matuska         {   size_t cSize;
2617*c03c5b1cSMartin Matuska             if (ZSTD_useTargetCBlockSize(&cctx->appliedParams)) {
2618*c03c5b1cSMartin Matuska                 cSize = ZSTD_compressBlock_targetCBlockSize(cctx, op, dstCapacity, ip, blockSize, lastBlock);
2619*c03c5b1cSMartin Matuska                 FORWARD_IF_ERROR(cSize, "ZSTD_compressBlock_targetCBlockSize failed");
2620*c03c5b1cSMartin Matuska                 assert(cSize > 0);
2621*c03c5b1cSMartin Matuska                 assert(cSize <= blockSize + ZSTD_blockHeaderSize);
2622*c03c5b1cSMartin Matuska             } else {
2623*c03c5b1cSMartin Matuska                 cSize = ZSTD_compressBlock_internal(cctx,
2624*c03c5b1cSMartin Matuska                                         op+ZSTD_blockHeaderSize, dstCapacity-ZSTD_blockHeaderSize,
2625*c03c5b1cSMartin Matuska                                         ip, blockSize, 1 /* frame */);
2626*c03c5b1cSMartin Matuska                 FORWARD_IF_ERROR(cSize, "ZSTD_compressBlock_internal failed");
2627*c03c5b1cSMartin Matuska 
2628*c03c5b1cSMartin Matuska                 if (cSize == 0) {  /* block is not compressible */
2629*c03c5b1cSMartin Matuska                     cSize = ZSTD_noCompressBlock(op, dstCapacity, ip, blockSize, lastBlock);
2630*c03c5b1cSMartin Matuska                     FORWARD_IF_ERROR(cSize, "ZSTD_noCompressBlock failed");
2631*c03c5b1cSMartin Matuska                 } else {
2632*c03c5b1cSMartin Matuska                     U32 const cBlockHeader = cSize == 1 ?
2633*c03c5b1cSMartin Matuska                         lastBlock + (((U32)bt_rle)<<1) + (U32)(blockSize << 3) :
2634*c03c5b1cSMartin Matuska                         lastBlock + (((U32)bt_compressed)<<1) + (U32)(cSize << 3);
2635*c03c5b1cSMartin Matuska                     MEM_writeLE24(op, cBlockHeader);
2636*c03c5b1cSMartin Matuska                     cSize += ZSTD_blockHeaderSize;
2637*c03c5b1cSMartin Matuska                 }
2638*c03c5b1cSMartin Matuska             }
2639*c03c5b1cSMartin Matuska 
2640*c03c5b1cSMartin Matuska 
2641*c03c5b1cSMartin Matuska             ip += blockSize;
2642*c03c5b1cSMartin Matuska             assert(remaining >= blockSize);
2643*c03c5b1cSMartin Matuska             remaining -= blockSize;
2644*c03c5b1cSMartin Matuska             op += cSize;
2645*c03c5b1cSMartin Matuska             assert(dstCapacity >= cSize);
2646*c03c5b1cSMartin Matuska             dstCapacity -= cSize;
2647*c03c5b1cSMartin Matuska             cctx->isFirstBlock = 0;
2648*c03c5b1cSMartin Matuska             DEBUGLOG(5, "ZSTD_compress_frameChunk: adding a block of size %u",
2649*c03c5b1cSMartin Matuska                         (unsigned)cSize);
2650*c03c5b1cSMartin Matuska     }   }
2651*c03c5b1cSMartin Matuska 
2652*c03c5b1cSMartin Matuska     if (lastFrameChunk && (op>ostart)) cctx->stage = ZSTDcs_ending;
2653*c03c5b1cSMartin Matuska     return (size_t)(op-ostart);
2654*c03c5b1cSMartin Matuska }
2655*c03c5b1cSMartin Matuska 
2656*c03c5b1cSMartin Matuska 
/* ZSTD_writeFrameHeader() :
 * Writes a frame header at the start of `dst`, in this order :
 *   - the 4-byte magic number (only when params->format == ZSTD_f_zstd1),
 *   - the frame header descriptor byte,
 *   - the window descriptor byte (omitted for single-segment frames),
 *   - the dictionary ID, on 0, 1, 2 or 4 bytes,
 *   - the frame content size, on 0, 1, 2, 4 or 8 bytes.
 * `dstCapacity` must be >= ZSTD_FRAMEHEADERSIZE_MAX, whatever the size of
 * the header actually produced.
 * @return : nb of bytes written into `dst`,
 *           or dstSize_tooSmall if `dstCapacity` < ZSTD_FRAMEHEADERSIZE_MAX
 */
static size_t ZSTD_writeFrameHeader(void* dst, size_t dstCapacity,
                                    const ZSTD_CCtx_params* params, U64 pledgedSrcSize, U32 dictID)
{
    BYTE* const out = (BYTE*)dst;
    size_t written = 0;

    /* dictionary ID field : size code 0-3, forced to 0 when the ID must not be emitted */
    U32 const dictIDBytesCode = (dictID>0) + (dictID>=256) + (dictID>=65536);
    U32 const dictIDCode = params->fParams.noDictIDFlag ? 0 : dictIDBytesCode;

    /* frame content size field : size code 0-3, 0 when content size is not declared */
    U32 const contentSizeCode = params->fParams.contentSizeFlag ?
            (pledgedSrcSize>=256) + (pledgedSrcSize>=65536+256) + (pledgedSrcSize>=0xFFFFFFFFU) : 0;

    /* single segment : declared content fits within the window */
    U32 const windowSize = (U32)1 << params->cParams.windowLog;
    U32 const isSingleSegment = params->fParams.contentSizeFlag && (windowSize >= pledgedSrcSize);
    U32 const hasChecksum = params->fParams.checksumFlag>0;

    BYTE const windowDescriptor = (BYTE)((params->cParams.windowLog - ZSTD_WINDOWLOG_ABSOLUTEMIN) << 3);
    BYTE const frameDescriptor = (BYTE)(dictIDCode + (hasChecksum<<2) + (isSingleSegment<<5) + (contentSizeCode<<6));

    assert(!(params->fParams.contentSizeFlag && pledgedSrcSize == ZSTD_CONTENTSIZE_UNKNOWN));
    RETURN_ERROR_IF(dstCapacity < ZSTD_FRAMEHEADERSIZE_MAX, dstSize_tooSmall,
                    "dst buf is too small to fit worst-case frame header size.");
    DEBUGLOG(4, "ZSTD_writeFrameHeader : dictIDFlag : %u ; dictID : %u ; dictIDSizeCode : %u",
                !params->fParams.noDictIDFlag, (unsigned)dictID, (unsigned)dictIDCode);

    if (params->format == ZSTD_f_zstd1) {
        MEM_writeLE32(dst, ZSTD_MAGICNUMBER);
        written = 4;
    }

    out[written] = frameDescriptor;
    written += 1;
    if (!isSingleSegment) {
        out[written] = windowDescriptor;
        written += 1;
    }

    /* dictionary ID */
    if (dictIDCode == 1) {
        out[written] = (BYTE)(dictID);
        written += 1;
    } else if (dictIDCode == 2) {
        MEM_writeLE16(out+written, (U16)dictID);
        written += 2;
    } else if (dictIDCode == 3) {
        MEM_writeLE32(out+written, dictID);
        written += 4;
    } else {
        assert(dictIDCode == 0);   /* any other value is impossible */
    }

    /* frame content size */
    if (contentSizeCode == 1) {
        /* the 2-byte form stores the size with an offset of 256 */
        MEM_writeLE16(out+written, (U16)(pledgedSrcSize-256));
        written += 2;
    } else if (contentSizeCode == 2) {
        MEM_writeLE32(out+written, (U32)(pledgedSrcSize));
        written += 4;
    } else if (contentSizeCode == 3) {
        MEM_writeLE64(out+written, (U64)(pledgedSrcSize));
        written += 8;
    } else {
        assert(contentSizeCode == 0);   /* any other value is impossible */
        /* code 0 still carries a 1-byte size when the frame is single-segment */
        if (isSingleSegment) {
            out[written] = (BYTE)(pledgedSrcSize);
            written += 1;
        }
    }

    return written;
}
2701*c03c5b1cSMartin Matuska 
2702*c03c5b1cSMartin Matuska /* ZSTD_writeLastEmptyBlock() :
2703*c03c5b1cSMartin Matuska  * output an empty Block with end-of-frame mark to complete a frame
2704*c03c5b1cSMartin Matuska  * @return : size of data written into `dst` (== ZSTD_blockHeaderSize (defined in zstd_internal.h))
2705*c03c5b1cSMartin Matuska  *           or an error code if `dstCapacity` is too small (<ZSTD_blockHeaderSize)
2706*c03c5b1cSMartin Matuska  */
ZSTD_writeLastEmptyBlock(void * dst,size_t dstCapacity)2707*c03c5b1cSMartin Matuska size_t ZSTD_writeLastEmptyBlock(void* dst, size_t dstCapacity)
2708*c03c5b1cSMartin Matuska {
2709*c03c5b1cSMartin Matuska     RETURN_ERROR_IF(dstCapacity < ZSTD_blockHeaderSize, dstSize_tooSmall,
2710*c03c5b1cSMartin Matuska                     "dst buf is too small to write frame trailer empty block.");
2711*c03c5b1cSMartin Matuska     {   U32 const cBlockHeader24 = 1 /*lastBlock*/ + (((U32)bt_raw)<<1);  /* 0 size */
2712*c03c5b1cSMartin Matuska         MEM_writeLE24(dst, cBlockHeader24);
2713*c03c5b1cSMartin Matuska         return ZSTD_blockHeaderSize;
2714*c03c5b1cSMartin Matuska     }
2715*c03c5b1cSMartin Matuska }
2716*c03c5b1cSMartin Matuska 
/* ZSTD_referenceExternalSequences() :
 * Makes `cctx` reference the caller's array of `nbSeq` sequences as its external
 * sequence store. The array is referenced, not copied.
 * Only accepted while the context is in ZSTDcs_init stage, and refused when
 * long-distance matching is enabled in the applied parameters.
 * @return : 0, or an error code (stage_wrong, parameter_unsupported)
 */
size_t ZSTD_referenceExternalSequences(ZSTD_CCtx* cctx, rawSeq* seq, size_t nbSeq)
{
    RETURN_ERROR_IF(cctx->stage != ZSTDcs_init, stage_wrong,
                    "wrong cctx stage");
    RETURN_ERROR_IF(cctx->appliedParams.ldmParams.enableLdm,
                    parameter_unsupported,
                    "incompatible with ldm");

    /* the store is entirely filled, with its read position at the start */
    cctx->externSeqStore.pos = 0;
    cctx->externSeqStore.capacity = nbSeq;
    cctx->externSeqStore.size = nbSeq;
    cctx->externSeqStore.seq = seq;
    return 0;
}
2730*c03c5b1cSMartin Matuska 
2731*c03c5b1cSMartin Matuska 
/* ZSTD_compressContinue_internal() :
 * Shared implementation behind ZSTD_compressContinue() (`frame` != 0)
 * and ZSTD_compressBlock() (`frame` == 0).
 * In frame mode, the first call in ZSTDcs_init stage writes the frame header
 * ahead of the compressed data and moves the context to ZSTDcs_ongoing.
 * An empty input produces no block : only the frame header, if any, is returned.
 * When a source size was pledged, consuming more than the pledged amount is
 * reported as srcSize_wrong.
 * @return : nb of bytes written into `dst` (frame header included),
 *           or an error code
 */
static size_t ZSTD_compressContinue_internal (ZSTD_CCtx* cctx,
                              void* dst, size_t dstCapacity,
                        const void* src, size_t srcSize,
                               U32 frame, U32 lastFrameChunk)
{
    ZSTD_matchState_t* const matchState = &cctx->blockState.matchState;
    size_t headerSize = 0;
    size_t bodySize;

    DEBUGLOG(5, "ZSTD_compressContinue_internal, stage: %u, srcSize: %u",
                cctx->stage, (unsigned)srcSize);
    RETURN_ERROR_IF(cctx->stage==ZSTDcs_created, stage_wrong,
                    "missing init (ZSTD_compressBegin)");

    /* frame mode : the very first chunk is preceded by the frame header */
    if (frame && (cctx->stage==ZSTDcs_init)) {
        headerSize = ZSTD_writeFrameHeader(dst, dstCapacity, &cctx->appliedParams,
                                           cctx->pledgedSrcSizePlusOne-1, cctx->dictID);
        FORWARD_IF_ERROR(headerSize, "ZSTD_writeFrameHeader failed");
        assert(headerSize <= dstCapacity);
        dstCapacity -= headerSize;
        dst = (char*)dst + headerSize;
        cctx->stage = ZSTDcs_ongoing;
    }

    /* do not generate an empty block if no input */
    if (srcSize == 0) {
        return headerSize;
    }

    /* when the window update returns 0, match indexing restarts from dictLimit */
    if (!ZSTD_window_update(&matchState->window, src, srcSize)) {
        matchState->nextToUpdate = matchState->window.dictLimit;
    }
    if (cctx->appliedParams.ldmParams.enableLdm) {
        ZSTD_window_update(&cctx->ldmState.window, src, srcSize);
    }

    /* block mode : overflow check and correction is done here */
    if (!frame) {
        ZSTD_overflowCorrectIfNeeded(
            matchState, &cctx->workspace, &cctx->appliedParams,
            src, (BYTE const*)src + srcSize);
    }

    DEBUGLOG(5, "ZSTD_compressContinue_internal (blockSize=%u)", (unsigned)cctx->blockSize);
    if (frame) {
        bodySize = ZSTD_compress_frameChunk (cctx, dst, dstCapacity, src, srcSize, lastFrameChunk);
    } else {
        bodySize = ZSTD_compressBlock_internal (cctx, dst, dstCapacity, src, srcSize, 0 /* frame */);
    }
    FORWARD_IF_ERROR(bodySize, "%s", frame ? "ZSTD_compress_frameChunk failed" : "ZSTD_compressBlock_internal failed");

    /* progression accounting */
    cctx->consumedSrcSize += srcSize;
    cctx->producedCSize += (bodySize + headerSize);

    assert(!(cctx->appliedParams.fParams.contentSizeFlag && cctx->pledgedSrcSizePlusOne == 0));
    /* control src size : pledgedSrcSizePlusOne == 0 means no size was pledged */
    if (cctx->pledgedSrcSizePlusOne != 0) {
        ZSTD_STATIC_ASSERT(ZSTD_CONTENTSIZE_UNKNOWN == (unsigned long long)-1);
        RETURN_ERROR_IF(
            cctx->consumedSrcSize+1 > cctx->pledgedSrcSizePlusOne,
            srcSize_wrong,
            "error : pledgedSrcSize = %u, while realSrcSize >= %u",
            (unsigned)cctx->pledgedSrcSizePlusOne-1,
            (unsigned)cctx->consumedSrcSize);
    }

    return bodySize + headerSize;
}
2791*c03c5b1cSMartin Matuska 
/* ZSTD_compressContinue() :
 * Compresses `src` as the next chunk of the current frame.
 * Forwards to ZSTD_compressContinue_internal() in frame mode,
 * without marking the chunk as the last one.
 * @return : nb of bytes written into `dst`, or an error code
 */
size_t ZSTD_compressContinue (ZSTD_CCtx* cctx,
                              void* dst, size_t dstCapacity,
                        const void* src, size_t srcSize)
{
    U32 const frameMode = 1;
    U32 const lastChunk = 0;

    DEBUGLOG(5, "ZSTD_compressContinue (srcSize=%u)", (unsigned)srcSize);
    return ZSTD_compressContinue_internal(cctx, dst, dstCapacity, src, srcSize, frameMode, lastChunk);
}
2799*c03c5b1cSMartin Matuska 
2800*c03c5b1cSMartin Matuska 
ZSTD_getBlockSize(const ZSTD_CCtx * cctx)2801*c03c5b1cSMartin Matuska size_t ZSTD_getBlockSize(const ZSTD_CCtx* cctx)
2802*c03c5b1cSMartin Matuska {
2803*c03c5b1cSMartin Matuska     ZSTD_compressionParameters const cParams = cctx->appliedParams.cParams;
2804*c03c5b1cSMartin Matuska     assert(!ZSTD_checkCParams(cParams));
2805*c03c5b1cSMartin Matuska     return MIN (ZSTD_BLOCKSIZE_MAX, (U32)1 << cParams.windowLog);
2806*c03c5b1cSMartin Matuska }
2807*c03c5b1cSMartin Matuska 
/* ZSTD_compressBlock() :
 * Compresses `src` as a single block, in block mode (no frame header).
 * `srcSize` must not exceed ZSTD_getBlockSize(cctx).
 * @return : nb of bytes written into `dst`,
 *           or an error code (srcSize_wrong when the input is larger than a block)
 */
size_t ZSTD_compressBlock(ZSTD_CCtx* cctx, void* dst, size_t dstCapacity, const void* src, size_t srcSize)
{
    size_t maxBlockSize;

    DEBUGLOG(5, "ZSTD_compressBlock: srcSize = %u", (unsigned)srcSize);
    maxBlockSize = ZSTD_getBlockSize(cctx);
    RETURN_ERROR_IF(srcSize > maxBlockSize, srcSize_wrong, "input is larger than a block");

    return ZSTD_compressContinue_internal(cctx, dst, dstCapacity, src, srcSize, 0 /* frame mode */, 0 /* last chunk */);
}
2816*c03c5b1cSMartin Matuska 
2817*c03c5b1cSMartin Matuska /*! ZSTD_loadDictionaryContent() :
2818*c03c5b1cSMartin Matuska  *  @return : 0, or an error code
2819*c03c5b1cSMartin Matuska  */
ZSTD_loadDictionaryContent(ZSTD_matchState_t * ms,ldmState_t * ls,ZSTD_cwksp * ws,ZSTD_CCtx_params const * params,const void * src,size_t srcSize,ZSTD_dictTableLoadMethod_e dtlm)2820*c03c5b1cSMartin Matuska static size_t ZSTD_loadDictionaryContent(ZSTD_matchState_t* ms,
2821*c03c5b1cSMartin Matuska                                          ldmState_t* ls,
2822*c03c5b1cSMartin Matuska                                          ZSTD_cwksp* ws,
2823*c03c5b1cSMartin Matuska                                          ZSTD_CCtx_params const* params,
2824*c03c5b1cSMartin Matuska                                          const void* src, size_t srcSize,
2825*c03c5b1cSMartin Matuska                                          ZSTD_dictTableLoadMethod_e dtlm)
2826*c03c5b1cSMartin Matuska {
2827*c03c5b1cSMartin Matuska     const BYTE* ip = (const BYTE*) src;
2828*c03c5b1cSMartin Matuska     const BYTE* const iend = ip + srcSize;
2829*c03c5b1cSMartin Matuska 
2830*c03c5b1cSMartin Matuska     ZSTD_window_update(&ms->window, src, srcSize);
2831*c03c5b1cSMartin Matuska     ms->loadedDictEnd = params->forceWindow ? 0 : (U32)(iend - ms->window.base);
2832*c03c5b1cSMartin Matuska 
2833*c03c5b1cSMartin Matuska     if (params->ldmParams.enableLdm && ls != NULL) {
2834*c03c5b1cSMartin Matuska         ZSTD_window_update(&ls->window, src, srcSize);
2835*c03c5b1cSMartin Matuska         ls->loadedDictEnd = params->forceWindow ? 0 : (U32)(iend - ls->window.base);
2836*c03c5b1cSMartin Matuska     }
2837*c03c5b1cSMartin Matuska 
2838*c03c5b1cSMartin Matuska     /* Assert that we the ms params match the params we're being given */
2839*c03c5b1cSMartin Matuska     ZSTD_assertEqualCParams(params->cParams, ms->cParams);
2840*c03c5b1cSMartin Matuska 
2841*c03c5b1cSMartin Matuska     if (srcSize <= HASH_READ_SIZE) return 0;
2842*c03c5b1cSMartin Matuska 
2843*c03c5b1cSMartin Matuska     while (iend - ip > HASH_READ_SIZE) {
2844*c03c5b1cSMartin Matuska         size_t const remaining = (size_t)(iend - ip);
2845*c03c5b1cSMartin Matuska         size_t const chunk = MIN(remaining, ZSTD_CHUNKSIZE_MAX);
2846*c03c5b1cSMartin Matuska         const BYTE* const ichunk = ip + chunk;
2847*c03c5b1cSMartin Matuska 
2848*c03c5b1cSMartin Matuska         ZSTD_overflowCorrectIfNeeded(ms, ws, params, ip, ichunk);
2849*c03c5b1cSMartin Matuska 
2850*c03c5b1cSMartin Matuska         if (params->ldmParams.enableLdm && ls != NULL)
2851*c03c5b1cSMartin Matuska             ZSTD_ldm_fillHashTable(ls, (const BYTE*)src, (const BYTE*)src + srcSize, &params->ldmParams);
2852*c03c5b1cSMartin Matuska 
2853*c03c5b1cSMartin Matuska         switch(params->cParams.strategy)
2854*c03c5b1cSMartin Matuska         {
2855*c03c5b1cSMartin Matuska         case ZSTD_fast:
2856*c03c5b1cSMartin Matuska             ZSTD_fillHashTable(ms, ichunk, dtlm);
2857*c03c5b1cSMartin Matuska             break;
2858*c03c5b1cSMartin Matuska         case ZSTD_dfast:
2859*c03c5b1cSMartin Matuska             ZSTD_fillDoubleHashTable(ms, ichunk, dtlm);
2860*c03c5b1cSMartin Matuska             break;
2861*c03c5b1cSMartin Matuska 
2862*c03c5b1cSMartin Matuska         case ZSTD_greedy:
2863*c03c5b1cSMartin Matuska         case ZSTD_lazy:
2864*c03c5b1cSMartin Matuska         case ZSTD_lazy2:
2865*c03c5b1cSMartin Matuska             if (chunk >= HASH_READ_SIZE)
2866*c03c5b1cSMartin Matuska                 ZSTD_insertAndFindFirstIndex(ms, ichunk-HASH_READ_SIZE);
2867*c03c5b1cSMartin Matuska             break;
2868*c03c5b1cSMartin Matuska 
2869*c03c5b1cSMartin Matuska         case ZSTD_btlazy2:   /* we want the dictionary table fully sorted */
2870*c03c5b1cSMartin Matuska         case ZSTD_btopt:
2871*c03c5b1cSMartin Matuska         case ZSTD_btultra:
2872*c03c5b1cSMartin Matuska         case ZSTD_btultra2:
2873*c03c5b1cSMartin Matuska             if (chunk >= HASH_READ_SIZE)
2874*c03c5b1cSMartin Matuska                 ZSTD_updateTree(ms, ichunk-HASH_READ_SIZE, ichunk);
2875*c03c5b1cSMartin Matuska             break;
2876*c03c5b1cSMartin Matuska 
2877*c03c5b1cSMartin Matuska         default:
2878*c03c5b1cSMartin Matuska             assert(0);  /* not possible : not a valid strategy id */
2879*c03c5b1cSMartin Matuska         }
2880*c03c5b1cSMartin Matuska 
2881*c03c5b1cSMartin Matuska         ip = ichunk;
2882*c03c5b1cSMartin Matuska     }
2883*c03c5b1cSMartin Matuska 
2884*c03c5b1cSMartin Matuska     ms->nextToUpdate = (U32)(iend - ms->window.base);
2885*c03c5b1cSMartin Matuska     return 0;
2886*c03c5b1cSMartin Matuska }
2887*c03c5b1cSMartin Matuska 
2888*c03c5b1cSMartin Matuska 
2889*c03c5b1cSMartin Matuska /* Dictionaries that assign zero probability to symbols that show up causes problems
2890*c03c5b1cSMartin Matuska    when FSE encoding.  Refuse dictionaries that assign zero probability to symbols
2891*c03c5b1cSMartin Matuska    that we may encounter during compression.
2892*c03c5b1cSMartin Matuska    NOTE: This behavior is not standard and could be improved in the future. */
ZSTD_checkDictNCount(short * normalizedCounter,unsigned dictMaxSymbolValue,unsigned maxSymbolValue)2893*c03c5b1cSMartin Matuska static size_t ZSTD_checkDictNCount(short* normalizedCounter, unsigned dictMaxSymbolValue, unsigned maxSymbolValue) {
2894*c03c5b1cSMartin Matuska     U32 s;
2895*c03c5b1cSMartin Matuska     RETURN_ERROR_IF(dictMaxSymbolValue < maxSymbolValue, dictionary_corrupted, "dict fse tables don't have all symbols");
2896*c03c5b1cSMartin Matuska     for (s = 0; s <= maxSymbolValue; ++s) {
2897*c03c5b1cSMartin Matuska         RETURN_ERROR_IF(normalizedCounter[s] == 0, dictionary_corrupted, "dict fse tables don't have all symbols");
2898*c03c5b1cSMartin Matuska     }
2899*c03c5b1cSMartin Matuska     return 0;
2900*c03c5b1cSMartin Matuska }
2901*c03c5b1cSMartin Matuska 
/*! ZSTD_loadCEntropy() :
 *  Reads the entropy section of a zstd dictionary and fills `bs` from it :
 *  the Huffman table for literals, the offset-code, match-length and
 *  literal-length FSE tables, and the 3 initial repeat offsets.
 *  `dict` must point at the beginning of the dictionary : the first 8 bytes
 *  (magic number + dictID) are skipped without being interpreted here.
 *  `offcodeNCount` / `*offcodeMaxValue` receive the offset-code distribution,
 *  so that the caller can validate it once the dictionary content size is known.
 *  NOTE(review): `*offcodeMaxValue` is handed to FSE_readNCount() as-is, and the
 *  offset table is built up to symbol MaxOff; this presumably requires the caller
 *  to initialise it to MaxOff and to provide MaxOff+1 counters - confirm.
 *  `workspace` : scratch buffer, used as HUF_WORKSPACE_SIZE bytes.
 * @return : size of the dictionary header
 *           (magic number + dictID + entropy tables + repeat offsets),
 *           or an error code (dictionary_corrupted)
 */
size_t ZSTD_loadCEntropy(ZSTD_compressedBlockState_t* bs, void* workspace,
                         short* offcodeNCount, unsigned* offcodeMaxValue,
                         const void* const dict, size_t dictSize)
{
    const BYTE* dictPtr = (const BYTE*)dict;
    const BYTE* const dictEnd = dictPtr + dictSize;

    /* The header starts with magic number + dictID (8 bytes) : refuse shorter
     * inputs rather than moving dictPtr beyond the end of the buffer. */
    RETURN_ERROR_IF(dictSize < 8, dictionary_corrupted, "");
    dictPtr += 8;   /* skip magic num and dict ID */
    bs->entropy.huf.repeatMode = HUF_repeat_check;

    /* literals : Huffman table */
    {   unsigned maxSymbolValue = 255;
        unsigned hasZeroWeights = 1;
        size_t const hufHeaderSize = HUF_readCTable((HUF_CElt*)bs->entropy.huf.CTable, &maxSymbolValue, dictPtr,
            (size_t)(dictEnd-dictPtr), &hasZeroWeights);

        /* We only set the loaded table as valid if it contains all non-zero
         * weights. Otherwise, we set it to check */
        if (!hasZeroWeights)
            bs->entropy.huf.repeatMode = HUF_repeat_valid;

        RETURN_ERROR_IF(HUF_isError(hufHeaderSize), dictionary_corrupted, "");
        RETURN_ERROR_IF(maxSymbolValue < 255, dictionary_corrupted, "");
        dictPtr += hufHeaderSize;
    }

    /* offset codes */
    {   unsigned offcodeLog;
        size_t const offcodeHeaderSize = FSE_readNCount(offcodeNCount, offcodeMaxValue, &offcodeLog, dictPtr, (size_t)(dictEnd-dictPtr));
        RETURN_ERROR_IF(FSE_isError(offcodeHeaderSize), dictionary_corrupted, "");
        RETURN_ERROR_IF(offcodeLog > OffFSELog, dictionary_corrupted, "");
        /* Defer checking offcodeMaxValue because we need to know the size of the dictionary content */
        /* fill all offset symbols to avoid garbage at end of table */
        RETURN_ERROR_IF(FSE_isError(FSE_buildCTable_wksp(
                bs->entropy.fse.offcodeCTable,
                offcodeNCount, MaxOff, offcodeLog,
                workspace, HUF_WORKSPACE_SIZE)),
            dictionary_corrupted, "");
        dictPtr += offcodeHeaderSize;
    }

    /* match lengths */
    {   short matchlengthNCount[MaxML+1];
        unsigned matchlengthMaxValue = MaxML, matchlengthLog;
        size_t const matchlengthHeaderSize = FSE_readNCount(matchlengthNCount, &matchlengthMaxValue, &matchlengthLog, dictPtr, (size_t)(dictEnd-dictPtr));
        RETURN_ERROR_IF(FSE_isError(matchlengthHeaderSize), dictionary_corrupted, "");
        RETURN_ERROR_IF(matchlengthLog > MLFSELog, dictionary_corrupted, "");
        /* Every match length code must have non-zero probability */
        FORWARD_IF_ERROR( ZSTD_checkDictNCount(matchlengthNCount, matchlengthMaxValue, MaxML), "");
        RETURN_ERROR_IF(FSE_isError(FSE_buildCTable_wksp(
                bs->entropy.fse.matchlengthCTable,
                matchlengthNCount, matchlengthMaxValue, matchlengthLog,
                workspace, HUF_WORKSPACE_SIZE)),
            dictionary_corrupted, "");
        dictPtr += matchlengthHeaderSize;
    }

    /* literal lengths */
    {   short litlengthNCount[MaxLL+1];
        unsigned litlengthMaxValue = MaxLL, litlengthLog;
        size_t const litlengthHeaderSize = FSE_readNCount(litlengthNCount, &litlengthMaxValue, &litlengthLog, dictPtr, (size_t)(dictEnd-dictPtr));
        RETURN_ERROR_IF(FSE_isError(litlengthHeaderSize), dictionary_corrupted, "");
        RETURN_ERROR_IF(litlengthLog > LLFSELog, dictionary_corrupted, "");
        /* Every literal length code must have non-zero probability */
        FORWARD_IF_ERROR( ZSTD_checkDictNCount(litlengthNCount, litlengthMaxValue, MaxLL), "");
        RETURN_ERROR_IF(FSE_isError(FSE_buildCTable_wksp(
                bs->entropy.fse.litlengthCTable,
                litlengthNCount, litlengthMaxValue, litlengthLog,
                workspace, HUF_WORKSPACE_SIZE)),
            dictionary_corrupted, "");
        dictPtr += litlengthHeaderSize;
    }

    /* 3 repeat offsets, 4 bytes each.
     * The remaining size is compared, instead of forming dictPtr+12, because
     * a pointer beyond one-past-the-end of the buffer must not be computed. */
    RETURN_ERROR_IF((dictEnd - dictPtr) < 12, dictionary_corrupted, "");
    bs->rep[0] = MEM_readLE32(dictPtr+0);
    bs->rep[1] = MEM_readLE32(dictPtr+4);
    bs->rep[2] = MEM_readLE32(dictPtr+8);
    dictPtr += 12;

    return (size_t)(dictPtr - (const BYTE*)dict);
}
2978*c03c5b1cSMartin Matuska 
2979*c03c5b1cSMartin Matuska /* Dictionary format :
2980*c03c5b1cSMartin Matuska  * See :
2981*c03c5b1cSMartin Matuska  * https://github.com/facebook/zstd/blob/master/doc/zstd_compression_format.md#dictionary-format
2982*c03c5b1cSMartin Matuska  */
2983*c03c5b1cSMartin Matuska /*! ZSTD_loadZstdDictionary() :
2984*c03c5b1cSMartin Matuska  * @return : dictID, or an error code
2985*c03c5b1cSMartin Matuska  *  assumptions : magic number supposed already checked
2986*c03c5b1cSMartin Matuska  *                dictSize supposed >= 8
2987*c03c5b1cSMartin Matuska  */
ZSTD_loadZstdDictionary(ZSTD_compressedBlockState_t * bs,ZSTD_matchState_t * ms,ZSTD_cwksp * ws,ZSTD_CCtx_params const * params,const void * dict,size_t dictSize,ZSTD_dictTableLoadMethod_e dtlm,void * workspace)2988*c03c5b1cSMartin Matuska static size_t ZSTD_loadZstdDictionary(ZSTD_compressedBlockState_t* bs,
2989*c03c5b1cSMartin Matuska                                       ZSTD_matchState_t* ms,
2990*c03c5b1cSMartin Matuska                                       ZSTD_cwksp* ws,
2991*c03c5b1cSMartin Matuska                                       ZSTD_CCtx_params const* params,
2992*c03c5b1cSMartin Matuska                                       const void* dict, size_t dictSize,
2993*c03c5b1cSMartin Matuska                                       ZSTD_dictTableLoadMethod_e dtlm,
2994*c03c5b1cSMartin Matuska                                       void* workspace)
2995*c03c5b1cSMartin Matuska {
2996*c03c5b1cSMartin Matuska     const BYTE* dictPtr = (const BYTE*)dict;
2997*c03c5b1cSMartin Matuska     const BYTE* const dictEnd = dictPtr + dictSize;
2998*c03c5b1cSMartin Matuska     short offcodeNCount[MaxOff+1];
2999*c03c5b1cSMartin Matuska     unsigned offcodeMaxValue = MaxOff;
3000*c03c5b1cSMartin Matuska     size_t dictID;
3001*c03c5b1cSMartin Matuska     size_t eSize;
3002*c03c5b1cSMartin Matuska 
3003*c03c5b1cSMartin Matuska     ZSTD_STATIC_ASSERT(HUF_WORKSPACE_SIZE >= (1<<MAX(MLFSELog,LLFSELog)));
3004*c03c5b1cSMartin Matuska     assert(dictSize >= 8);
3005*c03c5b1cSMartin Matuska     assert(MEM_readLE32(dictPtr) == ZSTD_MAGIC_DICTIONARY);
3006*c03c5b1cSMartin Matuska 
3007*c03c5b1cSMartin Matuska     dictID = params->fParams.noDictIDFlag ? 0 :  MEM_readLE32(dictPtr + 4 /* skip magic number */ );
3008*c03c5b1cSMartin Matuska     eSize = ZSTD_loadCEntropy(bs, workspace, offcodeNCount, &offcodeMaxValue, dict, dictSize);
3009*c03c5b1cSMartin Matuska     FORWARD_IF_ERROR(eSize, "ZSTD_loadCEntropy failed");
3010*c03c5b1cSMartin Matuska     dictPtr += eSize;
3011*c03c5b1cSMartin Matuska 
3012*c03c5b1cSMartin Matuska     {   size_t const dictContentSize = (size_t)(dictEnd - dictPtr);
3013*c03c5b1cSMartin Matuska         U32 offcodeMax = MaxOff;
3014*c03c5b1cSMartin Matuska         if (dictContentSize <= ((U32)-1) - 128 KB) {
3015*c03c5b1cSMartin Matuska             U32 const maxOffset = (U32)dictContentSize + 128 KB; /* The maximum offset that must be supported */
3016*c03c5b1cSMartin Matuska             offcodeMax = ZSTD_highbit32(maxOffset); /* Calculate minimum offset code required to represent maxOffset */
3017*c03c5b1cSMartin Matuska         }
3018*c03c5b1cSMartin Matuska         /* All offset values <= dictContentSize + 128 KB must be representable */
3019*c03c5b1cSMartin Matuska         FORWARD_IF_ERROR(ZSTD_checkDictNCount(offcodeNCount, offcodeMaxValue, MIN(offcodeMax, MaxOff)), "");
3020*c03c5b1cSMartin Matuska         /* All repCodes must be <= dictContentSize and != 0*/
3021*c03c5b1cSMartin Matuska         {   U32 u;
3022*c03c5b1cSMartin Matuska             for (u=0; u<3; u++) {
3023*c03c5b1cSMartin Matuska                 RETURN_ERROR_IF(bs->rep[u] == 0, dictionary_corrupted, "");
3024*c03c5b1cSMartin Matuska                 RETURN_ERROR_IF(bs->rep[u] > dictContentSize, dictionary_corrupted, "");
3025*c03c5b1cSMartin Matuska         }   }
3026*c03c5b1cSMartin Matuska 
3027*c03c5b1cSMartin Matuska         bs->entropy.fse.offcode_repeatMode = FSE_repeat_valid;
3028*c03c5b1cSMartin Matuska         bs->entropy.fse.matchlength_repeatMode = FSE_repeat_valid;
3029*c03c5b1cSMartin Matuska         bs->entropy.fse.litlength_repeatMode = FSE_repeat_valid;
3030*c03c5b1cSMartin Matuska         FORWARD_IF_ERROR(ZSTD_loadDictionaryContent(
3031*c03c5b1cSMartin Matuska             ms, NULL, ws, params, dictPtr, dictContentSize, dtlm), "");
3032*c03c5b1cSMartin Matuska         return dictID;
3033*c03c5b1cSMartin Matuska     }
3034*c03c5b1cSMartin Matuska }
3035*c03c5b1cSMartin Matuska 
3036*c03c5b1cSMartin Matuska /** ZSTD_compress_insertDictionary() :
3037*c03c5b1cSMartin Matuska *   @return : dictID, or an error code */
3038*c03c5b1cSMartin Matuska static size_t
ZSTD_compress_insertDictionary(ZSTD_compressedBlockState_t * bs,ZSTD_matchState_t * ms,ldmState_t * ls,ZSTD_cwksp * ws,const ZSTD_CCtx_params * params,const void * dict,size_t dictSize,ZSTD_dictContentType_e dictContentType,ZSTD_dictTableLoadMethod_e dtlm,void * workspace)3039*c03c5b1cSMartin Matuska ZSTD_compress_insertDictionary(ZSTD_compressedBlockState_t* bs,
3040*c03c5b1cSMartin Matuska                                ZSTD_matchState_t* ms,
3041*c03c5b1cSMartin Matuska                                ldmState_t* ls,
3042*c03c5b1cSMartin Matuska                                ZSTD_cwksp* ws,
3043*c03c5b1cSMartin Matuska                          const ZSTD_CCtx_params* params,
3044*c03c5b1cSMartin Matuska                          const void* dict, size_t dictSize,
3045*c03c5b1cSMartin Matuska                                ZSTD_dictContentType_e dictContentType,
3046*c03c5b1cSMartin Matuska                                ZSTD_dictTableLoadMethod_e dtlm,
3047*c03c5b1cSMartin Matuska                                void* workspace)
3048*c03c5b1cSMartin Matuska {
3049*c03c5b1cSMartin Matuska     DEBUGLOG(4, "ZSTD_compress_insertDictionary (dictSize=%u)", (U32)dictSize);
3050*c03c5b1cSMartin Matuska     if ((dict==NULL) || (dictSize<8)) {
3051*c03c5b1cSMartin Matuska         RETURN_ERROR_IF(dictContentType == ZSTD_dct_fullDict, dictionary_wrong, "");
3052*c03c5b1cSMartin Matuska         return 0;
3053*c03c5b1cSMartin Matuska     }
3054*c03c5b1cSMartin Matuska 
3055*c03c5b1cSMartin Matuska     ZSTD_reset_compressedBlockState(bs);
3056*c03c5b1cSMartin Matuska 
3057*c03c5b1cSMartin Matuska     /* dict restricted modes */
3058*c03c5b1cSMartin Matuska     if (dictContentType == ZSTD_dct_rawContent)
3059*c03c5b1cSMartin Matuska         return ZSTD_loadDictionaryContent(ms, ls, ws, params, dict, dictSize, dtlm);
3060*c03c5b1cSMartin Matuska 
3061*c03c5b1cSMartin Matuska     if (MEM_readLE32(dict) != ZSTD_MAGIC_DICTIONARY) {
3062*c03c5b1cSMartin Matuska         if (dictContentType == ZSTD_dct_auto) {
3063*c03c5b1cSMartin Matuska             DEBUGLOG(4, "raw content dictionary detected");
3064*c03c5b1cSMartin Matuska             return ZSTD_loadDictionaryContent(
3065*c03c5b1cSMartin Matuska                 ms, ls, ws, params, dict, dictSize, dtlm);
3066*c03c5b1cSMartin Matuska         }
3067*c03c5b1cSMartin Matuska         RETURN_ERROR_IF(dictContentType == ZSTD_dct_fullDict, dictionary_wrong, "");
3068*c03c5b1cSMartin Matuska         assert(0);   /* impossible */
3069*c03c5b1cSMartin Matuska     }
3070*c03c5b1cSMartin Matuska 
3071*c03c5b1cSMartin Matuska     /* dict as full zstd dictionary */
3072*c03c5b1cSMartin Matuska     return ZSTD_loadZstdDictionary(
3073*c03c5b1cSMartin Matuska         bs, ms, ws, params, dict, dictSize, dtlm, workspace);
3074*c03c5b1cSMartin Matuska }
3075*c03c5b1cSMartin Matuska 
/* Thresholds read by ZSTD_compressBegin_internal() when a cdict is provided :
 * the context is reset through ZSTD_resetCCtx_usingCDict() when, among other
 * conditions, the pledged source size is below the cutoff, or below
 * the cdict content size times the multiplier. */
#define ZSTD_USE_CDICT_PARAMS_SRCSIZE_CUTOFF (128 KB)
#define ZSTD_USE_CDICT_PARAMS_DICTSIZE_MULTIPLIER (6)
3078*c03c5b1cSMartin Matuska 
3079*c03c5b1cSMartin Matuska /*! ZSTD_compressBegin_internal() :
3080*c03c5b1cSMartin Matuska  * @return : 0, or an error code */
ZSTD_compressBegin_internal(ZSTD_CCtx * cctx,const void * dict,size_t dictSize,ZSTD_dictContentType_e dictContentType,ZSTD_dictTableLoadMethod_e dtlm,const ZSTD_CDict * cdict,const ZSTD_CCtx_params * params,U64 pledgedSrcSize,ZSTD_buffered_policy_e zbuff)3081*c03c5b1cSMartin Matuska static size_t ZSTD_compressBegin_internal(ZSTD_CCtx* cctx,
3082*c03c5b1cSMartin Matuska                                     const void* dict, size_t dictSize,
3083*c03c5b1cSMartin Matuska                                     ZSTD_dictContentType_e dictContentType,
3084*c03c5b1cSMartin Matuska                                     ZSTD_dictTableLoadMethod_e dtlm,
3085*c03c5b1cSMartin Matuska                                     const ZSTD_CDict* cdict,
3086*c03c5b1cSMartin Matuska                                     const ZSTD_CCtx_params* params, U64 pledgedSrcSize,
3087*c03c5b1cSMartin Matuska                                     ZSTD_buffered_policy_e zbuff)
3088*c03c5b1cSMartin Matuska {
3089*c03c5b1cSMartin Matuska     DEBUGLOG(4, "ZSTD_compressBegin_internal: wlog=%u", params->cParams.windowLog);
3090*c03c5b1cSMartin Matuska     /* params are supposed to be fully validated at this point */
3091*c03c5b1cSMartin Matuska     assert(!ZSTD_isError(ZSTD_checkCParams(params->cParams)));
3092*c03c5b1cSMartin Matuska     assert(!((dict) && (cdict)));  /* either dict or cdict, not both */
3093*c03c5b1cSMartin Matuska     if ( (cdict)
3094*c03c5b1cSMartin Matuska       && (cdict->dictContentSize > 0)
3095*c03c5b1cSMartin Matuska       && ( pledgedSrcSize < ZSTD_USE_CDICT_PARAMS_SRCSIZE_CUTOFF
3096*c03c5b1cSMartin Matuska         || pledgedSrcSize < cdict->dictContentSize * ZSTD_USE_CDICT_PARAMS_DICTSIZE_MULTIPLIER
3097*c03c5b1cSMartin Matuska         || pledgedSrcSize == ZSTD_CONTENTSIZE_UNKNOWN
3098*c03c5b1cSMartin Matuska         || cdict->compressionLevel == 0)
3099*c03c5b1cSMartin Matuska       && (params->attachDictPref != ZSTD_dictForceLoad) ) {
3100*c03c5b1cSMartin Matuska         return ZSTD_resetCCtx_usingCDict(cctx, cdict, params, pledgedSrcSize, zbuff);
3101*c03c5b1cSMartin Matuska     }
3102*c03c5b1cSMartin Matuska 
3103*c03c5b1cSMartin Matuska     FORWARD_IF_ERROR( ZSTD_resetCCtx_internal(cctx, *params, pledgedSrcSize,
3104*c03c5b1cSMartin Matuska                                      ZSTDcrp_makeClean, zbuff) , "");
3105*c03c5b1cSMartin Matuska     {   size_t const dictID = cdict ?
3106*c03c5b1cSMartin Matuska                 ZSTD_compress_insertDictionary(
3107*c03c5b1cSMartin Matuska                         cctx->blockState.prevCBlock, &cctx->blockState.matchState,
3108*c03c5b1cSMartin Matuska                         &cctx->ldmState, &cctx->workspace, &cctx->appliedParams, cdict->dictContent,
3109*c03c5b1cSMartin Matuska                         cdict->dictContentSize, dictContentType, dtlm,
3110*c03c5b1cSMartin Matuska                         cctx->entropyWorkspace)
3111*c03c5b1cSMartin Matuska               : ZSTD_compress_insertDictionary(
3112*c03c5b1cSMartin Matuska                         cctx->blockState.prevCBlock, &cctx->blockState.matchState,
3113*c03c5b1cSMartin Matuska                         &cctx->ldmState, &cctx->workspace, &cctx->appliedParams, dict, dictSize,
3114*c03c5b1cSMartin Matuska                         dictContentType, dtlm, cctx->entropyWorkspace);
3115*c03c5b1cSMartin Matuska         FORWARD_IF_ERROR(dictID, "ZSTD_compress_insertDictionary failed");
3116*c03c5b1cSMartin Matuska         assert(dictID <= UINT_MAX);
3117*c03c5b1cSMartin Matuska         cctx->dictID = (U32)dictID;
3118*c03c5b1cSMartin Matuska     }
3119*c03c5b1cSMartin Matuska     return 0;
3120*c03c5b1cSMartin Matuska }
3121*c03c5b1cSMartin Matuska 
/*! ZSTD_compressBegin_advanced_internal() :
 *  Validates params->cParams, then begins a frame in non-buffered mode
 *  by forwarding every argument to ZSTD_compressBegin_internal().
 * @return : 0, or an error code */
size_t ZSTD_compressBegin_advanced_internal(ZSTD_CCtx* cctx,
                                    const void* dict, size_t dictSize,
                                    ZSTD_dictContentType_e dictContentType,
                                    ZSTD_dictTableLoadMethod_e dtlm,
                                    const ZSTD_CDict* cdict,
                                    const ZSTD_CCtx_params* params,
                                    unsigned long long pledgedSrcSize)
{
    DEBUGLOG(4, "ZSTD_compressBegin_advanced_internal: wlog=%u", params->cParams.windowLog);

    /* refuse invalid compression parameters before the context is touched */
    FORWARD_IF_ERROR( ZSTD_checkCParams(params->cParams) , "");

    return ZSTD_compressBegin_internal(
                cctx,
                dict, dictSize, dictContentType, dtlm,
                cdict,
                params, pledgedSrcSize,
                ZSTDb_not_buffered);
}
3139*c03c5b1cSMartin Matuska 
3140*c03c5b1cSMartin Matuska /*! ZSTD_compressBegin_advanced() :
3141*c03c5b1cSMartin Matuska *   @return : 0, or an error code */
ZSTD_compressBegin_advanced(ZSTD_CCtx * cctx,const void * dict,size_t dictSize,ZSTD_parameters params,unsigned long long pledgedSrcSize)3142*c03c5b1cSMartin Matuska size_t ZSTD_compressBegin_advanced(ZSTD_CCtx* cctx,
3143*c03c5b1cSMartin Matuska                              const void* dict, size_t dictSize,
3144*c03c5b1cSMartin Matuska                                    ZSTD_parameters params, unsigned long long pledgedSrcSize)
3145*c03c5b1cSMartin Matuska {
3146*c03c5b1cSMartin Matuska     ZSTD_CCtx_params const cctxParams =
3147*c03c5b1cSMartin Matuska             ZSTD_assignParamsToCCtxParams(&cctx->requestedParams, &params);
3148*c03c5b1cSMartin Matuska     return ZSTD_compressBegin_advanced_internal(cctx,
3149*c03c5b1cSMartin Matuska                                             dict, dictSize, ZSTD_dct_auto, ZSTD_dtlm_fast,
3150*c03c5b1cSMartin Matuska                                             NULL /*cdict*/,
3151*c03c5b1cSMartin Matuska                                             &cctxParams, pledgedSrcSize);
3152*c03c5b1cSMartin Matuska }
3153*c03c5b1cSMartin Matuska 
/*! ZSTD_compressBegin_usingDict() :
 *  Begins a frame of unknown content size at @compressionLevel, using the
 *  optional dictionary buffer @dict (content type auto-detected).
 *  Parameters are derived from the level and @dictSize.
 * @return : 0, or an error code */
size_t ZSTD_compressBegin_usingDict(ZSTD_CCtx* cctx, const void* dict, size_t dictSize, int compressionLevel)
{
    ZSTD_parameters const levelParams =
            ZSTD_getParams_internal(compressionLevel, ZSTD_CONTENTSIZE_UNKNOWN, dictSize);
    ZSTD_CCtx_params const beginParams =
            ZSTD_assignParamsToCCtxParams(&cctx->requestedParams, &levelParams);

    DEBUGLOG(4, "ZSTD_compressBegin_usingDict (dictSize=%u)", (unsigned)dictSize);

    return ZSTD_compressBegin_internal(
                cctx,
                dict, dictSize, ZSTD_dct_auto, ZSTD_dtlm_fast,
                NULL /* cdict */,
                &beginParams, ZSTD_CONTENTSIZE_UNKNOWN,
                ZSTDb_not_buffered);
}
3163*c03c5b1cSMartin Matuska 
/*! ZSTD_compressBegin() :
 *  Begins a frame at @compressionLevel without any dictionary.
 * @return : whatever ZSTD_compressBegin_usingDict() returns
 *           for a NULL dictionary of size 0 */
size_t ZSTD_compressBegin(ZSTD_CCtx* cctx, int compressionLevel)
{
    return ZSTD_compressBegin_usingDict(cctx,
                                        NULL /* dict */, 0 /* dictSize */,
                                        compressionLevel);
}
3168*c03c5b1cSMartin Matuska 
3169*c03c5b1cSMartin Matuska 
3170*c03c5b1cSMartin Matuska /*! ZSTD_writeEpilogue() :
3171*c03c5b1cSMartin Matuska *   Ends a frame.
3172*c03c5b1cSMartin Matuska *   @return : nb of bytes written into dst (or an error code) */
ZSTD_writeEpilogue(ZSTD_CCtx * cctx,void * dst,size_t dstCapacity)3173*c03c5b1cSMartin Matuska static size_t ZSTD_writeEpilogue(ZSTD_CCtx* cctx, void* dst, size_t dstCapacity)
3174*c03c5b1cSMartin Matuska {
3175*c03c5b1cSMartin Matuska     BYTE* const ostart = (BYTE*)dst;
3176*c03c5b1cSMartin Matuska     BYTE* op = ostart;
3177*c03c5b1cSMartin Matuska     size_t fhSize = 0;
3178*c03c5b1cSMartin Matuska 
3179*c03c5b1cSMartin Matuska     DEBUGLOG(4, "ZSTD_writeEpilogue");
3180*c03c5b1cSMartin Matuska     RETURN_ERROR_IF(cctx->stage == ZSTDcs_created, stage_wrong, "init missing");
3181*c03c5b1cSMartin Matuska 
3182*c03c5b1cSMartin Matuska     /* special case : empty frame */
3183*c03c5b1cSMartin Matuska     if (cctx->stage == ZSTDcs_init) {
3184*c03c5b1cSMartin Matuska         fhSize = ZSTD_writeFrameHeader(dst, dstCapacity, &cctx->appliedParams, 0, 0);
3185*c03c5b1cSMartin Matuska         FORWARD_IF_ERROR(fhSize, "ZSTD_writeFrameHeader failed");
3186*c03c5b1cSMartin Matuska         dstCapacity -= fhSize;
3187*c03c5b1cSMartin Matuska         op += fhSize;
3188*c03c5b1cSMartin Matuska         cctx->stage = ZSTDcs_ongoing;
3189*c03c5b1cSMartin Matuska     }
3190*c03c5b1cSMartin Matuska 
3191*c03c5b1cSMartin Matuska     if (cctx->stage != ZSTDcs_ending) {
3192*c03c5b1cSMartin Matuska         /* write one last empty block, make it the "last" block */
3193*c03c5b1cSMartin Matuska         U32 const cBlockHeader24 = 1 /* last block */ + (((U32)bt_raw)<<1) + 0;
3194*c03c5b1cSMartin Matuska         RETURN_ERROR_IF(dstCapacity<4, dstSize_tooSmall, "no room for epilogue");
3195*c03c5b1cSMartin Matuska         MEM_writeLE32(op, cBlockHeader24);
3196*c03c5b1cSMartin Matuska         op += ZSTD_blockHeaderSize;
3197*c03c5b1cSMartin Matuska         dstCapacity -= ZSTD_blockHeaderSize;
3198*c03c5b1cSMartin Matuska     }
3199*c03c5b1cSMartin Matuska 
3200*c03c5b1cSMartin Matuska     if (cctx->appliedParams.fParams.checksumFlag) {
3201*c03c5b1cSMartin Matuska         U32 const checksum = (U32) XXH64_digest(&cctx->xxhState);
3202*c03c5b1cSMartin Matuska         RETURN_ERROR_IF(dstCapacity<4, dstSize_tooSmall, "no room for checksum");
3203*c03c5b1cSMartin Matuska         DEBUGLOG(4, "ZSTD_writeEpilogue: write checksum : %08X", (unsigned)checksum);
3204*c03c5b1cSMartin Matuska         MEM_writeLE32(op, checksum);
3205*c03c5b1cSMartin Matuska         op += 4;
3206*c03c5b1cSMartin Matuska     }
3207*c03c5b1cSMartin Matuska 
3208*c03c5b1cSMartin Matuska     cctx->stage = ZSTDcs_created;  /* return to "created but no init" status */
3209*c03c5b1cSMartin Matuska     return op-ostart;
3210*c03c5b1cSMartin Matuska }
3211*c03c5b1cSMartin Matuska 
/*! ZSTD_compressEnd() :
 *  Compresses the final chunk @src of a frame into @dst, then appends the
 *  frame epilogue. When a source size was pledged
 *  (pledgedSrcSizePlusOne != 0), it is compared with the amount of input
 *  actually consumed and a mismatch is reported as srcSize_wrong.
 * @return : total nb of bytes written into dst (or an error code) */
size_t ZSTD_compressEnd (ZSTD_CCtx* cctx,
                         void* dst, size_t dstCapacity,
                   const void* src, size_t srcSize)
{
    size_t const cSize = ZSTD_compressContinue_internal(cctx,
                                dst, dstCapacity, src, srcSize,
                                1 /* frame mode */, 1 /* last chunk */);
    FORWARD_IF_ERROR(cSize, "ZSTD_compressContinue_internal failed");

    {   /* epilogue goes right behind the compressed payload */
        size_t const endResult =
                ZSTD_writeEpilogue(cctx, (char*)dst + cSize, dstCapacity-cSize);
        FORWARD_IF_ERROR(endResult, "ZSTD_writeEpilogue failed");

        assert(!(cctx->appliedParams.fParams.contentSizeFlag && cctx->pledgedSrcSizePlusOne == 0));
        if (cctx->pledgedSrcSizePlusOne != 0) {  /* control src size */
            ZSTD_STATIC_ASSERT(ZSTD_CONTENTSIZE_UNKNOWN == (unsigned long long)-1);
            DEBUGLOG(4, "end of frame : controlling src size");
            RETURN_ERROR_IF(
                cctx->pledgedSrcSizePlusOne != cctx->consumedSrcSize+1,
                srcSize_wrong,
                 "error : pledgedSrcSize = %u, while realSrcSize = %u",
                (unsigned)cctx->pledgedSrcSizePlusOne-1,
                (unsigned)cctx->consumedSrcSize);
        }

        return cSize + endResult;
    }
}
3236*c03c5b1cSMartin Matuska 
3237*c03c5b1cSMartin Matuska 
/*! ZSTD_compress_internal() :
 *  Merges @params into a copy of cctx->requestedParams and runs
 *  ZSTD_compress_advanced_internal() with the result.
 * @return : value returned by ZSTD_compress_advanced_internal() */
static size_t ZSTD_compress_internal (ZSTD_CCtx* cctx,
                                      void* dst, size_t dstCapacity,
                                const void* src, size_t srcSize,
                                const void* dict,size_t dictSize,
                                const ZSTD_parameters* params)
{
    ZSTD_CCtx_params const mergedParams =
            ZSTD_assignParamsToCCtxParams(&cctx->requestedParams, params);

    DEBUGLOG(4, "ZSTD_compress_internal");

    return ZSTD_compress_advanced_internal(cctx,
                dst, dstCapacity, src, srcSize, dict, dictSize,
                &mergedParams);
}
3253*c03c5b1cSMartin Matuska 
/*! ZSTD_compress_advanced() :
 *  Validates params.cParams, then forwards all arguments to
 *  ZSTD_compress_internal().
 * @return : value returned by ZSTD_compress_internal(),
 *           or the error code of the parameter check */
size_t ZSTD_compress_advanced (ZSTD_CCtx* cctx,
                               void* dst, size_t dstCapacity,
                         const void* src, size_t srcSize,
                         const void* dict,size_t dictSize,
                               ZSTD_parameters params)
{
    DEBUGLOG(4, "ZSTD_compress_advanced");

    /* invalid compression parameters are rejected up front */
    FORWARD_IF_ERROR(ZSTD_checkCParams(params.cParams), "");

    return ZSTD_compress_internal(cctx,
                dst, dstCapacity, src, srcSize, dict, dictSize,
                &params);
}
3268*c03c5b1cSMartin Matuska 
3269*c03c5b1cSMartin Matuska /* Internal */
ZSTD_compress_advanced_internal(ZSTD_CCtx * cctx,void * dst,size_t dstCapacity,const void * src,size_t srcSize,const void * dict,size_t dictSize,const ZSTD_CCtx_params * params)3270*c03c5b1cSMartin Matuska size_t ZSTD_compress_advanced_internal(
3271*c03c5b1cSMartin Matuska         ZSTD_CCtx* cctx,
3272*c03c5b1cSMartin Matuska         void* dst, size_t dstCapacity,
3273*c03c5b1cSMartin Matuska         const void* src, size_t srcSize,
3274*c03c5b1cSMartin Matuska         const void* dict,size_t dictSize,
3275*c03c5b1cSMartin Matuska         const ZSTD_CCtx_params* params)
3276*c03c5b1cSMartin Matuska {
3277*c03c5b1cSMartin Matuska     DEBUGLOG(4, "ZSTD_compress_advanced_internal (srcSize:%u)", (unsigned)srcSize);
3278*c03c5b1cSMartin Matuska     FORWARD_IF_ERROR( ZSTD_compressBegin_internal(cctx,
3279*c03c5b1cSMartin Matuska                          dict, dictSize, ZSTD_dct_auto, ZSTD_dtlm_fast, NULL,
3280*c03c5b1cSMartin Matuska                          params, srcSize, ZSTDb_not_buffered) , "");
3281*c03c5b1cSMartin Matuska     return ZSTD_compressEnd(cctx, dst, dstCapacity, src, srcSize);
3282*c03c5b1cSMartin Matuska }
3283*c03c5b1cSMartin Matuska 
/*! ZSTD_compress_usingDict() :
 *  Single-shot compression at @compressionLevel with an optional dictionary
 *  buffer. Parameters are derived from the level, @srcSize and the
 *  dictionary size (taken as 0 when @dict is NULL).
 * @return : value returned by ZSTD_compress_advanced_internal() */
size_t ZSTD_compress_usingDict(ZSTD_CCtx* cctx,
                               void* dst, size_t dstCapacity,
                         const void* src, size_t srcSize,
                         const void* dict, size_t dictSize,
                               int compressionLevel)
{
    ZSTD_parameters const params =
            ZSTD_getParams_internal(compressionLevel, srcSize, dict ? dictSize : 0);
    ZSTD_CCtx_params mergedParams =
            ZSTD_assignParamsToCCtxParams(&cctx->requestedParams, &params);

    DEBUGLOG(4, "ZSTD_compress_usingDict (srcSize=%u)", (unsigned)srcSize);
    assert(params.fParams.contentSizeFlag == 1);

    return ZSTD_compress_advanced_internal(cctx,
                dst, dstCapacity,
                src, srcSize,
                dict, dictSize,
                &mergedParams);
}
3296*c03c5b1cSMartin Matuska 
/*! ZSTD_compressCCtx() :
 *  Single-shot compression at @compressionLevel with a caller-provided
 *  context and no dictionary. @cctx must not be NULL.
 * @return : value returned by ZSTD_compress_usingDict() */
size_t ZSTD_compressCCtx(ZSTD_CCtx* cctx,
                         void* dst, size_t dstCapacity,
                   const void* src, size_t srcSize,
                         int compressionLevel)
{
    DEBUGLOG(4, "ZSTD_compressCCtx (srcSize=%u)", (unsigned)srcSize);
    assert(cctx != NULL);

    return ZSTD_compress_usingDict(cctx,
                dst, dstCapacity,
                src, srcSize,
                NULL /* dict */, 0 /* dictSize */,
                compressionLevel);
}
3306*c03c5b1cSMartin Matuska 
ZSTD_compress(void * dst,size_t dstCapacity,const void * src,size_t srcSize,int compressionLevel)3307*c03c5b1cSMartin Matuska size_t ZSTD_compress(void* dst, size_t dstCapacity,
3308*c03c5b1cSMartin Matuska                const void* src, size_t srcSize,
3309*c03c5b1cSMartin Matuska                      int compressionLevel)
3310*c03c5b1cSMartin Matuska {
3311*c03c5b1cSMartin Matuska     size_t result;
3312*c03c5b1cSMartin Matuska     ZSTD_CCtx ctxBody;
3313*c03c5b1cSMartin Matuska     ZSTD_initCCtx(&ctxBody, ZSTD_defaultCMem);
3314*c03c5b1cSMartin Matuska     result = ZSTD_compressCCtx(&ctxBody, dst, dstCapacity, src, srcSize, compressionLevel);
3315*c03c5b1cSMartin Matuska     ZSTD_freeCCtxContent(&ctxBody);   /* can't free ctxBody itself, as it's on stack; free only heap content */
3316*c03c5b1cSMartin Matuska     return result;
3317*c03c5b1cSMartin Matuska }
3318*c03c5b1cSMartin Matuska 
3319*c03c5b1cSMartin Matuska 
3320*c03c5b1cSMartin Matuska /* =====  Dictionary API  ===== */
3321*c03c5b1cSMartin Matuska 
3322*c03c5b1cSMartin Matuska /*! ZSTD_estimateCDictSize_advanced() :
3323*c03c5b1cSMartin Matuska  *  Estimate amount of memory that will be needed to create a dictionary with following arguments */
ZSTD_estimateCDictSize_advanced(size_t dictSize,ZSTD_compressionParameters cParams,ZSTD_dictLoadMethod_e dictLoadMethod)3324*c03c5b1cSMartin Matuska size_t ZSTD_estimateCDictSize_advanced(
3325*c03c5b1cSMartin Matuska         size_t dictSize, ZSTD_compressionParameters cParams,
3326*c03c5b1cSMartin Matuska         ZSTD_dictLoadMethod_e dictLoadMethod)
3327*c03c5b1cSMartin Matuska {
3328*c03c5b1cSMartin Matuska     DEBUGLOG(5, "sizeof(ZSTD_CDict) : %u", (unsigned)sizeof(ZSTD_CDict));
3329*c03c5b1cSMartin Matuska     return ZSTD_cwksp_alloc_size(sizeof(ZSTD_CDict))
3330*c03c5b1cSMartin Matuska          + ZSTD_cwksp_alloc_size(HUF_WORKSPACE_SIZE)
3331*c03c5b1cSMartin Matuska          + ZSTD_sizeof_matchState(&cParams, /* forCCtx */ 0)
3332*c03c5b1cSMartin Matuska          + (dictLoadMethod == ZSTD_dlm_byRef ? 0
3333*c03c5b1cSMartin Matuska             : ZSTD_cwksp_alloc_size(ZSTD_cwksp_align(dictSize, sizeof(void *))));
3334*c03c5b1cSMartin Matuska }
3335*c03c5b1cSMartin Matuska 
ZSTD_estimateCDictSize(size_t dictSize,int compressionLevel)3336*c03c5b1cSMartin Matuska size_t ZSTD_estimateCDictSize(size_t dictSize, int compressionLevel)
3337*c03c5b1cSMartin Matuska {
3338*c03c5b1cSMartin Matuska     ZSTD_compressionParameters const cParams = ZSTD_getCParams_internal(compressionLevel, ZSTD_CONTENTSIZE_UNKNOWN, dictSize);
3339*c03c5b1cSMartin Matuska     return ZSTD_estimateCDictSize_advanced(dictSize, cParams, ZSTD_dlm_byCopy);
3340*c03c5b1cSMartin Matuska }
3341*c03c5b1cSMartin Matuska 
ZSTD_sizeof_CDict(const ZSTD_CDict * cdict)3342*c03c5b1cSMartin Matuska size_t ZSTD_sizeof_CDict(const ZSTD_CDict* cdict)
3343*c03c5b1cSMartin Matuska {
3344*c03c5b1cSMartin Matuska     if (cdict==NULL) return 0;   /* support sizeof on NULL */
3345*c03c5b1cSMartin Matuska     DEBUGLOG(5, "sizeof(*cdict) : %u", (unsigned)sizeof(*cdict));
3346*c03c5b1cSMartin Matuska     /* cdict may be in the workspace */
3347*c03c5b1cSMartin Matuska     return (cdict->workspace.workspace == cdict ? 0 : sizeof(*cdict))
3348*c03c5b1cSMartin Matuska         + ZSTD_cwksp_sizeof(&cdict->workspace);
3349*c03c5b1cSMartin Matuska }
3350*c03c5b1cSMartin Matuska 
/*! ZSTD_initCDict_internal() :
 *  Fills an already-allocated @cdict whose workspace is set up :
 *   1. records @cParams in the match state,
 *   2. references @dictBuffer, or copies it into the workspace when the
 *      load method is not by-reference and the buffer is non-NULL and
 *      non-empty,
 *   3. reserves the entropy workspace,
 *   4. resets the compressed-block state and the match state,
 *   5. inserts the dictionary and stores the resulting dictID.
 * @return : 0, or an error code */
static size_t ZSTD_initCDict_internal(
                    ZSTD_CDict* cdict,
              const void* dictBuffer, size_t dictSize,
                    ZSTD_dictLoadMethod_e dictLoadMethod,
                    ZSTD_dictContentType_e dictContentType,
                    ZSTD_compressionParameters cParams)
{
    DEBUGLOG(3, "ZSTD_initCDict_internal (dictContentType:%u)", (unsigned)dictContentType);
    assert(!ZSTD_checkCParams(cParams));
    cdict->matchState.cParams = cParams;

    {   /* a private copy is made only for a real, by-copy dictionary */
        int const mustCopy = (dictLoadMethod != ZSTD_dlm_byRef)
                          && (dictBuffer != NULL)
                          && (dictSize != 0);
        if (mustCopy) {
            void* const internalBuffer = ZSTD_cwksp_reserve_object(
                    &cdict->workspace, ZSTD_cwksp_align(dictSize, sizeof(void*)));
            RETURN_ERROR_IF(!internalBuffer, memory_allocation, "NULL pointer!");
            cdict->dictContent = internalBuffer;
            memcpy(internalBuffer, dictBuffer, dictSize);
        } else {
            cdict->dictContent = dictBuffer;
        }
    }
    cdict->dictContentSize = dictSize;

    cdict->entropyWorkspace =
            (U32*)ZSTD_cwksp_reserve_object(&cdict->workspace, HUF_WORKSPACE_SIZE);

    /* Reset the state to no dictionary */
    ZSTD_reset_compressedBlockState(&cdict->cBlockState);
    FORWARD_IF_ERROR(ZSTD_reset_matchState(
        &cdict->matchState,
        &cdict->workspace,
        &cParams,
        ZSTDcrp_makeClean,
        ZSTDirp_reset,
        ZSTD_resetTarget_CDict), "");

    /* (Maybe) load the dictionary
     * Skips loading the dictionary if it is < 8 bytes.
     */
    {   ZSTD_CCtx_params loadParams;
        size_t dictID;

        memset(&loadParams, 0, sizeof(loadParams));
        loadParams.compressionLevel = ZSTD_CLEVEL_DEFAULT;
        loadParams.fParams.contentSizeFlag = 1;
        loadParams.cParams = cParams;

        dictID = ZSTD_compress_insertDictionary(
                    &cdict->cBlockState, &cdict->matchState, NULL, &cdict->workspace,
                    &loadParams, cdict->dictContent, cdict->dictContentSize,
                    dictContentType, ZSTD_dtlm_full, cdict->entropyWorkspace);
        FORWARD_IF_ERROR(dictID, "ZSTD_compress_insertDictionary failed");
        assert(dictID <= (size_t)(U32)-1);
        cdict->dictID = (U32)dictID;
    }

    return 0;
}
3403*c03c5b1cSMartin Matuska 
ZSTD_createCDict_advanced(const void * dictBuffer,size_t dictSize,ZSTD_dictLoadMethod_e dictLoadMethod,ZSTD_dictContentType_e dictContentType,ZSTD_compressionParameters cParams,ZSTD_customMem customMem)3404*c03c5b1cSMartin Matuska ZSTD_CDict* ZSTD_createCDict_advanced(const void* dictBuffer, size_t dictSize,
3405*c03c5b1cSMartin Matuska                                       ZSTD_dictLoadMethod_e dictLoadMethod,
3406*c03c5b1cSMartin Matuska                                       ZSTD_dictContentType_e dictContentType,
3407*c03c5b1cSMartin Matuska                                       ZSTD_compressionParameters cParams, ZSTD_customMem customMem)
3408*c03c5b1cSMartin Matuska {
3409*c03c5b1cSMartin Matuska     DEBUGLOG(3, "ZSTD_createCDict_advanced, mode %u", (unsigned)dictContentType);
3410*c03c5b1cSMartin Matuska     if (!customMem.customAlloc ^ !customMem.customFree) return NULL;
3411*c03c5b1cSMartin Matuska 
3412*c03c5b1cSMartin Matuska     {   size_t const workspaceSize =
3413*c03c5b1cSMartin Matuska             ZSTD_cwksp_alloc_size(sizeof(ZSTD_CDict)) +
3414*c03c5b1cSMartin Matuska             ZSTD_cwksp_alloc_size(HUF_WORKSPACE_SIZE) +
3415*c03c5b1cSMartin Matuska             ZSTD_sizeof_matchState(&cParams, /* forCCtx */ 0) +
3416*c03c5b1cSMartin Matuska             (dictLoadMethod == ZSTD_dlm_byRef ? 0
3417*c03c5b1cSMartin Matuska              : ZSTD_cwksp_alloc_size(ZSTD_cwksp_align(dictSize, sizeof(void*))));
3418*c03c5b1cSMartin Matuska         void* const workspace = ZSTD_malloc(workspaceSize, customMem);
3419*c03c5b1cSMartin Matuska         ZSTD_cwksp ws;
3420*c03c5b1cSMartin Matuska         ZSTD_CDict* cdict;
3421*c03c5b1cSMartin Matuska 
3422*c03c5b1cSMartin Matuska         if (!workspace) {
3423*c03c5b1cSMartin Matuska             ZSTD_free(workspace, customMem);
3424*c03c5b1cSMartin Matuska             return NULL;
3425*c03c5b1cSMartin Matuska         }
3426*c03c5b1cSMartin Matuska 
3427*c03c5b1cSMartin Matuska         ZSTD_cwksp_init(&ws, workspace, workspaceSize);
3428*c03c5b1cSMartin Matuska 
3429*c03c5b1cSMartin Matuska         cdict = (ZSTD_CDict*)ZSTD_cwksp_reserve_object(&ws, sizeof(ZSTD_CDict));
3430*c03c5b1cSMartin Matuska         assert(cdict != NULL);
3431*c03c5b1cSMartin Matuska         ZSTD_cwksp_move(&cdict->workspace, &ws);
3432*c03c5b1cSMartin Matuska         cdict->customMem = customMem;
3433*c03c5b1cSMartin Matuska         cdict->compressionLevel = 0; /* signals advanced API usage */
3434*c03c5b1cSMartin Matuska 
3435*c03c5b1cSMartin Matuska         if (ZSTD_isError( ZSTD_initCDict_internal(cdict,
3436*c03c5b1cSMartin Matuska                                         dictBuffer, dictSize,
3437*c03c5b1cSMartin Matuska                                         dictLoadMethod, dictContentType,
3438*c03c5b1cSMartin Matuska                                         cParams) )) {
3439*c03c5b1cSMartin Matuska             ZSTD_freeCDict(cdict);
3440*c03c5b1cSMartin Matuska             return NULL;
3441*c03c5b1cSMartin Matuska         }
3442*c03c5b1cSMartin Matuska 
3443*c03c5b1cSMartin Matuska         return cdict;
3444*c03c5b1cSMartin Matuska     }
3445*c03c5b1cSMartin Matuska }
3446*c03c5b1cSMartin Matuska 
ZSTD_createCDict(const void * dict,size_t dictSize,int compressionLevel)3447*c03c5b1cSMartin Matuska ZSTD_CDict* ZSTD_createCDict(const void* dict, size_t dictSize, int compressionLevel)
3448*c03c5b1cSMartin Matuska {
3449*c03c5b1cSMartin Matuska     ZSTD_compressionParameters cParams = ZSTD_getCParams_internal(compressionLevel, ZSTD_CONTENTSIZE_UNKNOWN, dictSize);
3450*c03c5b1cSMartin Matuska     ZSTD_CDict* cdict = ZSTD_createCDict_advanced(dict, dictSize,
3451*c03c5b1cSMartin Matuska                                                   ZSTD_dlm_byCopy, ZSTD_dct_auto,
3452*c03c5b1cSMartin Matuska                                                   cParams, ZSTD_defaultCMem);
3453*c03c5b1cSMartin Matuska     if (cdict)
3454*c03c5b1cSMartin Matuska         cdict->compressionLevel = compressionLevel == 0 ? ZSTD_CLEVEL_DEFAULT : compressionLevel;
3455*c03c5b1cSMartin Matuska     return cdict;
3456*c03c5b1cSMartin Matuska }
3457*c03c5b1cSMartin Matuska 
ZSTD_createCDict_byReference(const void * dict,size_t dictSize,int compressionLevel)3458*c03c5b1cSMartin Matuska ZSTD_CDict* ZSTD_createCDict_byReference(const void* dict, size_t dictSize, int compressionLevel)
3459*c03c5b1cSMartin Matuska {
3460*c03c5b1cSMartin Matuska     ZSTD_compressionParameters cParams = ZSTD_getCParams_internal(compressionLevel, ZSTD_CONTENTSIZE_UNKNOWN, dictSize);
3461*c03c5b1cSMartin Matuska     return ZSTD_createCDict_advanced(dict, dictSize,
3462*c03c5b1cSMartin Matuska                                      ZSTD_dlm_byRef, ZSTD_dct_auto,
3463*c03c5b1cSMartin Matuska                                      cParams, ZSTD_defaultCMem);
3464*c03c5b1cSMartin Matuska }
3465*c03c5b1cSMartin Matuska 
/*! ZSTD_freeCDict() :
 *  Releases the cdict's workspace with the cdict's own allocator, and the
 *  structure itself when the workspace does not own it.
 *  Accepts NULL.
 * @return : 0 */
size_t ZSTD_freeCDict(ZSTD_CDict* cdict)
{
    if (cdict==NULL) return 0;   /* support free on NULL */

    {   ZSTD_customMem const cMem = cdict->customMem;
        /* ownership is queried before the workspace is released */
        int const ownedByWorkspace = ZSTD_cwksp_owns_buffer(&cdict->workspace, cdict);

        ZSTD_cwksp_free(&cdict->workspace, cMem);
        if (ownedByWorkspace) return 0;

        /* structure was allocated separately from its workspace */
        ZSTD_free(cdict, cMem);
    }
    return 0;
}
3478*c03c5b1cSMartin Matuska 
/*! ZSTD_initStaticCDict() :
 *  Generate a digested dictionary in provided memory area.
 *  workspace: The memory area to emplace the dictionary into.
 *             Provided pointer must be 8-byte aligned.
 *             It must outlive dictionary usage.
 *  workspaceSize: Use ZSTD_estimateCDictSize()
 *                 to determine how large workspace must be.
 *  cParams : use ZSTD_getCParams() to transform a compression level
 *            into its relevant cParams.
 * @return : pointer to ZSTD_CDict, or NULL if error (size too small)
 *  Note : there is no corresponding "free" function.
 *         Since workspace was allocated externally, it must be freed externally.
 */
ZSTD_initStaticCDict(void * workspace,size_t workspaceSize,const void * dict,size_t dictSize,ZSTD_dictLoadMethod_e dictLoadMethod,ZSTD_dictContentType_e dictContentType,ZSTD_compressionParameters cParams)3492*c03c5b1cSMartin Matuska const ZSTD_CDict* ZSTD_initStaticCDict(
3493*c03c5b1cSMartin Matuska                                  void* workspace, size_t workspaceSize,
3494*c03c5b1cSMartin Matuska                            const void* dict, size_t dictSize,
3495*c03c5b1cSMartin Matuska                                  ZSTD_dictLoadMethod_e dictLoadMethod,
3496*c03c5b1cSMartin Matuska                                  ZSTD_dictContentType_e dictContentType,
3497*c03c5b1cSMartin Matuska                                  ZSTD_compressionParameters cParams)
3498*c03c5b1cSMartin Matuska {
3499*c03c5b1cSMartin Matuska     size_t const matchStateSize = ZSTD_sizeof_matchState(&cParams, /* forCCtx */ 0);
3500*c03c5b1cSMartin Matuska     size_t const neededSize = ZSTD_cwksp_alloc_size(sizeof(ZSTD_CDict))
3501*c03c5b1cSMartin Matuska                             + (dictLoadMethod == ZSTD_dlm_byRef ? 0
3502*c03c5b1cSMartin Matuska                                : ZSTD_cwksp_alloc_size(ZSTD_cwksp_align(dictSize, sizeof(void*))))
3503*c03c5b1cSMartin Matuska                             + ZSTD_cwksp_alloc_size(HUF_WORKSPACE_SIZE)
3504*c03c5b1cSMartin Matuska                             + matchStateSize;
3505*c03c5b1cSMartin Matuska     ZSTD_CDict* cdict;
3506*c03c5b1cSMartin Matuska 
3507*c03c5b1cSMartin Matuska     if ((size_t)workspace & 7) return NULL;  /* 8-aligned */
3508*c03c5b1cSMartin Matuska 
3509*c03c5b1cSMartin Matuska     {
3510*c03c5b1cSMartin Matuska         ZSTD_cwksp ws;
3511*c03c5b1cSMartin Matuska         ZSTD_cwksp_init(&ws, workspace, workspaceSize);
3512*c03c5b1cSMartin Matuska         cdict = (ZSTD_CDict*)ZSTD_cwksp_reserve_object(&ws, sizeof(ZSTD_CDict));
3513*c03c5b1cSMartin Matuska         if (cdict == NULL) return NULL;
3514*c03c5b1cSMartin Matuska         ZSTD_cwksp_move(&cdict->workspace, &ws);
3515*c03c5b1cSMartin Matuska     }
3516*c03c5b1cSMartin Matuska 
3517*c03c5b1cSMartin Matuska     DEBUGLOG(4, "(workspaceSize < neededSize) : (%u < %u) => %u",
3518*c03c5b1cSMartin Matuska         (unsigned)workspaceSize, (unsigned)neededSize, (unsigned)(workspaceSize < neededSize));
3519*c03c5b1cSMartin Matuska     if (workspaceSize < neededSize) return NULL;
3520*c03c5b1cSMartin Matuska 
3521*c03c5b1cSMartin Matuska     if (ZSTD_isError( ZSTD_initCDict_internal(cdict,
3522*c03c5b1cSMartin Matuska                                               dict, dictSize,
3523*c03c5b1cSMartin Matuska                                               dictLoadMethod, dictContentType,
3524*c03c5b1cSMartin Matuska                                               cParams) ))
3525*c03c5b1cSMartin Matuska         return NULL;
3526*c03c5b1cSMartin Matuska 
3527*c03c5b1cSMartin Matuska     return cdict;
3528*c03c5b1cSMartin Matuska }
3529*c03c5b1cSMartin Matuska 
ZSTD_getCParamsFromCDict(const ZSTD_CDict * cdict)3530*c03c5b1cSMartin Matuska ZSTD_compressionParameters ZSTD_getCParamsFromCDict(const ZSTD_CDict* cdict)
3531*c03c5b1cSMartin Matuska {
3532*c03c5b1cSMartin Matuska     assert(cdict != NULL);
3533*c03c5b1cSMartin Matuska     return cdict->matchState.cParams;
3534*c03c5b1cSMartin Matuska }
3535*c03c5b1cSMartin Matuska 
3536*c03c5b1cSMartin Matuska /* ZSTD_compressBegin_usingCDict_advanced() :
3537*c03c5b1cSMartin Matuska  * cdict must be != NULL */
ZSTD_compressBegin_usingCDict_advanced(ZSTD_CCtx * const cctx,const ZSTD_CDict * const cdict,ZSTD_frameParameters const fParams,unsigned long long const pledgedSrcSize)3538*c03c5b1cSMartin Matuska size_t ZSTD_compressBegin_usingCDict_advanced(
3539*c03c5b1cSMartin Matuska     ZSTD_CCtx* const cctx, const ZSTD_CDict* const cdict,
3540*c03c5b1cSMartin Matuska     ZSTD_frameParameters const fParams, unsigned long long const pledgedSrcSize)
3541*c03c5b1cSMartin Matuska {
3542*c03c5b1cSMartin Matuska     DEBUGLOG(4, "ZSTD_compressBegin_usingCDict_advanced");
3543*c03c5b1cSMartin Matuska     RETURN_ERROR_IF(cdict==NULL, dictionary_wrong, "NULL pointer!");
3544*c03c5b1cSMartin Matuska     {   ZSTD_CCtx_params params = cctx->requestedParams;
3545*c03c5b1cSMartin Matuska         params.cParams = ( pledgedSrcSize < ZSTD_USE_CDICT_PARAMS_SRCSIZE_CUTOFF
3546*c03c5b1cSMartin Matuska                         || pledgedSrcSize < cdict->dictContentSize * ZSTD_USE_CDICT_PARAMS_DICTSIZE_MULTIPLIER
3547*c03c5b1cSMartin Matuska                         || pledgedSrcSize == ZSTD_CONTENTSIZE_UNKNOWN
3548*c03c5b1cSMartin Matuska                         || cdict->compressionLevel == 0 )
3549*c03c5b1cSMartin Matuska                       && (params.attachDictPref != ZSTD_dictForceLoad) ?
3550*c03c5b1cSMartin Matuska                 ZSTD_getCParamsFromCDict(cdict)
3551*c03c5b1cSMartin Matuska               : ZSTD_getCParams(cdict->compressionLevel,
3552*c03c5b1cSMartin Matuska                                 pledgedSrcSize,
3553*c03c5b1cSMartin Matuska                                 cdict->dictContentSize);
3554*c03c5b1cSMartin Matuska         /* Increase window log to fit the entire dictionary and source if the
3555*c03c5b1cSMartin Matuska          * source size is known. Limit the increase to 19, which is the
3556*c03c5b1cSMartin Matuska          * window log for compression level 1 with the largest source size.
3557*c03c5b1cSMartin Matuska          */
3558*c03c5b1cSMartin Matuska         if (pledgedSrcSize != ZSTD_CONTENTSIZE_UNKNOWN) {
3559*c03c5b1cSMartin Matuska             U32 const limitedSrcSize = (U32)MIN(pledgedSrcSize, 1U << 19);
3560*c03c5b1cSMartin Matuska             U32 const limitedSrcLog = limitedSrcSize > 1 ? ZSTD_highbit32(limitedSrcSize - 1) + 1 : 1;
3561*c03c5b1cSMartin Matuska             params.cParams.windowLog = MAX(params.cParams.windowLog, limitedSrcLog);
3562*c03c5b1cSMartin Matuska         }
3563*c03c5b1cSMartin Matuska         params.fParams = fParams;
3564*c03c5b1cSMartin Matuska         return ZSTD_compressBegin_internal(cctx,
3565*c03c5b1cSMartin Matuska                                            NULL, 0, ZSTD_dct_auto, ZSTD_dtlm_fast,
3566*c03c5b1cSMartin Matuska                                            cdict,
3567*c03c5b1cSMartin Matuska                                            &params, pledgedSrcSize,
3568*c03c5b1cSMartin Matuska                                            ZSTDb_not_buffered);
3569*c03c5b1cSMartin Matuska     }
3570*c03c5b1cSMartin Matuska }
3571*c03c5b1cSMartin Matuska 
3572*c03c5b1cSMartin Matuska /* ZSTD_compressBegin_usingCDict() :
3573*c03c5b1cSMartin Matuska  * pledgedSrcSize=0 means "unknown"
3574*c03c5b1cSMartin Matuska  * if pledgedSrcSize>0, it will enable contentSizeFlag */
ZSTD_compressBegin_usingCDict(ZSTD_CCtx * cctx,const ZSTD_CDict * cdict)3575*c03c5b1cSMartin Matuska size_t ZSTD_compressBegin_usingCDict(ZSTD_CCtx* cctx, const ZSTD_CDict* cdict)
3576*c03c5b1cSMartin Matuska {
3577*c03c5b1cSMartin Matuska     ZSTD_frameParameters const fParams = { 0 /*content*/, 0 /*checksum*/, 0 /*noDictID*/ };
3578*c03c5b1cSMartin Matuska     DEBUGLOG(4, "ZSTD_compressBegin_usingCDict : dictIDFlag == %u", !fParams.noDictIDFlag);
3579*c03c5b1cSMartin Matuska     return ZSTD_compressBegin_usingCDict_advanced(cctx, cdict, fParams, ZSTD_CONTENTSIZE_UNKNOWN);
3580*c03c5b1cSMartin Matuska }
3581*c03c5b1cSMartin Matuska 
/* ZSTD_compress_usingCDict_advanced() :
 * One-shot compression of `src` into `dst` using `cdict` and caller-selected
 * frame parameters. srcSize is passed as the pledged source size.
 * @return : result of ZSTD_compressEnd(), or the error forwarded from
 *           ZSTD_compressBegin_usingCDict_advanced() */
size_t ZSTD_compress_usingCDict_advanced(ZSTD_CCtx* cctx,
                                void* dst, size_t dstCapacity,
                                const void* src, size_t srcSize,
                                const ZSTD_CDict* cdict, ZSTD_frameParameters fParams)
{
    /* the begin stage is the one that checks cdict != NULL */
    FORWARD_IF_ERROR(ZSTD_compressBegin_usingCDict_advanced(cctx, cdict, fParams, srcSize), "");
    {   size_t const frameSize = ZSTD_compressEnd(cctx, dst, dstCapacity, src, srcSize);
        return frameSize;
    }
}
3590*c03c5b1cSMartin Matuska 
3591*c03c5b1cSMartin Matuska /*! ZSTD_compress_usingCDict() :
3592*c03c5b1cSMartin Matuska  *  Compression using a digested Dictionary.
3593*c03c5b1cSMartin Matuska  *  Faster startup than ZSTD_compress_usingDict(), recommended when same dictionary is used multiple times.
3594*c03c5b1cSMartin Matuska  *  Note that compression parameters are decided at CDict creation time
3595*c03c5b1cSMartin Matuska  *  while frame parameters are hardcoded */
ZSTD_compress_usingCDict(ZSTD_CCtx * cctx,void * dst,size_t dstCapacity,const void * src,size_t srcSize,const ZSTD_CDict * cdict)3596*c03c5b1cSMartin Matuska size_t ZSTD_compress_usingCDict(ZSTD_CCtx* cctx,
3597*c03c5b1cSMartin Matuska                                 void* dst, size_t dstCapacity,
3598*c03c5b1cSMartin Matuska                                 const void* src, size_t srcSize,
3599*c03c5b1cSMartin Matuska                                 const ZSTD_CDict* cdict)
3600*c03c5b1cSMartin Matuska {
3601*c03c5b1cSMartin Matuska     ZSTD_frameParameters const fParams = { 1 /*content*/, 0 /*checksum*/, 0 /*noDictID*/ };
3602*c03c5b1cSMartin Matuska     return ZSTD_compress_usingCDict_advanced(cctx, dst, dstCapacity, src, srcSize, cdict, fParams);
3603*c03c5b1cSMartin Matuska }
3604*c03c5b1cSMartin Matuska 
3605*c03c5b1cSMartin Matuska 
3606*c03c5b1cSMartin Matuska 
3607*c03c5b1cSMartin Matuska /* ******************************************************************
3608*c03c5b1cSMartin Matuska *  Streaming
3609*c03c5b1cSMartin Matuska ********************************************************************/
3610*c03c5b1cSMartin Matuska 
ZSTD_createCStream(void)3611*c03c5b1cSMartin Matuska ZSTD_CStream* ZSTD_createCStream(void)
3612*c03c5b1cSMartin Matuska {
3613*c03c5b1cSMartin Matuska     DEBUGLOG(3, "ZSTD_createCStream");
3614*c03c5b1cSMartin Matuska     return ZSTD_createCStream_advanced(ZSTD_defaultCMem);
3615*c03c5b1cSMartin Matuska }
3616*c03c5b1cSMartin Matuska 
ZSTD_initStaticCStream(void * workspace,size_t workspaceSize)3617*c03c5b1cSMartin Matuska ZSTD_CStream* ZSTD_initStaticCStream(void *workspace, size_t workspaceSize)
3618*c03c5b1cSMartin Matuska {
3619*c03c5b1cSMartin Matuska     return ZSTD_initStaticCCtx(workspace, workspaceSize);
3620*c03c5b1cSMartin Matuska }
3621*c03c5b1cSMartin Matuska 
ZSTD_createCStream_advanced(ZSTD_customMem customMem)3622*c03c5b1cSMartin Matuska ZSTD_CStream* ZSTD_createCStream_advanced(ZSTD_customMem customMem)
3623*c03c5b1cSMartin Matuska {   /* CStream and CCtx are now same object */
3624*c03c5b1cSMartin Matuska     return ZSTD_createCCtx_advanced(customMem);
3625*c03c5b1cSMartin Matuska }
3626*c03c5b1cSMartin Matuska 
/* ZSTD_freeCStream() :
 * CStream and CCtx are the same object : release is delegated to ZSTD_freeCCtx().
 * @return : result of ZSTD_freeCCtx() */
size_t ZSTD_freeCStream(ZSTD_CStream* zcs)
{
    size_t const freeResult = ZSTD_freeCCtx(zcs);   /* same object */
    return freeResult;
}
3631*c03c5b1cSMartin Matuska 
3632*c03c5b1cSMartin Matuska 
3633*c03c5b1cSMartin Matuska 
3634*c03c5b1cSMartin Matuska /*======   Initialization   ======*/
3635*c03c5b1cSMartin Matuska 
ZSTD_CStreamInSize(void)3636*c03c5b1cSMartin Matuska size_t ZSTD_CStreamInSize(void)  { return ZSTD_BLOCKSIZE_MAX; }
3637*c03c5b1cSMartin Matuska 
ZSTD_CStreamOutSize(void)3638*c03c5b1cSMartin Matuska size_t ZSTD_CStreamOutSize(void)
3639*c03c5b1cSMartin Matuska {
3640*c03c5b1cSMartin Matuska     return ZSTD_compressBound(ZSTD_BLOCKSIZE_MAX) + ZSTD_blockHeaderSize + 4 /* 32-bits hash */ ;
3641*c03c5b1cSMartin Matuska }
3642*c03c5b1cSMartin Matuska 
/* ZSTD_resetCStream_internal() :
 * Finalizes cParams on the local copy of `params`, begins a buffered
 * compression session, then resets the streaming bookkeeping fields of `cctx`.
 * Either dict or cdict may be provided, not both (asserted).
 * @return : 0, or the error forwarded from ZSTD_compressBegin_internal() */
static size_t ZSTD_resetCStream_internal(ZSTD_CStream* cctx,
                    const void* const dict, size_t const dictSize, ZSTD_dictContentType_e const dictContentType,
                    const ZSTD_CDict* const cdict,
                    ZSTD_CCtx_params params, unsigned long long const pledgedSrcSize)
{
    DEBUGLOG(4, "ZSTD_resetCStream_internal");
    /* Finalize the compression parameters */
    params.cParams = ZSTD_getCParamsFromCCtxParams(&params, pledgedSrcSize, dictSize);
    /* params are supposed to be fully validated at this point */
    assert(!ZSTD_isError(ZSTD_checkCParams(params.cParams)));
    assert(!((dict) && (cdict)));  /* either dict or cdict, not both */

    FORWARD_IF_ERROR(ZSTD_compressBegin_internal(cctx,
                                         dict, dictSize, dictContentType, ZSTD_dtlm_fast,
                                         cdict,
                                         &params, pledgedSrcSize,
                                         ZSTDb_buffered), "");

    /* streaming state : nothing buffered yet, frame not ended */
    cctx->streamStage = zcss_load;
    cctx->frameEnded = 0;
    cctx->outBuffFlushedSize = 0;
    cctx->outBuffContentSize = 0;
    cctx->inBuffPos = 0;
    cctx->inToCompress = 0;
    {   size_t const blockSize = cctx->blockSize;
        /* for small input: avoid automatic flush on reaching end of block,
         * since it would require to add a 3-bytes null block to end frame */
        cctx->inBuffTarget = blockSize + (blockSize == pledgedSrcSize);
    }
    return 0;   /* ready to go */
}
3670*c03c5b1cSMartin Matuska 
3671*c03c5b1cSMartin Matuska /* ZSTD_resetCStream():
3672*c03c5b1cSMartin Matuska  * pledgedSrcSize == 0 means "unknown" */
ZSTD_resetCStream(ZSTD_CStream * zcs,unsigned long long pss)3673*c03c5b1cSMartin Matuska size_t ZSTD_resetCStream(ZSTD_CStream* zcs, unsigned long long pss)
3674*c03c5b1cSMartin Matuska {
3675*c03c5b1cSMartin Matuska     /* temporary : 0 interpreted as "unknown" during transition period.
3676*c03c5b1cSMartin Matuska      * Users willing to specify "unknown" **must** use ZSTD_CONTENTSIZE_UNKNOWN.
3677*c03c5b1cSMartin Matuska      * 0 will be interpreted as "empty" in the future.
3678*c03c5b1cSMartin Matuska      */
3679*c03c5b1cSMartin Matuska     U64 const pledgedSrcSize = (pss==0) ? ZSTD_CONTENTSIZE_UNKNOWN : pss;
3680*c03c5b1cSMartin Matuska     DEBUGLOG(4, "ZSTD_resetCStream: pledgedSrcSize = %u", (unsigned)pledgedSrcSize);
3681*c03c5b1cSMartin Matuska     FORWARD_IF_ERROR( ZSTD_CCtx_reset(zcs, ZSTD_reset_session_only) , "");
3682*c03c5b1cSMartin Matuska     FORWARD_IF_ERROR( ZSTD_CCtx_setPledgedSrcSize(zcs, pledgedSrcSize) , "");
3683*c03c5b1cSMartin Matuska     return 0;
3684*c03c5b1cSMartin Matuska }
3685*c03c5b1cSMartin Matuska 
3686*c03c5b1cSMartin Matuska /*! ZSTD_initCStream_internal() :
3687*c03c5b1cSMartin Matuska  *  Note : for lib/compress only. Used by zstdmt_compress.c.
3688*c03c5b1cSMartin Matuska  *  Assumption 1 : params are valid
3689*c03c5b1cSMartin Matuska  *  Assumption 2 : either dict, or cdict, is defined, not both */
ZSTD_initCStream_internal(ZSTD_CStream * zcs,const void * dict,size_t dictSize,const ZSTD_CDict * cdict,const ZSTD_CCtx_params * params,unsigned long long pledgedSrcSize)3690*c03c5b1cSMartin Matuska size_t ZSTD_initCStream_internal(ZSTD_CStream* zcs,
3691*c03c5b1cSMartin Matuska                     const void* dict, size_t dictSize, const ZSTD_CDict* cdict,
3692*c03c5b1cSMartin Matuska                     const ZSTD_CCtx_params* params,
3693*c03c5b1cSMartin Matuska                     unsigned long long pledgedSrcSize)
3694*c03c5b1cSMartin Matuska {
3695*c03c5b1cSMartin Matuska     DEBUGLOG(4, "ZSTD_initCStream_internal");
3696*c03c5b1cSMartin Matuska     FORWARD_IF_ERROR( ZSTD_CCtx_reset(zcs, ZSTD_reset_session_only) , "");
3697*c03c5b1cSMartin Matuska     FORWARD_IF_ERROR( ZSTD_CCtx_setPledgedSrcSize(zcs, pledgedSrcSize) , "");
3698*c03c5b1cSMartin Matuska     assert(!ZSTD_isError(ZSTD_checkCParams(params->cParams)));
3699*c03c5b1cSMartin Matuska     zcs->requestedParams = *params;
3700*c03c5b1cSMartin Matuska     assert(!((dict) && (cdict)));  /* either dict or cdict, not both */
3701*c03c5b1cSMartin Matuska     if (dict) {
3702*c03c5b1cSMartin Matuska         FORWARD_IF_ERROR( ZSTD_CCtx_loadDictionary(zcs, dict, dictSize) , "");
3703*c03c5b1cSMartin Matuska     } else {
3704*c03c5b1cSMartin Matuska         /* Dictionary is cleared if !cdict */
3705*c03c5b1cSMartin Matuska         FORWARD_IF_ERROR( ZSTD_CCtx_refCDict(zcs, cdict) , "");
3706*c03c5b1cSMartin Matuska     }
3707*c03c5b1cSMartin Matuska     return 0;
3708*c03c5b1cSMartin Matuska }
3709*c03c5b1cSMartin Matuska 
3710*c03c5b1cSMartin Matuska /* ZSTD_initCStream_usingCDict_advanced() :
3711*c03c5b1cSMartin Matuska  * same as ZSTD_initCStream_usingCDict(), with control over frame parameters */
ZSTD_initCStream_usingCDict_advanced(ZSTD_CStream * zcs,const ZSTD_CDict * cdict,ZSTD_frameParameters fParams,unsigned long long pledgedSrcSize)3712*c03c5b1cSMartin Matuska size_t ZSTD_initCStream_usingCDict_advanced(ZSTD_CStream* zcs,
3713*c03c5b1cSMartin Matuska                                             const ZSTD_CDict* cdict,
3714*c03c5b1cSMartin Matuska                                             ZSTD_frameParameters fParams,
3715*c03c5b1cSMartin Matuska                                             unsigned long long pledgedSrcSize)
3716*c03c5b1cSMartin Matuska {
3717*c03c5b1cSMartin Matuska     DEBUGLOG(4, "ZSTD_initCStream_usingCDict_advanced");
3718*c03c5b1cSMartin Matuska     FORWARD_IF_ERROR( ZSTD_CCtx_reset(zcs, ZSTD_reset_session_only) , "");
3719*c03c5b1cSMartin Matuska     FORWARD_IF_ERROR( ZSTD_CCtx_setPledgedSrcSize(zcs, pledgedSrcSize) , "");
3720*c03c5b1cSMartin Matuska     zcs->requestedParams.fParams = fParams;
3721*c03c5b1cSMartin Matuska     FORWARD_IF_ERROR( ZSTD_CCtx_refCDict(zcs, cdict) , "");
3722*c03c5b1cSMartin Matuska     return 0;
3723*c03c5b1cSMartin Matuska }
3724*c03c5b1cSMartin Matuska 
3725*c03c5b1cSMartin Matuska /* note : cdict must outlive compression session */
ZSTD_initCStream_usingCDict(ZSTD_CStream * zcs,const ZSTD_CDict * cdict)3726*c03c5b1cSMartin Matuska size_t ZSTD_initCStream_usingCDict(ZSTD_CStream* zcs, const ZSTD_CDict* cdict)
3727*c03c5b1cSMartin Matuska {
3728*c03c5b1cSMartin Matuska     DEBUGLOG(4, "ZSTD_initCStream_usingCDict");
3729*c03c5b1cSMartin Matuska     FORWARD_IF_ERROR( ZSTD_CCtx_reset(zcs, ZSTD_reset_session_only) , "");
3730*c03c5b1cSMartin Matuska     FORWARD_IF_ERROR( ZSTD_CCtx_refCDict(zcs, cdict) , "");
3731*c03c5b1cSMartin Matuska     return 0;
3732*c03c5b1cSMartin Matuska }
3733*c03c5b1cSMartin Matuska 
3734*c03c5b1cSMartin Matuska 
3735*c03c5b1cSMartin Matuska /* ZSTD_initCStream_advanced() :
3736*c03c5b1cSMartin Matuska  * pledgedSrcSize must be exact.
3737*c03c5b1cSMartin Matuska  * if srcSize is not known at init time, use value ZSTD_CONTENTSIZE_UNKNOWN.
3738*c03c5b1cSMartin Matuska  * dict is loaded with default parameters ZSTD_dct_auto and ZSTD_dlm_byCopy. */
ZSTD_initCStream_advanced(ZSTD_CStream * zcs,const void * dict,size_t dictSize,ZSTD_parameters params,unsigned long long pss)3739*c03c5b1cSMartin Matuska size_t ZSTD_initCStream_advanced(ZSTD_CStream* zcs,
3740*c03c5b1cSMartin Matuska                                  const void* dict, size_t dictSize,
3741*c03c5b1cSMartin Matuska                                  ZSTD_parameters params, unsigned long long pss)
3742*c03c5b1cSMartin Matuska {
3743*c03c5b1cSMartin Matuska     /* for compatibility with older programs relying on this behavior.
3744*c03c5b1cSMartin Matuska      * Users should now specify ZSTD_CONTENTSIZE_UNKNOWN.
3745*c03c5b1cSMartin Matuska      * This line will be removed in the future.
3746*c03c5b1cSMartin Matuska      */
3747*c03c5b1cSMartin Matuska     U64 const pledgedSrcSize = (pss==0 && params.fParams.contentSizeFlag==0) ? ZSTD_CONTENTSIZE_UNKNOWN : pss;
3748*c03c5b1cSMartin Matuska     DEBUGLOG(4, "ZSTD_initCStream_advanced");
3749*c03c5b1cSMartin Matuska     FORWARD_IF_ERROR( ZSTD_CCtx_reset(zcs, ZSTD_reset_session_only) , "");
3750*c03c5b1cSMartin Matuska     FORWARD_IF_ERROR( ZSTD_CCtx_setPledgedSrcSize(zcs, pledgedSrcSize) , "");
3751*c03c5b1cSMartin Matuska     FORWARD_IF_ERROR( ZSTD_checkCParams(params.cParams) , "");
3752*c03c5b1cSMartin Matuska     zcs->requestedParams = ZSTD_assignParamsToCCtxParams(&zcs->requestedParams, &params);
3753*c03c5b1cSMartin Matuska     FORWARD_IF_ERROR( ZSTD_CCtx_loadDictionary(zcs, dict, dictSize) , "");
3754*c03c5b1cSMartin Matuska     return 0;
3755*c03c5b1cSMartin Matuska }
3756*c03c5b1cSMartin Matuska 
/* ZSTD_initCStream_usingDict() :
 * Resets the session of `zcs`, sets its compression level,
 * then loads `dict` (dictSize bytes) into it.
 * @return : 0, or a forwarded error code */
size_t ZSTD_initCStream_usingDict(ZSTD_CStream* zcs, const void* dict, size_t dictSize, int compressionLevel)
{
    DEBUGLOG(4, "ZSTD_initCStream_usingDict");

    FORWARD_IF_ERROR(ZSTD_CCtx_reset(zcs, ZSTD_reset_session_only), "");
    FORWARD_IF_ERROR(ZSTD_CCtx_setParameter(zcs, ZSTD_c_compressionLevel, compressionLevel), "");
    FORWARD_IF_ERROR(ZSTD_CCtx_loadDictionary(zcs, dict, dictSize), "");

    return 0;
}
3765*c03c5b1cSMartin Matuska 
/* ZSTD_initCStream_srcSize() :
 * Resets the session of `zcs`, drops any referenced CDict, sets the
 * compression level, then records the pledged source size.
 * pss == 0 means "unknown".
 * @return : 0, or a forwarded error code */
size_t ZSTD_initCStream_srcSize(ZSTD_CStream* zcs, int compressionLevel, unsigned long long pss)
{
    /* temporary : 0 interpreted as "unknown" during transition period.
     * Users willing to specify "unknown" **must** use ZSTD_CONTENTSIZE_UNKNOWN.
     * 0 will be interpreted as "empty" in the future.
     */
    U64 pledgedSrcSize = pss;
    if (pss == 0) {
        pledgedSrcSize = ZSTD_CONTENTSIZE_UNKNOWN;
    }
    DEBUGLOG(4, "ZSTD_initCStream_srcSize");
    FORWARD_IF_ERROR(ZSTD_CCtx_reset(zcs, ZSTD_reset_session_only), "");
    FORWARD_IF_ERROR(ZSTD_CCtx_refCDict(zcs, NULL), "");
    FORWARD_IF_ERROR(ZSTD_CCtx_setParameter(zcs, ZSTD_c_compressionLevel, compressionLevel), "");
    FORWARD_IF_ERROR(ZSTD_CCtx_setPledgedSrcSize(zcs, pledgedSrcSize), "");
    return 0;
}
3780*c03c5b1cSMartin Matuska 
/* ZSTD_initCStream() :
 * Resets the session of `zcs`, drops any referenced CDict,
 * then sets the compression level.
 * @return : 0, or a forwarded error code */
size_t ZSTD_initCStream(ZSTD_CStream* zcs, int compressionLevel)
{
    DEBUGLOG(4, "ZSTD_initCStream");

    FORWARD_IF_ERROR(ZSTD_CCtx_reset(zcs, ZSTD_reset_session_only), "");
    FORWARD_IF_ERROR(ZSTD_CCtx_refCDict(zcs, NULL), "");
    FORWARD_IF_ERROR(ZSTD_CCtx_setParameter(zcs, ZSTD_c_compressionLevel, compressionLevel), "");

    return 0;
}
3789*c03c5b1cSMartin Matuska 
3790*c03c5b1cSMartin Matuska /*======   Compression   ======*/
3791*c03c5b1cSMartin Matuska 
ZSTD_nextInputSizeHint(const ZSTD_CCtx * cctx)3792*c03c5b1cSMartin Matuska static size_t ZSTD_nextInputSizeHint(const ZSTD_CCtx* cctx)
3793*c03c5b1cSMartin Matuska {
3794*c03c5b1cSMartin Matuska     size_t hintInSize = cctx->inBuffTarget - cctx->inBuffPos;
3795*c03c5b1cSMartin Matuska     if (hintInSize==0) hintInSize = cctx->blockSize;
3796*c03c5b1cSMartin Matuska     return hintInSize;
3797*c03c5b1cSMartin Matuska }
3798*c03c5b1cSMartin Matuska 
3799*c03c5b1cSMartin Matuska /** ZSTD_compressStream_generic():
3800*c03c5b1cSMartin Matuska  *  internal function for all *compressStream*() variants
3801*c03c5b1cSMartin Matuska  *  non-static, because can be called from zstdmt_compress.c
3802*c03c5b1cSMartin Matuska  * @return : hint size for next input */
ZSTD_compressStream_generic(ZSTD_CStream * zcs,ZSTD_outBuffer * output,ZSTD_inBuffer * input,ZSTD_EndDirective const flushMode)3803*c03c5b1cSMartin Matuska static size_t ZSTD_compressStream_generic(ZSTD_CStream* zcs,
3804*c03c5b1cSMartin Matuska                                           ZSTD_outBuffer* output,
3805*c03c5b1cSMartin Matuska                                           ZSTD_inBuffer* input,
3806*c03c5b1cSMartin Matuska                                           ZSTD_EndDirective const flushMode)
3807*c03c5b1cSMartin Matuska {
3808*c03c5b1cSMartin Matuska     const char* const istart = (const char*)input->src;
3809*c03c5b1cSMartin Matuska     const char* const iend = input->size != 0 ? istart + input->size : istart;
3810*c03c5b1cSMartin Matuska     const char* ip = input->pos != 0 ? istart + input->pos : istart;
3811*c03c5b1cSMartin Matuska     char* const ostart = (char*)output->dst;
3812*c03c5b1cSMartin Matuska     char* const oend = output->size != 0 ? ostart + output->size : ostart;
3813*c03c5b1cSMartin Matuska     char* op = output->pos != 0 ? ostart + output->pos : ostart;
3814*c03c5b1cSMartin Matuska     U32 someMoreWork = 1;
3815*c03c5b1cSMartin Matuska 
3816*c03c5b1cSMartin Matuska     /* check expectations */
3817*c03c5b1cSMartin Matuska     DEBUGLOG(5, "ZSTD_compressStream_generic, flush=%u", (unsigned)flushMode);
3818*c03c5b1cSMartin Matuska     assert(zcs->inBuff != NULL);
3819*c03c5b1cSMartin Matuska     assert(zcs->inBuffSize > 0);
3820*c03c5b1cSMartin Matuska     assert(zcs->outBuff !=  NULL);
3821*c03c5b1cSMartin Matuska     assert(zcs->outBuffSize > 0);
3822*c03c5b1cSMartin Matuska     assert(output->pos <= output->size);
3823*c03c5b1cSMartin Matuska     assert(input->pos <= input->size);
3824*c03c5b1cSMartin Matuska 
3825*c03c5b1cSMartin Matuska     while (someMoreWork) {
3826*c03c5b1cSMartin Matuska         switch(zcs->streamStage)
3827*c03c5b1cSMartin Matuska         {
3828*c03c5b1cSMartin Matuska         case zcss_init:
3829*c03c5b1cSMartin Matuska             RETURN_ERROR(init_missing, "call ZSTD_initCStream() first!");
3830*c03c5b1cSMartin Matuska 
3831*c03c5b1cSMartin Matuska         case zcss_load:
3832*c03c5b1cSMartin Matuska             if ( (flushMode == ZSTD_e_end)
3833*c03c5b1cSMartin Matuska               && ((size_t)(oend-op) >= ZSTD_compressBound(iend-ip))  /* enough dstCapacity */
3834*c03c5b1cSMartin Matuska               && (zcs->inBuffPos == 0) ) {
3835*c03c5b1cSMartin Matuska                 /* shortcut to compression pass directly into output buffer */
3836*c03c5b1cSMartin Matuska                 size_t const cSize = ZSTD_compressEnd(zcs,
3837*c03c5b1cSMartin Matuska                                                 op, oend-op, ip, iend-ip);
3838*c03c5b1cSMartin Matuska                 DEBUGLOG(4, "ZSTD_compressEnd : cSize=%u", (unsigned)cSize);
3839*c03c5b1cSMartin Matuska                 FORWARD_IF_ERROR(cSize, "ZSTD_compressEnd failed");
3840*c03c5b1cSMartin Matuska                 ip = iend;
3841*c03c5b1cSMartin Matuska                 op += cSize;
3842*c03c5b1cSMartin Matuska                 zcs->frameEnded = 1;
3843*c03c5b1cSMartin Matuska                 ZSTD_CCtx_reset(zcs, ZSTD_reset_session_only);
3844*c03c5b1cSMartin Matuska                 someMoreWork = 0; break;
3845*c03c5b1cSMartin Matuska             }
3846*c03c5b1cSMartin Matuska             /* complete loading into inBuffer */
3847*c03c5b1cSMartin Matuska             {   size_t const toLoad = zcs->inBuffTarget - zcs->inBuffPos;
3848*c03c5b1cSMartin Matuska                 size_t const loaded = ZSTD_limitCopy(
3849*c03c5b1cSMartin Matuska                                         zcs->inBuff + zcs->inBuffPos, toLoad,
3850*c03c5b1cSMartin Matuska                                         ip, iend-ip);
3851*c03c5b1cSMartin Matuska                 zcs->inBuffPos += loaded;
3852*c03c5b1cSMartin Matuska                 if (loaded != 0)
3853*c03c5b1cSMartin Matuska                     ip += loaded;
3854*c03c5b1cSMartin Matuska                 if ( (flushMode == ZSTD_e_continue)
3855*c03c5b1cSMartin Matuska                   && (zcs->inBuffPos < zcs->inBuffTarget) ) {
3856*c03c5b1cSMartin Matuska                     /* not enough input to fill full block : stop here */
3857*c03c5b1cSMartin Matuska                     someMoreWork = 0; break;
3858*c03c5b1cSMartin Matuska                 }
3859*c03c5b1cSMartin Matuska                 if ( (flushMode == ZSTD_e_flush)
3860*c03c5b1cSMartin Matuska                   && (zcs->inBuffPos == zcs->inToCompress) ) {
3861*c03c5b1cSMartin Matuska                     /* empty */
3862*c03c5b1cSMartin Matuska                     someMoreWork = 0; break;
3863*c03c5b1cSMartin Matuska                 }
3864*c03c5b1cSMartin Matuska             }
3865*c03c5b1cSMartin Matuska             /* compress current block (note : this stage cannot be stopped in the middle) */
3866*c03c5b1cSMartin Matuska             DEBUGLOG(5, "stream compression stage (flushMode==%u)", flushMode);
3867*c03c5b1cSMartin Matuska             {   void* cDst;
3868*c03c5b1cSMartin Matuska                 size_t cSize;
3869*c03c5b1cSMartin Matuska                 size_t const iSize = zcs->inBuffPos - zcs->inToCompress;
3870*c03c5b1cSMartin Matuska                 size_t oSize = oend-op;
3871*c03c5b1cSMartin Matuska                 unsigned const lastBlock = (flushMode == ZSTD_e_end) && (ip==iend);
3872*c03c5b1cSMartin Matuska                 if (oSize >= ZSTD_compressBound(iSize))
3873*c03c5b1cSMartin Matuska                     cDst = op;   /* compress into output buffer, to skip flush stage */
3874*c03c5b1cSMartin Matuska                 else
3875*c03c5b1cSMartin Matuska                     cDst = zcs->outBuff, oSize = zcs->outBuffSize;
3876*c03c5b1cSMartin Matuska                 cSize = lastBlock ?
3877*c03c5b1cSMartin Matuska                         ZSTD_compressEnd(zcs, cDst, oSize,
3878*c03c5b1cSMartin Matuska                                     zcs->inBuff + zcs->inToCompress, iSize) :
3879*c03c5b1cSMartin Matuska                         ZSTD_compressContinue(zcs, cDst, oSize,
3880*c03c5b1cSMartin Matuska                                     zcs->inBuff + zcs->inToCompress, iSize);
3881*c03c5b1cSMartin Matuska                 FORWARD_IF_ERROR(cSize, "%s", lastBlock ? "ZSTD_compressEnd failed" : "ZSTD_compressContinue failed");
3882*c03c5b1cSMartin Matuska                 zcs->frameEnded = lastBlock;
3883*c03c5b1cSMartin Matuska                 /* prepare next block */
3884*c03c5b1cSMartin Matuska                 zcs->inBuffTarget = zcs->inBuffPos + zcs->blockSize;
3885*c03c5b1cSMartin Matuska                 if (zcs->inBuffTarget > zcs->inBuffSize)
3886*c03c5b1cSMartin Matuska                     zcs->inBuffPos = 0, zcs->inBuffTarget = zcs->blockSize;
3887*c03c5b1cSMartin Matuska                 DEBUGLOG(5, "inBuffTarget:%u / inBuffSize:%u",
3888*c03c5b1cSMartin Matuska                          (unsigned)zcs->inBuffTarget, (unsigned)zcs->inBuffSize);
3889*c03c5b1cSMartin Matuska                 if (!lastBlock)
3890*c03c5b1cSMartin Matuska                     assert(zcs->inBuffTarget <= zcs->inBuffSize);
3891*c03c5b1cSMartin Matuska                 zcs->inToCompress = zcs->inBuffPos;
3892*c03c5b1cSMartin Matuska                 if (cDst == op) {  /* no need to flush */
3893*c03c5b1cSMartin Matuska                     op += cSize;
3894*c03c5b1cSMartin Matuska                     if (zcs->frameEnded) {
3895*c03c5b1cSMartin Matuska                         DEBUGLOG(5, "Frame completed directly in outBuffer");
3896*c03c5b1cSMartin Matuska                         someMoreWork = 0;
3897*c03c5b1cSMartin Matuska                         ZSTD_CCtx_reset(zcs, ZSTD_reset_session_only);
3898*c03c5b1cSMartin Matuska                     }
3899*c03c5b1cSMartin Matuska                     break;
3900*c03c5b1cSMartin Matuska                 }
3901*c03c5b1cSMartin Matuska                 zcs->outBuffContentSize = cSize;
3902*c03c5b1cSMartin Matuska                 zcs->outBuffFlushedSize = 0;
3903*c03c5b1cSMartin Matuska                 zcs->streamStage = zcss_flush; /* pass-through to flush stage */
3904*c03c5b1cSMartin Matuska             }
3905*c03c5b1cSMartin Matuska 	    /* fall-through */
3906*c03c5b1cSMartin Matuska         case zcss_flush:
3907*c03c5b1cSMartin Matuska             DEBUGLOG(5, "flush stage");
3908*c03c5b1cSMartin Matuska             {   size_t const toFlush = zcs->outBuffContentSize - zcs->outBuffFlushedSize;
3909*c03c5b1cSMartin Matuska                 size_t const flushed = ZSTD_limitCopy(op, (size_t)(oend-op),
3910*c03c5b1cSMartin Matuska                             zcs->outBuff + zcs->outBuffFlushedSize, toFlush);
3911*c03c5b1cSMartin Matuska                 DEBUGLOG(5, "toFlush: %u into %u ==> flushed: %u",
3912*c03c5b1cSMartin Matuska                             (unsigned)toFlush, (unsigned)(oend-op), (unsigned)flushed);
3913*c03c5b1cSMartin Matuska                 if (flushed)
3914*c03c5b1cSMartin Matuska                     op += flushed;
3915*c03c5b1cSMartin Matuska                 zcs->outBuffFlushedSize += flushed;
3916*c03c5b1cSMartin Matuska                 if (toFlush!=flushed) {
3917*c03c5b1cSMartin Matuska                     /* flush not fully completed, presumably because dst is too small */
3918*c03c5b1cSMartin Matuska                     assert(op==oend);
3919*c03c5b1cSMartin Matuska                     someMoreWork = 0;
3920*c03c5b1cSMartin Matuska                     break;
3921*c03c5b1cSMartin Matuska                 }
3922*c03c5b1cSMartin Matuska                 zcs->outBuffContentSize = zcs->outBuffFlushedSize = 0;
3923*c03c5b1cSMartin Matuska                 if (zcs->frameEnded) {
3924*c03c5b1cSMartin Matuska                     DEBUGLOG(5, "Frame completed on flush");
3925*c03c5b1cSMartin Matuska                     someMoreWork = 0;
3926*c03c5b1cSMartin Matuska                     ZSTD_CCtx_reset(zcs, ZSTD_reset_session_only);
3927*c03c5b1cSMartin Matuska                     break;
3928*c03c5b1cSMartin Matuska                 }
3929*c03c5b1cSMartin Matuska                 zcs->streamStage = zcss_load;
3930*c03c5b1cSMartin Matuska                 break;
3931*c03c5b1cSMartin Matuska             }
3932*c03c5b1cSMartin Matuska 
3933*c03c5b1cSMartin Matuska         default: /* impossible */
3934*c03c5b1cSMartin Matuska             assert(0);
3935*c03c5b1cSMartin Matuska         }
3936*c03c5b1cSMartin Matuska     }
3937*c03c5b1cSMartin Matuska 
3938*c03c5b1cSMartin Matuska     input->pos = ip - istart;
3939*c03c5b1cSMartin Matuska     output->pos = op - ostart;
3940*c03c5b1cSMartin Matuska     if (zcs->frameEnded) return 0;
3941*c03c5b1cSMartin Matuska     return ZSTD_nextInputSizeHint(zcs);
3942*c03c5b1cSMartin Matuska }
3943*c03c5b1cSMartin Matuska 
/* ZSTD_nextInputSizeHint_MTorST() :
 * Selects the source of the "next input size" hint for `cctx`.
 * When compiled with ZSTD_MULTITHREAD and at least one worker is applied,
 * the hint comes from ZSTDMT_nextInputSizeHint();
 * in every other case it comes from ZSTD_nextInputSizeHint(). */
static size_t ZSTD_nextInputSizeHint_MTorST(const ZSTD_CCtx* cctx)
{
#ifdef ZSTD_MULTITHREAD
    if (cctx->appliedParams.nbWorkers < 1)
        return ZSTD_nextInputSizeHint(cctx);   /* no worker applied : single-thread hint */
    assert(cctx->mtctx != NULL);
    return ZSTDMT_nextInputSizeHint(cctx->mtctx);
#else
    return ZSTD_nextInputSizeHint(cctx);
#endif
}
3955*c03c5b1cSMartin Matuska 
/* ZSTD_compressStream() :
 * Runs ZSTD_compressStream2() with the ZSTD_e_continue directive.
 * @return : the error code forwarded from ZSTD_compressStream2() on failure,
 *           otherwise the hint computed by ZSTD_nextInputSizeHint_MTorST(). */
size_t ZSTD_compressStream(ZSTD_CStream* zcs, ZSTD_outBuffer* output, ZSTD_inBuffer* input)
{
    FORWARD_IF_ERROR( ZSTD_compressStream2(zcs, output, input, ZSTD_e_continue) , "");
    {   size_t const nextHint = ZSTD_nextInputSizeHint_MTorST(zcs);
        return nextHint;
    }
}
3961*c03c5b1cSMartin Matuska 
3962*c03c5b1cSMartin Matuska 
/*! ZSTD_compressStream2() :
 *  Streaming compression entry point.
 *  On the first call of a session (streamStage == zcss_init), the context is
 *  transparently initialized from cctx->requestedParams, the local dictionary
 *  (if any), and the single-use prefix dictionary.
 *  The call is then delegated either to the multi-threaded engine
 *  (ZSTD_MULTITHREAD builds with appliedParams.nbWorkers > 0)
 *  or to ZSTD_compressStream_generic().
 * @param cctx   : compression context, must not be NULL (asserted)
 * @param output : destination buffer; requires output->pos <= output->size
 * @param input  : source buffer; requires input->pos <= input->size
 * @param endOp  : ZSTD_e_continue, ZSTD_e_flush or ZSTD_e_end
 * @return : an error code if a buffer is invalid or a sub-stage fails.
 *           Otherwise, in single-thread mode, the number of bytes still held in
 *           the internal output buffer (remaining to flush);
 *           in multi-thread mode, the value reported by ZSTDMT_compressStream_generic(). */
size_t ZSTD_compressStream2( ZSTD_CCtx* cctx,
                             ZSTD_outBuffer* output,
                             ZSTD_inBuffer* input,
                             ZSTD_EndDirective endOp)
{
    DEBUGLOG(5, "ZSTD_compressStream2, endOp=%u ", (unsigned)endOp);
    /* check conditions */
    RETURN_ERROR_IF(output->pos > output->size, GENERIC, "invalid buffer");
    RETURN_ERROR_IF(input->pos  > input->size, GENERIC, "invalid buffer");
    assert(cctx!=NULL);

    /* transparent initialization stage */
    if (cctx->streamStage == zcss_init) {
        ZSTD_CCtx_params params = cctx->requestedParams;
        ZSTD_prefixDict const prefixDict = cctx->prefixDict;
        /* Only the bytes in [pos, size) remain to be consumed :
         * there is no obligation for the caller to start from pos==0.
         * Cannot underflow, since pos <= size was validated above. */
        size_t const inputSize = input->size - input->pos;
        FORWARD_IF_ERROR( ZSTD_initLocalDict(cctx) , ""); /* Init the local dict if present. */
        memset(&cctx->prefixDict, 0, sizeof(cctx->prefixDict));   /* single usage */
        assert(prefixDict.dict==NULL || cctx->cdict==NULL);    /* only one can be set */
        DEBUGLOG(4, "ZSTD_compressStream2 : transparent init stage");
        /* When the whole frame is produced from this single call, the source size is known :
         * pledge exactly what remains to be read, so the end-of-frame size check
         * matches the amount actually consumed. */
        if (endOp == ZSTD_e_end) cctx->pledgedSrcSizePlusOne = inputSize + 1;  /* auto-fix pledgedSrcSize */
        params.cParams = ZSTD_getCParamsFromCCtxParams(
                &cctx->requestedParams, cctx->pledgedSrcSizePlusOne-1, 0 /*dictSize*/);


#ifdef ZSTD_MULTITHREAD
        if ((cctx->pledgedSrcSizePlusOne-1) <= ZSTDMT_JOBSIZE_MIN) {
            params.nbWorkers = 0; /* do not invoke multi-threading when src size is too small */
        }
        if (params.nbWorkers > 0) {
            /* mt context creation */
            if (cctx->mtctx == NULL) {
                DEBUGLOG(4, "ZSTD_compressStream2: creating new mtctx for nbWorkers=%u",
                            params.nbWorkers);
                cctx->mtctx = ZSTDMT_createCCtx_advanced((U32)params.nbWorkers, cctx->customMem);
                RETURN_ERROR_IF(cctx->mtctx == NULL, memory_allocation, "NULL pointer!");
            }
            /* mt compression */
            DEBUGLOG(4, "call ZSTDMT_initCStream_internal as nbWorkers=%u", params.nbWorkers);
            FORWARD_IF_ERROR( ZSTDMT_initCStream_internal(
                        cctx->mtctx,
                        prefixDict.dict, prefixDict.dictSize, prefixDict.dictContentType,
                        cctx->cdict, params, cctx->pledgedSrcSizePlusOne-1) , "");
            cctx->streamStage = zcss_load;
            cctx->appliedParams.nbWorkers = params.nbWorkers;
        } else
#endif
        {   FORWARD_IF_ERROR( ZSTD_resetCStream_internal(cctx,
                            prefixDict.dict, prefixDict.dictSize, prefixDict.dictContentType,
                            cctx->cdict,
                            params, cctx->pledgedSrcSizePlusOne-1) , "");
            assert(cctx->streamStage == zcss_load);
            assert(cctx->appliedParams.nbWorkers == 0);
    }   }
    /* end of transparent initialization stage */

    /* compression stage */
#ifdef ZSTD_MULTITHREAD
    if (cctx->appliedParams.nbWorkers > 0) {
        /* flush and end directives must keep going until done or output is full */
        int const forceMaxProgress = (endOp == ZSTD_e_flush || endOp == ZSTD_e_end);
        size_t flushMin;
        assert(forceMaxProgress || endOp == ZSTD_e_continue /* Protection for a new flush type */);
        if (cctx->cParamsChanged) {
            ZSTDMT_updateCParams_whileCompressing(cctx->mtctx, &cctx->requestedParams);
            cctx->cParamsChanged = 0;
        }
        do {
            flushMin = ZSTDMT_compressStream_generic(cctx->mtctx, output, input, endOp);
            /* the session is reset both on error and on frame completion */
            if ( ZSTD_isError(flushMin)
              || (endOp == ZSTD_e_end && flushMin == 0) ) { /* compression completed */
                ZSTD_CCtx_reset(cctx, ZSTD_reset_session_only);
            }
            FORWARD_IF_ERROR(flushMin, "ZSTDMT_compressStream_generic failed");
        } while (forceMaxProgress && flushMin != 0 && output->pos < output->size);
        DEBUGLOG(5, "completed ZSTD_compressStream2 delegating to ZSTDMT_compressStream_generic");
        /* Either we don't require maximum forward progress, we've finished the
         * flush, or we are out of output space.
         */
        assert(!forceMaxProgress || flushMin == 0 || output->pos == output->size);
        return flushMin;
    }
#endif
    FORWARD_IF_ERROR( ZSTD_compressStream_generic(cctx, output, input, endOp) , "");
    DEBUGLOG(5, "completed ZSTD_compressStream2");
    return cctx->outBuffContentSize - cctx->outBuffFlushedSize; /* remaining to flush */
}
4048*c03c5b1cSMartin Matuska 
/* ZSTD_compressStream2_simpleArgs() :
 * Variant of ZSTD_compressStream2() taking plain pointers, sizes and positions
 * instead of ZSTD_outBuffer / ZSTD_inBuffer structures.
 * *dstPos and *srcPos are read as starting positions,
 * then overwritten with the positions reached after the call.
 * @return : whatever ZSTD_compressStream2() returns. */
size_t ZSTD_compressStream2_simpleArgs (
                            ZSTD_CCtx* cctx,
                            void* dst, size_t dstCapacity, size_t* dstPos,
                      const void* src, size_t srcSize, size_t* srcPos,
                            ZSTD_EndDirective endOp)
{
    ZSTD_outBuffer outBuf;
    ZSTD_inBuffer  inBuf;
    size_t status;

    outBuf.dst  = dst;
    outBuf.size = dstCapacity;
    outBuf.pos  = *dstPos;

    inBuf.src  = src;
    inBuf.size = srcSize;
    inBuf.pos  = *srcPos;

    /* validity of both positions is checked by ZSTD_compressStream2() */
    status = ZSTD_compressStream2(cctx, &outBuf, &inBuf, endOp);

    /* report progress back to the caller */
    *dstPos = outBuf.pos;
    *srcPos = inBuf.pos;
    return status;
}
4063*c03c5b1cSMartin Matuska 
/* ZSTD_compress2() :
 * Resets the session of `cctx`, then compresses `src` into `dst`
 * through a single ZSTD_e_end invocation of the streaming API.
 * @return : number of bytes written into `dst`,
 *           or a forwarded error code,
 *           or dstSize_tooSmall when the frame could not be completed in one call. */
size_t ZSTD_compress2(ZSTD_CCtx* cctx,
                      void* dst, size_t dstCapacity,
                      const void* src, size_t srcSize)
{
    size_t oPos = 0;   /* progress within dst */
    size_t iPos = 0;   /* progress within src */
    size_t result;

    DEBUGLOG(4, "ZSTD_compress2 (srcSize=%u)", (unsigned)srcSize);
    ZSTD_CCtx_reset(cctx, ZSTD_reset_session_only);

    result = ZSTD_compressStream2_simpleArgs(cctx,
                                    dst, dstCapacity, &oPos,
                                    src, srcSize, &iPos,
                                    ZSTD_e_end);
    FORWARD_IF_ERROR(result, "ZSTD_compressStream2_simpleArgs failed");

    if (result != 0) {
        /* something is left to flush : output space ran out */
        assert(oPos == dstCapacity);
        RETURN_ERROR(dstSize_tooSmall, "");
    }

    assert(iPos == srcSize);   /* a completed frame implies all input was consumed */
    return oPos;
}
4085*c03c5b1cSMartin Matuska 
4086*c03c5b1cSMartin Matuska /*======   Finalize   ======*/
4087*c03c5b1cSMartin Matuska 
4088*c03c5b1cSMartin Matuska /*! ZSTD_flushStream() :
4089*c03c5b1cSMartin Matuska  * @return : amount of data remaining to flush */
ZSTD_flushStream(ZSTD_CStream * zcs,ZSTD_outBuffer * output)4090*c03c5b1cSMartin Matuska size_t ZSTD_flushStream(ZSTD_CStream* zcs, ZSTD_outBuffer* output)
4091*c03c5b1cSMartin Matuska {
4092*c03c5b1cSMartin Matuska     ZSTD_inBuffer input = { NULL, 0, 0 };
4093*c03c5b1cSMartin Matuska     return ZSTD_compressStream2(zcs, output, &input, ZSTD_e_flush);
4094*c03c5b1cSMartin Matuska }
4095*c03c5b1cSMartin Matuska 
4096*c03c5b1cSMartin Matuska 
/* ZSTD_endStream() :
 * Invokes ZSTD_compressStream2() with an empty input and the ZSTD_e_end directive.
 * @return : a forwarded error code on failure.
 *           With workers applied : the value returned by ZSTD_compressStream2(), unchanged.
 *           Otherwise : that value, plus a block header size and the checksum size
 *           (4 bytes when checksumFlag is set) as long as the frame is not ended yet. */
size_t ZSTD_endStream(ZSTD_CStream* zcs, ZSTD_outBuffer* output)
{
    ZSTD_inBuffer input = { NULL, 0, 0 };
    size_t const remainingToFlush = ZSTD_compressStream2(zcs, output, &input, ZSTD_e_end);
    FORWARD_IF_ERROR( remainingToFlush , "ZSTD_compressStream2 failed");

    if (zcs->appliedParams.nbWorkers > 0) {
        /* multi-thread mode : only a minimal estimation is available */
        return remainingToFlush;
    }

    /* single thread mode : attempt to calculate remaining to flush more precisely */
    {   size_t frameTail = 0;   /* bytes still to be produced to close the frame */
        size_t toFlush;
        if (!zcs->frameEnded) {
            frameTail = ZSTD_BLOCKHEADERSIZE;
            frameTail += (size_t)(zcs->appliedParams.fParams.checksumFlag * 4);
        }
        toFlush = remainingToFlush + frameTail;
        DEBUGLOG(4, "ZSTD_endStream : remaining to flush : %u", (unsigned)toFlush);
        return toFlush;
    }
}
4111*c03c5b1cSMartin Matuska 
4112*c03c5b1cSMartin Matuska 
4113*c03c5b1cSMartin Matuska /*-=====  Pre-defined compression levels  =====-*/
4114*c03c5b1cSMartin Matuska 
#define ZSTD_MAX_CLEVEL     22

/* ZSTD_maxCLevel() :
 * @return : the highest pre-defined compression level, ZSTD_MAX_CLEVEL. */
int ZSTD_maxCLevel(void)
{
    return ZSTD_MAX_CLEVEL;
}
ZSTD_minCLevel(void)4117*c03c5b1cSMartin Matuska int ZSTD_minCLevel(void) { return (int)-ZSTD_TARGETLENGTH_MAX; }
4118*c03c5b1cSMartin Matuska 
/* ZSTD_defaultCParameters :
 * Pre-defined compression parameters, organized as 4 tables of ZSTD_MAX_CLEVEL+1 rows.
 * First index  : table selected by ZSTD_getCParams_internal() from the estimated size
 *                (0: > 256 KB, 1: <= 256 KB, 2: <= 128 KB, 3: <= 16 KB).
 * Second index : compression level; row 0 is the base used for negative levels.
 * Column legend "W, C, H, S, L, TL, strat" : presumably windowLog, chainLog, hashLog,
 * searchLog, minMatch, targetLength, strategy -- TODO confirm against the field order
 * of ZSTD_compressionParameters. */
4119*c03c5b1cSMartin Matuska static const ZSTD_compressionParameters ZSTD_defaultCParameters[4][ZSTD_MAX_CLEVEL+1] = {
4120*c03c5b1cSMartin Matuska {   /* "default" - for any srcSize > 256 KB */
4121*c03c5b1cSMartin Matuska     /* W,  C,  H,  S,  L, TL, strat */
4122*c03c5b1cSMartin Matuska     { 19, 12, 13,  1,  6,  1, ZSTD_fast    },  /* base for negative levels */
4123*c03c5b1cSMartin Matuska     { 19, 13, 14,  1,  7,  0, ZSTD_fast    },  /* level  1 */
4124*c03c5b1cSMartin Matuska     { 20, 15, 16,  1,  6,  0, ZSTD_fast    },  /* level  2 */
4125*c03c5b1cSMartin Matuska     { 21, 16, 17,  1,  5,  0, ZSTD_dfast   },  /* level  3 */
4126*c03c5b1cSMartin Matuska     { 21, 18, 18,  1,  5,  0, ZSTD_dfast   },  /* level  4 */
4127*c03c5b1cSMartin Matuska     { 21, 18, 19,  2,  5,  2, ZSTD_greedy  },  /* level  5 */
4128*c03c5b1cSMartin Matuska     { 21, 19, 19,  3,  5,  4, ZSTD_greedy  },  /* level  6 */
4129*c03c5b1cSMartin Matuska     { 21, 19, 19,  3,  5,  8, ZSTD_lazy    },  /* level  7 */
4130*c03c5b1cSMartin Matuska     { 21, 19, 19,  3,  5, 16, ZSTD_lazy2   },  /* level  8 */
4131*c03c5b1cSMartin Matuska     { 21, 19, 20,  4,  5, 16, ZSTD_lazy2   },  /* level  9 */
4132*c03c5b1cSMartin Matuska     { 22, 20, 21,  4,  5, 16, ZSTD_lazy2   },  /* level 10 */
4133*c03c5b1cSMartin Matuska     { 22, 21, 22,  4,  5, 16, ZSTD_lazy2   },  /* level 11 */
4134*c03c5b1cSMartin Matuska     { 22, 21, 22,  5,  5, 16, ZSTD_lazy2   },  /* level 12 */
4135*c03c5b1cSMartin Matuska     { 22, 21, 22,  5,  5, 32, ZSTD_btlazy2 },  /* level 13 */
4136*c03c5b1cSMartin Matuska     { 22, 22, 23,  5,  5, 32, ZSTD_btlazy2 },  /* level 14 */
4137*c03c5b1cSMartin Matuska     { 22, 23, 23,  6,  5, 32, ZSTD_btlazy2 },  /* level 15 */
4138*c03c5b1cSMartin Matuska     { 22, 22, 22,  5,  5, 48, ZSTD_btopt   },  /* level 16 */
4139*c03c5b1cSMartin Matuska     { 23, 23, 22,  5,  4, 64, ZSTD_btopt   },  /* level 17 */
4140*c03c5b1cSMartin Matuska     { 23, 23, 22,  6,  3, 64, ZSTD_btultra },  /* level 18 */
4141*c03c5b1cSMartin Matuska     { 23, 24, 22,  7,  3,256, ZSTD_btultra2},  /* level 19 */
4142*c03c5b1cSMartin Matuska     { 25, 25, 23,  7,  3,256, ZSTD_btultra2},  /* level 20 */
4143*c03c5b1cSMartin Matuska     { 26, 26, 24,  7,  3,512, ZSTD_btultra2},  /* level 21 */
4144*c03c5b1cSMartin Matuska     { 27, 27, 25,  9,  3,999, ZSTD_btultra2},  /* level 22 */
4145*c03c5b1cSMartin Matuska },
4146*c03c5b1cSMartin Matuska {   /* for srcSize <= 256 KB */
4147*c03c5b1cSMartin Matuska     /* W,  C,  H,  S,  L, TL, strat */
4148*c03c5b1cSMartin Matuska     { 18, 12, 13,  1,  5,  1, ZSTD_fast    },  /* base for negative levels */
4149*c03c5b1cSMartin Matuska     { 18, 13, 14,  1,  6,  0, ZSTD_fast    },  /* level  1 */
4150*c03c5b1cSMartin Matuska     { 18, 14, 14,  1,  5,  0, ZSTD_dfast   },  /* level  2 */
4151*c03c5b1cSMartin Matuska     { 18, 16, 16,  1,  4,  0, ZSTD_dfast   },  /* level  3 */
4152*c03c5b1cSMartin Matuska     { 18, 16, 17,  2,  5,  2, ZSTD_greedy  },  /* level  4.*/
4153*c03c5b1cSMartin Matuska     { 18, 18, 18,  3,  5,  2, ZSTD_greedy  },  /* level  5.*/
4154*c03c5b1cSMartin Matuska     { 18, 18, 19,  3,  5,  4, ZSTD_lazy    },  /* level  6.*/
4155*c03c5b1cSMartin Matuska     { 18, 18, 19,  4,  4,  4, ZSTD_lazy    },  /* level  7 */
4156*c03c5b1cSMartin Matuska     { 18, 18, 19,  4,  4,  8, ZSTD_lazy2   },  /* level  8 */
4157*c03c5b1cSMartin Matuska     { 18, 18, 19,  5,  4,  8, ZSTD_lazy2   },  /* level  9 */
4158*c03c5b1cSMartin Matuska     { 18, 18, 19,  6,  4,  8, ZSTD_lazy2   },  /* level 10 */
4159*c03c5b1cSMartin Matuska     { 18, 18, 19,  5,  4, 12, ZSTD_btlazy2 },  /* level 11.*/
4160*c03c5b1cSMartin Matuska     { 18, 19, 19,  7,  4, 12, ZSTD_btlazy2 },  /* level 12.*/
4161*c03c5b1cSMartin Matuska     { 18, 18, 19,  4,  4, 16, ZSTD_btopt   },  /* level 13 */
4162*c03c5b1cSMartin Matuska     { 18, 18, 19,  4,  3, 32, ZSTD_btopt   },  /* level 14.*/
4163*c03c5b1cSMartin Matuska     { 18, 18, 19,  6,  3,128, ZSTD_btopt   },  /* level 15.*/
4164*c03c5b1cSMartin Matuska     { 18, 19, 19,  6,  3,128, ZSTD_btultra },  /* level 16.*/
4165*c03c5b1cSMartin Matuska     { 18, 19, 19,  8,  3,256, ZSTD_btultra },  /* level 17.*/
4166*c03c5b1cSMartin Matuska     { 18, 19, 19,  6,  3,128, ZSTD_btultra2},  /* level 18.*/
4167*c03c5b1cSMartin Matuska     { 18, 19, 19,  8,  3,256, ZSTD_btultra2},  /* level 19.*/
4168*c03c5b1cSMartin Matuska     { 18, 19, 19, 10,  3,512, ZSTD_btultra2},  /* level 20.*/
4169*c03c5b1cSMartin Matuska     { 18, 19, 19, 12,  3,512, ZSTD_btultra2},  /* level 21.*/
4170*c03c5b1cSMartin Matuska     { 18, 19, 19, 13,  3,999, ZSTD_btultra2},  /* level 22.*/
4171*c03c5b1cSMartin Matuska },
4172*c03c5b1cSMartin Matuska {   /* for srcSize <= 128 KB */
4173*c03c5b1cSMartin Matuska     /* W,  C,  H,  S,  L, TL, strat */
4174*c03c5b1cSMartin Matuska     { 17, 12, 12,  1,  5,  1, ZSTD_fast    },  /* base for negative levels */
4175*c03c5b1cSMartin Matuska     { 17, 12, 13,  1,  6,  0, ZSTD_fast    },  /* level  1 */
4176*c03c5b1cSMartin Matuska     { 17, 13, 15,  1,  5,  0, ZSTD_fast    },  /* level  2 */
4177*c03c5b1cSMartin Matuska     { 17, 15, 16,  2,  5,  0, ZSTD_dfast   },  /* level  3 */
4178*c03c5b1cSMartin Matuska     { 17, 17, 17,  2,  4,  0, ZSTD_dfast   },  /* level  4 */
4179*c03c5b1cSMartin Matuska     { 17, 16, 17,  3,  4,  2, ZSTD_greedy  },  /* level  5 */
4180*c03c5b1cSMartin Matuska     { 17, 17, 17,  3,  4,  4, ZSTD_lazy    },  /* level  6 */
4181*c03c5b1cSMartin Matuska     { 17, 17, 17,  3,  4,  8, ZSTD_lazy2   },  /* level  7 */
4182*c03c5b1cSMartin Matuska     { 17, 17, 17,  4,  4,  8, ZSTD_lazy2   },  /* level  8 */
4183*c03c5b1cSMartin Matuska     { 17, 17, 17,  5,  4,  8, ZSTD_lazy2   },  /* level  9 */
4184*c03c5b1cSMartin Matuska     { 17, 17, 17,  6,  4,  8, ZSTD_lazy2   },  /* level 10 */
4185*c03c5b1cSMartin Matuska     { 17, 17, 17,  5,  4,  8, ZSTD_btlazy2 },  /* level 11 */
4186*c03c5b1cSMartin Matuska     { 17, 18, 17,  7,  4, 12, ZSTD_btlazy2 },  /* level 12 */
4187*c03c5b1cSMartin Matuska     { 17, 18, 17,  3,  4, 12, ZSTD_btopt   },  /* level 13.*/
4188*c03c5b1cSMartin Matuska     { 17, 18, 17,  4,  3, 32, ZSTD_btopt   },  /* level 14.*/
4189*c03c5b1cSMartin Matuska     { 17, 18, 17,  6,  3,256, ZSTD_btopt   },  /* level 15.*/
4190*c03c5b1cSMartin Matuska     { 17, 18, 17,  6,  3,128, ZSTD_btultra },  /* level 16.*/
4191*c03c5b1cSMartin Matuska     { 17, 18, 17,  8,  3,256, ZSTD_btultra },  /* level 17.*/
4192*c03c5b1cSMartin Matuska     { 17, 18, 17, 10,  3,512, ZSTD_btultra },  /* level 18.*/
4193*c03c5b1cSMartin Matuska     { 17, 18, 17,  5,  3,256, ZSTD_btultra2},  /* level 19.*/
4194*c03c5b1cSMartin Matuska     { 17, 18, 17,  7,  3,512, ZSTD_btultra2},  /* level 20.*/
4195*c03c5b1cSMartin Matuska     { 17, 18, 17,  9,  3,512, ZSTD_btultra2},  /* level 21.*/
4196*c03c5b1cSMartin Matuska     { 17, 18, 17, 11,  3,999, ZSTD_btultra2},  /* level 22.*/
4197*c03c5b1cSMartin Matuska },
4198*c03c5b1cSMartin Matuska {   /* for srcSize <= 16 KB */
4199*c03c5b1cSMartin Matuska     /* W,  C,  H,  S,  L, TL, strat */
4200*c03c5b1cSMartin Matuska     { 14, 12, 13,  1,  5,  1, ZSTD_fast    },  /* base for negative levels */
4201*c03c5b1cSMartin Matuska     { 14, 14, 15,  1,  5,  0, ZSTD_fast    },  /* level  1 */
4202*c03c5b1cSMartin Matuska     { 14, 14, 15,  1,  4,  0, ZSTD_fast    },  /* level  2 */
4203*c03c5b1cSMartin Matuska     { 14, 14, 15,  2,  4,  0, ZSTD_dfast   },  /* level  3 */
4204*c03c5b1cSMartin Matuska     { 14, 14, 14,  4,  4,  2, ZSTD_greedy  },  /* level  4 */
4205*c03c5b1cSMartin Matuska     { 14, 14, 14,  3,  4,  4, ZSTD_lazy    },  /* level  5.*/
4206*c03c5b1cSMartin Matuska     { 14, 14, 14,  4,  4,  8, ZSTD_lazy2   },  /* level  6 */
4207*c03c5b1cSMartin Matuska     { 14, 14, 14,  6,  4,  8, ZSTD_lazy2   },  /* level  7 */
4208*c03c5b1cSMartin Matuska     { 14, 14, 14,  8,  4,  8, ZSTD_lazy2   },  /* level  8.*/
4209*c03c5b1cSMartin Matuska     { 14, 15, 14,  5,  4,  8, ZSTD_btlazy2 },  /* level  9.*/
4210*c03c5b1cSMartin Matuska     { 14, 15, 14,  9,  4,  8, ZSTD_btlazy2 },  /* level 10.*/
4211*c03c5b1cSMartin Matuska     { 14, 15, 14,  3,  4, 12, ZSTD_btopt   },  /* level 11.*/
4212*c03c5b1cSMartin Matuska     { 14, 15, 14,  4,  3, 24, ZSTD_btopt   },  /* level 12.*/
4213*c03c5b1cSMartin Matuska     { 14, 15, 14,  5,  3, 32, ZSTD_btultra },  /* level 13.*/
4214*c03c5b1cSMartin Matuska     { 14, 15, 15,  6,  3, 64, ZSTD_btultra },  /* level 14.*/
4215*c03c5b1cSMartin Matuska     { 14, 15, 15,  7,  3,256, ZSTD_btultra },  /* level 15.*/
4216*c03c5b1cSMartin Matuska     { 14, 15, 15,  5,  3, 48, ZSTD_btultra2},  /* level 16.*/
4217*c03c5b1cSMartin Matuska     { 14, 15, 15,  6,  3,128, ZSTD_btultra2},  /* level 17.*/
4218*c03c5b1cSMartin Matuska     { 14, 15, 15,  7,  3,256, ZSTD_btultra2},  /* level 18.*/
4219*c03c5b1cSMartin Matuska     { 14, 15, 15,  8,  3,256, ZSTD_btultra2},  /* level 19.*/
4220*c03c5b1cSMartin Matuska     { 14, 15, 15,  8,  3,512, ZSTD_btultra2},  /* level 20.*/
4221*c03c5b1cSMartin Matuska     { 14, 15, 15,  9,  3,512, ZSTD_btultra2},  /* level 21.*/
4222*c03c5b1cSMartin Matuska     { 14, 15, 15, 10,  3,999, ZSTD_btultra2},  /* level 22.*/
4223*c03c5b1cSMartin Matuska },
4224*c03c5b1cSMartin Matuska };
4225*c03c5b1cSMartin Matuska 
4226*c03c5b1cSMartin Matuska /*! ZSTD_getCParams_internal() :
4227*c03c5b1cSMartin Matuska  * @return ZSTD_compressionParameters structure for a selected compression level, srcSize and dictSize.
4228*c03c5b1cSMartin Matuska  *  Note: srcSizeHint 0 means 0, use ZSTD_CONTENTSIZE_UNKNOWN for unknown.
4229*c03c5b1cSMartin Matuska  *        Use dictSize == 0 for unknown or unused. */
ZSTD_getCParams_internal(int compressionLevel,unsigned long long srcSizeHint,size_t dictSize)4230*c03c5b1cSMartin Matuska static ZSTD_compressionParameters ZSTD_getCParams_internal(int compressionLevel, unsigned long long srcSizeHint, size_t dictSize)
4231*c03c5b1cSMartin Matuska {
4232*c03c5b1cSMartin Matuska     int const unknown = srcSizeHint == ZSTD_CONTENTSIZE_UNKNOWN;
4233*c03c5b1cSMartin Matuska     size_t const addedSize = unknown && dictSize > 0 ? 500 : 0;
4234*c03c5b1cSMartin Matuska     U64 const rSize = unknown && dictSize == 0 ? ZSTD_CONTENTSIZE_UNKNOWN : srcSizeHint+dictSize+addedSize;
4235*c03c5b1cSMartin Matuska     U32 const tableID = (rSize <= 256 KB) + (rSize <= 128 KB) + (rSize <= 16 KB);
4236*c03c5b1cSMartin Matuska     int row = compressionLevel;
4237*c03c5b1cSMartin Matuska     DEBUGLOG(5, "ZSTD_getCParams_internal (cLevel=%i)", compressionLevel);
4238*c03c5b1cSMartin Matuska     if (compressionLevel == 0) row = ZSTD_CLEVEL_DEFAULT;   /* 0 == default */
4239*c03c5b1cSMartin Matuska     if (compressionLevel < 0) row = 0;   /* entry 0 is baseline for fast mode */
4240*c03c5b1cSMartin Matuska     if (compressionLevel > ZSTD_MAX_CLEVEL) row = ZSTD_MAX_CLEVEL;
4241*c03c5b1cSMartin Matuska     {   ZSTD_compressionParameters cp = ZSTD_defaultCParameters[tableID][row];
4242*c03c5b1cSMartin Matuska         if (compressionLevel < 0) cp.targetLength = (unsigned)(-compressionLevel);   /* acceleration factor */
4243*c03c5b1cSMartin Matuska         /* refine parameters based on srcSize & dictSize */
4244*c03c5b1cSMartin Matuska         return ZSTD_adjustCParams_internal(cp, srcSizeHint, dictSize);
4245*c03c5b1cSMartin Matuska     }
4246*c03c5b1cSMartin Matuska }
4247*c03c5b1cSMartin Matuska 
4248*c03c5b1cSMartin Matuska /*! ZSTD_getCParams() :
4249*c03c5b1cSMartin Matuska  * @return ZSTD_compressionParameters structure for a selected compression level, srcSize and dictSize.
4250*c03c5b1cSMartin Matuska  *  Size values are optional, provide 0 if not known or unused */
ZSTD_getCParams(int compressionLevel,unsigned long long srcSizeHint,size_t dictSize)4251*c03c5b1cSMartin Matuska ZSTD_compressionParameters ZSTD_getCParams(int compressionLevel, unsigned long long srcSizeHint, size_t dictSize)
4252*c03c5b1cSMartin Matuska {
4253*c03c5b1cSMartin Matuska     if (srcSizeHint == 0) srcSizeHint = ZSTD_CONTENTSIZE_UNKNOWN;
4254*c03c5b1cSMartin Matuska     return ZSTD_getCParams_internal(compressionLevel, srcSizeHint, dictSize);
4255*c03c5b1cSMartin Matuska }
4256*c03c5b1cSMartin Matuska 
4257*c03c5b1cSMartin Matuska /*! ZSTD_getParams() :
4258*c03c5b1cSMartin Matuska  *  same idea as ZSTD_getCParams()
4259*c03c5b1cSMartin Matuska  * @return a `ZSTD_parameters` structure (instead of `ZSTD_compressionParameters`).
4260*c03c5b1cSMartin Matuska  *  Fields of `ZSTD_frameParameters` are set to default values */
ZSTD_getParams_internal(int compressionLevel,unsigned long long srcSizeHint,size_t dictSize)4261*c03c5b1cSMartin Matuska static ZSTD_parameters ZSTD_getParams_internal(int compressionLevel, unsigned long long srcSizeHint, size_t dictSize) {
4262*c03c5b1cSMartin Matuska     ZSTD_parameters params;
4263*c03c5b1cSMartin Matuska     ZSTD_compressionParameters const cParams = ZSTD_getCParams_internal(compressionLevel, srcSizeHint, dictSize);
4264*c03c5b1cSMartin Matuska     DEBUGLOG(5, "ZSTD_getParams (cLevel=%i)", compressionLevel);
4265*c03c5b1cSMartin Matuska     memset(&params, 0, sizeof(params));
4266*c03c5b1cSMartin Matuska     params.cParams = cParams;
4267*c03c5b1cSMartin Matuska     params.fParams.contentSizeFlag = 1;
4268*c03c5b1cSMartin Matuska     return params;
4269*c03c5b1cSMartin Matuska }
4270*c03c5b1cSMartin Matuska 
4271*c03c5b1cSMartin Matuska /*! ZSTD_getParams() :
4272*c03c5b1cSMartin Matuska  *  same idea as ZSTD_getCParams()
4273*c03c5b1cSMartin Matuska  * @return a `ZSTD_parameters` structure (instead of `ZSTD_compressionParameters`).
4274*c03c5b1cSMartin Matuska  *  Fields of `ZSTD_frameParameters` are set to default values */
ZSTD_getParams(int compressionLevel,unsigned long long srcSizeHint,size_t dictSize)4275*c03c5b1cSMartin Matuska ZSTD_parameters ZSTD_getParams(int compressionLevel, unsigned long long srcSizeHint, size_t dictSize) {
4276*c03c5b1cSMartin Matuska     if (srcSizeHint == 0) srcSizeHint = ZSTD_CONTENTSIZE_UNKNOWN;
4277*c03c5b1cSMartin Matuska     return ZSTD_getParams_internal(compressionLevel, srcSizeHint, dictSize);
4278*c03c5b1cSMartin Matuska }
4279