1*a28cd43dSSascha Wildner /*
2*a28cd43dSSascha Wildner * Copyright (c) 2016-2020, Yann Collet, Facebook, Inc.
3*a28cd43dSSascha Wildner * All rights reserved.
4*a28cd43dSSascha Wildner *
5*a28cd43dSSascha Wildner * This source code is licensed under both the BSD-style license (found in the
6*a28cd43dSSascha Wildner * LICENSE file in the root directory of this source tree) and the GPLv2 (found
7*a28cd43dSSascha Wildner * in the COPYING file in the root directory of this source tree).
8*a28cd43dSSascha Wildner * You may select, at your option, one of the above-listed licenses.
9*a28cd43dSSascha Wildner */
10*a28cd43dSSascha Wildner
11*a28cd43dSSascha Wildner
12*a28cd43dSSascha Wildner /* *************************************
13*a28cd43dSSascha Wildner * Compiler Options
14*a28cd43dSSascha Wildner ***************************************/
15*a28cd43dSSascha Wildner #ifdef _MSC_VER /* Visual */
16*a28cd43dSSascha Wildner # pragma warning(disable : 4127) /* disable: C4127: conditional expression is constant */
17*a28cd43dSSascha Wildner # pragma warning(disable : 4204) /* non-constant aggregate initializer */
18*a28cd43dSSascha Wildner #endif
19*a28cd43dSSascha Wildner #if defined(__MINGW32__) && !defined(_POSIX_SOURCE)
20*a28cd43dSSascha Wildner # define _POSIX_SOURCE 1 /* disable %llu warnings with MinGW on Windows */
21*a28cd43dSSascha Wildner #endif
22*a28cd43dSSascha Wildner
23*a28cd43dSSascha Wildner /*-*************************************
24*a28cd43dSSascha Wildner * Includes
25*a28cd43dSSascha Wildner ***************************************/
26*a28cd43dSSascha Wildner #include "platform.h" /* Large Files support, SET_BINARY_MODE */
27*a28cd43dSSascha Wildner #include "util.h" /* UTIL_getFileSize, UTIL_isRegularFile, UTIL_isSameFile */
28*a28cd43dSSascha Wildner #include <stdio.h> /* fprintf, fopen, fread, _fileno, stdin, stdout */
29*a28cd43dSSascha Wildner #include <stdlib.h> /* malloc, free */
30*a28cd43dSSascha Wildner #include <string.h> /* strcmp, strlen */
31*a28cd43dSSascha Wildner #include <assert.h>
32*a28cd43dSSascha Wildner #include <errno.h> /* errno */
33*a28cd43dSSascha Wildner #include <limits.h> /* INT_MAX */
34*a28cd43dSSascha Wildner #include <signal.h>
35*a28cd43dSSascha Wildner #include "timefn.h" /* UTIL_getTime, UTIL_clockSpanMicro */
36*a28cd43dSSascha Wildner
37*a28cd43dSSascha Wildner #if defined (_MSC_VER)
38*a28cd43dSSascha Wildner # include <sys/stat.h>
39*a28cd43dSSascha Wildner # include <io.h>
40*a28cd43dSSascha Wildner #endif
41*a28cd43dSSascha Wildner
42*a28cd43dSSascha Wildner #include "../lib/common/mem.h" /* U32, U64 */
43*a28cd43dSSascha Wildner #include "fileio.h"
44*a28cd43dSSascha Wildner
45*a28cd43dSSascha Wildner #define ZSTD_STATIC_LINKING_ONLY /* ZSTD_magicNumber, ZSTD_frameHeaderSize_max */
46*a28cd43dSSascha Wildner #include "../lib/zstd.h"
47*a28cd43dSSascha Wildner #include "../lib/common/zstd_errors.h" /* ZSTD_error_frameParameter_windowTooLarge */
48*a28cd43dSSascha Wildner #include "../lib/compress/zstd_compress_internal.h"
49*a28cd43dSSascha Wildner
50*a28cd43dSSascha Wildner #if defined(ZSTD_GZCOMPRESS) || defined(ZSTD_GZDECOMPRESS)
51*a28cd43dSSascha Wildner # include <zlib.h>
52*a28cd43dSSascha Wildner # if !defined(z_const)
53*a28cd43dSSascha Wildner # define z_const
54*a28cd43dSSascha Wildner # endif
55*a28cd43dSSascha Wildner #endif
56*a28cd43dSSascha Wildner
57*a28cd43dSSascha Wildner #if defined(ZSTD_LZMACOMPRESS) || defined(ZSTD_LZMADECOMPRESS)
58*a28cd43dSSascha Wildner # include <lzma.h>
59*a28cd43dSSascha Wildner #endif
60*a28cd43dSSascha Wildner
61*a28cd43dSSascha Wildner #define LZ4_MAGICNUMBER 0x184D2204
62*a28cd43dSSascha Wildner #if defined(ZSTD_LZ4COMPRESS) || defined(ZSTD_LZ4DECOMPRESS)
63*a28cd43dSSascha Wildner # define LZ4F_ENABLE_OBSOLETE_ENUMS
64*a28cd43dSSascha Wildner # include <lz4frame.h>
65*a28cd43dSSascha Wildner # include <lz4.h>
66*a28cd43dSSascha Wildner #endif
67*a28cd43dSSascha Wildner
68*a28cd43dSSascha Wildner
69*a28cd43dSSascha Wildner /*-*************************************
70*a28cd43dSSascha Wildner * Constants
71*a28cd43dSSascha Wildner ***************************************/
/* Default window log for adaptive mode : 2^23 bytes = 8 MB */
#define ADAPT_WINDOWLOG_DEFAULT  23
/* Largest accepted dictionary size : protection against large input (attack scenario).
 * NOTE(review): relies on an `MB` unit macro provided by an included header. */
#define DICTSIZE_MAX             (32 MB)

#define FNSPACE                  30
76*a28cd43dSSascha Wildner
77*a28cd43dSSascha Wildner /*-*************************************
78*a28cd43dSSascha Wildner * Macros
79*a28cd43dSSascha Wildner ***************************************/
80*a28cd43dSSascha Wildner
81*a28cd43dSSascha Wildner struct FIO_display_prefs_s {
82*a28cd43dSSascha Wildner int displayLevel; /* 0 : no display; 1: errors; 2: + result + interaction + warnings; 3: + progression; 4: + information */
83*a28cd43dSSascha Wildner U32 noProgress;
84*a28cd43dSSascha Wildner };
85*a28cd43dSSascha Wildner
86*a28cd43dSSascha Wildner static FIO_display_prefs_t g_display_prefs = {2, 0};
87*a28cd43dSSascha Wildner
/* DISPLAY() : printf-style message written to stderr */
#define DISPLAY(...)         fprintf(stderr, __VA_ARGS__)
/* DISPLAYOUT() : printf-style message written to stdout */
#define DISPLAYOUT(...)      fprintf(stdout, __VA_ARGS__)
/* DISPLAYLEVEL() : DISPLAY() the message only when the current displayLevel is >= l.
 * Expands to a brace block, not to an expression. */
#define DISPLAYLEVEL(l, ...) {                      \
    if (g_display_prefs.displayLevel>=l) {          \
        DISPLAY(__VA_ARGS__);                       \
    } }
91*a28cd43dSSascha Wildner
92*a28cd43dSSascha Wildner static const U64 g_refreshRate = SEC_TO_MICRO / 6;
93*a28cd43dSSascha Wildner static UTIL_time_t g_displayClock = UTIL_TIME_INITIALIZER;
94*a28cd43dSSascha Wildner
/* READY_FOR_UPDATE() : true when progress is enabled
 * and more than g_refreshRate has elapsed since g_displayClock */
#define READY_FOR_UPDATE() \
    (!g_display_prefs.noProgress && UTIL_clockSpanMicro(g_displayClock) > g_refreshRate)

/* DELAY_NEXT_UPDATE() : restart the refresh timer from now */
#define DELAY_NEXT_UPDATE() { g_displayClock = UTIL_getTime(); }

/* DISPLAYUPDATE() : rate-limited DISPLAY(), intended for progress lines.
 * Prints only when displayLevel >= l and progress is enabled;
 * the rate limit is bypassed (and stderr flushed) when displayLevel >= 4. */
#define DISPLAYUPDATE(l, ...) {                                               \
        if (g_display_prefs.displayLevel>=l && !g_display_prefs.noProgress) { \
            if (READY_FOR_UPDATE() || (g_display_prefs.displayLevel>=4)) {    \
                DELAY_NEXT_UPDATE();                                          \
                DISPLAY(__VA_ARGS__);                                         \
                if (g_display_prefs.displayLevel>=4) fflush(stderr);          \
    }   }   }
104*a28cd43dSSascha Wildner
/* MIN() : smaller of two values. Each argument may be evaluated twice. */
#undef MIN  /* in case it would be already defined */
#define MIN(a,b)    (((a) < (b)) ? (a) : (b))
107*a28cd43dSSascha Wildner
108*a28cd43dSSascha Wildner
/* EXM_THROW() : fatal error.
 * Prints "zstd: error <error> : <formatted message>" at display level 1
 * (plus the source location at level 5), then terminates the process
 * with exit(error). Expands to a brace block. */
#define EXM_THROW(error, ...)                                                 \
{                                                                             \
    DISPLAYLEVEL(1, "zstd: ");                                                \
    DISPLAYLEVEL(5, "Error defined at %s, line %i : \n", __FILE__, __LINE__); \
    DISPLAYLEVEL(1, "error %i : ", error);                                    \
    DISPLAYLEVEL(1, __VA_ARGS__);                                             \
    DISPLAYLEVEL(1, " \n");                                                   \
    exit(error);                                                              \
}
118*a28cd43dSSascha Wildner
/* CHECK_V() : evaluate f, store its result into v,
 * and abort through EXM_THROW(11, ...) when ZSTD_isError(v).
 * The failing expression text is printed at display level 5.
 * Note : expands to two statements (assignment, then `if`), not to a single block. */
#define CHECK_V(v, f)                                \
    v = f;                                           \
    if (ZSTD_isError(v)) {                           \
        DISPLAYLEVEL(5, "%s \n", #f);                \
        EXM_THROW(11, "%s", ZSTD_getErrorName(v));   \
    }
/* CHECK() : same as CHECK_V(), using a scratch size_t when the result is not needed */
#define CHECK(f) { size_t err; CHECK_V(err, f); }
126*a28cd43dSSascha Wildner
127*a28cd43dSSascha Wildner
128*a28cd43dSSascha Wildner /*-************************************
129*a28cd43dSSascha Wildner * Signal (Ctrl-C trapping)
130*a28cd43dSSascha Wildner **************************************/
/* Path that INThandler() removes on SIGINT; NULL when no handler is armed */
static const char* g_artefact = NULL;
INThandler(int sig)132*a28cd43dSSascha Wildner static void INThandler(int sig)
133*a28cd43dSSascha Wildner {
134*a28cd43dSSascha Wildner assert(sig==SIGINT); (void)sig;
135*a28cd43dSSascha Wildner #if !defined(_MSC_VER)
136*a28cd43dSSascha Wildner signal(sig, SIG_IGN); /* this invocation generates a buggy warning in Visual Studio */
137*a28cd43dSSascha Wildner #endif
138*a28cd43dSSascha Wildner if (g_artefact) {
139*a28cd43dSSascha Wildner assert(UTIL_isRegularFile(g_artefact));
140*a28cd43dSSascha Wildner remove(g_artefact);
141*a28cd43dSSascha Wildner }
142*a28cd43dSSascha Wildner DISPLAY("\n");
143*a28cd43dSSascha Wildner exit(2);
144*a28cd43dSSascha Wildner }
addHandler(char const * dstFileName)145*a28cd43dSSascha Wildner static void addHandler(char const* dstFileName)
146*a28cd43dSSascha Wildner {
147*a28cd43dSSascha Wildner if (UTIL_isRegularFile(dstFileName)) {
148*a28cd43dSSascha Wildner g_artefact = dstFileName;
149*a28cd43dSSascha Wildner signal(SIGINT, INThandler);
150*a28cd43dSSascha Wildner } else {
151*a28cd43dSSascha Wildner g_artefact = NULL;
152*a28cd43dSSascha Wildner }
153*a28cd43dSSascha Wildner }
154*a28cd43dSSascha Wildner /* Idempotent */
clearHandler(void)155*a28cd43dSSascha Wildner static void clearHandler(void)
156*a28cd43dSSascha Wildner {
157*a28cd43dSSascha Wildner if (g_artefact) signal(SIGINT, SIG_DFL);
158*a28cd43dSSascha Wildner g_artefact = NULL;
159*a28cd43dSSascha Wildner }
160*a28cd43dSSascha Wildner
161*a28cd43dSSascha Wildner
162*a28cd43dSSascha Wildner /*-*********************************************************
163*a28cd43dSSascha Wildner * Termination signal trapping (Print debug stack trace)
164*a28cd43dSSascha Wildner ***********************************************************/
/* Step 1 : unless the build already set BACKTRACE_ENABLE,
 * force it off when compiling with address sanitizer. */
#if defined(__has_feature) && !defined(BACKTRACE_ENABLE) /* Clang compiler */
#  if (__has_feature(address_sanitizer))
#    define BACKTRACE_ENABLE 0
#  endif /* __has_feature(address_sanitizer) */
#elif defined(__SANITIZE_ADDRESS__) && !defined(BACKTRACE_ENABLE) /* GCC compiler */
#  define BACKTRACE_ENABLE 0
#endif

/* Step 2 : still undecided => automatic detector :
 * backtrace enabled by default on linux+glibc and osx, disabled elsewhere. */
#if !defined(BACKTRACE_ENABLE)
#  if (defined(__linux__) && (defined(__GLIBC__) && !defined(__UCLIBC__))) \
     || (defined(__APPLE__) && defined(__MACH__))
#    define BACKTRACE_ENABLE 1
#  else
#    define BACKTRACE_ENABLE 0
#  endif
#endif
182*a28cd43dSSascha Wildner
183*a28cd43dSSascha Wildner /* note : after this point, BACKTRACE_ENABLE is necessarily defined */
184*a28cd43dSSascha Wildner
185*a28cd43dSSascha Wildner
#if BACKTRACE_ENABLE

#include <execinfo.h>   /* backtrace, backtrace_symbols */

#define MAX_STACK_FRAMES    50

/** ABRThandler() :
 *  Handler for the fatal signals registered by FIO_addAbortHandler().
 *  Prints the signal name and, when available, a symbolic stack trace on
 *  stderr, then restores the default action and re-raises the signal so the
 *  process terminates the way it would have without this handler.
 *  The default action is always restored, even when no trace could be
 *  produced : returning normally from a handler for a fault such as SIGSEGV
 *  does not terminate the process. */
static void ABRThandler(int sig) {
    const char* name;
    void* addrlist[MAX_STACK_FRAMES];
    char** symbollist;
    int addrlen, i;

    switch (sig) {
        case SIGABRT: name = "SIGABRT"; break;
        case SIGFPE: name = "SIGFPE"; break;
        case SIGILL: name = "SIGILL"; break;
        case SIGINT: name = "SIGINT"; break;
        case SIGSEGV: name = "SIGSEGV"; break;
        case SIGBUS: name = "SIGBUS"; break;   /* registered by FIO_addAbortHandler() */
        default: name = "UNKNOWN";
    }

    DISPLAY("Caught %s signal, printing stack:\n", name);
    /* Retrieve current stack addresses. */
    addrlen = backtrace(addrlist, MAX_STACK_FRAMES);
    if (addrlen == 0) {
        DISPLAY("\n");
    } else {
        /* Create readable strings to each frame. */
        symbollist = backtrace_symbols(addrlist, addrlen);
        /* backtrace_symbols() allocates its result and may fail : skip the listing then. */
        if (symbollist != NULL) {
            /* Print the stack trace, excluding calls handling the signal. */
            for (i = ZSTD_START_SYMBOLLIST_FRAME; i < addrlen; i++) {
                DISPLAY("%s\n", symbollist[i]);
            }
            free(symbollist);
        }
    }
    /* Reset and raise the signal so default handler runs. */
    signal(sig, SIG_DFL);
    raise(sig);
}
#endif
226*a28cd43dSSascha Wildner
/** FIO_addAbortHandler() :
 *  When BACKTRACE_ENABLE is set, installs ABRThandler() for
 *  SIGABRT, SIGFPE, SIGILL, SIGSEGV and SIGBUS.
 *  Does nothing otherwise. */
void FIO_addAbortHandler(void)
{
#if BACKTRACE_ENABLE
    signal(SIGABRT, ABRThandler);
    signal(SIGFPE, ABRThandler);
    signal(SIGILL, ABRThandler);
    signal(SIGSEGV, ABRThandler);
    signal(SIGBUS, ABRThandler);
#endif
}
237*a28cd43dSSascha Wildner
238*a28cd43dSSascha Wildner
239*a28cd43dSSascha Wildner /*-************************************************************
240*a28cd43dSSascha Wildner * Avoid fseek()'s 2GiB barrier with MSVC, macOS, *BSD, MinGW
241*a28cd43dSSascha Wildner ***************************************************************/
/* LONG_SEEK / LONG_TELL : fseek()/ftell() equivalents using the widest
 * file offset the platform offers. Both follow the fseek()/ftell() contract :
 * LONG_SEEK returns 0 on success and non-zero on failure,
 * LONG_TELL returns the current offset, or -1 on failure. */
#if defined(_MSC_VER) && _MSC_VER >= 1400
#   define LONG_SEEK _fseeki64
#   define LONG_TELL _ftelli64
#elif !defined(__64BIT__) && (PLATFORM_POSIX_VERSION >= 200112L) /* No point defining Large file for 64 bit */
#  define LONG_SEEK fseeko
#  define LONG_TELL ftello
#elif defined(__MINGW32__) && !defined(__STRICT_ANSI__) && !defined(__NO_MINGW_LFS) && defined(__MSVCRT__)
#   define LONG_SEEK fseeko64
#   define LONG_TELL ftello64
#elif defined(_WIN32) && !defined(__DJGPP__)
#   include <windows.h>
    /* Win32 fallback : move the file pointer of the OS handle behind `file`. */
    static int LONG_SEEK(FILE* file, __int64 offset, int origin) {
        LARGE_INTEGER off;
        DWORD method;
        off.QuadPart = offset;
        switch (origin) {
            case SEEK_END: method = FILE_END; break;
            case SEEK_CUR: method = FILE_CURRENT; break;
            default:       method = FILE_BEGIN; break;
        }

        if (SetFilePointerEx((HANDLE) _get_osfhandle(_fileno(file)), off, NULL, method))
            return 0;
        return -1;
    }
    /* Win32 fallback : a zero-distance move from FILE_CURRENT reports the position. */
    static __int64 LONG_TELL(FILE* file) {
        LARGE_INTEGER off, newOff;
        off.QuadPart = 0;
        newOff.QuadPart = 0;
        /* report failure like ftell() does, instead of pretending to be at offset 0 */
        if (!SetFilePointerEx((HANDLE) _get_osfhandle(_fileno(file)), off, &newOff, FILE_CURRENT))
            return -1;
        return newOff.QuadPart;
    }
#else
#   define LONG_SEEK fseek
#   define LONG_TELL ftell
#endif
280*a28cd43dSSascha Wildner
281*a28cd43dSSascha Wildner
282*a28cd43dSSascha Wildner /*-*************************************
283*a28cd43dSSascha Wildner * Parameters: FIO_prefs_t
284*a28cd43dSSascha Wildner ***************************************/
285*a28cd43dSSascha Wildner
286*a28cd43dSSascha Wildner /* typedef'd to FIO_prefs_t within fileio.h */
287*a28cd43dSSascha Wildner struct FIO_prefs_s {
288*a28cd43dSSascha Wildner
289*a28cd43dSSascha Wildner /* Algorithm preferences */
290*a28cd43dSSascha Wildner FIO_compressionType_t compressionType;
291*a28cd43dSSascha Wildner U32 sparseFileSupport; /* 0: no sparse allowed; 1: auto (file yes, stdout no); 2: force sparse */
292*a28cd43dSSascha Wildner int dictIDFlag;
293*a28cd43dSSascha Wildner int checksumFlag;
294*a28cd43dSSascha Wildner int blockSize;
295*a28cd43dSSascha Wildner int overlapLog;
296*a28cd43dSSascha Wildner U32 adaptiveMode;
297*a28cd43dSSascha Wildner int rsyncable;
298*a28cd43dSSascha Wildner int minAdaptLevel;
299*a28cd43dSSascha Wildner int maxAdaptLevel;
300*a28cd43dSSascha Wildner int ldmFlag;
301*a28cd43dSSascha Wildner int ldmHashLog;
302*a28cd43dSSascha Wildner int ldmMinMatch;
303*a28cd43dSSascha Wildner int ldmBucketSizeLog;
304*a28cd43dSSascha Wildner int ldmHashRateLog;
305*a28cd43dSSascha Wildner size_t streamSrcSize;
306*a28cd43dSSascha Wildner size_t targetCBlockSize;
307*a28cd43dSSascha Wildner int srcSizeHint;
308*a28cd43dSSascha Wildner int testMode;
309*a28cd43dSSascha Wildner ZSTD_literalCompressionMode_e literalCompressionMode;
310*a28cd43dSSascha Wildner
311*a28cd43dSSascha Wildner /* IO preferences */
312*a28cd43dSSascha Wildner U32 removeSrcFile;
313*a28cd43dSSascha Wildner U32 overwrite;
314*a28cd43dSSascha Wildner
315*a28cd43dSSascha Wildner /* Computation resources preferences */
316*a28cd43dSSascha Wildner unsigned memLimit;
317*a28cd43dSSascha Wildner int nbWorkers;
318*a28cd43dSSascha Wildner
319*a28cd43dSSascha Wildner int excludeCompressedFiles;
320*a28cd43dSSascha Wildner int patchFromMode;
321*a28cd43dSSascha Wildner int contentSize;
322*a28cd43dSSascha Wildner };
323*a28cd43dSSascha Wildner
324*a28cd43dSSascha Wildner /*-*************************************
325*a28cd43dSSascha Wildner * Parameters: FIO_ctx_t
326*a28cd43dSSascha Wildner ***************************************/
327*a28cd43dSSascha Wildner
328*a28cd43dSSascha Wildner /* typedef'd to FIO_ctx_t within fileio.h */
struct FIO_ctx_s {

    /* file i/o info : describes the whole job */
    int nbFilesTotal;
    int hasStdinInput;       /* set to 1 when one of the input names is stdinmark */
    int hasStdoutOutput;

    /* file i/o state : counters, all starting at 0 */
    int currFileIdx;
    int nbFilesProcessed;
    size_t totalBytesInput;
    size_t totalBytesOutput;
};
342*a28cd43dSSascha Wildner
343*a28cd43dSSascha Wildner
344*a28cd43dSSascha Wildner /*-*************************************
345*a28cd43dSSascha Wildner * Parameters: Initialization
346*a28cd43dSSascha Wildner ***************************************/
347*a28cd43dSSascha Wildner
/* Sentinel values stored by FIO_createPreferences()
 * for parameters that have not been explicitly set */
#define FIO_OVERLAP_LOG_NOTSET  9999
#define FIO_LDM_PARAM_NOTSET    9999
350*a28cd43dSSascha Wildner
351*a28cd43dSSascha Wildner
FIO_createPreferences(void)352*a28cd43dSSascha Wildner FIO_prefs_t* FIO_createPreferences(void)
353*a28cd43dSSascha Wildner {
354*a28cd43dSSascha Wildner FIO_prefs_t* const ret = (FIO_prefs_t*)malloc(sizeof(FIO_prefs_t));
355*a28cd43dSSascha Wildner if (!ret) EXM_THROW(21, "Allocation error : not enough memory");
356*a28cd43dSSascha Wildner
357*a28cd43dSSascha Wildner ret->compressionType = FIO_zstdCompression;
358*a28cd43dSSascha Wildner ret->overwrite = 0;
359*a28cd43dSSascha Wildner ret->sparseFileSupport = ZSTD_SPARSE_DEFAULT;
360*a28cd43dSSascha Wildner ret->dictIDFlag = 1;
361*a28cd43dSSascha Wildner ret->checksumFlag = 1;
362*a28cd43dSSascha Wildner ret->removeSrcFile = 0;
363*a28cd43dSSascha Wildner ret->memLimit = 0;
364*a28cd43dSSascha Wildner ret->nbWorkers = 1;
365*a28cd43dSSascha Wildner ret->blockSize = 0;
366*a28cd43dSSascha Wildner ret->overlapLog = FIO_OVERLAP_LOG_NOTSET;
367*a28cd43dSSascha Wildner ret->adaptiveMode = 0;
368*a28cd43dSSascha Wildner ret->rsyncable = 0;
369*a28cd43dSSascha Wildner ret->minAdaptLevel = -50; /* initializing this value requires a constant, so ZSTD_minCLevel() doesn't work */
370*a28cd43dSSascha Wildner ret->maxAdaptLevel = 22; /* initializing this value requires a constant, so ZSTD_maxCLevel() doesn't work */
371*a28cd43dSSascha Wildner ret->ldmFlag = 0;
372*a28cd43dSSascha Wildner ret->ldmHashLog = 0;
373*a28cd43dSSascha Wildner ret->ldmMinMatch = 0;
374*a28cd43dSSascha Wildner ret->ldmBucketSizeLog = FIO_LDM_PARAM_NOTSET;
375*a28cd43dSSascha Wildner ret->ldmHashRateLog = FIO_LDM_PARAM_NOTSET;
376*a28cd43dSSascha Wildner ret->streamSrcSize = 0;
377*a28cd43dSSascha Wildner ret->targetCBlockSize = 0;
378*a28cd43dSSascha Wildner ret->srcSizeHint = 0;
379*a28cd43dSSascha Wildner ret->testMode = 0;
380*a28cd43dSSascha Wildner ret->literalCompressionMode = ZSTD_lcm_auto;
381*a28cd43dSSascha Wildner ret->excludeCompressedFiles = 0;
382*a28cd43dSSascha Wildner return ret;
383*a28cd43dSSascha Wildner }
384*a28cd43dSSascha Wildner
FIO_createContext(void)385*a28cd43dSSascha Wildner FIO_ctx_t* FIO_createContext(void)
386*a28cd43dSSascha Wildner {
387*a28cd43dSSascha Wildner FIO_ctx_t* const ret = (FIO_ctx_t*)malloc(sizeof(FIO_ctx_t));
388*a28cd43dSSascha Wildner if (!ret) EXM_THROW(21, "Allocation error : not enough memory");
389*a28cd43dSSascha Wildner
390*a28cd43dSSascha Wildner ret->currFileIdx = 0;
391*a28cd43dSSascha Wildner ret->hasStdinInput = 0;
392*a28cd43dSSascha Wildner ret->hasStdoutOutput = 0;
393*a28cd43dSSascha Wildner ret->nbFilesTotal = 1;
394*a28cd43dSSascha Wildner ret->nbFilesProcessed = 0;
395*a28cd43dSSascha Wildner ret->totalBytesInput = 0;
396*a28cd43dSSascha Wildner ret->totalBytesOutput = 0;
397*a28cd43dSSascha Wildner return ret;
398*a28cd43dSSascha Wildner }
399*a28cd43dSSascha Wildner
/** FIO_freePreferences() :
 *  Releases `prefs` with free(). */
void FIO_freePreferences(FIO_prefs_t* const prefs)
{
    free(prefs);
}
404*a28cd43dSSascha Wildner
/** FIO_freeContext() :
 *  Releases `fCtx` with free(). */
void FIO_freeContext(FIO_ctx_t* const fCtx)
{
    free(fCtx);
}
409*a28cd43dSSascha Wildner
410*a28cd43dSSascha Wildner
411*a28cd43dSSascha Wildner /*-*************************************
412*a28cd43dSSascha Wildner * Parameters: Display Options
413*a28cd43dSSascha Wildner ***************************************/
414*a28cd43dSSascha Wildner
FIO_setNotificationLevel(int level)415*a28cd43dSSascha Wildner void FIO_setNotificationLevel(int level) { g_display_prefs.displayLevel=level; }
416*a28cd43dSSascha Wildner
FIO_setNoProgress(unsigned noProgress)417*a28cd43dSSascha Wildner void FIO_setNoProgress(unsigned noProgress) { g_display_prefs.noProgress = noProgress; }
418*a28cd43dSSascha Wildner
419*a28cd43dSSascha Wildner
420*a28cd43dSSascha Wildner /*-*************************************
421*a28cd43dSSascha Wildner * Parameters: Setters
422*a28cd43dSSascha Wildner ***************************************/
423*a28cd43dSSascha Wildner
424*a28cd43dSSascha Wildner /* FIO_prefs_t functions */
425*a28cd43dSSascha Wildner
/** FIO_setCompressionType() :
 *  Stores `compressionType` into prefs->compressionType. */
void FIO_setCompressionType(FIO_prefs_t* const prefs, FIO_compressionType_t compressionType)
{
    prefs->compressionType = compressionType;
}
427*a28cd43dSSascha Wildner
/** FIO_overwriteMode() :
 *  Turns prefs->overwrite on (there is no way to turn it back off here). */
void FIO_overwriteMode(FIO_prefs_t* const prefs)
{
    prefs->overwrite = 1;
}
429*a28cd43dSSascha Wildner
/** FIO_setSparseWrite() :
 *  Stores `sparse` into prefs->sparseFileSupport
 *  (0: no sparse allowed; 1: auto; 2: force sparse). The value is not validated. */
void FIO_setSparseWrite(FIO_prefs_t* const prefs, unsigned sparse)
{
    prefs->sparseFileSupport = sparse;
}
431*a28cd43dSSascha Wildner
/** FIO_setDictIDFlag() :
 *  Stores `dictIDFlag` into prefs->dictIDFlag. */
void FIO_setDictIDFlag(FIO_prefs_t* const prefs, int dictIDFlag)
{
    prefs->dictIDFlag = dictIDFlag;
}
433*a28cd43dSSascha Wildner
/** FIO_setChecksumFlag() :
 *  Stores `checksumFlag` into prefs->checksumFlag. */
void FIO_setChecksumFlag(FIO_prefs_t* const prefs, int checksumFlag)
{
    prefs->checksumFlag = checksumFlag;
}
435*a28cd43dSSascha Wildner
/** FIO_setRemoveSrcFile() :
 *  Normalizes `flag` to 0 or 1 and stores it into prefs->removeSrcFile. */
void FIO_setRemoveSrcFile(FIO_prefs_t* const prefs, unsigned flag)
{
    prefs->removeSrcFile = (flag != 0);
}
437*a28cd43dSSascha Wildner
/** FIO_setMemLimit() :
 *  Stores `memLimit` into prefs->memLimit. */
void FIO_setMemLimit(FIO_prefs_t* const prefs, unsigned memLimit)
{
    prefs->memLimit = memLimit;
}
439*a28cd43dSSascha Wildner
/** FIO_setNbWorkers() :
 *  Stores `nbWorkers` into prefs->nbWorkers.
 *  In builds without ZSTD_MULTITHREAD, a positive value additionally
 *  triggers a level-2 note; the value is stored regardless. */
void FIO_setNbWorkers(FIO_prefs_t* const prefs, int nbWorkers)
{
#ifndef ZSTD_MULTITHREAD
    if (nbWorkers > 0) {
        DISPLAYLEVEL(2, "Note : multi-threading is disabled \n");
    }
#endif
    prefs->nbWorkers = nbWorkers;
}
446*a28cd43dSSascha Wildner
/** FIO_setExcludeCompressedFile() :
 *  Stores `excludeCompressedFiles` into prefs->excludeCompressedFiles. */
void FIO_setExcludeCompressedFile(FIO_prefs_t* const prefs, int excludeCompressedFiles)
{
    prefs->excludeCompressedFiles = excludeCompressedFiles;
}
448*a28cd43dSSascha Wildner
/** FIO_setBlockSize() :
 *  Stores `blockSize` into prefs->blockSize.
 *  Emits a level-2 message when a non-zero size is requested while
 *  prefs->nbWorkers is 0; the value is stored regardless. */
void FIO_setBlockSize(FIO_prefs_t* const prefs, int blockSize)
{
    if (blockSize != 0 && prefs->nbWorkers == 0) {
        DISPLAYLEVEL(2, "Setting block size is useless in single-thread mode \n");
    }
    prefs->blockSize = blockSize;
}
454*a28cd43dSSascha Wildner
/** FIO_setOverlapLog() :
 *  Stores `overlapLog` into prefs->overlapLog.
 *  Emits a level-2 message when a non-zero value is requested while
 *  prefs->nbWorkers is 0; the value is stored regardless. */
void FIO_setOverlapLog(FIO_prefs_t* const prefs, int overlapLog)
{
    if (overlapLog != 0 && prefs->nbWorkers == 0) {
        DISPLAYLEVEL(2, "Setting overlapLog is useless in single-thread mode \n");
    }
    prefs->overlapLog = overlapLog;
}
460*a28cd43dSSascha Wildner
/** FIO_setAdaptiveMode() :
 *  Stores `adapt` into prefs->adaptiveMode.
 *  Requesting it (adapt != 0) while prefs->nbWorkers is 0 is fatal :
 *  EXM_THROW() exits the process with code 1. */
void FIO_setAdaptiveMode(FIO_prefs_t* const prefs, unsigned adapt)
{
    if (adapt != 0 && prefs->nbWorkers == 0) {
        EXM_THROW(1, "Adaptive mode is not compatible with single thread mode \n");
    }
    prefs->adaptiveMode = adapt;
}
466*a28cd43dSSascha Wildner
/** FIO_setRsyncable() :
 *  Stores `rsyncable` into prefs->rsyncable.
 *  A positive value while prefs->nbWorkers is 0 is fatal :
 *  EXM_THROW() exits the process with code 1. */
void FIO_setRsyncable(FIO_prefs_t* const prefs, int rsyncable)
{
    if (rsyncable > 0 && prefs->nbWorkers == 0) {
        EXM_THROW(1, "Rsyncable mode is not compatible with single thread mode \n");
    }
    prefs->rsyncable = rsyncable;
}
472*a28cd43dSSascha Wildner
/** FIO_setStreamSrcSize() :
 *  Stores `streamSrcSize` into prefs->streamSrcSize. */
void FIO_setStreamSrcSize(FIO_prefs_t* const prefs, size_t streamSrcSize)
{
    prefs->streamSrcSize = streamSrcSize;
}
476*a28cd43dSSascha Wildner
/** FIO_setTargetCBlockSize() :
 *  Stores `targetCBlockSize` into prefs->targetCBlockSize. */
void FIO_setTargetCBlockSize(FIO_prefs_t* const prefs, size_t targetCBlockSize)
{
    prefs->targetCBlockSize = targetCBlockSize;
}
480*a28cd43dSSascha Wildner
/** FIO_setSrcSizeHint() :
 *  Stores `srcSizeHint` into prefs->srcSizeHint, which is an int :
 *  hints larger than INT_MAX are capped at INT_MAX. */
void FIO_setSrcSizeHint(FIO_prefs_t* const prefs, size_t srcSizeHint)
{
    size_t const hintMax = (size_t)INT_MAX;
    if (hintMax < srcSizeHint) {
        prefs->srcSizeHint = (int)hintMax;
    } else {
        prefs->srcSizeHint = (int)srcSizeHint;
    }
}
484*a28cd43dSSascha Wildner
/** FIO_setTestMode() :
 *  Normalizes `testMode` to 0 or 1 and stores it into prefs->testMode. */
void FIO_setTestMode(FIO_prefs_t* const prefs, int testMode)
{
    prefs->testMode = testMode ? 1 : 0;
}
488*a28cd43dSSascha Wildner
/** FIO_setLiteralCompressionMode() :
 *  Stores `mode` into prefs->literalCompressionMode. */
void FIO_setLiteralCompressionMode(FIO_prefs_t* const prefs,
                                   ZSTD_literalCompressionMode_e mode)
{
    prefs->literalCompressionMode = mode;
}
494*a28cd43dSSascha Wildner
/** FIO_setAdaptMin() :
 *  Stores `minCLevel` into prefs->minAdaptLevel.
 *  Unless built with ZSTD_NOCOMPRESS, asserts that the level
 *  is not below ZSTD_minCLevel(). */
void FIO_setAdaptMin(FIO_prefs_t* const prefs, int minCLevel)
{
#ifndef ZSTD_NOCOMPRESS
    assert(minCLevel >= ZSTD_minCLevel());
#endif
    prefs->minAdaptLevel = minCLevel;
}
502*a28cd43dSSascha Wildner
/** FIO_setAdaptMax() :
 *  Stores `maxCLevel` into prefs->maxAdaptLevel. The value is not range-checked. */
void FIO_setAdaptMax(FIO_prefs_t* const prefs, int maxCLevel)
{
    prefs->maxAdaptLevel = maxCLevel;
}
507*a28cd43dSSascha Wildner
/** FIO_setLdmFlag() :
 *  Normalizes `ldmFlag` to 0 or 1 and stores it into prefs->ldmFlag. */
void FIO_setLdmFlag(FIO_prefs_t* const prefs, unsigned ldmFlag)
{
    prefs->ldmFlag = (ldmFlag != 0);
}
511*a28cd43dSSascha Wildner
/** FIO_setLdmHashLog() :
 *  Stores `ldmHashLog` into prefs->ldmHashLog. */
void FIO_setLdmHashLog(FIO_prefs_t* const prefs, int ldmHashLog)
{
    prefs->ldmHashLog = ldmHashLog;
}
515*a28cd43dSSascha Wildner
/** FIO_setLdmMinMatch() :
 *  Stores `ldmMinMatch` into prefs->ldmMinMatch. */
void FIO_setLdmMinMatch(FIO_prefs_t* const prefs, int ldmMinMatch)
{
    prefs->ldmMinMatch = ldmMinMatch;
}
519*a28cd43dSSascha Wildner
/** FIO_setLdmBucketSizeLog() :
 *  Stores `ldmBucketSizeLog` into prefs->ldmBucketSizeLog,
 *  replacing the FIO_LDM_PARAM_NOTSET default. */
void FIO_setLdmBucketSizeLog(FIO_prefs_t* const prefs, int ldmBucketSizeLog)
{
    prefs->ldmBucketSizeLog = ldmBucketSizeLog;
}
523*a28cd43dSSascha Wildner
524*a28cd43dSSascha Wildner
/** FIO_setLdmHashRateLog() :
 *  Stores `ldmHashRateLog` into prefs->ldmHashRateLog,
 *  replacing the FIO_LDM_PARAM_NOTSET default. */
void FIO_setLdmHashRateLog(FIO_prefs_t* const prefs, int ldmHashRateLog)
{
    prefs->ldmHashRateLog = ldmHashRateLog;
}
528*a28cd43dSSascha Wildner
/** FIO_setPatchFromMode() :
 *  Normalizes `value` to 0 or 1 and stores it into prefs->patchFromMode. */
void FIO_setPatchFromMode(FIO_prefs_t* const prefs, int value)
{
    prefs->patchFromMode = value ? 1 : 0;
}
533*a28cd43dSSascha Wildner
/** FIO_setContentSize() :
 *  Normalizes `value` to 0 or 1 and stores it into prefs->contentSize. */
void FIO_setContentSize(FIO_prefs_t* const prefs, int value)
{
    prefs->contentSize = value ? 1 : 0;
}
538*a28cd43dSSascha Wildner
539*a28cd43dSSascha Wildner /* FIO_ctx_t functions */
540*a28cd43dSSascha Wildner
/* FIO_setHasStdoutOutput() :
 * Records in the context whether output goes to stdout; `value` is stored unchanged. */
void FIO_setHasStdoutOutput(FIO_ctx_t* const fCtx, int value)
{
    fCtx->hasStdoutOutput = value;
}
544*a28cd43dSSascha Wildner
/* FIO_setNbFilesTotal() :
 * Records the total number of files in the context; `value` is stored unchanged. */
void FIO_setNbFilesTotal(FIO_ctx_t* const fCtx, int value) {
    fCtx->nbFilesTotal = value;
}
549*a28cd43dSSascha Wildner
/* FIO_determineHasStdinInput() :
 * Scans the file name table for the stdin marker.
 * Sets `fCtx->hasStdinInput` to 1 on the first match;
 * the field is left untouched when no entry matches. */
void FIO_determineHasStdinInput(FIO_ctx_t* const fCtx, const FileNamesTable* const filenames)
{
    size_t idx;
    for (idx = 0; idx < filenames->tableSize; idx++) {
        if (strcmp(stdinmark, filenames->fileNames[idx]) != 0) continue;
        fCtx->hasStdinInput = 1;
        break;   /* one match is enough */
    }
}
559*a28cd43dSSascha Wildner
560*a28cd43dSSascha Wildner /*-*************************************
561*a28cd43dSSascha Wildner * Functions
562*a28cd43dSSascha Wildner ***************************************/
563*a28cd43dSSascha Wildner /** FIO_removeFile() :
564*a28cd43dSSascha Wildner * @result : Unlink `fileName`, even if it's read-only */
FIO_removeFile(const char * path)565*a28cd43dSSascha Wildner static int FIO_removeFile(const char* path)
566*a28cd43dSSascha Wildner {
567*a28cd43dSSascha Wildner stat_t statbuf;
568*a28cd43dSSascha Wildner if (!UTIL_stat(path, &statbuf)) {
569*a28cd43dSSascha Wildner DISPLAYLEVEL(2, "zstd: Failed to stat %s while trying to remove it\n", path);
570*a28cd43dSSascha Wildner return 0;
571*a28cd43dSSascha Wildner }
572*a28cd43dSSascha Wildner if (!UTIL_isRegularFileStat(&statbuf)) {
573*a28cd43dSSascha Wildner DISPLAYLEVEL(2, "zstd: Refusing to remove non-regular file %s\n", path);
574*a28cd43dSSascha Wildner return 0;
575*a28cd43dSSascha Wildner }
576*a28cd43dSSascha Wildner #if defined(_WIN32) || defined(WIN32)
577*a28cd43dSSascha Wildner /* windows doesn't allow remove read-only files,
578*a28cd43dSSascha Wildner * so try to make it writable first */
579*a28cd43dSSascha Wildner if (!(statbuf.st_mode & _S_IWRITE)) {
580*a28cd43dSSascha Wildner UTIL_chmod(path, &statbuf, _S_IWRITE);
581*a28cd43dSSascha Wildner }
582*a28cd43dSSascha Wildner #endif
583*a28cd43dSSascha Wildner return remove(path);
584*a28cd43dSSascha Wildner }
585*a28cd43dSSascha Wildner
586*a28cd43dSSascha Wildner /** FIO_openSrcFile() :
587*a28cd43dSSascha Wildner * condition : `srcFileName` must be non-NULL.
588*a28cd43dSSascha Wildner * @result : FILE* to `srcFileName`, or NULL if it fails */
FIO_openSrcFile(const char * srcFileName)589*a28cd43dSSascha Wildner static FILE* FIO_openSrcFile(const char* srcFileName)
590*a28cd43dSSascha Wildner {
591*a28cd43dSSascha Wildner stat_t statbuf;
592*a28cd43dSSascha Wildner assert(srcFileName != NULL);
593*a28cd43dSSascha Wildner if (!strcmp (srcFileName, stdinmark)) {
594*a28cd43dSSascha Wildner DISPLAYLEVEL(4,"Using stdin for input \n");
595*a28cd43dSSascha Wildner SET_BINARY_MODE(stdin);
596*a28cd43dSSascha Wildner return stdin;
597*a28cd43dSSascha Wildner }
598*a28cd43dSSascha Wildner
599*a28cd43dSSascha Wildner if (!UTIL_stat(srcFileName, &statbuf)) {
600*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "zstd: can't stat %s : %s -- ignored \n",
601*a28cd43dSSascha Wildner srcFileName, strerror(errno));
602*a28cd43dSSascha Wildner return NULL;
603*a28cd43dSSascha Wildner }
604*a28cd43dSSascha Wildner
605*a28cd43dSSascha Wildner if (!UTIL_isRegularFileStat(&statbuf)
606*a28cd43dSSascha Wildner && !UTIL_isFIFOStat(&statbuf)
607*a28cd43dSSascha Wildner ) {
608*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "zstd: %s is not a regular file -- ignored \n",
609*a28cd43dSSascha Wildner srcFileName);
610*a28cd43dSSascha Wildner return NULL;
611*a28cd43dSSascha Wildner }
612*a28cd43dSSascha Wildner
613*a28cd43dSSascha Wildner { FILE* const f = fopen(srcFileName, "rb");
614*a28cd43dSSascha Wildner if (f == NULL)
615*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "zstd: %s: %s \n", srcFileName, strerror(errno));
616*a28cd43dSSascha Wildner return f;
617*a28cd43dSSascha Wildner }
618*a28cd43dSSascha Wildner }
619*a28cd43dSSascha Wildner
620*a28cd43dSSascha Wildner /** FIO_openDstFile() :
621*a28cd43dSSascha Wildner * condition : `dstFileName` must be non-NULL.
622*a28cd43dSSascha Wildner * @result : FILE* to `dstFileName`, or NULL if it fails */
623*a28cd43dSSascha Wildner static FILE*
FIO_openDstFile(FIO_ctx_t * fCtx,FIO_prefs_t * const prefs,const char * srcFileName,const char * dstFileName)624*a28cd43dSSascha Wildner FIO_openDstFile(FIO_ctx_t* fCtx, FIO_prefs_t* const prefs,
625*a28cd43dSSascha Wildner const char* srcFileName, const char* dstFileName)
626*a28cd43dSSascha Wildner {
627*a28cd43dSSascha Wildner if (prefs->testMode) return NULL; /* do not open file in test mode */
628*a28cd43dSSascha Wildner
629*a28cd43dSSascha Wildner assert(dstFileName != NULL);
630*a28cd43dSSascha Wildner if (!strcmp (dstFileName, stdoutmark)) {
631*a28cd43dSSascha Wildner DISPLAYLEVEL(4,"Using stdout for output \n");
632*a28cd43dSSascha Wildner SET_BINARY_MODE(stdout);
633*a28cd43dSSascha Wildner if (prefs->sparseFileSupport == 1) {
634*a28cd43dSSascha Wildner prefs->sparseFileSupport = 0;
635*a28cd43dSSascha Wildner DISPLAYLEVEL(4, "Sparse File Support is automatically disabled on stdout ; try --sparse \n");
636*a28cd43dSSascha Wildner }
637*a28cd43dSSascha Wildner return stdout;
638*a28cd43dSSascha Wildner }
639*a28cd43dSSascha Wildner
640*a28cd43dSSascha Wildner /* ensure dst is not the same as src */
641*a28cd43dSSascha Wildner if (srcFileName != NULL && UTIL_isSameFile(srcFileName, dstFileName)) {
642*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "zstd: Refusing to open an output file which will overwrite the input file \n");
643*a28cd43dSSascha Wildner return NULL;
644*a28cd43dSSascha Wildner }
645*a28cd43dSSascha Wildner
646*a28cd43dSSascha Wildner if (prefs->sparseFileSupport == 1) {
647*a28cd43dSSascha Wildner prefs->sparseFileSupport = ZSTD_SPARSE_DEFAULT;
648*a28cd43dSSascha Wildner }
649*a28cd43dSSascha Wildner
650*a28cd43dSSascha Wildner if (UTIL_isRegularFile(dstFileName)) {
651*a28cd43dSSascha Wildner /* Check if destination file already exists */
652*a28cd43dSSascha Wildner FILE* const fCheck = fopen( dstFileName, "rb" );
653*a28cd43dSSascha Wildner #if !defined(_WIN32)
654*a28cd43dSSascha Wildner /* this test does not work on Windows :
655*a28cd43dSSascha Wildner * `NUL` and `nul` are detected as regular files */
656*a28cd43dSSascha Wildner if (!strcmp(dstFileName, nulmark)) {
657*a28cd43dSSascha Wildner EXM_THROW(40, "%s is unexpectedly categorized as a regular file",
658*a28cd43dSSascha Wildner dstFileName);
659*a28cd43dSSascha Wildner }
660*a28cd43dSSascha Wildner #endif
661*a28cd43dSSascha Wildner if (fCheck != NULL) { /* dst file exists, authorization prompt */
662*a28cd43dSSascha Wildner fclose(fCheck);
663*a28cd43dSSascha Wildner if (!prefs->overwrite) {
664*a28cd43dSSascha Wildner if (g_display_prefs.displayLevel <= 1) {
665*a28cd43dSSascha Wildner /* No interaction possible */
666*a28cd43dSSascha Wildner DISPLAY("zstd: %s already exists; not overwritten \n",
667*a28cd43dSSascha Wildner dstFileName);
668*a28cd43dSSascha Wildner return NULL;
669*a28cd43dSSascha Wildner }
670*a28cd43dSSascha Wildner DISPLAY("zstd: %s already exists; ", dstFileName);
671*a28cd43dSSascha Wildner if (UTIL_requireUserConfirmation("overwrite (y/n) ? ", "Not overwritten \n", "yY", fCtx->hasStdinInput))
672*a28cd43dSSascha Wildner return NULL;
673*a28cd43dSSascha Wildner }
674*a28cd43dSSascha Wildner /* need to unlink */
675*a28cd43dSSascha Wildner FIO_removeFile(dstFileName);
676*a28cd43dSSascha Wildner } }
677*a28cd43dSSascha Wildner
678*a28cd43dSSascha Wildner { FILE* const f = fopen( dstFileName, "wb" );
679*a28cd43dSSascha Wildner if (f == NULL) {
680*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "zstd: %s: %s\n", dstFileName, strerror(errno));
681*a28cd43dSSascha Wildner } else if (srcFileName != NULL
682*a28cd43dSSascha Wildner && strcmp (srcFileName, stdinmark)
683*a28cd43dSSascha Wildner && strcmp(dstFileName, nulmark) ) {
684*a28cd43dSSascha Wildner /* reduce rights on newly created dst file while compression is ongoing */
685*a28cd43dSSascha Wildner UTIL_chmod(dstFileName, NULL, 00600);
686*a28cd43dSSascha Wildner }
687*a28cd43dSSascha Wildner return f;
688*a28cd43dSSascha Wildner }
689*a28cd43dSSascha Wildner }
690*a28cd43dSSascha Wildner
691*a28cd43dSSascha Wildner /*! FIO_createDictBuffer() :
692*a28cd43dSSascha Wildner * creates a buffer, pointed by `*bufferPtr`,
693*a28cd43dSSascha Wildner * loads `filename` content into it, up to DICTSIZE_MAX bytes.
694*a28cd43dSSascha Wildner * @return : loaded size
695*a28cd43dSSascha Wildner * if fileName==NULL, returns 0 and a NULL pointer
696*a28cd43dSSascha Wildner */
FIO_createDictBuffer(void ** bufferPtr,const char * fileName,FIO_prefs_t * const prefs)697*a28cd43dSSascha Wildner static size_t FIO_createDictBuffer(void** bufferPtr, const char* fileName, FIO_prefs_t* const prefs)
698*a28cd43dSSascha Wildner {
699*a28cd43dSSascha Wildner FILE* fileHandle;
700*a28cd43dSSascha Wildner U64 fileSize;
701*a28cd43dSSascha Wildner
702*a28cd43dSSascha Wildner assert(bufferPtr != NULL);
703*a28cd43dSSascha Wildner *bufferPtr = NULL;
704*a28cd43dSSascha Wildner if (fileName == NULL) return 0;
705*a28cd43dSSascha Wildner
706*a28cd43dSSascha Wildner DISPLAYLEVEL(4,"Loading %s as dictionary \n", fileName);
707*a28cd43dSSascha Wildner fileHandle = fopen(fileName, "rb");
708*a28cd43dSSascha Wildner if (fileHandle==NULL) EXM_THROW(31, "%s: %s", fileName, strerror(errno));
709*a28cd43dSSascha Wildner
710*a28cd43dSSascha Wildner fileSize = UTIL_getFileSize(fileName);
711*a28cd43dSSascha Wildner {
712*a28cd43dSSascha Wildner size_t const dictSizeMax = prefs->patchFromMode ? prefs->memLimit : DICTSIZE_MAX;
713*a28cd43dSSascha Wildner if (fileSize > dictSizeMax) {
714*a28cd43dSSascha Wildner EXM_THROW(32, "Dictionary file %s is too large (> %u bytes)",
715*a28cd43dSSascha Wildner fileName, (unsigned)dictSizeMax); /* avoid extreme cases */
716*a28cd43dSSascha Wildner }
717*a28cd43dSSascha Wildner }
718*a28cd43dSSascha Wildner *bufferPtr = malloc((size_t)fileSize);
719*a28cd43dSSascha Wildner if (*bufferPtr==NULL) EXM_THROW(34, "%s", strerror(errno));
720*a28cd43dSSascha Wildner { size_t const readSize = fread(*bufferPtr, 1, (size_t)fileSize, fileHandle);
721*a28cd43dSSascha Wildner if (readSize != fileSize)
722*a28cd43dSSascha Wildner EXM_THROW(35, "Error reading dictionary file %s : %s",
723*a28cd43dSSascha Wildner fileName, strerror(errno));
724*a28cd43dSSascha Wildner }
725*a28cd43dSSascha Wildner fclose(fileHandle);
726*a28cd43dSSascha Wildner return (size_t)fileSize;
727*a28cd43dSSascha Wildner }
728*a28cd43dSSascha Wildner
729*a28cd43dSSascha Wildner
730*a28cd43dSSascha Wildner
731*a28cd43dSSascha Wildner /* FIO_checkFilenameCollisions() :
732*a28cd43dSSascha Wildner * Checks for and warns if there are any files that would have the same output path
733*a28cd43dSSascha Wildner */
FIO_checkFilenameCollisions(const char ** filenameTable,unsigned nbFiles)734*a28cd43dSSascha Wildner int FIO_checkFilenameCollisions(const char** filenameTable, unsigned nbFiles) {
735*a28cd43dSSascha Wildner const char **filenameTableSorted, *prevElem, *filename;
736*a28cd43dSSascha Wildner unsigned u;
737*a28cd43dSSascha Wildner
738*a28cd43dSSascha Wildner filenameTableSorted = (const char**) malloc(sizeof(char*) * nbFiles);
739*a28cd43dSSascha Wildner if (!filenameTableSorted) {
740*a28cd43dSSascha Wildner DISPLAY("Unable to malloc new str array, not checking for name collisions\n");
741*a28cd43dSSascha Wildner return 1;
742*a28cd43dSSascha Wildner }
743*a28cd43dSSascha Wildner
744*a28cd43dSSascha Wildner for (u = 0; u < nbFiles; ++u) {
745*a28cd43dSSascha Wildner filename = strrchr(filenameTable[u], PATH_SEP);
746*a28cd43dSSascha Wildner if (filename == NULL) {
747*a28cd43dSSascha Wildner filenameTableSorted[u] = filenameTable[u];
748*a28cd43dSSascha Wildner } else {
749*a28cd43dSSascha Wildner filenameTableSorted[u] = filename+1;
750*a28cd43dSSascha Wildner }
751*a28cd43dSSascha Wildner }
752*a28cd43dSSascha Wildner
753*a28cd43dSSascha Wildner qsort((void*)filenameTableSorted, nbFiles, sizeof(char*), UTIL_compareStr);
754*a28cd43dSSascha Wildner prevElem = filenameTableSorted[0];
755*a28cd43dSSascha Wildner for (u = 1; u < nbFiles; ++u) {
756*a28cd43dSSascha Wildner if (strcmp(prevElem, filenameTableSorted[u]) == 0) {
757*a28cd43dSSascha Wildner DISPLAY("WARNING: Two files have same filename: %s\n", prevElem);
758*a28cd43dSSascha Wildner }
759*a28cd43dSSascha Wildner prevElem = filenameTableSorted[u];
760*a28cd43dSSascha Wildner }
761*a28cd43dSSascha Wildner
762*a28cd43dSSascha Wildner free((void*)filenameTableSorted);
763*a28cd43dSSascha Wildner return 0;
764*a28cd43dSSascha Wildner }
765*a28cd43dSSascha Wildner
/* extractFilename() :
 * @return : pointer to the character following the last `separator` in `path`,
 *           or `path` itself when it contains no `separator`.
 *           The result points inside `path`; nothing is allocated. */
static const char*
extractFilename(const char* path, char separator)
{
    const char* const lastSep = strrchr(path, separator);
    return (lastSep != NULL) ? lastSep + 1 : path;
}
773*a28cd43dSSascha Wildner
/* FIO_createFilename_fromOutDir() :
 * Takes a source file name and specified output directory, and
 * allocates memory for and returns a pointer to final path :
 * `outDirName`, one separator (added only if `outDirName` does not already end with one),
 * then the last path component of `path`.
 * The buffer is zero-filled and sized to leave `suffixLen` spare bytes plus the
 * terminating zero after the name.
 * An empty `outDirName` yields the bare file name (no separator is prepended).
 * The returned buffer comes from calloc().
 * This function never returns an error (it may abort() in case of pb)
 */
static char*
FIO_createFilename_fromOutDir(const char* path, const char* outDirName, const size_t suffixLen)
{
#if defined(_MSC_VER) || defined(__MINGW32__) || defined (__MSVCRT__) /* windows support */
    char const separator = '\\';
#else
    char const separator = '/';
#endif
    size_t const dirLen = strlen(outDirName);
    const char* filenameStart;
    size_t nameLen;
    size_t pos;
    char* result;

    filenameStart = extractFilename(path, separator);
#if defined(_MSC_VER) || defined(__MINGW32__) || defined (__MSVCRT__) /* windows support */
    filenameStart = extractFilename(filenameStart, '/');  /* sometimes, '/' separator is also used on Windows (mingw+msys2) */
#endif
    nameLen = strlen(filenameStart);

    /* dir + optional separator + name + room for suffix + terminating zero */
    result = (char*) calloc(1, dirLen + 1 + nameLen + suffixLen + 1);
    if (!result) {
        EXM_THROW(30, "zstd: FIO_createFilename_fromOutDir: %s", strerror(errno));
    }

    memcpy(result, outDirName, dirLen);
    pos = dirLen;
    /* dirLen > 0 guards the [dirLen-1] access against an empty directory name */
    if (dirLen > 0 && outDirName[dirLen-1] != separator) {
        result[pos++] = separator;
    }
    memcpy(result + pos, filenameStart, nameLen);

    return result;
}
812*a28cd43dSSascha Wildner
/* FIO_highbit64() :
 * @return : zero-based position of the highest set bit of `v`
 *           (0 for v==1, 63 when the top bit of a 64-bit value is set).
 * note : only works for v > 0 !
 */
static unsigned FIO_highbit64(unsigned long long v)
{
    unsigned pos;
    assert(v != 0);
    /* count how many times v can be halved before only the top bit remains */
    for (pos = 0, v >>= 1; v != 0; v >>= 1) {
        pos++;
    }
    return pos;
}
825*a28cd43dSSascha Wildner
/* FIO_adjustMemLimitForPatchFromMode() :
 * Raises `prefs->memLimit` to the largest of its current value, `dictSize` and `maxSrcFileSize`.
 * Throws (EXM_THROW) when that maximum is UTIL_FILESIZE_UNKNOWN,
 * or when it exceeds the largest supported window size (1 << ZSTD_WINDOWLOG_MAX).
 */
static void FIO_adjustMemLimitForPatchFromMode(FIO_prefs_t* const prefs,
                                    unsigned long long const dictSize,
                                    unsigned long long const maxSrcFileSize)
{
    unsigned const windowSizeCap = (1U << ZSTD_WINDOWLOG_MAX);
    unsigned long long const required = MAX(prefs->memLimit, MAX(dictSize, maxSrcFileSize));

    if (required == UTIL_FILESIZE_UNKNOWN) {
        EXM_THROW(42, "Using --patch-from with stdin requires --stream-size");
    }
    assert(required != UTIL_FILESIZE_UNKNOWN);
    if (required > windowSizeCap) {
        EXM_THROW(42, "Can't handle files larger than %u GB\n", windowSizeCap/(1 GB));
    }
    FIO_setMemLimit(prefs, (unsigned)required);
}
839*a28cd43dSSascha Wildner
840*a28cd43dSSascha Wildner /* FIO_removeMultiFilesWarning() :
841*a28cd43dSSascha Wildner * Returns 1 if the console should abort, 0 if console should proceed.
842*a28cd43dSSascha Wildner * This function handles logic when processing multiple files with -o, displaying the appropriate warnings/prompts.
843*a28cd43dSSascha Wildner *
844*a28cd43dSSascha Wildner * If -f is specified, or there is just 1 file, zstd will always proceed as usual.
845*a28cd43dSSascha Wildner * If --rm is specified, there will be a prompt asking for user confirmation.
846*a28cd43dSSascha Wildner * If -f is specified with --rm, zstd will proceed as usual
847*a28cd43dSSascha Wildner * If -q is specified with --rm, zstd will abort pre-emptively
848*a28cd43dSSascha Wildner * If neither flag is specified, zstd will prompt the user for confirmation to proceed.
849*a28cd43dSSascha Wildner * If --rm is not specified, then zstd will print a warning to the user (which can be silenced with -q).
850*a28cd43dSSascha Wildner * However, if the output is stdout, we will always abort rather than displaying the warning prompt.
851*a28cd43dSSascha Wildner */
FIO_removeMultiFilesWarning(FIO_ctx_t * const fCtx,const FIO_prefs_t * const prefs,const char * outFileName,int displayLevelCutoff)852*a28cd43dSSascha Wildner static int FIO_removeMultiFilesWarning(FIO_ctx_t* const fCtx, const FIO_prefs_t* const prefs, const char* outFileName, int displayLevelCutoff)
853*a28cd43dSSascha Wildner {
854*a28cd43dSSascha Wildner int error = 0;
855*a28cd43dSSascha Wildner if (fCtx->nbFilesTotal > 1 && !prefs->overwrite) {
856*a28cd43dSSascha Wildner if (g_display_prefs.displayLevel <= displayLevelCutoff) {
857*a28cd43dSSascha Wildner if (prefs->removeSrcFile) {
858*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "zstd: Aborting... not deleting files and processing into dst: %s", outFileName);
859*a28cd43dSSascha Wildner error = 1;
860*a28cd43dSSascha Wildner }
861*a28cd43dSSascha Wildner } else {
862*a28cd43dSSascha Wildner if (!strcmp(outFileName, stdoutmark)) {
863*a28cd43dSSascha Wildner DISPLAYLEVEL(2, "zstd: WARNING: all input files will be processed and concatenated into stdout. ");
864*a28cd43dSSascha Wildner } else {
865*a28cd43dSSascha Wildner DISPLAYLEVEL(2, "zstd: WARNING: all input files will be processed and concatenated into a single output file: %s ", outFileName);
866*a28cd43dSSascha Wildner }
867*a28cd43dSSascha Wildner DISPLAYLEVEL(2, "\nThe concatenated output CANNOT regenerate the original directory tree. ")
868*a28cd43dSSascha Wildner if (prefs->removeSrcFile) {
869*a28cd43dSSascha Wildner if (fCtx->hasStdoutOutput) {
870*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "\nAborting. Use -f if you really want to delete the files and output to stdout");
871*a28cd43dSSascha Wildner error = 1;
872*a28cd43dSSascha Wildner } else {
873*a28cd43dSSascha Wildner error = g_display_prefs.displayLevel > displayLevelCutoff && UTIL_requireUserConfirmation("This is a destructive operation. Proceed? (y/n): ", "Aborting...", "yY", fCtx->hasStdinInput);
874*a28cd43dSSascha Wildner }
875*a28cd43dSSascha Wildner }
876*a28cd43dSSascha Wildner }
877*a28cd43dSSascha Wildner DISPLAY("\n");
878*a28cd43dSSascha Wildner }
879*a28cd43dSSascha Wildner return error;
880*a28cd43dSSascha Wildner }
881*a28cd43dSSascha Wildner
882*a28cd43dSSascha Wildner #ifndef ZSTD_NOCOMPRESS
883*a28cd43dSSascha Wildner
884*a28cd43dSSascha Wildner /* **********************************************************************
885*a28cd43dSSascha Wildner * Compression
886*a28cd43dSSascha Wildner ************************************************************************/
887*a28cd43dSSascha Wildner typedef struct {
888*a28cd43dSSascha Wildner FILE* srcFile;
889*a28cd43dSSascha Wildner FILE* dstFile;
890*a28cd43dSSascha Wildner void* srcBuffer;
891*a28cd43dSSascha Wildner size_t srcBufferSize;
892*a28cd43dSSascha Wildner void* dstBuffer;
893*a28cd43dSSascha Wildner size_t dstBufferSize;
894*a28cd43dSSascha Wildner void* dictBuffer;
895*a28cd43dSSascha Wildner size_t dictBufferSize;
896*a28cd43dSSascha Wildner const char* dictFileName;
897*a28cd43dSSascha Wildner ZSTD_CStream* cctx;
898*a28cd43dSSascha Wildner } cRess_t;
899*a28cd43dSSascha Wildner
/* FIO_adjustParamsForPatchFromMode() :
 * Tunes preferences and compression parameters for patch-from mode :
 * - raises the memory limit so it covers the dictionary and the source
 *   (see FIO_adjustMemLimitForPatchFromMode(), which may throw),
 * - sets `comprParams->windowLog` so the window covers `maxSrcFileSize`,
 *   clamped to [ZSTD_WINDOWLOG_MIN, ZSTD_WINDOWLOG_MAX],
 * - enables long distance matching when the file window log exceeds the
 *   cycle log of the parameters selected for `cLevel`,
 * - displays tuning hints when the selected strategy is ZSTD_btopt or stronger.
 */
static void FIO_adjustParamsForPatchFromMode(FIO_prefs_t* const prefs,
                                    ZSTD_compressionParameters* comprParams,
                                    unsigned long long const dictSize,
                                    unsigned long long const maxSrcFileSize,
                                    int cLevel)
{
    unsigned const fileWindowLog = FIO_highbit64(maxSrcFileSize) + 1;
    ZSTD_compressionParameters const cParams = ZSTD_getCParams(cLevel, (size_t)maxSrcFileSize, (size_t)dictSize);
    FIO_adjustMemLimitForPatchFromMode(prefs, dictSize, maxSrcFileSize);
    if (fileWindowLog > ZSTD_WINDOWLOG_MAX) {
        DISPLAYLEVEL(1, "Max window log exceeded by file (compression ratio will suffer)\n");
    }
    /* A small source file would otherwise produce a non-zero windowLog below
     * the library minimum, which is not a valid explicit parameter value. */
    comprParams->windowLog = MAX(ZSTD_WINDOWLOG_MIN, MIN(ZSTD_WINDOWLOG_MAX, fileWindowLog));
    if (fileWindowLog > ZSTD_cycleLog(cParams.chainLog, cParams.strategy)) {
        if (!prefs->ldmFlag) {
            DISPLAYLEVEL(1, "long mode automatically triggered\n");
        }
        FIO_setLdmFlag(prefs, 1);
    }
    if (cParams.strategy >= ZSTD_btopt) {
        DISPLAYLEVEL(1, "[Optimal parser notes] Consider the following to improve patch size at the cost of speed:\n");
        DISPLAYLEVEL(1, "- Use --single-thread mode in the zstd cli\n");
        DISPLAYLEVEL(1, "- Set a larger targetLength (eg. --zstd=targetLength=4096)\n");
        DISPLAYLEVEL(1, "- Set a larger chainLog (eg. --zstd=chainLog=%u)\n", ZSTD_CHAINLOG_MAX);
        DISPLAYLEVEL(1, "Also consider playing around with searchLog and hashLog\n");
    }
}
925*a28cd43dSSascha Wildner
FIO_createCResources(FIO_prefs_t * const prefs,const char * dictFileName,unsigned long long const maxSrcFileSize,int cLevel,ZSTD_compressionParameters comprParams)926*a28cd43dSSascha Wildner static cRess_t FIO_createCResources(FIO_prefs_t* const prefs,
927*a28cd43dSSascha Wildner const char* dictFileName, unsigned long long const maxSrcFileSize,
928*a28cd43dSSascha Wildner int cLevel, ZSTD_compressionParameters comprParams) {
929*a28cd43dSSascha Wildner cRess_t ress;
930*a28cd43dSSascha Wildner memset(&ress, 0, sizeof(ress));
931*a28cd43dSSascha Wildner
932*a28cd43dSSascha Wildner DISPLAYLEVEL(6, "FIO_createCResources \n");
933*a28cd43dSSascha Wildner ress.cctx = ZSTD_createCCtx();
934*a28cd43dSSascha Wildner if (ress.cctx == NULL)
935*a28cd43dSSascha Wildner EXM_THROW(30, "allocation error (%s): can't create ZSTD_CCtx",
936*a28cd43dSSascha Wildner strerror(errno));
937*a28cd43dSSascha Wildner ress.srcBufferSize = ZSTD_CStreamInSize();
938*a28cd43dSSascha Wildner ress.srcBuffer = malloc(ress.srcBufferSize);
939*a28cd43dSSascha Wildner ress.dstBufferSize = ZSTD_CStreamOutSize();
940*a28cd43dSSascha Wildner
941*a28cd43dSSascha Wildner /* need to update memLimit before calling createDictBuffer
942*a28cd43dSSascha Wildner * because of memLimit check inside it */
943*a28cd43dSSascha Wildner if (prefs->patchFromMode) {
944*a28cd43dSSascha Wildner unsigned long long const ssSize = (unsigned long long)prefs->streamSrcSize;
945*a28cd43dSSascha Wildner FIO_adjustParamsForPatchFromMode(prefs, &comprParams, UTIL_getFileSize(dictFileName), ssSize > 0 ? ssSize : maxSrcFileSize, cLevel);
946*a28cd43dSSascha Wildner }
947*a28cd43dSSascha Wildner ress.dstBuffer = malloc(ress.dstBufferSize);
948*a28cd43dSSascha Wildner ress.dictBufferSize = FIO_createDictBuffer(&ress.dictBuffer, dictFileName, prefs); /* works with dictFileName==NULL */
949*a28cd43dSSascha Wildner if (!ress.srcBuffer || !ress.dstBuffer)
950*a28cd43dSSascha Wildner EXM_THROW(31, "allocation error : not enough memory");
951*a28cd43dSSascha Wildner
952*a28cd43dSSascha Wildner /* Advanced parameters, including dictionary */
953*a28cd43dSSascha Wildner if (dictFileName && (ress.dictBuffer==NULL))
954*a28cd43dSSascha Wildner EXM_THROW(32, "allocation error : can't create dictBuffer");
955*a28cd43dSSascha Wildner ress.dictFileName = dictFileName;
956*a28cd43dSSascha Wildner
957*a28cd43dSSascha Wildner if (prefs->adaptiveMode && !prefs->ldmFlag && !comprParams.windowLog)
958*a28cd43dSSascha Wildner comprParams.windowLog = ADAPT_WINDOWLOG_DEFAULT;
959*a28cd43dSSascha Wildner
960*a28cd43dSSascha Wildner CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_contentSizeFlag, prefs->contentSize) ); /* always enable content size when available (note: supposed to be default) */
961*a28cd43dSSascha Wildner CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_dictIDFlag, prefs->dictIDFlag) );
962*a28cd43dSSascha Wildner CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_checksumFlag, prefs->checksumFlag) );
963*a28cd43dSSascha Wildner /* compression level */
964*a28cd43dSSascha Wildner CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_compressionLevel, cLevel) );
965*a28cd43dSSascha Wildner /* max compressed block size */
966*a28cd43dSSascha Wildner CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_targetCBlockSize, (int)prefs->targetCBlockSize) );
967*a28cd43dSSascha Wildner /* source size hint */
968*a28cd43dSSascha Wildner CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_srcSizeHint, (int)prefs->srcSizeHint) );
969*a28cd43dSSascha Wildner /* long distance matching */
970*a28cd43dSSascha Wildner CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_enableLongDistanceMatching, prefs->ldmFlag) );
971*a28cd43dSSascha Wildner CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_ldmHashLog, prefs->ldmHashLog) );
972*a28cd43dSSascha Wildner CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_ldmMinMatch, prefs->ldmMinMatch) );
973*a28cd43dSSascha Wildner if (prefs->ldmBucketSizeLog != FIO_LDM_PARAM_NOTSET) {
974*a28cd43dSSascha Wildner CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_ldmBucketSizeLog, prefs->ldmBucketSizeLog) );
975*a28cd43dSSascha Wildner }
976*a28cd43dSSascha Wildner if (prefs->ldmHashRateLog != FIO_LDM_PARAM_NOTSET) {
977*a28cd43dSSascha Wildner CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_ldmHashRateLog, prefs->ldmHashRateLog) );
978*a28cd43dSSascha Wildner }
979*a28cd43dSSascha Wildner /* compression parameters */
980*a28cd43dSSascha Wildner CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_windowLog, (int)comprParams.windowLog) );
981*a28cd43dSSascha Wildner CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_chainLog, (int)comprParams.chainLog) );
982*a28cd43dSSascha Wildner CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_hashLog, (int)comprParams.hashLog) );
983*a28cd43dSSascha Wildner CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_searchLog, (int)comprParams.searchLog) );
984*a28cd43dSSascha Wildner CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_minMatch, (int)comprParams.minMatch) );
985*a28cd43dSSascha Wildner CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_targetLength, (int)comprParams.targetLength) );
986*a28cd43dSSascha Wildner CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_strategy, comprParams.strategy) );
987*a28cd43dSSascha Wildner CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_literalCompressionMode, (int)prefs->literalCompressionMode) );
988*a28cd43dSSascha Wildner CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_enableDedicatedDictSearch, 1) );
989*a28cd43dSSascha Wildner /* multi-threading */
990*a28cd43dSSascha Wildner #ifdef ZSTD_MULTITHREAD
991*a28cd43dSSascha Wildner DISPLAYLEVEL(5,"set nb workers = %u \n", prefs->nbWorkers);
992*a28cd43dSSascha Wildner CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_nbWorkers, prefs->nbWorkers) );
993*a28cd43dSSascha Wildner CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_jobSize, prefs->blockSize) );
994*a28cd43dSSascha Wildner if (prefs->overlapLog != FIO_OVERLAP_LOG_NOTSET) {
995*a28cd43dSSascha Wildner DISPLAYLEVEL(3,"set overlapLog = %u \n", prefs->overlapLog);
996*a28cd43dSSascha Wildner CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_overlapLog, prefs->overlapLog) );
997*a28cd43dSSascha Wildner }
998*a28cd43dSSascha Wildner CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_rsyncable, prefs->rsyncable) );
999*a28cd43dSSascha Wildner #endif
1000*a28cd43dSSascha Wildner /* dictionary */
1001*a28cd43dSSascha Wildner if (prefs->patchFromMode) {
1002*a28cd43dSSascha Wildner CHECK( ZSTD_CCtx_refPrefix(ress.cctx, ress.dictBuffer, ress.dictBufferSize) );
1003*a28cd43dSSascha Wildner } else {
1004*a28cd43dSSascha Wildner CHECK( ZSTD_CCtx_loadDictionary(ress.cctx, ress.dictBuffer, ress.dictBufferSize) );
1005*a28cd43dSSascha Wildner }
1006*a28cd43dSSascha Wildner
1007*a28cd43dSSascha Wildner return ress;
1008*a28cd43dSSascha Wildner }
1009*a28cd43dSSascha Wildner
FIO_freeCResources(const cRess_t * const ress)1010*a28cd43dSSascha Wildner static void FIO_freeCResources(const cRess_t* const ress)
1011*a28cd43dSSascha Wildner {
1012*a28cd43dSSascha Wildner free(ress->srcBuffer);
1013*a28cd43dSSascha Wildner free(ress->dstBuffer);
1014*a28cd43dSSascha Wildner free(ress->dictBuffer);
1015*a28cd43dSSascha Wildner ZSTD_freeCStream(ress->cctx); /* never fails */
1016*a28cd43dSSascha Wildner }
1017*a28cd43dSSascha Wildner
1018*a28cd43dSSascha Wildner
1019*a28cd43dSSascha Wildner #ifdef ZSTD_GZCOMPRESS
1020*a28cd43dSSascha Wildner static unsigned long long
FIO_compressGzFrame(const cRess_t * ress,const char * srcFileName,U64 const srcFileSize,int compressionLevel,U64 * readsize)1021*a28cd43dSSascha Wildner FIO_compressGzFrame(const cRess_t* ress, /* buffers & handlers are used, but not changed */
1022*a28cd43dSSascha Wildner const char* srcFileName, U64 const srcFileSize,
1023*a28cd43dSSascha Wildner int compressionLevel, U64* readsize)
1024*a28cd43dSSascha Wildner {
1025*a28cd43dSSascha Wildner unsigned long long inFileSize = 0, outFileSize = 0;
1026*a28cd43dSSascha Wildner z_stream strm;
1027*a28cd43dSSascha Wildner
1028*a28cd43dSSascha Wildner if (compressionLevel > Z_BEST_COMPRESSION)
1029*a28cd43dSSascha Wildner compressionLevel = Z_BEST_COMPRESSION;
1030*a28cd43dSSascha Wildner
1031*a28cd43dSSascha Wildner strm.zalloc = Z_NULL;
1032*a28cd43dSSascha Wildner strm.zfree = Z_NULL;
1033*a28cd43dSSascha Wildner strm.opaque = Z_NULL;
1034*a28cd43dSSascha Wildner
1035*a28cd43dSSascha Wildner { int const ret = deflateInit2(&strm, compressionLevel, Z_DEFLATED,
1036*a28cd43dSSascha Wildner 15 /* maxWindowLogSize */ + 16 /* gzip only */,
1037*a28cd43dSSascha Wildner 8, Z_DEFAULT_STRATEGY); /* see http://www.zlib.net/manual.html */
1038*a28cd43dSSascha Wildner if (ret != Z_OK) {
1039*a28cd43dSSascha Wildner EXM_THROW(71, "zstd: %s: deflateInit2 error %d \n", srcFileName, ret);
1040*a28cd43dSSascha Wildner } }
1041*a28cd43dSSascha Wildner
1042*a28cd43dSSascha Wildner strm.next_in = 0;
1043*a28cd43dSSascha Wildner strm.avail_in = 0;
1044*a28cd43dSSascha Wildner strm.next_out = (Bytef*)ress->dstBuffer;
1045*a28cd43dSSascha Wildner strm.avail_out = (uInt)ress->dstBufferSize;
1046*a28cd43dSSascha Wildner
1047*a28cd43dSSascha Wildner while (1) {
1048*a28cd43dSSascha Wildner int ret;
1049*a28cd43dSSascha Wildner if (strm.avail_in == 0) {
1050*a28cd43dSSascha Wildner size_t const inSize = fread(ress->srcBuffer, 1, ress->srcBufferSize, ress->srcFile);
1051*a28cd43dSSascha Wildner if (inSize == 0) break;
1052*a28cd43dSSascha Wildner inFileSize += inSize;
1053*a28cd43dSSascha Wildner strm.next_in = (z_const unsigned char*)ress->srcBuffer;
1054*a28cd43dSSascha Wildner strm.avail_in = (uInt)inSize;
1055*a28cd43dSSascha Wildner }
1056*a28cd43dSSascha Wildner ret = deflate(&strm, Z_NO_FLUSH);
1057*a28cd43dSSascha Wildner if (ret != Z_OK)
1058*a28cd43dSSascha Wildner EXM_THROW(72, "zstd: %s: deflate error %d \n", srcFileName, ret);
1059*a28cd43dSSascha Wildner { size_t const cSize = ress->dstBufferSize - strm.avail_out;
1060*a28cd43dSSascha Wildner if (cSize) {
1061*a28cd43dSSascha Wildner if (fwrite(ress->dstBuffer, 1, cSize, ress->dstFile) != cSize)
1062*a28cd43dSSascha Wildner EXM_THROW(73, "Write error : cannot write to output file : %s ", strerror(errno));
1063*a28cd43dSSascha Wildner outFileSize += cSize;
1064*a28cd43dSSascha Wildner strm.next_out = (Bytef*)ress->dstBuffer;
1065*a28cd43dSSascha Wildner strm.avail_out = (uInt)ress->dstBufferSize;
1066*a28cd43dSSascha Wildner } }
1067*a28cd43dSSascha Wildner if (srcFileSize == UTIL_FILESIZE_UNKNOWN) {
1068*a28cd43dSSascha Wildner DISPLAYUPDATE(2, "\rRead : %u MB ==> %.2f%% ",
1069*a28cd43dSSascha Wildner (unsigned)(inFileSize>>20),
1070*a28cd43dSSascha Wildner (double)outFileSize/inFileSize*100)
1071*a28cd43dSSascha Wildner } else {
1072*a28cd43dSSascha Wildner DISPLAYUPDATE(2, "\rRead : %u / %u MB ==> %.2f%% ",
1073*a28cd43dSSascha Wildner (unsigned)(inFileSize>>20), (unsigned)(srcFileSize>>20),
1074*a28cd43dSSascha Wildner (double)outFileSize/inFileSize*100);
1075*a28cd43dSSascha Wildner } }
1076*a28cd43dSSascha Wildner
1077*a28cd43dSSascha Wildner while (1) {
1078*a28cd43dSSascha Wildner int const ret = deflate(&strm, Z_FINISH);
1079*a28cd43dSSascha Wildner { size_t const cSize = ress->dstBufferSize - strm.avail_out;
1080*a28cd43dSSascha Wildner if (cSize) {
1081*a28cd43dSSascha Wildner if (fwrite(ress->dstBuffer, 1, cSize, ress->dstFile) != cSize)
1082*a28cd43dSSascha Wildner EXM_THROW(75, "Write error : %s ", strerror(errno));
1083*a28cd43dSSascha Wildner outFileSize += cSize;
1084*a28cd43dSSascha Wildner strm.next_out = (Bytef*)ress->dstBuffer;
1085*a28cd43dSSascha Wildner strm.avail_out = (uInt)ress->dstBufferSize;
1086*a28cd43dSSascha Wildner } }
1087*a28cd43dSSascha Wildner if (ret == Z_STREAM_END) break;
1088*a28cd43dSSascha Wildner if (ret != Z_BUF_ERROR)
1089*a28cd43dSSascha Wildner EXM_THROW(77, "zstd: %s: deflate error %d \n", srcFileName, ret);
1090*a28cd43dSSascha Wildner }
1091*a28cd43dSSascha Wildner
1092*a28cd43dSSascha Wildner { int const ret = deflateEnd(&strm);
1093*a28cd43dSSascha Wildner if (ret != Z_OK) {
1094*a28cd43dSSascha Wildner EXM_THROW(79, "zstd: %s: deflateEnd error %d \n", srcFileName, ret);
1095*a28cd43dSSascha Wildner } }
1096*a28cd43dSSascha Wildner *readsize = inFileSize;
1097*a28cd43dSSascha Wildner return outFileSize;
1098*a28cd43dSSascha Wildner }
1099*a28cd43dSSascha Wildner #endif
1100*a28cd43dSSascha Wildner
1101*a28cd43dSSascha Wildner
1102*a28cd43dSSascha Wildner #ifdef ZSTD_LZMACOMPRESS
1103*a28cd43dSSascha Wildner static unsigned long long
FIO_compressLzmaFrame(cRess_t * ress,const char * srcFileName,U64 const srcFileSize,int compressionLevel,U64 * readsize,int plain_lzma)1104*a28cd43dSSascha Wildner FIO_compressLzmaFrame(cRess_t* ress,
1105*a28cd43dSSascha Wildner const char* srcFileName, U64 const srcFileSize,
1106*a28cd43dSSascha Wildner int compressionLevel, U64* readsize, int plain_lzma)
1107*a28cd43dSSascha Wildner {
1108*a28cd43dSSascha Wildner unsigned long long inFileSize = 0, outFileSize = 0;
1109*a28cd43dSSascha Wildner lzma_stream strm = LZMA_STREAM_INIT;
1110*a28cd43dSSascha Wildner lzma_action action = LZMA_RUN;
1111*a28cd43dSSascha Wildner lzma_ret ret;
1112*a28cd43dSSascha Wildner
1113*a28cd43dSSascha Wildner if (compressionLevel < 0) compressionLevel = 0;
1114*a28cd43dSSascha Wildner if (compressionLevel > 9) compressionLevel = 9;
1115*a28cd43dSSascha Wildner
1116*a28cd43dSSascha Wildner if (plain_lzma) {
1117*a28cd43dSSascha Wildner lzma_options_lzma opt_lzma;
1118*a28cd43dSSascha Wildner if (lzma_lzma_preset(&opt_lzma, compressionLevel))
1119*a28cd43dSSascha Wildner EXM_THROW(81, "zstd: %s: lzma_lzma_preset error", srcFileName);
1120*a28cd43dSSascha Wildner ret = lzma_alone_encoder(&strm, &opt_lzma); /* LZMA */
1121*a28cd43dSSascha Wildner if (ret != LZMA_OK)
1122*a28cd43dSSascha Wildner EXM_THROW(82, "zstd: %s: lzma_alone_encoder error %d", srcFileName, ret);
1123*a28cd43dSSascha Wildner } else {
1124*a28cd43dSSascha Wildner ret = lzma_easy_encoder(&strm, compressionLevel, LZMA_CHECK_CRC64); /* XZ */
1125*a28cd43dSSascha Wildner if (ret != LZMA_OK)
1126*a28cd43dSSascha Wildner EXM_THROW(83, "zstd: %s: lzma_easy_encoder error %d", srcFileName, ret);
1127*a28cd43dSSascha Wildner }
1128*a28cd43dSSascha Wildner
1129*a28cd43dSSascha Wildner strm.next_in = 0;
1130*a28cd43dSSascha Wildner strm.avail_in = 0;
1131*a28cd43dSSascha Wildner strm.next_out = (BYTE*)ress->dstBuffer;
1132*a28cd43dSSascha Wildner strm.avail_out = ress->dstBufferSize;
1133*a28cd43dSSascha Wildner
1134*a28cd43dSSascha Wildner while (1) {
1135*a28cd43dSSascha Wildner if (strm.avail_in == 0) {
1136*a28cd43dSSascha Wildner size_t const inSize = fread(ress->srcBuffer, 1, ress->srcBufferSize, ress->srcFile);
1137*a28cd43dSSascha Wildner if (inSize == 0) action = LZMA_FINISH;
1138*a28cd43dSSascha Wildner inFileSize += inSize;
1139*a28cd43dSSascha Wildner strm.next_in = (BYTE const*)ress->srcBuffer;
1140*a28cd43dSSascha Wildner strm.avail_in = inSize;
1141*a28cd43dSSascha Wildner }
1142*a28cd43dSSascha Wildner
1143*a28cd43dSSascha Wildner ret = lzma_code(&strm, action);
1144*a28cd43dSSascha Wildner
1145*a28cd43dSSascha Wildner if (ret != LZMA_OK && ret != LZMA_STREAM_END)
1146*a28cd43dSSascha Wildner EXM_THROW(84, "zstd: %s: lzma_code encoding error %d", srcFileName, ret);
1147*a28cd43dSSascha Wildner { size_t const compBytes = ress->dstBufferSize - strm.avail_out;
1148*a28cd43dSSascha Wildner if (compBytes) {
1149*a28cd43dSSascha Wildner if (fwrite(ress->dstBuffer, 1, compBytes, ress->dstFile) != compBytes)
1150*a28cd43dSSascha Wildner EXM_THROW(85, "Write error : %s", strerror(errno));
1151*a28cd43dSSascha Wildner outFileSize += compBytes;
1152*a28cd43dSSascha Wildner strm.next_out = (BYTE*)ress->dstBuffer;
1153*a28cd43dSSascha Wildner strm.avail_out = ress->dstBufferSize;
1154*a28cd43dSSascha Wildner } }
1155*a28cd43dSSascha Wildner if (srcFileSize == UTIL_FILESIZE_UNKNOWN)
1156*a28cd43dSSascha Wildner DISPLAYUPDATE(2, "\rRead : %u MB ==> %.2f%%",
1157*a28cd43dSSascha Wildner (unsigned)(inFileSize>>20),
1158*a28cd43dSSascha Wildner (double)outFileSize/inFileSize*100)
1159*a28cd43dSSascha Wildner else
1160*a28cd43dSSascha Wildner DISPLAYUPDATE(2, "\rRead : %u / %u MB ==> %.2f%%",
1161*a28cd43dSSascha Wildner (unsigned)(inFileSize>>20), (unsigned)(srcFileSize>>20),
1162*a28cd43dSSascha Wildner (double)outFileSize/inFileSize*100);
1163*a28cd43dSSascha Wildner if (ret == LZMA_STREAM_END) break;
1164*a28cd43dSSascha Wildner }
1165*a28cd43dSSascha Wildner
1166*a28cd43dSSascha Wildner lzma_end(&strm);
1167*a28cd43dSSascha Wildner *readsize = inFileSize;
1168*a28cd43dSSascha Wildner
1169*a28cd43dSSascha Wildner return outFileSize;
1170*a28cd43dSSascha Wildner }
1171*a28cd43dSSascha Wildner #endif
1172*a28cd43dSSascha Wildner
1173*a28cd43dSSascha Wildner #ifdef ZSTD_LZ4COMPRESS
1174*a28cd43dSSascha Wildner
1175*a28cd43dSSascha Wildner #if LZ4_VERSION_NUMBER <= 10600
1176*a28cd43dSSascha Wildner #define LZ4F_blockLinked blockLinked
1177*a28cd43dSSascha Wildner #define LZ4F_max64KB max64KB
1178*a28cd43dSSascha Wildner #endif
1179*a28cd43dSSascha Wildner
/* Converts an LZ4 frame block-size ID into a size in bytes : 2^(8 + 2*id) */
static int FIO_LZ4_GetBlockSize_FromBlockId (int id)
{
    int const sizeLog = 8 + (id * 2);
    return 1 << sizeLog;
}
1181*a28cd43dSSascha Wildner
1182*a28cd43dSSascha Wildner static unsigned long long
FIO_compressLz4Frame(cRess_t * ress,const char * srcFileName,U64 const srcFileSize,int compressionLevel,int checksumFlag,U64 * readsize)1183*a28cd43dSSascha Wildner FIO_compressLz4Frame(cRess_t* ress,
1184*a28cd43dSSascha Wildner const char* srcFileName, U64 const srcFileSize,
1185*a28cd43dSSascha Wildner int compressionLevel, int checksumFlag,
1186*a28cd43dSSascha Wildner U64* readsize)
1187*a28cd43dSSascha Wildner {
1188*a28cd43dSSascha Wildner const size_t blockSize = FIO_LZ4_GetBlockSize_FromBlockId(LZ4F_max64KB);
1189*a28cd43dSSascha Wildner unsigned long long inFileSize = 0, outFileSize = 0;
1190*a28cd43dSSascha Wildner
1191*a28cd43dSSascha Wildner LZ4F_preferences_t prefs;
1192*a28cd43dSSascha Wildner LZ4F_compressionContext_t ctx;
1193*a28cd43dSSascha Wildner
1194*a28cd43dSSascha Wildner LZ4F_errorCode_t const errorCode = LZ4F_createCompressionContext(&ctx, LZ4F_VERSION);
1195*a28cd43dSSascha Wildner if (LZ4F_isError(errorCode))
1196*a28cd43dSSascha Wildner EXM_THROW(31, "zstd: failed to create lz4 compression context");
1197*a28cd43dSSascha Wildner
1198*a28cd43dSSascha Wildner memset(&prefs, 0, sizeof(prefs));
1199*a28cd43dSSascha Wildner
1200*a28cd43dSSascha Wildner assert(blockSize <= ress->srcBufferSize);
1201*a28cd43dSSascha Wildner
1202*a28cd43dSSascha Wildner prefs.autoFlush = 1;
1203*a28cd43dSSascha Wildner prefs.compressionLevel = compressionLevel;
1204*a28cd43dSSascha Wildner prefs.frameInfo.blockMode = LZ4F_blockLinked;
1205*a28cd43dSSascha Wildner prefs.frameInfo.blockSizeID = LZ4F_max64KB;
1206*a28cd43dSSascha Wildner prefs.frameInfo.contentChecksumFlag = (contentChecksum_t)checksumFlag;
1207*a28cd43dSSascha Wildner #if LZ4_VERSION_NUMBER >= 10600
1208*a28cd43dSSascha Wildner prefs.frameInfo.contentSize = (srcFileSize==UTIL_FILESIZE_UNKNOWN) ? 0 : srcFileSize;
1209*a28cd43dSSascha Wildner #endif
1210*a28cd43dSSascha Wildner assert(LZ4F_compressBound(blockSize, &prefs) <= ress->dstBufferSize);
1211*a28cd43dSSascha Wildner
1212*a28cd43dSSascha Wildner {
1213*a28cd43dSSascha Wildner size_t readSize;
1214*a28cd43dSSascha Wildner size_t headerSize = LZ4F_compressBegin(ctx, ress->dstBuffer, ress->dstBufferSize, &prefs);
1215*a28cd43dSSascha Wildner if (LZ4F_isError(headerSize))
1216*a28cd43dSSascha Wildner EXM_THROW(33, "File header generation failed : %s",
1217*a28cd43dSSascha Wildner LZ4F_getErrorName(headerSize));
1218*a28cd43dSSascha Wildner if (fwrite(ress->dstBuffer, 1, headerSize, ress->dstFile) != headerSize)
1219*a28cd43dSSascha Wildner EXM_THROW(34, "Write error : %s (cannot write header)", strerror(errno));
1220*a28cd43dSSascha Wildner outFileSize += headerSize;
1221*a28cd43dSSascha Wildner
1222*a28cd43dSSascha Wildner /* Read first block */
1223*a28cd43dSSascha Wildner readSize = fread(ress->srcBuffer, (size_t)1, (size_t)blockSize, ress->srcFile);
1224*a28cd43dSSascha Wildner inFileSize += readSize;
1225*a28cd43dSSascha Wildner
1226*a28cd43dSSascha Wildner /* Main Loop */
1227*a28cd43dSSascha Wildner while (readSize>0) {
1228*a28cd43dSSascha Wildner size_t const outSize = LZ4F_compressUpdate(ctx,
1229*a28cd43dSSascha Wildner ress->dstBuffer, ress->dstBufferSize,
1230*a28cd43dSSascha Wildner ress->srcBuffer, readSize, NULL);
1231*a28cd43dSSascha Wildner if (LZ4F_isError(outSize))
1232*a28cd43dSSascha Wildner EXM_THROW(35, "zstd: %s: lz4 compression failed : %s",
1233*a28cd43dSSascha Wildner srcFileName, LZ4F_getErrorName(outSize));
1234*a28cd43dSSascha Wildner outFileSize += outSize;
1235*a28cd43dSSascha Wildner if (srcFileSize == UTIL_FILESIZE_UNKNOWN) {
1236*a28cd43dSSascha Wildner DISPLAYUPDATE(2, "\rRead : %u MB ==> %.2f%%",
1237*a28cd43dSSascha Wildner (unsigned)(inFileSize>>20),
1238*a28cd43dSSascha Wildner (double)outFileSize/inFileSize*100)
1239*a28cd43dSSascha Wildner } else {
1240*a28cd43dSSascha Wildner DISPLAYUPDATE(2, "\rRead : %u / %u MB ==> %.2f%%",
1241*a28cd43dSSascha Wildner (unsigned)(inFileSize>>20), (unsigned)(srcFileSize>>20),
1242*a28cd43dSSascha Wildner (double)outFileSize/inFileSize*100);
1243*a28cd43dSSascha Wildner }
1244*a28cd43dSSascha Wildner
1245*a28cd43dSSascha Wildner /* Write Block */
1246*a28cd43dSSascha Wildner { size_t const sizeCheck = fwrite(ress->dstBuffer, 1, outSize, ress->dstFile);
1247*a28cd43dSSascha Wildner if (sizeCheck != outSize)
1248*a28cd43dSSascha Wildner EXM_THROW(36, "Write error : %s", strerror(errno));
1249*a28cd43dSSascha Wildner }
1250*a28cd43dSSascha Wildner
1251*a28cd43dSSascha Wildner /* Read next block */
1252*a28cd43dSSascha Wildner readSize = fread(ress->srcBuffer, (size_t)1, (size_t)blockSize, ress->srcFile);
1253*a28cd43dSSascha Wildner inFileSize += readSize;
1254*a28cd43dSSascha Wildner }
1255*a28cd43dSSascha Wildner if (ferror(ress->srcFile)) EXM_THROW(37, "Error reading %s ", srcFileName);
1256*a28cd43dSSascha Wildner
1257*a28cd43dSSascha Wildner /* End of Stream mark */
1258*a28cd43dSSascha Wildner headerSize = LZ4F_compressEnd(ctx, ress->dstBuffer, ress->dstBufferSize, NULL);
1259*a28cd43dSSascha Wildner if (LZ4F_isError(headerSize))
1260*a28cd43dSSascha Wildner EXM_THROW(38, "zstd: %s: lz4 end of file generation failed : %s",
1261*a28cd43dSSascha Wildner srcFileName, LZ4F_getErrorName(headerSize));
1262*a28cd43dSSascha Wildner
1263*a28cd43dSSascha Wildner { size_t const sizeCheck = fwrite(ress->dstBuffer, 1, headerSize, ress->dstFile);
1264*a28cd43dSSascha Wildner if (sizeCheck != headerSize)
1265*a28cd43dSSascha Wildner EXM_THROW(39, "Write error : %s (cannot write end of stream)",
1266*a28cd43dSSascha Wildner strerror(errno));
1267*a28cd43dSSascha Wildner }
1268*a28cd43dSSascha Wildner outFileSize += headerSize;
1269*a28cd43dSSascha Wildner }
1270*a28cd43dSSascha Wildner
1271*a28cd43dSSascha Wildner *readsize = inFileSize;
1272*a28cd43dSSascha Wildner LZ4F_freeCompressionContext(ctx);
1273*a28cd43dSSascha Wildner
1274*a28cd43dSSascha Wildner return outFileSize;
1275*a28cd43dSSascha Wildner }
1276*a28cd43dSSascha Wildner #endif
1277*a28cd43dSSascha Wildner
1278*a28cd43dSSascha Wildner
1279*a28cd43dSSascha Wildner static unsigned long long
FIO_compressZstdFrame(FIO_ctx_t * const fCtx,FIO_prefs_t * const prefs,const cRess_t * ressPtr,const char * srcFileName,U64 fileSize,int compressionLevel,U64 * readsize)1280*a28cd43dSSascha Wildner FIO_compressZstdFrame(FIO_ctx_t* const fCtx,
1281*a28cd43dSSascha Wildner FIO_prefs_t* const prefs,
1282*a28cd43dSSascha Wildner const cRess_t* ressPtr,
1283*a28cd43dSSascha Wildner const char* srcFileName, U64 fileSize,
1284*a28cd43dSSascha Wildner int compressionLevel, U64* readsize)
1285*a28cd43dSSascha Wildner {
1286*a28cd43dSSascha Wildner cRess_t const ress = *ressPtr;
1287*a28cd43dSSascha Wildner FILE* const srcFile = ress.srcFile;
1288*a28cd43dSSascha Wildner FILE* const dstFile = ress.dstFile;
1289*a28cd43dSSascha Wildner U64 compressedfilesize = 0;
1290*a28cd43dSSascha Wildner ZSTD_EndDirective directive = ZSTD_e_continue;
1291*a28cd43dSSascha Wildner
1292*a28cd43dSSascha Wildner /* stats */
1293*a28cd43dSSascha Wildner ZSTD_frameProgression previous_zfp_update = { 0, 0, 0, 0, 0, 0 };
1294*a28cd43dSSascha Wildner ZSTD_frameProgression previous_zfp_correction = { 0, 0, 0, 0, 0, 0 };
1295*a28cd43dSSascha Wildner typedef enum { noChange, slower, faster } speedChange_e;
1296*a28cd43dSSascha Wildner speedChange_e speedChange = noChange;
1297*a28cd43dSSascha Wildner unsigned flushWaiting = 0;
1298*a28cd43dSSascha Wildner unsigned inputPresented = 0;
1299*a28cd43dSSascha Wildner unsigned inputBlocked = 0;
1300*a28cd43dSSascha Wildner unsigned lastJobID = 0;
1301*a28cd43dSSascha Wildner
1302*a28cd43dSSascha Wildner DISPLAYLEVEL(6, "compression using zstd format \n");
1303*a28cd43dSSascha Wildner
1304*a28cd43dSSascha Wildner /* init */
1305*a28cd43dSSascha Wildner if (fileSize != UTIL_FILESIZE_UNKNOWN) {
1306*a28cd43dSSascha Wildner CHECK(ZSTD_CCtx_setPledgedSrcSize(ress.cctx, fileSize));
1307*a28cd43dSSascha Wildner } else if (prefs->streamSrcSize > 0) {
1308*a28cd43dSSascha Wildner /* unknown source size; use the declared stream size */
1309*a28cd43dSSascha Wildner CHECK( ZSTD_CCtx_setPledgedSrcSize(ress.cctx, prefs->streamSrcSize) );
1310*a28cd43dSSascha Wildner }
1311*a28cd43dSSascha Wildner (void)srcFileName;
1312*a28cd43dSSascha Wildner
1313*a28cd43dSSascha Wildner /* Main compression loop */
1314*a28cd43dSSascha Wildner do {
1315*a28cd43dSSascha Wildner size_t stillToFlush;
1316*a28cd43dSSascha Wildner /* Fill input Buffer */
1317*a28cd43dSSascha Wildner size_t const inSize = fread(ress.srcBuffer, (size_t)1, ress.srcBufferSize, srcFile);
1318*a28cd43dSSascha Wildner ZSTD_inBuffer inBuff = { ress.srcBuffer, inSize, 0 };
1319*a28cd43dSSascha Wildner DISPLAYLEVEL(6, "fread %u bytes from source \n", (unsigned)inSize);
1320*a28cd43dSSascha Wildner *readsize += inSize;
1321*a28cd43dSSascha Wildner
1322*a28cd43dSSascha Wildner if ((inSize == 0) || (*readsize == fileSize))
1323*a28cd43dSSascha Wildner directive = ZSTD_e_end;
1324*a28cd43dSSascha Wildner
1325*a28cd43dSSascha Wildner stillToFlush = 1;
1326*a28cd43dSSascha Wildner while ((inBuff.pos != inBuff.size) /* input buffer must be entirely ingested */
1327*a28cd43dSSascha Wildner || (directive == ZSTD_e_end && stillToFlush != 0) ) {
1328*a28cd43dSSascha Wildner
1329*a28cd43dSSascha Wildner size_t const oldIPos = inBuff.pos;
1330*a28cd43dSSascha Wildner ZSTD_outBuffer outBuff = { ress.dstBuffer, ress.dstBufferSize, 0 };
1331*a28cd43dSSascha Wildner size_t const toFlushNow = ZSTD_toFlushNow(ress.cctx);
1332*a28cd43dSSascha Wildner CHECK_V(stillToFlush, ZSTD_compressStream2(ress.cctx, &outBuff, &inBuff, directive));
1333*a28cd43dSSascha Wildner
1334*a28cd43dSSascha Wildner /* count stats */
1335*a28cd43dSSascha Wildner inputPresented++;
1336*a28cd43dSSascha Wildner if (oldIPos == inBuff.pos) inputBlocked++; /* input buffer is full and can't take any more : input speed is faster than consumption rate */
1337*a28cd43dSSascha Wildner if (!toFlushNow) flushWaiting = 1;
1338*a28cd43dSSascha Wildner
1339*a28cd43dSSascha Wildner /* Write compressed stream */
1340*a28cd43dSSascha Wildner DISPLAYLEVEL(6, "ZSTD_compress_generic(end:%u) => input pos(%u)<=(%u)size ; output generated %u bytes \n",
1341*a28cd43dSSascha Wildner (unsigned)directive, (unsigned)inBuff.pos, (unsigned)inBuff.size, (unsigned)outBuff.pos);
1342*a28cd43dSSascha Wildner if (outBuff.pos) {
1343*a28cd43dSSascha Wildner size_t const sizeCheck = fwrite(ress.dstBuffer, 1, outBuff.pos, dstFile);
1344*a28cd43dSSascha Wildner if (sizeCheck != outBuff.pos)
1345*a28cd43dSSascha Wildner EXM_THROW(25, "Write error : %s (cannot write compressed block)",
1346*a28cd43dSSascha Wildner strerror(errno));
1347*a28cd43dSSascha Wildner compressedfilesize += outBuff.pos;
1348*a28cd43dSSascha Wildner }
1349*a28cd43dSSascha Wildner
1350*a28cd43dSSascha Wildner /* display notification; and adapt compression level */
1351*a28cd43dSSascha Wildner if (READY_FOR_UPDATE()) {
1352*a28cd43dSSascha Wildner ZSTD_frameProgression const zfp = ZSTD_getFrameProgression(ress.cctx);
1353*a28cd43dSSascha Wildner double const cShare = (double)zfp.produced / (zfp.consumed + !zfp.consumed/*avoid div0*/) * 100;
1354*a28cd43dSSascha Wildner
1355*a28cd43dSSascha Wildner /* display progress notifications */
1356*a28cd43dSSascha Wildner if (g_display_prefs.displayLevel >= 3) {
1357*a28cd43dSSascha Wildner DISPLAYUPDATE(3, "\r(L%i) Buffered :%4u MB - Consumed :%4u MB - Compressed :%4u MB => %.2f%% ",
1358*a28cd43dSSascha Wildner compressionLevel,
1359*a28cd43dSSascha Wildner (unsigned)((zfp.ingested - zfp.consumed) >> 20),
1360*a28cd43dSSascha Wildner (unsigned)(zfp.consumed >> 20),
1361*a28cd43dSSascha Wildner (unsigned)(zfp.produced >> 20),
1362*a28cd43dSSascha Wildner cShare );
1363*a28cd43dSSascha Wildner } else { /* summarized notifications if == 2 */
1364*a28cd43dSSascha Wildner DISPLAYLEVEL(2, "\r%79s\r", ""); /* Clear out the current displayed line */
1365*a28cd43dSSascha Wildner if (fCtx->nbFilesTotal > 1) {
1366*a28cd43dSSascha Wildner size_t srcFileNameSize = strlen(srcFileName);
1367*a28cd43dSSascha Wildner /* Ensure that the string we print is roughly the same size each time */
1368*a28cd43dSSascha Wildner if (srcFileNameSize > 18) {
1369*a28cd43dSSascha Wildner const char* truncatedSrcFileName = srcFileName + srcFileNameSize - 15;
1370*a28cd43dSSascha Wildner DISPLAYLEVEL(2, "Compress: %u/%u files. Current: ...%s ",
1371*a28cd43dSSascha Wildner fCtx->currFileIdx+1, fCtx->nbFilesTotal, truncatedSrcFileName);
1372*a28cd43dSSascha Wildner } else {
1373*a28cd43dSSascha Wildner DISPLAYLEVEL(2, "Compress: %u/%u files. Current: %*s ",
1374*a28cd43dSSascha Wildner fCtx->currFileIdx+1, fCtx->nbFilesTotal, (int)(18-srcFileNameSize), srcFileName);
1375*a28cd43dSSascha Wildner }
1376*a28cd43dSSascha Wildner }
1377*a28cd43dSSascha Wildner DISPLAYLEVEL(2, "Read : %2u ", (unsigned)(zfp.consumed >> 20));
1378*a28cd43dSSascha Wildner if (fileSize != UTIL_FILESIZE_UNKNOWN)
1379*a28cd43dSSascha Wildner DISPLAYLEVEL(2, "/ %2u ", (unsigned)(fileSize >> 20));
1380*a28cd43dSSascha Wildner DISPLAYLEVEL(2, "MB ==> %2.f%%", cShare);
1381*a28cd43dSSascha Wildner DELAY_NEXT_UPDATE();
1382*a28cd43dSSascha Wildner }
1383*a28cd43dSSascha Wildner
1384*a28cd43dSSascha Wildner /* adaptive mode : statistics measurement and speed correction */
1385*a28cd43dSSascha Wildner if (prefs->adaptiveMode) {
1386*a28cd43dSSascha Wildner
1387*a28cd43dSSascha Wildner /* check output speed */
1388*a28cd43dSSascha Wildner if (zfp.currentJobID > 1) { /* only possible if nbWorkers >= 1 */
1389*a28cd43dSSascha Wildner
1390*a28cd43dSSascha Wildner unsigned long long newlyProduced = zfp.produced - previous_zfp_update.produced;
1391*a28cd43dSSascha Wildner unsigned long long newlyFlushed = zfp.flushed - previous_zfp_update.flushed;
1392*a28cd43dSSascha Wildner assert(zfp.produced >= previous_zfp_update.produced);
1393*a28cd43dSSascha Wildner assert(prefs->nbWorkers >= 1);
1394*a28cd43dSSascha Wildner
1395*a28cd43dSSascha Wildner /* test if compression is blocked
1396*a28cd43dSSascha Wildner * either because output is slow and all buffers are full
1397*a28cd43dSSascha Wildner * or because input is slow and no job can start while waiting for at least one buffer to be filled.
1398*a28cd43dSSascha Wildner * note : exclude starting part, since currentJobID > 1 */
1399*a28cd43dSSascha Wildner if ( (zfp.consumed == previous_zfp_update.consumed) /* no data compressed : no data available, or no more buffer to compress to, OR compression is really slow (compression of a single block is slower than update rate)*/
1400*a28cd43dSSascha Wildner && (zfp.nbActiveWorkers == 0) /* confirmed : no compression ongoing */
1401*a28cd43dSSascha Wildner ) {
1402*a28cd43dSSascha Wildner DISPLAYLEVEL(6, "all buffers full : compression stopped => slow down \n")
1403*a28cd43dSSascha Wildner speedChange = slower;
1404*a28cd43dSSascha Wildner }
1405*a28cd43dSSascha Wildner
1406*a28cd43dSSascha Wildner previous_zfp_update = zfp;
1407*a28cd43dSSascha Wildner
1408*a28cd43dSSascha Wildner if ( (newlyProduced > (newlyFlushed * 9 / 8)) /* compression produces more data than output can flush (though production can be spiky, due to work unit : (N==4)*block sizes) */
1409*a28cd43dSSascha Wildner && (flushWaiting == 0) /* flush speed was never slowed by lack of production, so it's operating at max capacity */
1410*a28cd43dSSascha Wildner ) {
1411*a28cd43dSSascha Wildner DISPLAYLEVEL(6, "compression faster than flush (%llu > %llu), and flushed was never slowed down by lack of production => slow down \n", newlyProduced, newlyFlushed);
1412*a28cd43dSSascha Wildner speedChange = slower;
1413*a28cd43dSSascha Wildner }
1414*a28cd43dSSascha Wildner flushWaiting = 0;
1415*a28cd43dSSascha Wildner }
1416*a28cd43dSSascha Wildner
1417*a28cd43dSSascha Wildner /* course correct only if there is at least one new job completed */
1418*a28cd43dSSascha Wildner if (zfp.currentJobID > lastJobID) {
1419*a28cd43dSSascha Wildner DISPLAYLEVEL(6, "compression level adaptation check \n")
1420*a28cd43dSSascha Wildner
1421*a28cd43dSSascha Wildner /* check input speed */
1422*a28cd43dSSascha Wildner if (zfp.currentJobID > (unsigned)(prefs->nbWorkers+1)) { /* warm up period, to fill all workers */
1423*a28cd43dSSascha Wildner if (inputBlocked <= 0) {
1424*a28cd43dSSascha Wildner DISPLAYLEVEL(6, "input is never blocked => input is slower than ingestion \n");
1425*a28cd43dSSascha Wildner speedChange = slower;
1426*a28cd43dSSascha Wildner } else if (speedChange == noChange) {
1427*a28cd43dSSascha Wildner unsigned long long newlyIngested = zfp.ingested - previous_zfp_correction.ingested;
1428*a28cd43dSSascha Wildner unsigned long long newlyConsumed = zfp.consumed - previous_zfp_correction.consumed;
1429*a28cd43dSSascha Wildner unsigned long long newlyProduced = zfp.produced - previous_zfp_correction.produced;
1430*a28cd43dSSascha Wildner unsigned long long newlyFlushed = zfp.flushed - previous_zfp_correction.flushed;
1431*a28cd43dSSascha Wildner previous_zfp_correction = zfp;
1432*a28cd43dSSascha Wildner assert(inputPresented > 0);
1433*a28cd43dSSascha Wildner DISPLAYLEVEL(6, "input blocked %u/%u(%.2f) - ingested:%u vs %u:consumed - flushed:%u vs %u:produced \n",
1434*a28cd43dSSascha Wildner inputBlocked, inputPresented, (double)inputBlocked/inputPresented*100,
1435*a28cd43dSSascha Wildner (unsigned)newlyIngested, (unsigned)newlyConsumed,
1436*a28cd43dSSascha Wildner (unsigned)newlyFlushed, (unsigned)newlyProduced);
1437*a28cd43dSSascha Wildner if ( (inputBlocked > inputPresented / 8) /* input is waiting often, because input buffers is full : compression or output too slow */
1438*a28cd43dSSascha Wildner && (newlyFlushed * 33 / 32 > newlyProduced) /* flush everything that is produced */
1439*a28cd43dSSascha Wildner && (newlyIngested * 33 / 32 > newlyConsumed) /* input speed as fast or faster than compression speed */
1440*a28cd43dSSascha Wildner ) {
1441*a28cd43dSSascha Wildner DISPLAYLEVEL(6, "recommend faster as in(%llu) >= (%llu)comp(%llu) <= out(%llu) \n",
1442*a28cd43dSSascha Wildner newlyIngested, newlyConsumed, newlyProduced, newlyFlushed);
1443*a28cd43dSSascha Wildner speedChange = faster;
1444*a28cd43dSSascha Wildner }
1445*a28cd43dSSascha Wildner }
1446*a28cd43dSSascha Wildner inputBlocked = 0;
1447*a28cd43dSSascha Wildner inputPresented = 0;
1448*a28cd43dSSascha Wildner }
1449*a28cd43dSSascha Wildner
1450*a28cd43dSSascha Wildner if (speedChange == slower) {
1451*a28cd43dSSascha Wildner DISPLAYLEVEL(6, "slower speed , higher compression \n")
1452*a28cd43dSSascha Wildner compressionLevel ++;
1453*a28cd43dSSascha Wildner if (compressionLevel > ZSTD_maxCLevel()) compressionLevel = ZSTD_maxCLevel();
1454*a28cd43dSSascha Wildner if (compressionLevel > prefs->maxAdaptLevel) compressionLevel = prefs->maxAdaptLevel;
1455*a28cd43dSSascha Wildner compressionLevel += (compressionLevel == 0); /* skip 0 */
1456*a28cd43dSSascha Wildner ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_compressionLevel, compressionLevel);
1457*a28cd43dSSascha Wildner }
1458*a28cd43dSSascha Wildner if (speedChange == faster) {
1459*a28cd43dSSascha Wildner DISPLAYLEVEL(6, "faster speed , lighter compression \n")
1460*a28cd43dSSascha Wildner compressionLevel --;
1461*a28cd43dSSascha Wildner if (compressionLevel < prefs->minAdaptLevel) compressionLevel = prefs->minAdaptLevel;
1462*a28cd43dSSascha Wildner compressionLevel -= (compressionLevel == 0); /* skip 0 */
1463*a28cd43dSSascha Wildner ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_compressionLevel, compressionLevel);
1464*a28cd43dSSascha Wildner }
1465*a28cd43dSSascha Wildner speedChange = noChange;
1466*a28cd43dSSascha Wildner
1467*a28cd43dSSascha Wildner lastJobID = zfp.currentJobID;
1468*a28cd43dSSascha Wildner } /* if (zfp.currentJobID > lastJobID) */
1469*a28cd43dSSascha Wildner } /* if (g_adaptiveMode) */
1470*a28cd43dSSascha Wildner } /* if (READY_FOR_UPDATE()) */
1471*a28cd43dSSascha Wildner } /* while ((inBuff.pos != inBuff.size) */
1472*a28cd43dSSascha Wildner } while (directive != ZSTD_e_end);
1473*a28cd43dSSascha Wildner
1474*a28cd43dSSascha Wildner if (ferror(srcFile)) {
1475*a28cd43dSSascha Wildner EXM_THROW(26, "Read error : I/O error");
1476*a28cd43dSSascha Wildner }
1477*a28cd43dSSascha Wildner if (fileSize != UTIL_FILESIZE_UNKNOWN && *readsize != fileSize) {
1478*a28cd43dSSascha Wildner EXM_THROW(27, "Read error : Incomplete read : %llu / %llu B",
1479*a28cd43dSSascha Wildner (unsigned long long)*readsize, (unsigned long long)fileSize);
1480*a28cd43dSSascha Wildner }
1481*a28cd43dSSascha Wildner
1482*a28cd43dSSascha Wildner return compressedfilesize;
1483*a28cd43dSSascha Wildner }
1484*a28cd43dSSascha Wildner
/*! FIO_compressFilename_internal() :
 *  same as FIO_compressFilename_extRess(), with `ress.dstFile` already opened.
 *  @return : 0 : compression completed correctly,
 *            1 : missing or problem opening srcFileName
 */
1490*a28cd43dSSascha Wildner static int
FIO_compressFilename_internal(FIO_ctx_t * const fCtx,FIO_prefs_t * const prefs,cRess_t ress,const char * dstFileName,const char * srcFileName,int compressionLevel)1491*a28cd43dSSascha Wildner FIO_compressFilename_internal(FIO_ctx_t* const fCtx,
1492*a28cd43dSSascha Wildner FIO_prefs_t* const prefs,
1493*a28cd43dSSascha Wildner cRess_t ress,
1494*a28cd43dSSascha Wildner const char* dstFileName, const char* srcFileName,
1495*a28cd43dSSascha Wildner int compressionLevel)
1496*a28cd43dSSascha Wildner {
1497*a28cd43dSSascha Wildner UTIL_time_t const timeStart = UTIL_getTime();
1498*a28cd43dSSascha Wildner clock_t const cpuStart = clock();
1499*a28cd43dSSascha Wildner U64 readsize = 0;
1500*a28cd43dSSascha Wildner U64 compressedfilesize = 0;
1501*a28cd43dSSascha Wildner U64 const fileSize = UTIL_getFileSize(srcFileName);
1502*a28cd43dSSascha Wildner DISPLAYLEVEL(5, "%s: %u bytes \n", srcFileName, (unsigned)fileSize);
1503*a28cd43dSSascha Wildner
1504*a28cd43dSSascha Wildner /* compression format selection */
1505*a28cd43dSSascha Wildner switch (prefs->compressionType) {
1506*a28cd43dSSascha Wildner default:
1507*a28cd43dSSascha Wildner case FIO_zstdCompression:
1508*a28cd43dSSascha Wildner compressedfilesize = FIO_compressZstdFrame(fCtx, prefs, &ress, srcFileName, fileSize, compressionLevel, &readsize);
1509*a28cd43dSSascha Wildner break;
1510*a28cd43dSSascha Wildner
1511*a28cd43dSSascha Wildner case FIO_gzipCompression:
1512*a28cd43dSSascha Wildner #ifdef ZSTD_GZCOMPRESS
1513*a28cd43dSSascha Wildner compressedfilesize = FIO_compressGzFrame(&ress, srcFileName, fileSize, compressionLevel, &readsize);
1514*a28cd43dSSascha Wildner #else
1515*a28cd43dSSascha Wildner (void)compressionLevel;
1516*a28cd43dSSascha Wildner EXM_THROW(20, "zstd: %s: file cannot be compressed as gzip (zstd compiled without ZSTD_GZCOMPRESS) -- ignored \n",
1517*a28cd43dSSascha Wildner srcFileName);
1518*a28cd43dSSascha Wildner #endif
1519*a28cd43dSSascha Wildner break;
1520*a28cd43dSSascha Wildner
1521*a28cd43dSSascha Wildner case FIO_xzCompression:
1522*a28cd43dSSascha Wildner case FIO_lzmaCompression:
1523*a28cd43dSSascha Wildner #ifdef ZSTD_LZMACOMPRESS
1524*a28cd43dSSascha Wildner compressedfilesize = FIO_compressLzmaFrame(&ress, srcFileName, fileSize, compressionLevel, &readsize, prefs->compressionType==FIO_lzmaCompression);
1525*a28cd43dSSascha Wildner #else
1526*a28cd43dSSascha Wildner (void)compressionLevel;
1527*a28cd43dSSascha Wildner EXM_THROW(20, "zstd: %s: file cannot be compressed as xz/lzma (zstd compiled without ZSTD_LZMACOMPRESS) -- ignored \n",
1528*a28cd43dSSascha Wildner srcFileName);
1529*a28cd43dSSascha Wildner #endif
1530*a28cd43dSSascha Wildner break;
1531*a28cd43dSSascha Wildner
1532*a28cd43dSSascha Wildner case FIO_lz4Compression:
1533*a28cd43dSSascha Wildner #ifdef ZSTD_LZ4COMPRESS
1534*a28cd43dSSascha Wildner compressedfilesize = FIO_compressLz4Frame(&ress, srcFileName, fileSize, compressionLevel, prefs->checksumFlag, &readsize);
1535*a28cd43dSSascha Wildner #else
1536*a28cd43dSSascha Wildner (void)compressionLevel;
1537*a28cd43dSSascha Wildner EXM_THROW(20, "zstd: %s: file cannot be compressed as lz4 (zstd compiled without ZSTD_LZ4COMPRESS) -- ignored \n",
1538*a28cd43dSSascha Wildner srcFileName);
1539*a28cd43dSSascha Wildner #endif
1540*a28cd43dSSascha Wildner break;
1541*a28cd43dSSascha Wildner }
1542*a28cd43dSSascha Wildner
1543*a28cd43dSSascha Wildner /* Status */
1544*a28cd43dSSascha Wildner fCtx->totalBytesInput += (size_t)readsize;
1545*a28cd43dSSascha Wildner fCtx->totalBytesOutput += (size_t)compressedfilesize;
1546*a28cd43dSSascha Wildner DISPLAYLEVEL(2, "\r%79s\r", "");
1547*a28cd43dSSascha Wildner if (g_display_prefs.displayLevel >= 2 &&
1548*a28cd43dSSascha Wildner !fCtx->hasStdoutOutput &&
1549*a28cd43dSSascha Wildner (g_display_prefs.displayLevel >= 3 || fCtx->nbFilesTotal <= 1)) {
1550*a28cd43dSSascha Wildner if (readsize == 0) {
1551*a28cd43dSSascha Wildner DISPLAYLEVEL(2,"%-20s : (%6llu => %6llu bytes, %s) \n",
1552*a28cd43dSSascha Wildner srcFileName,
1553*a28cd43dSSascha Wildner (unsigned long long)readsize, (unsigned long long) compressedfilesize,
1554*a28cd43dSSascha Wildner dstFileName);
1555*a28cd43dSSascha Wildner } else {
1556*a28cd43dSSascha Wildner DISPLAYLEVEL(2,"%-20s :%6.2f%% (%6llu => %6llu bytes, %s) \n",
1557*a28cd43dSSascha Wildner srcFileName,
1558*a28cd43dSSascha Wildner (double)compressedfilesize / readsize * 100,
1559*a28cd43dSSascha Wildner (unsigned long long)readsize, (unsigned long long) compressedfilesize,
1560*a28cd43dSSascha Wildner dstFileName);
1561*a28cd43dSSascha Wildner }
1562*a28cd43dSSascha Wildner }
1563*a28cd43dSSascha Wildner
1564*a28cd43dSSascha Wildner /* Elapsed Time and CPU Load */
1565*a28cd43dSSascha Wildner { clock_t const cpuEnd = clock();
1566*a28cd43dSSascha Wildner double const cpuLoad_s = (double)(cpuEnd - cpuStart) / CLOCKS_PER_SEC;
1567*a28cd43dSSascha Wildner U64 const timeLength_ns = UTIL_clockSpanNano(timeStart);
1568*a28cd43dSSascha Wildner double const timeLength_s = (double)timeLength_ns / 1000000000;
1569*a28cd43dSSascha Wildner double const cpuLoad_pct = (cpuLoad_s / timeLength_s) * 100;
1570*a28cd43dSSascha Wildner DISPLAYLEVEL(4, "%-20s : Completed in %.2f sec (cpu load : %.0f%%)\n",
1571*a28cd43dSSascha Wildner srcFileName, timeLength_s, cpuLoad_pct);
1572*a28cd43dSSascha Wildner }
1573*a28cd43dSSascha Wildner return 0;
1574*a28cd43dSSascha Wildner }
1575*a28cd43dSSascha Wildner
1576*a28cd43dSSascha Wildner
1577*a28cd43dSSascha Wildner /*! FIO_compressFilename_dstFile() :
1578*a28cd43dSSascha Wildner * open dstFileName, or pass-through if ress.dstFile != NULL,
1579*a28cd43dSSascha Wildner * then start compression with FIO_compressFilename_internal().
1580*a28cd43dSSascha Wildner * Manages source removal (--rm) and file permissions transfer.
1581*a28cd43dSSascha Wildner * note : ress.srcFile must be != NULL,
1582*a28cd43dSSascha Wildner * so reach this function through FIO_compressFilename_srcFile().
1583*a28cd43dSSascha Wildner * @return : 0 : compression completed correctly,
1584*a28cd43dSSascha Wildner * 1 : pb
1585*a28cd43dSSascha Wildner */
FIO_compressFilename_dstFile(FIO_ctx_t * const fCtx,FIO_prefs_t * const prefs,cRess_t ress,const char * dstFileName,const char * srcFileName,int compressionLevel)1586*a28cd43dSSascha Wildner static int FIO_compressFilename_dstFile(FIO_ctx_t* const fCtx,
1587*a28cd43dSSascha Wildner FIO_prefs_t* const prefs,
1588*a28cd43dSSascha Wildner cRess_t ress,
1589*a28cd43dSSascha Wildner const char* dstFileName,
1590*a28cd43dSSascha Wildner const char* srcFileName,
1591*a28cd43dSSascha Wildner int compressionLevel)
1592*a28cd43dSSascha Wildner {
1593*a28cd43dSSascha Wildner int closeDstFile = 0;
1594*a28cd43dSSascha Wildner int result;
1595*a28cd43dSSascha Wildner stat_t statbuf;
1596*a28cd43dSSascha Wildner int transfer_permissions = 0;
1597*a28cd43dSSascha Wildner assert(ress.srcFile != NULL);
1598*a28cd43dSSascha Wildner if (ress.dstFile == NULL) {
1599*a28cd43dSSascha Wildner closeDstFile = 1;
1600*a28cd43dSSascha Wildner DISPLAYLEVEL(6, "FIO_compressFilename_dstFile: opening dst: %s \n", dstFileName);
1601*a28cd43dSSascha Wildner ress.dstFile = FIO_openDstFile(fCtx, prefs, srcFileName, dstFileName);
1602*a28cd43dSSascha Wildner if (ress.dstFile==NULL) return 1; /* could not open dstFileName */
1603*a28cd43dSSascha Wildner /* Must only be added after FIO_openDstFile() succeeds.
1604*a28cd43dSSascha Wildner * Otherwise we may delete the destination file if it already exists,
1605*a28cd43dSSascha Wildner * and the user presses Ctrl-C when asked if they wish to overwrite.
1606*a28cd43dSSascha Wildner */
1607*a28cd43dSSascha Wildner addHandler(dstFileName);
1608*a28cd43dSSascha Wildner
1609*a28cd43dSSascha Wildner if ( strcmp (srcFileName, stdinmark)
1610*a28cd43dSSascha Wildner && UTIL_stat(srcFileName, &statbuf)
1611*a28cd43dSSascha Wildner && UTIL_isRegularFileStat(&statbuf) )
1612*a28cd43dSSascha Wildner transfer_permissions = 1;
1613*a28cd43dSSascha Wildner }
1614*a28cd43dSSascha Wildner
1615*a28cd43dSSascha Wildner result = FIO_compressFilename_internal(fCtx, prefs, ress, dstFileName, srcFileName, compressionLevel);
1616*a28cd43dSSascha Wildner
1617*a28cd43dSSascha Wildner if (closeDstFile) {
1618*a28cd43dSSascha Wildner FILE* const dstFile = ress.dstFile;
1619*a28cd43dSSascha Wildner ress.dstFile = NULL;
1620*a28cd43dSSascha Wildner
1621*a28cd43dSSascha Wildner clearHandler();
1622*a28cd43dSSascha Wildner
1623*a28cd43dSSascha Wildner DISPLAYLEVEL(6, "FIO_compressFilename_dstFile: closing dst: %s \n", dstFileName);
1624*a28cd43dSSascha Wildner if (fclose(dstFile)) { /* error closing dstFile */
1625*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "zstd: %s: %s \n", dstFileName, strerror(errno));
1626*a28cd43dSSascha Wildner result=1;
1627*a28cd43dSSascha Wildner }
1628*a28cd43dSSascha Wildner if ( (result != 0) /* operation failure */
1629*a28cd43dSSascha Wildner && strcmp(dstFileName, stdoutmark) /* special case : don't remove() stdout */
1630*a28cd43dSSascha Wildner ) {
1631*a28cd43dSSascha Wildner FIO_removeFile(dstFileName); /* remove compression artefact; note don't do anything special if remove() fails */
1632*a28cd43dSSascha Wildner } else if (transfer_permissions) {
1633*a28cd43dSSascha Wildner DISPLAYLEVEL(6, "FIO_compressFilename_dstFile: transferring permissions into dst: %s \n", dstFileName);
1634*a28cd43dSSascha Wildner UTIL_setFileStat(dstFileName, &statbuf);
1635*a28cd43dSSascha Wildner } else {
1636*a28cd43dSSascha Wildner DISPLAYLEVEL(6, "FIO_compressFilename_dstFile: do not transfer permissions into dst: %s \n", dstFileName);
1637*a28cd43dSSascha Wildner }
1638*a28cd43dSSascha Wildner }
1639*a28cd43dSSascha Wildner
1640*a28cd43dSSascha Wildner return result;
1641*a28cd43dSSascha Wildner }
1642*a28cd43dSSascha Wildner
1643*a28cd43dSSascha Wildner /* List used to compare file extensions (used with --exclude-compressed flag)
1644*a28cd43dSSascha Wildner * Different from the suffixList and should only apply to ZSTD compress operationResult
1645*a28cd43dSSascha Wildner */
1646*a28cd43dSSascha Wildner static const char *compressedFileExtensions[] = {
1647*a28cd43dSSascha Wildner ZSTD_EXTENSION,
1648*a28cd43dSSascha Wildner TZSTD_EXTENSION,
1649*a28cd43dSSascha Wildner GZ_EXTENSION,
1650*a28cd43dSSascha Wildner TGZ_EXTENSION,
1651*a28cd43dSSascha Wildner LZMA_EXTENSION,
1652*a28cd43dSSascha Wildner XZ_EXTENSION,
1653*a28cd43dSSascha Wildner TXZ_EXTENSION,
1654*a28cd43dSSascha Wildner LZ4_EXTENSION,
1655*a28cd43dSSascha Wildner TLZ4_EXTENSION,
1656*a28cd43dSSascha Wildner NULL
1657*a28cd43dSSascha Wildner };
1658*a28cd43dSSascha Wildner
1659*a28cd43dSSascha Wildner /*! FIO_compressFilename_srcFile() :
1660*a28cd43dSSascha Wildner * @return : 0 : compression completed correctly,
1661*a28cd43dSSascha Wildner * 1 : missing or pb opening srcFileName
1662*a28cd43dSSascha Wildner */
1663*a28cd43dSSascha Wildner static int
FIO_compressFilename_srcFile(FIO_ctx_t * const fCtx,FIO_prefs_t * const prefs,cRess_t ress,const char * dstFileName,const char * srcFileName,int compressionLevel)1664*a28cd43dSSascha Wildner FIO_compressFilename_srcFile(FIO_ctx_t* const fCtx,
1665*a28cd43dSSascha Wildner FIO_prefs_t* const prefs,
1666*a28cd43dSSascha Wildner cRess_t ress,
1667*a28cd43dSSascha Wildner const char* dstFileName,
1668*a28cd43dSSascha Wildner const char* srcFileName,
1669*a28cd43dSSascha Wildner int compressionLevel)
1670*a28cd43dSSascha Wildner {
1671*a28cd43dSSascha Wildner int result;
1672*a28cd43dSSascha Wildner DISPLAYLEVEL(6, "FIO_compressFilename_srcFile: %s \n", srcFileName);
1673*a28cd43dSSascha Wildner
1674*a28cd43dSSascha Wildner /* ensure src is not a directory */
1675*a28cd43dSSascha Wildner if (UTIL_isDirectory(srcFileName)) {
1676*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "zstd: %s is a directory -- ignored \n", srcFileName);
1677*a28cd43dSSascha Wildner return 1;
1678*a28cd43dSSascha Wildner }
1679*a28cd43dSSascha Wildner
1680*a28cd43dSSascha Wildner /* ensure src is not the same as dict (if present) */
1681*a28cd43dSSascha Wildner if (ress.dictFileName != NULL && UTIL_isSameFile(srcFileName, ress.dictFileName)) {
1682*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "zstd: cannot use %s as an input file and dictionary \n", srcFileName);
1683*a28cd43dSSascha Wildner return 1;
1684*a28cd43dSSascha Wildner }
1685*a28cd43dSSascha Wildner
1686*a28cd43dSSascha Wildner /* Check if "srcFile" is compressed. Only done if --exclude-compressed flag is used
1687*a28cd43dSSascha Wildner * YES => ZSTD will skip compression of the file and will return 0.
1688*a28cd43dSSascha Wildner * NO => ZSTD will resume with compress operation.
1689*a28cd43dSSascha Wildner */
1690*a28cd43dSSascha Wildner if (prefs->excludeCompressedFiles == 1 && UTIL_isCompressedFile(srcFileName, compressedFileExtensions)) {
1691*a28cd43dSSascha Wildner DISPLAYLEVEL(4, "File is already compressed : %s \n", srcFileName);
1692*a28cd43dSSascha Wildner return 0;
1693*a28cd43dSSascha Wildner }
1694*a28cd43dSSascha Wildner
1695*a28cd43dSSascha Wildner ress.srcFile = FIO_openSrcFile(srcFileName);
1696*a28cd43dSSascha Wildner if (ress.srcFile == NULL) return 1; /* srcFile could not be opened */
1697*a28cd43dSSascha Wildner
1698*a28cd43dSSascha Wildner result = FIO_compressFilename_dstFile(fCtx, prefs, ress, dstFileName, srcFileName, compressionLevel);
1699*a28cd43dSSascha Wildner
1700*a28cd43dSSascha Wildner fclose(ress.srcFile);
1701*a28cd43dSSascha Wildner ress.srcFile = NULL;
1702*a28cd43dSSascha Wildner if ( prefs->removeSrcFile /* --rm */
1703*a28cd43dSSascha Wildner && result == 0 /* success */
1704*a28cd43dSSascha Wildner && strcmp(srcFileName, stdinmark) /* exception : don't erase stdin */
1705*a28cd43dSSascha Wildner ) {
1706*a28cd43dSSascha Wildner /* We must clear the handler, since after this point calling it would
1707*a28cd43dSSascha Wildner * delete both the source and destination files.
1708*a28cd43dSSascha Wildner */
1709*a28cd43dSSascha Wildner clearHandler();
1710*a28cd43dSSascha Wildner if (FIO_removeFile(srcFileName))
1711*a28cd43dSSascha Wildner EXM_THROW(1, "zstd: %s: %s", srcFileName, strerror(errno));
1712*a28cd43dSSascha Wildner }
1713*a28cd43dSSascha Wildner return result;
1714*a28cd43dSSascha Wildner }
1715*a28cd43dSSascha Wildner
/*! FIO_compressFilename() :
 *  Single-file entry point : creates compression resources sized for
 *  srcFileName, compresses it into dstFileName through
 *  FIO_compressFilename_srcFile(), then releases the resources.
 * @return : the value returned by FIO_compressFilename_srcFile()
 *           (0 on success)
 */
int FIO_compressFilename(FIO_ctx_t* const fCtx, FIO_prefs_t* const prefs, const char* dstFileName,
                         const char* srcFileName, const char* dictFileName,
                         int compressionLevel, ZSTD_compressionParameters comprParams)
{
    cRess_t const ress = FIO_createCResources(prefs, dictFileName,
                                              UTIL_getFileSize(srcFileName),
                                              compressionLevel, comprParams);
    int const status = FIO_compressFilename_srcFile(fCtx, prefs, ress,
                                                    dstFileName, srcFileName,
                                                    compressionLevel);

/* NOTE(review): macro defined mid-function; kept at this position because
 * code further down the file may depend on it -- confirm before moving. */
#define DISPLAY_LEVEL_DEFAULT 2

    FIO_freeCResources(&ress);
    return status;
}
1728*a28cd43dSSascha Wildner
/* FIO_determineCompressedName() :
 * Builds the destination filename for compressed srcFileName :
 * srcFileName followed by suffix, or, when outDirName is provided,
 * the name produced by FIO_createFilename_fromOutDir() followed by suffix.
 * @return a pointer to a function-owned static buffer holding that name.
 *         The buffer is reused (and possibly reallocated) by the next call,
 *         so the result must be consumed before calling again,
 *         and must not be freed by the caller.
 * This function does not return an error : an allocation failure is
 * reported through EXM_THROW(30, ...).
 */
static const char*
FIO_determineCompressedName(const char* srcFileName, const char* outDirName, const char* suffix)
{
    static size_t dfnbCapacity = 0;
    static char* dstFileNameBuffer = NULL;   /* using static allocation : this function cannot be multi-threaded */
    char* outDirFilename = NULL;
    size_t sfnSize = strlen(srcFileName);
    size_t const srcSuffixLen = strlen(suffix);
    if (outDirName) {
        outDirFilename = FIO_createFilename_fromOutDir(srcFileName, outDirName, srcSuffixLen);
        /* validate the pointer before strlen() dereferences it */
        assert(outDirFilename != NULL);
        sfnSize = strlen(outDirFilename);
    }

    if (dfnbCapacity <= sfnSize+srcSuffixLen+1) {
        /* resize buffer for dstName; previous content is not needed, so free + malloc */
        free(dstFileNameBuffer);
        dfnbCapacity = sfnSize + srcSuffixLen + 30;
        dstFileNameBuffer = (char*)malloc(dfnbCapacity);
        if (!dstFileNameBuffer) {
            EXM_THROW(30, "zstd: %s", strerror(errno));
        }
    }
    assert(dstFileNameBuffer != NULL);

    if (outDirFilename) {
        memcpy(dstFileNameBuffer, outDirFilename, sfnSize);
        free(outDirFilename);   /* temporary name allocated by FIO_createFilename_fromOutDir() */
    } else {
        memcpy(dstFileNameBuffer, srcFileName, sfnSize);
    }
    memcpy(dstFileNameBuffer+sfnSize, suffix, srcSuffixLen+1 /* Include terminating null */);
    return dstFileNameBuffer;
}
1768*a28cd43dSSascha Wildner
/* FIO_getLargestFileSize() :
 * @return the largest value reported by UTIL_getFileSize() across the
 *         nbFiles entries of inFileNames, or 0 when nbFiles == 0.
 */
static unsigned long long FIO_getLargestFileSize(const char** inFileNames, unsigned nbFiles)
{
    unsigned long long largest = 0;
    size_t n;
    for (n = 0; n < nbFiles; n++) {
        unsigned long long const candidate = UTIL_getFileSize(inFileNames[n]);
        if (candidate > largest) {
            largest = candidate;
        }
    }
    return largest;
}
1779*a28cd43dSSascha Wildner
1780*a28cd43dSSascha Wildner /* FIO_compressMultipleFilenames() :
1781*a28cd43dSSascha Wildner * compress nbFiles files
1782*a28cd43dSSascha Wildner * into either one destination (outFileName),
1783*a28cd43dSSascha Wildner * or into one file each (outFileName == NULL, but suffix != NULL),
1784*a28cd43dSSascha Wildner * or into a destination folder (specified with -O)
1785*a28cd43dSSascha Wildner */
FIO_compressMultipleFilenames(FIO_ctx_t * const fCtx,FIO_prefs_t * const prefs,const char ** inFileNamesTable,const char * outMirroredRootDirName,const char * outDirName,const char * outFileName,const char * suffix,const char * dictFileName,int compressionLevel,ZSTD_compressionParameters comprParams)1786*a28cd43dSSascha Wildner int FIO_compressMultipleFilenames(FIO_ctx_t* const fCtx,
1787*a28cd43dSSascha Wildner FIO_prefs_t* const prefs,
1788*a28cd43dSSascha Wildner const char** inFileNamesTable,
1789*a28cd43dSSascha Wildner const char* outMirroredRootDirName,
1790*a28cd43dSSascha Wildner const char* outDirName,
1791*a28cd43dSSascha Wildner const char* outFileName, const char* suffix,
1792*a28cd43dSSascha Wildner const char* dictFileName, int compressionLevel,
1793*a28cd43dSSascha Wildner ZSTD_compressionParameters comprParams)
1794*a28cd43dSSascha Wildner {
1795*a28cd43dSSascha Wildner int status;
1796*a28cd43dSSascha Wildner int error = 0;
1797*a28cd43dSSascha Wildner cRess_t ress = FIO_createCResources(prefs, dictFileName,
1798*a28cd43dSSascha Wildner FIO_getLargestFileSize(inFileNamesTable, fCtx->nbFilesTotal),
1799*a28cd43dSSascha Wildner compressionLevel, comprParams);
1800*a28cd43dSSascha Wildner
1801*a28cd43dSSascha Wildner /* init */
1802*a28cd43dSSascha Wildner assert(outFileName != NULL || suffix != NULL);
1803*a28cd43dSSascha Wildner if (outFileName != NULL) { /* output into a single destination (stdout typically) */
1804*a28cd43dSSascha Wildner if (FIO_removeMultiFilesWarning(fCtx, prefs, outFileName, 1 /* displayLevelCutoff */)) {
1805*a28cd43dSSascha Wildner FIO_freeCResources(&ress);
1806*a28cd43dSSascha Wildner return 1;
1807*a28cd43dSSascha Wildner }
1808*a28cd43dSSascha Wildner ress.dstFile = FIO_openDstFile(fCtx, prefs, NULL, outFileName);
1809*a28cd43dSSascha Wildner if (ress.dstFile == NULL) { /* could not open outFileName */
1810*a28cd43dSSascha Wildner error = 1;
1811*a28cd43dSSascha Wildner } else {
1812*a28cd43dSSascha Wildner for (; fCtx->currFileIdx < fCtx->nbFilesTotal; ++fCtx->currFileIdx) {
1813*a28cd43dSSascha Wildner status = FIO_compressFilename_srcFile(fCtx, prefs, ress, outFileName, inFileNamesTable[fCtx->currFileIdx], compressionLevel);
1814*a28cd43dSSascha Wildner if (!status) fCtx->nbFilesProcessed++;
1815*a28cd43dSSascha Wildner error |= status;
1816*a28cd43dSSascha Wildner }
1817*a28cd43dSSascha Wildner if (fclose(ress.dstFile))
1818*a28cd43dSSascha Wildner EXM_THROW(29, "Write error (%s) : cannot properly close %s",
1819*a28cd43dSSascha Wildner strerror(errno), outFileName);
1820*a28cd43dSSascha Wildner ress.dstFile = NULL;
1821*a28cd43dSSascha Wildner }
1822*a28cd43dSSascha Wildner } else {
1823*a28cd43dSSascha Wildner if (outMirroredRootDirName)
1824*a28cd43dSSascha Wildner UTIL_mirrorSourceFilesDirectories(inFileNamesTable, fCtx->nbFilesTotal, outMirroredRootDirName);
1825*a28cd43dSSascha Wildner
1826*a28cd43dSSascha Wildner for (; fCtx->currFileIdx < fCtx->nbFilesTotal; ++fCtx->currFileIdx) {
1827*a28cd43dSSascha Wildner const char* const srcFileName = inFileNamesTable[fCtx->currFileIdx];
1828*a28cd43dSSascha Wildner const char* dstFileName = NULL;
1829*a28cd43dSSascha Wildner if (outMirroredRootDirName) {
1830*a28cd43dSSascha Wildner char* validMirroredDirName = UTIL_createMirroredDestDirName(srcFileName, outMirroredRootDirName);
1831*a28cd43dSSascha Wildner if (validMirroredDirName) {
1832*a28cd43dSSascha Wildner dstFileName = FIO_determineCompressedName(srcFileName, validMirroredDirName, suffix);
1833*a28cd43dSSascha Wildner free(validMirroredDirName);
1834*a28cd43dSSascha Wildner } else {
1835*a28cd43dSSascha Wildner DISPLAYLEVEL(2, "zstd: --output-dir-mirror cannot compress '%s' into '%s' \n", srcFileName, outMirroredRootDirName);
1836*a28cd43dSSascha Wildner error=1;
1837*a28cd43dSSascha Wildner continue;
1838*a28cd43dSSascha Wildner }
1839*a28cd43dSSascha Wildner } else {
1840*a28cd43dSSascha Wildner dstFileName = FIO_determineCompressedName(srcFileName, outDirName, suffix); /* cannot fail */
1841*a28cd43dSSascha Wildner }
1842*a28cd43dSSascha Wildner status = FIO_compressFilename_srcFile(fCtx, prefs, ress, dstFileName, srcFileName, compressionLevel);
1843*a28cd43dSSascha Wildner if (!status) fCtx->nbFilesProcessed++;
1844*a28cd43dSSascha Wildner error |= status;
1845*a28cd43dSSascha Wildner }
1846*a28cd43dSSascha Wildner
1847*a28cd43dSSascha Wildner if (outDirName)
1848*a28cd43dSSascha Wildner FIO_checkFilenameCollisions(inFileNamesTable , fCtx->nbFilesTotal);
1849*a28cd43dSSascha Wildner }
1850*a28cd43dSSascha Wildner
1851*a28cd43dSSascha Wildner if (fCtx->nbFilesProcessed >= 1 && fCtx->nbFilesTotal > 1 && fCtx->totalBytesInput != 0) {
1852*a28cd43dSSascha Wildner DISPLAYLEVEL(2, "\r%79s\r", "");
1853*a28cd43dSSascha Wildner DISPLAYLEVEL(2, "%d files compressed : %.2f%% (%6zu => %6zu bytes)\n", fCtx->nbFilesProcessed,
1854*a28cd43dSSascha Wildner (double)fCtx->totalBytesOutput/((double)fCtx->totalBytesInput)*100,
1855*a28cd43dSSascha Wildner fCtx->totalBytesInput, fCtx->totalBytesOutput);
1856*a28cd43dSSascha Wildner }
1857*a28cd43dSSascha Wildner
1858*a28cd43dSSascha Wildner FIO_freeCResources(&ress);
1859*a28cd43dSSascha Wildner return error;
1860*a28cd43dSSascha Wildner }
1861*a28cd43dSSascha Wildner
1862*a28cd43dSSascha Wildner #endif /* #ifndef ZSTD_NOCOMPRESS */
1863*a28cd43dSSascha Wildner
1864*a28cd43dSSascha Wildner
1865*a28cd43dSSascha Wildner
1866*a28cd43dSSascha Wildner #ifndef ZSTD_NODECOMPRESS
1867*a28cd43dSSascha Wildner
1868*a28cd43dSSascha Wildner /* **************************************************************************
1869*a28cd43dSSascha Wildner * Decompression
1870*a28cd43dSSascha Wildner ***************************************************************************/
1871*a28cd43dSSascha Wildner typedef struct {
1872*a28cd43dSSascha Wildner void* srcBuffer;
1873*a28cd43dSSascha Wildner size_t srcBufferSize;
1874*a28cd43dSSascha Wildner size_t srcBufferLoaded;
1875*a28cd43dSSascha Wildner void* dstBuffer;
1876*a28cd43dSSascha Wildner size_t dstBufferSize;
1877*a28cd43dSSascha Wildner ZSTD_DStream* dctx;
1878*a28cd43dSSascha Wildner FILE* dstFile;
1879*a28cd43dSSascha Wildner } dRess_t;
1880*a28cd43dSSascha Wildner
FIO_createDResources(FIO_prefs_t * const prefs,const char * dictFileName)1881*a28cd43dSSascha Wildner static dRess_t FIO_createDResources(FIO_prefs_t* const prefs, const char* dictFileName)
1882*a28cd43dSSascha Wildner {
1883*a28cd43dSSascha Wildner dRess_t ress;
1884*a28cd43dSSascha Wildner memset(&ress, 0, sizeof(ress));
1885*a28cd43dSSascha Wildner
1886*a28cd43dSSascha Wildner if (prefs->patchFromMode)
1887*a28cd43dSSascha Wildner FIO_adjustMemLimitForPatchFromMode(prefs, UTIL_getFileSize(dictFileName), 0 /* just use the dict size */);
1888*a28cd43dSSascha Wildner
1889*a28cd43dSSascha Wildner /* Allocation */
1890*a28cd43dSSascha Wildner ress.dctx = ZSTD_createDStream();
1891*a28cd43dSSascha Wildner if (ress.dctx==NULL)
1892*a28cd43dSSascha Wildner EXM_THROW(60, "Error: %s : can't create ZSTD_DStream", strerror(errno));
1893*a28cd43dSSascha Wildner CHECK( ZSTD_DCtx_setMaxWindowSize(ress.dctx, prefs->memLimit) );
1894*a28cd43dSSascha Wildner CHECK( ZSTD_DCtx_setParameter(ress.dctx, ZSTD_d_forceIgnoreChecksum, !prefs->checksumFlag));
1895*a28cd43dSSascha Wildner
1896*a28cd43dSSascha Wildner ress.srcBufferSize = ZSTD_DStreamInSize();
1897*a28cd43dSSascha Wildner ress.srcBuffer = malloc(ress.srcBufferSize);
1898*a28cd43dSSascha Wildner ress.dstBufferSize = ZSTD_DStreamOutSize();
1899*a28cd43dSSascha Wildner ress.dstBuffer = malloc(ress.dstBufferSize);
1900*a28cd43dSSascha Wildner if (!ress.srcBuffer || !ress.dstBuffer)
1901*a28cd43dSSascha Wildner EXM_THROW(61, "Allocation error : not enough memory");
1902*a28cd43dSSascha Wildner
1903*a28cd43dSSascha Wildner /* dictionary */
1904*a28cd43dSSascha Wildner { void* dictBuffer;
1905*a28cd43dSSascha Wildner size_t const dictBufferSize = FIO_createDictBuffer(&dictBuffer, dictFileName, prefs);
1906*a28cd43dSSascha Wildner CHECK( ZSTD_initDStream_usingDict(ress.dctx, dictBuffer, dictBufferSize) );
1907*a28cd43dSSascha Wildner free(dictBuffer);
1908*a28cd43dSSascha Wildner }
1909*a28cd43dSSascha Wildner
1910*a28cd43dSSascha Wildner return ress;
1911*a28cd43dSSascha Wildner }
1912*a28cd43dSSascha Wildner
/* FIO_freeDResources() :
 * Releases the decompression stream and both I/O buffers held by ress.
 * ress.dstFile is not touched here.
 */
static void FIO_freeDResources(dRess_t ress)
{
    CHECK( ZSTD_freeDStream(ress.dctx) );
    free(ress.dstBuffer);
    free(ress.srcBuffer);
}
1919*a28cd43dSSascha Wildner
1920*a28cd43dSSascha Wildner
1921*a28cd43dSSascha Wildner /** FIO_fwriteSparse() :
1922*a28cd43dSSascha Wildner * @return : storedSkips,
1923*a28cd43dSSascha Wildner * argument for next call to FIO_fwriteSparse() or FIO_fwriteSparseEnd() */
1924*a28cd43dSSascha Wildner static unsigned
FIO_fwriteSparse(FILE * file,const void * buffer,size_t bufferSize,const FIO_prefs_t * const prefs,unsigned storedSkips)1925*a28cd43dSSascha Wildner FIO_fwriteSparse(FILE* file,
1926*a28cd43dSSascha Wildner const void* buffer, size_t bufferSize,
1927*a28cd43dSSascha Wildner const FIO_prefs_t* const prefs,
1928*a28cd43dSSascha Wildner unsigned storedSkips)
1929*a28cd43dSSascha Wildner {
1930*a28cd43dSSascha Wildner const size_t* const bufferT = (const size_t*)buffer; /* Buffer is supposed malloc'ed, hence aligned on size_t */
1931*a28cd43dSSascha Wildner size_t bufferSizeT = bufferSize / sizeof(size_t);
1932*a28cd43dSSascha Wildner const size_t* const bufferTEnd = bufferT + bufferSizeT;
1933*a28cd43dSSascha Wildner const size_t* ptrT = bufferT;
1934*a28cd43dSSascha Wildner static const size_t segmentSizeT = (32 KB) / sizeof(size_t); /* check every 32 KB */
1935*a28cd43dSSascha Wildner
1936*a28cd43dSSascha Wildner if (prefs->testMode) return 0; /* do not output anything in test mode */
1937*a28cd43dSSascha Wildner
1938*a28cd43dSSascha Wildner if (!prefs->sparseFileSupport) { /* normal write */
1939*a28cd43dSSascha Wildner size_t const sizeCheck = fwrite(buffer, 1, bufferSize, file);
1940*a28cd43dSSascha Wildner if (sizeCheck != bufferSize)
1941*a28cd43dSSascha Wildner EXM_THROW(70, "Write error : cannot write decoded block : %s",
1942*a28cd43dSSascha Wildner strerror(errno));
1943*a28cd43dSSascha Wildner return 0;
1944*a28cd43dSSascha Wildner }
1945*a28cd43dSSascha Wildner
1946*a28cd43dSSascha Wildner /* avoid int overflow */
1947*a28cd43dSSascha Wildner if (storedSkips > 1 GB) {
1948*a28cd43dSSascha Wildner if (LONG_SEEK(file, 1 GB, SEEK_CUR) != 0)
1949*a28cd43dSSascha Wildner EXM_THROW(91, "1 GB skip error (sparse file support)");
1950*a28cd43dSSascha Wildner storedSkips -= 1 GB;
1951*a28cd43dSSascha Wildner }
1952*a28cd43dSSascha Wildner
1953*a28cd43dSSascha Wildner while (ptrT < bufferTEnd) {
1954*a28cd43dSSascha Wildner size_t nb0T;
1955*a28cd43dSSascha Wildner
1956*a28cd43dSSascha Wildner /* adjust last segment if < 32 KB */
1957*a28cd43dSSascha Wildner size_t seg0SizeT = segmentSizeT;
1958*a28cd43dSSascha Wildner if (seg0SizeT > bufferSizeT) seg0SizeT = bufferSizeT;
1959*a28cd43dSSascha Wildner bufferSizeT -= seg0SizeT;
1960*a28cd43dSSascha Wildner
1961*a28cd43dSSascha Wildner /* count leading zeroes */
1962*a28cd43dSSascha Wildner for (nb0T=0; (nb0T < seg0SizeT) && (ptrT[nb0T] == 0); nb0T++) ;
1963*a28cd43dSSascha Wildner storedSkips += (unsigned)(nb0T * sizeof(size_t));
1964*a28cd43dSSascha Wildner
1965*a28cd43dSSascha Wildner if (nb0T != seg0SizeT) { /* not all 0s */
1966*a28cd43dSSascha Wildner size_t const nbNon0ST = seg0SizeT - nb0T;
1967*a28cd43dSSascha Wildner /* skip leading zeros */
1968*a28cd43dSSascha Wildner if (LONG_SEEK(file, storedSkips, SEEK_CUR) != 0)
1969*a28cd43dSSascha Wildner EXM_THROW(92, "Sparse skip error ; try --no-sparse");
1970*a28cd43dSSascha Wildner storedSkips = 0;
1971*a28cd43dSSascha Wildner /* write the rest */
1972*a28cd43dSSascha Wildner if (fwrite(ptrT + nb0T, sizeof(size_t), nbNon0ST, file) != nbNon0ST)
1973*a28cd43dSSascha Wildner EXM_THROW(93, "Write error : cannot write decoded block : %s",
1974*a28cd43dSSascha Wildner strerror(errno));
1975*a28cd43dSSascha Wildner }
1976*a28cd43dSSascha Wildner ptrT += seg0SizeT;
1977*a28cd43dSSascha Wildner }
1978*a28cd43dSSascha Wildner
1979*a28cd43dSSascha Wildner { static size_t const maskT = sizeof(size_t)-1;
1980*a28cd43dSSascha Wildner if (bufferSize & maskT) {
1981*a28cd43dSSascha Wildner /* size not multiple of sizeof(size_t) : implies end of block */
1982*a28cd43dSSascha Wildner const char* const restStart = (const char*)bufferTEnd;
1983*a28cd43dSSascha Wildner const char* restPtr = restStart;
1984*a28cd43dSSascha Wildner const char* const restEnd = (const char*)buffer + bufferSize;
1985*a28cd43dSSascha Wildner assert(restEnd > restStart && restEnd < restStart + sizeof(size_t));
1986*a28cd43dSSascha Wildner for ( ; (restPtr < restEnd) && (*restPtr == 0); restPtr++) ;
1987*a28cd43dSSascha Wildner storedSkips += (unsigned) (restPtr - restStart);
1988*a28cd43dSSascha Wildner if (restPtr != restEnd) {
1989*a28cd43dSSascha Wildner /* not all remaining bytes are 0 */
1990*a28cd43dSSascha Wildner size_t const restSize = (size_t)(restEnd - restPtr);
1991*a28cd43dSSascha Wildner if (LONG_SEEK(file, storedSkips, SEEK_CUR) != 0)
1992*a28cd43dSSascha Wildner EXM_THROW(92, "Sparse skip error ; try --no-sparse");
1993*a28cd43dSSascha Wildner if (fwrite(restPtr, 1, restSize, file) != restSize)
1994*a28cd43dSSascha Wildner EXM_THROW(95, "Write error : cannot write end of decoded block : %s",
1995*a28cd43dSSascha Wildner strerror(errno));
1996*a28cd43dSSascha Wildner storedSkips = 0;
1997*a28cd43dSSascha Wildner } } }
1998*a28cd43dSSascha Wildner
1999*a28cd43dSSascha Wildner return storedSkips;
2000*a28cd43dSSascha Wildner }
2001*a28cd43dSSascha Wildner
2002*a28cd43dSSascha Wildner static void
FIO_fwriteSparseEnd(const FIO_prefs_t * const prefs,FILE * file,unsigned storedSkips)2003*a28cd43dSSascha Wildner FIO_fwriteSparseEnd(const FIO_prefs_t* const prefs, FILE* file, unsigned storedSkips)
2004*a28cd43dSSascha Wildner {
2005*a28cd43dSSascha Wildner if (prefs->testMode) assert(storedSkips == 0);
2006*a28cd43dSSascha Wildner if (storedSkips>0) {
2007*a28cd43dSSascha Wildner assert(prefs->sparseFileSupport > 0); /* storedSkips>0 implies sparse support is enabled */
2008*a28cd43dSSascha Wildner (void)prefs; /* assert can be disabled, in which case prefs becomes unused */
2009*a28cd43dSSascha Wildner if (LONG_SEEK(file, storedSkips-1, SEEK_CUR) != 0)
2010*a28cd43dSSascha Wildner EXM_THROW(69, "Final skip error (sparse file support)");
2011*a28cd43dSSascha Wildner /* last zero must be explicitly written,
2012*a28cd43dSSascha Wildner * so that skipped ones get implicitly translated as zero by FS */
2013*a28cd43dSSascha Wildner { const char lastZeroByte[1] = { 0 };
2014*a28cd43dSSascha Wildner if (fwrite(lastZeroByte, 1, 1, file) != 1)
2015*a28cd43dSSascha Wildner EXM_THROW(69, "Write error : cannot write last zero : %s", strerror(errno));
2016*a28cd43dSSascha Wildner } }
2017*a28cd43dSSascha Wildner }
2018*a28cd43dSSascha Wildner
2019*a28cd43dSSascha Wildner
2020*a28cd43dSSascha Wildner /** FIO_passThrough() : just copy input into output, for compatibility with gzip -df mode
2021*a28cd43dSSascha Wildner @return : 0 (no error) */
FIO_passThrough(const FIO_prefs_t * const prefs,FILE * foutput,FILE * finput,void * buffer,size_t bufferSize,size_t alreadyLoaded)2022*a28cd43dSSascha Wildner static int FIO_passThrough(const FIO_prefs_t* const prefs,
2023*a28cd43dSSascha Wildner FILE* foutput, FILE* finput,
2024*a28cd43dSSascha Wildner void* buffer, size_t bufferSize,
2025*a28cd43dSSascha Wildner size_t alreadyLoaded)
2026*a28cd43dSSascha Wildner {
2027*a28cd43dSSascha Wildner size_t const blockSize = MIN(64 KB, bufferSize);
2028*a28cd43dSSascha Wildner size_t readFromInput;
2029*a28cd43dSSascha Wildner unsigned storedSkips = 0;
2030*a28cd43dSSascha Wildner
2031*a28cd43dSSascha Wildner /* assumption : ress->srcBufferLoaded bytes already loaded and stored within buffer */
2032*a28cd43dSSascha Wildner { size_t const sizeCheck = fwrite(buffer, 1, alreadyLoaded, foutput);
2033*a28cd43dSSascha Wildner if (sizeCheck != alreadyLoaded) {
2034*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "Pass-through write error : %s\n", strerror(errno));
2035*a28cd43dSSascha Wildner return 1;
2036*a28cd43dSSascha Wildner } }
2037*a28cd43dSSascha Wildner
2038*a28cd43dSSascha Wildner do {
2039*a28cd43dSSascha Wildner readFromInput = fread(buffer, 1, blockSize, finput);
2040*a28cd43dSSascha Wildner storedSkips = FIO_fwriteSparse(foutput, buffer, readFromInput, prefs, storedSkips);
2041*a28cd43dSSascha Wildner } while (readFromInput == blockSize);
2042*a28cd43dSSascha Wildner if (ferror(finput)) {
2043*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "Pass-through read error : %s\n", strerror(errno));
2044*a28cd43dSSascha Wildner return 1;
2045*a28cd43dSSascha Wildner }
2046*a28cd43dSSascha Wildner assert(feof(finput));
2047*a28cd43dSSascha Wildner
2048*a28cd43dSSascha Wildner FIO_fwriteSparseEnd(prefs, foutput, storedSkips);
2049*a28cd43dSSascha Wildner return 0;
2050*a28cd43dSSascha Wildner }
2051*a28cd43dSSascha Wildner
2052*a28cd43dSSascha Wildner /* FIO_zstdErrorHelp() :
2053*a28cd43dSSascha Wildner * detailed error message when requested window size is too large */
2054*a28cd43dSSascha Wildner static void
FIO_zstdErrorHelp(const FIO_prefs_t * const prefs,const dRess_t * ress,size_t err,const char * srcFileName)2055*a28cd43dSSascha Wildner FIO_zstdErrorHelp(const FIO_prefs_t* const prefs,
2056*a28cd43dSSascha Wildner const dRess_t* ress,
2057*a28cd43dSSascha Wildner size_t err, const char* srcFileName)
2058*a28cd43dSSascha Wildner {
2059*a28cd43dSSascha Wildner ZSTD_frameHeader header;
2060*a28cd43dSSascha Wildner
2061*a28cd43dSSascha Wildner /* Help message only for one specific error */
2062*a28cd43dSSascha Wildner if (ZSTD_getErrorCode(err) != ZSTD_error_frameParameter_windowTooLarge)
2063*a28cd43dSSascha Wildner return;
2064*a28cd43dSSascha Wildner
2065*a28cd43dSSascha Wildner /* Try to decode the frame header */
2066*a28cd43dSSascha Wildner err = ZSTD_getFrameHeader(&header, ress->srcBuffer, ress->srcBufferLoaded);
2067*a28cd43dSSascha Wildner if (err == 0) {
2068*a28cd43dSSascha Wildner unsigned long long const windowSize = header.windowSize;
2069*a28cd43dSSascha Wildner unsigned const windowLog = FIO_highbit64(windowSize) + ((windowSize & (windowSize - 1)) != 0);
2070*a28cd43dSSascha Wildner assert(prefs->memLimit > 0);
2071*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "%s : Window size larger than maximum : %llu > %u \n",
2072*a28cd43dSSascha Wildner srcFileName, windowSize, prefs->memLimit);
2073*a28cd43dSSascha Wildner if (windowLog <= ZSTD_WINDOWLOG_MAX) {
2074*a28cd43dSSascha Wildner unsigned const windowMB = (unsigned)((windowSize >> 20) + ((windowSize & ((1 MB) - 1)) != 0));
2075*a28cd43dSSascha Wildner assert(windowSize < (U64)(1ULL << 52)); /* ensure now overflow for windowMB */
2076*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "%s : Use --long=%u or --memory=%uMB \n",
2077*a28cd43dSSascha Wildner srcFileName, windowLog, windowMB);
2078*a28cd43dSSascha Wildner return;
2079*a28cd43dSSascha Wildner } }
2080*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "%s : Window log larger than ZSTD_WINDOWLOG_MAX=%u; not supported \n",
2081*a28cd43dSSascha Wildner srcFileName, ZSTD_WINDOWLOG_MAX);
2082*a28cd43dSSascha Wildner }
2083*a28cd43dSSascha Wildner
2084*a28cd43dSSascha Wildner /** FIO_decompressFrame() :
2085*a28cd43dSSascha Wildner * @return : size of decoded zstd frame, or an error code
2086*a28cd43dSSascha Wildner */
2087*a28cd43dSSascha Wildner #define FIO_ERROR_FRAME_DECODING ((unsigned long long)(-2))
2088*a28cd43dSSascha Wildner static unsigned long long
FIO_decompressZstdFrame(FIO_ctx_t * const fCtx,dRess_t * ress,FILE * finput,const FIO_prefs_t * const prefs,const char * srcFileName,U64 alreadyDecoded)2089*a28cd43dSSascha Wildner FIO_decompressZstdFrame(FIO_ctx_t* const fCtx, dRess_t* ress, FILE* finput,
2090*a28cd43dSSascha Wildner const FIO_prefs_t* const prefs,
2091*a28cd43dSSascha Wildner const char* srcFileName,
2092*a28cd43dSSascha Wildner U64 alreadyDecoded) /* for multi-frames streams */
2093*a28cd43dSSascha Wildner {
2094*a28cd43dSSascha Wildner U64 frameSize = 0;
2095*a28cd43dSSascha Wildner U32 storedSkips = 0;
2096*a28cd43dSSascha Wildner
2097*a28cd43dSSascha Wildner /* display last 20 characters only */
2098*a28cd43dSSascha Wildner { size_t const srcFileLength = strlen(srcFileName);
2099*a28cd43dSSascha Wildner if (srcFileLength>20) srcFileName += srcFileLength-20;
2100*a28cd43dSSascha Wildner }
2101*a28cd43dSSascha Wildner
2102*a28cd43dSSascha Wildner ZSTD_resetDStream(ress->dctx);
2103*a28cd43dSSascha Wildner
2104*a28cd43dSSascha Wildner /* Header loading : ensures ZSTD_getFrameHeader() will succeed */
2105*a28cd43dSSascha Wildner { size_t const toDecode = ZSTD_FRAMEHEADERSIZE_MAX;
2106*a28cd43dSSascha Wildner if (ress->srcBufferLoaded < toDecode) {
2107*a28cd43dSSascha Wildner size_t const toRead = toDecode - ress->srcBufferLoaded;
2108*a28cd43dSSascha Wildner void* const startPosition = (char*)ress->srcBuffer + ress->srcBufferLoaded;
2109*a28cd43dSSascha Wildner ress->srcBufferLoaded += fread(startPosition, 1, toRead, finput);
2110*a28cd43dSSascha Wildner } }
2111*a28cd43dSSascha Wildner
2112*a28cd43dSSascha Wildner /* Main decompression Loop */
2113*a28cd43dSSascha Wildner while (1) {
2114*a28cd43dSSascha Wildner ZSTD_inBuffer inBuff = { ress->srcBuffer, ress->srcBufferLoaded, 0 };
2115*a28cd43dSSascha Wildner ZSTD_outBuffer outBuff= { ress->dstBuffer, ress->dstBufferSize, 0 };
2116*a28cd43dSSascha Wildner size_t const readSizeHint = ZSTD_decompressStream(ress->dctx, &outBuff, &inBuff);
2117*a28cd43dSSascha Wildner if (ZSTD_isError(readSizeHint)) {
2118*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "%s : Decoding error (36) : %s \n",
2119*a28cd43dSSascha Wildner srcFileName, ZSTD_getErrorName(readSizeHint));
2120*a28cd43dSSascha Wildner FIO_zstdErrorHelp(prefs, ress, readSizeHint, srcFileName);
2121*a28cd43dSSascha Wildner return FIO_ERROR_FRAME_DECODING;
2122*a28cd43dSSascha Wildner }
2123*a28cd43dSSascha Wildner
2124*a28cd43dSSascha Wildner /* Write block */
2125*a28cd43dSSascha Wildner storedSkips = FIO_fwriteSparse(ress->dstFile, ress->dstBuffer, outBuff.pos, prefs, storedSkips);
2126*a28cd43dSSascha Wildner frameSize += outBuff.pos;
2127*a28cd43dSSascha Wildner if (!fCtx->hasStdoutOutput) {
2128*a28cd43dSSascha Wildner if (fCtx->nbFilesTotal > 1) {
2129*a28cd43dSSascha Wildner size_t srcFileNameSize = strlen(srcFileName);
2130*a28cd43dSSascha Wildner if (srcFileNameSize > 18) {
2131*a28cd43dSSascha Wildner const char* truncatedSrcFileName = srcFileName + srcFileNameSize - 15;
2132*a28cd43dSSascha Wildner DISPLAYUPDATE(2, "\rDecompress: %2u/%2u files. Current: ...%s : %u MB... ",
2133*a28cd43dSSascha Wildner fCtx->currFileIdx+1, fCtx->nbFilesTotal, truncatedSrcFileName, (unsigned)((alreadyDecoded+frameSize)>>20) );
2134*a28cd43dSSascha Wildner } else {
2135*a28cd43dSSascha Wildner DISPLAYUPDATE(2, "\rDecompress: %2u/%2u files. Current: %s : %u MB... ",
2136*a28cd43dSSascha Wildner fCtx->currFileIdx+1, fCtx->nbFilesTotal, srcFileName, (unsigned)((alreadyDecoded+frameSize)>>20) );
2137*a28cd43dSSascha Wildner }
2138*a28cd43dSSascha Wildner } else {
2139*a28cd43dSSascha Wildner DISPLAYUPDATE(2, "\r%-20.20s : %u MB... ",
2140*a28cd43dSSascha Wildner srcFileName, (unsigned)((alreadyDecoded+frameSize)>>20) );
2141*a28cd43dSSascha Wildner }
2142*a28cd43dSSascha Wildner }
2143*a28cd43dSSascha Wildner
2144*a28cd43dSSascha Wildner if (inBuff.pos > 0) {
2145*a28cd43dSSascha Wildner memmove(ress->srcBuffer, (char*)ress->srcBuffer + inBuff.pos, inBuff.size - inBuff.pos);
2146*a28cd43dSSascha Wildner ress->srcBufferLoaded -= inBuff.pos;
2147*a28cd43dSSascha Wildner }
2148*a28cd43dSSascha Wildner
2149*a28cd43dSSascha Wildner if (readSizeHint == 0) break; /* end of frame */
2150*a28cd43dSSascha Wildner
2151*a28cd43dSSascha Wildner /* Fill input buffer */
2152*a28cd43dSSascha Wildner { size_t const toDecode = MIN(readSizeHint, ress->srcBufferSize); /* support large skippable frames */
2153*a28cd43dSSascha Wildner if (ress->srcBufferLoaded < toDecode) {
2154*a28cd43dSSascha Wildner size_t const toRead = toDecode - ress->srcBufferLoaded; /* > 0 */
2155*a28cd43dSSascha Wildner void* const startPosition = (char*)ress->srcBuffer + ress->srcBufferLoaded;
2156*a28cd43dSSascha Wildner size_t const readSize = fread(startPosition, 1, toRead, finput);
2157*a28cd43dSSascha Wildner if (readSize==0) {
2158*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "%s : Read error (39) : premature end \n",
2159*a28cd43dSSascha Wildner srcFileName);
2160*a28cd43dSSascha Wildner return FIO_ERROR_FRAME_DECODING;
2161*a28cd43dSSascha Wildner }
2162*a28cd43dSSascha Wildner ress->srcBufferLoaded += readSize;
2163*a28cd43dSSascha Wildner } } }
2164*a28cd43dSSascha Wildner
2165*a28cd43dSSascha Wildner FIO_fwriteSparseEnd(prefs, ress->dstFile, storedSkips);
2166*a28cd43dSSascha Wildner
2167*a28cd43dSSascha Wildner return frameSize;
2168*a28cd43dSSascha Wildner }
2169*a28cd43dSSascha Wildner
2170*a28cd43dSSascha Wildner
#ifdef ZSTD_GZDECOMPRESS
/* FIO_decompressGzFrame() :
 * decodes a gzip stream with zlib's inflate(), starting with the bytes already
 * loaded in ress->srcBuffer, then refilling that buffer from `srcFile`.
 * Decoded data is written into ress->dstFile through FIO_fwriteSparse().
 * On exit, input not consumed by zlib is moved to the start of ress->srcBuffer
 * and ress->srcBufferLoaded is set to its size.
 * @return : decoded size, or FIO_ERROR_FRAME_DECODING on error
 */
static unsigned long long
FIO_decompressGzFrame(dRess_t* ress, FILE* srcFile,
                      const FIO_prefs_t* const prefs,
                      const char* srcFileName)
{
    unsigned long long totalOut = 0;
    z_stream zs;
    int flushMode = Z_NO_FLUSH;
    int failed = 0;
    unsigned pendingSkips = 0;

    zs.zalloc = Z_NULL;
    zs.zfree = Z_NULL;
    zs.opaque = Z_NULL;
    zs.next_in = 0;
    zs.avail_in = 0;
    /* see http://www.zlib.net/manual.html */
    if (inflateInit2(&zs, 15 /* maxWindowLogSize */ + 16 /* gzip only */) != Z_OK)
        return FIO_ERROR_FRAME_DECODING;

    zs.next_out = (Bytef*)ress->dstBuffer;
    zs.avail_out = (uInt)ress->dstBufferSize;
    zs.avail_in = (uInt)ress->srcBufferLoaded;
    zs.next_in = (z_const unsigned char*)ress->srcBuffer;

    while (1) {
        int status;

        /* refill input once zlib has consumed everything ;
         * an empty read switches inflate() to Z_FINISH */
        if (zs.avail_in == 0) {
            ress->srcBufferLoaded = fread(ress->srcBuffer, 1, ress->srcBufferSize, srcFile);
            if (ress->srcBufferLoaded == 0) flushMode = Z_FINISH;
            zs.next_in = (z_const unsigned char*)ress->srcBuffer;
            zs.avail_in = (uInt)ress->srcBufferLoaded;
        }

        status = inflate(&zs, flushMode);
        if (status == Z_BUF_ERROR) {
            DISPLAYLEVEL(1, "zstd: %s: premature gz end \n", srcFileName);
            failed = 1;
            break;
        }
        if (status != Z_OK && status != Z_STREAM_END) {
            DISPLAYLEVEL(1, "zstd: %s: inflate error %d \n", srcFileName, status);
            failed = 1;
            break;
        }

        /* flush whatever was produced, then hand the whole output buffer back to zlib */
        {   size_t const produced = ress->dstBufferSize - zs.avail_out;
            if (produced) {
                pendingSkips = FIO_fwriteSparse(ress->dstFile, ress->dstBuffer, produced, prefs, pendingSkips);
                totalOut += produced;
                zs.next_out = (Bytef*)ress->dstBuffer;
                zs.avail_out = (uInt)ress->dstBufferSize;
            }
        }

        if (status == Z_STREAM_END) break;
    }

    /* preserve unconsumed input for the caller */
    if (zs.avail_in > 0)
        memmove(ress->srcBuffer, zs.next_in, zs.avail_in);
    ress->srcBufferLoaded = zs.avail_in;

    /* release zlib resources (always) ; only report a failure if none was reported yet */
    {   int const endStatus = inflateEnd(&zs);
        if ( (endStatus != Z_OK) && (failed==0) ) {
            DISPLAYLEVEL(1, "zstd: %s: inflateEnd error \n", srcFileName);
            failed = 1;
        }
    }

    FIO_fwriteSparseEnd(prefs, ress->dstFile, pendingSkips);
    return failed ? FIO_ERROR_FRAME_DECODING : totalOut;
}
#endif
2237*a28cd43dSSascha Wildner
2238*a28cd43dSSascha Wildner
#ifdef ZSTD_LZMADECOMPRESS
/* FIO_decompressLzmaFrame() :
 * decodes an xz stream, or a legacy .lzma stream when `plain_lzma` is non-zero,
 * starting with the bytes already loaded in ress->srcBuffer, then refilling
 * that buffer from `srcFile`.
 * Decoded data is written into ress->dstFile through FIO_fwriteSparse().
 * On exit, input not consumed by liblzma is moved to the start of ress->srcBuffer
 * and ress->srcBufferLoaded is set to its size.
 * @return : decoded size, or FIO_ERROR_FRAME_DECODING on error
 */
static unsigned long long
FIO_decompressLzmaFrame(dRess_t* ress, FILE* srcFile,
                        const FIO_prefs_t* const prefs,
                        const char* srcFileName, int plain_lzma)
{
    unsigned long long outFileSize = 0;
    lzma_stream strm = LZMA_STREAM_INIT;
    lzma_action action = LZMA_RUN;
    lzma_ret initRet;
    int decodingError = 0;
    unsigned storedSkips = 0;

    strm.next_in = 0;
    strm.avail_in = 0;
    if (plain_lzma) {
        initRet = lzma_alone_decoder(&strm, UINT64_MAX); /* LZMA */
    } else {
        initRet = lzma_stream_decoder(&strm, UINT64_MAX, 0); /* XZ */
    }

    if (initRet != LZMA_OK) {
        /* file name first, then the failing decoder :
         * same "zstd: <file>: <what>" layout as every other message here */
        DISPLAYLEVEL(1, "zstd: %s: %s error %d \n",
                        srcFileName,
                        plain_lzma ? "lzma_alone_decoder" : "lzma_stream_decoder",
                        initRet);
        return FIO_ERROR_FRAME_DECODING;
    }

    strm.next_out = (BYTE*)ress->dstBuffer;
    strm.avail_out = ress->dstBufferSize;
    strm.next_in = (BYTE const*)ress->srcBuffer;
    strm.avail_in = ress->srcBufferLoaded;

    for ( ; ; ) {
        lzma_ret ret;

        /* refill input once liblzma has consumed everything ;
         * an empty read switches lzma_code() to LZMA_FINISH */
        if (strm.avail_in == 0) {
            ress->srcBufferLoaded = fread(ress->srcBuffer, 1, ress->srcBufferSize, srcFile);
            if (ress->srcBufferLoaded == 0) action = LZMA_FINISH;
            strm.next_in = (BYTE const*)ress->srcBuffer;
            strm.avail_in = ress->srcBufferLoaded;
        }
        ret = lzma_code(&strm, action);

        if (ret == LZMA_BUF_ERROR) {
            DISPLAYLEVEL(1, "zstd: %s: premature lzma end \n", srcFileName);
            decodingError = 1; break;
        }
        if (ret != LZMA_OK && ret != LZMA_STREAM_END) {
            DISPLAYLEVEL(1, "zstd: %s: lzma_code decoding error %d \n",
                            srcFileName, ret);
            decodingError = 1; break;
        }

        /* flush whatever was produced, then hand the whole output buffer back to liblzma */
        {   size_t const decompBytes = ress->dstBufferSize - strm.avail_out;
            if (decompBytes) {
                storedSkips = FIO_fwriteSparse(ress->dstFile, ress->dstBuffer, decompBytes, prefs, storedSkips);
                outFileSize += decompBytes;
                strm.next_out = (BYTE*)ress->dstBuffer;
                strm.avail_out = ress->dstBufferSize;
        }   }
        if (ret == LZMA_STREAM_END) break;
    }

    /* preserve unconsumed input for the caller */
    if (strm.avail_in > 0)
        memmove(ress->srcBuffer, strm.next_in, strm.avail_in);
    ress->srcBufferLoaded = strm.avail_in;
    lzma_end(&strm);
    FIO_fwriteSparseEnd(prefs, ress->dstFile, storedSkips);
    return decodingError ? FIO_ERROR_FRAME_DECODING : outFileSize;
}
#endif
2309*a28cd43dSSascha Wildner
#ifdef ZSTD_LZ4DECOMPRESS
/* FIO_decompressLz4Frame() :
 * decodes one lz4 frame read from `srcFile` with the LZ4F streaming API.
 * The decoder is first fed the 4-byte magic number, re-created in ress->srcBuffer.
 * Decoded data is written into ress->dstFile through FIO_fwriteSparse().
 * ress->srcBufferLoaded is reset to 0 before returning.
 * @return : decoded size, or FIO_ERROR_FRAME_DECODING on error
 */
static unsigned long long
FIO_decompressLz4Frame(dRess_t* ress, FILE* srcFile,
                       const FIO_prefs_t* const prefs,
                       const char* srcFileName)
{
    unsigned long long totalOut = 0;
    LZ4F_errorCode_t toLoad;
    LZ4F_decompressionContext_t lz4Ctx;
    LZ4F_errorCode_t const createStatus = LZ4F_createDecompressionContext(&lz4Ctx, LZ4F_VERSION);
    int failed = 0;
    unsigned pendingSkips = 0;

    if (LZ4F_isError(createStatus)) {
        DISPLAYLEVEL(1, "zstd: failed to create lz4 decompression context \n");
        return FIO_ERROR_FRAME_DECODING;
    }

    /* Init feed with magic number (already consumed from FILE* sFile) */
    {   size_t magicSize = 4;
        size_t noOutput = 0;
        MEM_writeLE32(ress->srcBuffer, LZ4_MAGICNUMBER);
        toLoad = LZ4F_decompress(lz4Ctx, ress->dstBuffer, &noOutput, ress->srcBuffer, &magicSize, NULL);
        if (LZ4F_isError(toLoad)) {
            DISPLAYLEVEL(1, "zstd: %s: lz4 header error : %s \n",
                            srcFileName, LZ4F_getErrorName(toLoad));
            LZ4F_freeDecompressionContext(lz4Ctx);
            return FIO_ERROR_FRAME_DECODING;
        }
    }

    /* Main Loop : runs as long as the decoder asks for more input */
    while (toLoad != 0) {
        size_t nbRead;
        size_t consumed = 0;
        size_t produced = ress->dstBufferSize;

        /* Read input : never more than the source buffer can hold */
        if (toLoad > ress->srcBufferSize) toLoad = ress->srcBufferSize;
        nbRead = fread(ress->srcBuffer, 1, toLoad, srcFile);
        if (nbRead == 0) break;   /* reached end of file or stream */

        /* keep decoding while input remains, or while the last call filled the output buffer */
        while ((consumed < nbRead) || (produced == ress->dstBufferSize)) {
            /* Decode Input (at least partially) */
            size_t chunk = nbRead - consumed;
            produced = ress->dstBufferSize;
            toLoad = LZ4F_decompress(lz4Ctx, ress->dstBuffer, &produced, (char*)(ress->srcBuffer)+consumed, &chunk, NULL);
            if (LZ4F_isError(toLoad)) {
                DISPLAYLEVEL(1, "zstd: %s: lz4 decompression error : %s \n",
                                srcFileName, LZ4F_getErrorName(toLoad));
                failed = 1;
                toLoad = 0;   /* also terminates the outer loop */
                break;
            }
            consumed += chunk;

            /* Write Block */
            if (produced) {
                pendingSkips = FIO_fwriteSparse(ress->dstFile, ress->dstBuffer, produced, prefs, pendingSkips);
                totalOut += produced;
                DISPLAYUPDATE(2, "\rDecompressed : %u MB ", (unsigned)(totalOut>>20));
            }

            if (toLoad == 0) break;
        }
    }

    /* can be out because nbRead == 0, which could be an fread() error */
    if (ferror(srcFile)) {
        DISPLAYLEVEL(1, "zstd: %s: read error \n", srcFileName);
        failed = 1;
    }

    /* the decoder still expected input : the stream was cut short */
    if (toLoad != 0) {
        DISPLAYLEVEL(1, "zstd: %s: unfinished lz4 stream \n", srcFileName);
        failed = 1;
    }

    LZ4F_freeDecompressionContext(lz4Ctx);
    ress->srcBufferLoaded = 0;   /* LZ4F will reach exact frame boundary */
    FIO_fwriteSparseEnd(prefs, ress->dstFile, pendingSkips);

    return failed ? FIO_ERROR_FRAME_DECODING : totalOut;
}
#endif
2391*a28cd43dSSascha Wildner
2392*a28cd43dSSascha Wildner
2393*a28cd43dSSascha Wildner
2394*a28cd43dSSascha Wildner /** FIO_decompressFrames() :
2395*a28cd43dSSascha Wildner * Find and decode frames inside srcFile
2396*a28cd43dSSascha Wildner * srcFile presumed opened and valid
2397*a28cd43dSSascha Wildner * @return : 0 : OK
2398*a28cd43dSSascha Wildner * 1 : error
2399*a28cd43dSSascha Wildner */
FIO_decompressFrames(FIO_ctx_t * const fCtx,dRess_t ress,FILE * srcFile,const FIO_prefs_t * const prefs,const char * dstFileName,const char * srcFileName)2400*a28cd43dSSascha Wildner static int FIO_decompressFrames(FIO_ctx_t* const fCtx,
2401*a28cd43dSSascha Wildner dRess_t ress, FILE* srcFile,
2402*a28cd43dSSascha Wildner const FIO_prefs_t* const prefs,
2403*a28cd43dSSascha Wildner const char* dstFileName, const char* srcFileName)
2404*a28cd43dSSascha Wildner {
2405*a28cd43dSSascha Wildner unsigned readSomething = 0;
2406*a28cd43dSSascha Wildner unsigned long long filesize = 0;
2407*a28cd43dSSascha Wildner assert(srcFile != NULL);
2408*a28cd43dSSascha Wildner
2409*a28cd43dSSascha Wildner /* for each frame */
2410*a28cd43dSSascha Wildner for ( ; ; ) {
2411*a28cd43dSSascha Wildner /* check magic number -> version */
2412*a28cd43dSSascha Wildner size_t const toRead = 4;
2413*a28cd43dSSascha Wildner const BYTE* const buf = (const BYTE*)ress.srcBuffer;
2414*a28cd43dSSascha Wildner if (ress.srcBufferLoaded < toRead) /* load up to 4 bytes for header */
2415*a28cd43dSSascha Wildner ress.srcBufferLoaded += fread((char*)ress.srcBuffer + ress.srcBufferLoaded,
2416*a28cd43dSSascha Wildner (size_t)1, toRead - ress.srcBufferLoaded, srcFile);
2417*a28cd43dSSascha Wildner if (ress.srcBufferLoaded==0) {
2418*a28cd43dSSascha Wildner if (readSomething==0) { /* srcFile is empty (which is invalid) */
2419*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "zstd: %s: unexpected end of file \n", srcFileName);
2420*a28cd43dSSascha Wildner return 1;
2421*a28cd43dSSascha Wildner } /* else, just reached frame boundary */
2422*a28cd43dSSascha Wildner break; /* no more input */
2423*a28cd43dSSascha Wildner }
2424*a28cd43dSSascha Wildner readSomething = 1; /* there is at least 1 byte in srcFile */
2425*a28cd43dSSascha Wildner if (ress.srcBufferLoaded < toRead) {
2426*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "zstd: %s: unknown header \n", srcFileName);
2427*a28cd43dSSascha Wildner return 1;
2428*a28cd43dSSascha Wildner }
2429*a28cd43dSSascha Wildner if (ZSTD_isFrame(buf, ress.srcBufferLoaded)) {
2430*a28cd43dSSascha Wildner unsigned long long const frameSize = FIO_decompressZstdFrame(fCtx, &ress, srcFile, prefs, srcFileName, filesize);
2431*a28cd43dSSascha Wildner if (frameSize == FIO_ERROR_FRAME_DECODING) return 1;
2432*a28cd43dSSascha Wildner filesize += frameSize;
2433*a28cd43dSSascha Wildner } else if (buf[0] == 31 && buf[1] == 139) { /* gz magic number */
2434*a28cd43dSSascha Wildner #ifdef ZSTD_GZDECOMPRESS
2435*a28cd43dSSascha Wildner unsigned long long const frameSize = FIO_decompressGzFrame(&ress, srcFile, prefs, srcFileName);
2436*a28cd43dSSascha Wildner if (frameSize == FIO_ERROR_FRAME_DECODING) return 1;
2437*a28cd43dSSascha Wildner filesize += frameSize;
2438*a28cd43dSSascha Wildner #else
2439*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "zstd: %s: gzip file cannot be uncompressed (zstd compiled without HAVE_ZLIB) -- ignored \n", srcFileName);
2440*a28cd43dSSascha Wildner return 1;
2441*a28cd43dSSascha Wildner #endif
2442*a28cd43dSSascha Wildner } else if ((buf[0] == 0xFD && buf[1] == 0x37) /* xz magic number */
2443*a28cd43dSSascha Wildner || (buf[0] == 0x5D && buf[1] == 0x00)) { /* lzma header (no magic number) */
2444*a28cd43dSSascha Wildner #ifdef ZSTD_LZMADECOMPRESS
2445*a28cd43dSSascha Wildner unsigned long long const frameSize = FIO_decompressLzmaFrame(&ress, srcFile, prefs, srcFileName, buf[0] != 0xFD);
2446*a28cd43dSSascha Wildner if (frameSize == FIO_ERROR_FRAME_DECODING) return 1;
2447*a28cd43dSSascha Wildner filesize += frameSize;
2448*a28cd43dSSascha Wildner #else
2449*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "zstd: %s: xz/lzma file cannot be uncompressed (zstd compiled without HAVE_LZMA) -- ignored \n", srcFileName);
2450*a28cd43dSSascha Wildner return 1;
2451*a28cd43dSSascha Wildner #endif
2452*a28cd43dSSascha Wildner } else if (MEM_readLE32(buf) == LZ4_MAGICNUMBER) {
2453*a28cd43dSSascha Wildner #ifdef ZSTD_LZ4DECOMPRESS
2454*a28cd43dSSascha Wildner unsigned long long const frameSize = FIO_decompressLz4Frame(&ress, srcFile, prefs, srcFileName);
2455*a28cd43dSSascha Wildner if (frameSize == FIO_ERROR_FRAME_DECODING) return 1;
2456*a28cd43dSSascha Wildner filesize += frameSize;
2457*a28cd43dSSascha Wildner #else
2458*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "zstd: %s: lz4 file cannot be uncompressed (zstd compiled without HAVE_LZ4) -- ignored \n", srcFileName);
2459*a28cd43dSSascha Wildner return 1;
2460*a28cd43dSSascha Wildner #endif
2461*a28cd43dSSascha Wildner } else if ((prefs->overwrite) && !strcmp (dstFileName, stdoutmark)) { /* pass-through mode */
2462*a28cd43dSSascha Wildner return FIO_passThrough(prefs,
2463*a28cd43dSSascha Wildner ress.dstFile, srcFile,
2464*a28cd43dSSascha Wildner ress.srcBuffer, ress.srcBufferSize,
2465*a28cd43dSSascha Wildner ress.srcBufferLoaded);
2466*a28cd43dSSascha Wildner } else {
2467*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "zstd: %s: unsupported format \n", srcFileName);
2468*a28cd43dSSascha Wildner return 1;
2469*a28cd43dSSascha Wildner } } /* for each frame */
2470*a28cd43dSSascha Wildner
2471*a28cd43dSSascha Wildner /* Final Status */
2472*a28cd43dSSascha Wildner fCtx->totalBytesOutput += (size_t)filesize;
2473*a28cd43dSSascha Wildner DISPLAYLEVEL(2, "\r%79s\r", "");
2474*a28cd43dSSascha Wildner /* No status message in pipe mode (stdin - stdout) or multi-files mode */
2475*a28cd43dSSascha Wildner if (g_display_prefs.displayLevel >= 2) {
2476*a28cd43dSSascha Wildner if (fCtx->nbFilesTotal <= 1 || g_display_prefs.displayLevel >= 3) {
2477*a28cd43dSSascha Wildner DISPLAYLEVEL(2, "%-20s: %llu bytes \n", srcFileName, filesize);
2478*a28cd43dSSascha Wildner }
2479*a28cd43dSSascha Wildner }
2480*a28cd43dSSascha Wildner
2481*a28cd43dSSascha Wildner return 0;
2482*a28cd43dSSascha Wildner }
2483*a28cd43dSSascha Wildner
2484*a28cd43dSSascha Wildner /** FIO_decompressDstFile() :
2485*a28cd43dSSascha Wildner open `dstFileName`,
2486*a28cd43dSSascha Wildner or path-through if ress.dstFile is already != 0,
2487*a28cd43dSSascha Wildner then start decompression process (FIO_decompressFrames()).
2488*a28cd43dSSascha Wildner @return : 0 : OK
2489*a28cd43dSSascha Wildner 1 : operation aborted
2490*a28cd43dSSascha Wildner */
FIO_decompressDstFile(FIO_ctx_t * const fCtx,FIO_prefs_t * const prefs,dRess_t ress,FILE * srcFile,const char * dstFileName,const char * srcFileName)2491*a28cd43dSSascha Wildner static int FIO_decompressDstFile(FIO_ctx_t* const fCtx,
2492*a28cd43dSSascha Wildner FIO_prefs_t* const prefs,
2493*a28cd43dSSascha Wildner dRess_t ress, FILE* srcFile,
2494*a28cd43dSSascha Wildner const char* dstFileName, const char* srcFileName)
2495*a28cd43dSSascha Wildner {
2496*a28cd43dSSascha Wildner int result;
2497*a28cd43dSSascha Wildner stat_t statbuf;
2498*a28cd43dSSascha Wildner int transfer_permissions = 0;
2499*a28cd43dSSascha Wildner int releaseDstFile = 0;
2500*a28cd43dSSascha Wildner
2501*a28cd43dSSascha Wildner if ((ress.dstFile == NULL) && (prefs->testMode==0)) {
2502*a28cd43dSSascha Wildner releaseDstFile = 1;
2503*a28cd43dSSascha Wildner
2504*a28cd43dSSascha Wildner ress.dstFile = FIO_openDstFile(fCtx, prefs, srcFileName, dstFileName);
2505*a28cd43dSSascha Wildner if (ress.dstFile==NULL) return 1;
2506*a28cd43dSSascha Wildner
2507*a28cd43dSSascha Wildner /* Must only be added after FIO_openDstFile() succeeds.
2508*a28cd43dSSascha Wildner * Otherwise we may delete the destination file if it already exists,
2509*a28cd43dSSascha Wildner * and the user presses Ctrl-C when asked if they wish to overwrite.
2510*a28cd43dSSascha Wildner */
2511*a28cd43dSSascha Wildner addHandler(dstFileName);
2512*a28cd43dSSascha Wildner
2513*a28cd43dSSascha Wildner if ( strcmp(srcFileName, stdinmark) /* special case : don't transfer permissions from stdin */
2514*a28cd43dSSascha Wildner && UTIL_stat(srcFileName, &statbuf)
2515*a28cd43dSSascha Wildner && UTIL_isRegularFileStat(&statbuf) )
2516*a28cd43dSSascha Wildner transfer_permissions = 1;
2517*a28cd43dSSascha Wildner }
2518*a28cd43dSSascha Wildner
2519*a28cd43dSSascha Wildner result = FIO_decompressFrames(fCtx, ress, srcFile, prefs, dstFileName, srcFileName);
2520*a28cd43dSSascha Wildner
2521*a28cd43dSSascha Wildner if (releaseDstFile) {
2522*a28cd43dSSascha Wildner FILE* const dstFile = ress.dstFile;
2523*a28cd43dSSascha Wildner clearHandler();
2524*a28cd43dSSascha Wildner ress.dstFile = NULL;
2525*a28cd43dSSascha Wildner if (fclose(dstFile)) {
2526*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "zstd: %s: %s \n", dstFileName, strerror(errno));
2527*a28cd43dSSascha Wildner result = 1;
2528*a28cd43dSSascha Wildner }
2529*a28cd43dSSascha Wildner
2530*a28cd43dSSascha Wildner if ( (result != 0) /* operation failure */
2531*a28cd43dSSascha Wildner && strcmp(dstFileName, stdoutmark) /* special case : don't remove() stdout */
2532*a28cd43dSSascha Wildner ) {
2533*a28cd43dSSascha Wildner FIO_removeFile(dstFileName); /* remove decompression artefact; note: don't do anything special if remove() fails */
2534*a28cd43dSSascha Wildner } else if ( transfer_permissions /* file permissions correctly extracted from src */ ) {
2535*a28cd43dSSascha Wildner UTIL_setFileStat(dstFileName, &statbuf); /* transfer file permissions from src into dst */
2536*a28cd43dSSascha Wildner }
2537*a28cd43dSSascha Wildner }
2538*a28cd43dSSascha Wildner
2539*a28cd43dSSascha Wildner return result;
2540*a28cd43dSSascha Wildner }
2541*a28cd43dSSascha Wildner
2542*a28cd43dSSascha Wildner
2543*a28cd43dSSascha Wildner /** FIO_decompressSrcFile() :
2544*a28cd43dSSascha Wildner Open `srcFileName`, transfer control to decompressDstFile()
2545*a28cd43dSSascha Wildner @return : 0 : OK
2546*a28cd43dSSascha Wildner 1 : error
2547*a28cd43dSSascha Wildner */
FIO_decompressSrcFile(FIO_ctx_t * const fCtx,FIO_prefs_t * const prefs,dRess_t ress,const char * dstFileName,const char * srcFileName)2548*a28cd43dSSascha Wildner static int FIO_decompressSrcFile(FIO_ctx_t* const fCtx, FIO_prefs_t* const prefs, dRess_t ress, const char* dstFileName, const char* srcFileName)
2549*a28cd43dSSascha Wildner {
2550*a28cd43dSSascha Wildner FILE* srcFile;
2551*a28cd43dSSascha Wildner int result;
2552*a28cd43dSSascha Wildner
2553*a28cd43dSSascha Wildner if (UTIL_isDirectory(srcFileName)) {
2554*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "zstd: %s is a directory -- ignored \n", srcFileName);
2555*a28cd43dSSascha Wildner return 1;
2556*a28cd43dSSascha Wildner }
2557*a28cd43dSSascha Wildner
2558*a28cd43dSSascha Wildner srcFile = FIO_openSrcFile(srcFileName);
2559*a28cd43dSSascha Wildner if (srcFile==NULL) return 1;
2560*a28cd43dSSascha Wildner ress.srcBufferLoaded = 0;
2561*a28cd43dSSascha Wildner
2562*a28cd43dSSascha Wildner result = FIO_decompressDstFile(fCtx, prefs, ress, srcFile, dstFileName, srcFileName);
2563*a28cd43dSSascha Wildner
2564*a28cd43dSSascha Wildner /* Close file */
2565*a28cd43dSSascha Wildner if (fclose(srcFile)) {
2566*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "zstd: %s: %s \n", srcFileName, strerror(errno)); /* error should not happen */
2567*a28cd43dSSascha Wildner return 1;
2568*a28cd43dSSascha Wildner }
2569*a28cd43dSSascha Wildner if ( prefs->removeSrcFile /* --rm */
2570*a28cd43dSSascha Wildner && (result==0) /* decompression successful */
2571*a28cd43dSSascha Wildner && strcmp(srcFileName, stdinmark) ) /* not stdin */ {
2572*a28cd43dSSascha Wildner /* We must clear the handler, since after this point calling it would
2573*a28cd43dSSascha Wildner * delete both the source and destination files.
2574*a28cd43dSSascha Wildner */
2575*a28cd43dSSascha Wildner clearHandler();
2576*a28cd43dSSascha Wildner if (FIO_removeFile(srcFileName)) {
2577*a28cd43dSSascha Wildner /* failed to remove src file */
2578*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "zstd: %s: %s \n", srcFileName, strerror(errno));
2579*a28cd43dSSascha Wildner return 1;
2580*a28cd43dSSascha Wildner } }
2581*a28cd43dSSascha Wildner return result;
2582*a28cd43dSSascha Wildner }
2583*a28cd43dSSascha Wildner
2584*a28cd43dSSascha Wildner
2585*a28cd43dSSascha Wildner
/** FIO_decompressFilename() :
 *  Decompress the single file `srcFileName` into `dstFileName`.
 *  Decompression resources are created from `prefs` and `dictFileName`
 *  for the duration of the call and freed before returning.
 * @return : the result of FIO_decompressSrcFile() (0 : OK, 1 : error)
 */
int FIO_decompressFilename(FIO_ctx_t* const fCtx, FIO_prefs_t* const prefs,
                           const char* dstFileName, const char* srcFileName,
                           const char* dictFileName)
{
    dRess_t const resources = FIO_createDResources(prefs, dictFileName);
    int const status = FIO_decompressSrcFile(fCtx, prefs, resources, dstFileName, srcFileName);

    FIO_freeDResources(resources);
    return status;
}
2597*a28cd43dSSascha Wildner
2598*a28cd43dSSascha Wildner static const char *suffixList[] = {
2599*a28cd43dSSascha Wildner ZSTD_EXTENSION,
2600*a28cd43dSSascha Wildner TZSTD_EXTENSION,
2601*a28cd43dSSascha Wildner #ifndef ZSTD_NODECOMPRESS
2602*a28cd43dSSascha Wildner ZSTD_ALT_EXTENSION,
2603*a28cd43dSSascha Wildner #endif
2604*a28cd43dSSascha Wildner #ifdef ZSTD_GZDECOMPRESS
2605*a28cd43dSSascha Wildner GZ_EXTENSION,
2606*a28cd43dSSascha Wildner TGZ_EXTENSION,
2607*a28cd43dSSascha Wildner #endif
2608*a28cd43dSSascha Wildner #ifdef ZSTD_LZMADECOMPRESS
2609*a28cd43dSSascha Wildner LZMA_EXTENSION,
2610*a28cd43dSSascha Wildner XZ_EXTENSION,
2611*a28cd43dSSascha Wildner TXZ_EXTENSION,
2612*a28cd43dSSascha Wildner #endif
2613*a28cd43dSSascha Wildner #ifdef ZSTD_LZ4DECOMPRESS
2614*a28cd43dSSascha Wildner LZ4_EXTENSION,
2615*a28cd43dSSascha Wildner TLZ4_EXTENSION,
2616*a28cd43dSSascha Wildner #endif
2617*a28cd43dSSascha Wildner NULL
2618*a28cd43dSSascha Wildner };
2619*a28cd43dSSascha Wildner
2620*a28cd43dSSascha Wildner static const char *suffixListStr =
2621*a28cd43dSSascha Wildner ZSTD_EXTENSION "/" TZSTD_EXTENSION
2622*a28cd43dSSascha Wildner #ifdef ZSTD_GZDECOMPRESS
2623*a28cd43dSSascha Wildner "/" GZ_EXTENSION "/" TGZ_EXTENSION
2624*a28cd43dSSascha Wildner #endif
2625*a28cd43dSSascha Wildner #ifdef ZSTD_LZMADECOMPRESS
2626*a28cd43dSSascha Wildner "/" LZMA_EXTENSION "/" XZ_EXTENSION "/" TXZ_EXTENSION
2627*a28cd43dSSascha Wildner #endif
2628*a28cd43dSSascha Wildner #ifdef ZSTD_LZ4DECOMPRESS
2629*a28cd43dSSascha Wildner "/" LZ4_EXTENSION "/" TLZ4_EXTENSION
2630*a28cd43dSSascha Wildner #endif
2631*a28cd43dSSascha Wildner ;
2632*a28cd43dSSascha Wildner
2633*a28cd43dSSascha Wildner /* FIO_determineDstName() :
2634*a28cd43dSSascha Wildner * create a destination filename from a srcFileName.
2635*a28cd43dSSascha Wildner * @return a pointer to it.
2636*a28cd43dSSascha Wildner * @return == NULL if there is an error */
2637*a28cd43dSSascha Wildner static const char*
FIO_determineDstName(const char * srcFileName,const char * outDirName)2638*a28cd43dSSascha Wildner FIO_determineDstName(const char* srcFileName, const char* outDirName)
2639*a28cd43dSSascha Wildner {
2640*a28cd43dSSascha Wildner static size_t dfnbCapacity = 0;
2641*a28cd43dSSascha Wildner static char* dstFileNameBuffer = NULL; /* using static allocation : this function cannot be multi-threaded */
2642*a28cd43dSSascha Wildner size_t dstFileNameEndPos;
2643*a28cd43dSSascha Wildner char* outDirFilename = NULL;
2644*a28cd43dSSascha Wildner const char* dstSuffix = "";
2645*a28cd43dSSascha Wildner size_t dstSuffixLen = 0;
2646*a28cd43dSSascha Wildner
2647*a28cd43dSSascha Wildner size_t sfnSize = strlen(srcFileName);
2648*a28cd43dSSascha Wildner
2649*a28cd43dSSascha Wildner size_t srcSuffixLen;
2650*a28cd43dSSascha Wildner const char* const srcSuffix = strrchr(srcFileName, '.');
2651*a28cd43dSSascha Wildner if (srcSuffix == NULL) {
2652*a28cd43dSSascha Wildner DISPLAYLEVEL(1,
2653*a28cd43dSSascha Wildner "zstd: %s: unknown suffix (%s expected). "
2654*a28cd43dSSascha Wildner "Can't derive the output file name. "
2655*a28cd43dSSascha Wildner "Specify it with -o dstFileName. Ignoring.\n",
2656*a28cd43dSSascha Wildner srcFileName, suffixListStr);
2657*a28cd43dSSascha Wildner return NULL;
2658*a28cd43dSSascha Wildner }
2659*a28cd43dSSascha Wildner srcSuffixLen = strlen(srcSuffix);
2660*a28cd43dSSascha Wildner
2661*a28cd43dSSascha Wildner {
2662*a28cd43dSSascha Wildner const char** matchedSuffixPtr;
2663*a28cd43dSSascha Wildner for (matchedSuffixPtr = suffixList; *matchedSuffixPtr != NULL; matchedSuffixPtr++) {
2664*a28cd43dSSascha Wildner if (!strcmp(*matchedSuffixPtr, srcSuffix)) {
2665*a28cd43dSSascha Wildner break;
2666*a28cd43dSSascha Wildner }
2667*a28cd43dSSascha Wildner }
2668*a28cd43dSSascha Wildner
2669*a28cd43dSSascha Wildner /* check suffix is authorized */
2670*a28cd43dSSascha Wildner if (sfnSize <= srcSuffixLen || *matchedSuffixPtr == NULL) {
2671*a28cd43dSSascha Wildner DISPLAYLEVEL(1,
2672*a28cd43dSSascha Wildner "zstd: %s: unknown suffix (%s expected). "
2673*a28cd43dSSascha Wildner "Can't derive the output file name. "
2674*a28cd43dSSascha Wildner "Specify it with -o dstFileName. Ignoring.\n",
2675*a28cd43dSSascha Wildner srcFileName, suffixListStr);
2676*a28cd43dSSascha Wildner return NULL;
2677*a28cd43dSSascha Wildner }
2678*a28cd43dSSascha Wildner
2679*a28cd43dSSascha Wildner if ((*matchedSuffixPtr)[1] == 't') {
2680*a28cd43dSSascha Wildner dstSuffix = ".tar";
2681*a28cd43dSSascha Wildner dstSuffixLen = strlen(dstSuffix);
2682*a28cd43dSSascha Wildner }
2683*a28cd43dSSascha Wildner }
2684*a28cd43dSSascha Wildner
2685*a28cd43dSSascha Wildner if (outDirName) {
2686*a28cd43dSSascha Wildner outDirFilename = FIO_createFilename_fromOutDir(srcFileName, outDirName, 0);
2687*a28cd43dSSascha Wildner sfnSize = strlen(outDirFilename);
2688*a28cd43dSSascha Wildner assert(outDirFilename != NULL);
2689*a28cd43dSSascha Wildner }
2690*a28cd43dSSascha Wildner
2691*a28cd43dSSascha Wildner if (dfnbCapacity+srcSuffixLen <= sfnSize+1+dstSuffixLen) {
2692*a28cd43dSSascha Wildner /* allocate enough space to write dstFilename into it */
2693*a28cd43dSSascha Wildner free(dstFileNameBuffer);
2694*a28cd43dSSascha Wildner dfnbCapacity = sfnSize + 20;
2695*a28cd43dSSascha Wildner dstFileNameBuffer = (char*)malloc(dfnbCapacity);
2696*a28cd43dSSascha Wildner if (dstFileNameBuffer==NULL)
2697*a28cd43dSSascha Wildner EXM_THROW(74, "%s : not enough memory for dstFileName",
2698*a28cd43dSSascha Wildner strerror(errno));
2699*a28cd43dSSascha Wildner }
2700*a28cd43dSSascha Wildner
2701*a28cd43dSSascha Wildner /* return dst name == src name truncated from suffix */
2702*a28cd43dSSascha Wildner assert(dstFileNameBuffer != NULL);
2703*a28cd43dSSascha Wildner dstFileNameEndPos = sfnSize - srcSuffixLen;
2704*a28cd43dSSascha Wildner if (outDirFilename) {
2705*a28cd43dSSascha Wildner memcpy(dstFileNameBuffer, outDirFilename, dstFileNameEndPos);
2706*a28cd43dSSascha Wildner free(outDirFilename);
2707*a28cd43dSSascha Wildner } else {
2708*a28cd43dSSascha Wildner memcpy(dstFileNameBuffer, srcFileName, dstFileNameEndPos);
2709*a28cd43dSSascha Wildner }
2710*a28cd43dSSascha Wildner
2711*a28cd43dSSascha Wildner /* The short tar extensions tzst, tgz, txz and tlz4 files should have "tar"
2712*a28cd43dSSascha Wildner * extension on decompression. Also writes terminating null. */
2713*a28cd43dSSascha Wildner strcpy(dstFileNameBuffer + dstFileNameEndPos, dstSuffix);
2714*a28cd43dSSascha Wildner return dstFileNameBuffer;
2715*a28cd43dSSascha Wildner
2716*a28cd43dSSascha Wildner /* note : dstFileNameBuffer memory is not going to be free */
2717*a28cd43dSSascha Wildner }
2718*a28cd43dSSascha Wildner
2719*a28cd43dSSascha Wildner int
FIO_decompressMultipleFilenames(FIO_ctx_t * const fCtx,FIO_prefs_t * const prefs,const char ** srcNamesTable,const char * outMirroredRootDirName,const char * outDirName,const char * outFileName,const char * dictFileName)2720*a28cd43dSSascha Wildner FIO_decompressMultipleFilenames(FIO_ctx_t* const fCtx,
2721*a28cd43dSSascha Wildner FIO_prefs_t* const prefs,
2722*a28cd43dSSascha Wildner const char** srcNamesTable,
2723*a28cd43dSSascha Wildner const char* outMirroredRootDirName,
2724*a28cd43dSSascha Wildner const char* outDirName, const char* outFileName,
2725*a28cd43dSSascha Wildner const char* dictFileName)
2726*a28cd43dSSascha Wildner {
2727*a28cd43dSSascha Wildner int status;
2728*a28cd43dSSascha Wildner int error = 0;
2729*a28cd43dSSascha Wildner dRess_t ress = FIO_createDResources(prefs, dictFileName);
2730*a28cd43dSSascha Wildner
2731*a28cd43dSSascha Wildner if (outFileName) {
2732*a28cd43dSSascha Wildner if (FIO_removeMultiFilesWarning(fCtx, prefs, outFileName, 1 /* displayLevelCutoff */)) {
2733*a28cd43dSSascha Wildner FIO_freeDResources(ress);
2734*a28cd43dSSascha Wildner return 1;
2735*a28cd43dSSascha Wildner }
2736*a28cd43dSSascha Wildner if (!prefs->testMode) {
2737*a28cd43dSSascha Wildner ress.dstFile = FIO_openDstFile(fCtx, prefs, NULL, outFileName);
2738*a28cd43dSSascha Wildner if (ress.dstFile == 0) EXM_THROW(19, "cannot open %s", outFileName);
2739*a28cd43dSSascha Wildner }
2740*a28cd43dSSascha Wildner for (; fCtx->currFileIdx < fCtx->nbFilesTotal; fCtx->currFileIdx++) {
2741*a28cd43dSSascha Wildner status = FIO_decompressSrcFile(fCtx, prefs, ress, outFileName, srcNamesTable[fCtx->currFileIdx]);
2742*a28cd43dSSascha Wildner if (!status) fCtx->nbFilesProcessed++;
2743*a28cd43dSSascha Wildner error |= status;
2744*a28cd43dSSascha Wildner }
2745*a28cd43dSSascha Wildner if ((!prefs->testMode) && (fclose(ress.dstFile)))
2746*a28cd43dSSascha Wildner EXM_THROW(72, "Write error : %s : cannot properly close output file",
2747*a28cd43dSSascha Wildner strerror(errno));
2748*a28cd43dSSascha Wildner } else {
2749*a28cd43dSSascha Wildner if (outMirroredRootDirName)
2750*a28cd43dSSascha Wildner UTIL_mirrorSourceFilesDirectories(srcNamesTable, fCtx->nbFilesTotal, outMirroredRootDirName);
2751*a28cd43dSSascha Wildner
2752*a28cd43dSSascha Wildner for (; fCtx->currFileIdx < fCtx->nbFilesTotal; fCtx->currFileIdx++) { /* create dstFileName */
2753*a28cd43dSSascha Wildner const char* const srcFileName = srcNamesTable[fCtx->currFileIdx];
2754*a28cd43dSSascha Wildner const char* dstFileName = NULL;
2755*a28cd43dSSascha Wildner if (outMirroredRootDirName) {
2756*a28cd43dSSascha Wildner char* validMirroredDirName = UTIL_createMirroredDestDirName(srcFileName, outMirroredRootDirName);
2757*a28cd43dSSascha Wildner if (validMirroredDirName) {
2758*a28cd43dSSascha Wildner dstFileName = FIO_determineDstName(srcFileName, validMirroredDirName);
2759*a28cd43dSSascha Wildner free(validMirroredDirName);
2760*a28cd43dSSascha Wildner } else {
2761*a28cd43dSSascha Wildner DISPLAYLEVEL(2, "zstd: --output-dir-mirror cannot decompress '%s' into '%s'\n", srcFileName, outMirroredRootDirName);
2762*a28cd43dSSascha Wildner }
2763*a28cd43dSSascha Wildner } else {
2764*a28cd43dSSascha Wildner dstFileName = FIO_determineDstName(srcFileName, outDirName);
2765*a28cd43dSSascha Wildner }
2766*a28cd43dSSascha Wildner if (dstFileName == NULL) { error=1; continue; }
2767*a28cd43dSSascha Wildner status = FIO_decompressSrcFile(fCtx, prefs, ress, dstFileName, srcFileName);
2768*a28cd43dSSascha Wildner if (!status) fCtx->nbFilesProcessed++;
2769*a28cd43dSSascha Wildner error |= status;
2770*a28cd43dSSascha Wildner }
2771*a28cd43dSSascha Wildner if (outDirName)
2772*a28cd43dSSascha Wildner FIO_checkFilenameCollisions(srcNamesTable , fCtx->nbFilesTotal);
2773*a28cd43dSSascha Wildner }
2774*a28cd43dSSascha Wildner
2775*a28cd43dSSascha Wildner if (fCtx->nbFilesProcessed >= 1 && fCtx->nbFilesTotal > 1 && fCtx->totalBytesOutput != 0)
2776*a28cd43dSSascha Wildner DISPLAYLEVEL(2, "%d files decompressed : %6zu bytes total \n", fCtx->nbFilesProcessed, fCtx->totalBytesOutput);
2777*a28cd43dSSascha Wildner
2778*a28cd43dSSascha Wildner FIO_freeDResources(ress);
2779*a28cd43dSSascha Wildner return error;
2780*a28cd43dSSascha Wildner }
2781*a28cd43dSSascha Wildner
2782*a28cd43dSSascha Wildner /* **************************************************************************
2783*a28cd43dSSascha Wildner * .zst file info (--list command)
2784*a28cd43dSSascha Wildner ***************************************************************************/
2785*a28cd43dSSascha Wildner
2786*a28cd43dSSascha Wildner typedef struct {
2787*a28cd43dSSascha Wildner U64 decompressedSize;
2788*a28cd43dSSascha Wildner U64 compressedSize;
2789*a28cd43dSSascha Wildner U64 windowSize;
2790*a28cd43dSSascha Wildner int numActualFrames;
2791*a28cd43dSSascha Wildner int numSkippableFrames;
2792*a28cd43dSSascha Wildner int decompUnavailable;
2793*a28cd43dSSascha Wildner int usesCheck;
2794*a28cd43dSSascha Wildner U32 nbFiles;
2795*a28cd43dSSascha Wildner } fileInfo_t;
2796*a28cd43dSSascha Wildner
/* InfoError :
 * outcome of the analysis of one file by the --list command */
typedef enum {
    info_success=0,          /* file fully parsed */
    info_frame_error=1,      /* a frame could not be parsed */
    info_not_zstd=2,         /* content is not recognized as zstd data */
    info_file_error=3,       /* not a regular file, or file could not be opened */
    info_truncated_input=4   /* parsing ended at a position different from the file size */
} InfoError;
2804*a28cd43dSSascha Wildner
/* ERROR_IF() :
 * when `cond` is true, display the printf-style message given as variadic
 * arguments (at display level 1, followed by " \n"),
 * then make the *enclosing function* return `retVal`. */
#define ERROR_IF(cond, retVal, ...) {      \
    if (cond) {                            \
        DISPLAYLEVEL(1, __VA_ARGS__);      \
        DISPLAYLEVEL(1, " \n");            \
        return retVal;                     \
    }                                      \
}
2812*a28cd43dSSascha Wildner
2813*a28cd43dSSascha Wildner static InfoError
FIO_analyzeFrames(fileInfo_t * info,FILE * const srcFile)2814*a28cd43dSSascha Wildner FIO_analyzeFrames(fileInfo_t* info, FILE* const srcFile)
2815*a28cd43dSSascha Wildner {
2816*a28cd43dSSascha Wildner /* begin analyzing frame */
2817*a28cd43dSSascha Wildner for ( ; ; ) {
2818*a28cd43dSSascha Wildner BYTE headerBuffer[ZSTD_FRAMEHEADERSIZE_MAX];
2819*a28cd43dSSascha Wildner size_t const numBytesRead = fread(headerBuffer, 1, sizeof(headerBuffer), srcFile);
2820*a28cd43dSSascha Wildner if (numBytesRead < ZSTD_FRAMEHEADERSIZE_MIN(ZSTD_f_zstd1)) {
2821*a28cd43dSSascha Wildner if ( feof(srcFile)
2822*a28cd43dSSascha Wildner && (numBytesRead == 0)
2823*a28cd43dSSascha Wildner && (info->compressedSize > 0)
2824*a28cd43dSSascha Wildner && (info->compressedSize != UTIL_FILESIZE_UNKNOWN) ) {
2825*a28cd43dSSascha Wildner unsigned long long file_position = (unsigned long long) LONG_TELL(srcFile);
2826*a28cd43dSSascha Wildner unsigned long long file_size = (unsigned long long) info->compressedSize;
2827*a28cd43dSSascha Wildner ERROR_IF(file_position != file_size, info_truncated_input,
2828*a28cd43dSSascha Wildner "Error: seeked to position %llu, which is beyond file size of %llu\n",
2829*a28cd43dSSascha Wildner file_position,
2830*a28cd43dSSascha Wildner file_size);
2831*a28cd43dSSascha Wildner break; /* correct end of file => success */
2832*a28cd43dSSascha Wildner }
2833*a28cd43dSSascha Wildner ERROR_IF(feof(srcFile), info_not_zstd, "Error: reached end of file with incomplete frame");
2834*a28cd43dSSascha Wildner ERROR_IF(1, info_frame_error, "Error: did not reach end of file but ran out of frames");
2835*a28cd43dSSascha Wildner }
2836*a28cd43dSSascha Wildner { U32 const magicNumber = MEM_readLE32(headerBuffer);
2837*a28cd43dSSascha Wildner /* Zstandard frame */
2838*a28cd43dSSascha Wildner if (magicNumber == ZSTD_MAGICNUMBER) {
2839*a28cd43dSSascha Wildner ZSTD_frameHeader header;
2840*a28cd43dSSascha Wildner U64 const frameContentSize = ZSTD_getFrameContentSize(headerBuffer, numBytesRead);
2841*a28cd43dSSascha Wildner if ( frameContentSize == ZSTD_CONTENTSIZE_ERROR
2842*a28cd43dSSascha Wildner || frameContentSize == ZSTD_CONTENTSIZE_UNKNOWN ) {
2843*a28cd43dSSascha Wildner info->decompUnavailable = 1;
2844*a28cd43dSSascha Wildner } else {
2845*a28cd43dSSascha Wildner info->decompressedSize += frameContentSize;
2846*a28cd43dSSascha Wildner }
2847*a28cd43dSSascha Wildner ERROR_IF(ZSTD_getFrameHeader(&header, headerBuffer, numBytesRead) != 0,
2848*a28cd43dSSascha Wildner info_frame_error, "Error: could not decode frame header");
2849*a28cd43dSSascha Wildner info->windowSize = header.windowSize;
2850*a28cd43dSSascha Wildner /* move to the end of the frame header */
2851*a28cd43dSSascha Wildner { size_t const headerSize = ZSTD_frameHeaderSize(headerBuffer, numBytesRead);
2852*a28cd43dSSascha Wildner ERROR_IF(ZSTD_isError(headerSize), info_frame_error, "Error: could not determine frame header size");
2853*a28cd43dSSascha Wildner ERROR_IF(fseek(srcFile, ((long)headerSize)-((long)numBytesRead), SEEK_CUR) != 0,
2854*a28cd43dSSascha Wildner info_frame_error, "Error: could not move to end of frame header");
2855*a28cd43dSSascha Wildner }
2856*a28cd43dSSascha Wildner
2857*a28cd43dSSascha Wildner /* skip all blocks in the frame */
2858*a28cd43dSSascha Wildner { int lastBlock = 0;
2859*a28cd43dSSascha Wildner do {
2860*a28cd43dSSascha Wildner BYTE blockHeaderBuffer[3];
2861*a28cd43dSSascha Wildner ERROR_IF(fread(blockHeaderBuffer, 1, 3, srcFile) != 3,
2862*a28cd43dSSascha Wildner info_frame_error, "Error while reading block header");
2863*a28cd43dSSascha Wildner { U32 const blockHeader = MEM_readLE24(blockHeaderBuffer);
2864*a28cd43dSSascha Wildner U32 const blockTypeID = (blockHeader >> 1) & 3;
2865*a28cd43dSSascha Wildner U32 const isRLE = (blockTypeID == 1);
2866*a28cd43dSSascha Wildner U32 const isWrongBlock = (blockTypeID == 3);
2867*a28cd43dSSascha Wildner long const blockSize = isRLE ? 1 : (long)(blockHeader >> 3);
2868*a28cd43dSSascha Wildner ERROR_IF(isWrongBlock, info_frame_error, "Error: unsupported block type");
2869*a28cd43dSSascha Wildner lastBlock = blockHeader & 1;
2870*a28cd43dSSascha Wildner ERROR_IF(fseek(srcFile, blockSize, SEEK_CUR) != 0,
2871*a28cd43dSSascha Wildner info_frame_error, "Error: could not skip to end of block");
2872*a28cd43dSSascha Wildner }
2873*a28cd43dSSascha Wildner } while (lastBlock != 1);
2874*a28cd43dSSascha Wildner }
2875*a28cd43dSSascha Wildner
2876*a28cd43dSSascha Wildner /* check if checksum is used */
2877*a28cd43dSSascha Wildner { BYTE const frameHeaderDescriptor = headerBuffer[4];
2878*a28cd43dSSascha Wildner int const contentChecksumFlag = (frameHeaderDescriptor & (1 << 2)) >> 2;
2879*a28cd43dSSascha Wildner if (contentChecksumFlag) {
2880*a28cd43dSSascha Wildner info->usesCheck = 1;
2881*a28cd43dSSascha Wildner ERROR_IF(fseek(srcFile, 4, SEEK_CUR) != 0,
2882*a28cd43dSSascha Wildner info_frame_error, "Error: could not skip past checksum");
2883*a28cd43dSSascha Wildner } }
2884*a28cd43dSSascha Wildner info->numActualFrames++;
2885*a28cd43dSSascha Wildner }
2886*a28cd43dSSascha Wildner /* Skippable frame */
2887*a28cd43dSSascha Wildner else if ((magicNumber & ZSTD_MAGIC_SKIPPABLE_MASK) == ZSTD_MAGIC_SKIPPABLE_START) {
2888*a28cd43dSSascha Wildner U32 const frameSize = MEM_readLE32(headerBuffer + 4);
2889*a28cd43dSSascha Wildner long const seek = (long)(8 + frameSize - numBytesRead);
2890*a28cd43dSSascha Wildner ERROR_IF(LONG_SEEK(srcFile, seek, SEEK_CUR) != 0,
2891*a28cd43dSSascha Wildner info_frame_error, "Error: could not find end of skippable frame");
2892*a28cd43dSSascha Wildner info->numSkippableFrames++;
2893*a28cd43dSSascha Wildner }
2894*a28cd43dSSascha Wildner /* unknown content */
2895*a28cd43dSSascha Wildner else {
2896*a28cd43dSSascha Wildner return info_not_zstd;
2897*a28cd43dSSascha Wildner }
2898*a28cd43dSSascha Wildner } /* magic number analysis */
2899*a28cd43dSSascha Wildner } /* end analyzing frames */
2900*a28cd43dSSascha Wildner return info_success;
2901*a28cd43dSSascha Wildner }
2902*a28cd43dSSascha Wildner
2903*a28cd43dSSascha Wildner
2904*a28cd43dSSascha Wildner static InfoError
getFileInfo_fileConfirmed(fileInfo_t * info,const char * inFileName)2905*a28cd43dSSascha Wildner getFileInfo_fileConfirmed(fileInfo_t* info, const char* inFileName)
2906*a28cd43dSSascha Wildner {
2907*a28cd43dSSascha Wildner InfoError status;
2908*a28cd43dSSascha Wildner FILE* const srcFile = FIO_openSrcFile(inFileName);
2909*a28cd43dSSascha Wildner ERROR_IF(srcFile == NULL, info_file_error, "Error: could not open source file %s", inFileName);
2910*a28cd43dSSascha Wildner
2911*a28cd43dSSascha Wildner info->compressedSize = UTIL_getFileSize(inFileName);
2912*a28cd43dSSascha Wildner status = FIO_analyzeFrames(info, srcFile);
2913*a28cd43dSSascha Wildner
2914*a28cd43dSSascha Wildner fclose(srcFile);
2915*a28cd43dSSascha Wildner info->nbFiles = 1;
2916*a28cd43dSSascha Wildner return status;
2917*a28cd43dSSascha Wildner }
2918*a28cd43dSSascha Wildner
2919*a28cd43dSSascha Wildner
2920*a28cd43dSSascha Wildner /** getFileInfo() :
2921*a28cd43dSSascha Wildner * Reads information from file, stores in *info
2922*a28cd43dSSascha Wildner * @return : InfoError status
2923*a28cd43dSSascha Wildner */
2924*a28cd43dSSascha Wildner static InfoError
getFileInfo(fileInfo_t * info,const char * srcFileName)2925*a28cd43dSSascha Wildner getFileInfo(fileInfo_t* info, const char* srcFileName)
2926*a28cd43dSSascha Wildner {
2927*a28cd43dSSascha Wildner ERROR_IF(!UTIL_isRegularFile(srcFileName),
2928*a28cd43dSSascha Wildner info_file_error, "Error : %s is not a file", srcFileName);
2929*a28cd43dSSascha Wildner return getFileInfo_fileConfirmed(info, srcFileName);
2930*a28cd43dSSascha Wildner }
2931*a28cd43dSSascha Wildner
2932*a28cd43dSSascha Wildner
2933*a28cd43dSSascha Wildner static void
displayInfo(const char * inFileName,const fileInfo_t * info,int displayLevel)2934*a28cd43dSSascha Wildner displayInfo(const char* inFileName, const fileInfo_t* info, int displayLevel)
2935*a28cd43dSSascha Wildner {
2936*a28cd43dSSascha Wildner unsigned const unit = info->compressedSize < (1 MB) ? (1 KB) : (1 MB);
2937*a28cd43dSSascha Wildner const char* const unitStr = info->compressedSize < (1 MB) ? "KB" : "MB";
2938*a28cd43dSSascha Wildner double const windowSizeUnit = (double)info->windowSize / unit;
2939*a28cd43dSSascha Wildner double const compressedSizeUnit = (double)info->compressedSize / unit;
2940*a28cd43dSSascha Wildner double const decompressedSizeUnit = (double)info->decompressedSize / unit;
2941*a28cd43dSSascha Wildner double const ratio = (info->compressedSize == 0) ? 0 : ((double)info->decompressedSize)/info->compressedSize;
2942*a28cd43dSSascha Wildner const char* const checkString = (info->usesCheck ? "XXH64" : "None");
2943*a28cd43dSSascha Wildner if (displayLevel <= 2) {
2944*a28cd43dSSascha Wildner if (!info->decompUnavailable) {
2945*a28cd43dSSascha Wildner DISPLAYOUT("%6d %5d %7.2f %2s %9.2f %2s %5.3f %5s %s\n",
2946*a28cd43dSSascha Wildner info->numSkippableFrames + info->numActualFrames,
2947*a28cd43dSSascha Wildner info->numSkippableFrames,
2948*a28cd43dSSascha Wildner compressedSizeUnit, unitStr, decompressedSizeUnit, unitStr,
2949*a28cd43dSSascha Wildner ratio, checkString, inFileName);
2950*a28cd43dSSascha Wildner } else {
2951*a28cd43dSSascha Wildner DISPLAYOUT("%6d %5d %7.2f %2s %5s %s\n",
2952*a28cd43dSSascha Wildner info->numSkippableFrames + info->numActualFrames,
2953*a28cd43dSSascha Wildner info->numSkippableFrames,
2954*a28cd43dSSascha Wildner compressedSizeUnit, unitStr,
2955*a28cd43dSSascha Wildner checkString, inFileName);
2956*a28cd43dSSascha Wildner }
2957*a28cd43dSSascha Wildner } else {
2958*a28cd43dSSascha Wildner DISPLAYOUT("%s \n", inFileName);
2959*a28cd43dSSascha Wildner DISPLAYOUT("# Zstandard Frames: %d\n", info->numActualFrames);
2960*a28cd43dSSascha Wildner if (info->numSkippableFrames)
2961*a28cd43dSSascha Wildner DISPLAYOUT("# Skippable Frames: %d\n", info->numSkippableFrames);
2962*a28cd43dSSascha Wildner DISPLAYOUT("Window Size: %.2f %2s (%llu B)\n",
2963*a28cd43dSSascha Wildner windowSizeUnit, unitStr,
2964*a28cd43dSSascha Wildner (unsigned long long)info->windowSize);
2965*a28cd43dSSascha Wildner DISPLAYOUT("Compressed Size: %.2f %2s (%llu B)\n",
2966*a28cd43dSSascha Wildner compressedSizeUnit, unitStr,
2967*a28cd43dSSascha Wildner (unsigned long long)info->compressedSize);
2968*a28cd43dSSascha Wildner if (!info->decompUnavailable) {
2969*a28cd43dSSascha Wildner DISPLAYOUT("Decompressed Size: %.2f %2s (%llu B)\n",
2970*a28cd43dSSascha Wildner decompressedSizeUnit, unitStr,
2971*a28cd43dSSascha Wildner (unsigned long long)info->decompressedSize);
2972*a28cd43dSSascha Wildner DISPLAYOUT("Ratio: %.4f\n", ratio);
2973*a28cd43dSSascha Wildner }
2974*a28cd43dSSascha Wildner DISPLAYOUT("Check: %s\n", checkString);
2975*a28cd43dSSascha Wildner DISPLAYOUT("\n");
2976*a28cd43dSSascha Wildner }
2977*a28cd43dSSascha Wildner }
2978*a28cd43dSSascha Wildner
/* FIO_addFInfo() :
 * Combine two records into one :
 * counters and sizes are added, decompUnavailable is set when set in either
 * operand, usesCheck is kept only when set in both.
 * windowSize is not combined : it is left at 0 in the result. */
static fileInfo_t FIO_addFInfo(fileInfo_t fi1, fileInfo_t fi2)
{
    fileInfo_t sum;
    memset(&sum, 0, sizeof(sum));

    /* sizes */
    sum.compressedSize = fi1.compressedSize + fi2.compressedSize;
    sum.decompressedSize = fi1.decompressedSize + fi2.decompressedSize;

    /* counters */
    sum.numActualFrames = fi1.numActualFrames + fi2.numActualFrames;
    sum.numSkippableFrames = fi1.numSkippableFrames + fi2.numSkippableFrames;
    sum.nbFiles = fi1.nbFiles + fi2.nbFiles;

    /* flags */
    sum.decompUnavailable = fi1.decompUnavailable | fi2.decompUnavailable;
    sum.usesCheck = fi1.usesCheck & fi2.usesCheck;

    return sum;
}
2992*a28cd43dSSascha Wildner
2993*a28cd43dSSascha Wildner static int
FIO_listFile(fileInfo_t * total,const char * inFileName,int displayLevel)2994*a28cd43dSSascha Wildner FIO_listFile(fileInfo_t* total, const char* inFileName, int displayLevel)
2995*a28cd43dSSascha Wildner {
2996*a28cd43dSSascha Wildner fileInfo_t info;
2997*a28cd43dSSascha Wildner memset(&info, 0, sizeof(info));
2998*a28cd43dSSascha Wildner { InfoError const error = getFileInfo(&info, inFileName);
2999*a28cd43dSSascha Wildner switch (error) {
3000*a28cd43dSSascha Wildner case info_frame_error:
3001*a28cd43dSSascha Wildner /* display error, but provide output */
3002*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "Error while parsing \"%s\" \n", inFileName);
3003*a28cd43dSSascha Wildner break;
3004*a28cd43dSSascha Wildner case info_not_zstd:
3005*a28cd43dSSascha Wildner DISPLAYOUT("File \"%s\" not compressed by zstd \n", inFileName);
3006*a28cd43dSSascha Wildner if (displayLevel > 2) DISPLAYOUT("\n");
3007*a28cd43dSSascha Wildner return 1;
3008*a28cd43dSSascha Wildner case info_file_error:
3009*a28cd43dSSascha Wildner /* error occurred while opening the file */
3010*a28cd43dSSascha Wildner if (displayLevel > 2) DISPLAYOUT("\n");
3011*a28cd43dSSascha Wildner return 1;
3012*a28cd43dSSascha Wildner case info_truncated_input:
3013*a28cd43dSSascha Wildner DISPLAYOUT("File \"%s\" is truncated \n", inFileName);
3014*a28cd43dSSascha Wildner if (displayLevel > 2) DISPLAYOUT("\n");
3015*a28cd43dSSascha Wildner return 1;
3016*a28cd43dSSascha Wildner case info_success:
3017*a28cd43dSSascha Wildner default:
3018*a28cd43dSSascha Wildner break;
3019*a28cd43dSSascha Wildner }
3020*a28cd43dSSascha Wildner
3021*a28cd43dSSascha Wildner displayInfo(inFileName, &info, displayLevel);
3022*a28cd43dSSascha Wildner *total = FIO_addFInfo(*total, info);
3023*a28cd43dSSascha Wildner assert(error == info_success || error == info_frame_error);
3024*a28cd43dSSascha Wildner return (int)error;
3025*a28cd43dSSascha Wildner }
3026*a28cd43dSSascha Wildner }
3027*a28cd43dSSascha Wildner
FIO_listMultipleFiles(unsigned numFiles,const char ** filenameTable,int displayLevel)3028*a28cd43dSSascha Wildner int FIO_listMultipleFiles(unsigned numFiles, const char** filenameTable, int displayLevel)
3029*a28cd43dSSascha Wildner {
3030*a28cd43dSSascha Wildner /* ensure no specified input is stdin (needs fseek() capability) */
3031*a28cd43dSSascha Wildner { unsigned u;
3032*a28cd43dSSascha Wildner for (u=0; u<numFiles;u++) {
3033*a28cd43dSSascha Wildner ERROR_IF(!strcmp (filenameTable[u], stdinmark),
3034*a28cd43dSSascha Wildner 1, "zstd: --list does not support reading from standard input");
3035*a28cd43dSSascha Wildner } }
3036*a28cd43dSSascha Wildner
3037*a28cd43dSSascha Wildner if (numFiles == 0) {
3038*a28cd43dSSascha Wildner if (!IS_CONSOLE(stdin)) {
3039*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "zstd: --list does not support reading from standard input \n");
3040*a28cd43dSSascha Wildner }
3041*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "No files given \n");
3042*a28cd43dSSascha Wildner return 1;
3043*a28cd43dSSascha Wildner }
3044*a28cd43dSSascha Wildner
3045*a28cd43dSSascha Wildner if (displayLevel <= 2) {
3046*a28cd43dSSascha Wildner DISPLAYOUT("Frames Skips Compressed Uncompressed Ratio Check Filename\n");
3047*a28cd43dSSascha Wildner }
3048*a28cd43dSSascha Wildner { int error = 0;
3049*a28cd43dSSascha Wildner fileInfo_t total;
3050*a28cd43dSSascha Wildner memset(&total, 0, sizeof(total));
3051*a28cd43dSSascha Wildner total.usesCheck = 1;
3052*a28cd43dSSascha Wildner /* --list each file, and check for any error */
3053*a28cd43dSSascha Wildner { unsigned u;
3054*a28cd43dSSascha Wildner for (u=0; u<numFiles;u++) {
3055*a28cd43dSSascha Wildner error |= FIO_listFile(&total, filenameTable[u], displayLevel);
3056*a28cd43dSSascha Wildner } }
3057*a28cd43dSSascha Wildner if (numFiles > 1 && displayLevel <= 2) { /* display total */
3058*a28cd43dSSascha Wildner unsigned const unit = total.compressedSize < (1 MB) ? (1 KB) : (1 MB);
3059*a28cd43dSSascha Wildner const char* const unitStr = total.compressedSize < (1 MB) ? "KB" : "MB";
3060*a28cd43dSSascha Wildner double const compressedSizeUnit = (double)total.compressedSize / unit;
3061*a28cd43dSSascha Wildner double const decompressedSizeUnit = (double)total.decompressedSize / unit;
3062*a28cd43dSSascha Wildner double const ratio = (total.compressedSize == 0) ? 0 : ((double)total.decompressedSize)/total.compressedSize;
3063*a28cd43dSSascha Wildner const char* const checkString = (total.usesCheck ? "XXH64" : "");
3064*a28cd43dSSascha Wildner DISPLAYOUT("----------------------------------------------------------------- \n");
3065*a28cd43dSSascha Wildner if (total.decompUnavailable) {
3066*a28cd43dSSascha Wildner DISPLAYOUT("%6d %5d %7.2f %2s %5s %u files\n",
3067*a28cd43dSSascha Wildner total.numSkippableFrames + total.numActualFrames,
3068*a28cd43dSSascha Wildner total.numSkippableFrames,
3069*a28cd43dSSascha Wildner compressedSizeUnit, unitStr,
3070*a28cd43dSSascha Wildner checkString, (unsigned)total.nbFiles);
3071*a28cd43dSSascha Wildner } else {
3072*a28cd43dSSascha Wildner DISPLAYOUT("%6d %5d %7.2f %2s %9.2f %2s %5.3f %5s %u files\n",
3073*a28cd43dSSascha Wildner total.numSkippableFrames + total.numActualFrames,
3074*a28cd43dSSascha Wildner total.numSkippableFrames,
3075*a28cd43dSSascha Wildner compressedSizeUnit, unitStr, decompressedSizeUnit, unitStr,
3076*a28cd43dSSascha Wildner ratio, checkString, (unsigned)total.nbFiles);
3077*a28cd43dSSascha Wildner } }
3078*a28cd43dSSascha Wildner return error;
3079*a28cd43dSSascha Wildner }
3080*a28cd43dSSascha Wildner }
3081*a28cd43dSSascha Wildner
3082*a28cd43dSSascha Wildner
3083*a28cd43dSSascha Wildner #endif /* #ifndef ZSTD_NODECOMPRESS */
3084