1*a28cd43dSSascha Wildner /*
2*a28cd43dSSascha Wildner * Copyright (c) 2016-2020, Yann Collet, Facebook, Inc.
3*a28cd43dSSascha Wildner * All rights reserved.
4*a28cd43dSSascha Wildner *
5*a28cd43dSSascha Wildner * This source code is licensed under both the BSD-style license (found in the
6*a28cd43dSSascha Wildner * LICENSE file in the root directory of this source tree) and the GPLv2 (found
7*a28cd43dSSascha Wildner * in the COPYING file in the root directory of this source tree).
8*a28cd43dSSascha Wildner * You may select, at your option, one of the above-listed licenses.
9*a28cd43dSSascha Wildner */
10*a28cd43dSSascha Wildner
11*a28cd43dSSascha Wildner
12*a28cd43dSSascha Wildner /*-************************************
13*a28cd43dSSascha Wildner * Tuning parameters
14*a28cd43dSSascha Wildner **************************************/
/* Compression level reported as "default" by the help text
 * (usage() and the benchmark section of usage_advanced()).
 * May be pre-defined at build time to override the value below. */
#ifndef ZSTDCLI_CLEVEL_DEFAULT
# define ZSTDCLI_CLEVEL_DEFAULT 3
#endif

/* Highest level advertised by the help text for plain `-#`;
 * higher levels are described under `--ultra`.
 * May be pre-defined at build time to override the value below. */
#ifndef ZSTDCLI_CLEVEL_MAX
# define ZSTDCLI_CLEVEL_MAX 19 /* without using --ultra */
#endif

/* NOTE(review): presumably the default number of worker threads;
 * its use is not visible in this part of the file - confirm.
 * May be pre-defined at build time to override the value below. */
#ifndef ZSTDCLI_NBTHREADS_DEFAULT
# define ZSTDCLI_NBTHREADS_DEFAULT 1
#endif
26*a28cd43dSSascha Wildner
27*a28cd43dSSascha Wildner /*-************************************
28*a28cd43dSSascha Wildner * Dependencies
29*a28cd43dSSascha Wildner **************************************/
30*a28cd43dSSascha Wildner #include "platform.h" /* IS_CONSOLE, PLATFORM_POSIX_VERSION */
31*a28cd43dSSascha Wildner #include "util.h" /* UTIL_HAS_CREATEFILELIST, UTIL_createFileList */
32*a28cd43dSSascha Wildner #include <stdlib.h> /* getenv */
33*a28cd43dSSascha Wildner #include <string.h> /* strcmp, strlen */
34*a28cd43dSSascha Wildner #include <stdio.h> /* fprintf(), stdin, stdout, stderr */
35*a28cd43dSSascha Wildner #include <errno.h> /* errno */
36*a28cd43dSSascha Wildner #include <assert.h> /* assert */
37*a28cd43dSSascha Wildner
38*a28cd43dSSascha Wildner #include "fileio.h" /* stdinmark, stdoutmark, ZSTD_EXTENSION */
39*a28cd43dSSascha Wildner #ifndef ZSTD_NOBENCH
40*a28cd43dSSascha Wildner # include "benchzstd.h" /* BMK_benchFiles */
41*a28cd43dSSascha Wildner #endif
42*a28cd43dSSascha Wildner #ifndef ZSTD_NODICT
43*a28cd43dSSascha Wildner # include "dibio.h" /* ZDICT_cover_params_t, DiB_trainFromFiles() */
44*a28cd43dSSascha Wildner #endif
45*a28cd43dSSascha Wildner #include "../lib/zstd.h" /* ZSTD_VERSION_STRING, ZSTD_minCLevel, ZSTD_maxCLevel */
46*a28cd43dSSascha Wildner
47*a28cd43dSSascha Wildner
48*a28cd43dSSascha Wildner /*-************************************
49*a28cd43dSSascha Wildner * Constants
50*a28cd43dSSascha Wildner **************************************/
/* Pieces of the banner printed by usage_advanced(). */
#define COMPRESSOR_NAME "zstd command line interface"
#ifndef ZSTD_VERSION
# define ZSTD_VERSION "v" ZSTD_VERSION_STRING
#endif
#define AUTHOR "Yann Collet"
/* Expands to a format string followed by its arguments (name, pointer width in bits,
 * version, author); meant to be passed whole to a printf-like display macro. */
#define WELCOME_MESSAGE "*** %s %i-bits %s, by %s ***\n", COMPRESSOR_NAME, (int)(sizeof(size_t)*8), ZSTD_VERSION, AUTHOR

/* Program names.
 * NOTE(review): presumably compared against the executable name (see exeNameMatch())
 * to select a behavior per alias; the comparison itself is outside this part of the file. */
#define ZSTD_ZSTDMT "zstdmt"
#define ZSTD_UNZSTD "unzstd"
#define ZSTD_CAT "zstdcat"
#define ZSTD_ZCAT "zcat"
#define ZSTD_GZ "gzip"
#define ZSTD_GUNZIP "gunzip"
#define ZSTD_GZCAT "gzcat"
#define ZSTD_LZMA "lzma"
#define ZSTD_UNLZMA "unlzma"
#define ZSTD_XZ "xz"
#define ZSTD_UNXZ "unxz"
#define ZSTD_LZ4 "lz4"
#define ZSTD_UNLZ4 "unlz4"

/* Postfix size multipliers : `110 KB` expands to `110 *(1 <<10)`.
 * KB and MB multiply by an int constant, GB by an unsigned one (1U<<30). */
#define KB *(1 <<10)
#define MB *(1 <<20)
#define GB *(1U<<30)

/* Initial value of g_displayLevel. */
#define DISPLAY_LEVEL_DEFAULT 2

/* Defaults; several of them are echoed by the help text in usage_advanced(). */
static const char* g_defaultDictName = "dictionary";
static const unsigned g_defaultMaxDictSize = 110 KB;
static const int g_defaultDictCLevel = 3;
static const unsigned g_defaultSelectivityLevel = 9;
static const unsigned g_defaultMaxWindowLog = 27;
/* 9999 is used as a "not set" marker for the parameters initialized with it below. */
#define OVERLAP_LOG_DEFAULT 9999
#define LDM_PARAM_DEFAULT 9999 /* Default for parameters where 0 is valid */
static U32 g_overlapLog = OVERLAP_LOG_DEFAULT;
static U32 g_ldmHashLog = 0;
static U32 g_ldmMinMatch = 0;
static U32 g_ldmHashRateLog = LDM_PARAM_DEFAULT;
static U32 g_ldmBucketSizeLog = LDM_PARAM_DEFAULT;


/* Value given to the fastcover `accel` parameter by defaultFastCoverParams(). */
#define DEFAULT_ACCEL 1

/* Dictionary training algorithms. */
typedef enum { cover, fastCover, legacy } dictType;
95*a28cd43dSSascha Wildner
96*a28cd43dSSascha Wildner /*-************************************
97*a28cd43dSSascha Wildner * Display Macros
98*a28cd43dSSascha Wildner **************************************/
/* DISPLAY_F    : fprintf() to the given stream.
 * DISPLAYOUT   : same, to stdout.
 * DISPLAY      : same, to stderr.
 * DISPLAYLEVEL : DISPLAY(), but only when g_displayLevel >= l.
 *                Note : expands to a bare braced block (not do/while), so the `;`
 *                written after a call is a separate empty statement. */
#define DISPLAY_F(f, ...) fprintf((f), __VA_ARGS__)
#define DISPLAYOUT(...) DISPLAY_F(stdout, __VA_ARGS__)
#define DISPLAY(...) DISPLAY_F(stderr, __VA_ARGS__)
#define DISPLAYLEVEL(l, ...) { if (g_displayLevel>=l) { DISPLAY(__VA_ARGS__); } }
/* Current verbosity threshold, read by DISPLAYLEVEL(). */
static int g_displayLevel = DISPLAY_LEVEL_DEFAULT; /* 0 : no display, 1: errors, 2 : + result + interaction + warnings, 3 : + progression, 4 : + information */
104*a28cd43dSSascha Wildner
105*a28cd43dSSascha Wildner
106*a28cd43dSSascha Wildner /*-************************************
107*a28cd43dSSascha Wildner * Command Line
108*a28cd43dSSascha Wildner **************************************/
109*a28cd43dSSascha Wildner /* print help either in `stderr` or `stdout` depending on originating request
110*a28cd43dSSascha Wildner * error (badusage) => stderr
111*a28cd43dSSascha Wildner * help (usage_advanced) => stdout
112*a28cd43dSSascha Wildner */
usage(FILE * f,const char * programName)113*a28cd43dSSascha Wildner static void usage(FILE* f, const char* programName)
114*a28cd43dSSascha Wildner {
115*a28cd43dSSascha Wildner DISPLAY_F(f, "Usage : \n");
116*a28cd43dSSascha Wildner DISPLAY_F(f, " %s [args] [FILE(s)] [-o file] \n", programName);
117*a28cd43dSSascha Wildner DISPLAY_F(f, "\n");
118*a28cd43dSSascha Wildner DISPLAY_F(f, "FILE : a filename \n");
119*a28cd43dSSascha Wildner DISPLAY_F(f, " with no FILE, or when FILE is - , read standard input\n");
120*a28cd43dSSascha Wildner DISPLAY_F(f, "Arguments : \n");
121*a28cd43dSSascha Wildner #ifndef ZSTD_NOCOMPRESS
122*a28cd43dSSascha Wildner DISPLAY_F(f, " -# : # compression level (1-%d, default: %d) \n", ZSTDCLI_CLEVEL_MAX, ZSTDCLI_CLEVEL_DEFAULT);
123*a28cd43dSSascha Wildner #endif
124*a28cd43dSSascha Wildner #ifndef ZSTD_NODECOMPRESS
125*a28cd43dSSascha Wildner DISPLAY_F(f, " -d : decompression \n");
126*a28cd43dSSascha Wildner #endif
127*a28cd43dSSascha Wildner DISPLAY_F(f, " -D DICT: use DICT as Dictionary for compression or decompression \n");
128*a28cd43dSSascha Wildner DISPLAY_F(f, " -o file: result stored into `file` (only 1 output file) \n");
129*a28cd43dSSascha Wildner DISPLAY_F(f, " -f : overwrite output without prompting, also (de)compress links \n");
130*a28cd43dSSascha Wildner DISPLAY_F(f, "--rm : remove source file(s) after successful de/compression \n");
131*a28cd43dSSascha Wildner DISPLAY_F(f, " -k : preserve source file(s) (default) \n");
132*a28cd43dSSascha Wildner DISPLAY_F(f, " -h/-H : display help/long help and exit \n");
133*a28cd43dSSascha Wildner }
134*a28cd43dSSascha Wildner
usage_advanced(const char * programName)135*a28cd43dSSascha Wildner static void usage_advanced(const char* programName)
136*a28cd43dSSascha Wildner {
137*a28cd43dSSascha Wildner DISPLAYOUT(WELCOME_MESSAGE);
138*a28cd43dSSascha Wildner usage(stdout, programName);
139*a28cd43dSSascha Wildner DISPLAYOUT( "\n");
140*a28cd43dSSascha Wildner DISPLAYOUT( "Advanced arguments : \n");
141*a28cd43dSSascha Wildner DISPLAYOUT( " -V : display Version number and exit \n");
142*a28cd43dSSascha Wildner
143*a28cd43dSSascha Wildner DISPLAYOUT( " -c : force write to standard output, even if it is the console \n");
144*a28cd43dSSascha Wildner
145*a28cd43dSSascha Wildner DISPLAYOUT( " -v : verbose mode; specify multiple times to increase verbosity \n");
146*a28cd43dSSascha Wildner DISPLAYOUT( " -q : suppress warnings; specify twice to suppress errors too \n");
147*a28cd43dSSascha Wildner DISPLAYOUT( "--no-progress : do not display the progress counter \n");
148*a28cd43dSSascha Wildner
149*a28cd43dSSascha Wildner #ifdef UTIL_HAS_CREATEFILELIST
150*a28cd43dSSascha Wildner DISPLAYOUT( " -r : operate recursively on directories \n");
151*a28cd43dSSascha Wildner DISPLAYOUT( "--filelist FILE : read list of files to operate upon from FILE \n");
152*a28cd43dSSascha Wildner DISPLAYOUT( "--output-dir-flat DIR : processed files are stored into DIR \n");
153*a28cd43dSSascha Wildner #endif
154*a28cd43dSSascha Wildner
155*a28cd43dSSascha Wildner #ifdef UTIL_HAS_MIRRORFILELIST
156*a28cd43dSSascha Wildner DISPLAYOUT( "--output-dir-mirror DIR : processed files are stored into DIR respecting original directory structure \n");
157*a28cd43dSSascha Wildner #endif
158*a28cd43dSSascha Wildner
159*a28cd43dSSascha Wildner
160*a28cd43dSSascha Wildner #ifndef ZSTD_NOCOMPRESS
161*a28cd43dSSascha Wildner DISPLAYOUT( "--[no-]check : during compression, add XXH64 integrity checksum to frame (default: enabled)");
162*a28cd43dSSascha Wildner #ifndef ZSTD_NODECOMPRESS
163*a28cd43dSSascha Wildner DISPLAYOUT( ". If specified with -d, decompressor will ignore/validate checksums in compressed frame (default: validate).");
164*a28cd43dSSascha Wildner #endif
165*a28cd43dSSascha Wildner #else
166*a28cd43dSSascha Wildner #ifdef ZSTD_NOCOMPRESS
167*a28cd43dSSascha Wildner DISPLAYOUT( "--[no-]check : during decompression, ignore/validate checksums in compressed frame (default: validate).");
168*a28cd43dSSascha Wildner #endif
169*a28cd43dSSascha Wildner #endif /* ZSTD_NOCOMPRESS */
170*a28cd43dSSascha Wildner DISPLAYOUT( "\n");
171*a28cd43dSSascha Wildner
172*a28cd43dSSascha Wildner DISPLAYOUT( "-- : All arguments after \"--\" are treated as files \n");
173*a28cd43dSSascha Wildner
174*a28cd43dSSascha Wildner #ifndef ZSTD_NOCOMPRESS
175*a28cd43dSSascha Wildner DISPLAYOUT( "\n");
176*a28cd43dSSascha Wildner DISPLAYOUT( "Advanced compression arguments : \n");
177*a28cd43dSSascha Wildner DISPLAYOUT( "--ultra : enable levels beyond %i, up to %i (requires more memory) \n", ZSTDCLI_CLEVEL_MAX, ZSTD_maxCLevel());
178*a28cd43dSSascha Wildner DISPLAYOUT( "--long[=#]: enable long distance matching with given window log (default: %u) \n", g_defaultMaxWindowLog);
179*a28cd43dSSascha Wildner DISPLAYOUT( "--fast[=#]: switch to very fast compression levels (default: %u) \n", 1);
180*a28cd43dSSascha Wildner DISPLAYOUT( "--adapt : dynamically adapt compression level to I/O conditions \n");
181*a28cd43dSSascha Wildner # ifdef ZSTD_MULTITHREAD
182*a28cd43dSSascha Wildner DISPLAYOUT( " -T# : spawns # compression threads (default: 1, 0==# cores) \n");
183*a28cd43dSSascha Wildner DISPLAYOUT( " -B# : select size of each job (default: 0==automatic) \n");
184*a28cd43dSSascha Wildner DISPLAYOUT( "--single-thread : use a single thread for both I/O and compression (result slightly different than -T1) \n");
185*a28cd43dSSascha Wildner DISPLAYOUT( "--rsyncable : compress using a rsync-friendly method (-B sets block size) \n");
186*a28cd43dSSascha Wildner # endif
187*a28cd43dSSascha Wildner DISPLAYOUT( "--exclude-compressed: only compress files that are not already compressed \n");
188*a28cd43dSSascha Wildner DISPLAYOUT( "--stream-size=# : specify size of streaming input from `stdin` \n");
189*a28cd43dSSascha Wildner DISPLAYOUT( "--size-hint=# optimize compression parameters for streaming input of approximately this size \n");
190*a28cd43dSSascha Wildner DISPLAYOUT( "--target-compressed-block-size=# : generate compressed block of approximately targeted size \n");
191*a28cd43dSSascha Wildner DISPLAYOUT( "--no-dictID : don't write dictID into header (dictionary compression only) \n");
192*a28cd43dSSascha Wildner DISPLAYOUT( "--[no-]compress-literals : force (un)compressed literals \n");
193*a28cd43dSSascha Wildner
194*a28cd43dSSascha Wildner DISPLAYOUT( "--format=zstd : compress files to the .zst format (default) \n");
195*a28cd43dSSascha Wildner #ifdef ZSTD_GZCOMPRESS
196*a28cd43dSSascha Wildner DISPLAYOUT( "--format=gzip : compress files to the .gz format \n");
197*a28cd43dSSascha Wildner #endif
198*a28cd43dSSascha Wildner #ifdef ZSTD_LZMACOMPRESS
199*a28cd43dSSascha Wildner DISPLAYOUT( "--format=xz : compress files to the .xz format \n");
200*a28cd43dSSascha Wildner DISPLAYOUT( "--format=lzma : compress files to the .lzma format \n");
201*a28cd43dSSascha Wildner #endif
202*a28cd43dSSascha Wildner #ifdef ZSTD_LZ4COMPRESS
203*a28cd43dSSascha Wildner DISPLAYOUT( "--format=lz4 : compress files to the .lz4 format \n");
204*a28cd43dSSascha Wildner #endif
205*a28cd43dSSascha Wildner #endif /* !ZSTD_NOCOMPRESS */
206*a28cd43dSSascha Wildner
207*a28cd43dSSascha Wildner #ifndef ZSTD_NODECOMPRESS
208*a28cd43dSSascha Wildner DISPLAYOUT( "\n");
209*a28cd43dSSascha Wildner DISPLAYOUT( "Advanced decompression arguments : \n");
210*a28cd43dSSascha Wildner DISPLAYOUT( " -l : print information about zstd compressed files \n");
211*a28cd43dSSascha Wildner DISPLAYOUT( "--test : test compressed file integrity \n");
212*a28cd43dSSascha Wildner DISPLAYOUT( " -M# : Set a memory usage limit for decompression \n");
213*a28cd43dSSascha Wildner # if ZSTD_SPARSE_DEFAULT
214*a28cd43dSSascha Wildner DISPLAYOUT( "--[no-]sparse : sparse mode (default: enabled on file, disabled on stdout) \n");
215*a28cd43dSSascha Wildner # else
216*a28cd43dSSascha Wildner DISPLAYOUT( "--[no-]sparse : sparse mode (default: disabled) \n");
217*a28cd43dSSascha Wildner # endif
218*a28cd43dSSascha Wildner #endif /* ZSTD_NODECOMPRESS */
219*a28cd43dSSascha Wildner
220*a28cd43dSSascha Wildner #ifndef ZSTD_NODICT
221*a28cd43dSSascha Wildner DISPLAYOUT( "\n");
222*a28cd43dSSascha Wildner DISPLAYOUT( "Dictionary builder : \n");
223*a28cd43dSSascha Wildner DISPLAYOUT( "--train ## : create a dictionary from a training set of files \n");
224*a28cd43dSSascha Wildner DISPLAYOUT( "--train-cover[=k=#,d=#,steps=#,split=#,shrink[=#]] : use the cover algorithm with optional args \n");
225*a28cd43dSSascha Wildner DISPLAYOUT( "--train-fastcover[=k=#,d=#,f=#,steps=#,split=#,accel=#,shrink[=#]] : use the fast cover algorithm with optional args \n");
226*a28cd43dSSascha Wildner DISPLAYOUT( "--train-legacy[=s=#] : use the legacy algorithm with selectivity (default: %u) \n", g_defaultSelectivityLevel);
227*a28cd43dSSascha Wildner DISPLAYOUT( " -o DICT : DICT is dictionary name (default: %s) \n", g_defaultDictName);
228*a28cd43dSSascha Wildner DISPLAYOUT( "--maxdict=# : limit dictionary to specified size (default: %u) \n", g_defaultMaxDictSize);
229*a28cd43dSSascha Wildner DISPLAYOUT( "--dictID=# : force dictionary ID to specified value (default: random) \n");
230*a28cd43dSSascha Wildner #endif
231*a28cd43dSSascha Wildner
232*a28cd43dSSascha Wildner #ifndef ZSTD_NOBENCH
233*a28cd43dSSascha Wildner DISPLAYOUT( "\n");
234*a28cd43dSSascha Wildner DISPLAYOUT( "Benchmark arguments : \n");
235*a28cd43dSSascha Wildner DISPLAYOUT( " -b# : benchmark file(s), using # compression level (default: %d) \n", ZSTDCLI_CLEVEL_DEFAULT);
236*a28cd43dSSascha Wildner DISPLAYOUT( " -e# : test all compression levels successively from -b# to -e# (default: 1) \n");
237*a28cd43dSSascha Wildner DISPLAYOUT( " -i# : minimum evaluation time in seconds (default: 3s) \n");
238*a28cd43dSSascha Wildner DISPLAYOUT( " -B# : cut file into independent blocks of size # (default: no block) \n");
239*a28cd43dSSascha Wildner DISPLAYOUT( " -S : output one benchmark result per input file (default: consolidated result) \n");
240*a28cd43dSSascha Wildner DISPLAYOUT( "--priority=rt : set process priority to real-time \n");
241*a28cd43dSSascha Wildner #endif
242*a28cd43dSSascha Wildner
243*a28cd43dSSascha Wildner }
244*a28cd43dSSascha Wildner
badusage(const char * programName)245*a28cd43dSSascha Wildner static void badusage(const char* programName)
246*a28cd43dSSascha Wildner {
247*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "Incorrect parameters \n");
248*a28cd43dSSascha Wildner if (g_displayLevel >= 2) usage(stderr, programName);
249*a28cd43dSSascha Wildner }
250*a28cd43dSSascha Wildner
/*! waitEnter() :
 *  Prints a prompt on stderr, then reads one character from stdin.
 *  The character read is discarded.
 */
static void waitEnter(void)
{
    int ignored;
    DISPLAY("Press enter to continue... \n");
    ignored = getchar();
    (void)ignored;   /* value intentionally unused */
}
258*a28cd43dSSascha Wildner
/*! lastNameFromPath() :
 *  @return : pointer, inside `path`, to the last path component.
 *  The part following the last '/' is selected first;
 *  within that part, anything up to the last '\\' (windows separator) is then skipped.
 *  When no separator is present, `path` itself is returned.
 */
static const char* lastNameFromPath(const char* path)
{
    const char* name = path;
    const char* sep;

    sep = strrchr(name, '/');
    if (sep != NULL) name = sep + 1;

    sep = strrchr(name, '\\');   /* windows */
    if (sep != NULL) name = sep + 1;

    return name;
}
266*a28cd43dSSascha Wildner
/*! exeNameMatch() :
 *  Checks whether `exeName` is `test`, optionally followed by an extension.
 *  @return : 1 if `exeName` starts with `test` and the next character is
 *            either the end of string or a '.', 0 otherwise.
 */
static int exeNameMatch(const char* exeName, const char* test)
{
    size_t const testLen = strlen(test);
    if (strncmp(exeName, test, testLen) != 0) return 0;   /* different prefix */
    return (exeName[testLen] == '\0') || (exeName[testLen] == '.');
}
275*a28cd43dSSascha Wildner
/*! errorOut() :
 *  Prints `msg` on stderr, then terminates the program with exit code 1.
 *  Does not return.
 */
static void errorOut(const char* msg)
{
    DISPLAY("%s \n", msg);
    exit(1);
}
280*a28cd43dSSascha Wildner
/*! readU32FromCharChecked() :
 *  Reads a run of decimal digits at `*stringPtr` into an `unsigned`,
 *  then applies an optional K (<<10) or M (<<20) suffix.
 *  The suffix letter may be followed by an optional 'i' and an optional 'B'
 *  (K, KB, KiB, M, MB, MiB ...), which are skipped.
 *  `*stringPtr` is advanced to the position where reading stopped.
 * @return 0 on success, and stores the result into `*value`.
 * @return 1 if the value overflows `unsigned`; `*value` is then left untouched. */
static int readU32FromCharChecked(const char** stringPtr, unsigned* value)
{
    unsigned const maxBeforeDigit = ((unsigned)(-1)) / 10;    /* above this, `*10` overflows */
    unsigned const maxBeforeShift = ((unsigned)(-1)) >> 10;   /* above this, `<<10` overflows */
    unsigned total = 0;

    /* decimal digits */
    for ( ; (**stringPtr >= '0') && (**stringPtr <= '9'); (*stringPtr)++) {
        unsigned const digit = (unsigned)(**stringPtr - '0');
        unsigned const previous = total;
        if (total > maxBeforeDigit) return 1;   /* overflow error */
        total = total * 10 + digit;
        if (total < previous) return 1;         /* overflow error : addition wrapped around */
    }

    /* optional size suffix */
    {   char const unit = **stringPtr;
        if ((unit == 'K') || (unit == 'M')) {
            int shifts = (unit == 'M') ? 2 : 1;   /* M == K applied twice */
            while (shifts-- > 0) {
                if (total > maxBeforeShift) return 1;   /* overflow error */
                total <<= 10;
            }
            (*stringPtr)++;   /* skip `K` or `M` */
            if (**stringPtr == 'i') (*stringPtr)++;
            if (**stringPtr == 'B') (*stringPtr)++;
        }
    }

    *value = total;
    return 0;
}
313*a28cd43dSSascha Wildner
/*! readU32FromChar() :
 *  Same parsing as readU32FromCharChecked(), without an error code to test.
 * @return : unsigned integer value read from input in `char` format.
 *  Advances `*stringPtr` to the position where reading stopped.
 *  Note : prints an error and exit()s the program if the value overflows. */
static unsigned readU32FromChar(const char** stringPtr) {
    unsigned parsed;
    if (readU32FromCharChecked(stringPtr, &parsed) != 0) {
        errorOut("error: numeric value overflows 32-bit unsigned int");
    }
    return parsed;
}
325*a28cd43dSSascha Wildner
/*! readSizeTFromCharChecked() :
 *  Reads a run of decimal digits at `*stringPtr` into a `size_t`,
 *  then applies an optional K (<<10) or M (<<20) suffix.
 *  The suffix letter may be followed by an optional 'i' and an optional 'B'
 *  (K, KB, KiB, M, MB, MiB ...), which are skipped.
 *  `*stringPtr` is advanced to the position where reading stopped.
 * @return 0 on success, and stores the result into `*value`.
 * @return 1 if the value overflows `size_t`; `*value` is then left untouched. */
static int readSizeTFromCharChecked(const char** stringPtr, size_t* value)
{
    size_t const maxBeforeDigit = ((size_t)(-1)) / 10;    /* above this, `*10` overflows */
    size_t const maxBeforeShift = ((size_t)(-1)) >> 10;   /* above this, `<<10` overflows */
    size_t total = 0;

    /* decimal digits */
    for ( ; (**stringPtr >= '0') && (**stringPtr <= '9'); (*stringPtr)++) {
        size_t const digit = (size_t)(**stringPtr - '0');
        size_t const previous = total;
        if (total > maxBeforeDigit) return 1;   /* overflow error */
        total = total * 10 + digit;
        if (total < previous) return 1;         /* overflow error : addition wrapped around */
    }

    /* optional size suffix */
    {   char const unit = **stringPtr;
        if ((unit == 'K') || (unit == 'M')) {
            int shifts = (unit == 'M') ? 2 : 1;   /* M == K applied twice */
            while (shifts-- > 0) {
                if (total > maxBeforeShift) return 1;   /* overflow error */
                total <<= 10;
            }
            (*stringPtr)++;   /* skip `K` or `M` */
            if (**stringPtr == 'i') (*stringPtr)++;
            if (**stringPtr == 'B') (*stringPtr)++;
        }
    }

    *value = total;
    return 0;
}
358*a28cd43dSSascha Wildner
/*! readSizeTFromChar() :
 *  Same parsing as readSizeTFromCharChecked(), without an error code to test.
 * @return : size_t value read from input in `char` format.
 *  Advances `*stringPtr` to the position where reading stopped.
 *  Note : prints an error and exit()s the program if the value overflows. */
static size_t readSizeTFromChar(const char** stringPtr) {
    size_t parsed;
    if (readSizeTFromCharChecked(stringPtr, &parsed) != 0) {
        errorOut("error: numeric value overflows size_t");
    }
    return parsed;
}
370*a28cd43dSSascha Wildner
/** longCommandWArg() :
 *  Checks whether the text at *stringPtr starts with longCommand.
 *  On a match, advances *stringPtr to the character right after longCommand.
 * @return 1 on a match,
 *         0 otherwise, in which case *stringPtr is left unmodified.
 */
static int longCommandWArg(const char** stringPtr, const char* longCommand)
{
    size_t const prefixLen = strlen(longCommand);
    if (strncmp(*stringPtr, longCommand, prefixLen) != 0) return 0;
    *stringPtr += prefixLen;
    return 1;
}
383*a28cd43dSSascha Wildner
384*a28cd43dSSascha Wildner
385*a28cd43dSSascha Wildner #ifndef ZSTD_NODICT
386*a28cd43dSSascha Wildner
/* Value stored into shrinkDictMaxRegression when `shrink` is given without `=#`,
 * and by the default cover / fastcover parameter sets. */
static const unsigned kDefaultRegression = 1;
388*a28cd43dSSascha Wildner /**
389*a28cd43dSSascha Wildner * parseCoverParameters() :
390*a28cd43dSSascha Wildner * reads cover parameters from *stringPtr (e.g. "--train-cover=k=48,d=8,steps=32") into *params
391*a28cd43dSSascha Wildner * @return 1 means that cover parameters were correct
392*a28cd43dSSascha Wildner * @return 0 in case of malformed parameters
393*a28cd43dSSascha Wildner */
parseCoverParameters(const char * stringPtr,ZDICT_cover_params_t * params)394*a28cd43dSSascha Wildner static unsigned parseCoverParameters(const char* stringPtr, ZDICT_cover_params_t* params)
395*a28cd43dSSascha Wildner {
396*a28cd43dSSascha Wildner memset(params, 0, sizeof(*params));
397*a28cd43dSSascha Wildner for (; ;) {
398*a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "k=")) { params->k = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
399*a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "d=")) { params->d = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
400*a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "steps=")) { params->steps = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
401*a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "split=")) {
402*a28cd43dSSascha Wildner unsigned splitPercentage = readU32FromChar(&stringPtr);
403*a28cd43dSSascha Wildner params->splitPoint = (double)splitPercentage / 100.0;
404*a28cd43dSSascha Wildner if (stringPtr[0]==',') { stringPtr++; continue; } else break;
405*a28cd43dSSascha Wildner }
406*a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "shrink")) {
407*a28cd43dSSascha Wildner params->shrinkDictMaxRegression = kDefaultRegression;
408*a28cd43dSSascha Wildner params->shrinkDict = 1;
409*a28cd43dSSascha Wildner if (stringPtr[0]=='=') {
410*a28cd43dSSascha Wildner stringPtr++;
411*a28cd43dSSascha Wildner params->shrinkDictMaxRegression = readU32FromChar(&stringPtr);
412*a28cd43dSSascha Wildner }
413*a28cd43dSSascha Wildner if (stringPtr[0]==',') {
414*a28cd43dSSascha Wildner stringPtr++;
415*a28cd43dSSascha Wildner continue;
416*a28cd43dSSascha Wildner }
417*a28cd43dSSascha Wildner else break;
418*a28cd43dSSascha Wildner }
419*a28cd43dSSascha Wildner return 0;
420*a28cd43dSSascha Wildner }
421*a28cd43dSSascha Wildner if (stringPtr[0] != 0) return 0;
422*a28cd43dSSascha Wildner DISPLAYLEVEL(4, "cover: k=%u\nd=%u\nsteps=%u\nsplit=%u\nshrink%u\n", params->k, params->d, params->steps, (unsigned)(params->splitPoint * 100), params->shrinkDictMaxRegression);
423*a28cd43dSSascha Wildner return 1;
424*a28cd43dSSascha Wildner }
425*a28cd43dSSascha Wildner
426*a28cd43dSSascha Wildner /**
427*a28cd43dSSascha Wildner * parseFastCoverParameters() :
428*a28cd43dSSascha Wildner * reads fastcover parameters from *stringPtr (e.g. "--train-fastcover=k=48,d=8,f=20,steps=32,accel=2") into *params
429*a28cd43dSSascha Wildner * @return 1 means that fastcover parameters were correct
430*a28cd43dSSascha Wildner * @return 0 in case of malformed parameters
431*a28cd43dSSascha Wildner */
parseFastCoverParameters(const char * stringPtr,ZDICT_fastCover_params_t * params)432*a28cd43dSSascha Wildner static unsigned parseFastCoverParameters(const char* stringPtr, ZDICT_fastCover_params_t* params)
433*a28cd43dSSascha Wildner {
434*a28cd43dSSascha Wildner memset(params, 0, sizeof(*params));
435*a28cd43dSSascha Wildner for (; ;) {
436*a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "k=")) { params->k = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
437*a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "d=")) { params->d = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
438*a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "f=")) { params->f = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
439*a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "steps=")) { params->steps = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
440*a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "accel=")) { params->accel = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
441*a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "split=")) {
442*a28cd43dSSascha Wildner unsigned splitPercentage = readU32FromChar(&stringPtr);
443*a28cd43dSSascha Wildner params->splitPoint = (double)splitPercentage / 100.0;
444*a28cd43dSSascha Wildner if (stringPtr[0]==',') { stringPtr++; continue; } else break;
445*a28cd43dSSascha Wildner }
446*a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "shrink")) {
447*a28cd43dSSascha Wildner params->shrinkDictMaxRegression = kDefaultRegression;
448*a28cd43dSSascha Wildner params->shrinkDict = 1;
449*a28cd43dSSascha Wildner if (stringPtr[0]=='=') {
450*a28cd43dSSascha Wildner stringPtr++;
451*a28cd43dSSascha Wildner params->shrinkDictMaxRegression = readU32FromChar(&stringPtr);
452*a28cd43dSSascha Wildner }
453*a28cd43dSSascha Wildner if (stringPtr[0]==',') {
454*a28cd43dSSascha Wildner stringPtr++;
455*a28cd43dSSascha Wildner continue;
456*a28cd43dSSascha Wildner }
457*a28cd43dSSascha Wildner else break;
458*a28cd43dSSascha Wildner }
459*a28cd43dSSascha Wildner return 0;
460*a28cd43dSSascha Wildner }
461*a28cd43dSSascha Wildner if (stringPtr[0] != 0) return 0;
462*a28cd43dSSascha Wildner DISPLAYLEVEL(4, "cover: k=%u\nd=%u\nf=%u\nsteps=%u\nsplit=%u\naccel=%u\nshrink=%u\n", params->k, params->d, params->f, params->steps, (unsigned)(params->splitPoint * 100), params->accel, params->shrinkDictMaxRegression);
463*a28cd43dSSascha Wildner return 1;
464*a28cd43dSSascha Wildner }
465*a28cd43dSSascha Wildner
/**
 * parseLegacyParameters() :
 * reads the legacy dictionary builder parameter from stringPtr
 * (e.g. the "selectivity=8" part of "--train-legacy=selectivity=8") into *selectivity.
 * The value must be introduced by "s=" or "selectivity=" and be the last thing in the string.
 * Note : the value is read with readU32FromChar(), which exit()s on overflow.
 * @return 1 means that legacy dictionary builder parameters were correct
 * @return 0 in case of malformed parameters
 */
static unsigned parseLegacyParameters(const char* stringPtr, unsigned* selectivity)
{
    int const hasKey = longCommandWArg(&stringPtr, "s=")
                    || longCommandWArg(&stringPtr, "selectivity=");
    if (!hasKey) return 0;

    *selectivity = readU32FromChar(&stringPtr);
    if (stringPtr[0] != 0) return 0;   /* trailing characters */

    DISPLAYLEVEL(4, "legacy: selectivity=%u\n", *selectivity);
    return 1;
}
480*a28cd43dSSascha Wildner
defaultCoverParams(void)481*a28cd43dSSascha Wildner static ZDICT_cover_params_t defaultCoverParams(void)
482*a28cd43dSSascha Wildner {
483*a28cd43dSSascha Wildner ZDICT_cover_params_t params;
484*a28cd43dSSascha Wildner memset(¶ms, 0, sizeof(params));
485*a28cd43dSSascha Wildner params.d = 8;
486*a28cd43dSSascha Wildner params.steps = 4;
487*a28cd43dSSascha Wildner params.splitPoint = 1.0;
488*a28cd43dSSascha Wildner params.shrinkDict = 0;
489*a28cd43dSSascha Wildner params.shrinkDictMaxRegression = kDefaultRegression;
490*a28cd43dSSascha Wildner return params;
491*a28cd43dSSascha Wildner }
492*a28cd43dSSascha Wildner
defaultFastCoverParams(void)493*a28cd43dSSascha Wildner static ZDICT_fastCover_params_t defaultFastCoverParams(void)
494*a28cd43dSSascha Wildner {
495*a28cd43dSSascha Wildner ZDICT_fastCover_params_t params;
496*a28cd43dSSascha Wildner memset(¶ms, 0, sizeof(params));
497*a28cd43dSSascha Wildner params.d = 8;
498*a28cd43dSSascha Wildner params.f = 20;
499*a28cd43dSSascha Wildner params.steps = 4;
500*a28cd43dSSascha Wildner params.splitPoint = 0.75; /* different from default splitPoint of cover */
501*a28cd43dSSascha Wildner params.accel = DEFAULT_ACCEL;
502*a28cd43dSSascha Wildner params.shrinkDict = 0;
503*a28cd43dSSascha Wildner params.shrinkDictMaxRegression = kDefaultRegression;
504*a28cd43dSSascha Wildner return params;
505*a28cd43dSSascha Wildner }
506*a28cd43dSSascha Wildner #endif
507*a28cd43dSSascha Wildner
508*a28cd43dSSascha Wildner
/** parseAdaptParameters() :
 *  Parses the comma-separated list that follows "--adapt=" (e.g. "min=1,max=19")
 *  and stores the values into *adaptMinPtr and *adaptMaxPtr.
 *  Both pointers must reference already-initialized values : a key that is absent
 *  from the string leaves its target untouched, and targets may have been
 *  modified even when the function reports a failure.
 * @return 1 when the whole string was parsed and min <= max,
 * @return 0 on unknown key, trailing characters, or min > max
 */
static unsigned parseAdaptParameters(const char* stringPtr, int* adaptMinPtr, int* adaptMaxPtr)
{
    for (;;) {
        if (longCommandWArg(&stringPtr, "min=")) {
            *adaptMinPtr = (int)readU32FromChar(&stringPtr);
        } else if (longCommandWArg(&stringPtr, "max=")) {
            *adaptMaxPtr = (int)readU32FromChar(&stringPtr);
        } else {
            DISPLAYLEVEL(4, "invalid compression parameter \n");
            return 0;
        }
        /* a comma announces another key; anything else ends the list */
        if (*stringPtr != ',') break;
        stringPtr++;
    }

    if (*stringPtr != 0) return 0;   /* the string must be fully consumed */

    if (*adaptMinPtr > *adaptMaxPtr) {
        DISPLAYLEVEL(4, "incoherent adaptation limits \n");
        return 0;
    }
    return 1;
}
531*a28cd43dSSascha Wildner
532*a28cd43dSSascha Wildner
533*a28cd43dSSascha Wildner /** parseCompressionParameters() :
534*a28cd43dSSascha Wildner * reads compression parameters from *stringPtr (e.g. "--zstd=wlog=23,clog=23,hlog=22,slog=6,mml=3,tlen=48,strat=6") into *params
535*a28cd43dSSascha Wildner * @return 1 means that compression parameters were correct
536*a28cd43dSSascha Wildner * @return 0 in case of malformed parameters
537*a28cd43dSSascha Wildner */
parseCompressionParameters(const char * stringPtr,ZSTD_compressionParameters * params)538*a28cd43dSSascha Wildner static unsigned parseCompressionParameters(const char* stringPtr, ZSTD_compressionParameters* params)
539*a28cd43dSSascha Wildner {
540*a28cd43dSSascha Wildner for ( ; ;) {
541*a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "windowLog=") || longCommandWArg(&stringPtr, "wlog=")) { params->windowLog = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
542*a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "chainLog=") || longCommandWArg(&stringPtr, "clog=")) { params->chainLog = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
543*a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "hashLog=") || longCommandWArg(&stringPtr, "hlog=")) { params->hashLog = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
544*a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "searchLog=") || longCommandWArg(&stringPtr, "slog=")) { params->searchLog = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
545*a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "minMatch=") || longCommandWArg(&stringPtr, "mml=")) { params->minMatch = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
546*a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "targetLength=") || longCommandWArg(&stringPtr, "tlen=")) { params->targetLength = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
547*a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "strategy=") || longCommandWArg(&stringPtr, "strat=")) { params->strategy = (ZSTD_strategy)(readU32FromChar(&stringPtr)); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
548*a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "overlapLog=") || longCommandWArg(&stringPtr, "ovlog=")) { g_overlapLog = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
549*a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "ldmHashLog=") || longCommandWArg(&stringPtr, "lhlog=")) { g_ldmHashLog = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
550*a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "ldmMinMatch=") || longCommandWArg(&stringPtr, "lmml=")) { g_ldmMinMatch = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
551*a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "ldmBucketSizeLog=") || longCommandWArg(&stringPtr, "lblog=")) { g_ldmBucketSizeLog = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
552*a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "ldmHashRateLog=") || longCommandWArg(&stringPtr, "lhrlog=")) { g_ldmHashRateLog = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
553*a28cd43dSSascha Wildner DISPLAYLEVEL(4, "invalid compression parameter \n");
554*a28cd43dSSascha Wildner return 0;
555*a28cd43dSSascha Wildner }
556*a28cd43dSSascha Wildner
557*a28cd43dSSascha Wildner DISPLAYLEVEL(4, "windowLog=%d, chainLog=%d, hashLog=%d, searchLog=%d \n", params->windowLog, params->chainLog, params->hashLog, params->searchLog);
558*a28cd43dSSascha Wildner DISPLAYLEVEL(4, "minMatch=%d, targetLength=%d, strategy=%d \n", params->minMatch, params->targetLength, params->strategy);
559*a28cd43dSSascha Wildner if (stringPtr[0] != 0) return 0; /* check the end of string */
560*a28cd43dSSascha Wildner return 1;
561*a28cd43dSSascha Wildner }
562*a28cd43dSSascha Wildner
printVersion(void)563*a28cd43dSSascha Wildner static void printVersion(void)
564*a28cd43dSSascha Wildner {
565*a28cd43dSSascha Wildner if (g_displayLevel < DISPLAY_LEVEL_DEFAULT) {
566*a28cd43dSSascha Wildner DISPLAYOUT("%s\n", ZSTD_VERSION_STRING);
567*a28cd43dSSascha Wildner return;
568*a28cd43dSSascha Wildner }
569*a28cd43dSSascha Wildner
570*a28cd43dSSascha Wildner DISPLAYOUT(WELCOME_MESSAGE);
571*a28cd43dSSascha Wildner if (g_displayLevel >= 3) {
572*a28cd43dSSascha Wildner /* format support */
573*a28cd43dSSascha Wildner DISPLAYOUT("*** supports: zstd");
574*a28cd43dSSascha Wildner #if defined(ZSTD_LEGACY_SUPPORT) && (ZSTD_LEGACY_SUPPORT>0) && (ZSTD_LEGACY_SUPPORT<8)
575*a28cd43dSSascha Wildner DISPLAYOUT(", zstd legacy v0.%d+", ZSTD_LEGACY_SUPPORT);
576*a28cd43dSSascha Wildner #endif
577*a28cd43dSSascha Wildner #ifdef ZSTD_GZCOMPRESS
578*a28cd43dSSascha Wildner DISPLAYOUT(", gzip");
579*a28cd43dSSascha Wildner #endif
580*a28cd43dSSascha Wildner #ifdef ZSTD_LZ4COMPRESS
581*a28cd43dSSascha Wildner DISPLAYOUT(", lz4");
582*a28cd43dSSascha Wildner #endif
583*a28cd43dSSascha Wildner #ifdef ZSTD_LZMACOMPRESS
584*a28cd43dSSascha Wildner DISPLAYOUT(", lzma, xz ");
585*a28cd43dSSascha Wildner #endif
586*a28cd43dSSascha Wildner DISPLAYOUT("\n");
587*a28cd43dSSascha Wildner if (g_displayLevel >= 4) {
588*a28cd43dSSascha Wildner /* posix support */
589*a28cd43dSSascha Wildner #ifdef _POSIX_C_SOURCE
590*a28cd43dSSascha Wildner DISPLAYOUT("_POSIX_C_SOURCE defined: %ldL\n", (long) _POSIX_C_SOURCE);
591*a28cd43dSSascha Wildner #endif
592*a28cd43dSSascha Wildner #ifdef _POSIX_VERSION
593*a28cd43dSSascha Wildner DISPLAYOUT("_POSIX_VERSION defined: %ldL \n", (long) _POSIX_VERSION);
594*a28cd43dSSascha Wildner #endif
595*a28cd43dSSascha Wildner #ifdef PLATFORM_POSIX_VERSION
596*a28cd43dSSascha Wildner DISPLAYOUT("PLATFORM_POSIX_VERSION defined: %ldL\n", (long) PLATFORM_POSIX_VERSION);
597*a28cd43dSSascha Wildner #endif
598*a28cd43dSSascha Wildner } }
599*a28cd43dSSascha Wildner }
600*a28cd43dSSascha Wildner
601*a28cd43dSSascha Wildner /* Environment variables for parameter setting */
602*a28cd43dSSascha Wildner #define ENV_CLEVEL "ZSTD_CLEVEL"
603*a28cd43dSSascha Wildner #define ENV_NBTHREADS "ZSTD_NBTHREADS" /* takes lower precedence than directly specifying -T# in the CLI */
604*a28cd43dSSascha Wildner
605*a28cd43dSSascha Wildner /* pick up environment variable */
init_cLevel(void)606*a28cd43dSSascha Wildner static int init_cLevel(void) {
607*a28cd43dSSascha Wildner const char* const env = getenv(ENV_CLEVEL);
608*a28cd43dSSascha Wildner if (env != NULL) {
609*a28cd43dSSascha Wildner const char* ptr = env;
610*a28cd43dSSascha Wildner int sign = 1;
611*a28cd43dSSascha Wildner if (*ptr == '-') {
612*a28cd43dSSascha Wildner sign = -1;
613*a28cd43dSSascha Wildner ptr++;
614*a28cd43dSSascha Wildner } else if (*ptr == '+') {
615*a28cd43dSSascha Wildner ptr++;
616*a28cd43dSSascha Wildner }
617*a28cd43dSSascha Wildner
618*a28cd43dSSascha Wildner if ((*ptr>='0') && (*ptr<='9')) {
619*a28cd43dSSascha Wildner unsigned absLevel;
620*a28cd43dSSascha Wildner if (readU32FromCharChecked(&ptr, &absLevel)) {
621*a28cd43dSSascha Wildner DISPLAYLEVEL(2, "Ignore environment variable setting %s=%s: numeric value too large \n", ENV_CLEVEL, env);
622*a28cd43dSSascha Wildner return ZSTDCLI_CLEVEL_DEFAULT;
623*a28cd43dSSascha Wildner } else if (*ptr == 0) {
624*a28cd43dSSascha Wildner return sign * (int)absLevel;
625*a28cd43dSSascha Wildner } }
626*a28cd43dSSascha Wildner
627*a28cd43dSSascha Wildner DISPLAYLEVEL(2, "Ignore environment variable setting %s=%s: not a valid integer value \n", ENV_CLEVEL, env);
628*a28cd43dSSascha Wildner }
629*a28cd43dSSascha Wildner
630*a28cd43dSSascha Wildner return ZSTDCLI_CLEVEL_DEFAULT;
631*a28cd43dSSascha Wildner }
632*a28cd43dSSascha Wildner
633*a28cd43dSSascha Wildner #ifdef ZSTD_MULTITHREAD
init_nbThreads(void)634*a28cd43dSSascha Wildner static unsigned init_nbThreads(void) {
635*a28cd43dSSascha Wildner const char* const env = getenv(ENV_NBTHREADS);
636*a28cd43dSSascha Wildner if (env != NULL) {
637*a28cd43dSSascha Wildner const char* ptr = env;
638*a28cd43dSSascha Wildner if ((*ptr>='0') && (*ptr<='9')) {
639*a28cd43dSSascha Wildner unsigned nbThreads;
640*a28cd43dSSascha Wildner if (readU32FromCharChecked(&ptr, &nbThreads)) {
641*a28cd43dSSascha Wildner DISPLAYLEVEL(2, "Ignore environment variable setting %s=%s: numeric value too large \n", ENV_NBTHREADS, env);
642*a28cd43dSSascha Wildner return ZSTDCLI_NBTHREADS_DEFAULT;
643*a28cd43dSSascha Wildner } else if (*ptr == 0) {
644*a28cd43dSSascha Wildner return nbThreads;
645*a28cd43dSSascha Wildner }
646*a28cd43dSSascha Wildner }
647*a28cd43dSSascha Wildner DISPLAYLEVEL(2, "Ignore environment variable setting %s=%s: not a valid unsigned value \n", ENV_NBTHREADS, env);
648*a28cd43dSSascha Wildner }
649*a28cd43dSSascha Wildner
650*a28cd43dSSascha Wildner return ZSTDCLI_NBTHREADS_DEFAULT;
651*a28cd43dSSascha Wildner }
652*a28cd43dSSascha Wildner #endif
653*a28cd43dSSascha Wildner
/* NEXT_FIELD(ptr) :
 * Makes `ptr` point at the value of the option currently being parsed.
 * - "--option=value" : the value is the text after '=' ; `argument` is moved to
 *   the end of the string.
 * - "--option value" : the value is the next command-line word ; `argNb` is advanced.
 *   A missing word, or a word starting with '-', is reported and ends the
 *   program through CLEAN_RETURN(1).
 * Expands in place : requires `argument`, `argNb`, `argCount`, `argv` and the
 * CLEAN_RETURN() macro to be usable at the expansion site. */
#define NEXT_FIELD(ptr) {                          \
    if (*argument != '=') {                        \
        ++argNb;                                   \
        if (argNb >= argCount) {                   \
            DISPLAY("error: missing command argument \n"); \
            CLEAN_RETURN(1);                       \
        }                                          \
        (ptr) = argv[argNb];                       \
        assert((ptr) != NULL);                     \
        if (*(ptr) == '-') {                       \
            DISPLAY("error: command cannot be separated from its argument by another command \n"); \
            CLEAN_RETURN(1);                       \
        }                                          \
    } else {                                       \
        (ptr) = ++argument;                        \
        argument += strlen(ptr);                   \
    }                                              \
}
670*a28cd43dSSascha Wildner
/* NEXT_UINT32(val32) :
 * Locates the value of the option currently being parsed with NEXT_FIELD(),
 * then stores its numeric conversion by readU32FromChar() into `val32`.
 * Same expansion-site requirements as NEXT_FIELD().
 * The temporary deliberately avoids a leading double underscore : such
 * identifiers are reserved for the implementation. */
#define NEXT_UINT32(val32) {                       \
    const char* nextU32Field;                      \
    NEXT_FIELD(nextU32Field);                      \
    val32 = readU32FromChar(&nextU32Field);        \
}
676*a28cd43dSSascha Wildner
/* Printable strategy names.
 * The table holds ZSTD_NB_STRATEGIES names starting at index 1 ;
 * index 0 is an empty-string placeholder.
 * NOTE(review): presumably indexed by ZSTD_strategy value - confirm against its users. */
#define ZSTD_NB_STRATEGIES 9
static const char* ZSTD_strategyMap[ZSTD_NB_STRATEGIES + 1] = { "", "ZSTD_fast",
                "ZSTD_dfast", "ZSTD_greedy", "ZSTD_lazy", "ZSTD_lazy2", "ZSTD_btlazy2",
                "ZSTD_btopt", "ZSTD_btultra", "ZSTD_btultra2"};
681*a28cd43dSSascha Wildner
/* Operation selected on the command line (e.g. --compress, --decompress, --test, --train, --list). */
typedef enum { zom_compress, zom_decompress, zom_test, zom_bench, zom_train, zom_list } zstd_operation_mode;
683*a28cd43dSSascha Wildner
/* CLEAN_RETURN(i) :
 * stores `i` into `operationResult`, then jumps to label `_end` ;
 * both must exist in the function where the macro is expanded. */
#define CLEAN_RETURN(i) { operationResult = (i); goto _end; }
685*a28cd43dSSascha Wildner
/* MINCLEVEL / MAXCLEVEL :
 * bounds of the compression level range.
 * They are fixed constants when ZSTD_NOCOMPRESS is defined,
 * and calls into the compression library otherwise. */
#ifdef ZSTD_NOCOMPRESS
/* symbols from compression library are not defined and should not be invoked */
# define MINCLEVEL  -99
# define MAXCLEVEL   22
#else
# define MINCLEVEL  ZSTD_minCLevel()
# define MAXCLEVEL  ZSTD_maxCLevel()
#endif
694*a28cd43dSSascha Wildner
main(int const argCount,const char * argv[])695*a28cd43dSSascha Wildner int main(int const argCount, const char* argv[])
696*a28cd43dSSascha Wildner {
697*a28cd43dSSascha Wildner int argNb,
698*a28cd43dSSascha Wildner followLinks = 0,
699*a28cd43dSSascha Wildner forceStdout = 0,
700*a28cd43dSSascha Wildner hasStdout = 0,
701*a28cd43dSSascha Wildner ldmFlag = 0,
702*a28cd43dSSascha Wildner main_pause = 0,
703*a28cd43dSSascha Wildner nbWorkers = 0,
704*a28cd43dSSascha Wildner adapt = 0,
705*a28cd43dSSascha Wildner adaptMin = MINCLEVEL,
706*a28cd43dSSascha Wildner adaptMax = MAXCLEVEL,
707*a28cd43dSSascha Wildner rsyncable = 0,
708*a28cd43dSSascha Wildner nextArgumentsAreFiles = 0,
709*a28cd43dSSascha Wildner operationResult = 0,
710*a28cd43dSSascha Wildner separateFiles = 0,
711*a28cd43dSSascha Wildner setRealTimePrio = 0,
712*a28cd43dSSascha Wildner singleThread = 0,
713*a28cd43dSSascha Wildner showDefaultCParams = 0,
714*a28cd43dSSascha Wildner ultra=0,
715*a28cd43dSSascha Wildner contentSize=1;
716*a28cd43dSSascha Wildner double compressibility = 0.5;
717*a28cd43dSSascha Wildner unsigned bench_nbSeconds = 3; /* would be better if this value was synchronized from bench */
718*a28cd43dSSascha Wildner size_t blockSize = 0;
719*a28cd43dSSascha Wildner
720*a28cd43dSSascha Wildner FIO_prefs_t* const prefs = FIO_createPreferences();
721*a28cd43dSSascha Wildner FIO_ctx_t* const fCtx = FIO_createContext();
722*a28cd43dSSascha Wildner zstd_operation_mode operation = zom_compress;
723*a28cd43dSSascha Wildner ZSTD_compressionParameters compressionParams;
724*a28cd43dSSascha Wildner int cLevel = init_cLevel();
725*a28cd43dSSascha Wildner int cLevelLast = MINCLEVEL - 1; /* lower than minimum */
726*a28cd43dSSascha Wildner unsigned recursive = 0;
727*a28cd43dSSascha Wildner unsigned memLimit = 0;
728*a28cd43dSSascha Wildner FileNamesTable* filenames = UTIL_allocateFileNamesTable((size_t)argCount); /* argCount >= 1 */
729*a28cd43dSSascha Wildner FileNamesTable* file_of_names = UTIL_allocateFileNamesTable((size_t)argCount); /* argCount >= 1 */
730*a28cd43dSSascha Wildner const char* programName = argv[0];
731*a28cd43dSSascha Wildner const char* outFileName = NULL;
732*a28cd43dSSascha Wildner const char* outDirName = NULL;
733*a28cd43dSSascha Wildner const char* outMirroredDirName = NULL;
734*a28cd43dSSascha Wildner const char* dictFileName = NULL;
735*a28cd43dSSascha Wildner const char* patchFromDictFileName = NULL;
736*a28cd43dSSascha Wildner const char* suffix = ZSTD_EXTENSION;
737*a28cd43dSSascha Wildner unsigned maxDictSize = g_defaultMaxDictSize;
738*a28cd43dSSascha Wildner unsigned dictID = 0;
739*a28cd43dSSascha Wildner size_t streamSrcSize = 0;
740*a28cd43dSSascha Wildner size_t targetCBlockSize = 0;
741*a28cd43dSSascha Wildner size_t srcSizeHint = 0;
742*a28cd43dSSascha Wildner int dictCLevel = g_defaultDictCLevel;
743*a28cd43dSSascha Wildner unsigned dictSelect = g_defaultSelectivityLevel;
744*a28cd43dSSascha Wildner #ifndef ZSTD_NODICT
745*a28cd43dSSascha Wildner ZDICT_cover_params_t coverParams = defaultCoverParams();
746*a28cd43dSSascha Wildner ZDICT_fastCover_params_t fastCoverParams = defaultFastCoverParams();
747*a28cd43dSSascha Wildner dictType dict = fastCover;
748*a28cd43dSSascha Wildner #endif
749*a28cd43dSSascha Wildner #ifndef ZSTD_NOBENCH
750*a28cd43dSSascha Wildner BMK_advancedParams_t benchParams = BMK_initAdvancedParams();
751*a28cd43dSSascha Wildner #endif
752*a28cd43dSSascha Wildner ZSTD_literalCompressionMode_e literalCompressionMode = ZSTD_lcm_auto;
753*a28cd43dSSascha Wildner
754*a28cd43dSSascha Wildner
755*a28cd43dSSascha Wildner /* init */
756*a28cd43dSSascha Wildner (void)recursive; (void)cLevelLast; /* not used when ZSTD_NOBENCH set */
757*a28cd43dSSascha Wildner (void)memLimit;
758*a28cd43dSSascha Wildner assert(argCount >= 1);
759*a28cd43dSSascha Wildner if ((filenames==NULL) || (file_of_names==NULL)) { DISPLAY("zstd: allocation error \n"); exit(1); }
760*a28cd43dSSascha Wildner programName = lastNameFromPath(programName);
761*a28cd43dSSascha Wildner #ifdef ZSTD_MULTITHREAD
762*a28cd43dSSascha Wildner nbWorkers = init_nbThreads();
763*a28cd43dSSascha Wildner #endif
764*a28cd43dSSascha Wildner
765*a28cd43dSSascha Wildner /* preset behaviors */
766*a28cd43dSSascha Wildner if (exeNameMatch(programName, ZSTD_ZSTDMT)) nbWorkers=0, singleThread=0;
767*a28cd43dSSascha Wildner if (exeNameMatch(programName, ZSTD_UNZSTD)) operation=zom_decompress;
768*a28cd43dSSascha Wildner if (exeNameMatch(programName, ZSTD_CAT)) { operation=zom_decompress; FIO_overwriteMode(prefs); forceStdout=1; followLinks=1; outFileName=stdoutmark; g_displayLevel=1; } /* supports multiple formats */
769*a28cd43dSSascha Wildner if (exeNameMatch(programName, ZSTD_ZCAT)) { operation=zom_decompress; FIO_overwriteMode(prefs); forceStdout=1; followLinks=1; outFileName=stdoutmark; g_displayLevel=1; } /* behave like zcat, also supports multiple formats */
770*a28cd43dSSascha Wildner if (exeNameMatch(programName, ZSTD_GZ)) { suffix = GZ_EXTENSION; FIO_setCompressionType(prefs, FIO_gzipCompression); FIO_setRemoveSrcFile(prefs, 1); } /* behave like gzip */
771*a28cd43dSSascha Wildner if (exeNameMatch(programName, ZSTD_GUNZIP)) { operation=zom_decompress; FIO_setRemoveSrcFile(prefs, 1); } /* behave like gunzip, also supports multiple formats */
772*a28cd43dSSascha Wildner if (exeNameMatch(programName, ZSTD_GZCAT)) { operation=zom_decompress; FIO_overwriteMode(prefs); forceStdout=1; followLinks=1; outFileName=stdoutmark; g_displayLevel=1; } /* behave like gzcat, also supports multiple formats */
773*a28cd43dSSascha Wildner if (exeNameMatch(programName, ZSTD_LZMA)) { suffix = LZMA_EXTENSION; FIO_setCompressionType(prefs, FIO_lzmaCompression); FIO_setRemoveSrcFile(prefs, 1); } /* behave like lzma */
774*a28cd43dSSascha Wildner if (exeNameMatch(programName, ZSTD_UNLZMA)) { operation=zom_decompress; FIO_setCompressionType(prefs, FIO_lzmaCompression); FIO_setRemoveSrcFile(prefs, 1); } /* behave like unlzma, also supports multiple formats */
775*a28cd43dSSascha Wildner if (exeNameMatch(programName, ZSTD_XZ)) { suffix = XZ_EXTENSION; FIO_setCompressionType(prefs, FIO_xzCompression); FIO_setRemoveSrcFile(prefs, 1); } /* behave like xz */
776*a28cd43dSSascha Wildner if (exeNameMatch(programName, ZSTD_UNXZ)) { operation=zom_decompress; FIO_setCompressionType(prefs, FIO_xzCompression); FIO_setRemoveSrcFile(prefs, 1); } /* behave like unxz, also supports multiple formats */
777*a28cd43dSSascha Wildner if (exeNameMatch(programName, ZSTD_LZ4)) { suffix = LZ4_EXTENSION; FIO_setCompressionType(prefs, FIO_lz4Compression); } /* behave like lz4 */
778*a28cd43dSSascha Wildner if (exeNameMatch(programName, ZSTD_UNLZ4)) { operation=zom_decompress; FIO_setCompressionType(prefs, FIO_lz4Compression); } /* behave like unlz4, also supports multiple formats */
779*a28cd43dSSascha Wildner memset(&compressionParams, 0, sizeof(compressionParams));
780*a28cd43dSSascha Wildner
781*a28cd43dSSascha Wildner /* init crash handler */
782*a28cd43dSSascha Wildner FIO_addAbortHandler();
783*a28cd43dSSascha Wildner
784*a28cd43dSSascha Wildner /* command switches */
785*a28cd43dSSascha Wildner for (argNb=1; argNb<argCount; argNb++) {
786*a28cd43dSSascha Wildner const char* argument = argv[argNb];
787*a28cd43dSSascha Wildner if (!argument) continue; /* Protection if argument empty */
788*a28cd43dSSascha Wildner
789*a28cd43dSSascha Wildner if (nextArgumentsAreFiles) {
790*a28cd43dSSascha Wildner UTIL_refFilename(filenames, argument);
791*a28cd43dSSascha Wildner continue;
792*a28cd43dSSascha Wildner }
793*a28cd43dSSascha Wildner
794*a28cd43dSSascha Wildner /* "-" means stdin/stdout */
795*a28cd43dSSascha Wildner if (!strcmp(argument, "-")){
796*a28cd43dSSascha Wildner UTIL_refFilename(filenames, stdinmark);
797*a28cd43dSSascha Wildner continue;
798*a28cd43dSSascha Wildner }
799*a28cd43dSSascha Wildner
800*a28cd43dSSascha Wildner /* Decode commands (note : aggregated commands are allowed) */
801*a28cd43dSSascha Wildner if (argument[0]=='-') {
802*a28cd43dSSascha Wildner
803*a28cd43dSSascha Wildner if (argument[1]=='-') {
804*a28cd43dSSascha Wildner /* long commands (--long-word) */
805*a28cd43dSSascha Wildner if (!strcmp(argument, "--")) { nextArgumentsAreFiles=1; continue; } /* only file names allowed from now on */
806*a28cd43dSSascha Wildner if (!strcmp(argument, "--list")) { operation=zom_list; continue; }
807*a28cd43dSSascha Wildner if (!strcmp(argument, "--compress")) { operation=zom_compress; continue; }
808*a28cd43dSSascha Wildner if (!strcmp(argument, "--decompress")) { operation=zom_decompress; continue; }
809*a28cd43dSSascha Wildner if (!strcmp(argument, "--uncompress")) { operation=zom_decompress; continue; }
810*a28cd43dSSascha Wildner if (!strcmp(argument, "--force")) { FIO_overwriteMode(prefs); forceStdout=1; followLinks=1; continue; }
811*a28cd43dSSascha Wildner if (!strcmp(argument, "--version")) { printVersion(); CLEAN_RETURN(0); }
812*a28cd43dSSascha Wildner if (!strcmp(argument, "--help")) { usage_advanced(programName); CLEAN_RETURN(0); }
813*a28cd43dSSascha Wildner if (!strcmp(argument, "--verbose")) { g_displayLevel++; continue; }
814*a28cd43dSSascha Wildner if (!strcmp(argument, "--quiet")) { g_displayLevel--; continue; }
815*a28cd43dSSascha Wildner if (!strcmp(argument, "--stdout")) { forceStdout=1; outFileName=stdoutmark; g_displayLevel-=(g_displayLevel==2); continue; }
816*a28cd43dSSascha Wildner if (!strcmp(argument, "--ultra")) { ultra=1; continue; }
817*a28cd43dSSascha Wildner if (!strcmp(argument, "--check")) { FIO_setChecksumFlag(prefs, 2); continue; }
818*a28cd43dSSascha Wildner if (!strcmp(argument, "--no-check")) { FIO_setChecksumFlag(prefs, 0); continue; }
819*a28cd43dSSascha Wildner if (!strcmp(argument, "--sparse")) { FIO_setSparseWrite(prefs, 2); continue; }
820*a28cd43dSSascha Wildner if (!strcmp(argument, "--no-sparse")) { FIO_setSparseWrite(prefs, 0); continue; }
821*a28cd43dSSascha Wildner if (!strcmp(argument, "--test")) { operation=zom_test; continue; }
822*a28cd43dSSascha Wildner if (!strcmp(argument, "--train")) { operation=zom_train; if (outFileName==NULL) outFileName=g_defaultDictName; continue; }
823*a28cd43dSSascha Wildner if (!strcmp(argument, "--no-dictID")) { FIO_setDictIDFlag(prefs, 0); continue; }
824*a28cd43dSSascha Wildner if (!strcmp(argument, "--keep")) { FIO_setRemoveSrcFile(prefs, 0); continue; }
825*a28cd43dSSascha Wildner if (!strcmp(argument, "--rm")) { FIO_setRemoveSrcFile(prefs, 1); continue; }
826*a28cd43dSSascha Wildner if (!strcmp(argument, "--priority=rt")) { setRealTimePrio = 1; continue; }
827*a28cd43dSSascha Wildner if (!strcmp(argument, "--show-default-cparams")) { showDefaultCParams = 1; continue; }
828*a28cd43dSSascha Wildner if (!strcmp(argument, "--content-size")) { contentSize = 1; continue; }
829*a28cd43dSSascha Wildner if (!strcmp(argument, "--no-content-size")) { contentSize = 0; continue; }
830*a28cd43dSSascha Wildner if (!strcmp(argument, "--adapt")) { adapt = 1; continue; }
831*a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--adapt=")) { adapt = 1; if (!parseAdaptParameters(argument, &adaptMin, &adaptMax)) { badusage(programName); CLEAN_RETURN(1); } continue; }
832*a28cd43dSSascha Wildner if (!strcmp(argument, "--single-thread")) { nbWorkers = 0; singleThread = 1; continue; }
833*a28cd43dSSascha Wildner if (!strcmp(argument, "--format=zstd")) { suffix = ZSTD_EXTENSION; FIO_setCompressionType(prefs, FIO_zstdCompression); continue; }
834*a28cd43dSSascha Wildner #ifdef ZSTD_GZCOMPRESS
835*a28cd43dSSascha Wildner if (!strcmp(argument, "--format=gzip")) { suffix = GZ_EXTENSION; FIO_setCompressionType(prefs, FIO_gzipCompression); continue; }
836*a28cd43dSSascha Wildner #endif
837*a28cd43dSSascha Wildner #ifdef ZSTD_LZMACOMPRESS
838*a28cd43dSSascha Wildner if (!strcmp(argument, "--format=lzma")) { suffix = LZMA_EXTENSION; FIO_setCompressionType(prefs, FIO_lzmaCompression); continue; }
839*a28cd43dSSascha Wildner if (!strcmp(argument, "--format=xz")) { suffix = XZ_EXTENSION; FIO_setCompressionType(prefs, FIO_xzCompression); continue; }
840*a28cd43dSSascha Wildner #endif
841*a28cd43dSSascha Wildner #ifdef ZSTD_LZ4COMPRESS
842*a28cd43dSSascha Wildner if (!strcmp(argument, "--format=lz4")) { suffix = LZ4_EXTENSION; FIO_setCompressionType(prefs, FIO_lz4Compression); continue; }
843*a28cd43dSSascha Wildner #endif
844*a28cd43dSSascha Wildner if (!strcmp(argument, "--rsyncable")) { rsyncable = 1; continue; }
845*a28cd43dSSascha Wildner if (!strcmp(argument, "--compress-literals")) { literalCompressionMode = ZSTD_lcm_huffman; continue; }
846*a28cd43dSSascha Wildner if (!strcmp(argument, "--no-compress-literals")) { literalCompressionMode = ZSTD_lcm_uncompressed; continue; }
847*a28cd43dSSascha Wildner if (!strcmp(argument, "--no-progress")) { FIO_setNoProgress(1); continue; }
848*a28cd43dSSascha Wildner if (!strcmp(argument, "--exclude-compressed")) { FIO_setExcludeCompressedFile(prefs, 1); continue; }
849*a28cd43dSSascha Wildner
850*a28cd43dSSascha Wildner /* long commands with arguments */
851*a28cd43dSSascha Wildner #ifndef ZSTD_NODICT
852*a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--train-cover")) {
853*a28cd43dSSascha Wildner operation = zom_train;
854*a28cd43dSSascha Wildner if (outFileName == NULL)
855*a28cd43dSSascha Wildner outFileName = g_defaultDictName;
856*a28cd43dSSascha Wildner dict = cover;
857*a28cd43dSSascha Wildner /* Allow optional arguments following an = */
858*a28cd43dSSascha Wildner if (*argument == 0) { memset(&coverParams, 0, sizeof(coverParams)); }
859*a28cd43dSSascha Wildner else if (*argument++ != '=') { badusage(programName); CLEAN_RETURN(1); }
860*a28cd43dSSascha Wildner else if (!parseCoverParameters(argument, &coverParams)) { badusage(programName); CLEAN_RETURN(1); }
861*a28cd43dSSascha Wildner continue;
862*a28cd43dSSascha Wildner }
863*a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--train-fastcover")) {
864*a28cd43dSSascha Wildner operation = zom_train;
865*a28cd43dSSascha Wildner if (outFileName == NULL)
866*a28cd43dSSascha Wildner outFileName = g_defaultDictName;
867*a28cd43dSSascha Wildner dict = fastCover;
868*a28cd43dSSascha Wildner /* Allow optional arguments following an = */
869*a28cd43dSSascha Wildner if (*argument == 0) { memset(&fastCoverParams, 0, sizeof(fastCoverParams)); }
870*a28cd43dSSascha Wildner else if (*argument++ != '=') { badusage(programName); CLEAN_RETURN(1); }
871*a28cd43dSSascha Wildner else if (!parseFastCoverParameters(argument, &fastCoverParams)) { badusage(programName); CLEAN_RETURN(1); }
872*a28cd43dSSascha Wildner continue;
873*a28cd43dSSascha Wildner }
874*a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--train-legacy")) {
875*a28cd43dSSascha Wildner operation = zom_train;
876*a28cd43dSSascha Wildner if (outFileName == NULL)
877*a28cd43dSSascha Wildner outFileName = g_defaultDictName;
878*a28cd43dSSascha Wildner dict = legacy;
879*a28cd43dSSascha Wildner /* Allow optional arguments following an = */
880*a28cd43dSSascha Wildner if (*argument == 0) { continue; }
881*a28cd43dSSascha Wildner else if (*argument++ != '=') { badusage(programName); CLEAN_RETURN(1); }
882*a28cd43dSSascha Wildner else if (!parseLegacyParameters(argument, &dictSelect)) { badusage(programName); CLEAN_RETURN(1); }
883*a28cd43dSSascha Wildner continue;
884*a28cd43dSSascha Wildner }
885*a28cd43dSSascha Wildner #endif
886*a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--threads")) { NEXT_UINT32(nbWorkers); continue; }
887*a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--memlimit")) { NEXT_UINT32(memLimit); continue; }
888*a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--memory")) { NEXT_UINT32(memLimit); continue; }
889*a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--memlimit-decompress")) { NEXT_UINT32(memLimit); continue; }
890*a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--block-size=")) { blockSize = readSizeTFromChar(&argument); continue; }
891*a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--maxdict")) { NEXT_UINT32(maxDictSize); continue; }
892*a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--dictID")) { NEXT_UINT32(dictID); continue; }
893*a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--zstd=")) { if (!parseCompressionParameters(argument, &compressionParams)) { badusage(programName); CLEAN_RETURN(1); } continue; }
894*a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--stream-size=")) { streamSrcSize = readSizeTFromChar(&argument); continue; }
895*a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--target-compressed-block-size=")) { targetCBlockSize = readSizeTFromChar(&argument); continue; }
896*a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--size-hint=")) { srcSizeHint = readSizeTFromChar(&argument); continue; }
897*a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--output-dir-flat")) { NEXT_FIELD(outDirName); continue; }
898*a28cd43dSSascha Wildner #ifdef UTIL_HAS_MIRRORFILELIST
899*a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--output-dir-mirror")) { NEXT_FIELD(outMirroredDirName); continue; }
900*a28cd43dSSascha Wildner #endif
901*a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--patch-from")) { NEXT_FIELD(patchFromDictFileName); continue; }
902*a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--long")) {
903*a28cd43dSSascha Wildner unsigned ldmWindowLog = 0;
904*a28cd43dSSascha Wildner ldmFlag = 1;
905*a28cd43dSSascha Wildner /* Parse optional window log */
906*a28cd43dSSascha Wildner if (*argument == '=') {
907*a28cd43dSSascha Wildner ++argument;
908*a28cd43dSSascha Wildner ldmWindowLog = readU32FromChar(&argument);
909*a28cd43dSSascha Wildner } else if (*argument != 0) {
910*a28cd43dSSascha Wildner /* Invalid character following --long */
911*a28cd43dSSascha Wildner badusage(programName);
912*a28cd43dSSascha Wildner CLEAN_RETURN(1);
913*a28cd43dSSascha Wildner }
914*a28cd43dSSascha Wildner /* Only set windowLog if not already set by --zstd */
915*a28cd43dSSascha Wildner if (compressionParams.windowLog == 0)
916*a28cd43dSSascha Wildner compressionParams.windowLog = ldmWindowLog;
917*a28cd43dSSascha Wildner continue;
918*a28cd43dSSascha Wildner }
919*a28cd43dSSascha Wildner #ifndef ZSTD_NOCOMPRESS /* linking ZSTD_minCLevel() requires compression support */
920*a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--fast")) {
921*a28cd43dSSascha Wildner /* Parse optional acceleration factor */
922*a28cd43dSSascha Wildner if (*argument == '=') {
923*a28cd43dSSascha Wildner U32 const maxFast = (U32)-ZSTD_minCLevel();
924*a28cd43dSSascha Wildner U32 fastLevel;
925*a28cd43dSSascha Wildner ++argument;
926*a28cd43dSSascha Wildner fastLevel = readU32FromChar(&argument);
927*a28cd43dSSascha Wildner if (fastLevel > maxFast) fastLevel = maxFast;
928*a28cd43dSSascha Wildner if (fastLevel) {
929*a28cd43dSSascha Wildner dictCLevel = cLevel = -(int)fastLevel;
930*a28cd43dSSascha Wildner } else {
931*a28cd43dSSascha Wildner badusage(programName);
932*a28cd43dSSascha Wildner CLEAN_RETURN(1);
933*a28cd43dSSascha Wildner }
934*a28cd43dSSascha Wildner } else if (*argument != 0) {
935*a28cd43dSSascha Wildner /* Invalid character following --fast */
936*a28cd43dSSascha Wildner badusage(programName);
937*a28cd43dSSascha Wildner CLEAN_RETURN(1);
938*a28cd43dSSascha Wildner } else {
939*a28cd43dSSascha Wildner cLevel = -1; /* default for --fast */
940*a28cd43dSSascha Wildner }
941*a28cd43dSSascha Wildner continue;
942*a28cd43dSSascha Wildner }
943*a28cd43dSSascha Wildner #endif
944*a28cd43dSSascha Wildner
945*a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--filelist")) {
946*a28cd43dSSascha Wildner const char* listName;
947*a28cd43dSSascha Wildner NEXT_FIELD(listName);
948*a28cd43dSSascha Wildner UTIL_refFilename(file_of_names, listName);
949*a28cd43dSSascha Wildner continue;
950*a28cd43dSSascha Wildner }
951*a28cd43dSSascha Wildner
952*a28cd43dSSascha Wildner /* fall-through, will trigger bad_usage() later on */
953*a28cd43dSSascha Wildner }
954*a28cd43dSSascha Wildner
955*a28cd43dSSascha Wildner argument++;
956*a28cd43dSSascha Wildner while (argument[0]!=0) {
957*a28cd43dSSascha Wildner
958*a28cd43dSSascha Wildner #ifndef ZSTD_NOCOMPRESS
959*a28cd43dSSascha Wildner /* compression Level */
960*a28cd43dSSascha Wildner if ((*argument>='0') && (*argument<='9')) {
961*a28cd43dSSascha Wildner dictCLevel = cLevel = (int)readU32FromChar(&argument);
962*a28cd43dSSascha Wildner continue;
963*a28cd43dSSascha Wildner }
964*a28cd43dSSascha Wildner #endif
965*a28cd43dSSascha Wildner
966*a28cd43dSSascha Wildner switch(argument[0])
967*a28cd43dSSascha Wildner {
968*a28cd43dSSascha Wildner /* Display help */
969*a28cd43dSSascha Wildner case 'V': printVersion(); CLEAN_RETURN(0); /* Version Only */
970*a28cd43dSSascha Wildner case 'H':
971*a28cd43dSSascha Wildner case 'h': usage_advanced(programName); CLEAN_RETURN(0);
972*a28cd43dSSascha Wildner
973*a28cd43dSSascha Wildner /* Compress */
974*a28cd43dSSascha Wildner case 'z': operation=zom_compress; argument++; break;
975*a28cd43dSSascha Wildner
976*a28cd43dSSascha Wildner /* Decoding */
977*a28cd43dSSascha Wildner case 'd':
978*a28cd43dSSascha Wildner #ifndef ZSTD_NOBENCH
979*a28cd43dSSascha Wildner benchParams.mode = BMK_decodeOnly;
980*a28cd43dSSascha Wildner if (operation==zom_bench) { argument++; break; } /* benchmark decode (hidden option) */
981*a28cd43dSSascha Wildner #endif
982*a28cd43dSSascha Wildner operation=zom_decompress; argument++; break;
983*a28cd43dSSascha Wildner
984*a28cd43dSSascha Wildner /* Force stdout, even if stdout==console */
985*a28cd43dSSascha Wildner case 'c': forceStdout=1; outFileName=stdoutmark; argument++; break;
986*a28cd43dSSascha Wildner
987*a28cd43dSSascha Wildner /* Use file content as dictionary */
988*a28cd43dSSascha Wildner case 'D': argument++; NEXT_FIELD(dictFileName); break;
989*a28cd43dSSascha Wildner
990*a28cd43dSSascha Wildner /* Overwrite */
991*a28cd43dSSascha Wildner case 'f': FIO_overwriteMode(prefs); forceStdout=1; followLinks=1; argument++; break;
992*a28cd43dSSascha Wildner
993*a28cd43dSSascha Wildner /* Verbose mode */
994*a28cd43dSSascha Wildner case 'v': g_displayLevel++; argument++; break;
995*a28cd43dSSascha Wildner
996*a28cd43dSSascha Wildner /* Quiet mode */
997*a28cd43dSSascha Wildner case 'q': g_displayLevel--; argument++; break;
998*a28cd43dSSascha Wildner
999*a28cd43dSSascha Wildner /* keep source file (default) */
1000*a28cd43dSSascha Wildner case 'k': FIO_setRemoveSrcFile(prefs, 0); argument++; break;
1001*a28cd43dSSascha Wildner
1002*a28cd43dSSascha Wildner /* Checksum */
1003*a28cd43dSSascha Wildner case 'C': FIO_setChecksumFlag(prefs, 2); argument++; break;
1004*a28cd43dSSascha Wildner
1005*a28cd43dSSascha Wildner /* test compressed file */
1006*a28cd43dSSascha Wildner case 't': operation=zom_test; argument++; break;
1007*a28cd43dSSascha Wildner
1008*a28cd43dSSascha Wildner /* destination file name */
1009*a28cd43dSSascha Wildner case 'o': argument++; NEXT_FIELD(outFileName); break;
1010*a28cd43dSSascha Wildner
1011*a28cd43dSSascha Wildner /* limit memory */
1012*a28cd43dSSascha Wildner case 'M':
1013*a28cd43dSSascha Wildner argument++;
1014*a28cd43dSSascha Wildner memLimit = readU32FromChar(&argument);
1015*a28cd43dSSascha Wildner break;
1016*a28cd43dSSascha Wildner case 'l': operation=zom_list; argument++; break;
1017*a28cd43dSSascha Wildner #ifdef UTIL_HAS_CREATEFILELIST
1018*a28cd43dSSascha Wildner /* recursive */
1019*a28cd43dSSascha Wildner case 'r': recursive=1; argument++; break;
1020*a28cd43dSSascha Wildner #endif
1021*a28cd43dSSascha Wildner
1022*a28cd43dSSascha Wildner #ifndef ZSTD_NOBENCH
1023*a28cd43dSSascha Wildner /* Benchmark */
1024*a28cd43dSSascha Wildner case 'b':
1025*a28cd43dSSascha Wildner operation=zom_bench;
1026*a28cd43dSSascha Wildner argument++;
1027*a28cd43dSSascha Wildner break;
1028*a28cd43dSSascha Wildner
1029*a28cd43dSSascha Wildner /* range bench (benchmark only) */
1030*a28cd43dSSascha Wildner case 'e':
1031*a28cd43dSSascha Wildner /* compression Level */
1032*a28cd43dSSascha Wildner argument++;
1033*a28cd43dSSascha Wildner cLevelLast = (int)readU32FromChar(&argument);
1034*a28cd43dSSascha Wildner break;
1035*a28cd43dSSascha Wildner
1036*a28cd43dSSascha Wildner /* Modify Nb Iterations (benchmark only) */
1037*a28cd43dSSascha Wildner case 'i':
1038*a28cd43dSSascha Wildner argument++;
1039*a28cd43dSSascha Wildner bench_nbSeconds = readU32FromChar(&argument);
1040*a28cd43dSSascha Wildner break;
1041*a28cd43dSSascha Wildner
1042*a28cd43dSSascha Wildner /* cut input into blocks (benchmark only) */
1043*a28cd43dSSascha Wildner case 'B':
1044*a28cd43dSSascha Wildner argument++;
1045*a28cd43dSSascha Wildner blockSize = readU32FromChar(&argument);
1046*a28cd43dSSascha Wildner break;
1047*a28cd43dSSascha Wildner
1048*a28cd43dSSascha Wildner /* benchmark files separately (hidden option) */
1049*a28cd43dSSascha Wildner case 'S':
1050*a28cd43dSSascha Wildner argument++;
1051*a28cd43dSSascha Wildner separateFiles = 1;
1052*a28cd43dSSascha Wildner break;
1053*a28cd43dSSascha Wildner
1054*a28cd43dSSascha Wildner #endif /* ZSTD_NOBENCH */
1055*a28cd43dSSascha Wildner
1056*a28cd43dSSascha Wildner /* nb of threads (hidden option) */
1057*a28cd43dSSascha Wildner case 'T':
1058*a28cd43dSSascha Wildner argument++;
1059*a28cd43dSSascha Wildner nbWorkers = (int)readU32FromChar(&argument);
1060*a28cd43dSSascha Wildner break;
1061*a28cd43dSSascha Wildner
1062*a28cd43dSSascha Wildner /* Dictionary Selection level */
1063*a28cd43dSSascha Wildner case 's':
1064*a28cd43dSSascha Wildner argument++;
1065*a28cd43dSSascha Wildner dictSelect = readU32FromChar(&argument);
1066*a28cd43dSSascha Wildner break;
1067*a28cd43dSSascha Wildner
1068*a28cd43dSSascha Wildner /* Pause at the end (-p) or set an additional param (-p#) (hidden option) */
1069*a28cd43dSSascha Wildner case 'p': argument++;
1070*a28cd43dSSascha Wildner #ifndef ZSTD_NOBENCH
1071*a28cd43dSSascha Wildner if ((*argument>='0') && (*argument<='9')) {
1072*a28cd43dSSascha Wildner benchParams.additionalParam = (int)readU32FromChar(&argument);
1073*a28cd43dSSascha Wildner } else
1074*a28cd43dSSascha Wildner #endif
1075*a28cd43dSSascha Wildner main_pause=1;
1076*a28cd43dSSascha Wildner break;
1077*a28cd43dSSascha Wildner
1078*a28cd43dSSascha Wildner /* Select compressibility of synthetic sample */
1079*a28cd43dSSascha Wildner case 'P':
1080*a28cd43dSSascha Wildner argument++;
1081*a28cd43dSSascha Wildner compressibility = (double)readU32FromChar(&argument) / 100;
1082*a28cd43dSSascha Wildner break;
1083*a28cd43dSSascha Wildner
1084*a28cd43dSSascha Wildner /* unknown command */
1085*a28cd43dSSascha Wildner default : badusage(programName); CLEAN_RETURN(1);
1086*a28cd43dSSascha Wildner }
1087*a28cd43dSSascha Wildner }
1088*a28cd43dSSascha Wildner continue;
1089*a28cd43dSSascha Wildner } /* if (argument[0]=='-') */
1090*a28cd43dSSascha Wildner
1091*a28cd43dSSascha Wildner /* none of the above : add filename to list */
1092*a28cd43dSSascha Wildner UTIL_refFilename(filenames, argument);
1093*a28cd43dSSascha Wildner }
1094*a28cd43dSSascha Wildner
1095*a28cd43dSSascha Wildner /* Welcome message (if verbose) */
1096*a28cd43dSSascha Wildner DISPLAYLEVEL(3, WELCOME_MESSAGE);
1097*a28cd43dSSascha Wildner
1098*a28cd43dSSascha Wildner #ifdef ZSTD_MULTITHREAD
1099*a28cd43dSSascha Wildner if ((nbWorkers==0) && (!singleThread)) {
1100*a28cd43dSSascha Wildner /* automatically set # workers based on # of reported cpus */
1101*a28cd43dSSascha Wildner nbWorkers = UTIL_countPhysicalCores();
1102*a28cd43dSSascha Wildner DISPLAYLEVEL(3, "Note: %d physical core(s) detected \n", nbWorkers);
1103*a28cd43dSSascha Wildner }
1104*a28cd43dSSascha Wildner #else
1105*a28cd43dSSascha Wildner (void)singleThread; (void)nbWorkers;
1106*a28cd43dSSascha Wildner #endif
1107*a28cd43dSSascha Wildner
1108*a28cd43dSSascha Wildner #ifdef UTIL_HAS_CREATEFILELIST
1109*a28cd43dSSascha Wildner g_utilDisplayLevel = g_displayLevel;
1110*a28cd43dSSascha Wildner if (!followLinks) {
1111*a28cd43dSSascha Wildner unsigned u, fileNamesNb;
1112*a28cd43dSSascha Wildner unsigned const nbFilenames = (unsigned)filenames->tableSize;
1113*a28cd43dSSascha Wildner for (u=0, fileNamesNb=0; u<nbFilenames; u++) {
1114*a28cd43dSSascha Wildner if ( UTIL_isLink(filenames->fileNames[u])
1115*a28cd43dSSascha Wildner && !UTIL_isFIFO(filenames->fileNames[u])
1116*a28cd43dSSascha Wildner ) {
1117*a28cd43dSSascha Wildner DISPLAYLEVEL(2, "Warning : %s is a symbolic link, ignoring \n", filenames->fileNames[u]);
1118*a28cd43dSSascha Wildner } else {
1119*a28cd43dSSascha Wildner filenames->fileNames[fileNamesNb++] = filenames->fileNames[u];
1120*a28cd43dSSascha Wildner } }
1121*a28cd43dSSascha Wildner if (fileNamesNb == 0 && nbFilenames > 0) /* all names are eliminated */
1122*a28cd43dSSascha Wildner CLEAN_RETURN(1);
1123*a28cd43dSSascha Wildner filenames->tableSize = fileNamesNb;
1124*a28cd43dSSascha Wildner } /* if (!followLinks) */
1125*a28cd43dSSascha Wildner
1126*a28cd43dSSascha Wildner /* read names from a file */
1127*a28cd43dSSascha Wildner if (file_of_names->tableSize) {
1128*a28cd43dSSascha Wildner size_t const nbFileLists = file_of_names->tableSize;
1129*a28cd43dSSascha Wildner size_t flNb;
1130*a28cd43dSSascha Wildner for (flNb=0; flNb < nbFileLists; flNb++) {
1131*a28cd43dSSascha Wildner FileNamesTable* const fnt = UTIL_createFileNamesTable_fromFileName(file_of_names->fileNames[flNb]);
1132*a28cd43dSSascha Wildner if (fnt==NULL) {
1133*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "zstd: error reading %s \n", file_of_names->fileNames[flNb]);
1134*a28cd43dSSascha Wildner CLEAN_RETURN(1);
1135*a28cd43dSSascha Wildner }
1136*a28cd43dSSascha Wildner filenames = UTIL_mergeFileNamesTable(filenames, fnt);
1137*a28cd43dSSascha Wildner }
1138*a28cd43dSSascha Wildner }
1139*a28cd43dSSascha Wildner
1140*a28cd43dSSascha Wildner if (recursive) { /* at this stage, filenameTable is a list of paths, which can contain both files and directories */
1141*a28cd43dSSascha Wildner UTIL_expandFNT(&filenames, followLinks);
1142*a28cd43dSSascha Wildner }
1143*a28cd43dSSascha Wildner #else
1144*a28cd43dSSascha Wildner (void)followLinks;
1145*a28cd43dSSascha Wildner #endif
1146*a28cd43dSSascha Wildner
1147*a28cd43dSSascha Wildner if (operation == zom_list) {
1148*a28cd43dSSascha Wildner #ifndef ZSTD_NODECOMPRESS
1149*a28cd43dSSascha Wildner int const ret = FIO_listMultipleFiles((unsigned)filenames->tableSize, filenames->fileNames, g_displayLevel);
1150*a28cd43dSSascha Wildner CLEAN_RETURN(ret);
1151*a28cd43dSSascha Wildner #else
1152*a28cd43dSSascha Wildner DISPLAY("file information is not supported \n");
1153*a28cd43dSSascha Wildner CLEAN_RETURN(1);
1154*a28cd43dSSascha Wildner #endif
1155*a28cd43dSSascha Wildner }
1156*a28cd43dSSascha Wildner
1157*a28cd43dSSascha Wildner /* Check if benchmark is selected */
1158*a28cd43dSSascha Wildner if (operation==zom_bench) {
1159*a28cd43dSSascha Wildner #ifndef ZSTD_NOBENCH
1160*a28cd43dSSascha Wildner benchParams.blockSize = blockSize;
1161*a28cd43dSSascha Wildner benchParams.nbWorkers = nbWorkers;
1162*a28cd43dSSascha Wildner benchParams.realTime = (unsigned)setRealTimePrio;
1163*a28cd43dSSascha Wildner benchParams.nbSeconds = bench_nbSeconds;
1164*a28cd43dSSascha Wildner benchParams.ldmFlag = ldmFlag;
1165*a28cd43dSSascha Wildner benchParams.ldmMinMatch = (int)g_ldmMinMatch;
1166*a28cd43dSSascha Wildner benchParams.ldmHashLog = (int)g_ldmHashLog;
1167*a28cd43dSSascha Wildner if (g_ldmBucketSizeLog != LDM_PARAM_DEFAULT) {
1168*a28cd43dSSascha Wildner benchParams.ldmBucketSizeLog = (int)g_ldmBucketSizeLog;
1169*a28cd43dSSascha Wildner }
1170*a28cd43dSSascha Wildner if (g_ldmHashRateLog != LDM_PARAM_DEFAULT) {
1171*a28cd43dSSascha Wildner benchParams.ldmHashRateLog = (int)g_ldmHashRateLog;
1172*a28cd43dSSascha Wildner }
1173*a28cd43dSSascha Wildner benchParams.literalCompressionMode = literalCompressionMode;
1174*a28cd43dSSascha Wildner
1175*a28cd43dSSascha Wildner if (cLevel > ZSTD_maxCLevel()) cLevel = ZSTD_maxCLevel();
1176*a28cd43dSSascha Wildner if (cLevelLast > ZSTD_maxCLevel()) cLevelLast = ZSTD_maxCLevel();
1177*a28cd43dSSascha Wildner if (cLevelLast < cLevel) cLevelLast = cLevel;
1178*a28cd43dSSascha Wildner if (cLevelLast > cLevel)
1179*a28cd43dSSascha Wildner DISPLAYLEVEL(3, "Benchmarking levels from %d to %d\n", cLevel, cLevelLast);
1180*a28cd43dSSascha Wildner if (filenames->tableSize > 0) {
1181*a28cd43dSSascha Wildner if(separateFiles) {
1182*a28cd43dSSascha Wildner unsigned i;
1183*a28cd43dSSascha Wildner for(i = 0; i < filenames->tableSize; i++) {
1184*a28cd43dSSascha Wildner int c;
1185*a28cd43dSSascha Wildner DISPLAYLEVEL(3, "Benchmarking %s \n", filenames->fileNames[i]);
1186*a28cd43dSSascha Wildner for(c = cLevel; c <= cLevelLast; c++) {
1187*a28cd43dSSascha Wildner BMK_benchFilesAdvanced(&filenames->fileNames[i], 1, dictFileName, c, &compressionParams, g_displayLevel, &benchParams);
1188*a28cd43dSSascha Wildner } }
1189*a28cd43dSSascha Wildner } else {
1190*a28cd43dSSascha Wildner for(; cLevel <= cLevelLast; cLevel++) {
1191*a28cd43dSSascha Wildner BMK_benchFilesAdvanced(filenames->fileNames, (unsigned)filenames->tableSize, dictFileName, cLevel, &compressionParams, g_displayLevel, &benchParams);
1192*a28cd43dSSascha Wildner } }
1193*a28cd43dSSascha Wildner } else {
1194*a28cd43dSSascha Wildner for(; cLevel <= cLevelLast; cLevel++) {
1195*a28cd43dSSascha Wildner BMK_syntheticTest(cLevel, compressibility, &compressionParams, g_displayLevel, &benchParams);
1196*a28cd43dSSascha Wildner } }
1197*a28cd43dSSascha Wildner
1198*a28cd43dSSascha Wildner #else
1199*a28cd43dSSascha Wildner (void)bench_nbSeconds; (void)blockSize; (void)setRealTimePrio; (void)separateFiles; (void)compressibility;
1200*a28cd43dSSascha Wildner #endif
1201*a28cd43dSSascha Wildner goto _end;
1202*a28cd43dSSascha Wildner }
1203*a28cd43dSSascha Wildner
1204*a28cd43dSSascha Wildner /* Check if dictionary builder is selected */
1205*a28cd43dSSascha Wildner if (operation==zom_train) {
1206*a28cd43dSSascha Wildner #ifndef ZSTD_NODICT
1207*a28cd43dSSascha Wildner ZDICT_params_t zParams;
1208*a28cd43dSSascha Wildner zParams.compressionLevel = dictCLevel;
1209*a28cd43dSSascha Wildner zParams.notificationLevel = (unsigned)g_displayLevel;
1210*a28cd43dSSascha Wildner zParams.dictID = dictID;
1211*a28cd43dSSascha Wildner if (dict == cover) {
1212*a28cd43dSSascha Wildner int const optimize = !coverParams.k || !coverParams.d;
1213*a28cd43dSSascha Wildner coverParams.nbThreads = (unsigned)nbWorkers;
1214*a28cd43dSSascha Wildner coverParams.zParams = zParams;
1215*a28cd43dSSascha Wildner operationResult = DiB_trainFromFiles(outFileName, maxDictSize, filenames->fileNames, (unsigned)filenames->tableSize, blockSize, NULL, &coverParams, NULL, optimize);
1216*a28cd43dSSascha Wildner } else if (dict == fastCover) {
1217*a28cd43dSSascha Wildner int const optimize = !fastCoverParams.k || !fastCoverParams.d;
1218*a28cd43dSSascha Wildner fastCoverParams.nbThreads = (unsigned)nbWorkers;
1219*a28cd43dSSascha Wildner fastCoverParams.zParams = zParams;
1220*a28cd43dSSascha Wildner operationResult = DiB_trainFromFiles(outFileName, maxDictSize, filenames->fileNames, (unsigned)filenames->tableSize, blockSize, NULL, NULL, &fastCoverParams, optimize);
1221*a28cd43dSSascha Wildner } else {
1222*a28cd43dSSascha Wildner ZDICT_legacy_params_t dictParams;
1223*a28cd43dSSascha Wildner memset(&dictParams, 0, sizeof(dictParams));
1224*a28cd43dSSascha Wildner dictParams.selectivityLevel = dictSelect;
1225*a28cd43dSSascha Wildner dictParams.zParams = zParams;
1226*a28cd43dSSascha Wildner operationResult = DiB_trainFromFiles(outFileName, maxDictSize, filenames->fileNames, (unsigned)filenames->tableSize, blockSize, &dictParams, NULL, NULL, 0);
1227*a28cd43dSSascha Wildner }
1228*a28cd43dSSascha Wildner #else
1229*a28cd43dSSascha Wildner (void)dictCLevel; (void)dictSelect; (void)dictID; (void)maxDictSize; /* not used when ZSTD_NODICT set */
1230*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "training mode not available \n");
1231*a28cd43dSSascha Wildner operationResult = 1;
1232*a28cd43dSSascha Wildner #endif
1233*a28cd43dSSascha Wildner goto _end;
1234*a28cd43dSSascha Wildner }
1235*a28cd43dSSascha Wildner
1236*a28cd43dSSascha Wildner #ifndef ZSTD_NODECOMPRESS
1237*a28cd43dSSascha Wildner if (operation==zom_test) { FIO_setTestMode(prefs, 1); outFileName=nulmark; FIO_setRemoveSrcFile(prefs, 0); } /* test mode */
1238*a28cd43dSSascha Wildner #endif
1239*a28cd43dSSascha Wildner
1240*a28cd43dSSascha Wildner /* No input filename ==> use stdin and stdout */
1241*a28cd43dSSascha Wildner if (filenames->tableSize == 0) UTIL_refFilename(filenames, stdinmark);
1242*a28cd43dSSascha Wildner if (!strcmp(filenames->fileNames[0], stdinmark) && !outFileName)
1243*a28cd43dSSascha Wildner outFileName = stdoutmark; /* when input is stdin, default output is stdout */
1244*a28cd43dSSascha Wildner
1245*a28cd43dSSascha Wildner /* Check if input/output defined as console; trigger an error in this case */
1246*a28cd43dSSascha Wildner if (!strcmp(filenames->fileNames[0], stdinmark) && IS_CONSOLE(stdin) ) {
1247*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "stdin is a console, aborting\n");
1248*a28cd43dSSascha Wildner CLEAN_RETURN(1);
1249*a28cd43dSSascha Wildner }
1250*a28cd43dSSascha Wildner if ( outFileName && !strcmp(outFileName, stdoutmark)
1251*a28cd43dSSascha Wildner && IS_CONSOLE(stdout)
1252*a28cd43dSSascha Wildner && !strcmp(filenames->fileNames[0], stdinmark)
1253*a28cd43dSSascha Wildner && !forceStdout
1254*a28cd43dSSascha Wildner && operation!=zom_decompress ) {
1255*a28cd43dSSascha Wildner DISPLAYLEVEL(1, "stdout is a console, aborting\n");
1256*a28cd43dSSascha Wildner CLEAN_RETURN(1);
1257*a28cd43dSSascha Wildner }
1258*a28cd43dSSascha Wildner
1259*a28cd43dSSascha Wildner #ifndef ZSTD_NOCOMPRESS
1260*a28cd43dSSascha Wildner /* check compression level limits */
1261*a28cd43dSSascha Wildner { int const maxCLevel = ultra ? ZSTD_maxCLevel() : ZSTDCLI_CLEVEL_MAX;
1262*a28cd43dSSascha Wildner if (cLevel > maxCLevel) {
1263*a28cd43dSSascha Wildner DISPLAYLEVEL(2, "Warning : compression level higher than max, reduced to %i \n", maxCLevel);
1264*a28cd43dSSascha Wildner cLevel = maxCLevel;
1265*a28cd43dSSascha Wildner } }
1266*a28cd43dSSascha Wildner #endif
1267*a28cd43dSSascha Wildner
1268*a28cd43dSSascha Wildner if (showDefaultCParams) {
1269*a28cd43dSSascha Wildner if (operation == zom_decompress) {
1270*a28cd43dSSascha Wildner DISPLAY("error : can't use --show-default-cparams in decomrpession mode \n");
1271*a28cd43dSSascha Wildner CLEAN_RETURN(1);
1272*a28cd43dSSascha Wildner }
1273*a28cd43dSSascha Wildner }
1274*a28cd43dSSascha Wildner
1275*a28cd43dSSascha Wildner if (dictFileName != NULL && patchFromDictFileName != NULL) {
1276*a28cd43dSSascha Wildner DISPLAY("error : can't use -D and --patch-from=# at the same time \n");
1277*a28cd43dSSascha Wildner CLEAN_RETURN(1);
1278*a28cd43dSSascha Wildner }
1279*a28cd43dSSascha Wildner
1280*a28cd43dSSascha Wildner if (patchFromDictFileName != NULL && filenames->tableSize > 1) {
1281*a28cd43dSSascha Wildner DISPLAY("error : can't use --patch-from=# on multiple files \n");
1282*a28cd43dSSascha Wildner CLEAN_RETURN(1);
1283*a28cd43dSSascha Wildner }
1284*a28cd43dSSascha Wildner
1285*a28cd43dSSascha Wildner /* No status message in pipe mode (stdin - stdout) */
1286*a28cd43dSSascha Wildner hasStdout = outFileName && !strcmp(outFileName,stdoutmark);
1287*a28cd43dSSascha Wildner
1288*a28cd43dSSascha Wildner if (hasStdout && (g_displayLevel==2)) g_displayLevel=1;
1289*a28cd43dSSascha Wildner
1290*a28cd43dSSascha Wildner /* IO Stream/File */
1291*a28cd43dSSascha Wildner FIO_setHasStdoutOutput(fCtx, hasStdout);
1292*a28cd43dSSascha Wildner FIO_setNbFilesTotal(fCtx, (int)filenames->tableSize);
1293*a28cd43dSSascha Wildner FIO_determineHasStdinInput(fCtx, filenames);
1294*a28cd43dSSascha Wildner FIO_setNotificationLevel(g_displayLevel);
1295*a28cd43dSSascha Wildner FIO_setPatchFromMode(prefs, patchFromDictFileName != NULL);
1296*a28cd43dSSascha Wildner if (memLimit == 0) {
1297*a28cd43dSSascha Wildner if (compressionParams.windowLog == 0) {
1298*a28cd43dSSascha Wildner memLimit = (U32)1 << g_defaultMaxWindowLog;
1299*a28cd43dSSascha Wildner } else {
1300*a28cd43dSSascha Wildner memLimit = (U32)1 << (compressionParams.windowLog & 31);
1301*a28cd43dSSascha Wildner } }
1302*a28cd43dSSascha Wildner if (patchFromDictFileName != NULL)
1303*a28cd43dSSascha Wildner dictFileName = patchFromDictFileName;
1304*a28cd43dSSascha Wildner FIO_setMemLimit(prefs, memLimit);
1305*a28cd43dSSascha Wildner if (operation==zom_compress) {
1306*a28cd43dSSascha Wildner #ifndef ZSTD_NOCOMPRESS
1307*a28cd43dSSascha Wildner FIO_setContentSize(prefs, contentSize);
1308*a28cd43dSSascha Wildner FIO_setNbWorkers(prefs, nbWorkers);
1309*a28cd43dSSascha Wildner FIO_setBlockSize(prefs, (int)blockSize);
1310*a28cd43dSSascha Wildner if (g_overlapLog!=OVERLAP_LOG_DEFAULT) FIO_setOverlapLog(prefs, (int)g_overlapLog);
1311*a28cd43dSSascha Wildner FIO_setLdmFlag(prefs, (unsigned)ldmFlag);
1312*a28cd43dSSascha Wildner FIO_setLdmHashLog(prefs, (int)g_ldmHashLog);
1313*a28cd43dSSascha Wildner FIO_setLdmMinMatch(prefs, (int)g_ldmMinMatch);
1314*a28cd43dSSascha Wildner if (g_ldmBucketSizeLog != LDM_PARAM_DEFAULT) FIO_setLdmBucketSizeLog(prefs, (int)g_ldmBucketSizeLog);
1315*a28cd43dSSascha Wildner if (g_ldmHashRateLog != LDM_PARAM_DEFAULT) FIO_setLdmHashRateLog(prefs, (int)g_ldmHashRateLog);
1316*a28cd43dSSascha Wildner FIO_setAdaptiveMode(prefs, (unsigned)adapt);
1317*a28cd43dSSascha Wildner FIO_setAdaptMin(prefs, adaptMin);
1318*a28cd43dSSascha Wildner FIO_setAdaptMax(prefs, adaptMax);
1319*a28cd43dSSascha Wildner FIO_setRsyncable(prefs, rsyncable);
1320*a28cd43dSSascha Wildner FIO_setStreamSrcSize(prefs, streamSrcSize);
1321*a28cd43dSSascha Wildner FIO_setTargetCBlockSize(prefs, targetCBlockSize);
1322*a28cd43dSSascha Wildner FIO_setSrcSizeHint(prefs, srcSizeHint);
1323*a28cd43dSSascha Wildner FIO_setLiteralCompressionMode(prefs, literalCompressionMode);
1324*a28cd43dSSascha Wildner if (adaptMin > cLevel) cLevel = adaptMin;
1325*a28cd43dSSascha Wildner if (adaptMax < cLevel) cLevel = adaptMax;
1326*a28cd43dSSascha Wildner
1327*a28cd43dSSascha Wildner /* Compare strategies constant with the ground truth */
1328*a28cd43dSSascha Wildner { ZSTD_bounds strategyBounds = ZSTD_cParam_getBounds(ZSTD_c_strategy);
1329*a28cd43dSSascha Wildner assert(ZSTD_NB_STRATEGIES == strategyBounds.upperBound);
1330*a28cd43dSSascha Wildner (void)strategyBounds; }
1331*a28cd43dSSascha Wildner
1332*a28cd43dSSascha Wildner if (showDefaultCParams) {
1333*a28cd43dSSascha Wildner size_t fileNb;
1334*a28cd43dSSascha Wildner for (fileNb = 0; fileNb < (size_t)filenames->tableSize; fileNb++) {
1335*a28cd43dSSascha Wildner unsigned long long fileSize = UTIL_getFileSize(filenames->fileNames[fileNb]);
1336*a28cd43dSSascha Wildner const size_t dictSize = dictFileName != NULL ? (size_t)UTIL_getFileSize(dictFileName) : 0;
1337*a28cd43dSSascha Wildner const ZSTD_compressionParameters cParams = ZSTD_getCParams(cLevel, fileSize, dictSize);
1338*a28cd43dSSascha Wildner if (fileSize != UTIL_FILESIZE_UNKNOWN) DISPLAY("%s (%u bytes)\n", filenames->fileNames[fileNb], (unsigned)fileSize);
1339*a28cd43dSSascha Wildner else DISPLAY("%s (src size unknown)\n", filenames->fileNames[fileNb]);
1340*a28cd43dSSascha Wildner DISPLAY(" - windowLog : %u\n", cParams.windowLog);
1341*a28cd43dSSascha Wildner DISPLAY(" - chainLog : %u\n", cParams.chainLog);
1342*a28cd43dSSascha Wildner DISPLAY(" - hashLog : %u\n", cParams.hashLog);
1343*a28cd43dSSascha Wildner DISPLAY(" - searchLog : %u\n", cParams.searchLog);
1344*a28cd43dSSascha Wildner DISPLAY(" - minMatch : %u\n", cParams.minMatch);
1345*a28cd43dSSascha Wildner DISPLAY(" - targetLength : %u\n", cParams.targetLength);
1346*a28cd43dSSascha Wildner assert(cParams.strategy < ZSTD_NB_STRATEGIES + 1);
1347*a28cd43dSSascha Wildner DISPLAY(" - strategy : %s (%u)\n", ZSTD_strategyMap[(int)cParams.strategy], (unsigned)cParams.strategy);
1348*a28cd43dSSascha Wildner }
1349*a28cd43dSSascha Wildner }
1350*a28cd43dSSascha Wildner
1351*a28cd43dSSascha Wildner if ((filenames->tableSize==1) && outFileName)
1352*a28cd43dSSascha Wildner operationResult = FIO_compressFilename(fCtx, prefs, outFileName, filenames->fileNames[0], dictFileName, cLevel, compressionParams);
1353*a28cd43dSSascha Wildner else
1354*a28cd43dSSascha Wildner operationResult = FIO_compressMultipleFilenames(fCtx, prefs, filenames->fileNames, outMirroredDirName, outDirName, outFileName, suffix, dictFileName, cLevel, compressionParams);
1355*a28cd43dSSascha Wildner #else
1356*a28cd43dSSascha Wildner (void)contentSize; (void)suffix; (void)adapt; (void)rsyncable; (void)ultra; (void)cLevel; (void)ldmFlag; (void)literalCompressionMode; (void)targetCBlockSize; (void)streamSrcSize; (void)srcSizeHint; (void)ZSTD_strategyMap; /* not used when ZSTD_NOCOMPRESS set */
1357*a28cd43dSSascha Wildner DISPLAY("Compression not supported \n");
1358*a28cd43dSSascha Wildner #endif
1359*a28cd43dSSascha Wildner } else { /* decompression or test */
1360*a28cd43dSSascha Wildner #ifndef ZSTD_NODECOMPRESS
1361*a28cd43dSSascha Wildner if (filenames->tableSize == 1 && outFileName) {
1362*a28cd43dSSascha Wildner operationResult = FIO_decompressFilename(fCtx, prefs, outFileName, filenames->fileNames[0], dictFileName);
1363*a28cd43dSSascha Wildner } else {
1364*a28cd43dSSascha Wildner operationResult = FIO_decompressMultipleFilenames(fCtx, prefs, filenames->fileNames, outMirroredDirName, outDirName, outFileName, dictFileName);
1365*a28cd43dSSascha Wildner }
1366*a28cd43dSSascha Wildner #else
1367*a28cd43dSSascha Wildner DISPLAY("Decompression not supported \n");
1368*a28cd43dSSascha Wildner #endif
1369*a28cd43dSSascha Wildner }
1370*a28cd43dSSascha Wildner
1371*a28cd43dSSascha Wildner _end:
1372*a28cd43dSSascha Wildner FIO_freePreferences(prefs);
1373*a28cd43dSSascha Wildner FIO_freeContext(fCtx);
1374*a28cd43dSSascha Wildner if (main_pause) waitEnter();
1375*a28cd43dSSascha Wildner UTIL_freeFileNamesTable(filenames);
1376*a28cd43dSSascha Wildner UTIL_freeFileNamesTable(file_of_names);
1377*a28cd43dSSascha Wildner
1378*a28cd43dSSascha Wildner return operationResult;
1379*a28cd43dSSascha Wildner }
1380