/*
 * Copyright (c) 2016-2020, Yann Collet, Facebook, Inc.
 * All rights reserved.
 *
 * This source code is licensed under both the BSD-style license (found in the
 * LICENSE file in the root directory of this source tree) and the GPLv2 (found
 * in the COPYING file in the root directory of this source tree).
 * You may select, at your option, one of the above-listed licenses.
 */
10a28cd43dSSascha Wildner
11a28cd43dSSascha Wildner
/*-************************************
*  Tuning parameters
**************************************/
/* Every value below is guarded by #ifndef, so it can be overridden
 * from the build command line (e.g. -DZSTDCLI_CLEVEL_DEFAULT=5). */

/* Compression level reported as the default in the help text. */
#ifndef ZSTDCLI_CLEVEL_DEFAULT
#  define ZSTDCLI_CLEVEL_DEFAULT 3
#endif

/* Highest compression level reported as reachable without using --ultra. */
#ifndef ZSTDCLI_CLEVEL_MAX
#  define ZSTDCLI_CLEVEL_MAX 19   /* without using --ultra */
#endif

/* Default number of threads. */
#ifndef ZSTDCLI_NBTHREADS_DEFAULT
#  define ZSTDCLI_NBTHREADS_DEFAULT 1
#endif
26a28cd43dSSascha Wildner
27a28cd43dSSascha Wildner /*-************************************
28a28cd43dSSascha Wildner * Dependencies
29a28cd43dSSascha Wildner **************************************/
30a28cd43dSSascha Wildner #include "platform.h" /* IS_CONSOLE, PLATFORM_POSIX_VERSION */
31a28cd43dSSascha Wildner #include "util.h" /* UTIL_HAS_CREATEFILELIST, UTIL_createFileList */
32a28cd43dSSascha Wildner #include <stdlib.h> /* getenv */
33a28cd43dSSascha Wildner #include <string.h> /* strcmp, strlen */
34a28cd43dSSascha Wildner #include <stdio.h> /* fprintf(), stdin, stdout, stderr */
35a28cd43dSSascha Wildner #include <errno.h> /* errno */
36a28cd43dSSascha Wildner #include <assert.h> /* assert */
37a28cd43dSSascha Wildner
38a28cd43dSSascha Wildner #include "fileio.h" /* stdinmark, stdoutmark, ZSTD_EXTENSION */
39a28cd43dSSascha Wildner #ifndef ZSTD_NOBENCH
40a28cd43dSSascha Wildner # include "benchzstd.h" /* BMK_benchFiles */
41a28cd43dSSascha Wildner #endif
42a28cd43dSSascha Wildner #ifndef ZSTD_NODICT
43a28cd43dSSascha Wildner # include "dibio.h" /* ZDICT_cover_params_t, DiB_trainFromFiles() */
44a28cd43dSSascha Wildner #endif
45a28cd43dSSascha Wildner #include "../lib/zstd.h" /* ZSTD_VERSION_STRING, ZSTD_minCLevel, ZSTD_maxCLevel */
46a28cd43dSSascha Wildner
47a28cd43dSSascha Wildner
/*-************************************
*  Constants
**************************************/
#define COMPRESSOR_NAME "zstd command line interface"
#ifndef ZSTD_VERSION
#  define ZSTD_VERSION "v" ZSTD_VERSION_STRING
#endif
#define AUTHOR "Yann Collet"
/* Expands to a printf-style format string followed by its arguments;
 * meant to be used as the whole argument list of a DISPLAY-like macro. */
#define WELCOME_MESSAGE "*** %s %i-bits %s, by %s ***\n", COMPRESSOR_NAME, (int)(sizeof(size_t)*8), ZSTD_VERSION, AUTHOR

/* Program names (presumably matched against the executable name,
 * see exeNameMatch() - confirm against the callers). */
#define ZSTD_ZSTDMT "zstdmt"
#define ZSTD_UNZSTD "unzstd"
#define ZSTD_CAT "zstdcat"
#define ZSTD_ZCAT "zcat"
#define ZSTD_GZ "gzip"
#define ZSTD_GUNZIP "gunzip"
#define ZSTD_GZCAT "gzcat"
#define ZSTD_LZMA "lzma"
#define ZSTD_UNLZMA "unlzma"
#define ZSTD_XZ "xz"
#define ZSTD_UNXZ "unxz"
#define ZSTD_LZ4 "lz4"
#define ZSTD_UNLZ4 "unlz4"

/* Postfix size multipliers : written after a number, e.g. `110 KB`
 * expands to `110 *(1 <<10)`. */
#define KB *(1 <<10)
#define MB *(1 <<20)
#define GB *(1U<<30)

#define DISPLAY_LEVEL_DEFAULT 2

/* Default values, several of which are echoed in the help text. */
static const char*    g_defaultDictName = "dictionary";
static const unsigned g_defaultMaxDictSize = 110 KB;
static const int      g_defaultDictCLevel = 3;
static const unsigned g_defaultSelectivityLevel = 9;
static const unsigned g_defaultMaxWindowLog = 27;
83a28cd43dSSascha Wildner #define OVERLAP_LOG_DEFAULT 9999
84a28cd43dSSascha Wildner #define LDM_PARAM_DEFAULT 9999 /* Default for parameters where 0 is valid */
85a28cd43dSSascha Wildner static U32 g_overlapLog = OVERLAP_LOG_DEFAULT;
86a28cd43dSSascha Wildner static U32 g_ldmHashLog = 0;
87a28cd43dSSascha Wildner static U32 g_ldmMinMatch = 0;
88a28cd43dSSascha Wildner static U32 g_ldmHashRateLog = LDM_PARAM_DEFAULT;
89a28cd43dSSascha Wildner static U32 g_ldmBucketSizeLog = LDM_PARAM_DEFAULT;
90a28cd43dSSascha Wildner
91a28cd43dSSascha Wildner
92a28cd43dSSascha Wildner #define DEFAULT_ACCEL 1
93a28cd43dSSascha Wildner
94a28cd43dSSascha Wildner typedef enum { cover, fastCover, legacy } dictType;
95a28cd43dSSascha Wildner
96a28cd43dSSascha Wildner /*-************************************
97a28cd43dSSascha Wildner * Display Macros
98a28cd43dSSascha Wildner **************************************/
99a28cd43dSSascha Wildner #define DISPLAY_F(f, ...) fprintf((f), __VA_ARGS__)
100a28cd43dSSascha Wildner #define DISPLAYOUT(...) DISPLAY_F(stdout, __VA_ARGS__)
101a28cd43dSSascha Wildner #define DISPLAY(...) DISPLAY_F(stderr, __VA_ARGS__)
102a28cd43dSSascha Wildner #define DISPLAYLEVEL(l, ...) { if (g_displayLevel>=l) { DISPLAY(__VA_ARGS__); } }
103a28cd43dSSascha Wildner static int g_displayLevel = DISPLAY_LEVEL_DEFAULT; /* 0 : no display, 1: errors, 2 : + result + interaction + warnings, 3 : + progression, 4 : + information */
104a28cd43dSSascha Wildner
105a28cd43dSSascha Wildner
106a28cd43dSSascha Wildner /*-************************************
107a28cd43dSSascha Wildner * Command Line
108a28cd43dSSascha Wildner **************************************/
109a28cd43dSSascha Wildner /* print help either in `stderr` or `stdout` depending on originating request
110a28cd43dSSascha Wildner * error (badusage) => stderr
111a28cd43dSSascha Wildner * help (usage_advanced) => stdout
112a28cd43dSSascha Wildner */
usage(FILE * f,const char * programName)113a28cd43dSSascha Wildner static void usage(FILE* f, const char* programName)
114a28cd43dSSascha Wildner {
115a28cd43dSSascha Wildner DISPLAY_F(f, "Usage : \n");
116a28cd43dSSascha Wildner DISPLAY_F(f, " %s [args] [FILE(s)] [-o file] \n", programName);
117a28cd43dSSascha Wildner DISPLAY_F(f, "\n");
118a28cd43dSSascha Wildner DISPLAY_F(f, "FILE : a filename \n");
119a28cd43dSSascha Wildner DISPLAY_F(f, " with no FILE, or when FILE is - , read standard input\n");
120a28cd43dSSascha Wildner DISPLAY_F(f, "Arguments : \n");
121a28cd43dSSascha Wildner #ifndef ZSTD_NOCOMPRESS
122a28cd43dSSascha Wildner DISPLAY_F(f, " -# : # compression level (1-%d, default: %d) \n", ZSTDCLI_CLEVEL_MAX, ZSTDCLI_CLEVEL_DEFAULT);
123a28cd43dSSascha Wildner #endif
124a28cd43dSSascha Wildner #ifndef ZSTD_NODECOMPRESS
125a28cd43dSSascha Wildner DISPLAY_F(f, " -d : decompression \n");
126a28cd43dSSascha Wildner #endif
127a28cd43dSSascha Wildner DISPLAY_F(f, " -D DICT: use DICT as Dictionary for compression or decompression \n");
128a28cd43dSSascha Wildner DISPLAY_F(f, " -o file: result stored into `file` (only 1 output file) \n");
129a28cd43dSSascha Wildner DISPLAY_F(f, " -f : overwrite output without prompting, also (de)compress links \n");
130a28cd43dSSascha Wildner DISPLAY_F(f, "--rm : remove source file(s) after successful de/compression \n");
131a28cd43dSSascha Wildner DISPLAY_F(f, " -k : preserve source file(s) (default) \n");
132a28cd43dSSascha Wildner DISPLAY_F(f, " -h/-H : display help/long help and exit \n");
133a28cd43dSSascha Wildner }
134a28cd43dSSascha Wildner
usage_advanced(const char * programName)135a28cd43dSSascha Wildner static void usage_advanced(const char* programName)
136a28cd43dSSascha Wildner {
137a28cd43dSSascha Wildner DISPLAYOUT(WELCOME_MESSAGE);
138a28cd43dSSascha Wildner usage(stdout, programName);
139a28cd43dSSascha Wildner DISPLAYOUT( "\n");
140a28cd43dSSascha Wildner DISPLAYOUT( "Advanced arguments : \n");
141a28cd43dSSascha Wildner DISPLAYOUT( " -V : display Version number and exit \n");
142a28cd43dSSascha Wildner
143a28cd43dSSascha Wildner DISPLAYOUT( " -c : force write to standard output, even if it is the console \n");
144a28cd43dSSascha Wildner
145a28cd43dSSascha Wildner DISPLAYOUT( " -v : verbose mode; specify multiple times to increase verbosity \n");
146a28cd43dSSascha Wildner DISPLAYOUT( " -q : suppress warnings; specify twice to suppress errors too \n");
147a28cd43dSSascha Wildner DISPLAYOUT( "--no-progress : do not display the progress counter \n");
148a28cd43dSSascha Wildner
149a28cd43dSSascha Wildner #ifdef UTIL_HAS_CREATEFILELIST
150a28cd43dSSascha Wildner DISPLAYOUT( " -r : operate recursively on directories \n");
151a28cd43dSSascha Wildner DISPLAYOUT( "--filelist FILE : read list of files to operate upon from FILE \n");
152a28cd43dSSascha Wildner DISPLAYOUT( "--output-dir-flat DIR : processed files are stored into DIR \n");
153a28cd43dSSascha Wildner #endif
154a28cd43dSSascha Wildner
155a28cd43dSSascha Wildner #ifdef UTIL_HAS_MIRRORFILELIST
156a28cd43dSSascha Wildner DISPLAYOUT( "--output-dir-mirror DIR : processed files are stored into DIR respecting original directory structure \n");
157a28cd43dSSascha Wildner #endif
158a28cd43dSSascha Wildner
159a28cd43dSSascha Wildner
160a28cd43dSSascha Wildner #ifndef ZSTD_NOCOMPRESS
161a28cd43dSSascha Wildner DISPLAYOUT( "--[no-]check : during compression, add XXH64 integrity checksum to frame (default: enabled)");
162a28cd43dSSascha Wildner #ifndef ZSTD_NODECOMPRESS
163a28cd43dSSascha Wildner DISPLAYOUT( ". If specified with -d, decompressor will ignore/validate checksums in compressed frame (default: validate).");
164a28cd43dSSascha Wildner #endif
165a28cd43dSSascha Wildner #else
166a28cd43dSSascha Wildner #ifdef ZSTD_NOCOMPRESS
167a28cd43dSSascha Wildner DISPLAYOUT( "--[no-]check : during decompression, ignore/validate checksums in compressed frame (default: validate).");
168a28cd43dSSascha Wildner #endif
169a28cd43dSSascha Wildner #endif /* ZSTD_NOCOMPRESS */
170a28cd43dSSascha Wildner DISPLAYOUT( "\n");
171a28cd43dSSascha Wildner
172a28cd43dSSascha Wildner DISPLAYOUT( "-- : All arguments after \"--\" are treated as files \n");
173a28cd43dSSascha Wildner
174a28cd43dSSascha Wildner #ifndef ZSTD_NOCOMPRESS
175a28cd43dSSascha Wildner DISPLAYOUT( "\n");
176a28cd43dSSascha Wildner DISPLAYOUT( "Advanced compression arguments : \n");
177a28cd43dSSascha Wildner DISPLAYOUT( "--ultra : enable levels beyond %i, up to %i (requires more memory) \n", ZSTDCLI_CLEVEL_MAX, ZSTD_maxCLevel());
178a28cd43dSSascha Wildner DISPLAYOUT( "--long[=#]: enable long distance matching with given window log (default: %u) \n", g_defaultMaxWindowLog);
179a28cd43dSSascha Wildner DISPLAYOUT( "--fast[=#]: switch to very fast compression levels (default: %u) \n", 1);
180a28cd43dSSascha Wildner DISPLAYOUT( "--adapt : dynamically adapt compression level to I/O conditions \n");
181a28cd43dSSascha Wildner # ifdef ZSTD_MULTITHREAD
182a28cd43dSSascha Wildner DISPLAYOUT( " -T# : spawns # compression threads (default: 1, 0==# cores) \n");
183a28cd43dSSascha Wildner DISPLAYOUT( " -B# : select size of each job (default: 0==automatic) \n");
184a28cd43dSSascha Wildner DISPLAYOUT( "--single-thread : use a single thread for both I/O and compression (result slightly different than -T1) \n");
185a28cd43dSSascha Wildner DISPLAYOUT( "--rsyncable : compress using a rsync-friendly method (-B sets block size) \n");
186a28cd43dSSascha Wildner # endif
187a28cd43dSSascha Wildner DISPLAYOUT( "--exclude-compressed: only compress files that are not already compressed \n");
188a28cd43dSSascha Wildner DISPLAYOUT( "--stream-size=# : specify size of streaming input from `stdin` \n");
189a28cd43dSSascha Wildner DISPLAYOUT( "--size-hint=# optimize compression parameters for streaming input of approximately this size \n");
190a28cd43dSSascha Wildner DISPLAYOUT( "--target-compressed-block-size=# : generate compressed block of approximately targeted size \n");
191a28cd43dSSascha Wildner DISPLAYOUT( "--no-dictID : don't write dictID into header (dictionary compression only) \n");
192a28cd43dSSascha Wildner DISPLAYOUT( "--[no-]compress-literals : force (un)compressed literals \n");
193a28cd43dSSascha Wildner
194a28cd43dSSascha Wildner DISPLAYOUT( "--format=zstd : compress files to the .zst format (default) \n");
195a28cd43dSSascha Wildner #ifdef ZSTD_GZCOMPRESS
196a28cd43dSSascha Wildner DISPLAYOUT( "--format=gzip : compress files to the .gz format \n");
197a28cd43dSSascha Wildner #endif
198a28cd43dSSascha Wildner #ifdef ZSTD_LZMACOMPRESS
199a28cd43dSSascha Wildner DISPLAYOUT( "--format=xz : compress files to the .xz format \n");
200a28cd43dSSascha Wildner DISPLAYOUT( "--format=lzma : compress files to the .lzma format \n");
201a28cd43dSSascha Wildner #endif
202a28cd43dSSascha Wildner #ifdef ZSTD_LZ4COMPRESS
203a28cd43dSSascha Wildner DISPLAYOUT( "--format=lz4 : compress files to the .lz4 format \n");
204a28cd43dSSascha Wildner #endif
205a28cd43dSSascha Wildner #endif /* !ZSTD_NOCOMPRESS */
206a28cd43dSSascha Wildner
207a28cd43dSSascha Wildner #ifndef ZSTD_NODECOMPRESS
208a28cd43dSSascha Wildner DISPLAYOUT( "\n");
209a28cd43dSSascha Wildner DISPLAYOUT( "Advanced decompression arguments : \n");
210a28cd43dSSascha Wildner DISPLAYOUT( " -l : print information about zstd compressed files \n");
211a28cd43dSSascha Wildner DISPLAYOUT( "--test : test compressed file integrity \n");
212a28cd43dSSascha Wildner DISPLAYOUT( " -M# : Set a memory usage limit for decompression \n");
213a28cd43dSSascha Wildner # if ZSTD_SPARSE_DEFAULT
214a28cd43dSSascha Wildner DISPLAYOUT( "--[no-]sparse : sparse mode (default: enabled on file, disabled on stdout) \n");
215a28cd43dSSascha Wildner # else
216a28cd43dSSascha Wildner DISPLAYOUT( "--[no-]sparse : sparse mode (default: disabled) \n");
217a28cd43dSSascha Wildner # endif
218a28cd43dSSascha Wildner #endif /* ZSTD_NODECOMPRESS */
219a28cd43dSSascha Wildner
220a28cd43dSSascha Wildner #ifndef ZSTD_NODICT
221a28cd43dSSascha Wildner DISPLAYOUT( "\n");
222a28cd43dSSascha Wildner DISPLAYOUT( "Dictionary builder : \n");
223a28cd43dSSascha Wildner DISPLAYOUT( "--train ## : create a dictionary from a training set of files \n");
224a28cd43dSSascha Wildner DISPLAYOUT( "--train-cover[=k=#,d=#,steps=#,split=#,shrink[=#]] : use the cover algorithm with optional args \n");
225a28cd43dSSascha Wildner DISPLAYOUT( "--train-fastcover[=k=#,d=#,f=#,steps=#,split=#,accel=#,shrink[=#]] : use the fast cover algorithm with optional args \n");
226a28cd43dSSascha Wildner DISPLAYOUT( "--train-legacy[=s=#] : use the legacy algorithm with selectivity (default: %u) \n", g_defaultSelectivityLevel);
227a28cd43dSSascha Wildner DISPLAYOUT( " -o DICT : DICT is dictionary name (default: %s) \n", g_defaultDictName);
228a28cd43dSSascha Wildner DISPLAYOUT( "--maxdict=# : limit dictionary to specified size (default: %u) \n", g_defaultMaxDictSize);
229a28cd43dSSascha Wildner DISPLAYOUT( "--dictID=# : force dictionary ID to specified value (default: random) \n");
230a28cd43dSSascha Wildner #endif
231a28cd43dSSascha Wildner
232a28cd43dSSascha Wildner #ifndef ZSTD_NOBENCH
233a28cd43dSSascha Wildner DISPLAYOUT( "\n");
234a28cd43dSSascha Wildner DISPLAYOUT( "Benchmark arguments : \n");
235a28cd43dSSascha Wildner DISPLAYOUT( " -b# : benchmark file(s), using # compression level (default: %d) \n", ZSTDCLI_CLEVEL_DEFAULT);
236a28cd43dSSascha Wildner DISPLAYOUT( " -e# : test all compression levels successively from -b# to -e# (default: 1) \n");
237a28cd43dSSascha Wildner DISPLAYOUT( " -i# : minimum evaluation time in seconds (default: 3s) \n");
238a28cd43dSSascha Wildner DISPLAYOUT( " -B# : cut file into independent blocks of size # (default: no block) \n");
239a28cd43dSSascha Wildner DISPLAYOUT( " -S : output one benchmark result per input file (default: consolidated result) \n");
240a28cd43dSSascha Wildner DISPLAYOUT( "--priority=rt : set process priority to real-time \n");
241a28cd43dSSascha Wildner #endif
242a28cd43dSSascha Wildner
243a28cd43dSSascha Wildner }
244a28cd43dSSascha Wildner
badusage(const char * programName)245a28cd43dSSascha Wildner static void badusage(const char* programName)
246a28cd43dSSascha Wildner {
247a28cd43dSSascha Wildner DISPLAYLEVEL(1, "Incorrect parameters \n");
248a28cd43dSSascha Wildner if (g_displayLevel >= 2) usage(stderr, programName);
249a28cd43dSSascha Wildner }
250a28cd43dSSascha Wildner
/*! waitEnter() :
 *  Prompt on stderr, then consume one character from stdin.
 *  The character itself is irrelevant and is discarded.
 */
static void waitEnter(void)
{
    int unused;
    DISPLAY("Press enter to continue... \n");
    unused = getchar();
    (void)unused;   /* value intentionally ignored */
}
258a28cd43dSSascha Wildner
/*! lastNameFromPath() :
 *  Strip the directory part of `path`.
 *  Both '/' and '\\' are accepted as separators : the text after the last '/'
 *  is taken first, then the text after the last '\\' within that remainder.
 * @return : pointer inside `path` to the start of the last component
 *           (`path` itself when it holds no separator).
 */
static const char* lastNameFromPath(const char* path)
{
    const char* name = path;
    const char* sep = strrchr(name, '/');
    if (sep != NULL) name = sep + 1;
    sep = strrchr(name, '\\');   /* windows */
    if (sep != NULL) name = sep + 1;
    return name;
}
266a28cd43dSSascha Wildner
/*! exeNameMatch() :
 *  Compare an executable name with an expected program name, ignoring any
 *  extension : `exeName` must start with `test` and the character following
 *  that prefix must be either the end of string or a '.'.
 * @return : a non-zero value if exeName matches test, excluding the extension
 */
static int exeNameMatch(const char* exeName, const char* test)
{
    size_t const testLen = strlen(test);
    if (strncmp(exeName, test, testLen) != 0) return 0;
    /* prefix matched, so exeName holds at least testLen characters
     * and reading exeName[testLen] is in bounds */
    return (exeName[testLen] == '\0') || (exeName[testLen] == '.');
}
275a28cd43dSSascha Wildner
/*! errorOut() :
 *  Print `msg` on stderr, then terminate the program with exit status 1.
 *  Does not return.
 */
static void errorOut(const char* msg)
{
    DISPLAY("%s \n", msg);
    exit(1);
}
280a28cd43dSSascha Wildner
/*! readU32FromCharChecked() :
 *  Parse a decimal unsigned integer at *stringPtr.
 *  allows and interprets K, KB, KiB, M, MB and MiB suffix.
 *  Will also modify `*stringPtr`, advancing it to position where it stopped reading.
 *  An input without any leading digit is accepted and yields 0.
 * @return 0 if success, and store the result in *value.
 * @return 1 if an overflow error occurs; in that case *value is left untouched
 *           and *stringPtr points at the digit or suffix that triggered the overflow. */
static int readU32FromCharChecked(const char** stringPtr, unsigned* value)
{
    unsigned const maxBeforeMul10 = ((unsigned)(-1)) / 10;
    unsigned const maxBeforeShift = ((unsigned)(-1)) >> 10;
    unsigned result = 0;

    while ((**stringPtr >= '0') && (**stringPtr <= '9')) {
        unsigned const previous = result;
        if (result > maxBeforeMul10) return 1;   /* overflow error */
        result *= 10;
        result += (unsigned)(**stringPtr - '0');
        if (result < previous) return 1;   /* the addition wrapped : overflow error */
        (*stringPtr)++;
    }

    if ((**stringPtr == 'K') || (**stringPtr == 'M')) {
        if (result > maxBeforeShift) return 1;   /* overflow error */
        result <<= 10;
        if (**stringPtr == 'M') {
            if (result > maxBeforeShift) return 1;   /* overflow error */
            result <<= 10;
        }
        (*stringPtr)++;   /* skip `K` or `M` */
        if (**stringPtr == 'i') (*stringPtr)++;
        if (**stringPtr == 'B') (*stringPtr)++;
    }

    *value = result;
    return 0;
}
313a28cd43dSSascha Wildner
/*! readU32FromChar() :
 *  Unchecked-looking wrapper around readU32FromCharChecked().
 * @return : unsigned integer value read from input in `char` format.
 *  allows and interprets K, KB, KiB, M, MB and MiB suffix.
 *  Will also modify `*stringPtr`, advancing it to position where it stopped reading.
 *  Note : function will exit() program if digit sequence overflows */
static unsigned readU32FromChar(const char** stringPtr)
{
    static const char errorMsg[] = "error: numeric value overflows 32-bit unsigned int";
    unsigned result;
    if (readU32FromCharChecked(stringPtr, &result)) {
        errorOut(errorMsg);   /* does not return */
    }
    return result;
}
325a28cd43dSSascha Wildner
/*! readSizeTFromCharChecked() :
 *  Parse a decimal size_t value at *stringPtr.
 *  allows and interprets K, KB, KiB, M, MB and MiB suffix.
 *  Will also modify `*stringPtr`, advancing it to position where it stopped reading.
 *  An input without any leading digit is accepted and yields 0.
 * @return 0 if success, and store the result in *value.
 * @return 1 if an overflow error occurs; in that case *value is left untouched
 *           and *stringPtr points at the digit or suffix that triggered the overflow. */
static int readSizeTFromCharChecked(const char** stringPtr, size_t* value)
{
    size_t const maxBeforeMul10 = ((size_t)(-1)) / 10;
    size_t const maxBeforeShift = ((size_t)(-1)) >> 10;
    size_t result = 0;

    while ((**stringPtr >= '0') && (**stringPtr <= '9')) {
        size_t const previous = result;
        if (result > maxBeforeMul10) return 1;   /* overflow error */
        result *= 10;
        result += (size_t)(**stringPtr - '0');
        if (result < previous) return 1;   /* the addition wrapped : overflow error */
        (*stringPtr)++;
    }

    if ((**stringPtr == 'K') || (**stringPtr == 'M')) {
        if (result > maxBeforeShift) return 1;   /* overflow error */
        result <<= 10;
        if (**stringPtr == 'M') {
            if (result > maxBeforeShift) return 1;   /* overflow error */
            result <<= 10;
        }
        (*stringPtr)++;   /* skip `K` or `M` */
        if (**stringPtr == 'i') (*stringPtr)++;
        if (**stringPtr == 'B') (*stringPtr)++;
    }

    *value = result;
    return 0;
}
358a28cd43dSSascha Wildner
/*! readSizeTFromChar() :
 *  Wrapper around readSizeTFromCharChecked() that aborts on overflow.
 * @return : size_t value read from input in `char` format.
 *  allows and interprets K, KB, KiB, M, MB and MiB suffix.
 *  Will also modify `*stringPtr`, advancing it to position where it stopped reading.
 *  Note : function will exit() program if digit sequence overflows */
static size_t readSizeTFromChar(const char** stringPtr)
{
    static const char errorMsg[] = "error: numeric value overflows size_t";
    size_t result;
    if (readSizeTFromCharChecked(stringPtr, &result)) {
        errorOut(errorMsg);   /* does not return */
    }
    return result;
}
370a28cd43dSSascha Wildner
/** longCommandWArg() :
 *  check if *stringPtr starts with longCommand (prefix comparison).
 *  If yes, @return 1 and advances *stringPtr to the position which immediately follows longCommand.
 * @return 0 and doesn't modify *stringPtr otherwise.
 */
static int longCommandWArg(const char** stringPtr, const char* longCommand)
{
    size_t const comSize = strlen(longCommand);
    if (strncmp(*stringPtr, longCommand, comSize) != 0) {
        return 0;
    }
    *stringPtr += comSize;
    return 1;
}
383a28cd43dSSascha Wildner
384a28cd43dSSascha Wildner
385a28cd43dSSascha Wildner #ifndef ZSTD_NODICT
386a28cd43dSSascha Wildner
387a28cd43dSSascha Wildner static const unsigned kDefaultRegression = 1;
388a28cd43dSSascha Wildner /**
389a28cd43dSSascha Wildner * parseCoverParameters() :
390a28cd43dSSascha Wildner * reads cover parameters from *stringPtr (e.g. "--train-cover=k=48,d=8,steps=32") into *params
391a28cd43dSSascha Wildner * @return 1 means that cover parameters were correct
392a28cd43dSSascha Wildner * @return 0 in case of malformed parameters
393a28cd43dSSascha Wildner */
parseCoverParameters(const char * stringPtr,ZDICT_cover_params_t * params)394a28cd43dSSascha Wildner static unsigned parseCoverParameters(const char* stringPtr, ZDICT_cover_params_t* params)
395a28cd43dSSascha Wildner {
396a28cd43dSSascha Wildner memset(params, 0, sizeof(*params));
397a28cd43dSSascha Wildner for (; ;) {
398a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "k=")) { params->k = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
399a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "d=")) { params->d = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
400a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "steps=")) { params->steps = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
401a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "split=")) {
402a28cd43dSSascha Wildner unsigned splitPercentage = readU32FromChar(&stringPtr);
403a28cd43dSSascha Wildner params->splitPoint = (double)splitPercentage / 100.0;
404a28cd43dSSascha Wildner if (stringPtr[0]==',') { stringPtr++; continue; } else break;
405a28cd43dSSascha Wildner }
406a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "shrink")) {
407a28cd43dSSascha Wildner params->shrinkDictMaxRegression = kDefaultRegression;
408a28cd43dSSascha Wildner params->shrinkDict = 1;
409a28cd43dSSascha Wildner if (stringPtr[0]=='=') {
410a28cd43dSSascha Wildner stringPtr++;
411a28cd43dSSascha Wildner params->shrinkDictMaxRegression = readU32FromChar(&stringPtr);
412a28cd43dSSascha Wildner }
413a28cd43dSSascha Wildner if (stringPtr[0]==',') {
414a28cd43dSSascha Wildner stringPtr++;
415a28cd43dSSascha Wildner continue;
416a28cd43dSSascha Wildner }
417a28cd43dSSascha Wildner else break;
418a28cd43dSSascha Wildner }
419a28cd43dSSascha Wildner return 0;
420a28cd43dSSascha Wildner }
421a28cd43dSSascha Wildner if (stringPtr[0] != 0) return 0;
422a28cd43dSSascha Wildner DISPLAYLEVEL(4, "cover: k=%u\nd=%u\nsteps=%u\nsplit=%u\nshrink%u\n", params->k, params->d, params->steps, (unsigned)(params->splitPoint * 100), params->shrinkDictMaxRegression);
423a28cd43dSSascha Wildner return 1;
424a28cd43dSSascha Wildner }
425a28cd43dSSascha Wildner
426a28cd43dSSascha Wildner /**
427a28cd43dSSascha Wildner * parseFastCoverParameters() :
428a28cd43dSSascha Wildner * reads fastcover parameters from *stringPtr (e.g. "--train-fastcover=k=48,d=8,f=20,steps=32,accel=2") into *params
429a28cd43dSSascha Wildner * @return 1 means that fastcover parameters were correct
430a28cd43dSSascha Wildner * @return 0 in case of malformed parameters
431a28cd43dSSascha Wildner */
parseFastCoverParameters(const char * stringPtr,ZDICT_fastCover_params_t * params)432a28cd43dSSascha Wildner static unsigned parseFastCoverParameters(const char* stringPtr, ZDICT_fastCover_params_t* params)
433a28cd43dSSascha Wildner {
434a28cd43dSSascha Wildner memset(params, 0, sizeof(*params));
435a28cd43dSSascha Wildner for (; ;) {
436a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "k=")) { params->k = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
437a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "d=")) { params->d = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
438a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "f=")) { params->f = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
439a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "steps=")) { params->steps = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
440a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "accel=")) { params->accel = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
441a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "split=")) {
442a28cd43dSSascha Wildner unsigned splitPercentage = readU32FromChar(&stringPtr);
443a28cd43dSSascha Wildner params->splitPoint = (double)splitPercentage / 100.0;
444a28cd43dSSascha Wildner if (stringPtr[0]==',') { stringPtr++; continue; } else break;
445a28cd43dSSascha Wildner }
446a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "shrink")) {
447a28cd43dSSascha Wildner params->shrinkDictMaxRegression = kDefaultRegression;
448a28cd43dSSascha Wildner params->shrinkDict = 1;
449a28cd43dSSascha Wildner if (stringPtr[0]=='=') {
450a28cd43dSSascha Wildner stringPtr++;
451a28cd43dSSascha Wildner params->shrinkDictMaxRegression = readU32FromChar(&stringPtr);
452a28cd43dSSascha Wildner }
453a28cd43dSSascha Wildner if (stringPtr[0]==',') {
454a28cd43dSSascha Wildner stringPtr++;
455a28cd43dSSascha Wildner continue;
456a28cd43dSSascha Wildner }
457a28cd43dSSascha Wildner else break;
458a28cd43dSSascha Wildner }
459a28cd43dSSascha Wildner return 0;
460a28cd43dSSascha Wildner }
461a28cd43dSSascha Wildner if (stringPtr[0] != 0) return 0;
462a28cd43dSSascha Wildner DISPLAYLEVEL(4, "cover: k=%u\nd=%u\nf=%u\nsteps=%u\nsplit=%u\naccel=%u\nshrink=%u\n", params->k, params->d, params->f, params->steps, (unsigned)(params->splitPoint * 100), params->accel, params->shrinkDictMaxRegression);
463a28cd43dSSascha Wildner return 1;
464a28cd43dSSascha Wildner }
465a28cd43dSSascha Wildner
/**
 * parseLegacyParameters() :
 * reads legacy dictionary builder parameters from *stringPtr (e.g. "--train-legacy=selectivity=8") into *selectivity
 * `stringPtr` must point at the parameter itself; both "s=#" and "selectivity=#" are accepted.
 * The value goes through readU32FromChar(), which exits the program on overflow.
 * *selectivity is written as soon as the key is recognized, even if trailing
 * characters then make the function return 0.
 * @return 1 means that legacy dictionary builder parameters were correct
 * @return 0 in case of malformed parameters
 */
static unsigned parseLegacyParameters(const char* stringPtr, unsigned* selectivity)
{
    int const keyFound = longCommandWArg(&stringPtr, "s=")
                      || longCommandWArg(&stringPtr, "selectivity=");
    if (!keyFound) return 0;
    *selectivity = readU32FromChar(&stringPtr);
    if (stringPtr[0] != 0) return 0;   /* trailing characters */
    DISPLAYLEVEL(4, "legacy: selectivity=%u\n", *selectivity);
    return 1;
}
480a28cd43dSSascha Wildner
defaultCoverParams(void)481a28cd43dSSascha Wildner static ZDICT_cover_params_t defaultCoverParams(void)
482a28cd43dSSascha Wildner {
483a28cd43dSSascha Wildner ZDICT_cover_params_t params;
484a28cd43dSSascha Wildner memset(¶ms, 0, sizeof(params));
485a28cd43dSSascha Wildner params.d = 8;
486a28cd43dSSascha Wildner params.steps = 4;
487a28cd43dSSascha Wildner params.splitPoint = 1.0;
488a28cd43dSSascha Wildner params.shrinkDict = 0;
489a28cd43dSSascha Wildner params.shrinkDictMaxRegression = kDefaultRegression;
490a28cd43dSSascha Wildner return params;
491a28cd43dSSascha Wildner }
492a28cd43dSSascha Wildner
defaultFastCoverParams(void)493a28cd43dSSascha Wildner static ZDICT_fastCover_params_t defaultFastCoverParams(void)
494a28cd43dSSascha Wildner {
495a28cd43dSSascha Wildner ZDICT_fastCover_params_t params;
496a28cd43dSSascha Wildner memset(¶ms, 0, sizeof(params));
497a28cd43dSSascha Wildner params.d = 8;
498a28cd43dSSascha Wildner params.f = 20;
499a28cd43dSSascha Wildner params.steps = 4;
500a28cd43dSSascha Wildner params.splitPoint = 0.75; /* different from default splitPoint of cover */
501a28cd43dSSascha Wildner params.accel = DEFAULT_ACCEL;
502a28cd43dSSascha Wildner params.shrinkDict = 0;
503a28cd43dSSascha Wildner params.shrinkDictMaxRegression = kDefaultRegression;
504a28cd43dSSascha Wildner return params;
505a28cd43dSSascha Wildner }
506a28cd43dSSascha Wildner #endif
507a28cd43dSSascha Wildner
508a28cd43dSSascha Wildner
/** parseAdaptParameters() :
 *  Parses the argument of "--adapt=" (e.g. the "min=1,max=19" part of
 *  "--adapt=min=1,max=19") and stores the values into *adaptMinPtr and *adaptMaxPtr.
 *  Accepted keys are "min=" and "max=", separated by ','.
 *  Both adaptMinPtr and adaptMaxPtr must point to already initialized values :
 *  a key that is absent from the string leaves its target untouched,
 *  and the final min <= max check is performed on whatever both targets hold.
 *  Targets may already have been modified when the function returns 0.
 * @return 1 means that parsing was successful,
 * @return 0 in case of malformed parameters (unknown key, trailing characters, or min > max)
 */
static unsigned parseAdaptParameters(const char* stringPtr, int* adaptMinPtr, int* adaptMaxPtr)
{
    for (;;) {
        if (longCommandWArg(&stringPtr, "min=")) {
            *adaptMinPtr = (int)readU32FromChar(&stringPtr);
        } else if (longCommandWArg(&stringPtr, "max=")) {
            *adaptMaxPtr = (int)readU32FromChar(&stringPtr);
        } else {
            DISPLAYLEVEL(4, "invalid compression parameter \n");
            return 0;
        }
        /* a ',' introduces another key=value pair; anything else ends the list */
        if (stringPtr[0] != ',') break;
        stringPtr++;
    }

    if (stringPtr[0] != 0) return 0;   /* check the end of string */

    if (*adaptMinPtr > *adaptMaxPtr) {
        DISPLAYLEVEL(4, "incoherent adaptation limits \n");
        return 0;
    }
    return 1;
}
531a28cd43dSSascha Wildner
532a28cd43dSSascha Wildner
533a28cd43dSSascha Wildner /** parseCompressionParameters() :
534a28cd43dSSascha Wildner * reads compression parameters from *stringPtr (e.g. "--zstd=wlog=23,clog=23,hlog=22,slog=6,mml=3,tlen=48,strat=6") into *params
535a28cd43dSSascha Wildner * @return 1 means that compression parameters were correct
536a28cd43dSSascha Wildner * @return 0 in case of malformed parameters
537a28cd43dSSascha Wildner */
parseCompressionParameters(const char * stringPtr,ZSTD_compressionParameters * params)538a28cd43dSSascha Wildner static unsigned parseCompressionParameters(const char* stringPtr, ZSTD_compressionParameters* params)
539a28cd43dSSascha Wildner {
540a28cd43dSSascha Wildner for ( ; ;) {
541a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "windowLog=") || longCommandWArg(&stringPtr, "wlog=")) { params->windowLog = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
542a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "chainLog=") || longCommandWArg(&stringPtr, "clog=")) { params->chainLog = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
543a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "hashLog=") || longCommandWArg(&stringPtr, "hlog=")) { params->hashLog = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
544a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "searchLog=") || longCommandWArg(&stringPtr, "slog=")) { params->searchLog = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
545a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "minMatch=") || longCommandWArg(&stringPtr, "mml=")) { params->minMatch = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
546a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "targetLength=") || longCommandWArg(&stringPtr, "tlen=")) { params->targetLength = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
547a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "strategy=") || longCommandWArg(&stringPtr, "strat=")) { params->strategy = (ZSTD_strategy)(readU32FromChar(&stringPtr)); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
548a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "overlapLog=") || longCommandWArg(&stringPtr, "ovlog=")) { g_overlapLog = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
549a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "ldmHashLog=") || longCommandWArg(&stringPtr, "lhlog=")) { g_ldmHashLog = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
550a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "ldmMinMatch=") || longCommandWArg(&stringPtr, "lmml=")) { g_ldmMinMatch = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
551a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "ldmBucketSizeLog=") || longCommandWArg(&stringPtr, "lblog=")) { g_ldmBucketSizeLog = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
552a28cd43dSSascha Wildner if (longCommandWArg(&stringPtr, "ldmHashRateLog=") || longCommandWArg(&stringPtr, "lhrlog=")) { g_ldmHashRateLog = readU32FromChar(&stringPtr); if (stringPtr[0]==',') { stringPtr++; continue; } else break; }
553a28cd43dSSascha Wildner DISPLAYLEVEL(4, "invalid compression parameter \n");
554a28cd43dSSascha Wildner return 0;
555a28cd43dSSascha Wildner }
556a28cd43dSSascha Wildner
557a28cd43dSSascha Wildner DISPLAYLEVEL(4, "windowLog=%d, chainLog=%d, hashLog=%d, searchLog=%d \n", params->windowLog, params->chainLog, params->hashLog, params->searchLog);
558a28cd43dSSascha Wildner DISPLAYLEVEL(4, "minMatch=%d, targetLength=%d, strategy=%d \n", params->minMatch, params->targetLength, params->strategy);
559a28cd43dSSascha Wildner if (stringPtr[0] != 0) return 0; /* check the end of string */
560a28cd43dSSascha Wildner return 1;
561a28cd43dSSascha Wildner }
562a28cd43dSSascha Wildner
printVersion(void)563a28cd43dSSascha Wildner static void printVersion(void)
564a28cd43dSSascha Wildner {
565a28cd43dSSascha Wildner if (g_displayLevel < DISPLAY_LEVEL_DEFAULT) {
566a28cd43dSSascha Wildner DISPLAYOUT("%s\n", ZSTD_VERSION_STRING);
567a28cd43dSSascha Wildner return;
568a28cd43dSSascha Wildner }
569a28cd43dSSascha Wildner
570a28cd43dSSascha Wildner DISPLAYOUT(WELCOME_MESSAGE);
571a28cd43dSSascha Wildner if (g_displayLevel >= 3) {
572a28cd43dSSascha Wildner /* format support */
573a28cd43dSSascha Wildner DISPLAYOUT("*** supports: zstd");
574a28cd43dSSascha Wildner #if defined(ZSTD_LEGACY_SUPPORT) && (ZSTD_LEGACY_SUPPORT>0) && (ZSTD_LEGACY_SUPPORT<8)
575a28cd43dSSascha Wildner DISPLAYOUT(", zstd legacy v0.%d+", ZSTD_LEGACY_SUPPORT);
576a28cd43dSSascha Wildner #endif
577a28cd43dSSascha Wildner #ifdef ZSTD_GZCOMPRESS
578a28cd43dSSascha Wildner DISPLAYOUT(", gzip");
579a28cd43dSSascha Wildner #endif
580a28cd43dSSascha Wildner #ifdef ZSTD_LZ4COMPRESS
581a28cd43dSSascha Wildner DISPLAYOUT(", lz4");
582a28cd43dSSascha Wildner #endif
583a28cd43dSSascha Wildner #ifdef ZSTD_LZMACOMPRESS
584a28cd43dSSascha Wildner DISPLAYOUT(", lzma, xz ");
585a28cd43dSSascha Wildner #endif
586a28cd43dSSascha Wildner DISPLAYOUT("\n");
587a28cd43dSSascha Wildner if (g_displayLevel >= 4) {
588a28cd43dSSascha Wildner /* posix support */
589a28cd43dSSascha Wildner #ifdef _POSIX_C_SOURCE
590a28cd43dSSascha Wildner DISPLAYOUT("_POSIX_C_SOURCE defined: %ldL\n", (long) _POSIX_C_SOURCE);
591a28cd43dSSascha Wildner #endif
592a28cd43dSSascha Wildner #ifdef _POSIX_VERSION
593a28cd43dSSascha Wildner DISPLAYOUT("_POSIX_VERSION defined: %ldL \n", (long) _POSIX_VERSION);
594a28cd43dSSascha Wildner #endif
595a28cd43dSSascha Wildner #ifdef PLATFORM_POSIX_VERSION
596a28cd43dSSascha Wildner DISPLAYOUT("PLATFORM_POSIX_VERSION defined: %ldL\n", (long) PLATFORM_POSIX_VERSION);
597a28cd43dSSascha Wildner #endif
598a28cd43dSSascha Wildner } }
599a28cd43dSSascha Wildner }
600a28cd43dSSascha Wildner
/* Names of the environment variables used for parameter setting */
#define ENV_CLEVEL     "ZSTD_CLEVEL"
#define ENV_NBTHREADS  "ZSTD_NBTHREADS"   /* takes lower precedence than directly specifying -T# in the CLI */
604a28cd43dSSascha Wildner
605a28cd43dSSascha Wildner /* pick up environment variable */
init_cLevel(void)606a28cd43dSSascha Wildner static int init_cLevel(void) {
607a28cd43dSSascha Wildner const char* const env = getenv(ENV_CLEVEL);
608a28cd43dSSascha Wildner if (env != NULL) {
609a28cd43dSSascha Wildner const char* ptr = env;
610a28cd43dSSascha Wildner int sign = 1;
611a28cd43dSSascha Wildner if (*ptr == '-') {
612a28cd43dSSascha Wildner sign = -1;
613a28cd43dSSascha Wildner ptr++;
614a28cd43dSSascha Wildner } else if (*ptr == '+') {
615a28cd43dSSascha Wildner ptr++;
616a28cd43dSSascha Wildner }
617a28cd43dSSascha Wildner
618a28cd43dSSascha Wildner if ((*ptr>='0') && (*ptr<='9')) {
619a28cd43dSSascha Wildner unsigned absLevel;
620a28cd43dSSascha Wildner if (readU32FromCharChecked(&ptr, &absLevel)) {
621a28cd43dSSascha Wildner DISPLAYLEVEL(2, "Ignore environment variable setting %s=%s: numeric value too large \n", ENV_CLEVEL, env);
622a28cd43dSSascha Wildner return ZSTDCLI_CLEVEL_DEFAULT;
623a28cd43dSSascha Wildner } else if (*ptr == 0) {
624a28cd43dSSascha Wildner return sign * (int)absLevel;
625a28cd43dSSascha Wildner } }
626a28cd43dSSascha Wildner
627a28cd43dSSascha Wildner DISPLAYLEVEL(2, "Ignore environment variable setting %s=%s: not a valid integer value \n", ENV_CLEVEL, env);
628a28cd43dSSascha Wildner }
629a28cd43dSSascha Wildner
630a28cd43dSSascha Wildner return ZSTDCLI_CLEVEL_DEFAULT;
631a28cd43dSSascha Wildner }
632a28cd43dSSascha Wildner
633a28cd43dSSascha Wildner #ifdef ZSTD_MULTITHREAD
init_nbThreads(void)634a28cd43dSSascha Wildner static unsigned init_nbThreads(void) {
635a28cd43dSSascha Wildner const char* const env = getenv(ENV_NBTHREADS);
636a28cd43dSSascha Wildner if (env != NULL) {
637a28cd43dSSascha Wildner const char* ptr = env;
638a28cd43dSSascha Wildner if ((*ptr>='0') && (*ptr<='9')) {
639a28cd43dSSascha Wildner unsigned nbThreads;
640a28cd43dSSascha Wildner if (readU32FromCharChecked(&ptr, &nbThreads)) {
641a28cd43dSSascha Wildner DISPLAYLEVEL(2, "Ignore environment variable setting %s=%s: numeric value too large \n", ENV_NBTHREADS, env);
642a28cd43dSSascha Wildner return ZSTDCLI_NBTHREADS_DEFAULT;
643a28cd43dSSascha Wildner } else if (*ptr == 0) {
644a28cd43dSSascha Wildner return nbThreads;
645a28cd43dSSascha Wildner }
646a28cd43dSSascha Wildner }
647a28cd43dSSascha Wildner DISPLAYLEVEL(2, "Ignore environment variable setting %s=%s: not a valid unsigned value \n", ENV_NBTHREADS, env);
648a28cd43dSSascha Wildner }
649a28cd43dSSascha Wildner
650a28cd43dSSascha Wildner return ZSTDCLI_NBTHREADS_DEFAULT;
651a28cd43dSSascha Wildner }
652a28cd43dSSascha Wildner #endif
653a28cd43dSSascha Wildner
/* NEXT_FIELD() :
 * Makes `ptr` point to the value attached to the command currently parsed.
 * Relies on names provided by the expansion site :
 * `argument`, `argNb`, `argCount`, `argv`, and whatever CLEAN_RETURN() needs.
 * - When `argument` is not positioned on '=', the value is taken from the next
 *   argv[] entry (argNb is incremented). It is an error when there is no such
 *   entry, or when that entry starts with '-'.
 * - Otherwise, the value is whatever follows '=', and `argument` is moved
 *   to the end of its string.
 * Errors display a message, then leave through CLEAN_RETURN(1).
 */
#define NEXT_FIELD(ptr) {                                   \
    if (*argument != '=') {                                 \
        argNb++;                                            \
        if (argNb >= argCount) {                            \
            DISPLAY("error: missing command argument \n");  \
            CLEAN_RETURN(1);                                \
        }                                                   \
        ptr = argv[argNb];                                  \
        assert(ptr != NULL);                                \
        if (ptr[0]=='-') {                                  \
            DISPLAY("error: command cannot be separated from its argument by another command \n"); \
            CLEAN_RETURN(1);                                \
        }                                                   \
    } else {                                                \
        ptr = ++argument;                                   \
        argument += strlen(ptr);                            \
    }                                                       \
}
670a28cd43dSSascha Wildner
/* NEXT_UINT32() :
 * Locates the value attached to the command currently parsed, using NEXT_FIELD(),
 * then stores into `val32` the result of readU32FromChar() on that value.
 * Characters left after the parsed number are not checked here.
 * The helper variable is local to the macro's own block, and its name avoids
 * the double-underscore form, which is reserved to the implementation.
 */
#define NEXT_UINT32(val32) {                          \
    const char* nextUint32Field;                      \
    NEXT_FIELD(nextUint32Field);                      \
    val32 = readU32FromChar(&nextUint32Field);        \
}
676a28cd43dSSascha Wildner
/* Strategy names, stored at indexes 1..ZSTD_NB_STRATEGIES; index 0 holds an empty string */
#define ZSTD_NB_STRATEGIES 9
static const char* ZSTD_strategyMap[ZSTD_NB_STRATEGIES + 1] = {
    "",
    "ZSTD_fast",
    "ZSTD_dfast",
    "ZSTD_greedy",
    "ZSTD_lazy",
    "ZSTD_lazy2",
    "ZSTD_btlazy2",
    "ZSTD_btopt",
    "ZSTD_btultra",
    "ZSTD_btultra2"
};
681a28cd43dSSascha Wildner
/* Operation selected on the command line */
typedef enum {
    zom_compress,
    zom_decompress,
    zom_test,
    zom_bench,
    zom_train,
    zom_list
} zstd_operation_mode;
683a28cd43dSSascha Wildner
/* CLEAN_RETURN() :
 * Stores `i` into `operationResult`, then jumps to the `_end` label.
 * Both names must exist in the function where the macro is expanded. */
#define CLEAN_RETURN(i) {       \
    operationResult = (i);      \
    goto _end;                  \
}
685a28cd43dSSascha Wildner
/* Bounds of the compression level range */
#ifndef ZSTD_NOCOMPRESS
#  define MINCLEVEL  ZSTD_minCLevel()
#  define MAXCLEVEL  ZSTD_maxCLevel()
#else
/* symbols from compression library are not defined and should not be invoked */
#  define MINCLEVEL  -99
#  define MAXCLEVEL  22
#endif
694a28cd43dSSascha Wildner
main(int const argCount,const char * argv[])695a28cd43dSSascha Wildner int main(int const argCount, const char* argv[])
696a28cd43dSSascha Wildner {
697a28cd43dSSascha Wildner int argNb,
698a28cd43dSSascha Wildner followLinks = 0,
699a28cd43dSSascha Wildner forceStdout = 0,
700a28cd43dSSascha Wildner hasStdout = 0,
701a28cd43dSSascha Wildner ldmFlag = 0,
702a28cd43dSSascha Wildner main_pause = 0,
703a28cd43dSSascha Wildner nbWorkers = 0,
704a28cd43dSSascha Wildner adapt = 0,
705a28cd43dSSascha Wildner adaptMin = MINCLEVEL,
706a28cd43dSSascha Wildner adaptMax = MAXCLEVEL,
707a28cd43dSSascha Wildner rsyncable = 0,
708a28cd43dSSascha Wildner nextArgumentsAreFiles = 0,
709a28cd43dSSascha Wildner operationResult = 0,
710a28cd43dSSascha Wildner separateFiles = 0,
711a28cd43dSSascha Wildner setRealTimePrio = 0,
712a28cd43dSSascha Wildner singleThread = 0,
713a28cd43dSSascha Wildner showDefaultCParams = 0,
714a28cd43dSSascha Wildner ultra=0,
715a28cd43dSSascha Wildner contentSize=1;
716a28cd43dSSascha Wildner double compressibility = 0.5;
717a28cd43dSSascha Wildner unsigned bench_nbSeconds = 3; /* would be better if this value was synchronized from bench */
718a28cd43dSSascha Wildner size_t blockSize = 0;
719a28cd43dSSascha Wildner
720a28cd43dSSascha Wildner FIO_prefs_t* const prefs = FIO_createPreferences();
721a28cd43dSSascha Wildner FIO_ctx_t* const fCtx = FIO_createContext();
722a28cd43dSSascha Wildner zstd_operation_mode operation = zom_compress;
723a28cd43dSSascha Wildner ZSTD_compressionParameters compressionParams;
724a28cd43dSSascha Wildner int cLevel = init_cLevel();
725a28cd43dSSascha Wildner int cLevelLast = MINCLEVEL - 1; /* lower than minimum */
726a28cd43dSSascha Wildner unsigned recursive = 0;
727a28cd43dSSascha Wildner unsigned memLimit = 0;
728a28cd43dSSascha Wildner FileNamesTable* filenames = UTIL_allocateFileNamesTable((size_t)argCount); /* argCount >= 1 */
729a28cd43dSSascha Wildner FileNamesTable* file_of_names = UTIL_allocateFileNamesTable((size_t)argCount); /* argCount >= 1 */
730a28cd43dSSascha Wildner const char* programName = argv[0];
731a28cd43dSSascha Wildner const char* outFileName = NULL;
732a28cd43dSSascha Wildner const char* outDirName = NULL;
733a28cd43dSSascha Wildner const char* outMirroredDirName = NULL;
734a28cd43dSSascha Wildner const char* dictFileName = NULL;
735a28cd43dSSascha Wildner const char* patchFromDictFileName = NULL;
736a28cd43dSSascha Wildner const char* suffix = ZSTD_EXTENSION;
737a28cd43dSSascha Wildner unsigned maxDictSize = g_defaultMaxDictSize;
738a28cd43dSSascha Wildner unsigned dictID = 0;
739a28cd43dSSascha Wildner size_t streamSrcSize = 0;
740a28cd43dSSascha Wildner size_t targetCBlockSize = 0;
741a28cd43dSSascha Wildner size_t srcSizeHint = 0;
742a28cd43dSSascha Wildner int dictCLevel = g_defaultDictCLevel;
743a28cd43dSSascha Wildner unsigned dictSelect = g_defaultSelectivityLevel;
744a28cd43dSSascha Wildner #ifndef ZSTD_NODICT
745a28cd43dSSascha Wildner ZDICT_cover_params_t coverParams = defaultCoverParams();
746a28cd43dSSascha Wildner ZDICT_fastCover_params_t fastCoverParams = defaultFastCoverParams();
747a28cd43dSSascha Wildner dictType dict = fastCover;
748a28cd43dSSascha Wildner #endif
749a28cd43dSSascha Wildner #ifndef ZSTD_NOBENCH
750a28cd43dSSascha Wildner BMK_advancedParams_t benchParams = BMK_initAdvancedParams();
751a28cd43dSSascha Wildner #endif
752a28cd43dSSascha Wildner ZSTD_literalCompressionMode_e literalCompressionMode = ZSTD_lcm_auto;
753a28cd43dSSascha Wildner
754a28cd43dSSascha Wildner
755a28cd43dSSascha Wildner /* init */
756a28cd43dSSascha Wildner (void)recursive; (void)cLevelLast; /* not used when ZSTD_NOBENCH set */
757a28cd43dSSascha Wildner (void)memLimit;
758a28cd43dSSascha Wildner assert(argCount >= 1);
759a28cd43dSSascha Wildner if ((filenames==NULL) || (file_of_names==NULL)) { DISPLAY("zstd: allocation error \n"); exit(1); }
760a28cd43dSSascha Wildner programName = lastNameFromPath(programName);
761a28cd43dSSascha Wildner #ifdef ZSTD_MULTITHREAD
762a28cd43dSSascha Wildner nbWorkers = init_nbThreads();
763a28cd43dSSascha Wildner #endif
764a28cd43dSSascha Wildner
765a28cd43dSSascha Wildner /* preset behaviors */
766a28cd43dSSascha Wildner if (exeNameMatch(programName, ZSTD_ZSTDMT)) nbWorkers=0, singleThread=0;
767a28cd43dSSascha Wildner if (exeNameMatch(programName, ZSTD_UNZSTD)) operation=zom_decompress;
768a28cd43dSSascha Wildner if (exeNameMatch(programName, ZSTD_CAT)) { operation=zom_decompress; FIO_overwriteMode(prefs); forceStdout=1; followLinks=1; outFileName=stdoutmark; g_displayLevel=1; } /* supports multiple formats */
769a28cd43dSSascha Wildner if (exeNameMatch(programName, ZSTD_ZCAT)) { operation=zom_decompress; FIO_overwriteMode(prefs); forceStdout=1; followLinks=1; outFileName=stdoutmark; g_displayLevel=1; } /* behave like zcat, also supports multiple formats */
770a28cd43dSSascha Wildner if (exeNameMatch(programName, ZSTD_GZ)) { suffix = GZ_EXTENSION; FIO_setCompressionType(prefs, FIO_gzipCompression); FIO_setRemoveSrcFile(prefs, 1); } /* behave like gzip */
771a28cd43dSSascha Wildner if (exeNameMatch(programName, ZSTD_GUNZIP)) { operation=zom_decompress; FIO_setRemoveSrcFile(prefs, 1); } /* behave like gunzip, also supports multiple formats */
772a28cd43dSSascha Wildner if (exeNameMatch(programName, ZSTD_GZCAT)) { operation=zom_decompress; FIO_overwriteMode(prefs); forceStdout=1; followLinks=1; outFileName=stdoutmark; g_displayLevel=1; } /* behave like gzcat, also supports multiple formats */
773a28cd43dSSascha Wildner if (exeNameMatch(programName, ZSTD_LZMA)) { suffix = LZMA_EXTENSION; FIO_setCompressionType(prefs, FIO_lzmaCompression); FIO_setRemoveSrcFile(prefs, 1); } /* behave like lzma */
774a28cd43dSSascha Wildner if (exeNameMatch(programName, ZSTD_UNLZMA)) { operation=zom_decompress; FIO_setCompressionType(prefs, FIO_lzmaCompression); FIO_setRemoveSrcFile(prefs, 1); } /* behave like unlzma, also supports multiple formats */
775a28cd43dSSascha Wildner if (exeNameMatch(programName, ZSTD_XZ)) { suffix = XZ_EXTENSION; FIO_setCompressionType(prefs, FIO_xzCompression); FIO_setRemoveSrcFile(prefs, 1); } /* behave like xz */
776a28cd43dSSascha Wildner if (exeNameMatch(programName, ZSTD_UNXZ)) { operation=zom_decompress; FIO_setCompressionType(prefs, FIO_xzCompression); FIO_setRemoveSrcFile(prefs, 1); } /* behave like unxz, also supports multiple formats */
777a28cd43dSSascha Wildner if (exeNameMatch(programName, ZSTD_LZ4)) { suffix = LZ4_EXTENSION; FIO_setCompressionType(prefs, FIO_lz4Compression); } /* behave like lz4 */
778a28cd43dSSascha Wildner if (exeNameMatch(programName, ZSTD_UNLZ4)) { operation=zom_decompress; FIO_setCompressionType(prefs, FIO_lz4Compression); } /* behave like unlz4, also supports multiple formats */
779a28cd43dSSascha Wildner memset(&compressionParams, 0, sizeof(compressionParams));
780a28cd43dSSascha Wildner
781a28cd43dSSascha Wildner /* init crash handler */
782a28cd43dSSascha Wildner FIO_addAbortHandler();
783a28cd43dSSascha Wildner
784a28cd43dSSascha Wildner /* command switches */
785a28cd43dSSascha Wildner for (argNb=1; argNb<argCount; argNb++) {
786a28cd43dSSascha Wildner const char* argument = argv[argNb];
787a28cd43dSSascha Wildner if (!argument) continue; /* Protection if argument empty */
788a28cd43dSSascha Wildner
789a28cd43dSSascha Wildner if (nextArgumentsAreFiles) {
790a28cd43dSSascha Wildner UTIL_refFilename(filenames, argument);
791a28cd43dSSascha Wildner continue;
792a28cd43dSSascha Wildner }
793a28cd43dSSascha Wildner
794a28cd43dSSascha Wildner /* "-" means stdin/stdout */
795a28cd43dSSascha Wildner if (!strcmp(argument, "-")){
796a28cd43dSSascha Wildner UTIL_refFilename(filenames, stdinmark);
797a28cd43dSSascha Wildner continue;
798a28cd43dSSascha Wildner }
799a28cd43dSSascha Wildner
800a28cd43dSSascha Wildner /* Decode commands (note : aggregated commands are allowed) */
801a28cd43dSSascha Wildner if (argument[0]=='-') {
802a28cd43dSSascha Wildner
803a28cd43dSSascha Wildner if (argument[1]=='-') {
804a28cd43dSSascha Wildner /* long commands (--long-word) */
805a28cd43dSSascha Wildner if (!strcmp(argument, "--")) { nextArgumentsAreFiles=1; continue; } /* only file names allowed from now on */
806a28cd43dSSascha Wildner if (!strcmp(argument, "--list")) { operation=zom_list; continue; }
807a28cd43dSSascha Wildner if (!strcmp(argument, "--compress")) { operation=zom_compress; continue; }
808a28cd43dSSascha Wildner if (!strcmp(argument, "--decompress")) { operation=zom_decompress; continue; }
809a28cd43dSSascha Wildner if (!strcmp(argument, "--uncompress")) { operation=zom_decompress; continue; }
810a28cd43dSSascha Wildner if (!strcmp(argument, "--force")) { FIO_overwriteMode(prefs); forceStdout=1; followLinks=1; continue; }
811a28cd43dSSascha Wildner if (!strcmp(argument, "--version")) { printVersion(); CLEAN_RETURN(0); }
812a28cd43dSSascha Wildner if (!strcmp(argument, "--help")) { usage_advanced(programName); CLEAN_RETURN(0); }
813a28cd43dSSascha Wildner if (!strcmp(argument, "--verbose")) { g_displayLevel++; continue; }
814a28cd43dSSascha Wildner if (!strcmp(argument, "--quiet")) { g_displayLevel--; continue; }
815a28cd43dSSascha Wildner if (!strcmp(argument, "--stdout")) { forceStdout=1; outFileName=stdoutmark; g_displayLevel-=(g_displayLevel==2); continue; }
816a28cd43dSSascha Wildner if (!strcmp(argument, "--ultra")) { ultra=1; continue; }
817a28cd43dSSascha Wildner if (!strcmp(argument, "--check")) { FIO_setChecksumFlag(prefs, 2); continue; }
818a28cd43dSSascha Wildner if (!strcmp(argument, "--no-check")) { FIO_setChecksumFlag(prefs, 0); continue; }
819a28cd43dSSascha Wildner if (!strcmp(argument, "--sparse")) { FIO_setSparseWrite(prefs, 2); continue; }
820a28cd43dSSascha Wildner if (!strcmp(argument, "--no-sparse")) { FIO_setSparseWrite(prefs, 0); continue; }
821a28cd43dSSascha Wildner if (!strcmp(argument, "--test")) { operation=zom_test; continue; }
822a28cd43dSSascha Wildner if (!strcmp(argument, "--train")) { operation=zom_train; if (outFileName==NULL) outFileName=g_defaultDictName; continue; }
823a28cd43dSSascha Wildner if (!strcmp(argument, "--no-dictID")) { FIO_setDictIDFlag(prefs, 0); continue; }
824a28cd43dSSascha Wildner if (!strcmp(argument, "--keep")) { FIO_setRemoveSrcFile(prefs, 0); continue; }
825a28cd43dSSascha Wildner if (!strcmp(argument, "--rm")) { FIO_setRemoveSrcFile(prefs, 1); continue; }
826a28cd43dSSascha Wildner if (!strcmp(argument, "--priority=rt")) { setRealTimePrio = 1; continue; }
827a28cd43dSSascha Wildner if (!strcmp(argument, "--show-default-cparams")) { showDefaultCParams = 1; continue; }
828a28cd43dSSascha Wildner if (!strcmp(argument, "--content-size")) { contentSize = 1; continue; }
829a28cd43dSSascha Wildner if (!strcmp(argument, "--no-content-size")) { contentSize = 0; continue; }
830a28cd43dSSascha Wildner if (!strcmp(argument, "--adapt")) { adapt = 1; continue; }
831a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--adapt=")) { adapt = 1; if (!parseAdaptParameters(argument, &adaptMin, &adaptMax)) { badusage(programName); CLEAN_RETURN(1); } continue; }
832a28cd43dSSascha Wildner if (!strcmp(argument, "--single-thread")) { nbWorkers = 0; singleThread = 1; continue; }
833a28cd43dSSascha Wildner if (!strcmp(argument, "--format=zstd")) { suffix = ZSTD_EXTENSION; FIO_setCompressionType(prefs, FIO_zstdCompression); continue; }
834a28cd43dSSascha Wildner #ifdef ZSTD_GZCOMPRESS
835a28cd43dSSascha Wildner if (!strcmp(argument, "--format=gzip")) { suffix = GZ_EXTENSION; FIO_setCompressionType(prefs, FIO_gzipCompression); continue; }
836a28cd43dSSascha Wildner #endif
837a28cd43dSSascha Wildner #ifdef ZSTD_LZMACOMPRESS
838a28cd43dSSascha Wildner if (!strcmp(argument, "--format=lzma")) { suffix = LZMA_EXTENSION; FIO_setCompressionType(prefs, FIO_lzmaCompression); continue; }
839a28cd43dSSascha Wildner if (!strcmp(argument, "--format=xz")) { suffix = XZ_EXTENSION; FIO_setCompressionType(prefs, FIO_xzCompression); continue; }
840a28cd43dSSascha Wildner #endif
841a28cd43dSSascha Wildner #ifdef ZSTD_LZ4COMPRESS
842a28cd43dSSascha Wildner if (!strcmp(argument, "--format=lz4")) { suffix = LZ4_EXTENSION; FIO_setCompressionType(prefs, FIO_lz4Compression); continue; }
843a28cd43dSSascha Wildner #endif
844a28cd43dSSascha Wildner if (!strcmp(argument, "--rsyncable")) { rsyncable = 1; continue; }
845a28cd43dSSascha Wildner if (!strcmp(argument, "--compress-literals")) { literalCompressionMode = ZSTD_lcm_huffman; continue; }
846a28cd43dSSascha Wildner if (!strcmp(argument, "--no-compress-literals")) { literalCompressionMode = ZSTD_lcm_uncompressed; continue; }
847a28cd43dSSascha Wildner if (!strcmp(argument, "--no-progress")) { FIO_setNoProgress(1); continue; }
848a28cd43dSSascha Wildner if (!strcmp(argument, "--exclude-compressed")) { FIO_setExcludeCompressedFile(prefs, 1); continue; }
849a28cd43dSSascha Wildner
850a28cd43dSSascha Wildner /* long commands with arguments */
851a28cd43dSSascha Wildner #ifndef ZSTD_NODICT
852a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--train-cover")) {
853a28cd43dSSascha Wildner operation = zom_train;
854a28cd43dSSascha Wildner if (outFileName == NULL)
855a28cd43dSSascha Wildner outFileName = g_defaultDictName;
856a28cd43dSSascha Wildner dict = cover;
857a28cd43dSSascha Wildner /* Allow optional arguments following an = */
858a28cd43dSSascha Wildner if (*argument == 0) { memset(&coverParams, 0, sizeof(coverParams)); }
859a28cd43dSSascha Wildner else if (*argument++ != '=') { badusage(programName); CLEAN_RETURN(1); }
860a28cd43dSSascha Wildner else if (!parseCoverParameters(argument, &coverParams)) { badusage(programName); CLEAN_RETURN(1); }
861a28cd43dSSascha Wildner continue;
862a28cd43dSSascha Wildner }
863a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--train-fastcover")) {
864a28cd43dSSascha Wildner operation = zom_train;
865a28cd43dSSascha Wildner if (outFileName == NULL)
866a28cd43dSSascha Wildner outFileName = g_defaultDictName;
867a28cd43dSSascha Wildner dict = fastCover;
868a28cd43dSSascha Wildner /* Allow optional arguments following an = */
869a28cd43dSSascha Wildner if (*argument == 0) { memset(&fastCoverParams, 0, sizeof(fastCoverParams)); }
870a28cd43dSSascha Wildner else if (*argument++ != '=') { badusage(programName); CLEAN_RETURN(1); }
871a28cd43dSSascha Wildner else if (!parseFastCoverParameters(argument, &fastCoverParams)) { badusage(programName); CLEAN_RETURN(1); }
872a28cd43dSSascha Wildner continue;
873a28cd43dSSascha Wildner }
874a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--train-legacy")) {
875a28cd43dSSascha Wildner operation = zom_train;
876a28cd43dSSascha Wildner if (outFileName == NULL)
877a28cd43dSSascha Wildner outFileName = g_defaultDictName;
878a28cd43dSSascha Wildner dict = legacy;
879a28cd43dSSascha Wildner /* Allow optional arguments following an = */
880a28cd43dSSascha Wildner if (*argument == 0) { continue; }
881a28cd43dSSascha Wildner else if (*argument++ != '=') { badusage(programName); CLEAN_RETURN(1); }
882a28cd43dSSascha Wildner else if (!parseLegacyParameters(argument, &dictSelect)) { badusage(programName); CLEAN_RETURN(1); }
883a28cd43dSSascha Wildner continue;
884a28cd43dSSascha Wildner }
885a28cd43dSSascha Wildner #endif
886a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--threads")) { NEXT_UINT32(nbWorkers); continue; }
887a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--memlimit")) { NEXT_UINT32(memLimit); continue; }
888a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--memory")) { NEXT_UINT32(memLimit); continue; }
889a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--memlimit-decompress")) { NEXT_UINT32(memLimit); continue; }
890a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--block-size=")) { blockSize = readSizeTFromChar(&argument); continue; }
891a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--maxdict")) { NEXT_UINT32(maxDictSize); continue; }
892a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--dictID")) { NEXT_UINT32(dictID); continue; }
893a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--zstd=")) { if (!parseCompressionParameters(argument, &compressionParams)) { badusage(programName); CLEAN_RETURN(1); } continue; }
894a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--stream-size=")) { streamSrcSize = readSizeTFromChar(&argument); continue; }
895a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--target-compressed-block-size=")) { targetCBlockSize = readSizeTFromChar(&argument); continue; }
896a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--size-hint=")) { srcSizeHint = readSizeTFromChar(&argument); continue; }
897a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--output-dir-flat")) { NEXT_FIELD(outDirName); continue; }
898a28cd43dSSascha Wildner #ifdef UTIL_HAS_MIRRORFILELIST
899a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--output-dir-mirror")) { NEXT_FIELD(outMirroredDirName); continue; }
900a28cd43dSSascha Wildner #endif
901a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--patch-from")) { NEXT_FIELD(patchFromDictFileName); continue; }
902a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--long")) {
903a28cd43dSSascha Wildner unsigned ldmWindowLog = 0;
904a28cd43dSSascha Wildner ldmFlag = 1;
905a28cd43dSSascha Wildner /* Parse optional window log */
906a28cd43dSSascha Wildner if (*argument == '=') {
907a28cd43dSSascha Wildner ++argument;
908a28cd43dSSascha Wildner ldmWindowLog = readU32FromChar(&argument);
909a28cd43dSSascha Wildner } else if (*argument != 0) {
910a28cd43dSSascha Wildner /* Invalid character following --long */
911a28cd43dSSascha Wildner badusage(programName);
912a28cd43dSSascha Wildner CLEAN_RETURN(1);
913a28cd43dSSascha Wildner }
914a28cd43dSSascha Wildner /* Only set windowLog if not already set by --zstd */
915a28cd43dSSascha Wildner if (compressionParams.windowLog == 0)
916a28cd43dSSascha Wildner compressionParams.windowLog = ldmWindowLog;
917a28cd43dSSascha Wildner continue;
918a28cd43dSSascha Wildner }
919a28cd43dSSascha Wildner #ifndef ZSTD_NOCOMPRESS /* linking ZSTD_minCLevel() requires compression support */
920a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--fast")) {
921a28cd43dSSascha Wildner /* Parse optional acceleration factor */
922a28cd43dSSascha Wildner if (*argument == '=') {
923a28cd43dSSascha Wildner U32 const maxFast = (U32)-ZSTD_minCLevel();
924a28cd43dSSascha Wildner U32 fastLevel;
925a28cd43dSSascha Wildner ++argument;
926a28cd43dSSascha Wildner fastLevel = readU32FromChar(&argument);
927a28cd43dSSascha Wildner if (fastLevel > maxFast) fastLevel = maxFast;
928a28cd43dSSascha Wildner if (fastLevel) {
929a28cd43dSSascha Wildner dictCLevel = cLevel = -(int)fastLevel;
930a28cd43dSSascha Wildner } else {
931a28cd43dSSascha Wildner badusage(programName);
932a28cd43dSSascha Wildner CLEAN_RETURN(1);
933a28cd43dSSascha Wildner }
934a28cd43dSSascha Wildner } else if (*argument != 0) {
935a28cd43dSSascha Wildner /* Invalid character following --fast */
936a28cd43dSSascha Wildner badusage(programName);
937a28cd43dSSascha Wildner CLEAN_RETURN(1);
938a28cd43dSSascha Wildner } else {
939a28cd43dSSascha Wildner cLevel = -1; /* default for --fast */
940a28cd43dSSascha Wildner }
941a28cd43dSSascha Wildner continue;
942a28cd43dSSascha Wildner }
943a28cd43dSSascha Wildner #endif
944a28cd43dSSascha Wildner
945a28cd43dSSascha Wildner if (longCommandWArg(&argument, "--filelist")) {
946a28cd43dSSascha Wildner const char* listName;
947a28cd43dSSascha Wildner NEXT_FIELD(listName);
948a28cd43dSSascha Wildner UTIL_refFilename(file_of_names, listName);
949a28cd43dSSascha Wildner continue;
950a28cd43dSSascha Wildner }
951a28cd43dSSascha Wildner
952a28cd43dSSascha Wildner /* fall-through, will trigger bad_usage() later on */
953a28cd43dSSascha Wildner }
954a28cd43dSSascha Wildner
955a28cd43dSSascha Wildner argument++;
956a28cd43dSSascha Wildner while (argument[0]!=0) {
957a28cd43dSSascha Wildner
958a28cd43dSSascha Wildner #ifndef ZSTD_NOCOMPRESS
959a28cd43dSSascha Wildner /* compression Level */
960a28cd43dSSascha Wildner if ((*argument>='0') && (*argument<='9')) {
961a28cd43dSSascha Wildner dictCLevel = cLevel = (int)readU32FromChar(&argument);
962a28cd43dSSascha Wildner continue;
963a28cd43dSSascha Wildner }
964a28cd43dSSascha Wildner #endif
965a28cd43dSSascha Wildner
966a28cd43dSSascha Wildner switch(argument[0])
967a28cd43dSSascha Wildner {
968a28cd43dSSascha Wildner /* Display help */
969a28cd43dSSascha Wildner case 'V': printVersion(); CLEAN_RETURN(0); /* Version Only */
970a28cd43dSSascha Wildner case 'H':
971a28cd43dSSascha Wildner case 'h': usage_advanced(programName); CLEAN_RETURN(0);
972a28cd43dSSascha Wildner
973a28cd43dSSascha Wildner /* Compress */
974a28cd43dSSascha Wildner case 'z': operation=zom_compress; argument++; break;
975a28cd43dSSascha Wildner
976a28cd43dSSascha Wildner /* Decoding */
977a28cd43dSSascha Wildner case 'd':
978a28cd43dSSascha Wildner #ifndef ZSTD_NOBENCH
979a28cd43dSSascha Wildner benchParams.mode = BMK_decodeOnly;
980a28cd43dSSascha Wildner if (operation==zom_bench) { argument++; break; } /* benchmark decode (hidden option) */
981a28cd43dSSascha Wildner #endif
982a28cd43dSSascha Wildner operation=zom_decompress; argument++; break;
983a28cd43dSSascha Wildner
984a28cd43dSSascha Wildner /* Force stdout, even if stdout==console */
985a28cd43dSSascha Wildner case 'c': forceStdout=1; outFileName=stdoutmark; argument++; break;
986a28cd43dSSascha Wildner
987a28cd43dSSascha Wildner /* Use file content as dictionary */
988a28cd43dSSascha Wildner case 'D': argument++; NEXT_FIELD(dictFileName); break;
989a28cd43dSSascha Wildner
990a28cd43dSSascha Wildner /* Overwrite */
991a28cd43dSSascha Wildner case 'f': FIO_overwriteMode(prefs); forceStdout=1; followLinks=1; argument++; break;
992a28cd43dSSascha Wildner
993a28cd43dSSascha Wildner /* Verbose mode */
994a28cd43dSSascha Wildner case 'v': g_displayLevel++; argument++; break;
995a28cd43dSSascha Wildner
996a28cd43dSSascha Wildner /* Quiet mode */
997a28cd43dSSascha Wildner case 'q': g_displayLevel--; argument++; break;
998a28cd43dSSascha Wildner
999a28cd43dSSascha Wildner /* keep source file (default) */
1000a28cd43dSSascha Wildner case 'k': FIO_setRemoveSrcFile(prefs, 0); argument++; break;
1001a28cd43dSSascha Wildner
1002a28cd43dSSascha Wildner /* Checksum */
1003a28cd43dSSascha Wildner case 'C': FIO_setChecksumFlag(prefs, 2); argument++; break;
1004a28cd43dSSascha Wildner
1005a28cd43dSSascha Wildner /* test compressed file */
1006a28cd43dSSascha Wildner case 't': operation=zom_test; argument++; break;
1007a28cd43dSSascha Wildner
1008a28cd43dSSascha Wildner /* destination file name */
1009a28cd43dSSascha Wildner case 'o': argument++; NEXT_FIELD(outFileName); break;
1010a28cd43dSSascha Wildner
1011a28cd43dSSascha Wildner /* limit memory */
1012a28cd43dSSascha Wildner case 'M':
1013a28cd43dSSascha Wildner argument++;
1014a28cd43dSSascha Wildner memLimit = readU32FromChar(&argument);
1015a28cd43dSSascha Wildner break;
1016a28cd43dSSascha Wildner case 'l': operation=zom_list; argument++; break;
1017a28cd43dSSascha Wildner #ifdef UTIL_HAS_CREATEFILELIST
1018a28cd43dSSascha Wildner /* recursive */
1019a28cd43dSSascha Wildner case 'r': recursive=1; argument++; break;
1020a28cd43dSSascha Wildner #endif
1021a28cd43dSSascha Wildner
1022a28cd43dSSascha Wildner #ifndef ZSTD_NOBENCH
1023a28cd43dSSascha Wildner /* Benchmark */
1024a28cd43dSSascha Wildner case 'b':
1025a28cd43dSSascha Wildner operation=zom_bench;
1026a28cd43dSSascha Wildner argument++;
1027a28cd43dSSascha Wildner break;
1028a28cd43dSSascha Wildner
1029a28cd43dSSascha Wildner /* range bench (benchmark only) */
1030a28cd43dSSascha Wildner case 'e':
1031a28cd43dSSascha Wildner /* compression Level */
1032a28cd43dSSascha Wildner argument++;
1033a28cd43dSSascha Wildner cLevelLast = (int)readU32FromChar(&argument);
1034a28cd43dSSascha Wildner break;
1035a28cd43dSSascha Wildner
1036a28cd43dSSascha Wildner /* Modify Nb Iterations (benchmark only) */
1037a28cd43dSSascha Wildner case 'i':
1038a28cd43dSSascha Wildner argument++;
1039a28cd43dSSascha Wildner bench_nbSeconds = readU32FromChar(&argument);
1040a28cd43dSSascha Wildner break;
1041a28cd43dSSascha Wildner
1042a28cd43dSSascha Wildner /* cut input into blocks (benchmark only) */
1043a28cd43dSSascha Wildner case 'B':
1044a28cd43dSSascha Wildner argument++;
1045a28cd43dSSascha Wildner blockSize = readU32FromChar(&argument);
1046a28cd43dSSascha Wildner break;
1047a28cd43dSSascha Wildner
1048a28cd43dSSascha Wildner /* benchmark files separately (hidden option) */
1049a28cd43dSSascha Wildner case 'S':
1050a28cd43dSSascha Wildner argument++;
1051a28cd43dSSascha Wildner separateFiles = 1;
1052a28cd43dSSascha Wildner break;
1053a28cd43dSSascha Wildner
1054a28cd43dSSascha Wildner #endif /* ZSTD_NOBENCH */
1055a28cd43dSSascha Wildner
1056a28cd43dSSascha Wildner /* nb of threads (hidden option) */
1057a28cd43dSSascha Wildner case 'T':
1058a28cd43dSSascha Wildner argument++;
1059a28cd43dSSascha Wildner nbWorkers = (int)readU32FromChar(&argument);
1060a28cd43dSSascha Wildner break;
1061a28cd43dSSascha Wildner
1062a28cd43dSSascha Wildner /* Dictionary Selection level */
1063a28cd43dSSascha Wildner case 's':
1064a28cd43dSSascha Wildner argument++;
1065a28cd43dSSascha Wildner dictSelect = readU32FromChar(&argument);
1066a28cd43dSSascha Wildner break;
1067a28cd43dSSascha Wildner
1068a28cd43dSSascha Wildner /* Pause at the end (-p) or set an additional param (-p#) (hidden option) */
1069a28cd43dSSascha Wildner case 'p': argument++;
1070a28cd43dSSascha Wildner #ifndef ZSTD_NOBENCH
1071a28cd43dSSascha Wildner if ((*argument>='0') && (*argument<='9')) {
1072a28cd43dSSascha Wildner benchParams.additionalParam = (int)readU32FromChar(&argument);
1073a28cd43dSSascha Wildner } else
1074a28cd43dSSascha Wildner #endif
1075a28cd43dSSascha Wildner main_pause=1;
1076a28cd43dSSascha Wildner break;
1077a28cd43dSSascha Wildner
1078a28cd43dSSascha Wildner /* Select compressibility of synthetic sample */
1079a28cd43dSSascha Wildner case 'P':
1080a28cd43dSSascha Wildner argument++;
1081a28cd43dSSascha Wildner compressibility = (double)readU32FromChar(&argument) / 100;
1082a28cd43dSSascha Wildner break;
1083a28cd43dSSascha Wildner
1084a28cd43dSSascha Wildner /* unknown command */
1085a28cd43dSSascha Wildner default : badusage(programName); CLEAN_RETURN(1);
1086a28cd43dSSascha Wildner }
1087a28cd43dSSascha Wildner }
1088a28cd43dSSascha Wildner continue;
1089a28cd43dSSascha Wildner } /* if (argument[0]=='-') */
1090a28cd43dSSascha Wildner
1091a28cd43dSSascha Wildner /* none of the above : add filename to list */
1092a28cd43dSSascha Wildner UTIL_refFilename(filenames, argument);
1093a28cd43dSSascha Wildner }
1094a28cd43dSSascha Wildner
1095a28cd43dSSascha Wildner /* Welcome message (if verbose) */
1096a28cd43dSSascha Wildner DISPLAYLEVEL(3, WELCOME_MESSAGE);
1097a28cd43dSSascha Wildner
1098a28cd43dSSascha Wildner #ifdef ZSTD_MULTITHREAD
1099a28cd43dSSascha Wildner if ((nbWorkers==0) && (!singleThread)) {
1100a28cd43dSSascha Wildner /* automatically set # workers based on # of reported cpus */
1101a28cd43dSSascha Wildner nbWorkers = UTIL_countPhysicalCores();
1102a28cd43dSSascha Wildner DISPLAYLEVEL(3, "Note: %d physical core(s) detected \n", nbWorkers);
1103a28cd43dSSascha Wildner }
1104a28cd43dSSascha Wildner #else
1105a28cd43dSSascha Wildner (void)singleThread; (void)nbWorkers;
1106a28cd43dSSascha Wildner #endif
1107a28cd43dSSascha Wildner
1108a28cd43dSSascha Wildner #ifdef UTIL_HAS_CREATEFILELIST
1109a28cd43dSSascha Wildner g_utilDisplayLevel = g_displayLevel;
1110a28cd43dSSascha Wildner if (!followLinks) {
1111a28cd43dSSascha Wildner unsigned u, fileNamesNb;
1112a28cd43dSSascha Wildner unsigned const nbFilenames = (unsigned)filenames->tableSize;
1113a28cd43dSSascha Wildner for (u=0, fileNamesNb=0; u<nbFilenames; u++) {
1114a28cd43dSSascha Wildner if ( UTIL_isLink(filenames->fileNames[u])
1115a28cd43dSSascha Wildner && !UTIL_isFIFO(filenames->fileNames[u])
1116a28cd43dSSascha Wildner ) {
1117a28cd43dSSascha Wildner DISPLAYLEVEL(2, "Warning : %s is a symbolic link, ignoring \n", filenames->fileNames[u]);
1118a28cd43dSSascha Wildner } else {
1119a28cd43dSSascha Wildner filenames->fileNames[fileNamesNb++] = filenames->fileNames[u];
1120a28cd43dSSascha Wildner } }
1121a28cd43dSSascha Wildner if (fileNamesNb == 0 && nbFilenames > 0) /* all names are eliminated */
1122a28cd43dSSascha Wildner CLEAN_RETURN(1);
1123a28cd43dSSascha Wildner filenames->tableSize = fileNamesNb;
1124a28cd43dSSascha Wildner } /* if (!followLinks) */
1125a28cd43dSSascha Wildner
1126a28cd43dSSascha Wildner /* read names from a file */
1127a28cd43dSSascha Wildner if (file_of_names->tableSize) {
1128a28cd43dSSascha Wildner size_t const nbFileLists = file_of_names->tableSize;
1129a28cd43dSSascha Wildner size_t flNb;
1130a28cd43dSSascha Wildner for (flNb=0; flNb < nbFileLists; flNb++) {
1131a28cd43dSSascha Wildner FileNamesTable* const fnt = UTIL_createFileNamesTable_fromFileName(file_of_names->fileNames[flNb]);
1132a28cd43dSSascha Wildner if (fnt==NULL) {
1133a28cd43dSSascha Wildner DISPLAYLEVEL(1, "zstd: error reading %s \n", file_of_names->fileNames[flNb]);
1134a28cd43dSSascha Wildner CLEAN_RETURN(1);
1135a28cd43dSSascha Wildner }
1136a28cd43dSSascha Wildner filenames = UTIL_mergeFileNamesTable(filenames, fnt);
1137a28cd43dSSascha Wildner }
1138a28cd43dSSascha Wildner }
1139a28cd43dSSascha Wildner
1140a28cd43dSSascha Wildner if (recursive) { /* at this stage, filenameTable is a list of paths, which can contain both files and directories */
1141a28cd43dSSascha Wildner UTIL_expandFNT(&filenames, followLinks);
1142a28cd43dSSascha Wildner }
1143a28cd43dSSascha Wildner #else
1144a28cd43dSSascha Wildner (void)followLinks;
1145a28cd43dSSascha Wildner #endif
1146a28cd43dSSascha Wildner
1147a28cd43dSSascha Wildner if (operation == zom_list) {
1148a28cd43dSSascha Wildner #ifndef ZSTD_NODECOMPRESS
1149a28cd43dSSascha Wildner int const ret = FIO_listMultipleFiles((unsigned)filenames->tableSize, filenames->fileNames, g_displayLevel);
1150a28cd43dSSascha Wildner CLEAN_RETURN(ret);
1151a28cd43dSSascha Wildner #else
1152a28cd43dSSascha Wildner DISPLAY("file information is not supported \n");
1153a28cd43dSSascha Wildner CLEAN_RETURN(1);
1154a28cd43dSSascha Wildner #endif
1155a28cd43dSSascha Wildner }
1156a28cd43dSSascha Wildner
1157a28cd43dSSascha Wildner /* Check if benchmark is selected */
1158a28cd43dSSascha Wildner if (operation==zom_bench) {
1159a28cd43dSSascha Wildner #ifndef ZSTD_NOBENCH
1160a28cd43dSSascha Wildner benchParams.blockSize = blockSize;
1161a28cd43dSSascha Wildner benchParams.nbWorkers = nbWorkers;
1162a28cd43dSSascha Wildner benchParams.realTime = (unsigned)setRealTimePrio;
1163a28cd43dSSascha Wildner benchParams.nbSeconds = bench_nbSeconds;
1164a28cd43dSSascha Wildner benchParams.ldmFlag = ldmFlag;
1165a28cd43dSSascha Wildner benchParams.ldmMinMatch = (int)g_ldmMinMatch;
1166a28cd43dSSascha Wildner benchParams.ldmHashLog = (int)g_ldmHashLog;
1167a28cd43dSSascha Wildner if (g_ldmBucketSizeLog != LDM_PARAM_DEFAULT) {
1168a28cd43dSSascha Wildner benchParams.ldmBucketSizeLog = (int)g_ldmBucketSizeLog;
1169a28cd43dSSascha Wildner }
1170a28cd43dSSascha Wildner if (g_ldmHashRateLog != LDM_PARAM_DEFAULT) {
1171a28cd43dSSascha Wildner benchParams.ldmHashRateLog = (int)g_ldmHashRateLog;
1172a28cd43dSSascha Wildner }
1173a28cd43dSSascha Wildner benchParams.literalCompressionMode = literalCompressionMode;
1174a28cd43dSSascha Wildner
1175a28cd43dSSascha Wildner if (cLevel > ZSTD_maxCLevel()) cLevel = ZSTD_maxCLevel();
1176a28cd43dSSascha Wildner if (cLevelLast > ZSTD_maxCLevel()) cLevelLast = ZSTD_maxCLevel();
1177a28cd43dSSascha Wildner if (cLevelLast < cLevel) cLevelLast = cLevel;
1178a28cd43dSSascha Wildner if (cLevelLast > cLevel)
1179a28cd43dSSascha Wildner DISPLAYLEVEL(3, "Benchmarking levels from %d to %d\n", cLevel, cLevelLast);
1180a28cd43dSSascha Wildner if (filenames->tableSize > 0) {
1181a28cd43dSSascha Wildner if(separateFiles) {
1182a28cd43dSSascha Wildner unsigned i;
1183a28cd43dSSascha Wildner for(i = 0; i < filenames->tableSize; i++) {
1184a28cd43dSSascha Wildner int c;
1185a28cd43dSSascha Wildner DISPLAYLEVEL(3, "Benchmarking %s \n", filenames->fileNames[i]);
1186a28cd43dSSascha Wildner for(c = cLevel; c <= cLevelLast; c++) {
1187a28cd43dSSascha Wildner BMK_benchFilesAdvanced(&filenames->fileNames[i], 1, dictFileName, c, &compressionParams, g_displayLevel, &benchParams);
1188a28cd43dSSascha Wildner } }
1189a28cd43dSSascha Wildner } else {
1190a28cd43dSSascha Wildner for(; cLevel <= cLevelLast; cLevel++) {
1191a28cd43dSSascha Wildner BMK_benchFilesAdvanced(filenames->fileNames, (unsigned)filenames->tableSize, dictFileName, cLevel, &compressionParams, g_displayLevel, &benchParams);
1192a28cd43dSSascha Wildner } }
1193a28cd43dSSascha Wildner } else {
1194a28cd43dSSascha Wildner for(; cLevel <= cLevelLast; cLevel++) {
1195a28cd43dSSascha Wildner BMK_syntheticTest(cLevel, compressibility, &compressionParams, g_displayLevel, &benchParams);
1196a28cd43dSSascha Wildner } }
1197a28cd43dSSascha Wildner
1198a28cd43dSSascha Wildner #else
1199a28cd43dSSascha Wildner (void)bench_nbSeconds; (void)blockSize; (void)setRealTimePrio; (void)separateFiles; (void)compressibility;
1200a28cd43dSSascha Wildner #endif
1201a28cd43dSSascha Wildner goto _end;
1202a28cd43dSSascha Wildner }
1203a28cd43dSSascha Wildner
1204a28cd43dSSascha Wildner /* Check if dictionary builder is selected */
1205a28cd43dSSascha Wildner if (operation==zom_train) {
1206a28cd43dSSascha Wildner #ifndef ZSTD_NODICT
1207a28cd43dSSascha Wildner ZDICT_params_t zParams;
1208a28cd43dSSascha Wildner zParams.compressionLevel = dictCLevel;
1209a28cd43dSSascha Wildner zParams.notificationLevel = (unsigned)g_displayLevel;
1210a28cd43dSSascha Wildner zParams.dictID = dictID;
1211a28cd43dSSascha Wildner if (dict == cover) {
1212a28cd43dSSascha Wildner int const optimize = !coverParams.k || !coverParams.d;
1213a28cd43dSSascha Wildner coverParams.nbThreads = (unsigned)nbWorkers;
1214a28cd43dSSascha Wildner coverParams.zParams = zParams;
1215a28cd43dSSascha Wildner operationResult = DiB_trainFromFiles(outFileName, maxDictSize, filenames->fileNames, (unsigned)filenames->tableSize, blockSize, NULL, &coverParams, NULL, optimize);
1216a28cd43dSSascha Wildner } else if (dict == fastCover) {
1217a28cd43dSSascha Wildner int const optimize = !fastCoverParams.k || !fastCoverParams.d;
1218a28cd43dSSascha Wildner fastCoverParams.nbThreads = (unsigned)nbWorkers;
1219a28cd43dSSascha Wildner fastCoverParams.zParams = zParams;
1220a28cd43dSSascha Wildner operationResult = DiB_trainFromFiles(outFileName, maxDictSize, filenames->fileNames, (unsigned)filenames->tableSize, blockSize, NULL, NULL, &fastCoverParams, optimize);
1221a28cd43dSSascha Wildner } else {
1222a28cd43dSSascha Wildner ZDICT_legacy_params_t dictParams;
1223a28cd43dSSascha Wildner memset(&dictParams, 0, sizeof(dictParams));
1224a28cd43dSSascha Wildner dictParams.selectivityLevel = dictSelect;
1225a28cd43dSSascha Wildner dictParams.zParams = zParams;
1226a28cd43dSSascha Wildner operationResult = DiB_trainFromFiles(outFileName, maxDictSize, filenames->fileNames, (unsigned)filenames->tableSize, blockSize, &dictParams, NULL, NULL, 0);
1227a28cd43dSSascha Wildner }
1228a28cd43dSSascha Wildner #else
1229a28cd43dSSascha Wildner (void)dictCLevel; (void)dictSelect; (void)dictID; (void)maxDictSize; /* not used when ZSTD_NODICT set */
1230a28cd43dSSascha Wildner DISPLAYLEVEL(1, "training mode not available \n");
1231a28cd43dSSascha Wildner operationResult = 1;
1232a28cd43dSSascha Wildner #endif
1233a28cd43dSSascha Wildner goto _end;
1234a28cd43dSSascha Wildner }
1235a28cd43dSSascha Wildner
1236a28cd43dSSascha Wildner #ifndef ZSTD_NODECOMPRESS
1237a28cd43dSSascha Wildner if (operation==zom_test) { FIO_setTestMode(prefs, 1); outFileName=nulmark; FIO_setRemoveSrcFile(prefs, 0); } /* test mode */
1238a28cd43dSSascha Wildner #endif
1239a28cd43dSSascha Wildner
1240a28cd43dSSascha Wildner /* No input filename ==> use stdin and stdout */
1241a28cd43dSSascha Wildner if (filenames->tableSize == 0) UTIL_refFilename(filenames, stdinmark);
1242a28cd43dSSascha Wildner if (!strcmp(filenames->fileNames[0], stdinmark) && !outFileName)
1243a28cd43dSSascha Wildner outFileName = stdoutmark; /* when input is stdin, default output is stdout */
1244a28cd43dSSascha Wildner
1245a28cd43dSSascha Wildner /* Check if input/output defined as console; trigger an error in this case */
1246a28cd43dSSascha Wildner if (!strcmp(filenames->fileNames[0], stdinmark) && IS_CONSOLE(stdin) ) {
1247a28cd43dSSascha Wildner DISPLAYLEVEL(1, "stdin is a console, aborting\n");
1248a28cd43dSSascha Wildner CLEAN_RETURN(1);
1249a28cd43dSSascha Wildner }
1250a28cd43dSSascha Wildner if ( outFileName && !strcmp(outFileName, stdoutmark)
1251a28cd43dSSascha Wildner && IS_CONSOLE(stdout)
1252a28cd43dSSascha Wildner && !strcmp(filenames->fileNames[0], stdinmark)
1253a28cd43dSSascha Wildner && !forceStdout
1254a28cd43dSSascha Wildner && operation!=zom_decompress ) {
1255a28cd43dSSascha Wildner DISPLAYLEVEL(1, "stdout is a console, aborting\n");
1256a28cd43dSSascha Wildner CLEAN_RETURN(1);
1257a28cd43dSSascha Wildner }
1258a28cd43dSSascha Wildner
1259a28cd43dSSascha Wildner #ifndef ZSTD_NOCOMPRESS
1260a28cd43dSSascha Wildner /* check compression level limits */
1261a28cd43dSSascha Wildner { int const maxCLevel = ultra ? ZSTD_maxCLevel() : ZSTDCLI_CLEVEL_MAX;
1262a28cd43dSSascha Wildner if (cLevel > maxCLevel) {
1263a28cd43dSSascha Wildner DISPLAYLEVEL(2, "Warning : compression level higher than max, reduced to %i \n", maxCLevel);
1264a28cd43dSSascha Wildner cLevel = maxCLevel;
1265a28cd43dSSascha Wildner } }
1266a28cd43dSSascha Wildner #endif
1267a28cd43dSSascha Wildner
1268a28cd43dSSascha Wildner if (showDefaultCParams) {
1269a28cd43dSSascha Wildner if (operation == zom_decompress) {
1270a28cd43dSSascha Wildner DISPLAY("error : can't use --show-default-cparams in decomrpession mode \n");
1271a28cd43dSSascha Wildner CLEAN_RETURN(1);
1272a28cd43dSSascha Wildner }
1273a28cd43dSSascha Wildner }
1274a28cd43dSSascha Wildner
1275a28cd43dSSascha Wildner if (dictFileName != NULL && patchFromDictFileName != NULL) {
1276a28cd43dSSascha Wildner DISPLAY("error : can't use -D and --patch-from=# at the same time \n");
1277a28cd43dSSascha Wildner CLEAN_RETURN(1);
1278a28cd43dSSascha Wildner }
1279a28cd43dSSascha Wildner
1280a28cd43dSSascha Wildner if (patchFromDictFileName != NULL && filenames->tableSize > 1) {
1281a28cd43dSSascha Wildner DISPLAY("error : can't use --patch-from=# on multiple files \n");
1282a28cd43dSSascha Wildner CLEAN_RETURN(1);
1283a28cd43dSSascha Wildner }
1284a28cd43dSSascha Wildner
1285a28cd43dSSascha Wildner /* No status message in pipe mode (stdin - stdout) */
1286a28cd43dSSascha Wildner hasStdout = outFileName && !strcmp(outFileName,stdoutmark);
1287a28cd43dSSascha Wildner
1288a28cd43dSSascha Wildner if (hasStdout && (g_displayLevel==2)) g_displayLevel=1;
1289a28cd43dSSascha Wildner
1290a28cd43dSSascha Wildner /* IO Stream/File */
1291a28cd43dSSascha Wildner FIO_setHasStdoutOutput(fCtx, hasStdout);
1292a28cd43dSSascha Wildner FIO_setNbFilesTotal(fCtx, (int)filenames->tableSize);
1293a28cd43dSSascha Wildner FIO_determineHasStdinInput(fCtx, filenames);
1294a28cd43dSSascha Wildner FIO_setNotificationLevel(g_displayLevel);
1295a28cd43dSSascha Wildner FIO_setPatchFromMode(prefs, patchFromDictFileName != NULL);
1296a28cd43dSSascha Wildner if (memLimit == 0) {
1297a28cd43dSSascha Wildner if (compressionParams.windowLog == 0) {
1298a28cd43dSSascha Wildner memLimit = (U32)1 << g_defaultMaxWindowLog;
1299a28cd43dSSascha Wildner } else {
1300a28cd43dSSascha Wildner memLimit = (U32)1 << (compressionParams.windowLog & 31);
1301a28cd43dSSascha Wildner } }
1302a28cd43dSSascha Wildner if (patchFromDictFileName != NULL)
1303a28cd43dSSascha Wildner dictFileName = patchFromDictFileName;
1304a28cd43dSSascha Wildner FIO_setMemLimit(prefs, memLimit);
1305a28cd43dSSascha Wildner if (operation==zom_compress) {
1306a28cd43dSSascha Wildner #ifndef ZSTD_NOCOMPRESS
1307a28cd43dSSascha Wildner FIO_setContentSize(prefs, contentSize);
1308a28cd43dSSascha Wildner FIO_setNbWorkers(prefs, nbWorkers);
1309a28cd43dSSascha Wildner FIO_setBlockSize(prefs, (int)blockSize);
1310a28cd43dSSascha Wildner if (g_overlapLog!=OVERLAP_LOG_DEFAULT) FIO_setOverlapLog(prefs, (int)g_overlapLog);
1311a28cd43dSSascha Wildner FIO_setLdmFlag(prefs, (unsigned)ldmFlag);
1312a28cd43dSSascha Wildner FIO_setLdmHashLog(prefs, (int)g_ldmHashLog);
1313a28cd43dSSascha Wildner FIO_setLdmMinMatch(prefs, (int)g_ldmMinMatch);
1314a28cd43dSSascha Wildner if (g_ldmBucketSizeLog != LDM_PARAM_DEFAULT) FIO_setLdmBucketSizeLog(prefs, (int)g_ldmBucketSizeLog);
1315a28cd43dSSascha Wildner if (g_ldmHashRateLog != LDM_PARAM_DEFAULT) FIO_setLdmHashRateLog(prefs, (int)g_ldmHashRateLog);
1316a28cd43dSSascha Wildner FIO_setAdaptiveMode(prefs, (unsigned)adapt);
1317a28cd43dSSascha Wildner FIO_setAdaptMin(prefs, adaptMin);
1318a28cd43dSSascha Wildner FIO_setAdaptMax(prefs, adaptMax);
1319a28cd43dSSascha Wildner FIO_setRsyncable(prefs, rsyncable);
1320a28cd43dSSascha Wildner FIO_setStreamSrcSize(prefs, streamSrcSize);
1321a28cd43dSSascha Wildner FIO_setTargetCBlockSize(prefs, targetCBlockSize);
1322a28cd43dSSascha Wildner FIO_setSrcSizeHint(prefs, srcSizeHint);
1323a28cd43dSSascha Wildner FIO_setLiteralCompressionMode(prefs, literalCompressionMode);
1324a28cd43dSSascha Wildner if (adaptMin > cLevel) cLevel = adaptMin;
1325a28cd43dSSascha Wildner if (adaptMax < cLevel) cLevel = adaptMax;
1326a28cd43dSSascha Wildner
1327a28cd43dSSascha Wildner /* Compare strategies constant with the ground truth */
1328a28cd43dSSascha Wildner { ZSTD_bounds strategyBounds = ZSTD_cParam_getBounds(ZSTD_c_strategy);
1329a28cd43dSSascha Wildner assert(ZSTD_NB_STRATEGIES == strategyBounds.upperBound);
1330a28cd43dSSascha Wildner (void)strategyBounds; }
1331a28cd43dSSascha Wildner
1332a28cd43dSSascha Wildner if (showDefaultCParams) {
1333a28cd43dSSascha Wildner size_t fileNb;
1334a28cd43dSSascha Wildner for (fileNb = 0; fileNb < (size_t)filenames->tableSize; fileNb++) {
1335a28cd43dSSascha Wildner unsigned long long fileSize = UTIL_getFileSize(filenames->fileNames[fileNb]);
1336a28cd43dSSascha Wildner const size_t dictSize = dictFileName != NULL ? (size_t)UTIL_getFileSize(dictFileName) : 0;
1337a28cd43dSSascha Wildner const ZSTD_compressionParameters cParams = ZSTD_getCParams(cLevel, fileSize, dictSize);
1338a28cd43dSSascha Wildner if (fileSize != UTIL_FILESIZE_UNKNOWN) DISPLAY("%s (%u bytes)\n", filenames->fileNames[fileNb], (unsigned)fileSize);
1339a28cd43dSSascha Wildner else DISPLAY("%s (src size unknown)\n", filenames->fileNames[fileNb]);
1340a28cd43dSSascha Wildner DISPLAY(" - windowLog : %u\n", cParams.windowLog);
1341a28cd43dSSascha Wildner DISPLAY(" - chainLog : %u\n", cParams.chainLog);
1342a28cd43dSSascha Wildner DISPLAY(" - hashLog : %u\n", cParams.hashLog);
1343a28cd43dSSascha Wildner DISPLAY(" - searchLog : %u\n", cParams.searchLog);
1344a28cd43dSSascha Wildner DISPLAY(" - minMatch : %u\n", cParams.minMatch);
1345a28cd43dSSascha Wildner DISPLAY(" - targetLength : %u\n", cParams.targetLength);
1346a28cd43dSSascha Wildner assert(cParams.strategy < ZSTD_NB_STRATEGIES + 1);
1347a28cd43dSSascha Wildner DISPLAY(" - strategy : %s (%u)\n", ZSTD_strategyMap[(int)cParams.strategy], (unsigned)cParams.strategy);
1348a28cd43dSSascha Wildner }
1349a28cd43dSSascha Wildner }
1350a28cd43dSSascha Wildner
1351a28cd43dSSascha Wildner if ((filenames->tableSize==1) && outFileName)
1352a28cd43dSSascha Wildner operationResult = FIO_compressFilename(fCtx, prefs, outFileName, filenames->fileNames[0], dictFileName, cLevel, compressionParams);
1353a28cd43dSSascha Wildner else
1354a28cd43dSSascha Wildner operationResult = FIO_compressMultipleFilenames(fCtx, prefs, filenames->fileNames, outMirroredDirName, outDirName, outFileName, suffix, dictFileName, cLevel, compressionParams);
1355a28cd43dSSascha Wildner #else
1356a28cd43dSSascha Wildner (void)contentSize; (void)suffix; (void)adapt; (void)rsyncable; (void)ultra; (void)cLevel; (void)ldmFlag; (void)literalCompressionMode; (void)targetCBlockSize; (void)streamSrcSize; (void)srcSizeHint; (void)ZSTD_strategyMap; /* not used when ZSTD_NOCOMPRESS set */
1357a28cd43dSSascha Wildner DISPLAY("Compression not supported \n");
1358a28cd43dSSascha Wildner #endif
1359a28cd43dSSascha Wildner } else { /* decompression or test */
1360a28cd43dSSascha Wildner #ifndef ZSTD_NODECOMPRESS
1361a28cd43dSSascha Wildner if (filenames->tableSize == 1 && outFileName) {
1362a28cd43dSSascha Wildner operationResult = FIO_decompressFilename(fCtx, prefs, outFileName, filenames->fileNames[0], dictFileName);
1363a28cd43dSSascha Wildner } else {
1364a28cd43dSSascha Wildner operationResult = FIO_decompressMultipleFilenames(fCtx, prefs, filenames->fileNames, outMirroredDirName, outDirName, outFileName, dictFileName);
1365a28cd43dSSascha Wildner }
1366a28cd43dSSascha Wildner #else
1367a28cd43dSSascha Wildner DISPLAY("Decompression not supported \n");
1368a28cd43dSSascha Wildner #endif
1369a28cd43dSSascha Wildner }
1370a28cd43dSSascha Wildner
1371a28cd43dSSascha Wildner _end:
1372a28cd43dSSascha Wildner FIO_freePreferences(prefs);
1373a28cd43dSSascha Wildner FIO_freeContext(fCtx);
1374a28cd43dSSascha Wildner if (main_pause) waitEnter();
1375a28cd43dSSascha Wildner UTIL_freeFileNamesTable(filenames);
1376a28cd43dSSascha Wildner UTIL_freeFileNamesTable(file_of_names);
1377a28cd43dSSascha Wildner
1378a28cd43dSSascha Wildner return operationResult;
1379a28cd43dSSascha Wildner }
1380