1*3117ece4Schristos /* 2*3117ece4Schristos * Copyright (c) Meta Platforms, Inc. and affiliates. 3*3117ece4Schristos * All rights reserved. 4*3117ece4Schristos * 5*3117ece4Schristos * This source code is licensed under both the BSD-style license (found in the 6*3117ece4Schristos * LICENSE file in the root directory of this source tree) and the GPLv2 (found 7*3117ece4Schristos * in the COPYING file in the root directory of this source tree). 8*3117ece4Schristos * You may select, at your option, one of the above-listed licenses. 9*3117ece4Schristos */ 10*3117ece4Schristos 11*3117ece4Schristos 12*3117ece4Schristos /* ************************************* 13*3117ece4Schristos * Compiler Options 14*3117ece4Schristos ***************************************/ 15*3117ece4Schristos #ifdef _MSC_VER /* Visual */ 16*3117ece4Schristos # pragma warning(disable : 4127) /* disable: C4127: conditional expression is constant */ 17*3117ece4Schristos # pragma warning(disable : 4204) /* non-constant aggregate initializer */ 18*3117ece4Schristos #endif 19*3117ece4Schristos #if defined(__MINGW32__) && !defined(_POSIX_SOURCE) 20*3117ece4Schristos # define _POSIX_SOURCE 1 /* disable %llu warnings with MinGW on Windows */ 21*3117ece4Schristos #endif 22*3117ece4Schristos 23*3117ece4Schristos /*-************************************* 24*3117ece4Schristos * Includes 25*3117ece4Schristos ***************************************/ 26*3117ece4Schristos #include "platform.h" /* Large Files support, SET_BINARY_MODE */ 27*3117ece4Schristos #include "util.h" /* UTIL_getFileSize, UTIL_isRegularFile, UTIL_isSameFile */ 28*3117ece4Schristos #include <stdio.h> /* fprintf, open, fdopen, fread, _fileno, stdin, stdout */ 29*3117ece4Schristos #include <stdlib.h> /* malloc, free */ 30*3117ece4Schristos #include <string.h> /* strcmp, strlen */ 31*3117ece4Schristos #include <time.h> /* clock_t, to measure process time */ 32*3117ece4Schristos #include <fcntl.h> /* O_WRONLY */ 33*3117ece4Schristos #include <assert.h> 34*3117ece4Schristos #include <errno.h> /* errno */ 35*3117ece4Schristos #include <limits.h> /* INT_MAX */ 36*3117ece4Schristos #include <signal.h> 37*3117ece4Schristos #include "timefn.h" /* UTIL_getTime, UTIL_clockSpanMicro */ 38*3117ece4Schristos 39*3117ece4Schristos #if defined (_MSC_VER) 40*3117ece4Schristos # include <sys/stat.h> 41*3117ece4Schristos # include <io.h> 42*3117ece4Schristos #endif 43*3117ece4Schristos 44*3117ece4Schristos #include "fileio.h" 45*3117ece4Schristos #include "fileio_asyncio.h" 46*3117ece4Schristos #include "fileio_common.h" 47*3117ece4Schristos 48*3117ece4Schristos FIO_display_prefs_t g_display_prefs = {2, FIO_ps_auto}; 49*3117ece4Schristos UTIL_time_t g_displayClock = UTIL_TIME_INITIALIZER; 50*3117ece4Schristos 51*3117ece4Schristos #define ZSTD_STATIC_LINKING_ONLY /* ZSTD_magicNumber, ZSTD_frameHeaderSize_max */ 52*3117ece4Schristos #include "../lib/zstd.h" 53*3117ece4Schristos #include "../lib/zstd_errors.h" /* ZSTD_error_frameParameter_windowTooLarge */ 54*3117ece4Schristos 55*3117ece4Schristos #if defined(ZSTD_GZCOMPRESS) || defined(ZSTD_GZDECOMPRESS) 56*3117ece4Schristos # include <zlib.h> 57*3117ece4Schristos # if !defined(z_const) 58*3117ece4Schristos # define z_const 59*3117ece4Schristos # endif 60*3117ece4Schristos #endif 61*3117ece4Schristos 62*3117ece4Schristos #if defined(ZSTD_LZMACOMPRESS) || defined(ZSTD_LZMADECOMPRESS) 63*3117ece4Schristos # include <lzma.h> 64*3117ece4Schristos #endif 65*3117ece4Schristos 66*3117ece4Schristos #define LZ4_MAGICNUMBER 0x184D2204 67*3117ece4Schristos #if defined(ZSTD_LZ4COMPRESS) || defined(ZSTD_LZ4DECOMPRESS) 68*3117ece4Schristos # define LZ4F_ENABLE_OBSOLETE_ENUMS 69*3117ece4Schristos # include <lz4frame.h> 70*3117ece4Schristos # include <lz4.h> 71*3117ece4Schristos #endif 72*3117ece4Schristos 73*3117ece4Schristos char const* FIO_zlibVersion(void) 74*3117ece4Schristos { 75*3117ece4Schristos #if defined(ZSTD_GZCOMPRESS) || defined(ZSTD_GZDECOMPRESS) 76*3117ece4Schristos return zlibVersion(); 77*3117ece4Schristos #else 78*3117ece4Schristos return "Unsupported"; 79*3117ece4Schristos #endif 80*3117ece4Schristos } 81*3117ece4Schristos 82*3117ece4Schristos char const* FIO_lz4Version(void) 83*3117ece4Schristos { 84*3117ece4Schristos #if defined(ZSTD_LZ4COMPRESS) || defined(ZSTD_LZ4DECOMPRESS) 85*3117ece4Schristos /* LZ4_versionString() added in v1.7.3 */ 86*3117ece4Schristos # if LZ4_VERSION_NUMBER >= 10703 87*3117ece4Schristos return LZ4_versionString(); 88*3117ece4Schristos # else 89*3117ece4Schristos # define ZSTD_LZ4_VERSION LZ4_VERSION_MAJOR.LZ4_VERSION_MINOR.LZ4_VERSION_RELEASE 90*3117ece4Schristos # define ZSTD_LZ4_VERSION_STRING ZSTD_EXPAND_AND_QUOTE(ZSTD_LZ4_VERSION) 91*3117ece4Schristos return ZSTD_LZ4_VERSION_STRING; 92*3117ece4Schristos # endif 93*3117ece4Schristos #else 94*3117ece4Schristos return "Unsupported"; 95*3117ece4Schristos #endif 96*3117ece4Schristos } 97*3117ece4Schristos 98*3117ece4Schristos char const* FIO_lzmaVersion(void) 99*3117ece4Schristos { 100*3117ece4Schristos #if defined(ZSTD_LZMACOMPRESS) || defined(ZSTD_LZMADECOMPRESS) 101*3117ece4Schristos return lzma_version_string(); 102*3117ece4Schristos #else 103*3117ece4Schristos return "Unsupported"; 104*3117ece4Schristos #endif 105*3117ece4Schristos } 106*3117ece4Schristos 107*3117ece4Schristos 108*3117ece4Schristos /*-************************************* 109*3117ece4Schristos * Constants 110*3117ece4Schristos ***************************************/ 111*3117ece4Schristos #define ADAPT_WINDOWLOG_DEFAULT 23 /* 8 MB */ 112*3117ece4Schristos #define DICTSIZE_MAX (32 MB) /* protection against large input (attack scenario) */ 113*3117ece4Schristos 114*3117ece4Schristos #define FNSPACE 30 115*3117ece4Schristos 116*3117ece4Schristos /* Default file permissions 0666 (modulated by umask) */ 117*3117ece4Schristos /* Temporary restricted file permissions are used when we're going to 118*3117ece4Schristos * chmod/chown at the end of the operation. */ 119*3117ece4Schristos #if !defined(_WIN32) 120*3117ece4Schristos /* These macros aren't defined on windows. */ 121*3117ece4Schristos #define DEFAULT_FILE_PERMISSIONS (S_IRUSR|S_IWUSR|S_IRGRP|S_IWGRP|S_IROTH|S_IWOTH) 122*3117ece4Schristos #define TEMPORARY_FILE_PERMISSIONS (S_IRUSR|S_IWUSR) 123*3117ece4Schristos #else 124*3117ece4Schristos #define DEFAULT_FILE_PERMISSIONS (0666) 125*3117ece4Schristos #define TEMPORARY_FILE_PERMISSIONS (0600) 126*3117ece4Schristos #endif 127*3117ece4Schristos 128*3117ece4Schristos /*-************************************ 129*3117ece4Schristos * Signal (Ctrl-C trapping) 130*3117ece4Schristos **************************************/ 131*3117ece4Schristos static const char* g_artefact = NULL; 132*3117ece4Schristos static void INThandler(int sig) 133*3117ece4Schristos { 134*3117ece4Schristos assert(sig==SIGINT); (void)sig; 135*3117ece4Schristos #if !defined(_MSC_VER) 136*3117ece4Schristos signal(sig, SIG_IGN); /* this invocation generates a buggy warning in Visual Studio */ 137*3117ece4Schristos #endif 138*3117ece4Schristos if (g_artefact) { 139*3117ece4Schristos assert(UTIL_isRegularFile(g_artefact)); 140*3117ece4Schristos remove(g_artefact); 141*3117ece4Schristos } 142*3117ece4Schristos DISPLAY("\n"); 143*3117ece4Schristos exit(2); 144*3117ece4Schristos } 145*3117ece4Schristos static void addHandler(char const* dstFileName) 146*3117ece4Schristos { 147*3117ece4Schristos if (UTIL_isRegularFile(dstFileName)) { 148*3117ece4Schristos g_artefact = dstFileName; 149*3117ece4Schristos signal(SIGINT, INThandler); 150*3117ece4Schristos } else { 151*3117ece4Schristos g_artefact = NULL; 152*3117ece4Schristos } 153*3117ece4Schristos } 154*3117ece4Schristos /* Idempotent */ 155*3117ece4Schristos static void clearHandler(void) 156*3117ece4Schristos { 157*3117ece4Schristos if (g_artefact) signal(SIGINT, SIG_DFL); 158*3117ece4Schristos g_artefact = NULL; 159*3117ece4Schristos } 160*3117ece4Schristos 161*3117ece4Schristos 162*3117ece4Schristos /*-********************************************************* 163*3117ece4Schristos * Termination signal trapping (Print debug stack trace) 164*3117ece4Schristos ***********************************************************/ 165*3117ece4Schristos #if defined(__has_feature) && !defined(BACKTRACE_ENABLE) /* Clang compiler */ 166*3117ece4Schristos # if (__has_feature(address_sanitizer)) 167*3117ece4Schristos # define BACKTRACE_ENABLE 0 168*3117ece4Schristos # endif /* __has_feature(address_sanitizer) */ 169*3117ece4Schristos #elif defined(__SANITIZE_ADDRESS__) && !defined(BACKTRACE_ENABLE) /* GCC compiler */ 170*3117ece4Schristos # define BACKTRACE_ENABLE 0 171*3117ece4Schristos #endif 172*3117ece4Schristos 173*3117ece4Schristos #if !defined(BACKTRACE_ENABLE) 174*3117ece4Schristos /* automatic detector : backtrace enabled by default on linux+glibc and osx */ 175*3117ece4Schristos # if (defined(__linux__) && (defined(__GLIBC__) && !defined(__UCLIBC__))) \ 176*3117ece4Schristos || (defined(__APPLE__) && defined(__MACH__)) 177*3117ece4Schristos # define BACKTRACE_ENABLE 1 178*3117ece4Schristos # else 179*3117ece4Schristos # define BACKTRACE_ENABLE 0 180*3117ece4Schristos # endif 181*3117ece4Schristos #endif 182*3117ece4Schristos 183*3117ece4Schristos /* note : after this point, BACKTRACE_ENABLE is necessarily defined */ 184*3117ece4Schristos 185*3117ece4Schristos 186*3117ece4Schristos #if BACKTRACE_ENABLE 187*3117ece4Schristos 188*3117ece4Schristos #include <execinfo.h> /* backtrace, backtrace_symbols */ 189*3117ece4Schristos 190*3117ece4Schristos #define MAX_STACK_FRAMES 50 191*3117ece4Schristos 192*3117ece4Schristos static void ABRThandler(int sig) { 193*3117ece4Schristos const char* name; 194*3117ece4Schristos void* addrlist[MAX_STACK_FRAMES]; 195*3117ece4Schristos char** symbollist; 196*3117ece4Schristos int addrlen, i; 197*3117ece4Schristos 198*3117ece4Schristos switch (sig) { 199*3117ece4Schristos case SIGABRT: name = "SIGABRT"; break; 200*3117ece4Schristos case SIGFPE: name = "SIGFPE"; break; 201*3117ece4Schristos case SIGILL: name = "SIGILL"; break; 202*3117ece4Schristos case SIGINT: name = "SIGINT"; break; 203*3117ece4Schristos case SIGSEGV: name = "SIGSEGV"; break; 204*3117ece4Schristos default: name = "UNKNOWN"; 205*3117ece4Schristos } 206*3117ece4Schristos 207*3117ece4Schristos DISPLAY("Caught %s signal, printing stack:\n", name); 208*3117ece4Schristos /* Retrieve current stack addresses. */ 209*3117ece4Schristos addrlen = backtrace(addrlist, MAX_STACK_FRAMES); 210*3117ece4Schristos if (addrlen == 0) { 211*3117ece4Schristos DISPLAY("\n"); 212*3117ece4Schristos return; 213*3117ece4Schristos } 214*3117ece4Schristos /* Create readable strings to each frame. */ 215*3117ece4Schristos symbollist = backtrace_symbols(addrlist, addrlen); 216*3117ece4Schristos /* Print the stack trace, excluding calls handling the signal. */ 217*3117ece4Schristos for (i = ZSTD_START_SYMBOLLIST_FRAME; i < addrlen; i++) { 218*3117ece4Schristos DISPLAY("%s\n", symbollist[i]); 219*3117ece4Schristos } 220*3117ece4Schristos free(symbollist); 221*3117ece4Schristos /* Reset and raise the signal so default handler runs. */ 222*3117ece4Schristos signal(sig, SIG_DFL); 223*3117ece4Schristos raise(sig); 224*3117ece4Schristos } 225*3117ece4Schristos #endif 226*3117ece4Schristos 227*3117ece4Schristos void FIO_addAbortHandler(void) 228*3117ece4Schristos { 229*3117ece4Schristos #if BACKTRACE_ENABLE 230*3117ece4Schristos signal(SIGABRT, ABRThandler); 231*3117ece4Schristos signal(SIGFPE, ABRThandler); 232*3117ece4Schristos signal(SIGILL, ABRThandler); 233*3117ece4Schristos signal(SIGSEGV, ABRThandler); 234*3117ece4Schristos signal(SIGBUS, ABRThandler); 235*3117ece4Schristos #endif 236*3117ece4Schristos } 237*3117ece4Schristos 238*3117ece4Schristos /*-************************************* 239*3117ece4Schristos * Parameters: FIO_ctx_t 240*3117ece4Schristos ***************************************/ 241*3117ece4Schristos 242*3117ece4Schristos /* typedef'd to FIO_ctx_t within fileio.h */ 243*3117ece4Schristos struct FIO_ctx_s { 244*3117ece4Schristos 245*3117ece4Schristos /* file i/o info */ 246*3117ece4Schristos int nbFilesTotal; 247*3117ece4Schristos int hasStdinInput; 248*3117ece4Schristos int hasStdoutOutput; 249*3117ece4Schristos 250*3117ece4Schristos /* file i/o state */ 251*3117ece4Schristos int currFileIdx; 252*3117ece4Schristos int nbFilesProcessed; 253*3117ece4Schristos size_t totalBytesInput; 254*3117ece4Schristos size_t totalBytesOutput; 255*3117ece4Schristos }; 256*3117ece4Schristos 257*3117ece4Schristos static int FIO_shouldDisplayFileSummary(FIO_ctx_t const* fCtx) 258*3117ece4Schristos { 259*3117ece4Schristos return fCtx->nbFilesTotal <= 1 || g_display_prefs.displayLevel >= 3; 260*3117ece4Schristos } 261*3117ece4Schristos 262*3117ece4Schristos static int FIO_shouldDisplayMultipleFileSummary(FIO_ctx_t const* fCtx) 263*3117ece4Schristos { 264*3117ece4Schristos int const shouldDisplay = (fCtx->nbFilesProcessed >= 1 && fCtx->nbFilesTotal > 1); 265*3117ece4Schristos assert(shouldDisplay || FIO_shouldDisplayFileSummary(fCtx) || fCtx->nbFilesProcessed == 0); 266*3117ece4Schristos return shouldDisplay; 267*3117ece4Schristos } 268*3117ece4Schristos 269*3117ece4Schristos 270*3117ece4Schristos /*-************************************* 271*3117ece4Schristos * Parameters: Initialization 272*3117ece4Schristos ***************************************/ 273*3117ece4Schristos 274*3117ece4Schristos #define FIO_OVERLAP_LOG_NOTSET 9999 275*3117ece4Schristos #define FIO_LDM_PARAM_NOTSET 9999 276*3117ece4Schristos 277*3117ece4Schristos 278*3117ece4Schristos FIO_prefs_t* FIO_createPreferences(void) 279*3117ece4Schristos { 280*3117ece4Schristos FIO_prefs_t* const ret = (FIO_prefs_t*)malloc(sizeof(FIO_prefs_t)); 281*3117ece4Schristos if (!ret) EXM_THROW(21, "Allocation error : not enough memory"); 282*3117ece4Schristos 283*3117ece4Schristos ret->compressionType = FIO_zstdCompression; 284*3117ece4Schristos ret->overwrite = 0; 285*3117ece4Schristos ret->sparseFileSupport = ZSTD_SPARSE_DEFAULT; 286*3117ece4Schristos ret->dictIDFlag = 1; 287*3117ece4Schristos ret->checksumFlag = 1; 288*3117ece4Schristos ret->removeSrcFile = 0; 289*3117ece4Schristos ret->memLimit = 0; 290*3117ece4Schristos ret->nbWorkers = 1; 291*3117ece4Schristos ret->blockSize = 0; 292*3117ece4Schristos ret->overlapLog = FIO_OVERLAP_LOG_NOTSET; 293*3117ece4Schristos ret->adaptiveMode = 0; 294*3117ece4Schristos ret->rsyncable = 0; 295*3117ece4Schristos ret->minAdaptLevel = -50; /* initializing this value requires a constant, so ZSTD_minCLevel() doesn't work */ 296*3117ece4Schristos ret->maxAdaptLevel = 22; /* initializing this value requires a constant, so ZSTD_maxCLevel() doesn't work */ 297*3117ece4Schristos ret->ldmFlag = 0; 298*3117ece4Schristos ret->ldmHashLog = 0; 299*3117ece4Schristos ret->ldmMinMatch = 0; 300*3117ece4Schristos ret->ldmBucketSizeLog = FIO_LDM_PARAM_NOTSET; 301*3117ece4Schristos ret->ldmHashRateLog = FIO_LDM_PARAM_NOTSET; 302*3117ece4Schristos ret->streamSrcSize = 0; 303*3117ece4Schristos ret->targetCBlockSize = 0; 304*3117ece4Schristos ret->srcSizeHint = 0; 305*3117ece4Schristos ret->testMode = 0; 306*3117ece4Schristos ret->literalCompressionMode = ZSTD_ps_auto; 307*3117ece4Schristos ret->excludeCompressedFiles = 0; 308*3117ece4Schristos ret->allowBlockDevices = 0; 309*3117ece4Schristos ret->asyncIO = AIO_supported(); 310*3117ece4Schristos ret->passThrough = -1; 311*3117ece4Schristos return ret; 312*3117ece4Schristos } 313*3117ece4Schristos 314*3117ece4Schristos FIO_ctx_t* FIO_createContext(void) 315*3117ece4Schristos { 316*3117ece4Schristos FIO_ctx_t* const ret = (FIO_ctx_t*)malloc(sizeof(FIO_ctx_t)); 317*3117ece4Schristos if (!ret) EXM_THROW(21, "Allocation error : not enough memory"); 318*3117ece4Schristos 319*3117ece4Schristos ret->currFileIdx = 0; 320*3117ece4Schristos ret->hasStdinInput = 0; 321*3117ece4Schristos ret->hasStdoutOutput = 0; 322*3117ece4Schristos ret->nbFilesTotal = 1; 323*3117ece4Schristos ret->nbFilesProcessed = 0; 324*3117ece4Schristos ret->totalBytesInput = 0; 325*3117ece4Schristos ret->totalBytesOutput = 0; 326*3117ece4Schristos return ret; 327*3117ece4Schristos } 328*3117ece4Schristos 329*3117ece4Schristos void FIO_freePreferences(FIO_prefs_t* const prefs) 330*3117ece4Schristos { 331*3117ece4Schristos free(prefs); 332*3117ece4Schristos } 333*3117ece4Schristos 334*3117ece4Schristos void FIO_freeContext(FIO_ctx_t* const fCtx) 335*3117ece4Schristos { 336*3117ece4Schristos free(fCtx); 337*3117ece4Schristos } 338*3117ece4Schristos 339*3117ece4Schristos 340*3117ece4Schristos /*-************************************* 341*3117ece4Schristos * Parameters: Display Options 342*3117ece4Schristos ***************************************/ 343*3117ece4Schristos 344*3117ece4Schristos void FIO_setNotificationLevel(int level) { g_display_prefs.displayLevel=level; } 345*3117ece4Schristos 346*3117ece4Schristos void FIO_setProgressSetting(FIO_progressSetting_e setting) { g_display_prefs.progressSetting = setting; } 347*3117ece4Schristos 348*3117ece4Schristos 349*3117ece4Schristos /*-************************************* 350*3117ece4Schristos * Parameters: Setters 351*3117ece4Schristos ***************************************/ 352*3117ece4Schristos 353*3117ece4Schristos /* FIO_prefs_t functions */ 354*3117ece4Schristos 355*3117ece4Schristos void FIO_setCompressionType(FIO_prefs_t* const prefs, FIO_compressionType_t compressionType) { prefs->compressionType = compressionType; } 356*3117ece4Schristos 357*3117ece4Schristos void FIO_overwriteMode(FIO_prefs_t* const prefs) { prefs->overwrite = 1; } 358*3117ece4Schristos 359*3117ece4Schristos void FIO_setSparseWrite(FIO_prefs_t* const prefs, int sparse) { prefs->sparseFileSupport = sparse; } 360*3117ece4Schristos 361*3117ece4Schristos void FIO_setDictIDFlag(FIO_prefs_t* const prefs, int dictIDFlag) { prefs->dictIDFlag = dictIDFlag; } 362*3117ece4Schristos 363*3117ece4Schristos void FIO_setChecksumFlag(FIO_prefs_t* const prefs, int checksumFlag) { prefs->checksumFlag = checksumFlag; } 364*3117ece4Schristos 365*3117ece4Schristos void FIO_setRemoveSrcFile(FIO_prefs_t* const prefs, int flag) { prefs->removeSrcFile = (flag!=0); } 366*3117ece4Schristos 367*3117ece4Schristos void FIO_setMemLimit(FIO_prefs_t* const prefs, unsigned memLimit) { prefs->memLimit = memLimit; } 368*3117ece4Schristos 369*3117ece4Schristos void FIO_setNbWorkers(FIO_prefs_t* const prefs, int nbWorkers) { 370*3117ece4Schristos #ifndef ZSTD_MULTITHREAD 371*3117ece4Schristos if (nbWorkers > 0) DISPLAYLEVEL(2, "Note : multi-threading is disabled \n"); 372*3117ece4Schristos #endif 373*3117ece4Schristos prefs->nbWorkers = nbWorkers; 374*3117ece4Schristos } 375*3117ece4Schristos 376*3117ece4Schristos void FIO_setExcludeCompressedFile(FIO_prefs_t* const prefs, int excludeCompressedFiles) { prefs->excludeCompressedFiles = excludeCompressedFiles; } 377*3117ece4Schristos 378*3117ece4Schristos void FIO_setAllowBlockDevices(FIO_prefs_t* const prefs, int allowBlockDevices) { prefs->allowBlockDevices = allowBlockDevices; } 379*3117ece4Schristos 380*3117ece4Schristos void FIO_setBlockSize(FIO_prefs_t* const prefs, int blockSize) { 381*3117ece4Schristos if (blockSize && prefs->nbWorkers==0) 382*3117ece4Schristos DISPLAYLEVEL(2, "Setting block size is useless in single-thread mode \n"); 383*3117ece4Schristos prefs->blockSize = blockSize; 384*3117ece4Schristos } 385*3117ece4Schristos 386*3117ece4Schristos void FIO_setOverlapLog(FIO_prefs_t* const prefs, int overlapLog){ 387*3117ece4Schristos if (overlapLog && prefs->nbWorkers==0) 388*3117ece4Schristos DISPLAYLEVEL(2, "Setting overlapLog is useless in single-thread mode \n"); 389*3117ece4Schristos prefs->overlapLog = overlapLog; 390*3117ece4Schristos } 391*3117ece4Schristos 392*3117ece4Schristos void FIO_setAdaptiveMode(FIO_prefs_t* const prefs, int adapt) { 393*3117ece4Schristos if ((adapt>0) && (prefs->nbWorkers==0)) 394*3117ece4Schristos EXM_THROW(1, "Adaptive mode is not compatible with single thread mode \n"); 395*3117ece4Schristos prefs->adaptiveMode = adapt; 396*3117ece4Schristos } 397*3117ece4Schristos 398*3117ece4Schristos void FIO_setUseRowMatchFinder(FIO_prefs_t* const prefs, int useRowMatchFinder) { 399*3117ece4Schristos prefs->useRowMatchFinder = useRowMatchFinder; 400*3117ece4Schristos } 401*3117ece4Schristos 402*3117ece4Schristos void FIO_setRsyncable(FIO_prefs_t* const prefs, int rsyncable) { 403*3117ece4Schristos if ((rsyncable>0) && (prefs->nbWorkers==0)) 404*3117ece4Schristos EXM_THROW(1, "Rsyncable mode is not compatible with single thread mode \n"); 405*3117ece4Schristos prefs->rsyncable = rsyncable; 406*3117ece4Schristos } 407*3117ece4Schristos 408*3117ece4Schristos void FIO_setStreamSrcSize(FIO_prefs_t* const prefs, size_t streamSrcSize) { 409*3117ece4Schristos prefs->streamSrcSize = streamSrcSize; 410*3117ece4Schristos } 411*3117ece4Schristos 412*3117ece4Schristos void FIO_setTargetCBlockSize(FIO_prefs_t* const prefs, size_t targetCBlockSize) { 413*3117ece4Schristos prefs->targetCBlockSize = targetCBlockSize; 414*3117ece4Schristos } 415*3117ece4Schristos 416*3117ece4Schristos void FIO_setSrcSizeHint(FIO_prefs_t* const prefs, size_t srcSizeHint) { 417*3117ece4Schristos prefs->srcSizeHint = (int)MIN((size_t)INT_MAX, srcSizeHint); 418*3117ece4Schristos } 419*3117ece4Schristos 420*3117ece4Schristos void FIO_setTestMode(FIO_prefs_t* const prefs, int testMode) { 421*3117ece4Schristos prefs->testMode = (testMode!=0); 422*3117ece4Schristos } 423*3117ece4Schristos 424*3117ece4Schristos void FIO_setLiteralCompressionMode( 425*3117ece4Schristos FIO_prefs_t* const prefs, 426*3117ece4Schristos ZSTD_paramSwitch_e mode) { 427*3117ece4Schristos prefs->literalCompressionMode = mode; 428*3117ece4Schristos } 429*3117ece4Schristos 430*3117ece4Schristos void FIO_setAdaptMin(FIO_prefs_t* const prefs, int minCLevel) 431*3117ece4Schristos { 432*3117ece4Schristos #ifndef ZSTD_NOCOMPRESS 433*3117ece4Schristos assert(minCLevel >= ZSTD_minCLevel()); 434*3117ece4Schristos #endif 435*3117ece4Schristos prefs->minAdaptLevel = minCLevel; 436*3117ece4Schristos } 437*3117ece4Schristos 438*3117ece4Schristos void FIO_setAdaptMax(FIO_prefs_t* const prefs, int maxCLevel) 439*3117ece4Schristos { 440*3117ece4Schristos prefs->maxAdaptLevel = maxCLevel; 441*3117ece4Schristos } 442*3117ece4Schristos 443*3117ece4Schristos void FIO_setLdmFlag(FIO_prefs_t* const prefs, unsigned ldmFlag) { 444*3117ece4Schristos prefs->ldmFlag = (ldmFlag>0); 445*3117ece4Schristos } 446*3117ece4Schristos 447*3117ece4Schristos void FIO_setLdmHashLog(FIO_prefs_t* const prefs, int ldmHashLog) { 448*3117ece4Schristos prefs->ldmHashLog = ldmHashLog; 449*3117ece4Schristos } 450*3117ece4Schristos 451*3117ece4Schristos void FIO_setLdmMinMatch(FIO_prefs_t* const prefs, int ldmMinMatch) { 452*3117ece4Schristos prefs->ldmMinMatch = ldmMinMatch; 453*3117ece4Schristos } 454*3117ece4Schristos 455*3117ece4Schristos void FIO_setLdmBucketSizeLog(FIO_prefs_t* const prefs, int ldmBucketSizeLog) { 456*3117ece4Schristos prefs->ldmBucketSizeLog = ldmBucketSizeLog; 457*3117ece4Schristos } 458*3117ece4Schristos 459*3117ece4Schristos 460*3117ece4Schristos void FIO_setLdmHashRateLog(FIO_prefs_t* const prefs, int ldmHashRateLog) { 461*3117ece4Schristos prefs->ldmHashRateLog = ldmHashRateLog; 462*3117ece4Schristos } 463*3117ece4Schristos 464*3117ece4Schristos void FIO_setPatchFromMode(FIO_prefs_t* const prefs, int value) 465*3117ece4Schristos { 466*3117ece4Schristos prefs->patchFromMode = value != 0; 467*3117ece4Schristos } 468*3117ece4Schristos 469*3117ece4Schristos void FIO_setContentSize(FIO_prefs_t* const prefs, int value) 470*3117ece4Schristos { 471*3117ece4Schristos prefs->contentSize = value != 0; 472*3117ece4Schristos } 473*3117ece4Schristos 474*3117ece4Schristos void FIO_setAsyncIOFlag(FIO_prefs_t* const prefs, int value) { 475*3117ece4Schristos #ifdef ZSTD_MULTITHREAD 476*3117ece4Schristos prefs->asyncIO = value; 477*3117ece4Schristos #else 478*3117ece4Schristos (void) prefs; 479*3117ece4Schristos (void) value; 480*3117ece4Schristos DISPLAYLEVEL(2, "Note : asyncio is disabled (lack of multithreading support) \n"); 481*3117ece4Schristos #endif 482*3117ece4Schristos } 483*3117ece4Schristos 484*3117ece4Schristos void FIO_setPassThroughFlag(FIO_prefs_t* const prefs, int value) { 485*3117ece4Schristos prefs->passThrough = (value != 0); 486*3117ece4Schristos } 487*3117ece4Schristos 488*3117ece4Schristos void FIO_setMMapDict(FIO_prefs_t* const prefs, ZSTD_paramSwitch_e value) 489*3117ece4Schristos { 490*3117ece4Schristos prefs->mmapDict = value; 491*3117ece4Schristos } 492*3117ece4Schristos 493*3117ece4Schristos /* FIO_ctx_t functions */ 494*3117ece4Schristos 495*3117ece4Schristos void FIO_setHasStdoutOutput(FIO_ctx_t* const fCtx, int value) { 496*3117ece4Schristos fCtx->hasStdoutOutput = value; 497*3117ece4Schristos } 498*3117ece4Schristos 499*3117ece4Schristos void FIO_setNbFilesTotal(FIO_ctx_t* const fCtx, int value) 500*3117ece4Schristos { 501*3117ece4Schristos fCtx->nbFilesTotal = value; 502*3117ece4Schristos } 503*3117ece4Schristos 504*3117ece4Schristos void FIO_determineHasStdinInput(FIO_ctx_t* const fCtx, const FileNamesTable* const filenames) { 505*3117ece4Schristos size_t i = 0; 506*3117ece4Schristos for ( ; i < filenames->tableSize; ++i) { 507*3117ece4Schristos if (!strcmp(stdinmark, filenames->fileNames[i])) { 508*3117ece4Schristos fCtx->hasStdinInput = 1; 509*3117ece4Schristos return; 510*3117ece4Schristos } 511*3117ece4Schristos } 512*3117ece4Schristos } 513*3117ece4Schristos 514*3117ece4Schristos /*-************************************* 515*3117ece4Schristos * Functions 516*3117ece4Schristos ***************************************/ 517*3117ece4Schristos /** FIO_removeFile() : 518*3117ece4Schristos * @result : Unlink `fileName`, even if it's read-only */ 519*3117ece4Schristos static int FIO_removeFile(const char* path) 520*3117ece4Schristos { 521*3117ece4Schristos stat_t statbuf; 522*3117ece4Schristos if (!UTIL_stat(path, &statbuf)) { 523*3117ece4Schristos DISPLAYLEVEL(2, "zstd: Failed to stat %s while trying to remove it\n", path); 524*3117ece4Schristos return 0; 525*3117ece4Schristos } 526*3117ece4Schristos if (!UTIL_isRegularFileStat(&statbuf)) { 527*3117ece4Schristos DISPLAYLEVEL(2, "zstd: Refusing to remove non-regular file %s\n", path); 528*3117ece4Schristos return 0; 529*3117ece4Schristos } 530*3117ece4Schristos #if defined(_WIN32) 531*3117ece4Schristos /* windows doesn't allow remove read-only files, 532*3117ece4Schristos * so try to make it writable first */ 533*3117ece4Schristos if (!(statbuf.st_mode & _S_IWRITE)) { 534*3117ece4Schristos UTIL_chmod(path, &statbuf, _S_IWRITE); 535*3117ece4Schristos } 536*3117ece4Schristos #endif 537*3117ece4Schristos return remove(path); 538*3117ece4Schristos } 539*3117ece4Schristos 540*3117ece4Schristos /** FIO_openSrcFile() : 541*3117ece4Schristos * condition : `srcFileName` must be non-NULL. `prefs` may be NULL. 542*3117ece4Schristos * @result : FILE* to `srcFileName`, or NULL if it fails */ 543*3117ece4Schristos static FILE* FIO_openSrcFile(const FIO_prefs_t* const prefs, const char* srcFileName, stat_t* statbuf) 544*3117ece4Schristos { 545*3117ece4Schristos int allowBlockDevices = prefs != NULL ? prefs->allowBlockDevices : 0; 546*3117ece4Schristos assert(srcFileName != NULL); 547*3117ece4Schristos assert(statbuf != NULL); 548*3117ece4Schristos if (!strcmp (srcFileName, stdinmark)) { 549*3117ece4Schristos DISPLAYLEVEL(4,"Using stdin for input \n"); 550*3117ece4Schristos SET_BINARY_MODE(stdin); 551*3117ece4Schristos return stdin; 552*3117ece4Schristos } 553*3117ece4Schristos 554*3117ece4Schristos if (!UTIL_stat(srcFileName, statbuf)) { 555*3117ece4Schristos DISPLAYLEVEL(1, "zstd: can't stat %s : %s -- ignored \n", 556*3117ece4Schristos srcFileName, strerror(errno)); 557*3117ece4Schristos return NULL; 558*3117ece4Schristos } 559*3117ece4Schristos 560*3117ece4Schristos if (!UTIL_isRegularFileStat(statbuf) 561*3117ece4Schristos && !UTIL_isFIFOStat(statbuf) 562*3117ece4Schristos && !(allowBlockDevices && UTIL_isBlockDevStat(statbuf)) 563*3117ece4Schristos ) { 564*3117ece4Schristos DISPLAYLEVEL(1, "zstd: %s is not a regular file -- ignored \n", 565*3117ece4Schristos srcFileName); 566*3117ece4Schristos return NULL; 567*3117ece4Schristos } 568*3117ece4Schristos 569*3117ece4Schristos { FILE* const f = fopen(srcFileName, "rb"); 570*3117ece4Schristos if (f == NULL) 571*3117ece4Schristos DISPLAYLEVEL(1, "zstd: %s: %s \n", srcFileName, strerror(errno)); 572*3117ece4Schristos return f; 573*3117ece4Schristos } 574*3117ece4Schristos } 575*3117ece4Schristos 576*3117ece4Schristos /** FIO_openDstFile() : 577*3117ece4Schristos * condition : `dstFileName` must be non-NULL. 578*3117ece4Schristos * @result : FILE* to `dstFileName`, or NULL if it fails */ 579*3117ece4Schristos static FILE* 580*3117ece4Schristos FIO_openDstFile(FIO_ctx_t* fCtx, FIO_prefs_t* const prefs, 581*3117ece4Schristos const char* srcFileName, const char* dstFileName, 582*3117ece4Schristos const int mode) 583*3117ece4Schristos { 584*3117ece4Schristos int isDstRegFile; 585*3117ece4Schristos 586*3117ece4Schristos if (prefs->testMode) return NULL; /* do not open file in test mode */ 587*3117ece4Schristos 588*3117ece4Schristos assert(dstFileName != NULL); 589*3117ece4Schristos if (!strcmp (dstFileName, stdoutmark)) { 590*3117ece4Schristos DISPLAYLEVEL(4,"Using stdout for output \n"); 591*3117ece4Schristos SET_BINARY_MODE(stdout); 592*3117ece4Schristos if (prefs->sparseFileSupport == 1) { 593*3117ece4Schristos prefs->sparseFileSupport = 0; 594*3117ece4Schristos DISPLAYLEVEL(4, "Sparse File Support is automatically disabled on stdout ; try --sparse \n"); 595*3117ece4Schristos } 596*3117ece4Schristos return stdout; 597*3117ece4Schristos } 598*3117ece4Schristos 599*3117ece4Schristos /* ensure dst is not the same as src */ 600*3117ece4Schristos if (srcFileName != NULL && UTIL_isSameFile(srcFileName, dstFileName)) { 601*3117ece4Schristos DISPLAYLEVEL(1, "zstd: Refusing to open an output file which will overwrite the input file \n"); 602*3117ece4Schristos return NULL; 603*3117ece4Schristos } 604*3117ece4Schristos 605*3117ece4Schristos isDstRegFile = UTIL_isRegularFile(dstFileName); /* invoke once */ 606*3117ece4Schristos if (prefs->sparseFileSupport == 1) { 607*3117ece4Schristos prefs->sparseFileSupport = ZSTD_SPARSE_DEFAULT; 608*3117ece4Schristos if (!isDstRegFile) { 609*3117ece4Schristos prefs->sparseFileSupport = 0; 610*3117ece4Schristos DISPLAYLEVEL(4, "Sparse File Support is disabled when output is not a file \n"); 611*3117ece4Schristos } 612*3117ece4Schristos } 613*3117ece4Schristos 614*3117ece4Schristos if (isDstRegFile) { 615*3117ece4Schristos /* Check if destination file already exists */ 616*3117ece4Schristos #if !defined(_WIN32) 617*3117ece4Schristos /* this test does not work on Windows : 618*3117ece4Schristos * `NUL` and `nul` are detected as regular files */ 619*3117ece4Schristos if (!strcmp(dstFileName, nulmark)) { 620*3117ece4Schristos EXM_THROW(40, "%s is unexpectedly categorized as a regular file", 621*3117ece4Schristos dstFileName); 622*3117ece4Schristos } 623*3117ece4Schristos #endif 624*3117ece4Schristos if (!prefs->overwrite) { 625*3117ece4Schristos if (g_display_prefs.displayLevel <= 1) { 626*3117ece4Schristos /* No interaction possible */ 627*3117ece4Schristos DISPLAYLEVEL(1, "zstd: %s already exists; not overwritten \n", 628*3117ece4Schristos dstFileName); 629*3117ece4Schristos return NULL; 630*3117ece4Schristos } 631*3117ece4Schristos DISPLAY("zstd: %s already exists; ", dstFileName); 632*3117ece4Schristos if (UTIL_requireUserConfirmation("overwrite (y/n) ? ", "Not overwritten \n", "yY", fCtx->hasStdinInput)) 633*3117ece4Schristos return NULL; 634*3117ece4Schristos } 635*3117ece4Schristos /* need to unlink */ 636*3117ece4Schristos FIO_removeFile(dstFileName); 637*3117ece4Schristos } 638*3117ece4Schristos 639*3117ece4Schristos { 640*3117ece4Schristos #if defined(_WIN32) 641*3117ece4Schristos /* Windows requires opening the file as a "binary" file to avoid 642*3117ece4Schristos * mangling. This macro doesn't exist on unix. */ 643*3117ece4Schristos const int openflags = O_WRONLY|O_CREAT|O_TRUNC|O_BINARY; 644*3117ece4Schristos const int fd = _open(dstFileName, openflags, mode); 645*3117ece4Schristos FILE* f = NULL; 646*3117ece4Schristos if (fd != -1) { 647*3117ece4Schristos f = _fdopen(fd, "wb"); 648*3117ece4Schristos } 649*3117ece4Schristos #else 650*3117ece4Schristos const int openflags = O_WRONLY|O_CREAT|O_TRUNC; 651*3117ece4Schristos const int fd = open(dstFileName, openflags, mode); 652*3117ece4Schristos FILE* f = NULL; 653*3117ece4Schristos if (fd != -1) { 654*3117ece4Schristos f = fdopen(fd, "wb"); 655*3117ece4Schristos } 656*3117ece4Schristos #endif 657*3117ece4Schristos if (f == NULL) { 658*3117ece4Schristos DISPLAYLEVEL(1, "zstd: %s: %s\n", dstFileName, strerror(errno)); 659*3117ece4Schristos } else { 660*3117ece4Schristos /* An increased buffer size can provide a significant performance 661*3117ece4Schristos * boost on some platforms. Note that providing a NULL buf with a 662*3117ece4Schristos * size that's not 0 is not defined in ANSI C, but is defined in an 663*3117ece4Schristos * extension. There are three possibilities here: 664*3117ece4Schristos * 1. Libc supports the extended version and everything is good. 665*3117ece4Schristos * 2. Libc ignores the size when buf is NULL, in which case 666*3117ece4Schristos * everything will continue as if we didn't call `setvbuf()`. 667*3117ece4Schristos * 3. We fail the call and execution continues but a warning 668*3117ece4Schristos * message might be shown. 669*3117ece4Schristos * In all cases due execution continues. For now, I believe that 670*3117ece4Schristos * this is a more cost-effective solution than managing the buffers 671*3117ece4Schristos * allocations ourselves (will require an API change). 672*3117ece4Schristos */ 673*3117ece4Schristos if (setvbuf(f, NULL, _IOFBF, 1 MB)) { 674*3117ece4Schristos DISPLAYLEVEL(2, "Warning: setvbuf failed for %s\n", dstFileName); 675*3117ece4Schristos } 676*3117ece4Schristos } 677*3117ece4Schristos return f; 678*3117ece4Schristos } 679*3117ece4Schristos } 680*3117ece4Schristos 681*3117ece4Schristos 682*3117ece4Schristos /* FIO_getDictFileStat() : 683*3117ece4Schristos */ 684*3117ece4Schristos static void FIO_getDictFileStat(const char* fileName, stat_t* dictFileStat) { 685*3117ece4Schristos assert(dictFileStat != NULL); 686*3117ece4Schristos if (fileName == NULL) return; 687*3117ece4Schristos 688*3117ece4Schristos if (!UTIL_stat(fileName, dictFileStat)) { 689*3117ece4Schristos EXM_THROW(31, "Stat failed on dictionary file %s: %s", fileName, strerror(errno)); 690*3117ece4Schristos } 691*3117ece4Schristos 692*3117ece4Schristos if (!UTIL_isRegularFileStat(dictFileStat)) { 693*3117ece4Schristos EXM_THROW(32, "Dictionary %s must be a regular file.", fileName); 694*3117ece4Schristos } 695*3117ece4Schristos } 696*3117ece4Schristos 697*3117ece4Schristos /* FIO_setDictBufferMalloc() : 698*3117ece4Schristos * allocates a buffer, pointed by `dict->dictBuffer`, 699*3117ece4Schristos * loads `filename` content into it, up to DICTSIZE_MAX bytes. 700*3117ece4Schristos * @return : loaded size 701*3117ece4Schristos * if fileName==NULL, returns 0 and a NULL pointer 702*3117ece4Schristos */ 703*3117ece4Schristos static size_t FIO_setDictBufferMalloc(FIO_Dict_t* dict, const char* fileName, FIO_prefs_t* const prefs, stat_t* dictFileStat) 704*3117ece4Schristos { 705*3117ece4Schristos FILE* fileHandle; 706*3117ece4Schristos U64 fileSize; 707*3117ece4Schristos void** bufferPtr = &dict->dictBuffer; 708*3117ece4Schristos 709*3117ece4Schristos assert(bufferPtr != NULL); 710*3117ece4Schristos assert(dictFileStat != NULL); 711*3117ece4Schristos *bufferPtr = NULL; 712*3117ece4Schristos if (fileName == NULL) return 0; 713*3117ece4Schristos 714*3117ece4Schristos DISPLAYLEVEL(4,"Loading %s as dictionary \n", fileName); 715*3117ece4Schristos 716*3117ece4Schristos fileHandle = fopen(fileName, "rb"); 717*3117ece4Schristos 718*3117ece4Schristos if (fileHandle == NULL) { 719*3117ece4Schristos EXM_THROW(33, "Couldn't open dictionary %s: %s", fileName, strerror(errno)); 720*3117ece4Schristos } 721*3117ece4Schristos 722*3117ece4Schristos fileSize = UTIL_getFileSizeStat(dictFileStat); 723*3117ece4Schristos { 724*3117ece4Schristos size_t const dictSizeMax = prefs->patchFromMode ? prefs->memLimit : DICTSIZE_MAX; 725*3117ece4Schristos if (fileSize > dictSizeMax) { 726*3117ece4Schristos EXM_THROW(34, "Dictionary file %s is too large (> %u bytes)", 727*3117ece4Schristos fileName, (unsigned)dictSizeMax); /* avoid extreme cases */ 728*3117ece4Schristos } 729*3117ece4Schristos } 730*3117ece4Schristos *bufferPtr = malloc((size_t)fileSize); 731*3117ece4Schristos if (*bufferPtr==NULL) EXM_THROW(34, "%s", strerror(errno)); 732*3117ece4Schristos { size_t const readSize = fread(*bufferPtr, 1, (size_t)fileSize, fileHandle); 733*3117ece4Schristos if (readSize != fileSize) { 734*3117ece4Schristos EXM_THROW(35, "Error reading dictionary file %s : %s", 735*3117ece4Schristos fileName, strerror(errno)); 736*3117ece4Schristos } 737*3117ece4Schristos } 738*3117ece4Schristos fclose(fileHandle); 739*3117ece4Schristos return (size_t)fileSize; 740*3117ece4Schristos } 741*3117ece4Schristos 742*3117ece4Schristos #if (PLATFORM_POSIX_VERSION > 0) 743*3117ece4Schristos #include <sys/mman.h> 744*3117ece4Schristos static void FIO_munmap(FIO_Dict_t* dict) 745*3117ece4Schristos { 746*3117ece4Schristos munmap(dict->dictBuffer, dict->dictBufferSize); 747*3117ece4Schristos dict->dictBuffer = NULL; 748*3117ece4Schristos dict->dictBufferSize = 0; 749*3117ece4Schristos } 750*3117ece4Schristos static size_t FIO_setDictBufferMMap(FIO_Dict_t* dict, const char* fileName, FIO_prefs_t* const prefs, stat_t* dictFileStat) 751*3117ece4Schristos { 752*3117ece4Schristos int fileHandle; 753*3117ece4Schristos U64 fileSize; 754*3117ece4Schristos void** bufferPtr = &dict->dictBuffer; 755*3117ece4Schristos 756*3117ece4Schristos assert(bufferPtr != NULL); 757*3117ece4Schristos assert(dictFileStat != NULL); 758*3117ece4Schristos *bufferPtr = NULL; 759*3117ece4Schristos if (fileName == NULL) return 0; 760*3117ece4Schristos 761*3117ece4Schristos DISPLAYLEVEL(4,"Loading %s as dictionary \n", fileName); 762*3117ece4Schristos 763*3117ece4Schristos fileHandle = open(fileName, O_RDONLY); 764*3117ece4Schristos 765*3117ece4Schristos if (fileHandle == -1) { 766*3117ece4Schristos EXM_THROW(33, "Couldn't open dictionary %s: %s", fileName, strerror(errno)); 767*3117ece4Schristos } 768*3117ece4Schristos 769*3117ece4Schristos fileSize = UTIL_getFileSizeStat(dictFileStat); 770*3117ece4Schristos { 771*3117ece4Schristos size_t const dictSizeMax = prefs->patchFromMode ? prefs->memLimit : DICTSIZE_MAX; 772*3117ece4Schristos if (fileSize > dictSizeMax) { 773*3117ece4Schristos EXM_THROW(34, "Dictionary file %s is too large (> %u bytes)", 774*3117ece4Schristos fileName, (unsigned)dictSizeMax); /* avoid extreme cases */ 775*3117ece4Schristos } 776*3117ece4Schristos } 777*3117ece4Schristos 778*3117ece4Schristos *bufferPtr = mmap(NULL, (size_t)fileSize, PROT_READ, MAP_PRIVATE, fileHandle, 0); 779*3117ece4Schristos if (*bufferPtr==NULL) EXM_THROW(34, "%s", strerror(errno)); 780*3117ece4Schristos 781*3117ece4Schristos close(fileHandle); 782*3117ece4Schristos return (size_t)fileSize; 783*3117ece4Schristos } 784*3117ece4Schristos #elif defined(_MSC_VER) || defined(_WIN32) 785*3117ece4Schristos #include <windows.h> 786*3117ece4Schristos static void FIO_munmap(FIO_Dict_t* dict) 787*3117ece4Schristos { 788*3117ece4Schristos UnmapViewOfFile(dict->dictBuffer); 789*3117ece4Schristos CloseHandle(dict->dictHandle); 790*3117ece4Schristos dict->dictBuffer = NULL; 791*3117ece4Schristos dict->dictBufferSize = 0; 792*3117ece4Schristos } 793*3117ece4Schristos static size_t FIO_setDictBufferMMap(FIO_Dict_t* dict, const char* fileName, FIO_prefs_t* const prefs, stat_t* dictFileStat) 794*3117ece4Schristos { 795*3117ece4Schristos HANDLE fileHandle, mapping; 796*3117ece4Schristos U64 fileSize; 797*3117ece4Schristos void** bufferPtr = &dict->dictBuffer; 798*3117ece4Schristos 799*3117ece4Schristos assert(bufferPtr != NULL); 800*3117ece4Schristos assert(dictFileStat != NULL); 801*3117ece4Schristos *bufferPtr = NULL; 802*3117ece4Schristos if (fileName == NULL) return 0; 803*3117ece4Schristos 804*3117ece4Schristos DISPLAYLEVEL(4,"Loading %s as dictionary \n", fileName); 805*3117ece4Schristos 806*3117ece4Schristos fileHandle = CreateFileA(fileName, GENERIC_READ, FILE_SHARE_READ, NULL, OPEN_EXISTING, FILE_ATTRIBUTE_READONLY, NULL); 807*3117ece4Schristos 808*3117ece4Schristos if (fileHandle == INVALID_HANDLE_VALUE) { 809*3117ece4Schristos EXM_THROW(33, "Couldn't open dictionary %s: %s", fileName, strerror(errno)); 810*3117ece4Schristos } 811*3117ece4Schristos 812*3117ece4Schristos fileSize = UTIL_getFileSizeStat(dictFileStat); 813*3117ece4Schristos { 814*3117ece4Schristos size_t const dictSizeMax = prefs->patchFromMode ? prefs->memLimit : DICTSIZE_MAX; 815*3117ece4Schristos if (fileSize > dictSizeMax) { 816*3117ece4Schristos EXM_THROW(34, "Dictionary file %s is too large (> %u bytes)", 817*3117ece4Schristos fileName, (unsigned)dictSizeMax); /* avoid extreme cases */ 818*3117ece4Schristos } 819*3117ece4Schristos } 820*3117ece4Schristos 821*3117ece4Schristos mapping = CreateFileMapping(fileHandle, NULL, PAGE_READONLY, 0, 0, NULL); 822*3117ece4Schristos if (mapping == NULL) { 823*3117ece4Schristos EXM_THROW(35, "Couldn't map dictionary %s: %s", fileName, strerror(errno)); 824*3117ece4Schristos } 825*3117ece4Schristos 826*3117ece4Schristos *bufferPtr = MapViewOfFile(mapping, FILE_MAP_READ, 0, 0, (DWORD)fileSize); /* we can only cast to DWORD here because dictSize <= 2GB */ 827*3117ece4Schristos if (*bufferPtr==NULL) EXM_THROW(36, "%s", strerror(errno)); 828*3117ece4Schristos 829*3117ece4Schristos dict->dictHandle = fileHandle; 830*3117ece4Schristos return (size_t)fileSize; 831*3117ece4Schristos } 832*3117ece4Schristos #else 833*3117ece4Schristos static size_t FIO_setDictBufferMMap(FIO_Dict_t* dict, const char* fileName, FIO_prefs_t* const prefs, stat_t* dictFileStat) 834*3117ece4Schristos { 835*3117ece4Schristos return FIO_setDictBufferMalloc(dict, fileName, prefs, dictFileStat); 836*3117ece4Schristos } 837*3117ece4Schristos static void FIO_munmap(FIO_Dict_t* dict) { 838*3117ece4Schristos free(dict->dictBuffer); 839*3117ece4Schristos dict->dictBuffer = NULL; 840*3117ece4Schristos dict->dictBufferSize = 0; 841*3117ece4Schristos } 842*3117ece4Schristos #endif 843*3117ece4Schristos 844*3117ece4Schristos static void FIO_freeDict(FIO_Dict_t* dict) { 845*3117ece4Schristos if (dict->dictBufferType == FIO_mallocDict) { 846*3117ece4Schristos free(dict->dictBuffer); 847*3117ece4Schristos dict->dictBuffer = NULL; 848*3117ece4Schristos dict->dictBufferSize = 0; 849*3117ece4Schristos } else if (dict->dictBufferType == FIO_mmapDict) { 850*3117ece4Schristos FIO_munmap(dict); 851*3117ece4Schristos } else { 852*3117ece4Schristos assert(0); /* Should not reach this case */ 853*3117ece4Schristos } 854*3117ece4Schristos } 855*3117ece4Schristos 856*3117ece4Schristos static void FIO_initDict(FIO_Dict_t* dict, const char* fileName, FIO_prefs_t* const prefs, stat_t* dictFileStat, FIO_dictBufferType_t dictBufferType) { 857*3117ece4Schristos dict->dictBufferType = dictBufferType; 858*3117ece4Schristos if (dict->dictBufferType == FIO_mallocDict) { 859*3117ece4Schristos dict->dictBufferSize = FIO_setDictBufferMalloc(dict, fileName, prefs, dictFileStat); 860*3117ece4Schristos } else if (dict->dictBufferType == FIO_mmapDict) { 861*3117ece4Schristos dict->dictBufferSize = FIO_setDictBufferMMap(dict, fileName, prefs, dictFileStat); 862*3117ece4Schristos } else { 863*3117ece4Schristos assert(0); /* Should not reach this case */ 864*3117ece4Schristos } 865*3117ece4Schristos } 866*3117ece4Schristos 867*3117ece4Schristos 868*3117ece4Schristos /* FIO_checkFilenameCollisions() : 869*3117ece4Schristos * Checks for and warns if there are any files that would have the same output path 870*3117ece4Schristos */ 871*3117ece4Schristos int FIO_checkFilenameCollisions(const char** filenameTable, unsigned nbFiles) { 872*3117ece4Schristos const char **filenameTableSorted, *prevElem, *filename; 873*3117ece4Schristos unsigned u; 874*3117ece4Schristos 875*3117ece4Schristos filenameTableSorted = (const char**) malloc(sizeof(char*) * nbFiles); 876*3117ece4Schristos if (!filenameTableSorted) { 877*3117ece4Schristos DISPLAYLEVEL(1, "Allocation error during filename collision checking \n"); 878*3117ece4Schristos return 1; 879*3117ece4Schristos } 880*3117ece4Schristos 881*3117ece4Schristos for (u = 0; u < nbFiles; ++u) { 882*3117ece4Schristos filename = strrchr(filenameTable[u], PATH_SEP); 883*3117ece4Schristos if (filename == NULL) { 884*3117ece4Schristos filenameTableSorted[u] = filenameTable[u]; 885*3117ece4Schristos } else { 886*3117ece4Schristos filenameTableSorted[u] = filename+1; 887*3117ece4Schristos } 888*3117ece4Schristos } 889*3117ece4Schristos 890*3117ece4Schristos qsort((void*)filenameTableSorted, nbFiles, sizeof(char*), UTIL_compareStr); 891*3117ece4Schristos prevElem = filenameTableSorted[0]; 892*3117ece4Schristos for (u = 1; u < nbFiles; ++u) { 893*3117ece4Schristos if (strcmp(prevElem, filenameTableSorted[u]) == 0) { 894*3117ece4Schristos DISPLAYLEVEL(2, "WARNING: Two files have same filename: %s\n", prevElem); 895*3117ece4Schristos } 896*3117ece4Schristos prevElem = filenameTableSorted[u]; 897*3117ece4Schristos } 898*3117ece4Schristos 899*3117ece4Schristos free((void*)filenameTableSorted); 900*3117ece4Schristos return 0; 901*3117ece4Schristos } 902*3117ece4Schristos 903*3117ece4Schristos static const char* 904*3117ece4Schristos extractFilename(const char* path, char separator) 905*3117ece4Schristos { 906*3117ece4Schristos const char* search = strrchr(path, separator); 907*3117ece4Schristos if (search == NULL) return path; 908*3117ece4Schristos return search+1; 909*3117ece4Schristos } 910*3117ece4Schristos 911*3117ece4Schristos /* FIO_createFilename_fromOutDir() : 912*3117ece4Schristos * Takes a source file name and specified output directory, and 913*3117ece4Schristos * allocates memory for and returns a pointer to final path. 914*3117ece4Schristos * This function never returns an error (it may abort() in case of pb) 915*3117ece4Schristos */ 916*3117ece4Schristos static char* 917*3117ece4Schristos FIO_createFilename_fromOutDir(const char* path, const char* outDirName, const size_t suffixLen) 918*3117ece4Schristos { 919*3117ece4Schristos const char* filenameStart; 920*3117ece4Schristos char separator; 921*3117ece4Schristos char* result; 922*3117ece4Schristos 923*3117ece4Schristos #if defined(_MSC_VER) || defined(__MINGW32__) || defined (__MSVCRT__) /* windows support */ 924*3117ece4Schristos separator = '\\'; 925*3117ece4Schristos #else 926*3117ece4Schristos separator = '/'; 927*3117ece4Schristos #endif 928*3117ece4Schristos 929*3117ece4Schristos filenameStart = extractFilename(path, separator); 930*3117ece4Schristos #if defined(_MSC_VER) || defined(__MINGW32__) || defined (__MSVCRT__) /* windows support */ 931*3117ece4Schristos filenameStart = extractFilename(filenameStart, '/'); /* sometimes, '/' separator is also used on Windows (mingw+msys2) */ 932*3117ece4Schristos #endif 933*3117ece4Schristos 934*3117ece4Schristos result = (char*) calloc(1, strlen(outDirName) + 1 + strlen(filenameStart) + suffixLen + 1); 935*3117ece4Schristos if (!result) { 936*3117ece4Schristos EXM_THROW(30, "zstd: FIO_createFilename_fromOutDir: %s", strerror(errno)); 937*3117ece4Schristos } 938*3117ece4Schristos 939*3117ece4Schristos memcpy(result, outDirName, strlen(outDirName)); 940*3117ece4Schristos if (outDirName[strlen(outDirName)-1] == separator) { 941*3117ece4Schristos memcpy(result + strlen(outDirName), filenameStart, strlen(filenameStart)); 942*3117ece4Schristos } else { 943*3117ece4Schristos memcpy(result + strlen(outDirName), &separator, 1); 944*3117ece4Schristos memcpy(result + strlen(outDirName) + 1, filenameStart, strlen(filenameStart)); 945*3117ece4Schristos } 946*3117ece4Schristos 947*3117ece4Schristos return result; 948*3117ece4Schristos } 949*3117ece4Schristos 950*3117ece4Schristos /* FIO_highbit64() : 951*3117ece4Schristos * gives position of highest bit. 952*3117ece4Schristos * note : only works for v > 0 ! 953*3117ece4Schristos */ 954*3117ece4Schristos static unsigned FIO_highbit64(unsigned long long v) 955*3117ece4Schristos { 956*3117ece4Schristos unsigned count = 0; 957*3117ece4Schristos assert(v != 0); 958*3117ece4Schristos v >>= 1; 959*3117ece4Schristos while (v) { v >>= 1; count++; } 960*3117ece4Schristos return count; 961*3117ece4Schristos } 962*3117ece4Schristos 963*3117ece4Schristos static void FIO_adjustMemLimitForPatchFromMode(FIO_prefs_t* const prefs, 964*3117ece4Schristos unsigned long long const dictSize, 965*3117ece4Schristos unsigned long long const maxSrcFileSize) 966*3117ece4Schristos { 967*3117ece4Schristos unsigned long long maxSize = MAX(prefs->memLimit, MAX(dictSize, maxSrcFileSize)); 968*3117ece4Schristos unsigned const maxWindowSize = (1U << ZSTD_WINDOWLOG_MAX); 969*3117ece4Schristos if (maxSize == UTIL_FILESIZE_UNKNOWN) 970*3117ece4Schristos EXM_THROW(42, "Using --patch-from with stdin requires --stream-size"); 971*3117ece4Schristos assert(maxSize != UTIL_FILESIZE_UNKNOWN); 972*3117ece4Schristos if (maxSize > maxWindowSize) 973*3117ece4Schristos EXM_THROW(42, "Can't handle files larger than %u GB\n", maxWindowSize/(1 GB)); 974*3117ece4Schristos FIO_setMemLimit(prefs, (unsigned)maxSize); 975*3117ece4Schristos } 976*3117ece4Schristos 977*3117ece4Schristos /* FIO_multiFilesConcatWarning() : 978*3117ece4Schristos * This function handles logic when processing multiple files with -o or -c, displaying the appropriate warnings/prompts. 979*3117ece4Schristos * Returns 1 if the console should abort, 0 if console should proceed. 980*3117ece4Schristos * 981*3117ece4Schristos * If output is stdout or test mode is active, check that `--rm` disabled. 982*3117ece4Schristos * 983*3117ece4Schristos * If there is just 1 file to process, zstd will proceed as usual. 984*3117ece4Schristos * If each file get processed into its own separate destination file, proceed as usual. 985*3117ece4Schristos * 986*3117ece4Schristos * When multiple files are processed into a single output, 987*3117ece4Schristos * display a warning message, then disable --rm if it's set. 988*3117ece4Schristos * 989*3117ece4Schristos * If -f is specified or if output is stdout, just proceed. 990*3117ece4Schristos * If output is set with -o, prompt for confirmation. 991*3117ece4Schristos */ 992*3117ece4Schristos static int FIO_multiFilesConcatWarning(const FIO_ctx_t* fCtx, FIO_prefs_t* prefs, const char* outFileName, int displayLevelCutoff) 993*3117ece4Schristos { 994*3117ece4Schristos if (fCtx->hasStdoutOutput) { 995*3117ece4Schristos if (prefs->removeSrcFile) 996*3117ece4Schristos /* this should not happen ; hard fail, to protect user's data 997*3117ece4Schristos * note: this should rather be an assert(), but we want to be certain that user's data will not be wiped out in case it nonetheless happen */ 998*3117ece4Schristos EXM_THROW(43, "It's not allowed to remove input files when processed output is piped to stdout. " 999*3117ece4Schristos "This scenario is not supposed to be possible. " 1000*3117ece4Schristos "This is a programming error. File an issue for it to be fixed."); 1001*3117ece4Schristos } 1002*3117ece4Schristos if (prefs->testMode) { 1003*3117ece4Schristos if (prefs->removeSrcFile) 1004*3117ece4Schristos /* this should not happen ; hard fail, to protect user's data 1005*3117ece4Schristos * note: this should rather be an assert(), but we want to be certain that user's data will not be wiped out in case it nonetheless happen */ 1006*3117ece4Schristos EXM_THROW(43, "Test mode shall not remove input files! " 1007*3117ece4Schristos "This scenario is not supposed to be possible. " 1008*3117ece4Schristos "This is a programming error. File an issue for it to be fixed."); 1009*3117ece4Schristos return 0; 1010*3117ece4Schristos } 1011*3117ece4Schristos 1012*3117ece4Schristos if (fCtx->nbFilesTotal == 1) return 0; 1013*3117ece4Schristos assert(fCtx->nbFilesTotal > 1); 1014*3117ece4Schristos 1015*3117ece4Schristos if (!outFileName) return 0; 1016*3117ece4Schristos 1017*3117ece4Schristos if (fCtx->hasStdoutOutput) { 1018*3117ece4Schristos DISPLAYLEVEL(2, "zstd: WARNING: all input files will be processed and concatenated into stdout. \n"); 1019*3117ece4Schristos } else { 1020*3117ece4Schristos DISPLAYLEVEL(2, "zstd: WARNING: all input files will be processed and concatenated into a single output file: %s \n", outFileName); 1021*3117ece4Schristos } 1022*3117ece4Schristos DISPLAYLEVEL(2, "The concatenated output CANNOT regenerate original file names nor directory structure. \n") 1023*3117ece4Schristos 1024*3117ece4Schristos /* multi-input into single output : --rm is not allowed */ 1025*3117ece4Schristos if (prefs->removeSrcFile) { 1026*3117ece4Schristos DISPLAYLEVEL(2, "Since it's a destructive operation, input files will not be removed. \n"); 1027*3117ece4Schristos prefs->removeSrcFile = 0; 1028*3117ece4Schristos } 1029*3117ece4Schristos 1030*3117ece4Schristos if (fCtx->hasStdoutOutput) return 0; 1031*3117ece4Schristos if (prefs->overwrite) return 0; 1032*3117ece4Schristos 1033*3117ece4Schristos /* multiple files concatenated into single destination file using -o without -f */ 1034*3117ece4Schristos if (g_display_prefs.displayLevel <= displayLevelCutoff) { 1035*3117ece4Schristos /* quiet mode => no prompt => fail automatically */ 1036*3117ece4Schristos DISPLAYLEVEL(1, "Concatenating multiple processed inputs into a single output loses file metadata. \n"); 1037*3117ece4Schristos DISPLAYLEVEL(1, "Aborting. \n"); 1038*3117ece4Schristos return 1; 1039*3117ece4Schristos } 1040*3117ece4Schristos /* normal mode => prompt */ 1041*3117ece4Schristos return UTIL_requireUserConfirmation("Proceed? (y/n): ", "Aborting...", "yY", fCtx->hasStdinInput); 1042*3117ece4Schristos } 1043*3117ece4Schristos 1044*3117ece4Schristos static ZSTD_inBuffer setInBuffer(const void* buf, size_t s, size_t pos) 1045*3117ece4Schristos { 1046*3117ece4Schristos ZSTD_inBuffer i; 1047*3117ece4Schristos i.src = buf; 1048*3117ece4Schristos i.size = s; 1049*3117ece4Schristos i.pos = pos; 1050*3117ece4Schristos return i; 1051*3117ece4Schristos } 1052*3117ece4Schristos 1053*3117ece4Schristos static ZSTD_outBuffer setOutBuffer(void* buf, size_t s, size_t pos) 1054*3117ece4Schristos { 1055*3117ece4Schristos ZSTD_outBuffer o; 1056*3117ece4Schristos o.dst = buf; 1057*3117ece4Schristos o.size = s; 1058*3117ece4Schristos o.pos = pos; 1059*3117ece4Schristos return o; 1060*3117ece4Schristos } 1061*3117ece4Schristos 1062*3117ece4Schristos #ifndef ZSTD_NOCOMPRESS 1063*3117ece4Schristos 1064*3117ece4Schristos /* ********************************************************************** 1065*3117ece4Schristos * Compression 1066*3117ece4Schristos ************************************************************************/ 1067*3117ece4Schristos typedef struct { 1068*3117ece4Schristos FIO_Dict_t dict; 1069*3117ece4Schristos const char* dictFileName; 1070*3117ece4Schristos stat_t dictFileStat; 1071*3117ece4Schristos ZSTD_CStream* cctx; 1072*3117ece4Schristos WritePoolCtx_t *writeCtx; 1073*3117ece4Schristos ReadPoolCtx_t *readCtx; 1074*3117ece4Schristos } cRess_t; 1075*3117ece4Schristos 1076*3117ece4Schristos /** ZSTD_cycleLog() : 1077*3117ece4Schristos * condition for correct operation : hashLog > 1 */ 1078*3117ece4Schristos static U32 ZSTD_cycleLog(U32 hashLog, ZSTD_strategy strat) 1079*3117ece4Schristos { 1080*3117ece4Schristos U32 const btScale = ((U32)strat >= (U32)ZSTD_btlazy2); 1081*3117ece4Schristos assert(hashLog > 1); 1082*3117ece4Schristos return hashLog - btScale; 1083*3117ece4Schristos } 1084*3117ece4Schristos 1085*3117ece4Schristos static void FIO_adjustParamsForPatchFromMode(FIO_prefs_t* const prefs, 1086*3117ece4Schristos ZSTD_compressionParameters* comprParams, 1087*3117ece4Schristos unsigned long long const dictSize, 1088*3117ece4Schristos unsigned long long const maxSrcFileSize, 1089*3117ece4Schristos int cLevel) 1090*3117ece4Schristos { 1091*3117ece4Schristos unsigned const fileWindowLog = FIO_highbit64(maxSrcFileSize) + 1; 1092*3117ece4Schristos ZSTD_compressionParameters const cParams = ZSTD_getCParams(cLevel, (size_t)maxSrcFileSize, (size_t)dictSize); 1093*3117ece4Schristos FIO_adjustMemLimitForPatchFromMode(prefs, dictSize, maxSrcFileSize); 1094*3117ece4Schristos if (fileWindowLog > ZSTD_WINDOWLOG_MAX) 1095*3117ece4Schristos DISPLAYLEVEL(1, "Max window log exceeded by file (compression ratio will suffer)\n"); 1096*3117ece4Schristos comprParams->windowLog = MAX(ZSTD_WINDOWLOG_MIN, MIN(ZSTD_WINDOWLOG_MAX, fileWindowLog)); 1097*3117ece4Schristos if (fileWindowLog > ZSTD_cycleLog(cParams.chainLog, cParams.strategy)) { 1098*3117ece4Schristos if (!prefs->ldmFlag) 1099*3117ece4Schristos DISPLAYLEVEL(2, "long mode automatically triggered\n"); 1100*3117ece4Schristos FIO_setLdmFlag(prefs, 1); 1101*3117ece4Schristos } 1102*3117ece4Schristos if (cParams.strategy >= ZSTD_btopt) { 1103*3117ece4Schristos DISPLAYLEVEL(3, "[Optimal parser notes] Consider the following to improve patch size at the cost of speed:\n"); 1104*3117ece4Schristos DISPLAYLEVEL(3, "- Use --single-thread mode in the zstd cli\n"); 1105*3117ece4Schristos DISPLAYLEVEL(3, "- Set a larger targetLength (e.g. --zstd=targetLength=4096)\n"); 1106*3117ece4Schristos DISPLAYLEVEL(3, "- Set a larger chainLog (e.g. --zstd=chainLog=%u)\n", ZSTD_CHAINLOG_MAX); 1107*3117ece4Schristos DISPLAYLEVEL(3, "Also consider playing around with searchLog and hashLog\n"); 1108*3117ece4Schristos } 1109*3117ece4Schristos } 1110*3117ece4Schristos 1111*3117ece4Schristos static cRess_t FIO_createCResources(FIO_prefs_t* const prefs, 1112*3117ece4Schristos const char* dictFileName, unsigned long long const maxSrcFileSize, 1113*3117ece4Schristos int cLevel, ZSTD_compressionParameters comprParams) { 1114*3117ece4Schristos int useMMap = prefs->mmapDict == ZSTD_ps_enable; 1115*3117ece4Schristos int forceNoUseMMap = prefs->mmapDict == ZSTD_ps_disable; 1116*3117ece4Schristos FIO_dictBufferType_t dictBufferType; 1117*3117ece4Schristos cRess_t ress; 1118*3117ece4Schristos memset(&ress, 0, sizeof(ress)); 1119*3117ece4Schristos 1120*3117ece4Schristos DISPLAYLEVEL(6, "FIO_createCResources \n"); 1121*3117ece4Schristos ress.cctx = ZSTD_createCCtx(); 1122*3117ece4Schristos if (ress.cctx == NULL) 1123*3117ece4Schristos EXM_THROW(30, "allocation error (%s): can't create ZSTD_CCtx", 1124*3117ece4Schristos strerror(errno)); 1125*3117ece4Schristos 1126*3117ece4Schristos FIO_getDictFileStat(dictFileName, &ress.dictFileStat); 1127*3117ece4Schristos 1128*3117ece4Schristos /* need to update memLimit before calling createDictBuffer 1129*3117ece4Schristos * because of memLimit check inside it */ 1130*3117ece4Schristos if (prefs->patchFromMode) { 1131*3117ece4Schristos U64 const dictSize = UTIL_getFileSizeStat(&ress.dictFileStat); 1132*3117ece4Schristos unsigned long long const ssSize = (unsigned long long)prefs->streamSrcSize; 1133*3117ece4Schristos useMMap |= dictSize > prefs->memLimit; 1134*3117ece4Schristos FIO_adjustParamsForPatchFromMode(prefs, &comprParams, dictSize, ssSize > 0 ? ssSize : maxSrcFileSize, cLevel); 1135*3117ece4Schristos } 1136*3117ece4Schristos 1137*3117ece4Schristos dictBufferType = (useMMap && !forceNoUseMMap) ? FIO_mmapDict : FIO_mallocDict; 1138*3117ece4Schristos FIO_initDict(&ress.dict, dictFileName, prefs, &ress.dictFileStat, dictBufferType); /* works with dictFileName==NULL */ 1139*3117ece4Schristos 1140*3117ece4Schristos ress.writeCtx = AIO_WritePool_create(prefs, ZSTD_CStreamOutSize()); 1141*3117ece4Schristos ress.readCtx = AIO_ReadPool_create(prefs, ZSTD_CStreamInSize()); 1142*3117ece4Schristos 1143*3117ece4Schristos /* Advanced parameters, including dictionary */ 1144*3117ece4Schristos if (dictFileName && (ress.dict.dictBuffer==NULL)) 1145*3117ece4Schristos EXM_THROW(32, "allocation error : can't create dictBuffer"); 1146*3117ece4Schristos ress.dictFileName = dictFileName; 1147*3117ece4Schristos 1148*3117ece4Schristos if (prefs->adaptiveMode && !prefs->ldmFlag && !comprParams.windowLog) 1149*3117ece4Schristos comprParams.windowLog = ADAPT_WINDOWLOG_DEFAULT; 1150*3117ece4Schristos 1151*3117ece4Schristos CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_contentSizeFlag, prefs->contentSize) ); /* always enable content size when available (note: supposed to be default) */ 1152*3117ece4Schristos CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_dictIDFlag, prefs->dictIDFlag) ); 1153*3117ece4Schristos CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_checksumFlag, prefs->checksumFlag) ); 1154*3117ece4Schristos /* compression level */ 1155*3117ece4Schristos CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_compressionLevel, cLevel) ); 1156*3117ece4Schristos /* max compressed block size */ 1157*3117ece4Schristos CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_targetCBlockSize, (int)prefs->targetCBlockSize) ); 1158*3117ece4Schristos /* source size hint */ 1159*3117ece4Schristos CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_srcSizeHint, (int)prefs->srcSizeHint) ); 1160*3117ece4Schristos /* long distance matching */ 1161*3117ece4Schristos CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_enableLongDistanceMatching, prefs->ldmFlag) ); 1162*3117ece4Schristos CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_ldmHashLog, prefs->ldmHashLog) ); 1163*3117ece4Schristos CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_ldmMinMatch, prefs->ldmMinMatch) ); 1164*3117ece4Schristos if (prefs->ldmBucketSizeLog != FIO_LDM_PARAM_NOTSET) { 1165*3117ece4Schristos CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_ldmBucketSizeLog, prefs->ldmBucketSizeLog) ); 1166*3117ece4Schristos } 1167*3117ece4Schristos if (prefs->ldmHashRateLog != FIO_LDM_PARAM_NOTSET) { 1168*3117ece4Schristos CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_ldmHashRateLog, prefs->ldmHashRateLog) ); 1169*3117ece4Schristos } 1170*3117ece4Schristos CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_useRowMatchFinder, prefs->useRowMatchFinder)); 1171*3117ece4Schristos /* compression parameters */ 1172*3117ece4Schristos CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_windowLog, (int)comprParams.windowLog) ); 1173*3117ece4Schristos CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_chainLog, (int)comprParams.chainLog) ); 1174*3117ece4Schristos CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_hashLog, (int)comprParams.hashLog) ); 1175*3117ece4Schristos CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_searchLog, (int)comprParams.searchLog) ); 1176*3117ece4Schristos CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_minMatch, (int)comprParams.minMatch) ); 1177*3117ece4Schristos CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_targetLength, (int)comprParams.targetLength) ); 1178*3117ece4Schristos CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_strategy, (int)comprParams.strategy) ); 1179*3117ece4Schristos CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_literalCompressionMode, (int)prefs->literalCompressionMode) ); 1180*3117ece4Schristos CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_enableDedicatedDictSearch, 1) ); 1181*3117ece4Schristos /* multi-threading */ 1182*3117ece4Schristos #ifdef ZSTD_MULTITHREAD 1183*3117ece4Schristos DISPLAYLEVEL(5,"set nb workers = %u \n", prefs->nbWorkers); 1184*3117ece4Schristos CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_nbWorkers, prefs->nbWorkers) ); 1185*3117ece4Schristos CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_jobSize, prefs->blockSize) ); 1186*3117ece4Schristos if (prefs->overlapLog != FIO_OVERLAP_LOG_NOTSET) { 1187*3117ece4Schristos DISPLAYLEVEL(3,"set overlapLog = %u \n", prefs->overlapLog); 1188*3117ece4Schristos CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_overlapLog, prefs->overlapLog) ); 1189*3117ece4Schristos } 1190*3117ece4Schristos CHECK( ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_rsyncable, prefs->rsyncable) ); 1191*3117ece4Schristos #endif 1192*3117ece4Schristos /* dictionary */ 1193*3117ece4Schristos if (prefs->patchFromMode) { 1194*3117ece4Schristos CHECK( ZSTD_CCtx_refPrefix(ress.cctx, ress.dict.dictBuffer, ress.dict.dictBufferSize) ); 1195*3117ece4Schristos } else { 1196*3117ece4Schristos CHECK( ZSTD_CCtx_loadDictionary_byReference(ress.cctx, ress.dict.dictBuffer, ress.dict.dictBufferSize) ); 1197*3117ece4Schristos } 1198*3117ece4Schristos 1199*3117ece4Schristos return ress; 1200*3117ece4Schristos } 1201*3117ece4Schristos 1202*3117ece4Schristos static void FIO_freeCResources(cRess_t* const ress) 1203*3117ece4Schristos { 1204*3117ece4Schristos FIO_freeDict(&(ress->dict)); 1205*3117ece4Schristos AIO_WritePool_free(ress->writeCtx); 1206*3117ece4Schristos AIO_ReadPool_free(ress->readCtx); 1207*3117ece4Schristos ZSTD_freeCStream(ress->cctx); /* never fails */ 1208*3117ece4Schristos } 1209*3117ece4Schristos 1210*3117ece4Schristos 1211*3117ece4Schristos #ifdef ZSTD_GZCOMPRESS 1212*3117ece4Schristos static unsigned long long 1213*3117ece4Schristos FIO_compressGzFrame(const cRess_t* ress, /* buffers & handlers are used, but not changed */ 1214*3117ece4Schristos const char* srcFileName, U64 const srcFileSize, 1215*3117ece4Schristos int compressionLevel, U64* readsize) 1216*3117ece4Schristos { 1217*3117ece4Schristos unsigned long long inFileSize = 0, outFileSize = 0; 1218*3117ece4Schristos z_stream strm; 1219*3117ece4Schristos IOJob_t *writeJob = NULL; 1220*3117ece4Schristos 1221*3117ece4Schristos if (compressionLevel > Z_BEST_COMPRESSION) 1222*3117ece4Schristos compressionLevel = Z_BEST_COMPRESSION; 1223*3117ece4Schristos 1224*3117ece4Schristos strm.zalloc = Z_NULL; 1225*3117ece4Schristos strm.zfree = Z_NULL; 1226*3117ece4Schristos strm.opaque = Z_NULL; 1227*3117ece4Schristos 1228*3117ece4Schristos { int const ret = deflateInit2(&strm, compressionLevel, Z_DEFLATED, 1229*3117ece4Schristos 15 /* maxWindowLogSize */ + 16 /* gzip only */, 1230*3117ece4Schristos 8, Z_DEFAULT_STRATEGY); /* see https://www.zlib.net/manual.html */ 1231*3117ece4Schristos if (ret != Z_OK) { 1232*3117ece4Schristos EXM_THROW(71, "zstd: %s: deflateInit2 error %d \n", srcFileName, ret); 1233*3117ece4Schristos } } 1234*3117ece4Schristos 1235*3117ece4Schristos writeJob = AIO_WritePool_acquireJob(ress->writeCtx); 1236*3117ece4Schristos strm.next_in = 0; 1237*3117ece4Schristos strm.avail_in = 0; 1238*3117ece4Schristos strm.next_out = (Bytef*)writeJob->buffer; 1239*3117ece4Schristos strm.avail_out = (uInt)writeJob->bufferSize; 1240*3117ece4Schristos 1241*3117ece4Schristos while (1) { 1242*3117ece4Schristos int ret; 1243*3117ece4Schristos if (strm.avail_in == 0) { 1244*3117ece4Schristos AIO_ReadPool_fillBuffer(ress->readCtx, ZSTD_CStreamInSize()); 1245*3117ece4Schristos if (ress->readCtx->srcBufferLoaded == 0) break; 1246*3117ece4Schristos inFileSize += ress->readCtx->srcBufferLoaded; 1247*3117ece4Schristos strm.next_in = (z_const unsigned char*)ress->readCtx->srcBuffer; 1248*3117ece4Schristos strm.avail_in = (uInt)ress->readCtx->srcBufferLoaded; 1249*3117ece4Schristos } 1250*3117ece4Schristos 1251*3117ece4Schristos { 1252*3117ece4Schristos size_t const availBefore = strm.avail_in; 1253*3117ece4Schristos ret = deflate(&strm, Z_NO_FLUSH); 1254*3117ece4Schristos AIO_ReadPool_consumeBytes(ress->readCtx, availBefore - strm.avail_in); 1255*3117ece4Schristos } 1256*3117ece4Schristos 1257*3117ece4Schristos if (ret != Z_OK) 1258*3117ece4Schristos EXM_THROW(72, "zstd: %s: deflate error %d \n", srcFileName, ret); 1259*3117ece4Schristos { size_t const cSize = writeJob->bufferSize - strm.avail_out; 1260*3117ece4Schristos if (cSize) { 1261*3117ece4Schristos writeJob->usedBufferSize = cSize; 1262*3117ece4Schristos AIO_WritePool_enqueueAndReacquireWriteJob(&writeJob); 1263*3117ece4Schristos outFileSize += cSize; 1264*3117ece4Schristos strm.next_out = (Bytef*)writeJob->buffer; 1265*3117ece4Schristos strm.avail_out = (uInt)writeJob->bufferSize; 1266*3117ece4Schristos } } 1267*3117ece4Schristos if (srcFileSize == UTIL_FILESIZE_UNKNOWN) { 1268*3117ece4Schristos DISPLAYUPDATE_PROGRESS( 1269*3117ece4Schristos "\rRead : %u MB ==> %.2f%% ", 1270*3117ece4Schristos (unsigned)(inFileSize>>20), 1271*3117ece4Schristos (double)outFileSize/(double)inFileSize*100) 1272*3117ece4Schristos } else { 1273*3117ece4Schristos DISPLAYUPDATE_PROGRESS( 1274*3117ece4Schristos "\rRead : %u / %u MB ==> %.2f%% ", 1275*3117ece4Schristos (unsigned)(inFileSize>>20), (unsigned)(srcFileSize>>20), 1276*3117ece4Schristos (double)outFileSize/(double)inFileSize*100); 1277*3117ece4Schristos } } 1278*3117ece4Schristos 1279*3117ece4Schristos while (1) { 1280*3117ece4Schristos int const ret = deflate(&strm, Z_FINISH); 1281*3117ece4Schristos { size_t const cSize = writeJob->bufferSize - strm.avail_out; 1282*3117ece4Schristos if (cSize) { 1283*3117ece4Schristos writeJob->usedBufferSize = cSize; 1284*3117ece4Schristos AIO_WritePool_enqueueAndReacquireWriteJob(&writeJob); 1285*3117ece4Schristos outFileSize += cSize; 1286*3117ece4Schristos strm.next_out = (Bytef*)writeJob->buffer; 1287*3117ece4Schristos strm.avail_out = (uInt)writeJob->bufferSize; 1288*3117ece4Schristos } } 1289*3117ece4Schristos if (ret == Z_STREAM_END) break; 1290*3117ece4Schristos if (ret != Z_BUF_ERROR) 1291*3117ece4Schristos EXM_THROW(77, "zstd: %s: deflate error %d \n", srcFileName, ret); 1292*3117ece4Schristos } 1293*3117ece4Schristos 1294*3117ece4Schristos { int const ret = deflateEnd(&strm); 1295*3117ece4Schristos if (ret != Z_OK) { 1296*3117ece4Schristos EXM_THROW(79, "zstd: %s: deflateEnd error %d \n", srcFileName, ret); 1297*3117ece4Schristos } } 1298*3117ece4Schristos *readsize = inFileSize; 1299*3117ece4Schristos AIO_WritePool_releaseIoJob(writeJob); 1300*3117ece4Schristos AIO_WritePool_sparseWriteEnd(ress->writeCtx); 1301*3117ece4Schristos return outFileSize; 1302*3117ece4Schristos } 1303*3117ece4Schristos #endif 1304*3117ece4Schristos 1305*3117ece4Schristos 1306*3117ece4Schristos #ifdef ZSTD_LZMACOMPRESS 1307*3117ece4Schristos static unsigned long long 1308*3117ece4Schristos FIO_compressLzmaFrame(cRess_t* ress, 1309*3117ece4Schristos const char* srcFileName, U64 const srcFileSize, 1310*3117ece4Schristos int compressionLevel, U64* readsize, int plain_lzma) 1311*3117ece4Schristos { 1312*3117ece4Schristos unsigned long long inFileSize = 0, outFileSize = 0; 1313*3117ece4Schristos lzma_stream strm = LZMA_STREAM_INIT; 1314*3117ece4Schristos lzma_action action = LZMA_RUN; 1315*3117ece4Schristos lzma_ret ret; 1316*3117ece4Schristos IOJob_t *writeJob = NULL; 1317*3117ece4Schristos 1318*3117ece4Schristos if (compressionLevel < 0) compressionLevel = 0; 1319*3117ece4Schristos if (compressionLevel > 9) compressionLevel = 9; 1320*3117ece4Schristos 1321*3117ece4Schristos if (plain_lzma) { 1322*3117ece4Schristos lzma_options_lzma opt_lzma; 1323*3117ece4Schristos if (lzma_lzma_preset(&opt_lzma, compressionLevel)) 1324*3117ece4Schristos EXM_THROW(81, "zstd: %s: lzma_lzma_preset error", srcFileName); 1325*3117ece4Schristos ret = lzma_alone_encoder(&strm, &opt_lzma); /* LZMA */ 1326*3117ece4Schristos if (ret != LZMA_OK) 1327*3117ece4Schristos EXM_THROW(82, "zstd: %s: lzma_alone_encoder error %d", srcFileName, ret); 1328*3117ece4Schristos } else { 1329*3117ece4Schristos ret = lzma_easy_encoder(&strm, compressionLevel, LZMA_CHECK_CRC64); /* XZ */ 1330*3117ece4Schristos if (ret != LZMA_OK) 1331*3117ece4Schristos EXM_THROW(83, "zstd: %s: lzma_easy_encoder error %d", srcFileName, ret); 1332*3117ece4Schristos } 1333*3117ece4Schristos 1334*3117ece4Schristos writeJob =AIO_WritePool_acquireJob(ress->writeCtx); 1335*3117ece4Schristos strm.next_out = (BYTE*)writeJob->buffer; 1336*3117ece4Schristos strm.avail_out = writeJob->bufferSize; 1337*3117ece4Schristos strm.next_in = 0; 1338*3117ece4Schristos strm.avail_in = 0; 1339*3117ece4Schristos 1340*3117ece4Schristos while (1) { 1341*3117ece4Schristos if (strm.avail_in == 0) { 1342*3117ece4Schristos size_t const inSize = AIO_ReadPool_fillBuffer(ress->readCtx, ZSTD_CStreamInSize()); 1343*3117ece4Schristos if (ress->readCtx->srcBufferLoaded == 0) action = LZMA_FINISH; 1344*3117ece4Schristos inFileSize += inSize; 1345*3117ece4Schristos strm.next_in = (BYTE const*)ress->readCtx->srcBuffer; 1346*3117ece4Schristos strm.avail_in = ress->readCtx->srcBufferLoaded; 1347*3117ece4Schristos } 1348*3117ece4Schristos 1349*3117ece4Schristos { 1350*3117ece4Schristos size_t const availBefore = strm.avail_in; 1351*3117ece4Schristos ret = lzma_code(&strm, action); 1352*3117ece4Schristos AIO_ReadPool_consumeBytes(ress->readCtx, availBefore - strm.avail_in); 1353*3117ece4Schristos } 1354*3117ece4Schristos 1355*3117ece4Schristos 1356*3117ece4Schristos if (ret != LZMA_OK && ret != LZMA_STREAM_END) 1357*3117ece4Schristos EXM_THROW(84, "zstd: %s: lzma_code encoding error %d", srcFileName, ret); 1358*3117ece4Schristos { size_t const compBytes = writeJob->bufferSize - strm.avail_out; 1359*3117ece4Schristos if (compBytes) { 1360*3117ece4Schristos writeJob->usedBufferSize = compBytes; 1361*3117ece4Schristos AIO_WritePool_enqueueAndReacquireWriteJob(&writeJob); 1362*3117ece4Schristos outFileSize += compBytes; 1363*3117ece4Schristos strm.next_out = (BYTE*)writeJob->buffer; 1364*3117ece4Schristos strm.avail_out = writeJob->bufferSize; 1365*3117ece4Schristos } } 1366*3117ece4Schristos if (srcFileSize == UTIL_FILESIZE_UNKNOWN) 1367*3117ece4Schristos DISPLAYUPDATE_PROGRESS("\rRead : %u MB ==> %.2f%%", 1368*3117ece4Schristos (unsigned)(inFileSize>>20), 1369*3117ece4Schristos (double)outFileSize/(double)inFileSize*100) 1370*3117ece4Schristos else 1371*3117ece4Schristos DISPLAYUPDATE_PROGRESS("\rRead : %u / %u MB ==> %.2f%%", 1372*3117ece4Schristos (unsigned)(inFileSize>>20), (unsigned)(srcFileSize>>20), 1373*3117ece4Schristos (double)outFileSize/(double)inFileSize*100); 1374*3117ece4Schristos if (ret == LZMA_STREAM_END) break; 1375*3117ece4Schristos } 1376*3117ece4Schristos 1377*3117ece4Schristos lzma_end(&strm); 1378*3117ece4Schristos *readsize = inFileSize; 1379*3117ece4Schristos 1380*3117ece4Schristos AIO_WritePool_releaseIoJob(writeJob); 1381*3117ece4Schristos AIO_WritePool_sparseWriteEnd(ress->writeCtx); 1382*3117ece4Schristos 1383*3117ece4Schristos return outFileSize; 1384*3117ece4Schristos } 1385*3117ece4Schristos #endif 1386*3117ece4Schristos 1387*3117ece4Schristos #ifdef ZSTD_LZ4COMPRESS 1388*3117ece4Schristos 1389*3117ece4Schristos #if LZ4_VERSION_NUMBER <= 10600 1390*3117ece4Schristos #define LZ4F_blockLinked blockLinked 1391*3117ece4Schristos #define LZ4F_max64KB max64KB 1392*3117ece4Schristos #endif 1393*3117ece4Schristos 1394*3117ece4Schristos static int FIO_LZ4_GetBlockSize_FromBlockId (int id) { return (1 << (8 + (2 * id))); } 1395*3117ece4Schristos 1396*3117ece4Schristos static unsigned long long 1397*3117ece4Schristos FIO_compressLz4Frame(cRess_t* ress, 1398*3117ece4Schristos const char* srcFileName, U64 const srcFileSize, 1399*3117ece4Schristos int compressionLevel, int checksumFlag, 1400*3117ece4Schristos U64* readsize) 1401*3117ece4Schristos { 1402*3117ece4Schristos const size_t blockSize = FIO_LZ4_GetBlockSize_FromBlockId(LZ4F_max64KB); 1403*3117ece4Schristos unsigned long long inFileSize = 0, outFileSize = 0; 1404*3117ece4Schristos 1405*3117ece4Schristos LZ4F_preferences_t prefs; 1406*3117ece4Schristos LZ4F_compressionContext_t ctx; 1407*3117ece4Schristos 1408*3117ece4Schristos IOJob_t* writeJob = AIO_WritePool_acquireJob(ress->writeCtx); 1409*3117ece4Schristos 1410*3117ece4Schristos LZ4F_errorCode_t const errorCode = LZ4F_createCompressionContext(&ctx, LZ4F_VERSION); 1411*3117ece4Schristos if (LZ4F_isError(errorCode)) 1412*3117ece4Schristos EXM_THROW(31, "zstd: failed to create lz4 compression context"); 1413*3117ece4Schristos 1414*3117ece4Schristos memset(&prefs, 0, sizeof(prefs)); 1415*3117ece4Schristos 1416*3117ece4Schristos assert(blockSize <= ress->readCtx->base.jobBufferSize); 1417*3117ece4Schristos 1418*3117ece4Schristos /* autoflush off to mitigate a bug in lz4<=1.9.3 for compression level 12 */ 1419*3117ece4Schristos prefs.autoFlush = 0; 1420*3117ece4Schristos prefs.compressionLevel = compressionLevel; 1421*3117ece4Schristos prefs.frameInfo.blockMode = LZ4F_blockLinked; 1422*3117ece4Schristos prefs.frameInfo.blockSizeID = LZ4F_max64KB; 1423*3117ece4Schristos prefs.frameInfo.contentChecksumFlag = (contentChecksum_t)checksumFlag; 1424*3117ece4Schristos #if LZ4_VERSION_NUMBER >= 10600 1425*3117ece4Schristos prefs.frameInfo.contentSize = (srcFileSize==UTIL_FILESIZE_UNKNOWN) ? 0 : srcFileSize; 1426*3117ece4Schristos #endif 1427*3117ece4Schristos assert(LZ4F_compressBound(blockSize, &prefs) <= writeJob->bufferSize); 1428*3117ece4Schristos 1429*3117ece4Schristos { 1430*3117ece4Schristos size_t headerSize = LZ4F_compressBegin(ctx, writeJob->buffer, writeJob->bufferSize, &prefs); 1431*3117ece4Schristos if (LZ4F_isError(headerSize)) 1432*3117ece4Schristos EXM_THROW(33, "File header generation failed : %s", 1433*3117ece4Schristos LZ4F_getErrorName(headerSize)); 1434*3117ece4Schristos writeJob->usedBufferSize = headerSize; 1435*3117ece4Schristos AIO_WritePool_enqueueAndReacquireWriteJob(&writeJob); 1436*3117ece4Schristos outFileSize += headerSize; 1437*3117ece4Schristos 1438*3117ece4Schristos /* Read first block */ 1439*3117ece4Schristos inFileSize += AIO_ReadPool_fillBuffer(ress->readCtx, blockSize); 1440*3117ece4Schristos 1441*3117ece4Schristos /* Main Loop */ 1442*3117ece4Schristos while (ress->readCtx->srcBufferLoaded) { 1443*3117ece4Schristos size_t inSize = MIN(blockSize, ress->readCtx->srcBufferLoaded); 1444*3117ece4Schristos size_t const outSize = LZ4F_compressUpdate(ctx, writeJob->buffer, writeJob->bufferSize, 1445*3117ece4Schristos ress->readCtx->srcBuffer, inSize, NULL); 1446*3117ece4Schristos if (LZ4F_isError(outSize)) 1447*3117ece4Schristos EXM_THROW(35, "zstd: %s: lz4 compression failed : %s", 1448*3117ece4Schristos srcFileName, LZ4F_getErrorName(outSize)); 1449*3117ece4Schristos outFileSize += outSize; 1450*3117ece4Schristos if (srcFileSize == UTIL_FILESIZE_UNKNOWN) { 1451*3117ece4Schristos DISPLAYUPDATE_PROGRESS("\rRead : %u MB ==> %.2f%%", 1452*3117ece4Schristos (unsigned)(inFileSize>>20), 1453*3117ece4Schristos (double)outFileSize/(double)inFileSize*100) 1454*3117ece4Schristos } else { 1455*3117ece4Schristos DISPLAYUPDATE_PROGRESS("\rRead : %u / %u MB ==> %.2f%%", 1456*3117ece4Schristos (unsigned)(inFileSize>>20), (unsigned)(srcFileSize>>20), 1457*3117ece4Schristos (double)outFileSize/(double)inFileSize*100); 1458*3117ece4Schristos } 1459*3117ece4Schristos 1460*3117ece4Schristos /* Write Block */ 1461*3117ece4Schristos writeJob->usedBufferSize = outSize; 1462*3117ece4Schristos AIO_WritePool_enqueueAndReacquireWriteJob(&writeJob); 1463*3117ece4Schristos 1464*3117ece4Schristos /* Read next block */ 1465*3117ece4Schristos AIO_ReadPool_consumeBytes(ress->readCtx, inSize); 1466*3117ece4Schristos inFileSize += AIO_ReadPool_fillBuffer(ress->readCtx, blockSize); 1467*3117ece4Schristos } 1468*3117ece4Schristos 1469*3117ece4Schristos /* End of Stream mark */ 1470*3117ece4Schristos headerSize = LZ4F_compressEnd(ctx, writeJob->buffer, writeJob->bufferSize, NULL); 1471*3117ece4Schristos if (LZ4F_isError(headerSize)) 1472*3117ece4Schristos EXM_THROW(38, "zstd: %s: lz4 end of file generation failed : %s", 1473*3117ece4Schristos srcFileName, LZ4F_getErrorName(headerSize)); 1474*3117ece4Schristos 1475*3117ece4Schristos writeJob->usedBufferSize = headerSize; 1476*3117ece4Schristos AIO_WritePool_enqueueAndReacquireWriteJob(&writeJob); 1477*3117ece4Schristos outFileSize += headerSize; 1478*3117ece4Schristos } 1479*3117ece4Schristos 1480*3117ece4Schristos *readsize = inFileSize; 1481*3117ece4Schristos LZ4F_freeCompressionContext(ctx); 1482*3117ece4Schristos AIO_WritePool_releaseIoJob(writeJob); 1483*3117ece4Schristos AIO_WritePool_sparseWriteEnd(ress->writeCtx); 1484*3117ece4Schristos 1485*3117ece4Schristos return outFileSize; 1486*3117ece4Schristos } 1487*3117ece4Schristos #endif 1488*3117ece4Schristos 1489*3117ece4Schristos static unsigned long long 1490*3117ece4Schristos FIO_compressZstdFrame(FIO_ctx_t* const fCtx, 1491*3117ece4Schristos FIO_prefs_t* const prefs, 1492*3117ece4Schristos const cRess_t* ressPtr, 1493*3117ece4Schristos const char* srcFileName, U64 fileSize, 1494*3117ece4Schristos int compressionLevel, U64* readsize) 1495*3117ece4Schristos { 1496*3117ece4Schristos cRess_t const ress = *ressPtr; 1497*3117ece4Schristos IOJob_t *writeJob = AIO_WritePool_acquireJob(ressPtr->writeCtx); 1498*3117ece4Schristos 1499*3117ece4Schristos U64 compressedfilesize = 0; 1500*3117ece4Schristos ZSTD_EndDirective directive = ZSTD_e_continue; 1501*3117ece4Schristos U64 pledgedSrcSize = ZSTD_CONTENTSIZE_UNKNOWN; 1502*3117ece4Schristos 1503*3117ece4Schristos /* stats */ 1504*3117ece4Schristos ZSTD_frameProgression previous_zfp_update = { 0, 0, 0, 0, 0, 0 }; 1505*3117ece4Schristos ZSTD_frameProgression previous_zfp_correction = { 0, 0, 0, 0, 0, 0 }; 1506*3117ece4Schristos typedef enum { noChange, slower, faster } speedChange_e; 1507*3117ece4Schristos speedChange_e speedChange = noChange; 1508*3117ece4Schristos unsigned flushWaiting = 0; 1509*3117ece4Schristos unsigned inputPresented = 0; 1510*3117ece4Schristos unsigned inputBlocked = 0; 1511*3117ece4Schristos unsigned lastJobID = 0; 1512*3117ece4Schristos UTIL_time_t lastAdaptTime = UTIL_getTime(); 1513*3117ece4Schristos U64 const adaptEveryMicro = REFRESH_RATE; 1514*3117ece4Schristos 1515*3117ece4Schristos UTIL_HumanReadableSize_t const file_hrs = UTIL_makeHumanReadableSize(fileSize); 1516*3117ece4Schristos 1517*3117ece4Schristos DISPLAYLEVEL(6, "compression using zstd format \n"); 1518*3117ece4Schristos 1519*3117ece4Schristos /* init */ 1520*3117ece4Schristos if (fileSize != UTIL_FILESIZE_UNKNOWN) { 1521*3117ece4Schristos pledgedSrcSize = fileSize; 1522*3117ece4Schristos CHECK(ZSTD_CCtx_setPledgedSrcSize(ress.cctx, fileSize)); 1523*3117ece4Schristos } else if (prefs->streamSrcSize > 0) { 1524*3117ece4Schristos /* unknown source size; use the declared stream size */ 1525*3117ece4Schristos pledgedSrcSize = prefs->streamSrcSize; 1526*3117ece4Schristos CHECK( ZSTD_CCtx_setPledgedSrcSize(ress.cctx, prefs->streamSrcSize) ); 1527*3117ece4Schristos } 1528*3117ece4Schristos 1529*3117ece4Schristos { 1530*3117ece4Schristos int windowLog; 1531*3117ece4Schristos UTIL_HumanReadableSize_t windowSize; 1532*3117ece4Schristos CHECK(ZSTD_CCtx_getParameter(ress.cctx, ZSTD_c_windowLog, &windowLog)); 1533*3117ece4Schristos if (windowLog == 0) { 1534*3117ece4Schristos if (prefs->ldmFlag) { 1535*3117ece4Schristos /* If long mode is set without a window size libzstd will set this size internally */ 1536*3117ece4Schristos windowLog = ZSTD_WINDOWLOG_LIMIT_DEFAULT; 1537*3117ece4Schristos } else { 1538*3117ece4Schristos const ZSTD_compressionParameters cParams = ZSTD_getCParams(compressionLevel, fileSize, 0); 1539*3117ece4Schristos windowLog = (int)cParams.windowLog; 1540*3117ece4Schristos } 1541*3117ece4Schristos } 1542*3117ece4Schristos windowSize = UTIL_makeHumanReadableSize(MAX(1ULL, MIN(1ULL << windowLog, pledgedSrcSize))); 1543*3117ece4Schristos DISPLAYLEVEL(4, "Decompression will require %.*f%s of memory\n", windowSize.precision, windowSize.value, windowSize.suffix); 1544*3117ece4Schristos } 1545*3117ece4Schristos (void)srcFileName; 1546*3117ece4Schristos 1547*3117ece4Schristos /* Main compression loop */ 1548*3117ece4Schristos do { 1549*3117ece4Schristos size_t stillToFlush; 1550*3117ece4Schristos /* Fill input Buffer */ 1551*3117ece4Schristos size_t const inSize = AIO_ReadPool_fillBuffer(ress.readCtx, ZSTD_CStreamInSize()); 1552*3117ece4Schristos ZSTD_inBuffer inBuff = setInBuffer( ress.readCtx->srcBuffer, ress.readCtx->srcBufferLoaded, 0 ); 1553*3117ece4Schristos DISPLAYLEVEL(6, "fread %u bytes from source \n", (unsigned)inSize); 1554*3117ece4Schristos *readsize += inSize; 1555*3117ece4Schristos 1556*3117ece4Schristos if ((ress.readCtx->srcBufferLoaded == 0) || (*readsize == fileSize)) 1557*3117ece4Schristos directive = ZSTD_e_end; 1558*3117ece4Schristos 1559*3117ece4Schristos stillToFlush = 1; 1560*3117ece4Schristos while ((inBuff.pos != inBuff.size) /* input buffer must be entirely ingested */ 1561*3117ece4Schristos || (directive == ZSTD_e_end && stillToFlush != 0) ) { 1562*3117ece4Schristos 1563*3117ece4Schristos size_t const oldIPos = inBuff.pos; 1564*3117ece4Schristos ZSTD_outBuffer outBuff = setOutBuffer( writeJob->buffer, writeJob->bufferSize, 0 ); 1565*3117ece4Schristos size_t const toFlushNow = ZSTD_toFlushNow(ress.cctx); 1566*3117ece4Schristos CHECK_V(stillToFlush, ZSTD_compressStream2(ress.cctx, &outBuff, &inBuff, directive)); 1567*3117ece4Schristos AIO_ReadPool_consumeBytes(ress.readCtx, inBuff.pos - oldIPos); 1568*3117ece4Schristos 1569*3117ece4Schristos /* count stats */ 1570*3117ece4Schristos inputPresented++; 1571*3117ece4Schristos if (oldIPos == inBuff.pos) inputBlocked++; /* input buffer is full and can't take any more : input speed is faster than consumption rate */ 1572*3117ece4Schristos if (!toFlushNow) flushWaiting = 1; 1573*3117ece4Schristos 1574*3117ece4Schristos /* Write compressed stream */ 1575*3117ece4Schristos DISPLAYLEVEL(6, "ZSTD_compress_generic(end:%u) => input pos(%u)<=(%u)size ; output generated %u bytes \n", 1576*3117ece4Schristos (unsigned)directive, (unsigned)inBuff.pos, (unsigned)inBuff.size, (unsigned)outBuff.pos); 1577*3117ece4Schristos if (outBuff.pos) { 1578*3117ece4Schristos writeJob->usedBufferSize = outBuff.pos; 1579*3117ece4Schristos AIO_WritePool_enqueueAndReacquireWriteJob(&writeJob); 1580*3117ece4Schristos compressedfilesize += outBuff.pos; 1581*3117ece4Schristos } 1582*3117ece4Schristos 1583*3117ece4Schristos /* adaptive mode : statistics measurement and speed correction */ 1584*3117ece4Schristos if (prefs->adaptiveMode && UTIL_clockSpanMicro(lastAdaptTime) > adaptEveryMicro) { 1585*3117ece4Schristos ZSTD_frameProgression const zfp = ZSTD_getFrameProgression(ress.cctx); 1586*3117ece4Schristos 1587*3117ece4Schristos lastAdaptTime = UTIL_getTime(); 1588*3117ece4Schristos 1589*3117ece4Schristos /* check output speed */ 1590*3117ece4Schristos if (zfp.currentJobID > 1) { /* only possible if nbWorkers >= 1 */ 1591*3117ece4Schristos 1592*3117ece4Schristos unsigned long long newlyProduced = zfp.produced - previous_zfp_update.produced; 1593*3117ece4Schristos unsigned long long newlyFlushed = zfp.flushed - previous_zfp_update.flushed; 1594*3117ece4Schristos assert(zfp.produced >= previous_zfp_update.produced); 1595*3117ece4Schristos assert(prefs->nbWorkers >= 1); 1596*3117ece4Schristos 1597*3117ece4Schristos /* test if compression is blocked 1598*3117ece4Schristos * either because output is slow and all buffers are full 1599*3117ece4Schristos * or because input is slow and no job can start while waiting for at least one buffer to be filled. 1600*3117ece4Schristos * note : exclude starting part, since currentJobID > 1 */ 1601*3117ece4Schristos if ( (zfp.consumed == previous_zfp_update.consumed) /* no data compressed : no data available, or no more buffer to compress to, OR compression is really slow (compression of a single block is slower than update rate)*/ 1602*3117ece4Schristos && (zfp.nbActiveWorkers == 0) /* confirmed : no compression ongoing */ 1603*3117ece4Schristos ) { 1604*3117ece4Schristos DISPLAYLEVEL(6, "all buffers full : compression stopped => slow down \n") 1605*3117ece4Schristos speedChange = slower; 1606*3117ece4Schristos } 1607*3117ece4Schristos 1608*3117ece4Schristos previous_zfp_update = zfp; 1609*3117ece4Schristos 1610*3117ece4Schristos if ( (newlyProduced > (newlyFlushed * 9 / 8)) /* compression produces more data than output can flush (though production can be spiky, due to work unit : (N==4)*block sizes) */ 1611*3117ece4Schristos && (flushWaiting == 0) /* flush speed was never slowed by lack of production, so it's operating at max capacity */ 1612*3117ece4Schristos ) { 1613*3117ece4Schristos DISPLAYLEVEL(6, "compression faster than flush (%llu > %llu), and flushed was never slowed down by lack of production => slow down \n", newlyProduced, newlyFlushed); 1614*3117ece4Schristos speedChange = slower; 1615*3117ece4Schristos } 1616*3117ece4Schristos flushWaiting = 0; 1617*3117ece4Schristos } 1618*3117ece4Schristos 1619*3117ece4Schristos /* course correct only if there is at least one new job completed */ 1620*3117ece4Schristos if (zfp.currentJobID > lastJobID) { 1621*3117ece4Schristos DISPLAYLEVEL(6, "compression level adaptation check \n") 1622*3117ece4Schristos 1623*3117ece4Schristos /* check input speed */ 1624*3117ece4Schristos if (zfp.currentJobID > (unsigned)(prefs->nbWorkers+1)) { /* warm up period, to fill all workers */ 1625*3117ece4Schristos if (inputBlocked <= 0) { 1626*3117ece4Schristos DISPLAYLEVEL(6, "input is never blocked => input is slower than ingestion \n"); 1627*3117ece4Schristos speedChange = slower; 1628*3117ece4Schristos } else if (speedChange == noChange) { 1629*3117ece4Schristos unsigned long long newlyIngested = zfp.ingested - previous_zfp_correction.ingested; 1630*3117ece4Schristos unsigned long long newlyConsumed = zfp.consumed - previous_zfp_correction.consumed; 1631*3117ece4Schristos unsigned long long newlyProduced = zfp.produced - previous_zfp_correction.produced; 1632*3117ece4Schristos unsigned long long newlyFlushed = zfp.flushed - previous_zfp_correction.flushed; 1633*3117ece4Schristos previous_zfp_correction = zfp; 1634*3117ece4Schristos assert(inputPresented > 0); 1635*3117ece4Schristos DISPLAYLEVEL(6, "input blocked %u/%u(%.2f) - ingested:%u vs %u:consumed - flushed:%u vs %u:produced \n", 1636*3117ece4Schristos inputBlocked, inputPresented, (double)inputBlocked/inputPresented*100, 1637*3117ece4Schristos (unsigned)newlyIngested, (unsigned)newlyConsumed, 1638*3117ece4Schristos (unsigned)newlyFlushed, (unsigned)newlyProduced); 1639*3117ece4Schristos if ( (inputBlocked > inputPresented / 8) /* input is waiting often, because input buffers is full : compression or output too slow */ 1640*3117ece4Schristos && (newlyFlushed * 33 / 32 > newlyProduced) /* flush everything that is produced */ 1641*3117ece4Schristos && (newlyIngested * 33 / 32 > newlyConsumed) /* input speed as fast or faster than compression speed */ 1642*3117ece4Schristos ) { 1643*3117ece4Schristos DISPLAYLEVEL(6, "recommend faster as in(%llu) >= (%llu)comp(%llu) <= out(%llu) \n", 1644*3117ece4Schristos newlyIngested, newlyConsumed, newlyProduced, newlyFlushed); 1645*3117ece4Schristos speedChange = faster; 1646*3117ece4Schristos } 1647*3117ece4Schristos } 1648*3117ece4Schristos inputBlocked = 0; 1649*3117ece4Schristos inputPresented = 0; 1650*3117ece4Schristos } 1651*3117ece4Schristos 1652*3117ece4Schristos if (speedChange == slower) { 1653*3117ece4Schristos DISPLAYLEVEL(6, "slower speed , higher compression \n") 1654*3117ece4Schristos compressionLevel ++; 1655*3117ece4Schristos if (compressionLevel > ZSTD_maxCLevel()) compressionLevel = ZSTD_maxCLevel(); 1656*3117ece4Schristos if (compressionLevel > prefs->maxAdaptLevel) compressionLevel = prefs->maxAdaptLevel; 1657*3117ece4Schristos compressionLevel += (compressionLevel == 0); /* skip 0 */ 1658*3117ece4Schristos ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_compressionLevel, compressionLevel); 1659*3117ece4Schristos } 1660*3117ece4Schristos if (speedChange == faster) { 1661*3117ece4Schristos DISPLAYLEVEL(6, "faster speed , lighter compression \n") 1662*3117ece4Schristos compressionLevel --; 1663*3117ece4Schristos if (compressionLevel < prefs->minAdaptLevel) compressionLevel = prefs->minAdaptLevel; 1664*3117ece4Schristos compressionLevel -= (compressionLevel == 0); /* skip 0 */ 1665*3117ece4Schristos ZSTD_CCtx_setParameter(ress.cctx, ZSTD_c_compressionLevel, compressionLevel); 1666*3117ece4Schristos } 1667*3117ece4Schristos speedChange = noChange; 1668*3117ece4Schristos 1669*3117ece4Schristos lastJobID = zfp.currentJobID; 1670*3117ece4Schristos } /* if (zfp.currentJobID > lastJobID) */ 1671*3117ece4Schristos } /* if (prefs->adaptiveMode && UTIL_clockSpanMicro(lastAdaptTime) > adaptEveryMicro) */ 1672*3117ece4Schristos 1673*3117ece4Schristos /* display notification */ 1674*3117ece4Schristos if (SHOULD_DISPLAY_PROGRESS() && READY_FOR_UPDATE()) { 1675*3117ece4Schristos ZSTD_frameProgression const zfp = ZSTD_getFrameProgression(ress.cctx); 1676*3117ece4Schristos double const cShare = (double)zfp.produced / (double)(zfp.consumed + !zfp.consumed/*avoid div0*/) * 100; 1677*3117ece4Schristos UTIL_HumanReadableSize_t const buffered_hrs = UTIL_makeHumanReadableSize(zfp.ingested - zfp.consumed); 1678*3117ece4Schristos UTIL_HumanReadableSize_t const consumed_hrs = UTIL_makeHumanReadableSize(zfp.consumed); 1679*3117ece4Schristos UTIL_HumanReadableSize_t const produced_hrs = UTIL_makeHumanReadableSize(zfp.produced); 1680*3117ece4Schristos 1681*3117ece4Schristos DELAY_NEXT_UPDATE(); 1682*3117ece4Schristos 1683*3117ece4Schristos /* display progress notifications */ 1684*3117ece4Schristos DISPLAY_PROGRESS("\r%79s\r", ""); /* Clear out the current displayed line */ 1685*3117ece4Schristos if (g_display_prefs.displayLevel >= 3) { 1686*3117ece4Schristos /* Verbose progress update */ 1687*3117ece4Schristos DISPLAY_PROGRESS( 1688*3117ece4Schristos "(L%i) Buffered:%5.*f%s - Consumed:%5.*f%s - Compressed:%5.*f%s => %.2f%% ", 1689*3117ece4Schristos compressionLevel, 1690*3117ece4Schristos buffered_hrs.precision, buffered_hrs.value, buffered_hrs.suffix, 1691*3117ece4Schristos consumed_hrs.precision, consumed_hrs.value, consumed_hrs.suffix, 1692*3117ece4Schristos produced_hrs.precision, produced_hrs.value, produced_hrs.suffix, 1693*3117ece4Schristos cShare ); 1694*3117ece4Schristos } else { 1695*3117ece4Schristos /* Require level 2 or forcibly displayed progress counter for summarized updates */ 1696*3117ece4Schristos if (fCtx->nbFilesTotal > 1) { 1697*3117ece4Schristos size_t srcFileNameSize = strlen(srcFileName); 1698*3117ece4Schristos /* Ensure that the string we print is roughly the same size each time */ 1699*3117ece4Schristos if (srcFileNameSize > 18) { 1700*3117ece4Schristos const char* truncatedSrcFileName = srcFileName + srcFileNameSize - 15; 1701*3117ece4Schristos DISPLAY_PROGRESS("Compress: %u/%u files. Current: ...%s ", 1702*3117ece4Schristos fCtx->currFileIdx+1, fCtx->nbFilesTotal, truncatedSrcFileName); 1703*3117ece4Schristos } else { 1704*3117ece4Schristos DISPLAY_PROGRESS("Compress: %u/%u files. Current: %*s ", 1705*3117ece4Schristos fCtx->currFileIdx+1, fCtx->nbFilesTotal, (int)(18-srcFileNameSize), srcFileName); 1706*3117ece4Schristos } 1707*3117ece4Schristos } 1708*3117ece4Schristos DISPLAY_PROGRESS("Read:%6.*f%4s ", consumed_hrs.precision, consumed_hrs.value, consumed_hrs.suffix); 1709*3117ece4Schristos if (fileSize != UTIL_FILESIZE_UNKNOWN) 1710*3117ece4Schristos DISPLAY_PROGRESS("/%6.*f%4s", file_hrs.precision, file_hrs.value, file_hrs.suffix); 1711*3117ece4Schristos DISPLAY_PROGRESS(" ==> %2.f%%", cShare); 1712*3117ece4Schristos } 1713*3117ece4Schristos } /* if (SHOULD_DISPLAY_PROGRESS() && READY_FOR_UPDATE()) */ 1714*3117ece4Schristos } /* while ((inBuff.pos != inBuff.size) */ 1715*3117ece4Schristos } while (directive != ZSTD_e_end); 1716*3117ece4Schristos 1717*3117ece4Schristos if (fileSize != UTIL_FILESIZE_UNKNOWN && *readsize != fileSize) { 1718*3117ece4Schristos EXM_THROW(27, "Read error : Incomplete read : %llu / %llu B", 1719*3117ece4Schristos (unsigned long long)*readsize, (unsigned long long)fileSize); 1720*3117ece4Schristos } 1721*3117ece4Schristos 1722*3117ece4Schristos AIO_WritePool_releaseIoJob(writeJob); 1723*3117ece4Schristos AIO_WritePool_sparseWriteEnd(ressPtr->writeCtx); 1724*3117ece4Schristos 1725*3117ece4Schristos return compressedfilesize; 1726*3117ece4Schristos } 1727*3117ece4Schristos 1728*3117ece4Schristos /*! FIO_compressFilename_internal() : 1729*3117ece4Schristos * same as FIO_compressFilename_extRess(), with `ress.desFile` already opened. 1730*3117ece4Schristos * @return : 0 : compression completed correctly, 1731*3117ece4Schristos * 1 : missing or pb opening srcFileName 1732*3117ece4Schristos */ 1733*3117ece4Schristos static int 1734*3117ece4Schristos FIO_compressFilename_internal(FIO_ctx_t* const fCtx, 1735*3117ece4Schristos FIO_prefs_t* const prefs, 1736*3117ece4Schristos cRess_t ress, 1737*3117ece4Schristos const char* dstFileName, const char* srcFileName, 1738*3117ece4Schristos int compressionLevel) 1739*3117ece4Schristos { 1740*3117ece4Schristos UTIL_time_t const timeStart = UTIL_getTime(); 1741*3117ece4Schristos clock_t const cpuStart = clock(); 1742*3117ece4Schristos U64 readsize = 0; 1743*3117ece4Schristos U64 compressedfilesize = 0; 1744*3117ece4Schristos U64 const fileSize = UTIL_getFileSize(srcFileName); 1745*3117ece4Schristos DISPLAYLEVEL(5, "%s: %llu bytes \n", srcFileName, (unsigned long long)fileSize); 1746*3117ece4Schristos 1747*3117ece4Schristos /* compression format selection */ 1748*3117ece4Schristos switch (prefs->compressionType) { 1749*3117ece4Schristos default: 1750*3117ece4Schristos case FIO_zstdCompression: 1751*3117ece4Schristos compressedfilesize = FIO_compressZstdFrame(fCtx, prefs, &ress, srcFileName, fileSize, compressionLevel, &readsize); 1752*3117ece4Schristos break; 1753*3117ece4Schristos 1754*3117ece4Schristos case FIO_gzipCompression: 1755*3117ece4Schristos #ifdef ZSTD_GZCOMPRESS 1756*3117ece4Schristos compressedfilesize = FIO_compressGzFrame(&ress, srcFileName, fileSize, compressionLevel, &readsize); 1757*3117ece4Schristos #else 1758*3117ece4Schristos (void)compressionLevel; 1759*3117ece4Schristos EXM_THROW(20, "zstd: %s: file cannot be compressed as gzip (zstd compiled without ZSTD_GZCOMPRESS) -- ignored \n", 1760*3117ece4Schristos srcFileName); 1761*3117ece4Schristos #endif 1762*3117ece4Schristos break; 1763*3117ece4Schristos 1764*3117ece4Schristos case FIO_xzCompression: 1765*3117ece4Schristos case FIO_lzmaCompression: 1766*3117ece4Schristos #ifdef ZSTD_LZMACOMPRESS 1767*3117ece4Schristos compressedfilesize = FIO_compressLzmaFrame(&ress, srcFileName, fileSize, compressionLevel, &readsize, prefs->compressionType==FIO_lzmaCompression); 1768*3117ece4Schristos #else 1769*3117ece4Schristos (void)compressionLevel; 1770*3117ece4Schristos EXM_THROW(20, "zstd: %s: file cannot be compressed as xz/lzma (zstd compiled without ZSTD_LZMACOMPRESS) -- ignored \n", 1771*3117ece4Schristos srcFileName); 1772*3117ece4Schristos #endif 1773*3117ece4Schristos break; 1774*3117ece4Schristos 1775*3117ece4Schristos case FIO_lz4Compression: 1776*3117ece4Schristos #ifdef ZSTD_LZ4COMPRESS 1777*3117ece4Schristos compressedfilesize = FIO_compressLz4Frame(&ress, srcFileName, fileSize, compressionLevel, prefs->checksumFlag, &readsize); 1778*3117ece4Schristos #else 1779*3117ece4Schristos (void)compressionLevel; 1780*3117ece4Schristos EXM_THROW(20, "zstd: %s: file cannot be compressed as lz4 (zstd compiled without ZSTD_LZ4COMPRESS) -- ignored \n", 1781*3117ece4Schristos srcFileName); 1782*3117ece4Schristos #endif 1783*3117ece4Schristos break; 1784*3117ece4Schristos } 1785*3117ece4Schristos 1786*3117ece4Schristos /* Status */ 1787*3117ece4Schristos fCtx->totalBytesInput += (size_t)readsize; 1788*3117ece4Schristos fCtx->totalBytesOutput += (size_t)compressedfilesize; 1789*3117ece4Schristos DISPLAY_PROGRESS("\r%79s\r", ""); 1790*3117ece4Schristos if (FIO_shouldDisplayFileSummary(fCtx)) { 1791*3117ece4Schristos UTIL_HumanReadableSize_t hr_isize = UTIL_makeHumanReadableSize((U64) readsize); 1792*3117ece4Schristos UTIL_HumanReadableSize_t hr_osize = UTIL_makeHumanReadableSize((U64) compressedfilesize); 1793*3117ece4Schristos if (readsize == 0) { 1794*3117ece4Schristos DISPLAY_SUMMARY("%-20s : (%6.*f%s => %6.*f%s, %s) \n", 1795*3117ece4Schristos srcFileName, 1796*3117ece4Schristos hr_isize.precision, hr_isize.value, hr_isize.suffix, 1797*3117ece4Schristos hr_osize.precision, hr_osize.value, hr_osize.suffix, 1798*3117ece4Schristos dstFileName); 1799*3117ece4Schristos } else { 1800*3117ece4Schristos DISPLAY_SUMMARY("%-20s :%6.2f%% (%6.*f%s => %6.*f%s, %s) \n", 1801*3117ece4Schristos srcFileName, 1802*3117ece4Schristos (double)compressedfilesize / (double)readsize * 100, 1803*3117ece4Schristos hr_isize.precision, hr_isize.value, hr_isize.suffix, 1804*3117ece4Schristos hr_osize.precision, hr_osize.value, hr_osize.suffix, 1805*3117ece4Schristos dstFileName); 1806*3117ece4Schristos } 1807*3117ece4Schristos } 1808*3117ece4Schristos 1809*3117ece4Schristos /* Elapsed Time and CPU Load */ 1810*3117ece4Schristos { clock_t const cpuEnd = clock(); 1811*3117ece4Schristos double const cpuLoad_s = (double)(cpuEnd - cpuStart) / CLOCKS_PER_SEC; 1812*3117ece4Schristos U64 const timeLength_ns = UTIL_clockSpanNano(timeStart); 1813*3117ece4Schristos double const timeLength_s = (double)timeLength_ns / 1000000000; 1814*3117ece4Schristos double const cpuLoad_pct = (cpuLoad_s / timeLength_s) * 100; 1815*3117ece4Schristos DISPLAYLEVEL(4, "%-20s : Completed in %.2f sec (cpu load : %.0f%%)\n", 1816*3117ece4Schristos srcFileName, timeLength_s, cpuLoad_pct); 1817*3117ece4Schristos } 1818*3117ece4Schristos return 0; 1819*3117ece4Schristos } 1820*3117ece4Schristos 1821*3117ece4Schristos 1822*3117ece4Schristos /*! FIO_compressFilename_dstFile() : 1823*3117ece4Schristos * open dstFileName, or pass-through if ress.file != NULL, 1824*3117ece4Schristos * then start compression with FIO_compressFilename_internal(). 1825*3117ece4Schristos * Manages source removal (--rm) and file permissions transfer. 1826*3117ece4Schristos * note : ress.srcFile must be != NULL, 1827*3117ece4Schristos * so reach this function through FIO_compressFilename_srcFile(). 1828*3117ece4Schristos * @return : 0 : compression completed correctly, 1829*3117ece4Schristos * 1 : pb 1830*3117ece4Schristos */ 1831*3117ece4Schristos static int FIO_compressFilename_dstFile(FIO_ctx_t* const fCtx, 1832*3117ece4Schristos FIO_prefs_t* const prefs, 1833*3117ece4Schristos cRess_t ress, 1834*3117ece4Schristos const char* dstFileName, 1835*3117ece4Schristos const char* srcFileName, 1836*3117ece4Schristos const stat_t* srcFileStat, 1837*3117ece4Schristos int compressionLevel) 1838*3117ece4Schristos { 1839*3117ece4Schristos int closeDstFile = 0; 1840*3117ece4Schristos int result; 1841*3117ece4Schristos int transferStat = 0; 1842*3117ece4Schristos int dstFd = -1; 1843*3117ece4Schristos 1844*3117ece4Schristos assert(AIO_ReadPool_getFile(ress.readCtx) != NULL); 1845*3117ece4Schristos if (AIO_WritePool_getFile(ress.writeCtx) == NULL) { 1846*3117ece4Schristos int dstFileInitialPermissions = DEFAULT_FILE_PERMISSIONS; 1847*3117ece4Schristos if ( strcmp (srcFileName, stdinmark) 1848*3117ece4Schristos && strcmp (dstFileName, stdoutmark) 1849*3117ece4Schristos && UTIL_isRegularFileStat(srcFileStat) ) { 1850*3117ece4Schristos transferStat = 1; 1851*3117ece4Schristos dstFileInitialPermissions = TEMPORARY_FILE_PERMISSIONS; 1852*3117ece4Schristos } 1853*3117ece4Schristos 1854*3117ece4Schristos closeDstFile = 1; 1855*3117ece4Schristos DISPLAYLEVEL(6, "FIO_compressFilename_dstFile: opening dst: %s \n", dstFileName); 1856*3117ece4Schristos { FILE *dstFile = FIO_openDstFile(fCtx, prefs, srcFileName, dstFileName, dstFileInitialPermissions); 1857*3117ece4Schristos if (dstFile==NULL) return 1; /* could not open dstFileName */ 1858*3117ece4Schristos dstFd = fileno(dstFile); 1859*3117ece4Schristos AIO_WritePool_setFile(ress.writeCtx, dstFile); 1860*3117ece4Schristos } 1861*3117ece4Schristos /* Must only be added after FIO_openDstFile() succeeds. 1862*3117ece4Schristos * Otherwise we may delete the destination file if it already exists, 1863*3117ece4Schristos * and the user presses Ctrl-C when asked if they wish to overwrite. 1864*3117ece4Schristos */ 1865*3117ece4Schristos addHandler(dstFileName); 1866*3117ece4Schristos } 1867*3117ece4Schristos 1868*3117ece4Schristos result = FIO_compressFilename_internal(fCtx, prefs, ress, dstFileName, srcFileName, compressionLevel); 1869*3117ece4Schristos 1870*3117ece4Schristos if (closeDstFile) { 1871*3117ece4Schristos clearHandler(); 1872*3117ece4Schristos 1873*3117ece4Schristos if (transferStat) { 1874*3117ece4Schristos UTIL_setFDStat(dstFd, dstFileName, srcFileStat); 1875*3117ece4Schristos } 1876*3117ece4Schristos 1877*3117ece4Schristos DISPLAYLEVEL(6, "FIO_compressFilename_dstFile: closing dst: %s \n", dstFileName); 1878*3117ece4Schristos if (AIO_WritePool_closeFile(ress.writeCtx)) { /* error closing file */ 1879*3117ece4Schristos DISPLAYLEVEL(1, "zstd: %s: %s \n", dstFileName, strerror(errno)); 1880*3117ece4Schristos result=1; 1881*3117ece4Schristos } 1882*3117ece4Schristos 1883*3117ece4Schristos if (transferStat) { 1884*3117ece4Schristos UTIL_utime(dstFileName, srcFileStat); 1885*3117ece4Schristos } 1886*3117ece4Schristos 1887*3117ece4Schristos if ( (result != 0) /* operation failure */ 1888*3117ece4Schristos && strcmp(dstFileName, stdoutmark) /* special case : don't remove() stdout */ 1889*3117ece4Schristos ) { 1890*3117ece4Schristos FIO_removeFile(dstFileName); /* remove compression artefact; note don't do anything special if remove() fails */ 1891*3117ece4Schristos } 1892*3117ece4Schristos } 1893*3117ece4Schristos 1894*3117ece4Schristos return result; 1895*3117ece4Schristos } 1896*3117ece4Schristos 1897*3117ece4Schristos /* List used to compare file extensions (used with --exclude-compressed flag) 1898*3117ece4Schristos * Different from the suffixList and should only apply to ZSTD compress operationResult 1899*3117ece4Schristos */ 1900*3117ece4Schristos static const char *compressedFileExtensions[] = { 1901*3117ece4Schristos ZSTD_EXTENSION, 1902*3117ece4Schristos TZSTD_EXTENSION, 1903*3117ece4Schristos GZ_EXTENSION, 1904*3117ece4Schristos TGZ_EXTENSION, 1905*3117ece4Schristos LZMA_EXTENSION, 1906*3117ece4Schristos XZ_EXTENSION, 1907*3117ece4Schristos TXZ_EXTENSION, 1908*3117ece4Schristos LZ4_EXTENSION, 1909*3117ece4Schristos TLZ4_EXTENSION, 1910*3117ece4Schristos ".7z", 1911*3117ece4Schristos ".aa3", 1912*3117ece4Schristos ".aac", 1913*3117ece4Schristos ".aar", 1914*3117ece4Schristos ".ace", 1915*3117ece4Schristos ".alac", 1916*3117ece4Schristos ".ape", 1917*3117ece4Schristos ".apk", 1918*3117ece4Schristos ".apng", 1919*3117ece4Schristos ".arc", 1920*3117ece4Schristos ".archive", 1921*3117ece4Schristos ".arj", 1922*3117ece4Schristos ".ark", 1923*3117ece4Schristos ".asf", 1924*3117ece4Schristos ".avi", 1925*3117ece4Schristos ".avif", 1926*3117ece4Schristos ".ba", 1927*3117ece4Schristos ".br", 1928*3117ece4Schristos ".bz2", 1929*3117ece4Schristos ".cab", 1930*3117ece4Schristos ".cdx", 1931*3117ece4Schristos ".chm", 1932*3117ece4Schristos ".cr2", 1933*3117ece4Schristos ".divx", 1934*3117ece4Schristos ".dmg", 1935*3117ece4Schristos ".dng", 1936*3117ece4Schristos ".docm", 1937*3117ece4Schristos ".docx", 1938*3117ece4Schristos ".dotm", 1939*3117ece4Schristos ".dotx", 1940*3117ece4Schristos ".dsft", 1941*3117ece4Schristos ".ear", 1942*3117ece4Schristos ".eftx", 1943*3117ece4Schristos ".emz", 1944*3117ece4Schristos ".eot", 1945*3117ece4Schristos ".epub", 1946*3117ece4Schristos ".f4v", 1947*3117ece4Schristos ".flac", 1948*3117ece4Schristos ".flv", 1949*3117ece4Schristos ".gho", 1950*3117ece4Schristos ".gif", 1951*3117ece4Schristos ".gifv", 1952*3117ece4Schristos ".gnp", 1953*3117ece4Schristos ".iso", 1954*3117ece4Schristos ".jar", 1955*3117ece4Schristos ".jpeg", 1956*3117ece4Schristos ".jpg", 1957*3117ece4Schristos ".jxl", 1958*3117ece4Schristos ".lz", 1959*3117ece4Schristos ".lzh", 1960*3117ece4Schristos ".m4a", 1961*3117ece4Schristos ".m4v", 1962*3117ece4Schristos ".mkv", 1963*3117ece4Schristos ".mov", 1964*3117ece4Schristos ".mp2", 1965*3117ece4Schristos ".mp3", 1966*3117ece4Schristos ".mp4", 1967*3117ece4Schristos ".mpa", 1968*3117ece4Schristos ".mpc", 1969*3117ece4Schristos ".mpe", 1970*3117ece4Schristos ".mpeg", 1971*3117ece4Schristos ".mpg", 1972*3117ece4Schristos ".mpl", 1973*3117ece4Schristos ".mpv", 1974*3117ece4Schristos ".msi", 1975*3117ece4Schristos ".odp", 1976*3117ece4Schristos ".ods", 1977*3117ece4Schristos ".odt", 1978*3117ece4Schristos ".ogg", 1979*3117ece4Schristos ".ogv", 1980*3117ece4Schristos ".otp", 1981*3117ece4Schristos ".ots", 1982*3117ece4Schristos ".ott", 1983*3117ece4Schristos ".pea", 1984*3117ece4Schristos ".png", 1985*3117ece4Schristos ".pptx", 1986*3117ece4Schristos ".qt", 1987*3117ece4Schristos ".rar", 1988*3117ece4Schristos ".s7z", 1989*3117ece4Schristos ".sfx", 1990*3117ece4Schristos ".sit", 1991*3117ece4Schristos ".sitx", 1992*3117ece4Schristos ".sqx", 1993*3117ece4Schristos ".svgz", 1994*3117ece4Schristos ".swf", 1995*3117ece4Schristos ".tbz2", 1996*3117ece4Schristos ".tib", 1997*3117ece4Schristos ".tlz", 1998*3117ece4Schristos ".vob", 1999*3117ece4Schristos ".war", 2000*3117ece4Schristos ".webm", 2001*3117ece4Schristos ".webp", 2002*3117ece4Schristos ".wma", 2003*3117ece4Schristos ".wmv", 2004*3117ece4Schristos ".woff", 2005*3117ece4Schristos ".woff2", 2006*3117ece4Schristos ".wvl", 2007*3117ece4Schristos ".xlsx", 2008*3117ece4Schristos ".xpi", 2009*3117ece4Schristos ".xps", 2010*3117ece4Schristos ".zip", 2011*3117ece4Schristos ".zipx", 2012*3117ece4Schristos ".zoo", 2013*3117ece4Schristos ".zpaq", 2014*3117ece4Schristos NULL 2015*3117ece4Schristos }; 2016*3117ece4Schristos 2017*3117ece4Schristos /*! FIO_compressFilename_srcFile() : 2018*3117ece4Schristos * @return : 0 : compression completed correctly, 2019*3117ece4Schristos * 1 : missing or pb opening srcFileName 2020*3117ece4Schristos */ 2021*3117ece4Schristos static int 2022*3117ece4Schristos FIO_compressFilename_srcFile(FIO_ctx_t* const fCtx, 2023*3117ece4Schristos FIO_prefs_t* const prefs, 2024*3117ece4Schristos cRess_t ress, 2025*3117ece4Schristos const char* dstFileName, 2026*3117ece4Schristos const char* srcFileName, 2027*3117ece4Schristos int compressionLevel) 2028*3117ece4Schristos { 2029*3117ece4Schristos int result; 2030*3117ece4Schristos FILE* srcFile; 2031*3117ece4Schristos stat_t srcFileStat; 2032*3117ece4Schristos U64 fileSize = UTIL_FILESIZE_UNKNOWN; 2033*3117ece4Schristos DISPLAYLEVEL(6, "FIO_compressFilename_srcFile: %s \n", srcFileName); 2034*3117ece4Schristos 2035*3117ece4Schristos if (strcmp(srcFileName, stdinmark)) { 2036*3117ece4Schristos if (UTIL_stat(srcFileName, &srcFileStat)) { 2037*3117ece4Schristos /* failure to stat at all is handled during opening */ 2038*3117ece4Schristos 2039*3117ece4Schristos /* ensure src is not a directory */ 2040*3117ece4Schristos if (UTIL_isDirectoryStat(&srcFileStat)) { 2041*3117ece4Schristos DISPLAYLEVEL(1, "zstd: %s is a directory -- ignored \n", srcFileName); 2042*3117ece4Schristos return 1; 2043*3117ece4Schristos } 2044*3117ece4Schristos 2045*3117ece4Schristos /* ensure src is not the same as dict (if present) */ 2046*3117ece4Schristos if (ress.dictFileName != NULL && UTIL_isSameFileStat(srcFileName, ress.dictFileName, &srcFileStat, &ress.dictFileStat)) { 2047*3117ece4Schristos DISPLAYLEVEL(1, "zstd: cannot use %s as an input file and dictionary \n", srcFileName); 2048*3117ece4Schristos return 1; 2049*3117ece4Schristos } 2050*3117ece4Schristos } 2051*3117ece4Schristos } 2052*3117ece4Schristos 2053*3117ece4Schristos /* Check if "srcFile" is compressed. Only done if --exclude-compressed flag is used 2054*3117ece4Schristos * YES => ZSTD will skip compression of the file and will return 0. 2055*3117ece4Schristos * NO => ZSTD will resume with compress operation. 2056*3117ece4Schristos */ 2057*3117ece4Schristos if (prefs->excludeCompressedFiles == 1 && UTIL_isCompressedFile(srcFileName, compressedFileExtensions)) { 2058*3117ece4Schristos DISPLAYLEVEL(4, "File is already compressed : %s \n", srcFileName); 2059*3117ece4Schristos return 0; 2060*3117ece4Schristos } 2061*3117ece4Schristos 2062*3117ece4Schristos srcFile = FIO_openSrcFile(prefs, srcFileName, &srcFileStat); 2063*3117ece4Schristos if (srcFile == NULL) return 1; /* srcFile could not be opened */ 2064*3117ece4Schristos 2065*3117ece4Schristos /* Don't use AsyncIO for small files */ 2066*3117ece4Schristos if (strcmp(srcFileName, stdinmark)) /* Stdin doesn't have stats */ 2067*3117ece4Schristos fileSize = UTIL_getFileSizeStat(&srcFileStat); 2068*3117ece4Schristos if(fileSize != UTIL_FILESIZE_UNKNOWN && fileSize < ZSTD_BLOCKSIZE_MAX * 3) { 2069*3117ece4Schristos AIO_ReadPool_setAsync(ress.readCtx, 0); 2070*3117ece4Schristos AIO_WritePool_setAsync(ress.writeCtx, 0); 2071*3117ece4Schristos } else { 2072*3117ece4Schristos AIO_ReadPool_setAsync(ress.readCtx, 1); 2073*3117ece4Schristos AIO_WritePool_setAsync(ress.writeCtx, 1); 2074*3117ece4Schristos } 2075*3117ece4Schristos 2076*3117ece4Schristos AIO_ReadPool_setFile(ress.readCtx, srcFile); 2077*3117ece4Schristos result = FIO_compressFilename_dstFile( 2078*3117ece4Schristos fCtx, prefs, ress, 2079*3117ece4Schristos dstFileName, srcFileName, 2080*3117ece4Schristos &srcFileStat, compressionLevel); 2081*3117ece4Schristos AIO_ReadPool_closeFile(ress.readCtx); 2082*3117ece4Schristos 2083*3117ece4Schristos if ( prefs->removeSrcFile /* --rm */ 2084*3117ece4Schristos && result == 0 /* success */ 2085*3117ece4Schristos && strcmp(srcFileName, stdinmark) /* exception : don't erase stdin */ 2086*3117ece4Schristos ) { 2087*3117ece4Schristos /* We must clear the handler, since after this point calling it would 2088*3117ece4Schristos * delete both the source and destination files. 2089*3117ece4Schristos */ 2090*3117ece4Schristos clearHandler(); 2091*3117ece4Schristos if (FIO_removeFile(srcFileName)) 2092*3117ece4Schristos EXM_THROW(1, "zstd: %s: %s", srcFileName, strerror(errno)); 2093*3117ece4Schristos } 2094*3117ece4Schristos return result; 2095*3117ece4Schristos } 2096*3117ece4Schristos 2097*3117ece4Schristos static const char* 2098*3117ece4Schristos checked_index(const char* options[], size_t length, size_t index) { 2099*3117ece4Schristos assert(index < length); 2100*3117ece4Schristos /* Necessary to avoid warnings since -O3 will omit the above `assert` */ 2101*3117ece4Schristos (void) length; 2102*3117ece4Schristos return options[index]; 2103*3117ece4Schristos } 2104*3117ece4Schristos 2105*3117ece4Schristos #define INDEX(options, index) checked_index((options), sizeof(options) / sizeof(char*), (size_t)(index)) 2106*3117ece4Schristos 2107*3117ece4Schristos void FIO_displayCompressionParameters(const FIO_prefs_t* prefs) 2108*3117ece4Schristos { 2109*3117ece4Schristos static const char* formatOptions[5] = {ZSTD_EXTENSION, GZ_EXTENSION, XZ_EXTENSION, 2110*3117ece4Schristos LZMA_EXTENSION, LZ4_EXTENSION}; 2111*3117ece4Schristos static const char* sparseOptions[3] = {" --no-sparse", "", " --sparse"}; 2112*3117ece4Schristos static const char* checkSumOptions[3] = {" --no-check", "", " --check"}; 2113*3117ece4Schristos static const char* rowMatchFinderOptions[3] = {"", " --no-row-match-finder", " --row-match-finder"}; 2114*3117ece4Schristos static const char* compressLiteralsOptions[3] = {"", " --compress-literals", " --no-compress-literals"}; 2115*3117ece4Schristos 2116*3117ece4Schristos assert(g_display_prefs.displayLevel >= 4); 2117*3117ece4Schristos 2118*3117ece4Schristos DISPLAY("--format=%s", formatOptions[prefs->compressionType]); 2119*3117ece4Schristos DISPLAY("%s", INDEX(sparseOptions, prefs->sparseFileSupport)); 2120*3117ece4Schristos DISPLAY("%s", prefs->dictIDFlag ? "" : " --no-dictID"); 2121*3117ece4Schristos DISPLAY("%s", INDEX(checkSumOptions, prefs->checksumFlag)); 2122*3117ece4Schristos DISPLAY(" --block-size=%d", prefs->blockSize); 2123*3117ece4Schristos if (prefs->adaptiveMode) 2124*3117ece4Schristos DISPLAY(" --adapt=min=%d,max=%d", prefs->minAdaptLevel, prefs->maxAdaptLevel); 2125*3117ece4Schristos DISPLAY("%s", INDEX(rowMatchFinderOptions, prefs->useRowMatchFinder)); 2126*3117ece4Schristos DISPLAY("%s", prefs->rsyncable ? " --rsyncable" : ""); 2127*3117ece4Schristos if (prefs->streamSrcSize) 2128*3117ece4Schristos DISPLAY(" --stream-size=%u", (unsigned) prefs->streamSrcSize); 2129*3117ece4Schristos if (prefs->srcSizeHint) 2130*3117ece4Schristos DISPLAY(" --size-hint=%d", prefs->srcSizeHint); 2131*3117ece4Schristos if (prefs->targetCBlockSize) 2132*3117ece4Schristos DISPLAY(" --target-compressed-block-size=%u", (unsigned) prefs->targetCBlockSize); 2133*3117ece4Schristos DISPLAY("%s", INDEX(compressLiteralsOptions, prefs->literalCompressionMode)); 2134*3117ece4Schristos DISPLAY(" --memory=%u", prefs->memLimit ? prefs->memLimit : 128 MB); 2135*3117ece4Schristos DISPLAY(" --threads=%d", prefs->nbWorkers); 2136*3117ece4Schristos DISPLAY("%s", prefs->excludeCompressedFiles ? " --exclude-compressed" : ""); 2137*3117ece4Schristos DISPLAY(" --%scontent-size", prefs->contentSize ? "" : "no-"); 2138*3117ece4Schristos DISPLAY("\n"); 2139*3117ece4Schristos } 2140*3117ece4Schristos 2141*3117ece4Schristos #undef INDEX 2142*3117ece4Schristos 2143*3117ece4Schristos int FIO_compressFilename(FIO_ctx_t* const fCtx, FIO_prefs_t* const prefs, const char* dstFileName, 2144*3117ece4Schristos const char* srcFileName, const char* dictFileName, 2145*3117ece4Schristos int compressionLevel, ZSTD_compressionParameters comprParams) 2146*3117ece4Schristos { 2147*3117ece4Schristos cRess_t ress = FIO_createCResources(prefs, dictFileName, UTIL_getFileSize(srcFileName), compressionLevel, comprParams); 2148*3117ece4Schristos int const result = FIO_compressFilename_srcFile(fCtx, prefs, ress, dstFileName, srcFileName, compressionLevel); 2149*3117ece4Schristos 2150*3117ece4Schristos #define DISPLAY_LEVEL_DEFAULT 2 2151*3117ece4Schristos 2152*3117ece4Schristos FIO_freeCResources(&ress); 2153*3117ece4Schristos return result; 2154*3117ece4Schristos } 2155*3117ece4Schristos 2156*3117ece4Schristos /* FIO_determineCompressedName() : 2157*3117ece4Schristos * create a destination filename for compressed srcFileName. 2158*3117ece4Schristos * @return a pointer to it. 2159*3117ece4Schristos * This function never returns an error (it may abort() in case of pb) 2160*3117ece4Schristos */ 2161*3117ece4Schristos static const char* 2162*3117ece4Schristos FIO_determineCompressedName(const char* srcFileName, const char* outDirName, const char* suffix) 2163*3117ece4Schristos { 2164*3117ece4Schristos static size_t dfnbCapacity = 0; 2165*3117ece4Schristos static char* dstFileNameBuffer = NULL; /* using static allocation : this function cannot be multi-threaded */ 2166*3117ece4Schristos char* outDirFilename = NULL; 2167*3117ece4Schristos size_t sfnSize = strlen(srcFileName); 2168*3117ece4Schristos size_t const srcSuffixLen = strlen(suffix); 2169*3117ece4Schristos 2170*3117ece4Schristos if(!strcmp(srcFileName, stdinmark)) { 2171*3117ece4Schristos return stdoutmark; 2172*3117ece4Schristos } 2173*3117ece4Schristos 2174*3117ece4Schristos if (outDirName) { 2175*3117ece4Schristos outDirFilename = FIO_createFilename_fromOutDir(srcFileName, outDirName, srcSuffixLen); 2176*3117ece4Schristos sfnSize = strlen(outDirFilename); 2177*3117ece4Schristos assert(outDirFilename != NULL); 2178*3117ece4Schristos } 2179*3117ece4Schristos 2180*3117ece4Schristos if (dfnbCapacity <= sfnSize+srcSuffixLen+1) { 2181*3117ece4Schristos /* resize buffer for dstName */ 2182*3117ece4Schristos free(dstFileNameBuffer); 2183*3117ece4Schristos dfnbCapacity = sfnSize + srcSuffixLen + 30; 2184*3117ece4Schristos dstFileNameBuffer = (char*)malloc(dfnbCapacity); 2185*3117ece4Schristos if (!dstFileNameBuffer) { 2186*3117ece4Schristos EXM_THROW(30, "zstd: %s", strerror(errno)); 2187*3117ece4Schristos } 2188*3117ece4Schristos } 2189*3117ece4Schristos assert(dstFileNameBuffer != NULL); 2190*3117ece4Schristos 2191*3117ece4Schristos if (outDirFilename) { 2192*3117ece4Schristos memcpy(dstFileNameBuffer, outDirFilename, sfnSize); 2193*3117ece4Schristos free(outDirFilename); 2194*3117ece4Schristos } else { 2195*3117ece4Schristos memcpy(dstFileNameBuffer, srcFileName, sfnSize); 2196*3117ece4Schristos } 2197*3117ece4Schristos memcpy(dstFileNameBuffer+sfnSize, suffix, srcSuffixLen+1 /* Include terminating null */); 2198*3117ece4Schristos return dstFileNameBuffer; 2199*3117ece4Schristos } 2200*3117ece4Schristos 2201*3117ece4Schristos static unsigned long long FIO_getLargestFileSize(const char** inFileNames, unsigned nbFiles) 2202*3117ece4Schristos { 2203*3117ece4Schristos size_t i; 2204*3117ece4Schristos unsigned long long fileSize, maxFileSize = 0; 2205*3117ece4Schristos for (i = 0; i < nbFiles; i++) { 2206*3117ece4Schristos fileSize = UTIL_getFileSize(inFileNames[i]); 2207*3117ece4Schristos maxFileSize = fileSize > maxFileSize ? fileSize : maxFileSize; 2208*3117ece4Schristos } 2209*3117ece4Schristos return maxFileSize; 2210*3117ece4Schristos } 2211*3117ece4Schristos 2212*3117ece4Schristos /* FIO_compressMultipleFilenames() : 2213*3117ece4Schristos * compress nbFiles files 2214*3117ece4Schristos * into either one destination (outFileName), 2215*3117ece4Schristos * or into one file each (outFileName == NULL, but suffix != NULL), 2216*3117ece4Schristos * or into a destination folder (specified with -O) 2217*3117ece4Schristos */ 2218*3117ece4Schristos int FIO_compressMultipleFilenames(FIO_ctx_t* const fCtx, 2219*3117ece4Schristos FIO_prefs_t* const prefs, 2220*3117ece4Schristos const char** inFileNamesTable, 2221*3117ece4Schristos const char* outMirroredRootDirName, 2222*3117ece4Schristos const char* outDirName, 2223*3117ece4Schristos const char* outFileName, const char* suffix, 2224*3117ece4Schristos const char* dictFileName, int compressionLevel, 2225*3117ece4Schristos ZSTD_compressionParameters comprParams) 2226*3117ece4Schristos { 2227*3117ece4Schristos int status; 2228*3117ece4Schristos int error = 0; 2229*3117ece4Schristos cRess_t ress = FIO_createCResources(prefs, dictFileName, 2230*3117ece4Schristos FIO_getLargestFileSize(inFileNamesTable, (unsigned)fCtx->nbFilesTotal), 2231*3117ece4Schristos compressionLevel, comprParams); 2232*3117ece4Schristos 2233*3117ece4Schristos /* init */ 2234*3117ece4Schristos assert(outFileName != NULL || suffix != NULL); 2235*3117ece4Schristos if (outFileName != NULL) { /* output into a single destination (stdout typically) */ 2236*3117ece4Schristos FILE *dstFile; 2237*3117ece4Schristos if (FIO_multiFilesConcatWarning(fCtx, prefs, outFileName, 1 /* displayLevelCutoff */)) { 2238*3117ece4Schristos FIO_freeCResources(&ress); 2239*3117ece4Schristos return 1; 2240*3117ece4Schristos } 2241*3117ece4Schristos dstFile = FIO_openDstFile(fCtx, prefs, NULL, outFileName, DEFAULT_FILE_PERMISSIONS); 2242*3117ece4Schristos if (dstFile == NULL) { /* could not open outFileName */ 2243*3117ece4Schristos error = 1; 2244*3117ece4Schristos } else { 2245*3117ece4Schristos AIO_WritePool_setFile(ress.writeCtx, dstFile); 2246*3117ece4Schristos for (; fCtx->currFileIdx < fCtx->nbFilesTotal; ++fCtx->currFileIdx) { 2247*3117ece4Schristos status = FIO_compressFilename_srcFile(fCtx, prefs, ress, outFileName, inFileNamesTable[fCtx->currFileIdx], compressionLevel); 2248*3117ece4Schristos if (!status) fCtx->nbFilesProcessed++; 2249*3117ece4Schristos error |= status; 2250*3117ece4Schristos } 2251*3117ece4Schristos if (AIO_WritePool_closeFile(ress.writeCtx)) 2252*3117ece4Schristos EXM_THROW(29, "Write error (%s) : cannot properly close %s", 2253*3117ece4Schristos strerror(errno), outFileName); 2254*3117ece4Schristos } 2255*3117ece4Schristos } else { 2256*3117ece4Schristos if (outMirroredRootDirName) 2257*3117ece4Schristos UTIL_mirrorSourceFilesDirectories(inFileNamesTable, (unsigned)fCtx->nbFilesTotal, outMirroredRootDirName); 2258*3117ece4Schristos 2259*3117ece4Schristos for (; fCtx->currFileIdx < fCtx->nbFilesTotal; ++fCtx->currFileIdx) { 2260*3117ece4Schristos const char* const srcFileName = inFileNamesTable[fCtx->currFileIdx]; 2261*3117ece4Schristos const char* dstFileName = NULL; 2262*3117ece4Schristos if (outMirroredRootDirName) { 2263*3117ece4Schristos char* validMirroredDirName = UTIL_createMirroredDestDirName(srcFileName, outMirroredRootDirName); 2264*3117ece4Schristos if (validMirroredDirName) { 2265*3117ece4Schristos dstFileName = FIO_determineCompressedName(srcFileName, validMirroredDirName, suffix); 2266*3117ece4Schristos free(validMirroredDirName); 2267*3117ece4Schristos } else { 2268*3117ece4Schristos DISPLAYLEVEL(2, "zstd: --output-dir-mirror cannot compress '%s' into '%s' \n", srcFileName, outMirroredRootDirName); 2269*3117ece4Schristos error=1; 2270*3117ece4Schristos continue; 2271*3117ece4Schristos } 2272*3117ece4Schristos } else { 2273*3117ece4Schristos dstFileName = FIO_determineCompressedName(srcFileName, outDirName, suffix); /* cannot fail */ 2274*3117ece4Schristos } 2275*3117ece4Schristos status = FIO_compressFilename_srcFile(fCtx, prefs, ress, dstFileName, srcFileName, compressionLevel); 2276*3117ece4Schristos if (!status) fCtx->nbFilesProcessed++; 2277*3117ece4Schristos error |= status; 2278*3117ece4Schristos } 2279*3117ece4Schristos 2280*3117ece4Schristos if (outDirName) 2281*3117ece4Schristos FIO_checkFilenameCollisions(inFileNamesTable , (unsigned)fCtx->nbFilesTotal); 2282*3117ece4Schristos } 2283*3117ece4Schristos 2284*3117ece4Schristos if (FIO_shouldDisplayMultipleFileSummary(fCtx)) { 2285*3117ece4Schristos UTIL_HumanReadableSize_t hr_isize = UTIL_makeHumanReadableSize((U64) fCtx->totalBytesInput); 2286*3117ece4Schristos UTIL_HumanReadableSize_t hr_osize = UTIL_makeHumanReadableSize((U64) fCtx->totalBytesOutput); 2287*3117ece4Schristos 2288*3117ece4Schristos DISPLAY_PROGRESS("\r%79s\r", ""); 2289*3117ece4Schristos if (fCtx->totalBytesInput == 0) { 2290*3117ece4Schristos DISPLAY_SUMMARY("%3d files compressed : (%6.*f%4s => %6.*f%4s)\n", 2291*3117ece4Schristos fCtx->nbFilesProcessed, 2292*3117ece4Schristos hr_isize.precision, hr_isize.value, hr_isize.suffix, 2293*3117ece4Schristos hr_osize.precision, hr_osize.value, hr_osize.suffix); 2294*3117ece4Schristos } else { 2295*3117ece4Schristos DISPLAY_SUMMARY("%3d files compressed : %.2f%% (%6.*f%4s => %6.*f%4s)\n", 2296*3117ece4Schristos fCtx->nbFilesProcessed, 2297*3117ece4Schristos (double)fCtx->totalBytesOutput/((double)fCtx->totalBytesInput)*100, 2298*3117ece4Schristos hr_isize.precision, hr_isize.value, hr_isize.suffix, 2299*3117ece4Schristos hr_osize.precision, hr_osize.value, hr_osize.suffix); 2300*3117ece4Schristos } 2301*3117ece4Schristos } 2302*3117ece4Schristos 2303*3117ece4Schristos FIO_freeCResources(&ress); 2304*3117ece4Schristos return error; 2305*3117ece4Schristos } 2306*3117ece4Schristos 2307*3117ece4Schristos #endif /* #ifndef ZSTD_NOCOMPRESS */ 2308*3117ece4Schristos 2309*3117ece4Schristos 2310*3117ece4Schristos 2311*3117ece4Schristos #ifndef ZSTD_NODECOMPRESS 2312*3117ece4Schristos 2313*3117ece4Schristos /* ************************************************************************** 2314*3117ece4Schristos * Decompression 2315*3117ece4Schristos ***************************************************************************/ 2316*3117ece4Schristos typedef struct { 2317*3117ece4Schristos FIO_Dict_t dict; 2318*3117ece4Schristos ZSTD_DStream* dctx; 2319*3117ece4Schristos WritePoolCtx_t *writeCtx; 2320*3117ece4Schristos ReadPoolCtx_t *readCtx; 2321*3117ece4Schristos } dRess_t; 2322*3117ece4Schristos 2323*3117ece4Schristos static dRess_t FIO_createDResources(FIO_prefs_t* const prefs, const char* dictFileName) 2324*3117ece4Schristos { 2325*3117ece4Schristos int useMMap = prefs->mmapDict == ZSTD_ps_enable; 2326*3117ece4Schristos int forceNoUseMMap = prefs->mmapDict == ZSTD_ps_disable; 2327*3117ece4Schristos stat_t statbuf; 2328*3117ece4Schristos dRess_t ress; 2329*3117ece4Schristos memset(&statbuf, 0, sizeof(statbuf)); 2330*3117ece4Schristos memset(&ress, 0, sizeof(ress)); 2331*3117ece4Schristos 2332*3117ece4Schristos FIO_getDictFileStat(dictFileName, &statbuf); 2333*3117ece4Schristos 2334*3117ece4Schristos if (prefs->patchFromMode){ 2335*3117ece4Schristos U64 const dictSize = UTIL_getFileSizeStat(&statbuf); 2336*3117ece4Schristos useMMap |= dictSize > prefs->memLimit; 2337*3117ece4Schristos FIO_adjustMemLimitForPatchFromMode(prefs, dictSize, 0 /* just use the dict size */); 2338*3117ece4Schristos } 2339*3117ece4Schristos 2340*3117ece4Schristos /* Allocation */ 2341*3117ece4Schristos ress.dctx = ZSTD_createDStream(); 2342*3117ece4Schristos if (ress.dctx==NULL) 2343*3117ece4Schristos EXM_THROW(60, "Error: %s : can't create ZSTD_DStream", strerror(errno)); 2344*3117ece4Schristos CHECK( ZSTD_DCtx_setMaxWindowSize(ress.dctx, prefs->memLimit) ); 2345*3117ece4Schristos CHECK( ZSTD_DCtx_setParameter(ress.dctx, ZSTD_d_forceIgnoreChecksum, !prefs->checksumFlag)); 2346*3117ece4Schristos 2347*3117ece4Schristos /* dictionary */ 2348*3117ece4Schristos { 2349*3117ece4Schristos FIO_dictBufferType_t dictBufferType = (useMMap && !forceNoUseMMap) ? FIO_mmapDict : FIO_mallocDict; 2350*3117ece4Schristos FIO_initDict(&ress.dict, dictFileName, prefs, &statbuf, dictBufferType); 2351*3117ece4Schristos 2352*3117ece4Schristos CHECK(ZSTD_DCtx_reset(ress.dctx, ZSTD_reset_session_only) ); 2353*3117ece4Schristos 2354*3117ece4Schristos if (prefs->patchFromMode){ 2355*3117ece4Schristos CHECK(ZSTD_DCtx_refPrefix(ress.dctx, ress.dict.dictBuffer, ress.dict.dictBufferSize)); 2356*3117ece4Schristos } else { 2357*3117ece4Schristos CHECK(ZSTD_DCtx_loadDictionary_byReference(ress.dctx, ress.dict.dictBuffer, ress.dict.dictBufferSize)); 2358*3117ece4Schristos } 2359*3117ece4Schristos } 2360*3117ece4Schristos 2361*3117ece4Schristos ress.writeCtx = AIO_WritePool_create(prefs, ZSTD_DStreamOutSize()); 2362*3117ece4Schristos ress.readCtx = AIO_ReadPool_create(prefs, ZSTD_DStreamInSize()); 2363*3117ece4Schristos return ress; 2364*3117ece4Schristos } 2365*3117ece4Schristos 2366*3117ece4Schristos static void FIO_freeDResources(dRess_t ress) 2367*3117ece4Schristos { 2368*3117ece4Schristos FIO_freeDict(&(ress.dict)); 2369*3117ece4Schristos CHECK( ZSTD_freeDStream(ress.dctx) ); 2370*3117ece4Schristos AIO_WritePool_free(ress.writeCtx); 2371*3117ece4Schristos AIO_ReadPool_free(ress.readCtx); 2372*3117ece4Schristos } 2373*3117ece4Schristos 2374*3117ece4Schristos /* FIO_passThrough() : just copy input into output, for compatibility with gzip -df mode 2375*3117ece4Schristos * @return : 0 (no error) */ 2376*3117ece4Schristos static int FIO_passThrough(dRess_t *ress) 2377*3117ece4Schristos { 2378*3117ece4Schristos size_t const blockSize = MIN(MIN(64 KB, ZSTD_DStreamInSize()), ZSTD_DStreamOutSize()); 2379*3117ece4Schristos IOJob_t *writeJob = AIO_WritePool_acquireJob(ress->writeCtx); 2380*3117ece4Schristos AIO_ReadPool_fillBuffer(ress->readCtx, blockSize); 2381*3117ece4Schristos 2382*3117ece4Schristos while(ress->readCtx->srcBufferLoaded) { 2383*3117ece4Schristos size_t writeSize; 2384*3117ece4Schristos writeSize = MIN(blockSize, ress->readCtx->srcBufferLoaded); 2385*3117ece4Schristos assert(writeSize <= writeJob->bufferSize); 2386*3117ece4Schristos memcpy(writeJob->buffer, ress->readCtx->srcBuffer, writeSize); 2387*3117ece4Schristos writeJob->usedBufferSize = writeSize; 2388*3117ece4Schristos AIO_WritePool_enqueueAndReacquireWriteJob(&writeJob); 2389*3117ece4Schristos AIO_ReadPool_consumeBytes(ress->readCtx, writeSize); 2390*3117ece4Schristos AIO_ReadPool_fillBuffer(ress->readCtx, blockSize); 2391*3117ece4Schristos } 2392*3117ece4Schristos assert(ress->readCtx->reachedEof); 2393*3117ece4Schristos AIO_WritePool_releaseIoJob(writeJob); 2394*3117ece4Schristos AIO_WritePool_sparseWriteEnd(ress->writeCtx); 2395*3117ece4Schristos return 0; 2396*3117ece4Schristos } 2397*3117ece4Schristos 2398*3117ece4Schristos /* FIO_zstdErrorHelp() : 2399*3117ece4Schristos * detailed error message when requested window size is too large */ 2400*3117ece4Schristos static void 2401*3117ece4Schristos FIO_zstdErrorHelp(const FIO_prefs_t* const prefs, 2402*3117ece4Schristos const dRess_t* ress, 2403*3117ece4Schristos size_t err, 2404*3117ece4Schristos const char* srcFileName) 2405*3117ece4Schristos { 2406*3117ece4Schristos ZSTD_frameHeader header; 2407*3117ece4Schristos 2408*3117ece4Schristos /* Help message only for one specific error */ 2409*3117ece4Schristos if (ZSTD_getErrorCode(err) != ZSTD_error_frameParameter_windowTooLarge) 2410*3117ece4Schristos return; 2411*3117ece4Schristos 2412*3117ece4Schristos /* Try to decode the frame header */ 2413*3117ece4Schristos err = ZSTD_getFrameHeader(&header, ress->readCtx->srcBuffer, ress->readCtx->srcBufferLoaded); 2414*3117ece4Schristos if (err == 0) { 2415*3117ece4Schristos unsigned long long const windowSize = header.windowSize; 2416*3117ece4Schristos unsigned const windowLog = FIO_highbit64(windowSize) + ((windowSize & (windowSize - 1)) != 0); 2417*3117ece4Schristos assert(prefs->memLimit > 0); 2418*3117ece4Schristos DISPLAYLEVEL(1, "%s : Window size larger than maximum : %llu > %u \n", 2419*3117ece4Schristos srcFileName, windowSize, prefs->memLimit); 2420*3117ece4Schristos if (windowLog <= ZSTD_WINDOWLOG_MAX) { 2421*3117ece4Schristos unsigned const windowMB = (unsigned)((windowSize >> 20) + ((windowSize & ((1 MB) - 1)) != 0)); 2422*3117ece4Schristos assert(windowSize < (U64)(1ULL << 52)); /* ensure now overflow for windowMB */ 2423*3117ece4Schristos DISPLAYLEVEL(1, "%s : Use --long=%u or --memory=%uMB \n", 2424*3117ece4Schristos srcFileName, windowLog, windowMB); 2425*3117ece4Schristos return; 2426*3117ece4Schristos } } 2427*3117ece4Schristos DISPLAYLEVEL(1, "%s : Window log larger than ZSTD_WINDOWLOG_MAX=%u; not supported \n", 2428*3117ece4Schristos srcFileName, ZSTD_WINDOWLOG_MAX); 2429*3117ece4Schristos } 2430*3117ece4Schristos 2431*3117ece4Schristos /** FIO_decompressFrame() : 2432*3117ece4Schristos * @return : size of decoded zstd frame, or an error code 2433*3117ece4Schristos */ 2434*3117ece4Schristos #define FIO_ERROR_FRAME_DECODING ((unsigned long long)(-2)) 2435*3117ece4Schristos static unsigned long long 2436*3117ece4Schristos FIO_decompressZstdFrame(FIO_ctx_t* const fCtx, dRess_t* ress, 2437*3117ece4Schristos const FIO_prefs_t* const prefs, 2438*3117ece4Schristos const char* srcFileName, 2439*3117ece4Schristos U64 alreadyDecoded) /* for multi-frames streams */ 2440*3117ece4Schristos { 2441*3117ece4Schristos U64 frameSize = 0; 2442*3117ece4Schristos IOJob_t *writeJob = AIO_WritePool_acquireJob(ress->writeCtx); 2443*3117ece4Schristos 2444*3117ece4Schristos /* display last 20 characters only when not --verbose */ 2445*3117ece4Schristos { size_t const srcFileLength = strlen(srcFileName); 2446*3117ece4Schristos if ((srcFileLength>20) && (g_display_prefs.displayLevel<3)) 2447*3117ece4Schristos srcFileName += srcFileLength-20; 2448*3117ece4Schristos } 2449*3117ece4Schristos 2450*3117ece4Schristos ZSTD_DCtx_reset(ress->dctx, ZSTD_reset_session_only); 2451*3117ece4Schristos 2452*3117ece4Schristos /* Header loading : ensures ZSTD_getFrameHeader() will succeed */ 2453*3117ece4Schristos AIO_ReadPool_fillBuffer(ress->readCtx, ZSTD_FRAMEHEADERSIZE_MAX); 2454*3117ece4Schristos 2455*3117ece4Schristos /* Main decompression Loop */ 2456*3117ece4Schristos while (1) { 2457*3117ece4Schristos ZSTD_inBuffer inBuff = setInBuffer( ress->readCtx->srcBuffer, ress->readCtx->srcBufferLoaded, 0 ); 2458*3117ece4Schristos ZSTD_outBuffer outBuff= setOutBuffer( writeJob->buffer, writeJob->bufferSize, 0 ); 2459*3117ece4Schristos size_t const readSizeHint = ZSTD_decompressStream(ress->dctx, &outBuff, &inBuff); 2460*3117ece4Schristos UTIL_HumanReadableSize_t const hrs = UTIL_makeHumanReadableSize(alreadyDecoded+frameSize); 2461*3117ece4Schristos if (ZSTD_isError(readSizeHint)) { 2462*3117ece4Schristos DISPLAYLEVEL(1, "%s : Decoding error (36) : %s \n", 2463*3117ece4Schristos srcFileName, ZSTD_getErrorName(readSizeHint)); 2464*3117ece4Schristos FIO_zstdErrorHelp(prefs, ress, readSizeHint, srcFileName); 2465*3117ece4Schristos AIO_WritePool_releaseIoJob(writeJob); 2466*3117ece4Schristos return FIO_ERROR_FRAME_DECODING; 2467*3117ece4Schristos } 2468*3117ece4Schristos 2469*3117ece4Schristos /* Write block */ 2470*3117ece4Schristos writeJob->usedBufferSize = outBuff.pos; 2471*3117ece4Schristos AIO_WritePool_enqueueAndReacquireWriteJob(&writeJob); 2472*3117ece4Schristos frameSize += outBuff.pos; 2473*3117ece4Schristos if (fCtx->nbFilesTotal > 1) { 2474*3117ece4Schristos size_t srcFileNameSize = strlen(srcFileName); 2475*3117ece4Schristos if (srcFileNameSize > 18) { 2476*3117ece4Schristos const char* truncatedSrcFileName = srcFileName + srcFileNameSize - 15; 2477*3117ece4Schristos DISPLAYUPDATE_PROGRESS( 2478*3117ece4Schristos "\rDecompress: %2u/%2u files. Current: ...%s : %.*f%s... ", 2479*3117ece4Schristos fCtx->currFileIdx+1, fCtx->nbFilesTotal, truncatedSrcFileName, hrs.precision, hrs.value, hrs.suffix); 2480*3117ece4Schristos } else { 2481*3117ece4Schristos DISPLAYUPDATE_PROGRESS("\rDecompress: %2u/%2u files. Current: %s : %.*f%s... ", 2482*3117ece4Schristos fCtx->currFileIdx+1, fCtx->nbFilesTotal, srcFileName, hrs.precision, hrs.value, hrs.suffix); 2483*3117ece4Schristos } 2484*3117ece4Schristos } else { 2485*3117ece4Schristos DISPLAYUPDATE_PROGRESS("\r%-20.20s : %.*f%s... ", 2486*3117ece4Schristos srcFileName, hrs.precision, hrs.value, hrs.suffix); 2487*3117ece4Schristos } 2488*3117ece4Schristos 2489*3117ece4Schristos AIO_ReadPool_consumeBytes(ress->readCtx, inBuff.pos); 2490*3117ece4Schristos 2491*3117ece4Schristos if (readSizeHint == 0) break; /* end of frame */ 2492*3117ece4Schristos 2493*3117ece4Schristos /* Fill input buffer */ 2494*3117ece4Schristos { size_t const toDecode = MIN(readSizeHint, ZSTD_DStreamInSize()); /* support large skippable frames */ 2495*3117ece4Schristos if (ress->readCtx->srcBufferLoaded < toDecode) { 2496*3117ece4Schristos size_t const readSize = AIO_ReadPool_fillBuffer(ress->readCtx, toDecode); 2497*3117ece4Schristos if (readSize==0) { 2498*3117ece4Schristos DISPLAYLEVEL(1, "%s : Read error (39) : premature end \n", 2499*3117ece4Schristos srcFileName); 2500*3117ece4Schristos AIO_WritePool_releaseIoJob(writeJob); 2501*3117ece4Schristos return FIO_ERROR_FRAME_DECODING; 2502*3117ece4Schristos } 2503*3117ece4Schristos } } } 2504*3117ece4Schristos 2505*3117ece4Schristos AIO_WritePool_releaseIoJob(writeJob); 2506*3117ece4Schristos AIO_WritePool_sparseWriteEnd(ress->writeCtx); 2507*3117ece4Schristos 2508*3117ece4Schristos return frameSize; 2509*3117ece4Schristos } 2510*3117ece4Schristos 2511*3117ece4Schristos 2512*3117ece4Schristos #ifdef ZSTD_GZDECOMPRESS 2513*3117ece4Schristos static unsigned long long 2514*3117ece4Schristos FIO_decompressGzFrame(dRess_t* ress, const char* srcFileName) 2515*3117ece4Schristos { 2516*3117ece4Schristos unsigned long long outFileSize = 0; 2517*3117ece4Schristos z_stream strm; 2518*3117ece4Schristos int flush = Z_NO_FLUSH; 2519*3117ece4Schristos int decodingError = 0; 2520*3117ece4Schristos IOJob_t *writeJob = NULL; 2521*3117ece4Schristos 2522*3117ece4Schristos strm.zalloc = Z_NULL; 2523*3117ece4Schristos strm.zfree = Z_NULL; 2524*3117ece4Schristos strm.opaque = Z_NULL; 2525*3117ece4Schristos strm.next_in = 0; 2526*3117ece4Schristos strm.avail_in = 0; 2527*3117ece4Schristos /* see https://www.zlib.net/manual.html */ 2528*3117ece4Schristos if (inflateInit2(&strm, 15 /* maxWindowLogSize */ + 16 /* gzip only */) != Z_OK) 2529*3117ece4Schristos return FIO_ERROR_FRAME_DECODING; 2530*3117ece4Schristos 2531*3117ece4Schristos writeJob = AIO_WritePool_acquireJob(ress->writeCtx); 2532*3117ece4Schristos strm.next_out = (Bytef*)writeJob->buffer; 2533*3117ece4Schristos strm.avail_out = (uInt)writeJob->bufferSize; 2534*3117ece4Schristos strm.avail_in = (uInt)ress->readCtx->srcBufferLoaded; 2535*3117ece4Schristos strm.next_in = (z_const unsigned char*)ress->readCtx->srcBuffer; 2536*3117ece4Schristos 2537*3117ece4Schristos for ( ; ; ) { 2538*3117ece4Schristos int ret; 2539*3117ece4Schristos if (strm.avail_in == 0) { 2540*3117ece4Schristos AIO_ReadPool_consumeAndRefill(ress->readCtx); 2541*3117ece4Schristos if (ress->readCtx->srcBufferLoaded == 0) flush = Z_FINISH; 2542*3117ece4Schristos strm.next_in = (z_const unsigned char*)ress->readCtx->srcBuffer; 2543*3117ece4Schristos strm.avail_in = (uInt)ress->readCtx->srcBufferLoaded; 2544*3117ece4Schristos } 2545*3117ece4Schristos ret = inflate(&strm, flush); 2546*3117ece4Schristos if (ret == Z_BUF_ERROR) { 2547*3117ece4Schristos DISPLAYLEVEL(1, "zstd: %s: premature gz end \n", srcFileName); 2548*3117ece4Schristos decodingError = 1; break; 2549*3117ece4Schristos } 2550*3117ece4Schristos if (ret != Z_OK && ret != Z_STREAM_END) { 2551*3117ece4Schristos DISPLAYLEVEL(1, "zstd: %s: inflate error %d \n", srcFileName, ret); 2552*3117ece4Schristos decodingError = 1; break; 2553*3117ece4Schristos } 2554*3117ece4Schristos { size_t const decompBytes = writeJob->bufferSize - strm.avail_out; 2555*3117ece4Schristos if (decompBytes) { 2556*3117ece4Schristos writeJob->usedBufferSize = decompBytes; 2557*3117ece4Schristos AIO_WritePool_enqueueAndReacquireWriteJob(&writeJob); 2558*3117ece4Schristos outFileSize += decompBytes; 2559*3117ece4Schristos strm.next_out = (Bytef*)writeJob->buffer; 2560*3117ece4Schristos strm.avail_out = (uInt)writeJob->bufferSize; 2561*3117ece4Schristos } 2562*3117ece4Schristos } 2563*3117ece4Schristos if (ret == Z_STREAM_END) break; 2564*3117ece4Schristos } 2565*3117ece4Schristos 2566*3117ece4Schristos AIO_ReadPool_consumeBytes(ress->readCtx, ress->readCtx->srcBufferLoaded - strm.avail_in); 2567*3117ece4Schristos 2568*3117ece4Schristos if ( (inflateEnd(&strm) != Z_OK) /* release resources ; error detected */ 2569*3117ece4Schristos && (decodingError==0) ) { 2570*3117ece4Schristos DISPLAYLEVEL(1, "zstd: %s: inflateEnd error \n", srcFileName); 2571*3117ece4Schristos decodingError = 1; 2572*3117ece4Schristos } 2573*3117ece4Schristos AIO_WritePool_releaseIoJob(writeJob); 2574*3117ece4Schristos AIO_WritePool_sparseWriteEnd(ress->writeCtx); 2575*3117ece4Schristos return decodingError ? FIO_ERROR_FRAME_DECODING : outFileSize; 2576*3117ece4Schristos } 2577*3117ece4Schristos #endif 2578*3117ece4Schristos 2579*3117ece4Schristos #ifdef ZSTD_LZMADECOMPRESS 2580*3117ece4Schristos static unsigned long long 2581*3117ece4Schristos FIO_decompressLzmaFrame(dRess_t* ress, 2582*3117ece4Schristos const char* srcFileName, int plain_lzma) 2583*3117ece4Schristos { 2584*3117ece4Schristos unsigned long long outFileSize = 0; 2585*3117ece4Schristos lzma_stream strm = LZMA_STREAM_INIT; 2586*3117ece4Schristos lzma_action action = LZMA_RUN; 2587*3117ece4Schristos lzma_ret initRet; 2588*3117ece4Schristos int decodingError = 0; 2589*3117ece4Schristos IOJob_t *writeJob = NULL; 2590*3117ece4Schristos 2591*3117ece4Schristos strm.next_in = 0; 2592*3117ece4Schristos strm.avail_in = 0; 2593*3117ece4Schristos if (plain_lzma) { 2594*3117ece4Schristos initRet = lzma_alone_decoder(&strm, UINT64_MAX); /* LZMA */ 2595*3117ece4Schristos } else { 2596*3117ece4Schristos initRet = lzma_stream_decoder(&strm, UINT64_MAX, 0); /* XZ */ 2597*3117ece4Schristos } 2598*3117ece4Schristos 2599*3117ece4Schristos if (initRet != LZMA_OK) { 2600*3117ece4Schristos DISPLAYLEVEL(1, "zstd: %s: %s error %d \n", 2601*3117ece4Schristos plain_lzma ? "lzma_alone_decoder" : "lzma_stream_decoder", 2602*3117ece4Schristos srcFileName, initRet); 2603*3117ece4Schristos return FIO_ERROR_FRAME_DECODING; 2604*3117ece4Schristos } 2605*3117ece4Schristos 2606*3117ece4Schristos writeJob = AIO_WritePool_acquireJob(ress->writeCtx); 2607*3117ece4Schristos strm.next_out = (BYTE*)writeJob->buffer; 2608*3117ece4Schristos strm.avail_out = writeJob->bufferSize; 2609*3117ece4Schristos strm.next_in = (BYTE const*)ress->readCtx->srcBuffer; 2610*3117ece4Schristos strm.avail_in = ress->readCtx->srcBufferLoaded; 2611*3117ece4Schristos 2612*3117ece4Schristos for ( ; ; ) { 2613*3117ece4Schristos lzma_ret ret; 2614*3117ece4Schristos if (strm.avail_in == 0) { 2615*3117ece4Schristos AIO_ReadPool_consumeAndRefill(ress->readCtx); 2616*3117ece4Schristos if (ress->readCtx->srcBufferLoaded == 0) action = LZMA_FINISH; 2617*3117ece4Schristos strm.next_in = (BYTE const*)ress->readCtx->srcBuffer; 2618*3117ece4Schristos strm.avail_in = ress->readCtx->srcBufferLoaded; 2619*3117ece4Schristos } 2620*3117ece4Schristos ret = lzma_code(&strm, action); 2621*3117ece4Schristos 2622*3117ece4Schristos if (ret == LZMA_BUF_ERROR) { 2623*3117ece4Schristos DISPLAYLEVEL(1, "zstd: %s: premature lzma end \n", srcFileName); 2624*3117ece4Schristos decodingError = 1; break; 2625*3117ece4Schristos } 2626*3117ece4Schristos if (ret != LZMA_OK && ret != LZMA_STREAM_END) { 2627*3117ece4Schristos DISPLAYLEVEL(1, "zstd: %s: lzma_code decoding error %d \n", 2628*3117ece4Schristos srcFileName, ret); 2629*3117ece4Schristos decodingError = 1; break; 2630*3117ece4Schristos } 2631*3117ece4Schristos { size_t const decompBytes = writeJob->bufferSize - strm.avail_out; 2632*3117ece4Schristos if (decompBytes) { 2633*3117ece4Schristos writeJob->usedBufferSize = decompBytes; 2634*3117ece4Schristos AIO_WritePool_enqueueAndReacquireWriteJob(&writeJob); 2635*3117ece4Schristos outFileSize += decompBytes; 2636*3117ece4Schristos strm.next_out = (BYTE*)writeJob->buffer; 2637*3117ece4Schristos strm.avail_out = writeJob->bufferSize; 2638*3117ece4Schristos } } 2639*3117ece4Schristos if (ret == LZMA_STREAM_END) break; 2640*3117ece4Schristos } 2641*3117ece4Schristos 2642*3117ece4Schristos AIO_ReadPool_consumeBytes(ress->readCtx, ress->readCtx->srcBufferLoaded - strm.avail_in); 2643*3117ece4Schristos lzma_end(&strm); 2644*3117ece4Schristos AIO_WritePool_releaseIoJob(writeJob); 2645*3117ece4Schristos AIO_WritePool_sparseWriteEnd(ress->writeCtx); 2646*3117ece4Schristos return decodingError ? FIO_ERROR_FRAME_DECODING : outFileSize; 2647*3117ece4Schristos } 2648*3117ece4Schristos #endif 2649*3117ece4Schristos 2650*3117ece4Schristos #ifdef ZSTD_LZ4DECOMPRESS 2651*3117ece4Schristos static unsigned long long 2652*3117ece4Schristos FIO_decompressLz4Frame(dRess_t* ress, const char* srcFileName) 2653*3117ece4Schristos { 2654*3117ece4Schristos unsigned long long filesize = 0; 2655*3117ece4Schristos LZ4F_errorCode_t nextToLoad = 4; 2656*3117ece4Schristos LZ4F_decompressionContext_t dCtx; 2657*3117ece4Schristos LZ4F_errorCode_t const errorCode = LZ4F_createDecompressionContext(&dCtx, LZ4F_VERSION); 2658*3117ece4Schristos int decodingError = 0; 2659*3117ece4Schristos IOJob_t *writeJob = NULL; 2660*3117ece4Schristos 2661*3117ece4Schristos if (LZ4F_isError(errorCode)) { 2662*3117ece4Schristos DISPLAYLEVEL(1, "zstd: failed to create lz4 decompression context \n"); 2663*3117ece4Schristos return FIO_ERROR_FRAME_DECODING; 2664*3117ece4Schristos } 2665*3117ece4Schristos 2666*3117ece4Schristos writeJob = AIO_WritePool_acquireJob(ress->writeCtx); 2667*3117ece4Schristos 2668*3117ece4Schristos /* Main Loop */ 2669*3117ece4Schristos for (;nextToLoad;) { 2670*3117ece4Schristos size_t pos = 0; 2671*3117ece4Schristos size_t decodedBytes = writeJob->bufferSize; 2672*3117ece4Schristos int fullBufferDecoded = 0; 2673*3117ece4Schristos 2674*3117ece4Schristos /* Read input */ 2675*3117ece4Schristos AIO_ReadPool_fillBuffer(ress->readCtx, nextToLoad); 2676*3117ece4Schristos if(!ress->readCtx->srcBufferLoaded) break; /* reached end of file */ 2677*3117ece4Schristos 2678*3117ece4Schristos while ((pos < ress->readCtx->srcBufferLoaded) || fullBufferDecoded) { /* still to read, or still to flush */ 2679*3117ece4Schristos /* Decode Input (at least partially) */ 2680*3117ece4Schristos size_t remaining = ress->readCtx->srcBufferLoaded - pos; 2681*3117ece4Schristos decodedBytes = writeJob->bufferSize; 2682*3117ece4Schristos nextToLoad = LZ4F_decompress(dCtx, writeJob->buffer, &decodedBytes, (char*)(ress->readCtx->srcBuffer)+pos, 2683*3117ece4Schristos &remaining, NULL); 2684*3117ece4Schristos if (LZ4F_isError(nextToLoad)) { 2685*3117ece4Schristos DISPLAYLEVEL(1, "zstd: %s: lz4 decompression error : %s \n", 2686*3117ece4Schristos srcFileName, LZ4F_getErrorName(nextToLoad)); 2687*3117ece4Schristos decodingError = 1; nextToLoad = 0; break; 2688*3117ece4Schristos } 2689*3117ece4Schristos pos += remaining; 2690*3117ece4Schristos assert(pos <= ress->readCtx->srcBufferLoaded); 2691*3117ece4Schristos fullBufferDecoded = decodedBytes == writeJob->bufferSize; 2692*3117ece4Schristos 2693*3117ece4Schristos /* Write Block */ 2694*3117ece4Schristos if (decodedBytes) { 2695*3117ece4Schristos UTIL_HumanReadableSize_t hrs; 2696*3117ece4Schristos writeJob->usedBufferSize = decodedBytes; 2697*3117ece4Schristos AIO_WritePool_enqueueAndReacquireWriteJob(&writeJob); 2698*3117ece4Schristos filesize += decodedBytes; 2699*3117ece4Schristos hrs = UTIL_makeHumanReadableSize(filesize); 2700*3117ece4Schristos DISPLAYUPDATE_PROGRESS("\rDecompressed : %.*f%s ", hrs.precision, hrs.value, hrs.suffix); 2701*3117ece4Schristos } 2702*3117ece4Schristos 2703*3117ece4Schristos if (!nextToLoad) break; 2704*3117ece4Schristos } 2705*3117ece4Schristos AIO_ReadPool_consumeBytes(ress->readCtx, pos); 2706*3117ece4Schristos } 2707*3117ece4Schristos if (nextToLoad!=0) { 2708*3117ece4Schristos DISPLAYLEVEL(1, "zstd: %s: unfinished lz4 stream \n", srcFileName); 2709*3117ece4Schristos decodingError=1; 2710*3117ece4Schristos } 2711*3117ece4Schristos 2712*3117ece4Schristos LZ4F_freeDecompressionContext(dCtx); 2713*3117ece4Schristos AIO_WritePool_releaseIoJob(writeJob); 2714*3117ece4Schristos AIO_WritePool_sparseWriteEnd(ress->writeCtx); 2715*3117ece4Schristos 2716*3117ece4Schristos return decodingError ? FIO_ERROR_FRAME_DECODING : filesize; 2717*3117ece4Schristos } 2718*3117ece4Schristos #endif 2719*3117ece4Schristos 2720*3117ece4Schristos 2721*3117ece4Schristos 2722*3117ece4Schristos /** FIO_decompressFrames() : 2723*3117ece4Schristos * Find and decode frames inside srcFile 2724*3117ece4Schristos * srcFile presumed opened and valid 2725*3117ece4Schristos * @return : 0 : OK 2726*3117ece4Schristos * 1 : error 2727*3117ece4Schristos */ 2728*3117ece4Schristos static int FIO_decompressFrames(FIO_ctx_t* const fCtx, 2729*3117ece4Schristos dRess_t ress, const FIO_prefs_t* const prefs, 2730*3117ece4Schristos const char* dstFileName, const char* srcFileName) 2731*3117ece4Schristos { 2732*3117ece4Schristos unsigned readSomething = 0; 2733*3117ece4Schristos unsigned long long filesize = 0; 2734*3117ece4Schristos int passThrough = prefs->passThrough; 2735*3117ece4Schristos 2736*3117ece4Schristos if (passThrough == -1) { 2737*3117ece4Schristos /* If pass-through mode is not explicitly enabled or disabled, 2738*3117ece4Schristos * default to the legacy behavior of enabling it if we are writing 2739*3117ece4Schristos * to stdout with the overwrite flag enabled. 2740*3117ece4Schristos */ 2741*3117ece4Schristos passThrough = prefs->overwrite && !strcmp(dstFileName, stdoutmark); 2742*3117ece4Schristos } 2743*3117ece4Schristos assert(passThrough == 0 || passThrough == 1); 2744*3117ece4Schristos 2745*3117ece4Schristos /* for each frame */ 2746*3117ece4Schristos for ( ; ; ) { 2747*3117ece4Schristos /* check magic number -> version */ 2748*3117ece4Schristos size_t const toRead = 4; 2749*3117ece4Schristos const BYTE* buf; 2750*3117ece4Schristos AIO_ReadPool_fillBuffer(ress.readCtx, toRead); 2751*3117ece4Schristos buf = (const BYTE*)ress.readCtx->srcBuffer; 2752*3117ece4Schristos if (ress.readCtx->srcBufferLoaded==0) { 2753*3117ece4Schristos if (readSomething==0) { /* srcFile is empty (which is invalid) */ 2754*3117ece4Schristos DISPLAYLEVEL(1, "zstd: %s: unexpected end of file \n", srcFileName); 2755*3117ece4Schristos return 1; 2756*3117ece4Schristos } /* else, just reached frame boundary */ 2757*3117ece4Schristos break; /* no more input */ 2758*3117ece4Schristos } 2759*3117ece4Schristos readSomething = 1; /* there is at least 1 byte in srcFile */ 2760*3117ece4Schristos if (ress.readCtx->srcBufferLoaded < toRead) { /* not enough input to check magic number */ 2761*3117ece4Schristos if (passThrough) { 2762*3117ece4Schristos return FIO_passThrough(&ress); 2763*3117ece4Schristos } 2764*3117ece4Schristos DISPLAYLEVEL(1, "zstd: %s: unknown header \n", srcFileName); 2765*3117ece4Schristos return 1; 2766*3117ece4Schristos } 2767*3117ece4Schristos if (ZSTD_isFrame(buf, ress.readCtx->srcBufferLoaded)) { 2768*3117ece4Schristos unsigned long long const frameSize = FIO_decompressZstdFrame(fCtx, &ress, prefs, srcFileName, filesize); 2769*3117ece4Schristos if (frameSize == FIO_ERROR_FRAME_DECODING) return 1; 2770*3117ece4Schristos filesize += frameSize; 2771*3117ece4Schristos } else if (buf[0] == 31 && buf[1] == 139) { /* gz magic number */ 2772*3117ece4Schristos #ifdef ZSTD_GZDECOMPRESS 2773*3117ece4Schristos unsigned long long const frameSize = FIO_decompressGzFrame(&ress, srcFileName); 2774*3117ece4Schristos if (frameSize == FIO_ERROR_FRAME_DECODING) return 1; 2775*3117ece4Schristos filesize += frameSize; 2776*3117ece4Schristos #else 2777*3117ece4Schristos DISPLAYLEVEL(1, "zstd: %s: gzip file cannot be uncompressed (zstd compiled without HAVE_ZLIB) -- ignored \n", srcFileName); 2778*3117ece4Schristos return 1; 2779*3117ece4Schristos #endif 2780*3117ece4Schristos } else if ((buf[0] == 0xFD && buf[1] == 0x37) /* xz magic number */ 2781*3117ece4Schristos || (buf[0] == 0x5D && buf[1] == 0x00)) { /* lzma header (no magic number) */ 2782*3117ece4Schristos #ifdef ZSTD_LZMADECOMPRESS 2783*3117ece4Schristos unsigned long long const frameSize = FIO_decompressLzmaFrame(&ress, srcFileName, buf[0] != 0xFD); 2784*3117ece4Schristos if (frameSize == FIO_ERROR_FRAME_DECODING) return 1; 2785*3117ece4Schristos filesize += frameSize; 2786*3117ece4Schristos #else 2787*3117ece4Schristos DISPLAYLEVEL(1, "zstd: %s: xz/lzma file cannot be uncompressed (zstd compiled without HAVE_LZMA) -- ignored \n", srcFileName); 2788*3117ece4Schristos return 1; 2789*3117ece4Schristos #endif 2790*3117ece4Schristos } else if (MEM_readLE32(buf) == LZ4_MAGICNUMBER) { 2791*3117ece4Schristos #ifdef ZSTD_LZ4DECOMPRESS 2792*3117ece4Schristos unsigned long long const frameSize = FIO_decompressLz4Frame(&ress, srcFileName); 2793*3117ece4Schristos if (frameSize == FIO_ERROR_FRAME_DECODING) return 1; 2794*3117ece4Schristos filesize += frameSize; 2795*3117ece4Schristos #else 2796*3117ece4Schristos DISPLAYLEVEL(1, "zstd: %s: lz4 file cannot be uncompressed (zstd compiled without HAVE_LZ4) -- ignored \n", srcFileName); 2797*3117ece4Schristos return 1; 2798*3117ece4Schristos #endif 2799*3117ece4Schristos } else if (passThrough) { 2800*3117ece4Schristos return FIO_passThrough(&ress); 2801*3117ece4Schristos } else { 2802*3117ece4Schristos DISPLAYLEVEL(1, "zstd: %s: unsupported format \n", srcFileName); 2803*3117ece4Schristos return 1; 2804*3117ece4Schristos } } /* for each frame */ 2805*3117ece4Schristos 2806*3117ece4Schristos /* Final Status */ 2807*3117ece4Schristos fCtx->totalBytesOutput += (size_t)filesize; 2808*3117ece4Schristos DISPLAY_PROGRESS("\r%79s\r", ""); 2809*3117ece4Schristos if (FIO_shouldDisplayFileSummary(fCtx)) 2810*3117ece4Schristos DISPLAY_SUMMARY("%-20s: %llu bytes \n", srcFileName, filesize); 2811*3117ece4Schristos 2812*3117ece4Schristos return 0; 2813*3117ece4Schristos } 2814*3117ece4Schristos 2815*3117ece4Schristos /** FIO_decompressDstFile() : 2816*3117ece4Schristos open `dstFileName`, or pass-through if writeCtx's file is already != 0, 2817*3117ece4Schristos then start decompression process (FIO_decompressFrames()). 2818*3117ece4Schristos @return : 0 : OK 2819*3117ece4Schristos 1 : operation aborted 2820*3117ece4Schristos */ 2821*3117ece4Schristos static int FIO_decompressDstFile(FIO_ctx_t* const fCtx, 2822*3117ece4Schristos FIO_prefs_t* const prefs, 2823*3117ece4Schristos dRess_t ress, 2824*3117ece4Schristos const char* dstFileName, 2825*3117ece4Schristos const char* srcFileName, 2826*3117ece4Schristos const stat_t* srcFileStat) 2827*3117ece4Schristos { 2828*3117ece4Schristos int result; 2829*3117ece4Schristos int releaseDstFile = 0; 2830*3117ece4Schristos int transferStat = 0; 2831*3117ece4Schristos int dstFd = 0; 2832*3117ece4Schristos 2833*3117ece4Schristos if ((AIO_WritePool_getFile(ress.writeCtx) == NULL) && (prefs->testMode == 0)) { 2834*3117ece4Schristos FILE *dstFile; 2835*3117ece4Schristos int dstFilePermissions = DEFAULT_FILE_PERMISSIONS; 2836*3117ece4Schristos if ( strcmp(srcFileName, stdinmark) /* special case : don't transfer permissions from stdin */ 2837*3117ece4Schristos && strcmp(dstFileName, stdoutmark) 2838*3117ece4Schristos && UTIL_isRegularFileStat(srcFileStat) ) { 2839*3117ece4Schristos transferStat = 1; 2840*3117ece4Schristos dstFilePermissions = TEMPORARY_FILE_PERMISSIONS; 2841*3117ece4Schristos } 2842*3117ece4Schristos 2843*3117ece4Schristos releaseDstFile = 1; 2844*3117ece4Schristos 2845*3117ece4Schristos dstFile = FIO_openDstFile(fCtx, prefs, srcFileName, dstFileName, dstFilePermissions); 2846*3117ece4Schristos if (dstFile==NULL) return 1; 2847*3117ece4Schristos dstFd = fileno(dstFile); 2848*3117ece4Schristos AIO_WritePool_setFile(ress.writeCtx, dstFile); 2849*3117ece4Schristos 2850*3117ece4Schristos /* Must only be added after FIO_openDstFile() succeeds. 2851*3117ece4Schristos * Otherwise we may delete the destination file if it already exists, 2852*3117ece4Schristos * and the user presses Ctrl-C when asked if they wish to overwrite. 2853*3117ece4Schristos */ 2854*3117ece4Schristos addHandler(dstFileName); 2855*3117ece4Schristos } 2856*3117ece4Schristos 2857*3117ece4Schristos result = FIO_decompressFrames(fCtx, ress, prefs, dstFileName, srcFileName); 2858*3117ece4Schristos 2859*3117ece4Schristos if (releaseDstFile) { 2860*3117ece4Schristos clearHandler(); 2861*3117ece4Schristos 2862*3117ece4Schristos if (transferStat) { 2863*3117ece4Schristos UTIL_setFDStat(dstFd, dstFileName, srcFileStat); 2864*3117ece4Schristos } 2865*3117ece4Schristos 2866*3117ece4Schristos if (AIO_WritePool_closeFile(ress.writeCtx)) { 2867*3117ece4Schristos DISPLAYLEVEL(1, "zstd: %s: %s \n", dstFileName, strerror(errno)); 2868*3117ece4Schristos result = 1; 2869*3117ece4Schristos } 2870*3117ece4Schristos 2871*3117ece4Schristos if (transferStat) { 2872*3117ece4Schristos UTIL_utime(dstFileName, srcFileStat); 2873*3117ece4Schristos } 2874*3117ece4Schristos 2875*3117ece4Schristos if ( (result != 0) /* operation failure */ 2876*3117ece4Schristos && strcmp(dstFileName, stdoutmark) /* special case : don't remove() stdout */ 2877*3117ece4Schristos ) { 2878*3117ece4Schristos FIO_removeFile(dstFileName); /* remove decompression artefact; note: don't do anything special if remove() fails */ 2879*3117ece4Schristos } 2880*3117ece4Schristos } 2881*3117ece4Schristos 2882*3117ece4Schristos return result; 2883*3117ece4Schristos } 2884*3117ece4Schristos 2885*3117ece4Schristos 2886*3117ece4Schristos /** FIO_decompressSrcFile() : 2887*3117ece4Schristos Open `srcFileName`, transfer control to decompressDstFile() 2888*3117ece4Schristos @return : 0 : OK 2889*3117ece4Schristos 1 : error 2890*3117ece4Schristos */ 2891*3117ece4Schristos static int FIO_decompressSrcFile(FIO_ctx_t* const fCtx, FIO_prefs_t* const prefs, dRess_t ress, const char* dstFileName, const char* srcFileName) 2892*3117ece4Schristos { 2893*3117ece4Schristos FILE* srcFile; 2894*3117ece4Schristos stat_t srcFileStat; 2895*3117ece4Schristos int result; 2896*3117ece4Schristos U64 fileSize = UTIL_FILESIZE_UNKNOWN; 2897*3117ece4Schristos 2898*3117ece4Schristos if (UTIL_isDirectory(srcFileName)) { 2899*3117ece4Schristos DISPLAYLEVEL(1, "zstd: %s is a directory -- ignored \n", srcFileName); 2900*3117ece4Schristos return 1; 2901*3117ece4Schristos } 2902*3117ece4Schristos 2903*3117ece4Schristos srcFile = FIO_openSrcFile(prefs, srcFileName, &srcFileStat); 2904*3117ece4Schristos if (srcFile==NULL) return 1; 2905*3117ece4Schristos 2906*3117ece4Schristos /* Don't use AsyncIO for small files */ 2907*3117ece4Schristos if (strcmp(srcFileName, stdinmark)) /* Stdin doesn't have stats */ 2908*3117ece4Schristos fileSize = UTIL_getFileSizeStat(&srcFileStat); 2909*3117ece4Schristos if(fileSize != UTIL_FILESIZE_UNKNOWN && fileSize < ZSTD_BLOCKSIZE_MAX * 3) { 2910*3117ece4Schristos AIO_ReadPool_setAsync(ress.readCtx, 0); 2911*3117ece4Schristos AIO_WritePool_setAsync(ress.writeCtx, 0); 2912*3117ece4Schristos } else { 2913*3117ece4Schristos AIO_ReadPool_setAsync(ress.readCtx, 1); 2914*3117ece4Schristos AIO_WritePool_setAsync(ress.writeCtx, 1); 2915*3117ece4Schristos } 2916*3117ece4Schristos 2917*3117ece4Schristos AIO_ReadPool_setFile(ress.readCtx, srcFile); 2918*3117ece4Schristos 2919*3117ece4Schristos result = FIO_decompressDstFile(fCtx, prefs, ress, dstFileName, srcFileName, &srcFileStat); 2920*3117ece4Schristos 2921*3117ece4Schristos AIO_ReadPool_setFile(ress.readCtx, NULL); 2922*3117ece4Schristos 2923*3117ece4Schristos /* Close file */ 2924*3117ece4Schristos if (fclose(srcFile)) { 2925*3117ece4Schristos DISPLAYLEVEL(1, "zstd: %s: %s \n", srcFileName, strerror(errno)); /* error should not happen */ 2926*3117ece4Schristos return 1; 2927*3117ece4Schristos } 2928*3117ece4Schristos if ( prefs->removeSrcFile /* --rm */ 2929*3117ece4Schristos && (result==0) /* decompression successful */ 2930*3117ece4Schristos && strcmp(srcFileName, stdinmark) ) /* not stdin */ { 2931*3117ece4Schristos /* We must clear the handler, since after this point calling it would 2932*3117ece4Schristos * delete both the source and destination files. 2933*3117ece4Schristos */ 2934*3117ece4Schristos clearHandler(); 2935*3117ece4Schristos if (FIO_removeFile(srcFileName)) { 2936*3117ece4Schristos /* failed to remove src file */ 2937*3117ece4Schristos DISPLAYLEVEL(1, "zstd: %s: %s \n", srcFileName, strerror(errno)); 2938*3117ece4Schristos return 1; 2939*3117ece4Schristos } } 2940*3117ece4Schristos return result; 2941*3117ece4Schristos } 2942*3117ece4Schristos 2943*3117ece4Schristos 2944*3117ece4Schristos 2945*3117ece4Schristos int FIO_decompressFilename(FIO_ctx_t* const fCtx, FIO_prefs_t* const prefs, 2946*3117ece4Schristos const char* dstFileName, const char* srcFileName, 2947*3117ece4Schristos const char* dictFileName) 2948*3117ece4Schristos { 2949*3117ece4Schristos dRess_t const ress = FIO_createDResources(prefs, dictFileName); 2950*3117ece4Schristos 2951*3117ece4Schristos int const decodingError = FIO_decompressSrcFile(fCtx, prefs, ress, dstFileName, srcFileName); 2952*3117ece4Schristos 2953*3117ece4Schristos 2954*3117ece4Schristos 2955*3117ece4Schristos FIO_freeDResources(ress); 2956*3117ece4Schristos return decodingError; 2957*3117ece4Schristos } 2958*3117ece4Schristos 2959*3117ece4Schristos static const char *suffixList[] = { 2960*3117ece4Schristos ZSTD_EXTENSION, 2961*3117ece4Schristos TZSTD_EXTENSION, 2962*3117ece4Schristos #ifndef ZSTD_NODECOMPRESS 2963*3117ece4Schristos ZSTD_ALT_EXTENSION, 2964*3117ece4Schristos #endif 2965*3117ece4Schristos #ifdef ZSTD_GZDECOMPRESS 2966*3117ece4Schristos GZ_EXTENSION, 2967*3117ece4Schristos TGZ_EXTENSION, 2968*3117ece4Schristos #endif 2969*3117ece4Schristos #ifdef ZSTD_LZMADECOMPRESS 2970*3117ece4Schristos LZMA_EXTENSION, 2971*3117ece4Schristos XZ_EXTENSION, 2972*3117ece4Schristos TXZ_EXTENSION, 2973*3117ece4Schristos #endif 2974*3117ece4Schristos #ifdef ZSTD_LZ4DECOMPRESS 2975*3117ece4Schristos LZ4_EXTENSION, 2976*3117ece4Schristos TLZ4_EXTENSION, 2977*3117ece4Schristos #endif 2978*3117ece4Schristos NULL 2979*3117ece4Schristos }; 2980*3117ece4Schristos 2981*3117ece4Schristos static const char *suffixListStr = 2982*3117ece4Schristos ZSTD_EXTENSION "/" TZSTD_EXTENSION 2983*3117ece4Schristos #ifdef ZSTD_GZDECOMPRESS 2984*3117ece4Schristos "/" GZ_EXTENSION "/" TGZ_EXTENSION 2985*3117ece4Schristos #endif 2986*3117ece4Schristos #ifdef ZSTD_LZMADECOMPRESS 2987*3117ece4Schristos "/" LZMA_EXTENSION "/" XZ_EXTENSION "/" TXZ_EXTENSION 2988*3117ece4Schristos #endif 2989*3117ece4Schristos #ifdef ZSTD_LZ4DECOMPRESS 2990*3117ece4Schristos "/" LZ4_EXTENSION "/" TLZ4_EXTENSION 2991*3117ece4Schristos #endif 2992*3117ece4Schristos ; 2993*3117ece4Schristos 2994*3117ece4Schristos /* FIO_determineDstName() : 2995*3117ece4Schristos * create a destination filename from a srcFileName. 2996*3117ece4Schristos * @return a pointer to it. 2997*3117ece4Schristos * @return == NULL if there is an error */ 2998*3117ece4Schristos static const char* 2999*3117ece4Schristos FIO_determineDstName(const char* srcFileName, const char* outDirName) 3000*3117ece4Schristos { 3001*3117ece4Schristos static size_t dfnbCapacity = 0; 3002*3117ece4Schristos static char* dstFileNameBuffer = NULL; /* using static allocation : this function cannot be multi-threaded */ 3003*3117ece4Schristos size_t dstFileNameEndPos; 3004*3117ece4Schristos char* outDirFilename = NULL; 3005*3117ece4Schristos const char* dstSuffix = ""; 3006*3117ece4Schristos size_t dstSuffixLen = 0; 3007*3117ece4Schristos 3008*3117ece4Schristos size_t sfnSize = strlen(srcFileName); 3009*3117ece4Schristos 3010*3117ece4Schristos size_t srcSuffixLen; 3011*3117ece4Schristos const char* const srcSuffix = strrchr(srcFileName, '.'); 3012*3117ece4Schristos 3013*3117ece4Schristos if(!strcmp(srcFileName, stdinmark)) { 3014*3117ece4Schristos return stdoutmark; 3015*3117ece4Schristos } 3016*3117ece4Schristos 3017*3117ece4Schristos if (srcSuffix == NULL) { 3018*3117ece4Schristos DISPLAYLEVEL(1, 3019*3117ece4Schristos "zstd: %s: unknown suffix (%s expected). " 3020*3117ece4Schristos "Can't derive the output file name. " 3021*3117ece4Schristos "Specify it with -o dstFileName. Ignoring.\n", 3022*3117ece4Schristos srcFileName, suffixListStr); 3023*3117ece4Schristos return NULL; 3024*3117ece4Schristos } 3025*3117ece4Schristos srcSuffixLen = strlen(srcSuffix); 3026*3117ece4Schristos 3027*3117ece4Schristos { 3028*3117ece4Schristos const char** matchedSuffixPtr; 3029*3117ece4Schristos for (matchedSuffixPtr = suffixList; *matchedSuffixPtr != NULL; matchedSuffixPtr++) { 3030*3117ece4Schristos if (!strcmp(*matchedSuffixPtr, srcSuffix)) { 3031*3117ece4Schristos break; 3032*3117ece4Schristos } 3033*3117ece4Schristos } 3034*3117ece4Schristos 3035*3117ece4Schristos /* check suffix is authorized */ 3036*3117ece4Schristos if (sfnSize <= srcSuffixLen || *matchedSuffixPtr == NULL) { 3037*3117ece4Schristos DISPLAYLEVEL(1, 3038*3117ece4Schristos "zstd: %s: unknown suffix (%s expected). " 3039*3117ece4Schristos "Can't derive the output file name. " 3040*3117ece4Schristos "Specify it with -o dstFileName. Ignoring.\n", 3041*3117ece4Schristos srcFileName, suffixListStr); 3042*3117ece4Schristos return NULL; 3043*3117ece4Schristos } 3044*3117ece4Schristos 3045*3117ece4Schristos if ((*matchedSuffixPtr)[1] == 't') { 3046*3117ece4Schristos dstSuffix = ".tar"; 3047*3117ece4Schristos dstSuffixLen = strlen(dstSuffix); 3048*3117ece4Schristos } 3049*3117ece4Schristos } 3050*3117ece4Schristos 3051*3117ece4Schristos if (outDirName) { 3052*3117ece4Schristos outDirFilename = FIO_createFilename_fromOutDir(srcFileName, outDirName, 0); 3053*3117ece4Schristos sfnSize = strlen(outDirFilename); 3054*3117ece4Schristos assert(outDirFilename != NULL); 3055*3117ece4Schristos } 3056*3117ece4Schristos 3057*3117ece4Schristos if (dfnbCapacity+srcSuffixLen <= sfnSize+1+dstSuffixLen) { 3058*3117ece4Schristos /* allocate enough space to write dstFilename into it */ 3059*3117ece4Schristos free(dstFileNameBuffer); 3060*3117ece4Schristos dfnbCapacity = sfnSize + 20; 3061*3117ece4Schristos dstFileNameBuffer = (char*)malloc(dfnbCapacity); 3062*3117ece4Schristos if (dstFileNameBuffer==NULL) 3063*3117ece4Schristos EXM_THROW(74, "%s : not enough memory for dstFileName", 3064*3117ece4Schristos strerror(errno)); 3065*3117ece4Schristos } 3066*3117ece4Schristos 3067*3117ece4Schristos /* return dst name == src name truncated from suffix */ 3068*3117ece4Schristos assert(dstFileNameBuffer != NULL); 3069*3117ece4Schristos dstFileNameEndPos = sfnSize - srcSuffixLen; 3070*3117ece4Schristos if (outDirFilename) { 3071*3117ece4Schristos memcpy(dstFileNameBuffer, outDirFilename, dstFileNameEndPos); 3072*3117ece4Schristos free(outDirFilename); 3073*3117ece4Schristos } else { 3074*3117ece4Schristos memcpy(dstFileNameBuffer, srcFileName, dstFileNameEndPos); 3075*3117ece4Schristos } 3076*3117ece4Schristos 3077*3117ece4Schristos /* The short tar extensions tzst, tgz, txz and tlz4 files should have "tar" 3078*3117ece4Schristos * extension on decompression. Also writes terminating null. */ 3079*3117ece4Schristos strcpy(dstFileNameBuffer + dstFileNameEndPos, dstSuffix); 3080*3117ece4Schristos return dstFileNameBuffer; 3081*3117ece4Schristos 3082*3117ece4Schristos /* note : dstFileNameBuffer memory is not going to be free */ 3083*3117ece4Schristos } 3084*3117ece4Schristos 3085*3117ece4Schristos int 3086*3117ece4Schristos FIO_decompressMultipleFilenames(FIO_ctx_t* const fCtx, 3087*3117ece4Schristos FIO_prefs_t* const prefs, 3088*3117ece4Schristos const char** srcNamesTable, 3089*3117ece4Schristos const char* outMirroredRootDirName, 3090*3117ece4Schristos const char* outDirName, const char* outFileName, 3091*3117ece4Schristos const char* dictFileName) 3092*3117ece4Schristos { 3093*3117ece4Schristos int status; 3094*3117ece4Schristos int error = 0; 3095*3117ece4Schristos dRess_t ress = FIO_createDResources(prefs, dictFileName); 3096*3117ece4Schristos 3097*3117ece4Schristos if (outFileName) { 3098*3117ece4Schristos if (FIO_multiFilesConcatWarning(fCtx, prefs, outFileName, 1 /* displayLevelCutoff */)) { 3099*3117ece4Schristos FIO_freeDResources(ress); 3100*3117ece4Schristos return 1; 3101*3117ece4Schristos } 3102*3117ece4Schristos if (!prefs->testMode) { 3103*3117ece4Schristos FILE* dstFile = FIO_openDstFile(fCtx, prefs, NULL, outFileName, DEFAULT_FILE_PERMISSIONS); 3104*3117ece4Schristos if (dstFile == 0) EXM_THROW(19, "cannot open %s", outFileName); 3105*3117ece4Schristos AIO_WritePool_setFile(ress.writeCtx, dstFile); 3106*3117ece4Schristos } 3107*3117ece4Schristos for (; fCtx->currFileIdx < fCtx->nbFilesTotal; fCtx->currFileIdx++) { 3108*3117ece4Schristos status = FIO_decompressSrcFile(fCtx, prefs, ress, outFileName, srcNamesTable[fCtx->currFileIdx]); 3109*3117ece4Schristos if (!status) fCtx->nbFilesProcessed++; 3110*3117ece4Schristos error |= status; 3111*3117ece4Schristos } 3112*3117ece4Schristos if ((!prefs->testMode) && (AIO_WritePool_closeFile(ress.writeCtx))) 3113*3117ece4Schristos EXM_THROW(72, "Write error : %s : cannot properly close output file", 3114*3117ece4Schristos strerror(errno)); 3115*3117ece4Schristos } else { 3116*3117ece4Schristos if (outMirroredRootDirName) 3117*3117ece4Schristos UTIL_mirrorSourceFilesDirectories(srcNamesTable, (unsigned)fCtx->nbFilesTotal, outMirroredRootDirName); 3118*3117ece4Schristos 3119*3117ece4Schristos for (; fCtx->currFileIdx < fCtx->nbFilesTotal; fCtx->currFileIdx++) { /* create dstFileName */ 3120*3117ece4Schristos const char* const srcFileName = srcNamesTable[fCtx->currFileIdx]; 3121*3117ece4Schristos const char* dstFileName = NULL; 3122*3117ece4Schristos if (outMirroredRootDirName) { 3123*3117ece4Schristos char* validMirroredDirName = UTIL_createMirroredDestDirName(srcFileName, outMirroredRootDirName); 3124*3117ece4Schristos if (validMirroredDirName) { 3125*3117ece4Schristos dstFileName = FIO_determineDstName(srcFileName, validMirroredDirName); 3126*3117ece4Schristos free(validMirroredDirName); 3127*3117ece4Schristos } else { 3128*3117ece4Schristos DISPLAYLEVEL(2, "zstd: --output-dir-mirror cannot decompress '%s' into '%s'\n", srcFileName, outMirroredRootDirName); 3129*3117ece4Schristos } 3130*3117ece4Schristos } else { 3131*3117ece4Schristos dstFileName = FIO_determineDstName(srcFileName, outDirName); 3132*3117ece4Schristos } 3133*3117ece4Schristos if (dstFileName == NULL) { error=1; continue; } 3134*3117ece4Schristos status = FIO_decompressSrcFile(fCtx, prefs, ress, dstFileName, srcFileName); 3135*3117ece4Schristos if (!status) fCtx->nbFilesProcessed++; 3136*3117ece4Schristos error |= status; 3137*3117ece4Schristos } 3138*3117ece4Schristos if (outDirName) 3139*3117ece4Schristos FIO_checkFilenameCollisions(srcNamesTable , (unsigned)fCtx->nbFilesTotal); 3140*3117ece4Schristos } 3141*3117ece4Schristos 3142*3117ece4Schristos if (FIO_shouldDisplayMultipleFileSummary(fCtx)) { 3143*3117ece4Schristos DISPLAY_PROGRESS("\r%79s\r", ""); 3144*3117ece4Schristos DISPLAY_SUMMARY("%d files decompressed : %6llu bytes total \n", 3145*3117ece4Schristos fCtx->nbFilesProcessed, (unsigned long long)fCtx->totalBytesOutput); 3146*3117ece4Schristos } 3147*3117ece4Schristos 3148*3117ece4Schristos FIO_freeDResources(ress); 3149*3117ece4Schristos return error; 3150*3117ece4Schristos } 3151*3117ece4Schristos 3152*3117ece4Schristos /* ************************************************************************** 3153*3117ece4Schristos * .zst file info (--list command) 3154*3117ece4Schristos ***************************************************************************/ 3155*3117ece4Schristos 3156*3117ece4Schristos typedef struct { 3157*3117ece4Schristos U64 decompressedSize; 3158*3117ece4Schristos U64 compressedSize; 3159*3117ece4Schristos U64 windowSize; 3160*3117ece4Schristos int numActualFrames; 3161*3117ece4Schristos int numSkippableFrames; 3162*3117ece4Schristos int decompUnavailable; 3163*3117ece4Schristos int usesCheck; 3164*3117ece4Schristos BYTE checksum[4]; 3165*3117ece4Schristos U32 nbFiles; 3166*3117ece4Schristos unsigned dictID; 3167*3117ece4Schristos } fileInfo_t; 3168*3117ece4Schristos 3169*3117ece4Schristos typedef enum { 3170*3117ece4Schristos info_success=0, 3171*3117ece4Schristos info_frame_error=1, 3172*3117ece4Schristos info_not_zstd=2, 3173*3117ece4Schristos info_file_error=3, 3174*3117ece4Schristos info_truncated_input=4 3175*3117ece4Schristos } InfoError; 3176*3117ece4Schristos 3177*3117ece4Schristos #define ERROR_IF(c,n,...) { \ 3178*3117ece4Schristos if (c) { \ 3179*3117ece4Schristos DISPLAYLEVEL(1, __VA_ARGS__); \ 3180*3117ece4Schristos DISPLAYLEVEL(1, " \n"); \ 3181*3117ece4Schristos return n; \ 3182*3117ece4Schristos } \ 3183*3117ece4Schristos } 3184*3117ece4Schristos 3185*3117ece4Schristos static InfoError 3186*3117ece4Schristos FIO_analyzeFrames(fileInfo_t* info, FILE* const srcFile) 3187*3117ece4Schristos { 3188*3117ece4Schristos /* begin analyzing frame */ 3189*3117ece4Schristos for ( ; ; ) { 3190*3117ece4Schristos BYTE headerBuffer[ZSTD_FRAMEHEADERSIZE_MAX]; 3191*3117ece4Schristos size_t const numBytesRead = fread(headerBuffer, 1, sizeof(headerBuffer), srcFile); 3192*3117ece4Schristos if (numBytesRead < ZSTD_FRAMEHEADERSIZE_MIN(ZSTD_f_zstd1)) { 3193*3117ece4Schristos if ( feof(srcFile) 3194*3117ece4Schristos && (numBytesRead == 0) 3195*3117ece4Schristos && (info->compressedSize > 0) 3196*3117ece4Schristos && (info->compressedSize != UTIL_FILESIZE_UNKNOWN) ) { 3197*3117ece4Schristos unsigned long long file_position = (unsigned long long) LONG_TELL(srcFile); 3198*3117ece4Schristos unsigned long long file_size = (unsigned long long) info->compressedSize; 3199*3117ece4Schristos ERROR_IF(file_position != file_size, info_truncated_input, 3200*3117ece4Schristos "Error: seeked to position %llu, which is beyond file size of %llu\n", 3201*3117ece4Schristos file_position, 3202*3117ece4Schristos file_size); 3203*3117ece4Schristos break; /* correct end of file => success */ 3204*3117ece4Schristos } 3205*3117ece4Schristos ERROR_IF(feof(srcFile), info_not_zstd, "Error: reached end of file with incomplete frame"); 3206*3117ece4Schristos ERROR_IF(1, info_frame_error, "Error: did not reach end of file but ran out of frames"); 3207*3117ece4Schristos } 3208*3117ece4Schristos { U32 const magicNumber = MEM_readLE32(headerBuffer); 3209*3117ece4Schristos /* Zstandard frame */ 3210*3117ece4Schristos if (magicNumber == ZSTD_MAGICNUMBER) { 3211*3117ece4Schristos ZSTD_frameHeader header; 3212*3117ece4Schristos U64 const frameContentSize = ZSTD_getFrameContentSize(headerBuffer, numBytesRead); 3213*3117ece4Schristos if ( frameContentSize == ZSTD_CONTENTSIZE_ERROR 3214*3117ece4Schristos || frameContentSize == ZSTD_CONTENTSIZE_UNKNOWN ) { 3215*3117ece4Schristos info->decompUnavailable = 1; 3216*3117ece4Schristos } else { 3217*3117ece4Schristos info->decompressedSize += frameContentSize; 3218*3117ece4Schristos } 3219*3117ece4Schristos ERROR_IF(ZSTD_getFrameHeader(&header, headerBuffer, numBytesRead) != 0, 3220*3117ece4Schristos info_frame_error, "Error: could not decode frame header"); 3221*3117ece4Schristos if (info->dictID != 0 && info->dictID != header.dictID) { 3222*3117ece4Schristos DISPLAY("WARNING: File contains multiple frames with different dictionary IDs. Showing dictID 0 instead"); 3223*3117ece4Schristos info->dictID = 0; 3224*3117ece4Schristos } else { 3225*3117ece4Schristos info->dictID = header.dictID; 3226*3117ece4Schristos } 3227*3117ece4Schristos info->windowSize = header.windowSize; 3228*3117ece4Schristos /* move to the end of the frame header */ 3229*3117ece4Schristos { size_t const headerSize = ZSTD_frameHeaderSize(headerBuffer, numBytesRead); 3230*3117ece4Schristos ERROR_IF(ZSTD_isError(headerSize), info_frame_error, "Error: could not determine frame header size"); 3231*3117ece4Schristos ERROR_IF(fseek(srcFile, ((long)headerSize)-((long)numBytesRead), SEEK_CUR) != 0, 3232*3117ece4Schristos info_frame_error, "Error: could not move to end of frame header"); 3233*3117ece4Schristos } 3234*3117ece4Schristos 3235*3117ece4Schristos /* skip all blocks in the frame */ 3236*3117ece4Schristos { int lastBlock = 0; 3237*3117ece4Schristos do { 3238*3117ece4Schristos BYTE blockHeaderBuffer[3]; 3239*3117ece4Schristos ERROR_IF(fread(blockHeaderBuffer, 1, 3, srcFile) != 3, 3240*3117ece4Schristos info_frame_error, "Error while reading block header"); 3241*3117ece4Schristos { U32 const blockHeader = MEM_readLE24(blockHeaderBuffer); 3242*3117ece4Schristos U32 const blockTypeID = (blockHeader >> 1) & 3; 3243*3117ece4Schristos U32 const isRLE = (blockTypeID == 1); 3244*3117ece4Schristos U32 const isWrongBlock = (blockTypeID == 3); 3245*3117ece4Schristos long const blockSize = isRLE ? 1 : (long)(blockHeader >> 3); 3246*3117ece4Schristos ERROR_IF(isWrongBlock, info_frame_error, "Error: unsupported block type"); 3247*3117ece4Schristos lastBlock = blockHeader & 1; 3248*3117ece4Schristos ERROR_IF(fseek(srcFile, blockSize, SEEK_CUR) != 0, 3249*3117ece4Schristos info_frame_error, "Error: could not skip to end of block"); 3250*3117ece4Schristos } 3251*3117ece4Schristos } while (lastBlock != 1); 3252*3117ece4Schristos } 3253*3117ece4Schristos 3254*3117ece4Schristos /* check if checksum is used */ 3255*3117ece4Schristos { BYTE const frameHeaderDescriptor = headerBuffer[4]; 3256*3117ece4Schristos int const contentChecksumFlag = (frameHeaderDescriptor & (1 << 2)) >> 2; 3257*3117ece4Schristos if (contentChecksumFlag) { 3258*3117ece4Schristos info->usesCheck = 1; 3259*3117ece4Schristos ERROR_IF(fread(info->checksum, 1, 4, srcFile) != 4, 3260*3117ece4Schristos info_frame_error, "Error: could not read checksum"); 3261*3117ece4Schristos } } 3262*3117ece4Schristos info->numActualFrames++; 3263*3117ece4Schristos } 3264*3117ece4Schristos /* Skippable frame */ 3265*3117ece4Schristos else if ((magicNumber & ZSTD_MAGIC_SKIPPABLE_MASK) == ZSTD_MAGIC_SKIPPABLE_START) { 3266*3117ece4Schristos U32 const frameSize = MEM_readLE32(headerBuffer + 4); 3267*3117ece4Schristos long const seek = (long)(8 + frameSize - numBytesRead); 3268*3117ece4Schristos ERROR_IF(LONG_SEEK(srcFile, seek, SEEK_CUR) != 0, 3269*3117ece4Schristos info_frame_error, "Error: could not find end of skippable frame"); 3270*3117ece4Schristos info->numSkippableFrames++; 3271*3117ece4Schristos } 3272*3117ece4Schristos /* unknown content */ 3273*3117ece4Schristos else { 3274*3117ece4Schristos return info_not_zstd; 3275*3117ece4Schristos } 3276*3117ece4Schristos } /* magic number analysis */ 3277*3117ece4Schristos } /* end analyzing frames */ 3278*3117ece4Schristos return info_success; 3279*3117ece4Schristos } 3280*3117ece4Schristos 3281*3117ece4Schristos 3282*3117ece4Schristos static InfoError 3283*3117ece4Schristos getFileInfo_fileConfirmed(fileInfo_t* info, const char* inFileName) 3284*3117ece4Schristos { 3285*3117ece4Schristos InfoError status; 3286*3117ece4Schristos stat_t srcFileStat; 3287*3117ece4Schristos FILE* const srcFile = FIO_openSrcFile(NULL, inFileName, &srcFileStat); 3288*3117ece4Schristos ERROR_IF(srcFile == NULL, info_file_error, "Error: could not open source file %s", inFileName); 3289*3117ece4Schristos 3290*3117ece4Schristos info->compressedSize = UTIL_getFileSizeStat(&srcFileStat); 3291*3117ece4Schristos status = FIO_analyzeFrames(info, srcFile); 3292*3117ece4Schristos 3293*3117ece4Schristos fclose(srcFile); 3294*3117ece4Schristos info->nbFiles = 1; 3295*3117ece4Schristos return status; 3296*3117ece4Schristos } 3297*3117ece4Schristos 3298*3117ece4Schristos 3299*3117ece4Schristos /** getFileInfo() : 3300*3117ece4Schristos * Reads information from file, stores in *info 3301*3117ece4Schristos * @return : InfoError status 3302*3117ece4Schristos */ 3303*3117ece4Schristos static InfoError 3304*3117ece4Schristos getFileInfo(fileInfo_t* info, const char* srcFileName) 3305*3117ece4Schristos { 3306*3117ece4Schristos ERROR_IF(!UTIL_isRegularFile(srcFileName), 3307*3117ece4Schristos info_file_error, "Error : %s is not a file", srcFileName); 3308*3117ece4Schristos return getFileInfo_fileConfirmed(info, srcFileName); 3309*3117ece4Schristos } 3310*3117ece4Schristos 3311*3117ece4Schristos 3312*3117ece4Schristos static void 3313*3117ece4Schristos displayInfo(const char* inFileName, const fileInfo_t* info, int displayLevel) 3314*3117ece4Schristos { 3315*3117ece4Schristos UTIL_HumanReadableSize_t const window_hrs = UTIL_makeHumanReadableSize(info->windowSize); 3316*3117ece4Schristos UTIL_HumanReadableSize_t const compressed_hrs = UTIL_makeHumanReadableSize(info->compressedSize); 3317*3117ece4Schristos UTIL_HumanReadableSize_t const decompressed_hrs = UTIL_makeHumanReadableSize(info->decompressedSize); 3318*3117ece4Schristos double const ratio = (info->compressedSize == 0) ? 0 : ((double)info->decompressedSize)/(double)info->compressedSize; 3319*3117ece4Schristos const char* const checkString = (info->usesCheck ? "XXH64" : "None"); 3320*3117ece4Schristos if (displayLevel <= 2) { 3321*3117ece4Schristos if (!info->decompUnavailable) { 3322*3117ece4Schristos DISPLAYOUT("%6d %5d %6.*f%4s %8.*f%4s %5.3f %5s %s\n", 3323*3117ece4Schristos info->numSkippableFrames + info->numActualFrames, 3324*3117ece4Schristos info->numSkippableFrames, 3325*3117ece4Schristos compressed_hrs.precision, compressed_hrs.value, compressed_hrs.suffix, 3326*3117ece4Schristos decompressed_hrs.precision, decompressed_hrs.value, decompressed_hrs.suffix, 3327*3117ece4Schristos ratio, checkString, inFileName); 3328*3117ece4Schristos } else { 3329*3117ece4Schristos DISPLAYOUT("%6d %5d %6.*f%4s %5s %s\n", 3330*3117ece4Schristos info->numSkippableFrames + info->numActualFrames, 3331*3117ece4Schristos info->numSkippableFrames, 3332*3117ece4Schristos compressed_hrs.precision, compressed_hrs.value, compressed_hrs.suffix, 3333*3117ece4Schristos checkString, inFileName); 3334*3117ece4Schristos } 3335*3117ece4Schristos } else { 3336*3117ece4Schristos DISPLAYOUT("%s \n", inFileName); 3337*3117ece4Schristos DISPLAYOUT("# Zstandard Frames: %d\n", info->numActualFrames); 3338*3117ece4Schristos if (info->numSkippableFrames) 3339*3117ece4Schristos DISPLAYOUT("# Skippable Frames: %d\n", info->numSkippableFrames); 3340*3117ece4Schristos DISPLAYOUT("DictID: %u\n", info->dictID); 3341*3117ece4Schristos DISPLAYOUT("Window Size: %.*f%s (%llu B)\n", 3342*3117ece4Schristos window_hrs.precision, window_hrs.value, window_hrs.suffix, 3343*3117ece4Schristos (unsigned long long)info->windowSize); 3344*3117ece4Schristos DISPLAYOUT("Compressed Size: %.*f%s (%llu B)\n", 3345*3117ece4Schristos compressed_hrs.precision, compressed_hrs.value, compressed_hrs.suffix, 3346*3117ece4Schristos (unsigned long long)info->compressedSize); 3347*3117ece4Schristos if (!info->decompUnavailable) { 3348*3117ece4Schristos DISPLAYOUT("Decompressed Size: %.*f%s (%llu B)\n", 3349*3117ece4Schristos decompressed_hrs.precision, decompressed_hrs.value, decompressed_hrs.suffix, 3350*3117ece4Schristos (unsigned long long)info->decompressedSize); 3351*3117ece4Schristos DISPLAYOUT("Ratio: %.4f\n", ratio); 3352*3117ece4Schristos } 3353*3117ece4Schristos 3354*3117ece4Schristos if (info->usesCheck && info->numActualFrames == 1) { 3355*3117ece4Schristos DISPLAYOUT("Check: %s %02x%02x%02x%02x\n", checkString, 3356*3117ece4Schristos info->checksum[3], info->checksum[2], 3357*3117ece4Schristos info->checksum[1], info->checksum[0] 3358*3117ece4Schristos ); 3359*3117ece4Schristos } else { 3360*3117ece4Schristos DISPLAYOUT("Check: %s\n", checkString); 3361*3117ece4Schristos } 3362*3117ece4Schristos 3363*3117ece4Schristos DISPLAYOUT("\n"); 3364*3117ece4Schristos } 3365*3117ece4Schristos } 3366*3117ece4Schristos 3367*3117ece4Schristos static fileInfo_t FIO_addFInfo(fileInfo_t fi1, fileInfo_t fi2) 3368*3117ece4Schristos { 3369*3117ece4Schristos fileInfo_t total; 3370*3117ece4Schristos memset(&total, 0, sizeof(total)); 3371*3117ece4Schristos total.numActualFrames = fi1.numActualFrames + fi2.numActualFrames; 3372*3117ece4Schristos total.numSkippableFrames = fi1.numSkippableFrames + fi2.numSkippableFrames; 3373*3117ece4Schristos total.compressedSize = fi1.compressedSize + fi2.compressedSize; 3374*3117ece4Schristos total.decompressedSize = fi1.decompressedSize + fi2.decompressedSize; 3375*3117ece4Schristos total.decompUnavailable = fi1.decompUnavailable | fi2.decompUnavailable; 3376*3117ece4Schristos total.usesCheck = fi1.usesCheck & fi2.usesCheck; 3377*3117ece4Schristos total.nbFiles = fi1.nbFiles + fi2.nbFiles; 3378*3117ece4Schristos return total; 3379*3117ece4Schristos } 3380*3117ece4Schristos 3381*3117ece4Schristos static int 3382*3117ece4Schristos FIO_listFile(fileInfo_t* total, const char* inFileName, int displayLevel) 3383*3117ece4Schristos { 3384*3117ece4Schristos fileInfo_t info; 3385*3117ece4Schristos memset(&info, 0, sizeof(info)); 3386*3117ece4Schristos { InfoError const error = getFileInfo(&info, inFileName); 3387*3117ece4Schristos switch (error) { 3388*3117ece4Schristos case info_frame_error: 3389*3117ece4Schristos /* display error, but provide output */ 3390*3117ece4Schristos DISPLAYLEVEL(1, "Error while parsing \"%s\" \n", inFileName); 3391*3117ece4Schristos break; 3392*3117ece4Schristos case info_not_zstd: 3393*3117ece4Schristos DISPLAYOUT("File \"%s\" not compressed by zstd \n", inFileName); 3394*3117ece4Schristos if (displayLevel > 2) DISPLAYOUT("\n"); 3395*3117ece4Schristos return 1; 3396*3117ece4Schristos case info_file_error: 3397*3117ece4Schristos /* error occurred while opening the file */ 3398*3117ece4Schristos if (displayLevel > 2) DISPLAYOUT("\n"); 3399*3117ece4Schristos return 1; 3400*3117ece4Schristos case info_truncated_input: 3401*3117ece4Schristos DISPLAYOUT("File \"%s\" is truncated \n", inFileName); 3402*3117ece4Schristos if (displayLevel > 2) DISPLAYOUT("\n"); 3403*3117ece4Schristos return 1; 3404*3117ece4Schristos case info_success: 3405*3117ece4Schristos default: 3406*3117ece4Schristos break; 3407*3117ece4Schristos } 3408*3117ece4Schristos 3409*3117ece4Schristos displayInfo(inFileName, &info, displayLevel); 3410*3117ece4Schristos *total = FIO_addFInfo(*total, info); 3411*3117ece4Schristos assert(error == info_success || error == info_frame_error); 3412*3117ece4Schristos return (int)error; 3413*3117ece4Schristos } 3414*3117ece4Schristos } 3415*3117ece4Schristos 3416*3117ece4Schristos int FIO_listMultipleFiles(unsigned numFiles, const char** filenameTable, int displayLevel) 3417*3117ece4Schristos { 3418*3117ece4Schristos /* ensure no specified input is stdin (needs fseek() capability) */ 3419*3117ece4Schristos { unsigned u; 3420*3117ece4Schristos for (u=0; u<numFiles;u++) { 3421*3117ece4Schristos ERROR_IF(!strcmp (filenameTable[u], stdinmark), 3422*3117ece4Schristos 1, "zstd: --list does not support reading from standard input"); 3423*3117ece4Schristos } } 3424*3117ece4Schristos 3425*3117ece4Schristos if (numFiles == 0) { 3426*3117ece4Schristos if (!UTIL_isConsole(stdin)) { 3427*3117ece4Schristos DISPLAYLEVEL(1, "zstd: --list does not support reading from standard input \n"); 3428*3117ece4Schristos } 3429*3117ece4Schristos DISPLAYLEVEL(1, "No files given \n"); 3430*3117ece4Schristos return 1; 3431*3117ece4Schristos } 3432*3117ece4Schristos 3433*3117ece4Schristos if (displayLevel <= 2) { 3434*3117ece4Schristos DISPLAYOUT("Frames Skips Compressed Uncompressed Ratio Check Filename\n"); 3435*3117ece4Schristos } 3436*3117ece4Schristos { int error = 0; 3437*3117ece4Schristos fileInfo_t total; 3438*3117ece4Schristos memset(&total, 0, sizeof(total)); 3439*3117ece4Schristos total.usesCheck = 1; 3440*3117ece4Schristos /* --list each file, and check for any error */ 3441*3117ece4Schristos { unsigned u; 3442*3117ece4Schristos for (u=0; u<numFiles;u++) { 3443*3117ece4Schristos error |= FIO_listFile(&total, filenameTable[u], displayLevel); 3444*3117ece4Schristos } } 3445*3117ece4Schristos if (numFiles > 1 && displayLevel <= 2) { /* display total */ 3446*3117ece4Schristos UTIL_HumanReadableSize_t const compressed_hrs = UTIL_makeHumanReadableSize(total.compressedSize); 3447*3117ece4Schristos UTIL_HumanReadableSize_t const decompressed_hrs = UTIL_makeHumanReadableSize(total.decompressedSize); 3448*3117ece4Schristos double const ratio = (total.compressedSize == 0) ? 0 : ((double)total.decompressedSize)/(double)total.compressedSize; 3449*3117ece4Schristos const char* const checkString = (total.usesCheck ? "XXH64" : ""); 3450*3117ece4Schristos DISPLAYOUT("----------------------------------------------------------------- \n"); 3451*3117ece4Schristos if (total.decompUnavailable) { 3452*3117ece4Schristos DISPLAYOUT("%6d %5d %6.*f%4s %5s %u files\n", 3453*3117ece4Schristos total.numSkippableFrames + total.numActualFrames, 3454*3117ece4Schristos total.numSkippableFrames, 3455*3117ece4Schristos compressed_hrs.precision, compressed_hrs.value, compressed_hrs.suffix, 3456*3117ece4Schristos checkString, (unsigned)total.nbFiles); 3457*3117ece4Schristos } else { 3458*3117ece4Schristos DISPLAYOUT("%6d %5d %6.*f%4s %8.*f%4s %5.3f %5s %u files\n", 3459*3117ece4Schristos total.numSkippableFrames + total.numActualFrames, 3460*3117ece4Schristos total.numSkippableFrames, 3461*3117ece4Schristos compressed_hrs.precision, compressed_hrs.value, compressed_hrs.suffix, 3462*3117ece4Schristos decompressed_hrs.precision, decompressed_hrs.value, decompressed_hrs.suffix, 3463*3117ece4Schristos ratio, checkString, (unsigned)total.nbFiles); 3464*3117ece4Schristos } } 3465*3117ece4Schristos return error; 3466*3117ece4Schristos } 3467*3117ece4Schristos } 3468*3117ece4Schristos 3469*3117ece4Schristos 3470*3117ece4Schristos #endif /* #ifndef ZSTD_NODECOMPRESS */ 3471