/*
 * Copyright (c) 2016-2020, Yann Collet, Facebook, Inc.
 * All rights reserved.
 *
 * This source code is licensed under both the BSD-style license (found in the
 * LICENSE file in the root directory of this source tree) and the GPLv2 (found
 * in the COPYING file in the root directory of this source tree).
 * You may select, at your option, one of the above-listed licenses.
 */


/* benchfn :
 * benchmark any function on a set of input
 * providing result in nanoSecPerRun
 * or detecting and returning an error
 */

#if defined (__cplusplus)
extern "C" {
#endif

#ifndef BENCH_FN_H_23876
#define BENCH_FN_H_23876

/* ===  Dependencies  === */
#include <stddef.h>   /* size_t */


/* ====  Benchmark any function, iterated on a set of blocks  ==== */

/* BMK_runTime_t: valid result return type */

typedef struct {
    double nanoSecPerRun;  /* time per iteration (over all blocks) */
    size_t sumOfReturn;    /* sum of return values */
} BMK_runTime_t;


/* BMK_runOutcome_t:
 * type expressing the outcome of a benchmark run by BMK_benchFunction(),
 * which can be either valid or invalid.
 * benchmark outcome can be invalid if errorFn is provided.
 * BMK_runOutcome_t must be considered "opaque" : never access its members directly.
 * Instead, use its assigned methods :
 * BMK_isSuccessful_runOutcome, BMK_extract_runTime, BMK_extract_errorResult.
 * The structure is only described here to allow its allocation on stack. */

typedef struct {
    BMK_runTime_t internal_never_ever_use_directly;
    size_t error_result_never_ever_use_directly;
    int error_tag_never_ever_use_directly;
} BMK_runOutcome_t;


/* prototypes for benchmarked functions */
typedef size_t (*BMK_benchFn_t)(const void* src, size_t srcSize, void* dst, size_t dstCapacity, void* customPayload);
typedef size_t (*BMK_initFn_t)(void* initPayload);
typedef unsigned (*BMK_errorFn_t)(size_t);


/* BMK_benchFunction() parameters are provided via the following structure.
 * A structure is preferable for readability,
 * as the number of parameters required is fairly large.
 * No initializer is provided, because it doesn't make sense to provide some "default" :
 * all parameters must be specified by the caller.
 * optional parameters are labelled explicitly, and accept value NULL when not used */
typedef struct {
    BMK_benchFn_t benchFn;    /* the function to benchmark, over the set of blocks */
    void* benchPayload;       /* pass custom parameters to benchFn :
                               * (*benchFn)(srcBuffers[i], srcSizes[i], dstBuffers[i], dstCapacities[i], benchPayload) */
    BMK_initFn_t initFn;      /* (*initFn)(initPayload) is run once per run, at the beginning. */
    void* initPayload;        /* Both arguments can be NULL, in which case nothing is run. */
    BMK_errorFn_t errorFn;    /* errorFn will check each return value of benchFn over each block, to determine if it failed or not.
                               * errorFn can be NULL, in which case no check is performed.
                               * errorFn must return 0 when benchFn was successful, and >= 1 if it detects an error.
                               * Execution is stopped as soon as an error is detected.
                               * the triggering return value can be retrieved using BMK_extract_errorResult(). */
    size_t blockCount;        /* number of blocks to operate benchFn on.
                               * It's also the size of all array parameters :
                               * srcBuffers, srcSizes, dstBuffers, dstCapacities, blockResults */
    const void *const * srcBuffers; /* read-only array of buffers to be operated on by benchFn */
    const size_t* srcSizes;   /* read-only array containing sizes of srcBuffers */
    void *const * dstBuffers; /* array of buffers to be written into by benchFn. This array is not optional, it must be provided even if unused by benchFn. */
    const size_t* dstCapacities; /* read-only array containing capacities of dstBuffers. This array must be present. */
    size_t* blockResults;     /* Optional: store the return value of benchFn for each block. Use NULL if this result is not requested. */
} BMK_benchParams_t;


/* BMK_benchFunction() :
 * This function benchmarks benchFn and initFn, providing a result.
 *
 * params : see description of BMK_benchParams_t above.
 * nbLoops: defines number of times benchFn is run over the full set of blocks.
 *          Minimum value is 1. A 0 is interpreted as a 1.
 *
 * @return: can express either an error or a successful result.
 *          Use BMK_isSuccessful_runOutcome() to check if benchmark was successful.
 *          If yes, extract the result with BMK_extract_runTime(),
 *          it will contain :
 *              .sumOfReturn : the sum of all return values of benchFn through all of blocks
 *              .nanoSecPerRun : time per run of benchFn + (time for initFn / nbLoops)
 *          .sumOfReturn is generally intended for functions which return a # of bytes written into dstBuffer,
 *              in which case, this value will be the total amount of bytes written into dstBuffer.
 *
 * blockResults : when provided (!= NULL), and when benchmark is successful,
 *                params.blockResults contains all return values of `benchFn` over all blocks.
 *                when provided (!= NULL), and when benchmark failed,
 *                params.blockResults contains return values of `benchFn` over all blocks preceding and including the failed block.
 */
BMK_runOutcome_t BMK_benchFunction(BMK_benchParams_t params, unsigned nbLoops);



/* check first if the benchmark was successful or not */
int BMK_isSuccessful_runOutcome(BMK_runOutcome_t outcome);

/* If the benchmark was successful, extract the result.
 * note : this function will abort() program execution if benchmark failed !
 *        always check if benchmark was successful first !
 */
BMK_runTime_t BMK_extract_runTime(BMK_runOutcome_t outcome);

/* when benchmark failed, it means one invocation of `benchFn` failed.
 * The failure was detected by `errorFn`, operating on return values of `benchFn`.
 * Returns the faulty return value.
 * note : this function will abort() program execution if benchmark did not fail.
 *        always check if benchmark failed first !
 */
size_t BMK_extract_errorResult(BMK_runOutcome_t outcome);



/* ====  Benchmark any function, returning intermediate results  ==== */

/* state information tracking benchmark session */
typedef struct BMK_timedFnState_s BMK_timedFnState_t;

/* BMK_benchTimedFn() :
 * Similar to BMK_benchFunction(), most arguments being identical.
 * Automatically determines `nbLoops` so that each result is regularly produced at interval of about run_ms.
 * Note : minimum `nbLoops` is 1, therefore a run may last more than run_ms, and possibly even more than total_ms.
 * Usage - initialize timedFnState, select benchmark duration (total_ms) and each measurement duration (run_ms)
 *         call BMK_benchTimedFn() repetitively, each measurement is supposed to last about run_ms
 *         Check if total time budget is spent or exceeded, using BMK_isCompleted_TimedFn()
 */
BMK_runOutcome_t BMK_benchTimedFn(BMK_timedFnState_t* timedFnState,
                                  BMK_benchParams_t params);

/* Tells if duration of all benchmark runs has exceeded total_ms
 */
int BMK_isCompleted_TimedFn(const BMK_timedFnState_t* timedFnState);

/* BMK_createTimedFnState() and BMK_resetTimedFnState() :
 * Create/Set BMK_timedFnState_t for next benchmark session,
 * which shall last a minimum of total_ms milliseconds,
 * producing intermediate results, paced at interval of (approximately) run_ms.
 */
BMK_timedFnState_t* BMK_createTimedFnState(unsigned total_ms, unsigned run_ms);
void BMK_resetTimedFnState(BMK_timedFnState_t* timedFnState, unsigned total_ms, unsigned run_ms);
void BMK_freeTimedFnState(BMK_timedFnState_t* state);


/* BMK_timedFnState_shell and BMK_initStatic_timedFnState() :
 * Makes it possible to statically allocate a BMK_timedFnState_t on stack.
 * BMK_timedFnState_shell is only there to allocate space,
 * never ever access its members.
 * BMK_initStatic_timedFnState() actually accepts any buffer.
 * It will check if provided buffer is large enough and is correctly aligned,
 * and will return NULL if conditions are not respected.
 */
#define BMK_TIMEDFNSTATE_SIZE 64
typedef union {
    char never_access_space[BMK_TIMEDFNSTATE_SIZE];
    long long alignment_enforcer;  /* must be aligned on 8-bytes boundaries */
} BMK_timedFnState_shell;
BMK_timedFnState_t* BMK_initStatic_timedFnState(void* buffer, size_t size, unsigned total_ms, unsigned run_ms);


#endif   /* BENCH_FN_H_23876 */

#if defined (__cplusplus)
}
#endif