zstd/programs/benchfn.c

/*
 * Copyright (c) 2016-present, Yann Collet, Facebook, Inc.
 * All rights reserved.
 *
 * This source code is licensed under both the BSD-style license (found in the
 * LICENSE file in the root directory of this source tree) and the GPLv2 (found
 * in the COPYING file in the root directory of this source tree).
 * You may select, at your option, one of the above-listed licenses.
 */


/* *************************************
*  Includes
***************************************/
#include "platform.h"    /* Large Files support */
#include "util.h"        /* UTIL_getFileSize, UTIL_sleep */
#include <stdlib.h>      /* malloc, free */
#include <string.h>      /* memset */
#include <stdio.h>       /* fprintf, fopen */
#undef NDEBUG            /* assert must not be disabled */
#include <assert.h>      /* assert */

#include "mem.h"
#include "benchfn.h"


/* *************************************
*  Constants
***************************************/
#define TIMELOOP_MICROSEC     (1*1000000ULL) /* 1 second, expressed in microseconds */
#define TIMELOOP_NANOSEC      (1*1000000000ULL) /* 1 second, expressed in nanoseconds */
#define ACTIVEPERIOD_MICROSEC (70*TIMELOOP_MICROSEC) /* 70 seconds : continuous activity allowed before BMK_benchTimedFn() pauses */
#define COOLPERIOD_SEC        10   /* duration of that pause, in seconds (argument given to UTIL_sleep()) */

/* Postfix size multipliers : `4 KB` expands to `4 *(1 <<10)`.
 * Note : KB and MB expand to signed int expressions, GB to an unsigned one.
 * None of them is referenced in the visible part of this file. */
#define KB *(1 <<10)
#define MB *(1 <<20)
#define GB *(1U<<30)


/* *************************************
*  Errors
***************************************/
/* DEBUG : set to non-zero at compile time to enable diagnostic traces. Defaults to 0 (silent). */
#ifndef DEBUG
#  define DEBUG 0
#endif

/* DISPLAY() : printf-style message sent to stderr */
#define DISPLAY(...)       fprintf(stderr, __VA_ARGS__)

/* DEBUGOUTPUT() : same as DISPLAY(), but only when DEBUG is non-zero.
 * Wrapped in do { } while (0) so that it behaves as a single statement :
 * `if (c) DEBUGOUTPUT(...); else ...` is valid. Always terminate it with `;` */
#define DEBUGOUTPUT(...) do { if (DEBUG) DISPLAY(__VA_ARGS__); } while (0)

/* RETURN_QUIET_ERROR() : error without displaying.
 * Makes the enclosing function return `retValue`.
 * The location (__FILE__, __LINE__) and the printf-style message
 * are only traced when DEBUG is non-zero.
 * Single-statement macro : always terminate it with `;` */
#define RETURN_QUIET_ERROR(retValue, ...) do {        \
    DEBUGOUTPUT("%s: %i: \n", __FILE__, __LINE__);    \
    DEBUGOUTPUT("Error : ");                          \
    DEBUGOUTPUT(__VA_ARGS__);                         \
    DEBUGOUTPUT(" \n");                               \
    return retValue;                                  \
} while (0)


/* *************************************
*  Benchmarking an arbitrary function
***************************************/

/* BMK_isSuccessful_runOutcome() :
 * @return : 1 when `outcome` holds a valid measurement (its error tag is zero),
 *           0 when it holds an error. */
int BMK_isSuccessful_runOutcome(BMK_runOutcome_t outcome)
{
    int const isError = (outcome.error_tag_never_ever_use_directly != 0);
    return !isError;
}

/* BMK_extract_runTime() :
 * @return : the timing measurement stored inside `outcome`.
 * warning : `outcome` must be a success : this is enforced by an assert(),
 *           which stays active in this file (NDEBUG is undefined before <assert.h>),
 *           so an error outcome stops program execution.
 *           Check validity first, using BMK_isSuccessful_runOutcome(). */
BMK_runTime_t BMK_extract_runTime(BMK_runOutcome_t outcome)
{
    BMK_runTime_t runTime;
    assert(outcome.error_tag_never_ever_use_directly == 0);
    runTime = outcome.internal_never_ever_use_directly;
    return runTime;
}

/* BMK_extract_errorResult() :
 * @return : the error value stored inside `outcome`
 *           (BMK_benchFunction() stores there the benchFn result rejected by errorFn).
 * warning : `outcome` must be an error : this is enforced by an always-active assert(),
 *           so a successful outcome stops program execution. */
size_t BMK_extract_errorResult(BMK_runOutcome_t outcome)
{
    size_t errorResult;
    assert(outcome.error_tag_never_ever_use_directly != 0);
    errorResult = outcome.error_result_never_ever_use_directly;
    return errorResult;
}

/* BMK_runOutcome_error() :
 * Builds an error outcome : every byte is first zeroed,
 * then the error tag is raised and `errorResult` is recorded. */
static BMK_runOutcome_t BMK_runOutcome_error(size_t errorResult)
{
    BMK_runOutcome_t failure;
    memset(&failure, 0, sizeof(failure));
    failure.error_result_never_ever_use_directly = errorResult;
    failure.error_tag_never_ever_use_directly = 1;
    return failure;
}

/* BMK_setValid_runTime() :
 * Builds a successful outcome wrapping `runTime`.
 * The structure is zeroed first, like in BMK_runOutcome_error(),
 * so that no member (notably the error result, unused on success)
 * is returned with an indeterminate value. */
static BMK_runOutcome_t BMK_setValid_runTime(BMK_runTime_t runTime)
{
    BMK_runOutcome_t outcome;
    memset(&outcome, 0, sizeof(outcome));
    outcome.error_tag_never_ever_use_directly = 0;   /* 0 == success */
    outcome.internal_never_ever_use_directly = runTime;
    return outcome;
}


/* BMK_benchFunction() :
 * Runs p.benchFn over all p.blockCount blocks, `nbLoops` times, and measures the total duration.
 * - nbLoops == 0 is treated as 1.
 * - p.initFn is optional (provide NULL if none) ; it is invoked once, inside the timed section.
 * - p.benchFn must return a size_t value that p.errorFn can interpret.
 * - p.errorFn is optional ; it is only consulted during the first loop.
 * - p.blockResults is optional (provide NULL if not required) ;
 *   it receives the benchFn result of each block, from the first loop only.
 * @return : on success, a run time where
 *             nanoSecPerRun = total duration / nbLoops
 *                             (can be zero if run time < timer resolution),
 *             sumOfReturn   = sum of benchFn results over all blocks of the first loop.
 *           on failure (errorFn flags a result), an error outcome carrying that result.
 */
BMK_runOutcome_t BMK_benchFunction(BMK_benchParams_t p,
                                   unsigned nbLoops)
{
    size_t sumOfResults = 0;
    size_t bufNb;
    UTIL_time_t startTime;
    unsigned loopNb;

    if (nbLoops == 0) nbLoops = 1;   /* always run at least once */

    /* warm up and erase result buffers, before the clock starts.
     * note : sleeping a few ms and waiting for the next timer tick at this point
     *        was tried, and found to lower accuracy of multiple calls of 1 nbLoops
     *        vs 1 call of multiple nbLoops (it makes the former slower). */
    for (bufNb = 0; bufNb < p.blockCount; bufNb++) {
        memset(p.dstBuffers[bufNb], 0xE5, p.dstCapacities[bufNb]);
    }

    /* timed section */
    startTime = UTIL_getTime();
    if (p.initFn != NULL) p.initFn(p.initPayload);

    for (loopNb = 0; loopNb < nbLoops; loopNb++) {
        unsigned blockNb;
        for (blockNb = 0; blockNb < p.blockCount; blockNb++) {
            size_t const res = p.benchFn(p.srcBuffers[blockNb], p.srcSizes[blockNb],
                                         p.dstBuffers[blockNb], p.dstCapacities[blockNb],
                                         p.benchPayload);

            if (loopNb != 0) continue;   /* results are only inspected during the first loop */

            if (p.blockResults != NULL) p.blockResults[blockNb] = res;
            if ((p.errorFn != NULL) && (p.errorFn(res))) {
                RETURN_QUIET_ERROR(BMK_runOutcome_error(res),
                    "Function benchmark failed on block %u (of size %u) with error %i",
                    blockNb, (unsigned)p.srcSizes[blockNb], (int)res);
            }
            sumOfResults += res;
        }
    }

    {   U64 const elapsed_ns = UTIL_clockSpanNano(startTime);
        BMK_runTime_t rt;
        rt.sumOfReturn = sumOfResults;
        rt.nanoSecPerRun = (double)elapsed_ns / nbLoops;
        return BMK_setValid_runTime(rt);
    }
}


/* ====  Benchmarking any function, providing intermediate results  ==== */

/* State carried across successive BMK_benchTimedFn() calls.
 * Initialized by BMK_resetTimedFnState(). */
struct BMK_timedFnState_s {
    U64 timeSpent_ns;          /* sum of measured durations of all successful runs so far (including runs too short to be reported) ; compared to timeBudget_ns by BMK_isCompleted_TimedFn() */
    U64 timeBudget_ns;         /* total time allowance, derived from total_ms */
    U64 runBudget_ns;          /* target duration of a single run, derived from run_ms */
    BMK_runTime_t fastestRun;  /* starting value for best-run comparisons ; set to a very large sentinel at reset, and not written anywhere else in the visible code */
    unsigned nbLoops;          /* nb of loops requested from the next BMK_benchFunction() call ; re-estimated after every run */
    UTIL_time_t coolTime;      /* timestamp of the last reset or cool-down pause (overheat protection) */
};  /* typedef'd to BMK_timedFnState_t in a header (this note originally says bench.h ; this file includes benchfn.h - TODO confirm) */

/* BMK_createTimedFnState() :
 * Allocates a timed-benchmark state on the heap and initializes it
 * through BMK_resetTimedFnState(total_ms, run_ms).
 * @return : the new state, or NULL if malloc() failed.
 *           Release it with BMK_freeTimedFnState(). */
BMK_timedFnState_t* BMK_createTimedFnState(unsigned total_ms, unsigned run_ms)
{
    BMK_timedFnState_t* const state = (BMK_timedFnState_t*)malloc(sizeof(*state));
    if (state != NULL) {
        BMK_resetTimedFnState(state, total_ms, run_ms);
    }
    return state;
}

/* BMK_freeTimedFnState() :
 * Releases a state allocated by BMK_createTimedFnState().
 * `state` is handed directly to free(), so NULL is accepted. */
void BMK_freeTimedFnState(BMK_timedFnState_t* state)
{
    free(state);
}

/* BMK_initStatic_timedFnState() :
 * Initializes a timed-benchmark state inside a caller-provided buffer (no allocation).
 * @buffer : memory area to host the state ; must satisfy `long long` alignment.
 * @size   : nb of bytes available at `buffer` ; must be >= sizeof(struct BMK_timedFnState_s).
 * @total_ms, @run_ms : forwarded to BMK_resetTimedFnState().
 * @return : `buffer`, typed as a state pointer,
 *           or NULL if `buffer` is NULL, too small, or misaligned. */
BMK_timedFnState_t* BMK_initStatic_timedFnState(void* buffer, size_t size, unsigned total_ms, unsigned run_ms)
{
    /* static assert : division by zero in a constant expression (hence compilation failure)
     * if BMK_timedFnState_shell is smaller than the real state structure */
    enum { timedFnState_staticSize_isLargeEnough=(1/(sizeof(BMK_timedFnState_shell) >= sizeof(struct BMK_timedFnState_s))) };
    typedef struct { char c; long long ll; } ll_align;  /* this will force ll to be aligned at its next best position */
    size_t const ll_alignment = offsetof(ll_align, ll); /* provides the minimal alignment restriction for long long */
    BMK_timedFnState_t* const r = (BMK_timedFnState_t*)buffer;
    if (buffer == NULL) return NULL;   /* NULL would pass both checks below, then be dereferenced by the reset */
    if (size < sizeof(struct BMK_timedFnState_s)) return NULL;
    if ((size_t)buffer % ll_alignment) return NULL;  /* must be aligned to satisfy `long long` alignment requirement */
    BMK_resetTimedFnState(r, total_ms, run_ms);
    return r;
}

/* BMK_resetTimedFnState() :
 * (Re)initializes `timedFnState` for a new benchmark session.
 * @total_ms : total time budget, in milliseconds ; 0 is replaced by 1.
 * @run_ms   : target duration of one run, in milliseconds ; 0 is replaced by 1,
 *             and the value is capped to the total budget.
 * Time spent is cleared, nbLoops restarts at 1, fastestRun receives sentinel values,
 * and the overheat-protection timer restarts from now. */
void BMK_resetTimedFnState(BMK_timedFnState_t* timedFnState, unsigned total_ms, unsigned run_ms)
{
    unsigned const totalBudget_ms = total_ms ? total_ms : 1;
    unsigned runBudget_ms = run_ms ? run_ms : 1;
    if (runBudget_ms > totalBudget_ms) runBudget_ms = totalBudget_ms;

    /* budgets : milliseconds converted to nanoseconds */
    timedFnState->timeBudget_ns = (U64)totalBudget_ms * TIMELOOP_NANOSEC / 1000;
    timedFnState->runBudget_ns = (U64)runBudget_ms * TIMELOOP_NANOSEC / 1000;
    timedFnState->timeSpent_ns = 0;

    /* sentinel : hopefully large enough, must be larger than any potential measurement */
    timedFnState->fastestRun.nanoSecPerRun = (double)TIMELOOP_NANOSEC * 2000000000;
    timedFnState->fastestRun.sumOfReturn = (size_t)(-1LL);

    timedFnState->nbLoops = 1;
    timedFnState->coolTime = UTIL_getTime();
}

/* Tells if nb of seconds set in timedFnState for all runs is spent.
 * note : this function will return 1 if BMK_benchFunctionTimed() has actually errored. */
int BMK_isCompleted_TimedFn(const BMK_timedFnState_t* timedFnState)
{
    return (timedFnState->timeSpent_ns >= timedFnState->timeBudget_ns);
}


/* MIN() : smallest of 2 values.
 * Any previous definition is discarded first.
 * note : the selected argument is evaluated twice, do not pass expressions with side effects. */
#undef MIN
#define MIN(a,b)   ( (a) < (b) ? (a) : (b) )

/* note : MINUSABLETIME is not referenced in the visible part of this file */
#define MINUSABLETIME  (TIMELOOP_NANOSEC / 2)  /* 0.5 seconds */

/* BMK_benchTimedFn() :
 * Calls BMK_benchFunction() repeatedly, adjusting cont->nbLoops after each run,
 * until one run lasts at least half of cont->runBudget_ns.
 * Every successful run, reportable or not, is added to cont->timeSpent_ns.
 * Runs are paused for COOLPERIOD_SEC seconds
 * whenever more than ACTIVEPERIOD_MICROSEC elapsed since cont->coolTime.
 * @return : on success, the fastest of { cont->fastestRun, last run } ;
 *           on failure, the error outcome of BMK_benchFunction(), returned immediately. */
BMK_runOutcome_t BMK_benchTimedFn(BMK_timedFnState_t* cont,
                                  BMK_benchParams_t p)
{
    U64 const budget_ns = cont->runBudget_ns;
    U64 const minReportable_ns = budget_ns / 2;
    BMK_runTime_t best = cont->fastestRun;

    for (;;) {
        BMK_runOutcome_t outcome;
        BMK_runTime_t current;
        double elapsed_ns;

        /* Overheat protection */
        if (UTIL_clockSpanMicro(cont->coolTime) > ACTIVEPERIOD_MICROSEC) {
            DEBUGOUTPUT("\rcooling down ...    \r");
            UTIL_sleep(COOLPERIOD_SEC);
            cont->coolTime = UTIL_getTime();
        }

        outcome = BMK_benchFunction(p, cont->nbLoops);
        if (!BMK_isSuccessful_runOutcome(outcome)) {
            return outcome;   /* error : move out */
        }

        current = BMK_extract_runTime(outcome);
        elapsed_ns = current.nanoSecPerRun * cont->nbLoops;   /* duration of the run just completed */
        cont->timeSpent_ns += (unsigned long long)elapsed_ns;

        /* estimate nbLoops so that next run lasts approximately the run budget */
        if (elapsed_ns > (budget_ns / 50)) {
            double const fastest_ns = MIN(best.nanoSecPerRun, current.nanoSecPerRun);
            cont->nbLoops = (U32)(budget_ns / fastest_ns) + 1;
        } else {
            /* run was too short for a reliable estimation : blindly increase workload by x multiplier */
            const unsigned multiplier = 10;
            assert(cont->nbLoops < ((unsigned)-1) / multiplier);  /* avoid overflow */
            cont->nbLoops *= multiplier;
        }

        /* don't report results for which benchmark run time was too small :
         * increased risks of rounding errors. Try again with the updated nbLoops. */
        if (elapsed_ns < minReportable_ns) continue;

        if (current.nanoSecPerRun < best.nanoSecPerRun) {
            best = current;
        }
        break;
    }

    return BMK_setValid_runTime(best);
}
separated bench module into benchfn and benchzstd it shall be possible to use benchfn without any dependency on zstd. 2018-11-13 11:01:59 -08:00			`/*`
			`* Copyright (c) 2016-present, Yann Collet, Facebook, Inc.`
			`* All rights reserved.`
			`*`
			`* This source code is licensed under both the BSD-style license (found in the`
			`* LICENSE file in the root directory of this source tree) and the GPLv2 (found`
			`* in the COPYING file in the root directory of this source tree).`
			`* You may select, at your option, one of the above-listed licenses.`
			`*/`



			`/* *************************************`
			`* Includes`
			`***************************************/`
			`#include "platform.h" /* Large Files support */`
			`#include "util.h" /* UTIL_getFileSize, UTIL_sleep */`
			`#include <stdlib.h> /* malloc, free */`
			`#include <string.h> /* memset */`
			`#include <stdio.h> /* fprintf, fopen */`
changed benchfn api to use structure for function parameters as it expresses much clearer than a long list of parameters, since each parameter can now be named. 2018-11-13 13:05:39 -08:00			`#undef NDEBUG /* assert must not be disabled */`
separated bench module into benchfn and benchzstd it shall be possible to use benchfn without any dependency on zstd. 2018-11-13 11:01:59 -08:00			`#include <assert.h> /* assert */`

			`#include "mem.h"`
			`#include "benchfn.h"`


			`/* *************************************`
			`* Constants`
			`***************************************/`
			`#define TIMELOOP_MICROSEC (1*1000000ULL) /* 1 second */`
			`#define TIMELOOP_NANOSEC (1*1000000000ULL) /* 1 second */`
			`#define ACTIVEPERIOD_MICROSEC (70*TIMELOOP_MICROSEC) /* 70 seconds */`
			`#define COOLPERIOD_SEC 10`

			`#define KB *(1 <<10)`
			`#define MB *(1 <<20)`
			`#define GB *(1U<<30)`


			`/* *************************************`
			`* Errors`
			`***************************************/`
			`#ifndef DEBUG`
			`# define DEBUG 0`
			`#endif`

changed benchfn api to use structure for function parameters as it expresses much clearer than a long list of parameters, since each parameter can now be named. 2018-11-13 13:05:39 -08:00			`#define DISPLAY(...) fprintf(stderr, __VA_ARGS__)`
separated bench module into benchfn and benchzstd it shall be possible to use benchfn without any dependency on zstd. 2018-11-13 11:01:59 -08:00			`#define DEBUGOUTPUT(...) { if (DEBUG) DISPLAY(__VA_ARGS__); }`

			`/* error without displaying */`
benchfn can provided faulty return value with BMK_extract_returnValue() 2018-11-13 12:01:17 -08:00			`#define RETURN_QUIET_ERROR(retValue, ...) { \`
separated bench module into benchfn and benchzstd it shall be possible to use benchfn without any dependency on zstd. 2018-11-13 11:01:59 -08:00			`DEBUGOUTPUT("%s: %i: \n", __FILE__, __LINE__); \`
benchfn can provided faulty return value with BMK_extract_returnValue() 2018-11-13 12:01:17 -08:00			`DEBUGOUTPUT("Error : "); \`
separated bench module into benchfn and benchzstd it shall be possible to use benchfn without any dependency on zstd. 2018-11-13 11:01:59 -08:00			`DEBUGOUTPUT(__VA_ARGS__); \`
			`DEBUGOUTPUT(" \n"); \`
			`return retValue; \`
			`}`


			`/* *************************************`
			`* Benchmarking an arbitrary function`
			`***************************************/`

			`int BMK_isSuccessful_runOutcome(BMK_runOutcome_t outcome)`
			`{`
benchfn can provided faulty return value with BMK_extract_returnValue() 2018-11-13 12:01:17 -08:00			`return outcome.error_tag_never_ever_use_directly == 0;`
separated bench module into benchfn and benchzstd it shall be possible to use benchfn without any dependency on zstd. 2018-11-13 11:01:59 -08:00			`}`

			`/* warning : this function will stop program execution if outcome is invalid !`
			`* check outcome validity first, using BMK_isValid_runResult() */`
			`BMK_runTime_t BMK_extract_runTime(BMK_runOutcome_t outcome)`
			`{`
benchfn can provided faulty return value with BMK_extract_returnValue() 2018-11-13 12:01:17 -08:00			`assert(outcome.error_tag_never_ever_use_directly == 0);`
			`return outcome.internal_never_ever_use_directly;`
separated bench module into benchfn and benchzstd it shall be possible to use benchfn without any dependency on zstd. 2018-11-13 11:01:59 -08:00			`}`

benchfn can provided faulty return value with BMK_extract_returnValue() 2018-11-13 12:01:17 -08:00			`size_t BMK_extract_errorResult(BMK_runOutcome_t outcome)`
			`{`
			`assert(outcome.error_tag_never_ever_use_directly != 0);`
			`return outcome.error_result_never_ever_use_directly;`
			`}`

			`static BMK_runOutcome_t BMK_runOutcome_error(size_t errorResult)`
separated bench module into benchfn and benchzstd it shall be possible to use benchfn without any dependency on zstd. 2018-11-13 11:01:59 -08:00			`{`
			`BMK_runOutcome_t b;`
			`memset(&b, 0, sizeof(b));`
benchfn can provided faulty return value with BMK_extract_returnValue() 2018-11-13 12:01:17 -08:00			`b.error_tag_never_ever_use_directly = 1;`
			`b.error_result_never_ever_use_directly = errorResult;`
separated bench module into benchfn and benchzstd it shall be possible to use benchfn without any dependency on zstd. 2018-11-13 11:01:59 -08:00			`return b;`
			`}`

			`static BMK_runOutcome_t BMK_setValid_runTime(BMK_runTime_t runTime)`
			`{`
			`BMK_runOutcome_t outcome;`
benchfn can provided faulty return value with BMK_extract_returnValue() 2018-11-13 12:01:17 -08:00			`outcome.error_tag_never_ever_use_directly = 0;`
			`outcome.internal_never_ever_use_directly = runTime;`
separated bench module into benchfn and benchzstd it shall be possible to use benchfn without any dependency on zstd. 2018-11-13 11:01:59 -08:00			`return outcome;`
			`}`


			/* initFn will be measured once, benchFn will be measured `nbLoops` times */
			`/* initFn is optional, provide NULL if none */`
benchfn can provided faulty return value with BMK_extract_returnValue() 2018-11-13 12:01:17 -08:00			`/* benchFn must return a size_t value that errorFn can interpret */`
separated bench module into benchfn and benchzstd it shall be possible to use benchfn without any dependency on zstd. 2018-11-13 11:01:59 -08:00			`/* takes # of blocks and list of size & stuff for each. */`
			`/* can report result of benchFn for each block into blockResult. */`
			`/* blockResult is optional, provide NULL if this information is not required */`
benchfn can provided faulty return value with BMK_extract_returnValue() 2018-11-13 12:01:17 -08:00			`/* note : time per loop can be reported as zero if run time < timer resolution */`
changed benchfn api to use structure for function parameters as it expresses much clearer than a long list of parameters, since each parameter can now be named. 2018-11-13 13:05:39 -08:00			`BMK_runOutcome_t BMK_benchFunction(BMK_benchParams_t p,`
			`unsigned nbLoops)`
separated bench module into benchfn and benchzstd it shall be possible to use benchfn without any dependency on zstd. 2018-11-13 11:01:59 -08:00			`{`
			`size_t dstSize = 0;`
benchfn can provided faulty return value with BMK_extract_returnValue() 2018-11-13 12:01:17 -08:00			`nbLoops += !nbLoops; /* minimum nbLoops is 1 */`
separated bench module into benchfn and benchzstd it shall be possible to use benchfn without any dependency on zstd. 2018-11-13 11:01:59 -08:00
			`/* init */`
			`{ size_t i;`
changed benchfn api to use structure for function parameters as it expresses much clearer than a long list of parameters, since each parameter can now be named. 2018-11-13 13:05:39 -08:00			`for(i = 0; i < p.blockCount; i++) {`
			`memset(p.dstBuffers[i], 0xE5, p.dstCapacities[i]); /* warm up and erase result buffer */`
separated bench module into benchfn and benchzstd it shall be possible to use benchfn without any dependency on zstd. 2018-11-13 11:01:59 -08:00			`}`
			`#if 0`
			`/* based on testing these seem to lower accuracy of multiple calls of 1 nbLoops vs 1 call of multiple nbLoops`
			`* (Makes former slower)`
			`*/`
			`UTIL_sleepMilli(5); /* give processor time to other processes */`
			`UTIL_waitForNextTick();`
			`#endif`
			`}`

			`/* benchmark */`
			`{ UTIL_time_t const clockStart = UTIL_getTime();`
			`unsigned loopNb, blockNb;`
changed benchfn api to use structure for function parameters as it expresses much clearer than a long list of parameters, since each parameter can now be named. 2018-11-13 13:05:39 -08:00			`if (p.initFn != NULL) p.initFn(p.initPayload);`
separated bench module into benchfn and benchzstd it shall be possible to use benchfn without any dependency on zstd. 2018-11-13 11:01:59 -08:00			`for (loopNb = 0; loopNb < nbLoops; loopNb++) {`
changed benchfn api to use structure for function parameters as it expresses much clearer than a long list of parameters, since each parameter can now be named. 2018-11-13 13:05:39 -08:00			`for (blockNb = 0; blockNb < p.blockCount; blockNb++) {`
			`size_t const res = p.benchFn(p.srcBuffers[blockNb], p.srcSizes[blockNb],`
			`p.dstBuffers[blockNb], p.dstCapacities[blockNb],`
			`p.benchPayload);`
separated bench module into benchfn and benchzstd it shall be possible to use benchfn without any dependency on zstd. 2018-11-13 11:01:59 -08:00			`if (loopNb == 0) {`
changed benchfn api to use structure for function parameters as it expresses much clearer than a long list of parameters, since each parameter can now be named. 2018-11-13 13:05:39 -08:00			`if (p.blockResults != NULL) p.blockResults[blockNb] = res;`
			`if ((p.errorFn != NULL) && (p.errorFn(res))) {`
benchfn can provided faulty return value with BMK_extract_returnValue() 2018-11-13 12:01:17 -08:00			`RETURN_QUIET_ERROR(BMK_runOutcome_error(res),`
separated bench module into benchfn and benchzstd it shall be possible to use benchfn without any dependency on zstd. 2018-11-13 11:01:59 -08:00			`"Function benchmark failed on block %u (of size %u) with error %i",`
fix confusion between unsigned <-> U32 as suggested in #1441. generally U32 and unsigned are the same thing, except when they are not ... case : 32-bit compilation for MIPS (uint32_t == unsigned long) A vast majority of transformation consists in transforming U32 into unsigned. In rare cases, it's the other way around (typically for internal code, such as seeds). Among a few issues this patches solves : - some parameters were declared with type `unsigned` in .h, but with type `U32` in their implementation .c . - some parameters have type unsigned*, but the caller user a pointer to U32 instead. These fixes are useful. However, the bulk of changes is about %u formating, which requires unsigned type, but generally receives U32 values instead, often just for brevity (U32 is shorter than unsigned). These changes are generally minor, or even annoying. As a consequence, the amount of code changed is larger than I would expect for such a patch. Testing is also a pain : it requires manually modifying `mem.h`, in order to lie about `U32` and force it to be an `unsigned long` typically. On a 64-bit system, this will break the equivalence unsigned == U32. Unfortunately, it will also break a few static_assert(), controlling structure sizes. So it also requires modifying `debug.h` to make `static_assert()` a noop. And then reverting these changes. So it's inconvenient, and as a consequence, this property is currently not checked during CI tests. Therefore, these problems can emerge again in the future. I wonder if it is worth ensuring proper distinction of U32 != unsigned in CI tests. It's another restriction for coding, adding more frustration during merge tests, since most platforms don't need this distinction (hence contributor will not see it), and while this can matter in theory, the number of platforms impacted seems minimal. Thoughts ? 2018-12-21 16:19:44 -08:00			`blockNb, (unsigned)p.srcSizes[blockNb], (int)res);`
separated bench module into benchfn and benchzstd it shall be possible to use benchfn without any dependency on zstd. 2018-11-13 11:01:59 -08:00			`}`
			`dstSize += res;`
			`} }`
			`} /* for (loopNb = 0; loopNb < nbLoops; loopNb++) */`

			`{ U64 const totalTime = UTIL_clockSpanNano(clockStart);`
			`BMK_runTime_t rt;`
added ability to create timedFnState on stack 2019-01-25 14:22:25 -08:00			`rt.nanoSecPerRun = (double)totalTime / nbLoops;`
separated bench module into benchfn and benchzstd it shall be possible to use benchfn without any dependency on zstd. 2018-11-13 11:01:59 -08:00			`rt.sumOfReturn = dstSize;`
			`return BMK_setValid_runTime(rt);`
			`} }`
			`}`


			`/* ==== Benchmarking any function, providing intermediate results ==== */`

			`struct BMK_timedFnState_s {`
			`U64 timeSpent_ns;`
			`U64 timeBudget_ns;`
			`U64 runBudget_ns;`
			`BMK_runTime_t fastestRun;`
			`unsigned nbLoops;`
			`UTIL_time_t coolTime;`
			`}; /* typedef'd to BMK_timedFnState_t within bench.h */`

			`BMK_timedFnState_t* BMK_createTimedFnState(unsigned total_ms, unsigned run_ms)`
			`{`
			`BMK_timedFnState_t* const r = (BMK_timedFnState_t*)malloc(sizeof(*r));`
			`if (r == NULL) return NULL; /* malloc() error */`
			`BMK_resetTimedFnState(r, total_ms, run_ms);`
			`return r;`
			`}`

			`void BMK_freeTimedFnState(BMK_timedFnState_t* state) {`
			`free(state);`
			`}`

added ability to create timedFnState on stack 2019-01-25 14:22:25 -08:00			`BMK_timedFnState_t* BMK_initStatic_timedFnState(void* buffer, size_t size, unsigned total_ms, unsigned run_ms)`
			`{`
fixed static size of benchFnState added a static assert to ensure condition is respected on target platform 2019-01-25 21:58:44 -08:00			`enum { timedFnState_staticSize_isLargeEnough=(1/(sizeof(BMK_timedFnState_shell) >= sizeof(struct BMK_timedFnState_s))) }; /* static assert */`
			`typedef struct { char c; long long ll; } ll_align; /* this will force ll to be aligned at its next best position */`
			`size_t const ll_alignment = offsetof(ll_align, ll); /* provides the minimal alignment restriction for long long */`
added ability to create timedFnState on stack 2019-01-25 14:22:25 -08:00			`BMK_timedFnState_t* const r = (BMK_timedFnState_t*)buffer;`
			`if (size < sizeof(struct BMK_timedFnState_s)) return NULL;`
fixed static size of benchFnState added a static assert to ensure condition is respected on target platform 2019-01-25 21:58:44 -08:00			if ((size_t)buffer % ll_alignment) return NULL; /* must be aligned to satisfy `long long` alignment requirement */
added ability to create timedFnState on stack 2019-01-25 14:22:25 -08:00			`BMK_resetTimedFnState(r, total_ms, run_ms);`
			`return r;`
			`}`

separated bench module into benchfn and benchzstd it shall be possible to use benchfn without any dependency on zstd. 2018-11-13 11:01:59 -08:00			`void BMK_resetTimedFnState(BMK_timedFnState_t* timedFnState, unsigned total_ms, unsigned run_ms)`
			`{`
			`if (!total_ms) total_ms = 1 ;`
			`if (!run_ms) run_ms = 1;`
			`if (run_ms > total_ms) run_ms = total_ms;`
			`timedFnState->timeSpent_ns = 0;`
			`timedFnState->timeBudget_ns = (U64)total_ms * TIMELOOP_NANOSEC / 1000;`
			`timedFnState->runBudget_ns = (U64)run_ms * TIMELOOP_NANOSEC / 1000;`
added ability to create timedFnState on stack 2019-01-25 14:22:25 -08:00			`timedFnState->fastestRun.nanoSecPerRun = (double)TIMELOOP_NANOSEC * 2000000000; /* hopefully large enough : must be larger than any potential measurement */`
separated bench module into benchfn and benchzstd it shall be possible to use benchfn without any dependency on zstd. 2018-11-13 11:01:59 -08:00			`timedFnState->fastestRun.sumOfReturn = (size_t)(-1LL);`
			`timedFnState->nbLoops = 1;`
			`timedFnState->coolTime = UTIL_getTime();`
			`}`

			`/* Tells if nb of seconds set in timedFnState for all runs is spent.`
			`* note : this function will return 1 if BMK_benchFunctionTimed() has actually errored. */`
			`int BMK_isCompleted_TimedFn(const BMK_timedFnState_t* timedFnState)`
			`{`
			`return (timedFnState->timeSpent_ns >= timedFnState->timeBudget_ns);`
			`}`


			`#undef MIN`
			`#define MIN(a,b) ( (a) < (b) ? (a) : (b) )`

			`#define MINUSABLETIME (TIMELOOP_NANOSEC / 2) /* 0.5 seconds */`

changed benchfn api to use structure for function parameters as it expresses much clearer than a long list of parameters, since each parameter can now be named. 2018-11-13 13:05:39 -08:00			`BMK_runOutcome_t BMK_benchTimedFn(BMK_timedFnState_t* cont,`
			`BMK_benchParams_t p)`
separated bench module into benchfn and benchzstd it shall be possible to use benchfn without any dependency on zstd. 2018-11-13 11:01:59 -08:00			`{`
			`U64 const runBudget_ns = cont->runBudget_ns;`
			`U64 const runTimeMin_ns = runBudget_ns / 2;`
			`int completed = 0;`
			`BMK_runTime_t bestRunTime = cont->fastestRun;`

			`while (!completed) {`
			`BMK_runOutcome_t runResult;`

			`/* Overheat protection */`
			`if (UTIL_clockSpanMicro(cont->coolTime) > ACTIVEPERIOD_MICROSEC) {`
			`DEBUGOUTPUT("\rcooling down ... \r");`
			`UTIL_sleep(COOLPERIOD_SEC);`
			`cont->coolTime = UTIL_getTime();`
			`}`

			`/* reinitialize capacity */`
changed benchfn api to use structure for function parameters as it expresses much clearer than a long list of parameters, since each parameter can now be named. 2018-11-13 13:05:39 -08:00			`runResult = BMK_benchFunction(p, cont->nbLoops);`
separated bench module into benchfn and benchzstd it shall be possible to use benchfn without any dependency on zstd. 2018-11-13 11:01:59 -08:00
			`if(!BMK_isSuccessful_runOutcome(runResult)) { /* error : move out */`
benchfn can provided faulty return value with BMK_extract_returnValue() 2018-11-13 12:01:17 -08:00			`return runResult;`
separated bench module into benchfn and benchzstd it shall be possible to use benchfn without any dependency on zstd. 2018-11-13 11:01:59 -08:00			`}`

			`{ BMK_runTime_t const newRunTime = BMK_extract_runTime(runResult);`
added ability to create timedFnState on stack 2019-01-25 14:22:25 -08:00			`double const loopDuration_ns = newRunTime.nanoSecPerRun * cont->nbLoops;`
separated bench module into benchfn and benchzstd it shall be possible to use benchfn without any dependency on zstd. 2018-11-13 11:01:59 -08:00
added ability to create timedFnState on stack 2019-01-25 14:22:25 -08:00			`cont->timeSpent_ns += (unsigned long long)loopDuration_ns;`
separated bench module into benchfn and benchzstd it shall be possible to use benchfn without any dependency on zstd. 2018-11-13 11:01:59 -08:00
			`/* estimate nbLoops for next run to last approximately 1 second */`
			`if (loopDuration_ns > (runBudget_ns / 50)) {`
added ability to create timedFnState on stack 2019-01-25 14:22:25 -08:00			`double const fastestRun_ns = MIN(bestRunTime.nanoSecPerRun, newRunTime.nanoSecPerRun);`
separated bench module into benchfn and benchzstd it shall be possible to use benchfn without any dependency on zstd. 2018-11-13 11:01:59 -08:00			`cont->nbLoops = (U32)(runBudget_ns / fastestRun_ns) + 1;`
			`} else {`
			`/* previous run was too short : blindly increase workload by x multiplier */`
			`const unsigned multiplier = 10;`
			`assert(cont->nbLoops < ((unsigned)-1) / multiplier); /* avoid overflow */`
			`cont->nbLoops *= multiplier;`
			`}`

			`if(loopDuration_ns < runTimeMin_ns) {`
			`/* don't report results for which benchmark run time was too small : increased risks of rounding errors */`
			`assert(completed == 0);`
			`continue;`
			`} else {`
			`if(newRunTime.nanoSecPerRun < bestRunTime.nanoSecPerRun) {`
			`bestRunTime = newRunTime;`
			`}`
			`completed = 1;`
			`}`
			`}`
			`} /* while (!completed) */`

			`return BMK_setValid_runTime(bestRunTime);`
			`}`