The Design and Implementation of the FreeBSD Operating System, Second Edition
Now available: The Design and Implementation of the FreeBSD Operating System (Second Edition)


[ source navigation ] [ diff markup ] [ identifier search ] [ freetext search ] [ file search ] [ list types ] [ track identifier ]

FreeBSD/Linux Kernel Cross Reference
sys/contrib/zstd/programs/benchfn.c

Version: -  FREEBSD  -  FREEBSD-13-STABLE  -  FREEBSD-13-0  -  FREEBSD-12-STABLE  -  FREEBSD-12-0  -  FREEBSD-11-STABLE  -  FREEBSD-11-0  -  FREEBSD-10-STABLE  -  FREEBSD-10-0  -  FREEBSD-9-STABLE  -  FREEBSD-9-0  -  FREEBSD-8-STABLE  -  FREEBSD-8-0  -  FREEBSD-7-STABLE  -  FREEBSD-7-0  -  FREEBSD-6-STABLE  -  FREEBSD-6-0  -  FREEBSD-5-STABLE  -  FREEBSD-5-0  -  FREEBSD-4-STABLE  -  FREEBSD-3-STABLE  -  FREEBSD22  -  l41  -  OPENBSD  -  linux-2.6  -  MK84  -  PLAN9  -  xnu-8792 
SearchContext: -  none  -  3  -  10 

    1 /*
    2  * Copyright (c) Yann Collet, Facebook, Inc.
    3  * All rights reserved.
    4  *
    5  * This source code is licensed under both the BSD-style license (found in the
    6  * LICENSE file in the root directory of this source tree) and the GPLv2 (found
    7  * in the COPYING file in the root directory of this source tree).
    8  * You may select, at your option, one of the above-listed licenses.
    9  */
   10 
   11 
   12 
   13 /* *************************************
   14 *  Includes
   15 ***************************************/
   16 #include <stdlib.h>      /* malloc, free */
   17 #include <string.h>      /* memset */
   18 #include <assert.h>      /* assert */
   19 
   20 #include "timefn.h"        /* UTIL_time_t, UTIL_getTime */
   21 #include "benchfn.h"
   22 
   23 
   24 /* *************************************
   25 *  Constants
   26 ***************************************/
   27 #define TIMELOOP_MICROSEC     SEC_TO_MICRO      /* 1 second */
   28 #define TIMELOOP_NANOSEC      (1*1000000000ULL) /* 1 second */
   29 
   30 #define KB *(1 <<10)
   31 #define MB *(1 <<20)
   32 #define GB *(1U<<30)
   33 
   34 
   35 /* *************************************
   36 *  Debug errors
   37 ***************************************/
   38 #if defined(DEBUG) && (DEBUG >= 1)
   39 #  include <stdio.h>       /* fprintf */
   40 #  define DISPLAY(...)       fprintf(stderr, __VA_ARGS__)
   41 #  define DEBUGOUTPUT(...) { if (DEBUG) DISPLAY(__VA_ARGS__); }
   42 #else
   43 #  define DEBUGOUTPUT(...)
   44 #endif
   45 
   46 
   47 /* error without displaying */
   48 #define RETURN_QUIET_ERROR(retValue, ...) {           \
   49     DEBUGOUTPUT("%s: %i: \n", __FILE__, __LINE__);    \
   50     DEBUGOUTPUT("Error : ");                          \
   51     DEBUGOUTPUT(__VA_ARGS__);                         \
   52     DEBUGOUTPUT(" \n");                               \
   53     return retValue;                                  \
   54 }
   55 
   56 /* Abort execution if a condition is not met */
   57 #define CONTROL(c) { if (!(c)) { DEBUGOUTPUT("error: %s \n", #c); abort(); } }
   58 
   59 
   60 /* *************************************
   61 *  Benchmarking an arbitrary function
   62 ***************************************/
   63 
   64 int BMK_isSuccessful_runOutcome(BMK_runOutcome_t outcome)
   65 {
   66     return outcome.error_tag_never_ever_use_directly == 0;
   67 }
   68 
   69 /* warning : this function will stop program execution if outcome is invalid !
   70  *           check outcome validity first, using BMK_isValid_runResult() */
   71 BMK_runTime_t BMK_extract_runTime(BMK_runOutcome_t outcome)
   72 {
   73     CONTROL(outcome.error_tag_never_ever_use_directly == 0);
   74     return outcome.internal_never_ever_use_directly;
   75 }
   76 
   77 size_t BMK_extract_errorResult(BMK_runOutcome_t outcome)
   78 {
   79     CONTROL(outcome.error_tag_never_ever_use_directly != 0);
   80     return outcome.error_result_never_ever_use_directly;
   81 }
   82 
   83 static BMK_runOutcome_t BMK_runOutcome_error(size_t errorResult)
   84 {
   85     BMK_runOutcome_t b;
   86     memset(&b, 0, sizeof(b));
   87     b.error_tag_never_ever_use_directly = 1;
   88     b.error_result_never_ever_use_directly = errorResult;
   89     return b;
   90 }
   91 
   92 static BMK_runOutcome_t BMK_setValid_runTime(BMK_runTime_t runTime)
   93 {
   94     BMK_runOutcome_t outcome;
   95     outcome.error_tag_never_ever_use_directly = 0;
   96     outcome.internal_never_ever_use_directly = runTime;
   97     return outcome;
   98 }
   99 
  100 
  101 /* initFn will be measured once, benchFn will be measured `nbLoops` times */
  102 /* initFn is optional, provide NULL if none */
  103 /* benchFn must return a size_t value that errorFn can interpret */
  104 /* takes # of blocks and list of size & stuff for each. */
  105 /* can report result of benchFn for each block into blockResult. */
  106 /* blockResult is optional, provide NULL if this information is not required */
  107 /* note : time per loop can be reported as zero if run time < timer resolution */
  108 BMK_runOutcome_t BMK_benchFunction(BMK_benchParams_t p,
  109                                    unsigned nbLoops)
  110 {
  111     size_t dstSize = 0;
  112     nbLoops += !nbLoops;   /* minimum nbLoops is 1 */
  113 
  114     /* init */
  115     {   size_t i;
  116         for(i = 0; i < p.blockCount; i++) {
  117             memset(p.dstBuffers[i], 0xE5, p.dstCapacities[i]);  /* warm up and erase result buffer */
  118     }   }
  119 
  120     /* benchmark */
  121     {   UTIL_time_t const clockStart = UTIL_getTime();
  122         unsigned loopNb, blockNb;
  123         if (p.initFn != NULL) p.initFn(p.initPayload);
  124         for (loopNb = 0; loopNb < nbLoops; loopNb++) {
  125             for (blockNb = 0; blockNb < p.blockCount; blockNb++) {
  126                 size_t const res = p.benchFn(p.srcBuffers[blockNb], p.srcSizes[blockNb],
  127                                    p.dstBuffers[blockNb], p.dstCapacities[blockNb],
  128                                    p.benchPayload);
  129                 if (loopNb == 0) {
  130                     if (p.blockResults != NULL) p.blockResults[blockNb] = res;
  131                     if ((p.errorFn != NULL) && (p.errorFn(res))) {
  132                         RETURN_QUIET_ERROR(BMK_runOutcome_error(res),
  133                             "Function benchmark failed on block %u (of size %u) with error %i",
  134                             blockNb, (unsigned)p.srcSizes[blockNb], (int)res);
  135                     }
  136                     dstSize += res;
  137             }   }
  138         }  /* for (loopNb = 0; loopNb < nbLoops; loopNb++) */
  139 
  140         {   PTime const totalTime = UTIL_clockSpanNano(clockStart);
  141             BMK_runTime_t rt;
  142             rt.nanoSecPerRun = (double)totalTime / nbLoops;
  143             rt.sumOfReturn = dstSize;
  144             return BMK_setValid_runTime(rt);
  145     }   }
  146 }
  147 
  148 
  149 /* ====  Benchmarking any function, providing intermediate results  ==== */
  150 
  151 struct BMK_timedFnState_s {
  152     PTime timeSpent_ns;
  153     PTime timeBudget_ns;
  154     PTime runBudget_ns;
  155     BMK_runTime_t fastestRun;
  156     unsigned nbLoops;
  157     UTIL_time_t coolTime;
  158 };  /* typedef'd to BMK_timedFnState_t within bench.h */
  159 
  160 BMK_timedFnState_t* BMK_createTimedFnState(unsigned total_ms, unsigned run_ms)
  161 {
  162     BMK_timedFnState_t* const r = (BMK_timedFnState_t*)malloc(sizeof(*r));
  163     if (r == NULL) return NULL;   /* malloc() error */
  164     BMK_resetTimedFnState(r, total_ms, run_ms);
  165     return r;
  166 }
  167 
  168 void BMK_freeTimedFnState(BMK_timedFnState_t* state) { free(state); }
  169 
  170 BMK_timedFnState_t*
  171 BMK_initStatic_timedFnState(void* buffer, size_t size, unsigned total_ms, unsigned run_ms)
  172 {
  173     typedef char check_size[ 2 * (sizeof(BMK_timedFnState_shell) >= sizeof(struct BMK_timedFnState_s)) - 1];  /* static assert : a compilation failure indicates that BMK_timedFnState_shell is not large enough */
  174     typedef struct { check_size c; BMK_timedFnState_t tfs; } tfs_align;  /* force tfs to be aligned at its next best position */
  175     size_t const tfs_alignment = offsetof(tfs_align, tfs); /* provides the minimal alignment restriction for BMK_timedFnState_t */
  176     BMK_timedFnState_t* const r = (BMK_timedFnState_t*)buffer;
  177     if (buffer == NULL) return NULL;
  178     if (size < sizeof(struct BMK_timedFnState_s)) return NULL;
  179     if ((size_t)buffer % tfs_alignment) return NULL;  /* buffer must be properly aligned */
  180     BMK_resetTimedFnState(r, total_ms, run_ms);
  181     return r;
  182 }
  183 
  184 void BMK_resetTimedFnState(BMK_timedFnState_t* timedFnState, unsigned total_ms, unsigned run_ms)
  185 {
  186     if (!total_ms) total_ms = 1 ;
  187     if (!run_ms) run_ms = 1;
  188     if (run_ms > total_ms) run_ms = total_ms;
  189     timedFnState->timeSpent_ns = 0;
  190     timedFnState->timeBudget_ns = (PTime)total_ms * TIMELOOP_NANOSEC / 1000;
  191     timedFnState->runBudget_ns = (PTime)run_ms * TIMELOOP_NANOSEC / 1000;
  192     timedFnState->fastestRun.nanoSecPerRun = (double)TIMELOOP_NANOSEC * 2000000000;  /* hopefully large enough : must be larger than any potential measurement */
  193     timedFnState->fastestRun.sumOfReturn = (size_t)(-1LL);
  194     timedFnState->nbLoops = 1;
  195     timedFnState->coolTime = UTIL_getTime();
  196 }
  197 
  198 /* Tells if nb of seconds set in timedFnState for all runs is spent.
  199  * note : this function will return 1 if BMK_benchFunctionTimed() has actually errored. */
  200 int BMK_isCompleted_TimedFn(const BMK_timedFnState_t* timedFnState)
  201 {
  202     return (timedFnState->timeSpent_ns >= timedFnState->timeBudget_ns);
  203 }
  204 
  205 
  206 #undef MIN
  207 #define MIN(a,b)   ( (a) < (b) ? (a) : (b) )
  208 
  209 #define MINUSABLETIME  (TIMELOOP_NANOSEC / 2)  /* 0.5 seconds */
  210 
  211 BMK_runOutcome_t BMK_benchTimedFn(BMK_timedFnState_t* cont,
  212                                   BMK_benchParams_t p)
  213 {
  214     PTime const runBudget_ns = cont->runBudget_ns;
  215     PTime const runTimeMin_ns = runBudget_ns / 2;
  216     int completed = 0;
  217     BMK_runTime_t bestRunTime = cont->fastestRun;
  218 
  219     while (!completed) {
  220         BMK_runOutcome_t const runResult = BMK_benchFunction(p, cont->nbLoops);
  221 
  222         if(!BMK_isSuccessful_runOutcome(runResult)) { /* error : move out */
  223             return runResult;
  224         }
  225 
  226         {   BMK_runTime_t const newRunTime = BMK_extract_runTime(runResult);
  227             double const loopDuration_ns = newRunTime.nanoSecPerRun * cont->nbLoops;
  228 
  229             cont->timeSpent_ns += (unsigned long long)loopDuration_ns;
  230 
  231             /* estimate nbLoops for next run to last approximately 1 second */
  232             if (loopDuration_ns > (runBudget_ns / 50)) {
  233                 double const fastestRun_ns = MIN(bestRunTime.nanoSecPerRun, newRunTime.nanoSecPerRun);
  234                 cont->nbLoops = (unsigned)(runBudget_ns / fastestRun_ns) + 1;
  235             } else {
  236                 /* previous run was too short : blindly increase workload by x multiplier */
  237                 const unsigned multiplier = 10;
  238                 assert(cont->nbLoops < ((unsigned)-1) / multiplier);  /* avoid overflow */
  239                 cont->nbLoops *= multiplier;
  240             }
  241 
  242             if(loopDuration_ns < runTimeMin_ns) {
  243                 /* don't report results for which benchmark run time was too small : increased risks of rounding errors */
  244                 assert(completed == 0);
  245                 continue;
  246             } else {
  247                 if(newRunTime.nanoSecPerRun < bestRunTime.nanoSecPerRun) {
  248                     bestRunTime = newRunTime;
  249                 }
  250                 completed = 1;
  251             }
  252         }
  253     }   /* while (!completed) */
  254 
  255     return BMK_setValid_runTime(bestRunTime);
  256 }

Cache object: dd2350a5a66c56caede780fd019d81a7


[ source navigation ] [ diff markup ] [ identifier search ] [ freetext search ] [ file search ] [ list types ] [ track identifier ]


This page is part of the FreeBSD/Linux Linux Kernel Cross-Reference, and was automatically generated using a modified version of the LXR engine.