doxy/microbenchmark_8hpp_source.html

 /*
   MICROBENCHMARK.hpp  -  multithreaded timing measurement

    Copyright (C)
      2018,            Hermann Vosseler <Ichthyostega@web.de>

   **Lumiera** is free software; you can redistribute it and/or modify it
   under the terms of the GNU General Public License as published by the
   Free Software Foundation; either version 2 of the License, or (at your
   option) any later version. See the file COPYING for further details.

 */


 #ifndef LIB_TEST_MICROBENCHMARK_H
 #define LIB_TEST_MICROBENCHMARK_H


 #include "lib/meta/function.hpp"
 #include "lib/scoped-collection.hpp"
 #include "lib/sync-barrier.hpp"
 #include "lib/thread.hpp"

 #include "lib/test/microbenchmark-adaptor.hpp"

 #include <chrono>


 namespace lib {
 namespace test{

   namespace {
     /** number of test-subject invocations used when the caller gives no repeat count */
     constexpr size_t DEFAULT_RUNS{10'000'000};

     /** ratio defining the time unit of all reported measurements: microseconds */
     using CLOCK_SCALE = std::micro;
   }


   /**
    * Helper to invoke a functor or lambda and observe its running time.
    * The given callable is invoked exactly once; the elapsed time is taken
    * from `std::chrono::steady_clock` immediately before and after that call.
    * @param invokeTestCode callable taking no arguments
    * @param repeatCnt divisor used to normalise the measured time; the callable
    *        is _not_ repeated by this function (microBenchmark passes the number
    *        of iterations its test loop performs internally)
    * @return elapsed time in units of CLOCK_SCALE, divided by `repeatCnt`
    * @warning `repeatCnt` is not checked against zero
    */
   template<class FUN>
   inline double
   benchmarkTime (FUN const& invokeTestCode, const size_t repeatCnt =1)
   {
     using std::chrono::steady_clock;
     using Dur = std::chrono::duration<double, CLOCK_SCALE>;

     auto start = steady_clock::now();
     invokeTestCode();
     Dur duration = steady_clock::now () - start;   // implicit conversion into floating-point CLOCK_SCALE ticks
     return duration.count() / repeatCnt;
   }


   /**
    * Benchmark building block: invoke a functor or lambda in a tight loop.
    * The test subject is first wrapped by `microbenchmark::adapted4benchmark`;
    * the wrapped subject is then called with each loop index `0 ... repeatCnt-1`
    * and its results are accumulated.
    * @param testSubject the functor or lambda to invoke repeatedly
    * @param repeatCnt number of invocations
    * @return sum of all values returned from the adapted test subject
    */
   template<class FUN>
   inline size_t
   benchmarkLoop (FUN const& testSubject, const size_t repeatCnt = DEFAULT_RUNS)
   {
     // adapted form of the subject: accepts the loop index, yields a checksum contribution
     auto adaptedSubject = microbenchmark::adapted4benchmark (testSubject);

     size_t sum{0};
     size_t idx{0};
     while (idx < repeatCnt)
       {
         sum += adaptedSubject(idx);
         ++idx;
       }
     return sum;
   }


   /**
    * Perform a simple looped microbenchmark.
    * Runs benchmarkLoop() on the test subject and measures the complete loop
    * with benchmarkTime(), which divides the elapsed time by `repeatCnt`.
    * @param testSubject the functor or lambda to benchmark
    * @param repeatCnt number of invocations within the timed loop
    * @return pair `(micros, checksum)`: averaged time per invocation in units
    *         of CLOCK_SCALE, and the checksum accumulated by the loop
    */
   template<class FUN>
   inline auto
   microBenchmark (FUN const& testSubject, const size_t repeatCnt = DEFAULT_RUNS)
   {
     // the loop result is stored into a volatile, presumably to keep the optimiser from discarding the loop
     volatile size_t resultSink{0};
     auto timedLoop = [&resultSink, &testSubject, repeatCnt]
                        {
                          resultSink = benchmarkLoop (testSubject, repeatCnt);
                        };
     const double microsPerCall = benchmarkTime (timedLoop, repeatCnt);
     return std::make_pair (microsPerCall, resultSink);
   }


   /**
    * Perform a multithreaded microbenchmark.
    * Creates `nThreads` threads, each holding its own copy of the adapted test subject
    * and invoking it `repeatCnt` times in a loop, passing the current loop index.
    * All test threads and the calling thread meet at a shared SyncBarrier before the
    * loops start; each thread measures only the duration of its own loop.
    * @tparam nThreads number of test threads to create
    * @param subject the functor or lambda to benchmark; wrapped by
    *        `microbenchmark::adapted4benchmark` before use
    * @param repeatCnt number of invocations performed by _each_ thread
    * @return tuple `(micros, checksum)`: the sum of all per-thread loop durations
    *         divided by `nThreads * repeatCnt`, in units of CLOCK_SCALE, and the
    *         sum of the checksums collected by all threads
    * @warning neither `nThreads` nor `repeatCnt` is checked against zero before
    *          the final division
    */
   template<size_t nThreads, class FUN>
   inline auto
   threadBenchmark(FUN const& subject, const size_t repeatCnt = DEFAULT_RUNS)
   {
     using std::chrono::steady_clock;
     using Dur = std::chrono::duration<double, CLOCK_SCALE>;

     // the test subject gets the current loop-index and returns a checksum value
     auto subject4benchmark = microbenchmark::adapted4benchmark (subject);
     using Subject = decltype(subject4benchmark);

     // Local thread type: runs the timed loop and stores its result in its own members
     struct Thread
       : lib::ThreadJoinable<>
       {
         Thread(Subject const& subject, size_t loopCnt, SyncBarrier& testStart)
           : ThreadJoinable{"Micro-Benchmark"
                           ,[this,loopCnt, testSubject=subject, &testStart]
                            () mutable              // local (mutable) copy of the test-subject-Functor
                              {
                                testStart.sync();   // block until all threads are ready
                                auto start = steady_clock::now();
                                for (size_t i=0; i < loopCnt; ++i)
                                  checksum += testSubject(i);
                                duration = steady_clock::now () - start;
                              }}
           { }
                              // Note: barrier at begin and join at end both ensure data synchronisation
                              // NOTE(review): the base class is initialised before the members below; presumably
                              //               the thread may already be running then, yet it touches these members
                              //               only after passing the barrier -- confirm against thread.hpp
         Dur duration{};      // measured time within thread
         size_t checksum{0};  // collected checksum
       };

     SyncBarrier testStart{nThreads + 1};           // coordinated start of timing measurement (test threads + this thread)
     lib::ScopedCollection<Thread> threads(nThreads);
     for (size_t n=0; n<nThreads; ++n)              // create test threads
       threads.emplace (subject4benchmark, repeatCnt, testStart);

     testStart.sync();                              // barrier until all threads are ready

     size_t checksum{0};
     Dur sumDuration{0.0};
     for (auto& thread : threads)
       {
         thread.join();                             // block on measurement end (fence)
         sumDuration += thread.duration;
         checksum    += thread.checksum;
       }

     // average over all invocations performed by all threads
     double micros = sumDuration.count() / (nThreads * repeatCnt);
     return std::make_tuple (micros, checksum);
   }


 }} // namespace lib::test
 #endif /*LIB_TEST_MICROBENCHMARK_H*/
lib::ThreadJoinable
Variant of the standard case, which requires the caller to wait for the termination of this thread and join() it...
Definition: thread.hpp:668

lib::test::threadBenchmark
auto threadBenchmark(FUN const &subject, const size_t repeatCnt=DEFAULT_RUNS)
perform a multithreaded microbenchmark.
Definition: microbenchmark.hpp:147

lib::ScopedCollection
A fixed collection of non-copyable polymorphic objects.
Definition: scoped-collection.hpp:94

test
Definition: run.hpp:40

lib::ScopedCollection::emplace
TY & emplace(ARGS &&...args)
push new entry at the end of this container and build object of type TY in place there ...
Definition: scoped-collection.hpp:306

lib
Implementation namespace for support and library code.
Definition: common-services.cpp:54

microbenchmark-adaptor.hpp
Helpers and wrappers to simplify usage of microbenchmark.hpp.

lib::test::microBenchmark
auto microBenchmark(FUN const &testSubject, const size_t repeatCnt=DEFAULT_RUNS)
perform a simple looped microbenchmark.
Definition: microbenchmark.hpp:118

scoped-collection.hpp
Managing a collection of non-copyable polymorphic objects in compact storage.

lib::test::benchmarkTime
double benchmarkTime(FUN const &invokeTestCode, const size_t repeatCnt=1)
Helper to invoke a functor or λ to observe its running time.
Definition: microbenchmark.hpp:76

function.hpp
Metaprogramming tools for transforming functor types.

thread.hpp
Convenience front-end to simplify and codify basic thread handling.

lib::SyncBarrier
A one-time N-fold mutual synchronisation barrier.
Definition: sync-barrier.hpp:64

lib::Thread
A thin convenience wrapper to simplify thread-handling.
Definition: thread.hpp:648

lib::test::benchmarkLoop
size_t benchmarkLoop(FUN const &testSubject, const size_t repeatCnt=DEFAULT_RUNS)
Benchmark building block to invoke a functor or λ in a tight loop, passing the current loop index and...
Definition: microbenchmark.hpp:95

sync-barrier.hpp
An N-fold synchronisation latch using yield-wait until fulfilment.