Mercury Currency Engine
threadpool.hpp
//SPDX-License-Identifier: Apache-2.0
//Author: Blayne Dennis

#ifndef __MERCURY_COROUTINE_ENGINE_THREADPOOL__
#define __MERCURY_COROUTINE_ENGINE_THREADPOOL__

// c
#include <limits.h>

// c++
#include <vector>
#include <mutex>
#include <thread>
#include <iostream>
#include <algorithm>
#include <memory>

// local
#include "function_utility.hpp"
#include "timer.hpp"
#include "scheduler.hpp"

namespace mce {

struct threadpool;

namespace detail {

mce::threadpool*& tl_this_threadpool();

}

/// an object which manages a set of worker threads, each continuously executing a scheduler
struct threadpool : public lifecycle, protected lifecycle::implementation
{
    /// construct an allocated threadpool with a count of worker threads
    static inline std::shared_ptr<threadpool> make(size_t worker_count = 0)
    {
        threadpool* tpp = new threadpool(worker_count);
        std::shared_ptr<threadpool> tp(tpp);
        tpp->self_wptr_ = tp;
        tp->init_();
        return tp;
    }

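    /*
     Usage sketch (illustrative, not part of the original header): construct a
     threadpool, schedule a coroutine on its least busy worker, then shut it
     down through the inherited lifecycle API.

         auto tp = mce::threadpool::make(4); // 4 worker threads
         tp->worker().schedule([]{ std::cout << "hello from a worker" << std::endl; });
         tp->halt(); // halt(), join() and delete all workers
    */
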
    /// halt(), join() and delete all workers
    virtual ~threadpool() { }

    /// return the count of worker threads
    inline size_t size() const { return workers_schedulers_.size(); }

    /// access the scheduler for a worker at a given index
    inline scheduler& worker(size_t idx) const
    {
        return *(workers_schedulers_[idx]);
    }

    /// return the least busy worker scheduler at time of call
    inline scheduler& worker()
    {
        const size_t start_idx = current_scheduler_idx_();
        auto sz = workers_schedulers_.size();
        size_t i = start_idx;
        size_t end = sz; // end is our 'break out of loop' index
        auto least_weight = workers_schedulers_[i]->measure();
        scheduler* ret = workers_schedulers_[i];
        bool found_empty = false;

        ++i; // start comparisons at the index after start_idx

        auto compare = [&]
        {
            for(; i<end; ++i)
            {
                // acquire the current scheduling load of a scheduler
                auto cur_weight = workers_schedulers_[i]->measure();

                if(cur_weight)
                {
                    if(cur_weight < least_weight)
                    {
                        // update return value
                        least_weight = cur_weight;
                        ret = workers_schedulers_[i];
                    }
                }
                else
                {
                    // end iteration early if we find an empty scheduler
                    found_empty = true;
                    ret = workers_schedulers_[i];
                    break;
                }
            }
        };

        compare();

        // if we didn't find a 0 weight scheduler and our start_idx > 0
        if(!found_empty && start_idx)
        {
            i = 0; // rotate back around to 0
            end = start_idx; // our new end is our original beginning
            compare();
        }

        return *ret;
    }

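    /*
     Selection sketch: suppose three workers measure() to weights {4, 0, 2} and
     the rotating start index is 0. The scan stops at index 1 immediately,
     because an empty scheduler can accept work without competing with already
     scheduled coroutines. With weights {4, 3, 2} no worker is empty, so the
     full scan returns the worker at index 2, the least burdened one.
    */
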
    /// return a vector containing a shared_ptr to every worker scheduler
    inline std::vector<std::shared_ptr<scheduler>> workers()
    {
        std::vector<std::shared_ptr<scheduler>> ret(workers_schedulers_.size());

        std::transform(
            workers_schedulers_.begin(),
            workers_schedulers_.end(),
            ret.begin(),
            [](scheduler* sch){ return (std::shared_ptr<scheduler>)(*sch); }
        );

        return ret;
    }

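    /*
     Usage sketch (illustrative; `some_task` is a hypothetical callable, and
     the lifetime extension assumes the shared_ptr conversion shares ownership
     of each scheduler): the snapshot remains valid even if the threadpool is
     halted while it is held.

         auto snapshot = tp->workers();
         for(auto& sch : snapshot) { sch->schedule(some_task); }
    */
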
    /// return a shared_ptr to this threadpool
    inline operator std::shared_ptr<threadpool>() { return self_wptr_.lock(); }

protected:
    // return the workers' state
    inline lifecycle::state get_state_impl()
    {
        std::lock_guard<mce::spinlock> lk(lk_);

        auto lf = (lifecycle::implementation*)(workers_schedulers_.front());

        // state should be the same on all workers
        return lf->get_state_impl();
    }

    // suspend all workers, returning true if suspend() == true for every worker, else false
    inline bool suspend_impl()
    {
        bool ret = true;

        std::lock_guard<mce::spinlock> lk(lk_);

        for(auto& sch : workers_schedulers_)
        {
            // evaluate suspend_impl() first so that every worker is suspended
            // even if an earlier worker failed to suspend
            ret = ((lifecycle::implementation*)sch)->suspend_impl() && ret;
        }

        return ret;
    }

    // resume all workers
    inline void resume_impl()
    {
        std::lock_guard<mce::spinlock> lk(lk_);

        for(auto& sch : workers_schedulers_)
        {
            ((lifecycle::implementation*)sch)->resume_impl();
        }
    }

    // halt all workers and join their threads
    inline void halt_impl()
    {
        std::lock_guard<mce::spinlock> lk(lk_);

        for(auto& worker : workers_memory_)
        {
            auto lf = (lifecycle::implementation*)(worker->sch.get());

            if(lf->get_state_impl() != lifecycle::state::halted)
            {
                lf->halt_impl();
                worker->thd.join();
            }
        }
    }

private:
    // memory for a worker's scheduler and the thread which runs it
    struct worker_thread
    {
        std::shared_ptr<scheduler> sch;
        std::thread thd;

        worker_thread(std::shared_ptr<threadpool> tp) :
            sch(scheduler::make(tp.get())),
            thd([tp,this]() mutable
            {
                // publish the owning threadpool to this thread's thread_local
                // pointer, restoring the previous value when run() returns
                auto& tl_tp = detail::tl_this_threadpool();
                auto parent_tp = tl_tp;
                tl_tp = tp.get();

                try { while(this->sch->run()){ } }
                catch(...)
                {
                    tl_tp = parent_tp;
                    std::rethrow_exception(std::current_exception());
                }

                tl_tp = parent_tp;
            })
        { }

        worker_thread() = delete;
        worker_thread(worker_thread&&) = delete;

        ~worker_thread()
        {
            auto lf = (lifecycle::implementation*)(sch.get());

            if(lf->get_state_impl() != lifecycle::state::halted)
            {
                lf->halt_impl();
            }

            if(thd.joinable()) { thd.join(); }
        }
    };

    threadpool(size_t worker_count) :
        lifecycle(this),
        workers_memory_(
            [=]() mutable -> size_t
            {
                if(worker_count == 0)
                {
                    worker_count = std::thread::hardware_concurrency();

                    // enforce a minimum of 1 worker thread
                    if(worker_count == 0) { worker_count = 1; }
                }

                return worker_count;
            }()),
        workers_schedulers_(workers_memory_.size())
    { }

    // separate worker init from the constructor so the self shared_ptr can be set up
    inline void init_()
    {
        auto self = self_wptr_.lock();
        auto it = workers_schedulers_.begin();

        // initialize worker threads; no synchronization is needed because no
        // operations are scheduled on the schedulers until threadpool::make()
        // returns
        for(auto& w : workers_memory_)
        {
            w = std::unique_ptr<worker_thread>(new worker_thread(self));
            *it = w->sch.get();
            ++it;
        }
    }

    // return the index of the worker we should measure() first
    inline size_t current_scheduler_idx_()
    {
        std::lock_guard<mce::spinlock> lk(lk_);

        auto ret = current_scheduler_idx_val_;

        // rotate the current scheduler index to limit lock contention
        if((current_scheduler_idx_val_+1) < workers_memory_.size())
        {
            ++current_scheduler_idx_val_;
        }
        else
        {
            current_scheduler_idx_val_ = 0;
        }

        return ret;
    }

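    /*
     Rotation sketch: with 3 workers, successive calls return start indexes
     0, 1, 2, 0, 1, ... so that worker() begins its measure() scan at a
     different scheduler each time, spreading lock acquisitions evenly across
     the pool.
    */
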
    // as a general rule, anything relying on access to lk_ should not block
    // on anything else for the duration of the lock
    mce::spinlock lk_;

    // avoid circular shared memory structures through a weak_ptr
    std::weak_ptr<threadpool> self_wptr_;

    // This vector never changes post initialization until the threadpool is
    // destroyed. The fact that this vector doesn't change which worker is
    // stored at what index is important to ensure that calls to
    // `worker(size_t)` are consistent.
    //
    // Because this vector never changes until the threadpool is destroyed, it
    // can be read without a lock. However, a lock may be required for
    // synchronized calls to scheduler operations.
    std::vector<std::unique_ptr<worker_thread>> workers_memory_;

    // A vector of schedulers. This vector is not changed between
    // initialization and destruction; it can be read without a lock.
    std::vector<scheduler*> workers_schedulers_;

    // value which wraps back around to 0 when incremented past the worker
    // count, used to limit lock contention by spreading measure() calls
    // equally among all schedulers
    size_t current_scheduler_idx_val_ = 0;
};

/// return true if the calling context is running in a threadpool
inline bool in_threadpool()
{
    return detail::tl_this_threadpool();
}

/// return a reference to the threadpool the calling code is executing in
inline threadpool& this_threadpool()
{
    return *detail::tl_this_threadpool();
}
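
/*
 Usage sketch (illustrative; `task` is a hypothetical callable):

     if(mce::in_threadpool())
     {
         // schedule more work on the least busy worker of the current pool
         mce::this_threadpool().worker().schedule(task);
     }
*/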

/// return the default threadpool
threadpool& default_threadpool();

/// return true if default_threadpool() can be safely called, else false
bool default_threadpool_enabled();

/// return the balance ratio, set by compiler define: MCEBALANCERATIO
double balance_ratio();

namespace detail {

// return a consistently selected, arbitrary scheduler from the default threadpool
scheduler& default_threadpool_scheduler();

inline scheduler& concurrent_algorithm()
{
    return in_scheduler()
        ? this_scheduler()
        : default_threadpool_scheduler();
}

inline scheduler& parallel_algorithm()
{
    return in_threadpool()
        ? this_threadpool().worker()
        : default_threadpool().worker();
}

inline scheduler& balance_algorithm()
{
    if(in_threadpool())
    {
        scheduler* least_sch;

        // return true if the workload is imbalanced, else false
        auto imbalanced = [&]() -> bool
        {
            auto& tp = this_threadpool();
            size_t sz = tp.size();

            // workload of the least burdened scheduler found so far
            scheduler::measurement least;

            // workload of the most burdened scheduler found so far
            scheduler::measurement most;

            {
                auto& sch = tp.worker(0);

                least_sch = &(sch);
                least = sch.measure();
                most = least;
            }

            // begin on index 1, we've already taken 0
            for(size_t i=1; i<sz; ++i)
            {
                auto& sch = tp.worker(i);
                scheduler::measurement weight = sch.measure();

                if(weight < least)
                {
                    least_sch = &(sch);
                    least = weight;
                }
                else if(weight > most) { most = weight; }
            }

            // returns true if the ratio between the workloads is greater than
            // or equal to balance_ratio()
            auto past_limit = [](size_t lhs, size_t rhs) -> bool
            {
                // cast to long double for a floating point division
                return (static_cast<long double>(lhs) / rhs) >= balance_ratio();
            };

            return past_limit(most.scheduled(), least.scheduled());
        };

        return imbalanced()
            ? *least_sch // select the least burdened scheduler
            // select the current thread's scheduler
            : this_scheduler();
    }
    else { return default_threadpool().worker(); }
}
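
/*
 Worked example (the 2.0 threshold below is hypothetical; the real value comes
 from the MCEBALANCERATIO compiler define): if balance_ratio() == 2.0 and the
 most burdened worker has 8 scheduled coroutines while the least burdened has
 3, then 8.0 / 3 is roughly 2.67 >= 2.0, so the least burdened scheduler is
 returned. At 8 vs 5 the ratio is 1.6, and the calling thread's own scheduler
 is kept.
*/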

}

/// Launch user function and optional arguments as a coroutine running on a scheduler.
template <typename... As>
void concurrent(As&&... args)
{
    detail::concurrent_algorithm().schedule(std::forward<As>(args)...);
}

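/*
 Usage sketch (illustrative): launch a coroutine on the caller's scheduler if
 one exists, falling back to the default threadpool otherwise. Trailing
 arguments are forwarded to the callable by schedule().

     mce::concurrent([](int x){ std::cout << x << std::endl; }, 42);
*/
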
/// Launch user function and optional arguments as a coroutine running on a scheduler.
template <typename... As>
void parallel(As&&... args)
{
    detail::parallel_algorithm().schedule(std::forward<As>(args)...);
}

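/*
 Usage sketch (illustrative; `task_a` and `task_b` are hypothetical callables):
 unlike concurrent(), parallel() always targets a threadpool worker, so these
 two coroutines may execute on different system threads.

     mce::parallel(task_a);
     mce::parallel(task_b);
*/
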
/// Launch user function and optional arguments as a coroutine running on a scheduler,
/// preferring the least burdened worker when the threadpool's workload is imbalanced.
template <typename... As>
void balance(As&&... args)
{
    detail::balance_algorithm().schedule(std::forward<As>(args)...);
}

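/*
 Usage sketch (illustrative; `make_task` and `task_count` are hypothetical):
 like parallel(), but work only migrates off the calling worker when the
 pool's workload ratio reaches balance_ratio(), making it suitable for
 launching many coroutines from inside a threadpool without constant
 rebalancing.

     for(size_t i = 0; i < task_count; ++i) { mce::balance(make_task(i)); }
*/
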
}
#endif