Fleet  0.0.9
Inference in the LOT
ChainPool.h
#pragma once

#include <thread>

//#define DEBUG_CHAINPOOL

#include <vector>

#include "Errors.h"
#include "MCMCChain.h"
#include "Timing.h"
#include "ThreadedInferenceInterface.h"
#include "OrderedLock.h"

template<typename HYP, typename Chain_t=MCMCChain<HYP>>
class ChainPool : public ThreadedInferenceInterface<HYP> {
public:

    // the pool stores a bunch of chains
    std::vector<Chain_t> pool;

    // this parameter defines how many steps a thread spends on each chain before switching to another.
    // NOTE: it interacts with the ParallelTempering swap/adapt values (if it is too small, then
    // we won't have time to update every chain before proposing more swaps).
    // NOTE: It seems better to set steps rather than time, because the hot chains typically run *much*
    // faster than the cold chains. This means that if you set it by time, you end up spending lots of
    // time on the bad chains, which is the opposite of what you want. Actually, we should probably
    // run for *fewer* samples on the hot chains because they are faster to sample from.
    // Also note that due to multithreading this is a little complex: we can't perfectly control the
    // number of samples each chain gets.
    unsigned long steps_before_change = 100;
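    // Illustrative note (a sketch added here, not from the original file): with 10 chains,
    // steps_before_change=100, and a single worker thread, each chain gets a 100-step chunk
    // roughly once every 1000 total steps; adding worker threads shortens that cycle, and
    // lowering steps_before_change interleaves the chains more finely.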

    // Store which chains are running and which are done
    enum class RunningState {READY, RUNNING, DONE};

    // keep track of which chains are currently running (indexed like pool)
    std::vector<RunningState> running;

    // lock guarding modifications to pool and running
    OrderedLock running_lock;

    ChainPool() {}

    ChainPool(HYP& h0, typename HYP::data_t* d, size_t n) {
        assert(n >= 1 && "*** You probably shouldn't have a chain pool with 0 elements");
        for(size_t i=0;i<n;i++) {
            add_chain(i==0 ? h0 : h0.restart(), d);
        }
    }
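
    // Usage sketch (not from the original file; MyHypothesis and mydata are placeholder
    // names): construct a pool of restarted copies of h0 and run it via the inherited
    // ThreadedInferenceInterface::run, which yields samples coming from all of the chains.
    //
    //   MyHypothesis h0;
    //   ChainPool<MyHypothesis> pool(h0, &mydata, 4);      // 4 chains on the same data
    //   Control ctl;  ctl.steps = 10000;  ctl.nthreads = 2;
    //   for(auto& h : pool.run(ctl)) { /* process each yielded sample h */ }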

    /// Set this data on every chain in the pool.
    void set_data(typename HYP::data_t* d, bool recompute=true) {
        for(auto& c : pool) {
            c.set_data(d, recompute);
        }
    }

    /// Lock and modify the pool: add a new chain, forwarding args to the Chain_t constructor.
    template<typename... ARGS>
    void add_chain(ARGS... args) {

        std::lock_guard guard(running_lock);

        pool.emplace_back(args...);
        running.push_back(RunningState::READY);
    }
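
    // Usage sketch (not from the original file): the arguments are forwarded to the Chain_t
    // (by default MCMCChain<HYP>) constructor, so adding another chain on the same data
    // might look like:
    //
    //   pool.add_chain(h0.restart(), &mydata);   // h0, mydata as in the sketch above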

    size_t nchains() const {
        return pool.size();
    }

    void show(std::string prefix) const {
        for(size_t i=0;i<nchains();i++) {
            std::lock_guard guard(this->pool[i].current_mutex);
            print(prefix, i, (double)this->pool[i].temperature, this->pool[i].getCurrent().posterior, this->pool[i].getCurrent());
        }
    }

    /// This run helper is called internally by multiple different threads, and runs a given pool of chains.
    generator<HYP&> run_thread(Control& ctl) override {

        assert(pool.size() > 0 && "*** Cannot run on an empty ChainPool");
        assert(this->nthreads() <= pool.size() && "*** Cannot have more threads than pool items");

        // We have to manage subthreads pretty differently depending on whether we have a time or a
        // sample constraint. For now, we assume we can't have both.

        // Here we don't care about being precise about the number of steps
        // (below we do)

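        // Scheduling overview (summary comment added for clarity): each worker thread loops,
        // picking the next chain via next_index() and skipping chains that are not READY,
        // marks that chain RUNNING, runs it for a chunk of steps while yielding each sample
        // tagged with born_chain_idx, and then marks the chain READY again (or DONE once the
        // total step budget is exhausted) so another thread can pick it up.
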
        if(ctl.steps == 0) {
            // we end up here if steps==0; if runtime is also 0, we are running until CTRL_C

            while( ctl.running() and (not CTRL_C) ) {
                // find the next open chain
                size_t idx;
                {
                    std::lock_guard guard(running_lock);

                    do {
                        idx = this->next_index() % pool.size();
                    } while( running[idx] != RunningState::READY ); // so we exit on a READY idx
                    running[idx] = RunningState::RUNNING; // say I'm running this one
                }

                // Actually run and yield, being sure to save where everything came from
                Control c = ctl; // make a copy of everything in control
                c.steps = steps_before_change; c.nthreads = 1; c.runtime = 0; // but update to run just this chunk on one thread
                for(auto x : pool[idx].run(c)) {
                    x.born_chain_idx = idx; // set this
                    co_yield x;
                }

                // and free this lock space
                {
                    std::lock_guard guard(running_lock);

                    ctl.done_steps += steps_before_change-1; // -1 because calling ctl.running adds one

                    running[idx] = RunningState::READY;
                }
            }

        }
        else { // ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~

            assert(ctl.runtime == 0 && "*** Cannot have both time and steps specified in ChainPool (not implemented yet).");

            // note that in these while loops we don't use ctl.running(), because we need everything
            // we start to actually finish (or else we won't run enough steps)
            while( ctl.done_steps < ctl.steps and (not CTRL_C) ) {

                // find the next open chain
                size_t idx;
                unsigned long to_run_steps = 0;
                {
                    std::lock_guard guard(running_lock);

                    do {
                        idx = this->next_index() % pool.size();
                    } while( running[idx] != RunningState::READY ); // so we exit on a READY idx
                    running[idx] = RunningState::RUNNING; // say I'm running this one

                    to_run_steps = std::min(ctl.steps-ctl.done_steps, this->steps_before_change);

                    // exit here if there is nothing else to do
                    if(to_run_steps <= 0) {
                        break;
                    }

                    // now update ctl's number of steps
                    // NOTE if we do this here, we'll stop too early; if we do it later, we'll run too many...
                    // hmm.... Need a more complex solution it seems...
                    ctl.done_steps += to_run_steps;

//                  print(">>", idx, ctl.steps, ctl.done_steps, to_run_steps, this->steps_before_change);
                }
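
                // Worked example (comment added for clarity): with ctl.steps = 250 and
                // steps_before_change = 100, worker threads claim chunks of 100, 100, and 50 steps;
                // ctl.done_steps reaches 250 as soon as the last chunk is claimed, even though
                // that chunk is still running, which is the imprecision noted in the comment above.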

                // Actually run and yield, being sure to save where everything came from
                Control c = ctl; // make a copy of everything in control
                c.steps = to_run_steps; c.nthreads = 1; c.runtime = 0; // but update to run just this chunk on one thread
                for(auto& x : pool[idx].run(c)) {
                    x.born_chain_idx = idx; // set this
                    co_yield x;
                }

                #ifdef DEBUG_CHAINPOOL
                COUT "# Thread " << std::this_thread::get_id() << " stopping chain " << idx TAB "at " TAB pool[idx].getCurrent().posterior TAB pool[idx].getCurrent().string() ENDL;
                #endif

                // and free this lock space
                {
                    std::lock_guard guard(running_lock);

                    // If we ran a full chunk, this chain may have more work to do, so mark it READY;
                    // otherwise we just consumed the last remaining steps and this chain is DONE.
                    if(to_run_steps == steps_before_change) {
                        running[idx] = RunningState::READY;
                    }
                    else {
                        running[idx] = RunningState::DONE; // this chain has finished its share of steps
                    }
                }
            }

        }

    }

};