Fleet  0.0.9
Inference in the LOT
ThreadedInferenceInterface.h
Go to the documentation of this file.
1 #pragma once
2 
3 
4 #include <atomic>
5 #include <mutex>
6 #include <thread>
7 
8 #include "Control.h"
9 #include "SampleStreams.h"
10 #include "ConcurrentQueue.h"
11 
template<typename X, typename... Args>
// NOTE(review): the class declaration line itself (class ThreadedInferenceInterface ...)
// and the declaration of the to_yield member (a ConcurrentQueueRing<X>, judging from
// the constructor initializer below) are not visible in this extract.
public:

	// Subclasses must implement run_thread, which is what each individual thread
	// gets called on (and each thread manages its own locks etc). It is a coroutine
	// generator: each produced X& is one sample/item for the consumer.
	virtual generator<X&> run_thread(Control& ctl, Args... args) = 0;

	// index here is used to index into larger parallel collections. Each thread
	// is expected to get its next item to work on through index, though how will vary
	std::atomic<size_t> index;

	// How many threads? Used by some subclasses as asserts; set by run() from ctl.nthreads
	size_t __nthreads;
	std::atomic<size_t> __nrunning; // count of live workers; each decrements it when done, run() polls it to know when to stop draining

	// Construct with zeroed counters; to_yield's capacity comes from FleetArgs::nthreads
	ThreadedInferenceInterface() : index(0), __nthreads(0), __nrunning(0), to_yield(FleetArgs::nthreads) { }
45  unsigned long next_index() { return index++; }
46 
51  size_t nthreads() { return __nthreads; }
52 
60  void run_thread_generator_wrapper(size_t thr, Control& ctl, Args... args) {
61 
62  for(auto& x : run_thread(ctl, args...)) {
63 
64  if(x.born_chain_idx == 0 or not FleetArgs::yieldOnlyChainOne) {
65  to_yield.push(x, thr);
66 
67  }
68 
69  if(CTRL_C) break;
70  }
71 
72  // we always notify when we're done, after making sure we're not running or else the
73  // other thread can block
74  __nrunning--;
75  }
76 
	// Set up ctl.nthreads worker threads (each running run_thread via
	// run_thread_generator_wrapper), then co_yield samples out of to_yield as
	// the workers push them, draining the queue and joining all workers before
	// returning. Note ctl is taken by value: each call gets its own copy.
	generator<X&> run(Control ctl, Args... args) {

		std::vector<std::thread> threads(ctl.nthreads);
		__nthreads = ctl.nthreads; // save this for children
		assert(__nrunning==0); // no workers from a previous run may still be active

		// Make a new control to run on each thread and then pass this to
		// each subthread. This way multiple threads all share the same control
		// which is required for getting an accurate total count
		Control ctl2 = ctl;
		ctl2.nthreads = 1;
		ctl2.start();

		// give this just some extra space here
		//to_yield.resize(FleetArgs::MCMC_QUEUE_MULTIPLIER*ctl.nthreads); // just some extra space here

		// start each thread; __nrunning is incremented here (not inside the
		// worker) so the drain loop below cannot observe a zero count before a
		// slow worker has even started
		for(unsigned long thr=0;thr<ctl.nthreads;thr++) {
			++__nrunning;
			threads[thr] = std::thread(&ThreadedInferenceInterface<X, Args...>::run_thread_generator_wrapper, this, thr, std::ref(ctl2), args...);
		}

		// now yield as long as we have some that are running
		while(__nrunning > 0 and !CTRL_C) { // we don't want to stop when it's empty because a thread might fill it
//			if(not to_yield.empty()) { // w/o this we might pop when its empty...
//				//print((size_t)to_yield.push_idx, (size_t)to_yield.pop_idx, to_yield.size(), to_yield.N);
//				co_yield to_yield.pop();
//			}
			if(not to_yield.empty()) {
				auto val = to_yield.pop(); // pop() returns a std::optional<X>
				// NOTE(review): val is a local copy, yet we co_yield X& -- the
				// reference is only valid until the next resume; confirm callers
				// never retain it across iterations
				if(val.has_value()) co_yield val.value();
				else break; // empty optional signals shutdown (presumably CTRL_C inside pop -- verify in ConcurrentQueue.h)
			}

		}

		// now we're done filling but we still may have stuff in the queue;
		// some threads may be waiting (blocked on a full queue) so we can't join yet
		while(not to_yield.empty()) {
			auto val = to_yield.pop(); // drain whatever the workers left behind
			if(val.has_value()) co_yield val.value();
			else break; // NOTE: we might break here and leave some in queue -- but we only get break on CTRL_C
		}

		// wait for all to complete
		for(auto& t : threads)
			t.join();

	}
131 
132  generator<X&> unthreaded_run(Control ctl, Args... args) {
133 
134  // This is a simple version where we don't use threads -- useful
135  // because it's hard to debug otherwise
136 
137  std::cerr << "*** Warning running unthreaded_run (intended for debugging)" << std::endl;
138  ctl.start();
139  for(auto& x : run_thread(ctl, args...)) {
140  if(CTRL_C) break; // must come first or else we yield something invalid
141 
142  auto val = to_yield.pop(); // search through until we find one
143  if(val.has_value()) co_yield val.value();
144  else break;
145  }
146  }
147 
148 };
149 
150 
void push(const T &item, size_t thr)
Definition: ConcurrentQueue.h:116
virtual generator< X & > run_thread(Control &ctl, Args... args)=0
bool empty()
Definition: ConcurrentQueue.h:137
size_t nthreads()
How many threads are currently run in this interface?
Definition: ThreadedInferenceInterface.h:51
A concurrent queue class that allows multiple threads to push and consume. Note that this has a fixed...
volatile sig_atomic_t CTRL_C
void start()
Definition: Control.h:54
Definition: Control.h:23
bool yieldOnlyChainOne
Definition: FleetArgs.h:56
std::atomic< size_t > __nrunning
Definition: ThreadedInferenceInterface.h:35
ThreadedInferenceInterface()
Definition: ThreadedInferenceInterface.h:39
Definition: generator.hpp:21
unsigned long next_index()
Return the next index to operate on (in a thread-safe way).
Definition: ThreadedInferenceInterface.h:45
void run_thread_generator_wrapper(size_t thr, Control &ctl, Args... args)
We have to wrap run_thread in something that manages the sync with main. This really just synchronize...
Definition: ThreadedInferenceInterface.h:60
ConcurrentQueueRing< X > to_yield
Definition: ThreadedInferenceInterface.h:37
Primitive< typename Grammar_t::input_t > X(Op::X, BUILTIN_LAMBDA { assert(!vms->xstack.empty());vms->template push< typename Grammar_t::input_t >(vms->xstack.top());})
size_t nthreads
Definition: Control.h:26
std::atomic< size_t > index
Definition: ThreadedInferenceInterface.h:31
size_t __nthreads
Definition: ThreadedInferenceInterface.h:34
Definition: ThreadedInferenceInterface.h:22
generator< X & > unthreaded_run(Control ctl, Args... args)
Definition: ThreadedInferenceInterface.h:132
generator< X & > run(Control ctl, Args... args)
Set up the multiple threads and actually run, calling run_thread_generator_wrapper.
Definition: ThreadedInferenceInterface.h:82
This class has all the information for running MCMC or MCTS in a little package. It defaultly constru...
Definition: FleetArgs.h:10
std::optional< T > pop()
Definition: ConcurrentQueue.h:121