eyalroz/cuda-api-wrappers/multi__wrapper__impls_2event_8hpp_source.html

 #pragma once
 #ifndef MULTI_WRAPPER_IMPLS_EVENT_HPP_
 #define MULTI_WRAPPER_IMPLS_EVENT_HPP_

 #include "../device.hpp"
 #include "../event.hpp"
 #include "../stream.hpp"
 #include "../primary_context.hpp"
 #include "../virtual_memory.hpp"
 #include "../current_context.hpp"
 #include "../current_device.hpp"

 #include <type_traits>
 #include <vector>
 #include <algorithm>

 namespace cuda {

 namespace event {

 // Creates a new event within the given (not necessarily primary) context.
 //
 // The context's device ID and raw handle are forwarded to the detail-level
 // creation function, together with the three event property flags. The
 // resulting wrapper is told not to hold a primary-context refcount unit.
 inline event_t create(
     const context_t&  context,
     bool              uses_blocking_sync,
     bool              records_timing,
     bool              interprocess)
 {
     const auto id_of_device = context.device_id();
     const auto handle_of_context = context.handle();
     return event::detail_::create(
         id_of_device, handle_of_context,
         do_not_hold_primary_context_refcount_unit,
         uses_blocking_sync, records_timing, interprocess);
 }

 // Creates a new event in the primary context of the given device.
 //
 // The primary context may be active right now, but nothing guarantees it
 // stays that way. We therefore bump the primary context's refcount "on
 // behalf" of the event being created, and mark the resulting wrapper as
 // holding that refcount unit.
 //
 // todo: consider having the event wrapper take care of the primary
 //  context refcount.
 //
 // NOTE(review): the refcount is increased before the event is created; if
 // creation throws, nothing in this function gives the unit back - confirm
 // whether that is acceptable.
 inline event_t create(
     const device_t&  device,
     bool             uses_blocking_sync,
     bool             records_timing,
     bool             interprocess)
 {
     auto primary_ctx = device.primary_context(do_not_hold_primary_context_refcount_unit);
     // Make the primary context the current one for the rest of this scope
     CAW_SET_SCOPE_CONTEXT(primary_ctx.handle());
     device::primary_context::detail_::increase_refcount(device.id());
     return event::detail_::create_in_current_context(
         device.id(),
         context::current::detail_::get_handle(),
         do_hold_primary_context_refcount_unit,
         uses_blocking_sync,
         records_timing,
         interprocess);
 }

 namespace ipc {

 // Produces an inter-process handle for the given event, by passing the
 // event's raw handle to the detail-level export function.
 inline handle_t export_(const event_t& event)
 {
     const auto raw_event_handle = event.handle();
     return detail_::export_(raw_event_handle);
 }

 // Wraps an event, imported via its inter-process handle, as an event of
 // the given context. The returned wrapper neither owns the imported event
 // nor holds a primary-context refcount unit.
 inline event_t import(const context_t& context, const handle_t& event_ipc_handle)
 {
     constexpr bool take_ownership = false;
     constexpr bool hold_pc_refcount_unit = false;
     return event::wrap(
         context.device_id(), context.handle(),
         detail_::import(event_ipc_handle),
         take_ownership, hold_pc_refcount_unit);
 }


 // Wraps an event, imported via its inter-process handle, as an event of
 // the primary context of the given device.
 //
 // The primary context's refcount is increased "on behalf" of the returned
 // wrapper, which is marked as holding that refcount unit. The wrapper does
 // not take ownership of the imported event itself.
 //
 // The primary context is made current for the duration of this function,
 // as the device-based event::create() does. This way the import is
 // performed in that context, and the context handle recorded in the
 // wrapper matches the device ID recorded next to it, rather than being
 // whatever context happened to be current at the time of the call.
 //
 // NOTE(review): the refcount is increased before the import; if the import
 // throws, nothing in this function gives the unit back - confirm whether
 // that is acceptable.
 inline event_t import(const device_t& device, const handle_t& event_ipc_handle)
 {
     auto pc = device.primary_context();
     CAW_SET_SCOPE_CONTEXT(pc.handle());
     device::primary_context::detail_::increase_refcount(device.id());
     auto handle = detail_::import(event_ipc_handle);
     return event::wrap(
         device.id(), pc.handle(), handle,
         do_not_take_ownership, do_hold_primary_context_refcount_unit);
 }

 } // namespace ipc

 } // namespace event

 // Returns a device proxy obtained from this event's device ID.
 inline device_t event_t::device() const
 {
     const auto id_of_device = device_id();
     return cuda::device::get(id_of_device);
 }

 // Returns a non-owning context wrapper built from this event's device ID
 // and context handle.
 inline context_t event_t::context() const
 {
     constexpr bool take_ownership = false;
     return context::wrap(device_id(), context_handle_, take_ownership);
 }

 // Enqueues this event on the given stream.
 //
 // When NDEBUG is not defined, the stream's context handle is first compared
 // against this event's context handle, and ::std::invalid_argument is
 // thrown if the two differ.
 inline void event_t::record(const stream_t& stream) const
 {
 #ifndef NDEBUG
     const bool contexts_match = (stream.context_handle() == context_handle_);
     if (not contexts_match) {
         throw ::std::invalid_argument("Attempt to record an event on a stream in a different context");
     }
 #endif
     const auto stream_handle = stream.handle();
     event::detail_::enqueue(context_handle_, stream_handle, handle_);
 }

 inline void event_t::fire(const stream_t& stream) const
 {
     record(stream);
     stream.synchronize();
 }

 } // namespace cuda

 #endif // MULTI_WRAPPER_IMPLS_EVENT_HPP_

cuda::stream_t::context_handle
context::handle_t context_handle() const noexcept
The raw CUDA handle for the context in which the represented stream is defined.
Definition: stream.hpp:260

cuda::stream_t
Proxy class for a CUDA stream.
Definition: stream.hpp:246

cuda::event_t::handle
event::handle_t handle() const noexcept
The raw CUDA handle for this event.
Definition: event.hpp:143

cuda::stream_t::handle
stream::handle_t handle() const noexcept
The raw CUDA handle for a stream which this class wraps.
Definition: stream.hpp:257

cuda::context_t
Wrapper class for a CUDA context.
Definition: context.hpp:244

cuda::stream_t::synchronize
void synchronize() const
Block or busy-wait until all previously-scheduled work on this stream has been completed.
Definition: stream.hpp:831

cuda
Definitions and functionality wrapping CUDA APIs.
Definition: array.hpp:22

cuda::event::ipc::export_
handle_t export_(const event_t &event)
Enable other processes to use an event which this process created.
Definition: event.hpp:71

cuda::event_t
Wrapper class for a CUDA event.
Definition: event.hpp:133

cuda::event_t::fire
void fire(const stream_t &stream) const
Records the event and ensures it has occurred before returning (by synchronizing the stream)...
Definition: event.hpp:124

cuda::event::create
event_t create(const context_t &context, bool uses_blocking_sync=sync_by_busy_waiting, bool records_timing=do_record_timings, bool interprocess=not_interprocess)
creates a new event.
Definition: event.hpp:30

cuda::device_t::id
device::id_t id() const noexcept
Return the proxied device's ID.
Definition: device.hpp:594

cuda::event::ipc::handle_t
CUipcEventHandle handle_t
The concrete value passed between processes, used to tell the CUDA Runtime API which event is desired...
Definition: ipc.hpp:260

cuda::event::wrap
event_t wrap(device::id_t device_id, context::handle_t context_handle, handle_t event_handle, bool take_ownership=false, bool hold_pc_refcount_unit=false) noexcept
Wrap an existing CUDA event in an event_t instance.
Definition: event.hpp:346

cuda::event::create
event_t create(const device_t &device, bool uses_blocking_sync=sync_by_busy_waiting, bool records_timing=do_record_timings, bool interprocess=not_interprocess)
creates a new event on (the primary execution context of) a device.
Definition: event.hpp:45

cuda::device_t::primary_context
device::primary_context_t primary_context(bool hold_pc_refcount_unit=false) const
Produce a proxy for the device's primary context - the one used by runtime API calls.
Definition: device.hpp:152

cuda::device::get
device_t get(id_t id)
Returns a proxy for the CUDA device with a given id.
Definition: device.hpp:837

cuda::event_t::record
void record() const
Schedule a specified event to occur (= to fire) when all activities already scheduled on the event's ...
Definition: event.hpp:196

cuda::event_t::device
device_t device() const
The device w.r.t. which the event is defined.
Definition: event.hpp:103

cuda::event::interprocess
Can be shared between processes. Must not be able to record timings.
Definition: constants.hpp:96

cuda::device_t
Wrapper class for a CUDA device.
Definition: device.hpp:135

cuda::event_t::context
context_t context() const
The context in which this event was defined.
Definition: event.hpp:108