eyalroz/cuda-api-wrappers/peer__to__peer_8hpp_source.html

 #pragma once
 #ifndef CUDA_API_WRAPPERS_PEER_TO_PEER_HPP_
 #define CUDA_API_WRAPPERS_PEER_TO_PEER_HPP_

 #include "current_context.hpp"

 namespace cuda {

 namespace device {

 namespace peer_to_peer {


 /// Alias for the CUDA driver's CU_DEVICE_P2P_ATTRIBUTE_PERFORMANCE_RANK attribute code
 constexpr attribute_t link_performance_rank = CU_DEVICE_P2P_ATTRIBUTE_PERFORMANCE_RANK;

 /// 1 if access is supported, 0 otherwise
 constexpr attribute_t access_support = CU_DEVICE_P2P_ATTRIBUTE_ACCESS_SUPPORTED;

 /// 1 if the first device can perform native atomic operations on the second device, 0 otherwise
 constexpr attribute_t native_atomics_support = CU_DEVICE_P2P_ATTRIBUTE_NATIVE_ATOMIC_SUPPORTED;

 #if CUDA_VERSION >= 10000
 /// Alias for CU_DEVICE_P2P_ATTRIBUTE_CUDA_ARRAY_ACCESS_SUPPORTED; only available
 /// when CUDA_VERSION >= 10000. NOTE(review): presumably 1 if CUDA-array access
 /// between the two devices is supported, 0 otherwise - confirm against the driver docs.
 constexpr attribute_t array_access_support = CU_DEVICE_P2P_ATTRIBUTE_CUDA_ARRAY_ACCESS_SUPPORTED;
 #endif

 namespace detail_ {
 /**
  * Obtain a peer-to-peer attribute for an ordered pair of devices, given by
  * their raw driver IDs, via cuDeviceGetP2PAttribute().
  *
  * @param attribute the P2P attribute code to look up
  * @param source raw ID of the first device of the pair
  * @param destination raw ID of the second device of the pair
  * @return the value the driver wrote for the requested attribute
  *
  * @note An error is thrown (through throw_if_error_lazy) if the driver call
  * fails; the message string is only built in that case.
  */
 inline attribute_value_t get_attribute(attribute_t attribute, id_t source, id_t destination)
 {
     attribute_value_t attribute_value;
     auto query_status = cuDeviceGetP2PAttribute(&attribute_value, attribute, source, destination);
     throw_if_error_lazy(
         query_status,
         "Failed obtaining peer-to-peer device attribute for device pair ("
             + ::std::to_string(source) + ", " + ::std::to_string(destination) + ')');
     return attribute_value;
 }

 /**
  * Ask the driver, via cuDeviceCanAccessPeer(), whether one device can access
  * a peer device; both are given by their raw driver IDs.
  *
  * @param accessor raw ID of the device which would be doing the accessing
  * @param peer raw ID of the device which would be accessed
  * @return true if the driver reported a value of 1, false otherwise
  *
  * @note An error is thrown (through throw_if_error_lazy) if the driver call
  * fails; the message string is only built in that case.
  */
 inline bool can_access(const device::id_t accessor, const device::id_t peer)
 {
     int accessibility_flag;
     auto query_status = cuDeviceCanAccessPeer(&accessibility_flag, accessor, peer);
     throw_if_error_lazy(
         query_status,
         "Failed determining whether " + device::detail_::identify(accessor)
             + " can access " + device::detail_::identify(peer));
     return accessibility_flag == 1;
 }

 } // namespace detail_

 } // namespace peer_to_peer

 } // namespace device

 namespace context {

 namespace current {

 namespace peer_to_peer {

 /**
  * Declared here only; the definition is not part of this file.
  *
  * NOTE(review): judging by the enclosing namespace (context::current) and the
  * name, this presumably enables access by the current context to
  * @p peer_context - confirm against the definition.
  *
  * @param peer_context the context to which access is to be enabled
  */
 void enable_access_to(const context_t &peer_context);

 /**
  * Declared here only; the definition is not part of this file.
  *
  * NOTE(review): judging by the enclosing namespace (context::current) and the
  * name, this presumably disables access by the current context to
  * @p peer_context - confirm against the definition.
  *
  * @param peer_context the context to which access is to be disabled
  */
 void disable_access_to(const context_t &peer_context);

 } // namespace peer_to_peer

 } // namespace current

 namespace peer_to_peer {

 namespace detail_ {

 /**
  * Call cuCtxEnablePeerAccess() for a peer context given by its raw handle.
  * No accessor context is passed here; see the two-handle enable_access() for
  * a variant which first installs a specific accessor context.
  *
  * @param peer_context raw driver handle of the context to enable access to
  *
  * @note An error is thrown (through throw_if_error_lazy) if the driver call
  * fails; the message string is only built in that case.
  */
 inline void enable_access_to(context::handle_t peer_context)
 {
     // No flags are supported as of CUDA 8.0
     constexpr unsigned no_flags = 0;
     auto enabling_status = cuCtxEnablePeerAccess(peer_context, no_flags);
     throw_if_error_lazy(
         enabling_status,
         "Failed enabling access to peer " + context::detail_::identify(peer_context));
 }

 /**
  * Call cuCtxDisablePeerAccess() for a peer context given by its raw handle.
  * No accessor context is passed here; see the two-handle disable_access() for
  * a variant which first installs a specific accessor context.
  *
  * @param peer_context raw driver handle of the context to disable access to
  *
  * @note An error is thrown (through throw_if_error_lazy) if the driver call
  * fails; the message string is only built in that case.
  */
 inline void disable_access_to(context::handle_t peer_context)
 {
     auto disabling_status = cuCtxDisablePeerAccess(peer_context);
     throw_if_error_lazy(
         disabling_status,
         "Failed disabling access to peer " + context::detail_::identify(peer_context));
 }

 /**
  * Enable access to a peer context while a scoped override constructed from
  * the accessor's handle is in effect.
  *
  * @param accessor raw driver handle passed to the scoped context override
  * @param peer raw driver handle of the context to enable access to
  */
 inline void enable_access(context::handle_t accessor, context::handle_t peer)
 {
     // The override object lives until the end of this function, so the
     // call below is made while it is in effect
     context::current::detail_::scoped_override_t accessor_context_override(accessor);
     enable_access_to(peer);
 }

 /**
  * Disable access to a peer context while a scoped override constructed from
  * the accessor's handle is in effect.
  *
  * @param accessor raw driver handle passed to the scoped context override
  * @param peer raw driver handle of the context to disable access to
  */
 inline void disable_access(context::handle_t accessor, context::handle_t peer)
 {
     // The override object lives until the end of this function, so the
     // call below is made while it is in effect
     context::current::detail_::scoped_override_t accessor_context_override(accessor);
     disable_access_to(peer);
 }

 } // namespace detail_

 /**
  * Declared here only; the definition is not part of this file.
  *
  * NOTE(review): presumably determines whether @p accessor can access
  * @p peer - confirm against the definition.
  */
 bool can_access(context_t accessor, context_t peer);

 /**
  * Declared here only; the definition is not part of this file.
  *
  * NOTE(review): presumably the context_t-level counterpart of
  * detail_::enable_access(), enabling access by @p accessor to @p peer -
  * confirm against the definition.
  */
 void enable_access(context_t accessor, context_t peer);

 /**
  * Declared here only; the definition is not part of this file.
  *
  * NOTE(review): presumably the context_t-level counterpart of
  * detail_::disable_access(), disabling access by @p accessor to @p peer -
  * confirm against the definition.
  */
 void disable_access(context_t accessor, context_t peer);

 /**
  * Declared here only; the definition is not part of this file.
  *
  * NOTE(review): presumably enables access both by @p first to @p second and
  * the other way around - confirm against the definition.
  */
 void enable_bidirectional_access(context_t first, context_t second);

 /**
  * Declared here only; the definition is not part of this file.
  *
  * NOTE(review): presumably disables access both by @p first to @p second and
  * the other way around - confirm against the definition.
  */
 void disable_bidirectional_access(context_t first, context_t second);

 } // namespace peer_to_peer
 } // namespace context

 namespace device {

 namespace peer_to_peer {

 /**
  * Determine whether one CUDA device can access the global memory of another
  * CUDA device. (Defined in device.hpp.)
  *
  * @param accessor the device which would be doing the accessing
  * @param peer the device whose global memory would be accessed
  */
 inline bool can_access(const device_t& accessor, const device_t& peer);

 /**
  * Enable access by one CUDA device to the global memory of another.
  * (Defined in device.hpp.)
  *
  * @param accessor the device which is to gain access
  * @param peer the device whose global memory is to become accessible
  */
 inline void enable_access(const device_t& accessor, const device_t& peer);

 /**
  * Disable access by one CUDA device to the global memory of another.
  * (Defined in device.hpp.)
  *
  * @param accessor the device which is to lose access
  * @param peer the device whose global memory is to become inaccessible
  */
 inline void disable_access(const device_t& accessor, const device_t& peer);

 /**
  * Determine whether two CUDA devices can currently access each other.
  * (Defined in device.hpp.)
  */
 inline bool can_access_each_other(const device_t& first, const device_t& second);

 /**
  * Enable access both by the first to the second device and the other way
  * around. (Defined in device.hpp.)
  */
 inline void enable_bidirectional_access(const device_t& first, const device_t& second);

 /**
  * Disable access both by the first to the second device and the other way
  * around. (Defined in device.hpp.)
  */
 inline void disable_bidirectional_access(const device_t& first, const device_t& second);

 /**
  * Get one of the numeric attributes for an ordered pair of devices, relating
  * to their interaction. (Defined in device.hpp.)
  *
  * @param attribute the peer-to-peer attribute to look up, e.g. one of the
  * aliases defined at the top of this file
  * @param first the first device of the ordered pair
  * @param second the second device of the ordered pair
  */
 inline attribute_value_t get_attribute(attribute_t attribute, const device_t& first, const device_t& second);

 } // namespace peer_to_peer
 } // namespace device
 } // namespace cuda

 #endif // CUDA_API_WRAPPERS_PEER_TO_PEER_HPP_
cuda::device::attribute_value_t
int attribute_value_t
All CUDA device attributes (cuda::device::attribute_t) have a value of this type. ...
Definition: types.hpp:860

cuda::context_t
Wrapper class for a CUDA context.
Definition: context.hpp:244

cuda::device::peer_to_peer::can_access_each_other
bool can_access_each_other(const device_t &first, const device_t &second)
Determine whether two CUDA devices can currently access each other.
Definition: device.hpp:88

cuda
Definitions and functionality wrapping CUDA APIs.
Definition: array.hpp:22

cuda::device::peer_to_peer::can_access
bool can_access(const device_t &accessor, const device_t &peer)
Determine whether one CUDA device can access the global memory of another CUDA device.
Definition: device.hpp:68

cuda::context::handle_t
CUcontext handle_t
Raw CUDA driver handle for a context; see {context_t}.
Definition: types.hpp:878

cuda::device::peer_to_peer::get_attribute
attribute_value_t get_attribute(attribute_t attribute, const device_t &first, const device_t &second)
Get one of the numeric attributes for a(n ordered) pair of devices, relating to their interaction...
Definition: device.hpp:113

cuda::device::id_t
CUdevice id_t
Numeric ID of a CUDA device used by the CUDA Runtime API.
Definition: types.hpp:850

cuda::device::peer_to_peer::access_support
constexpr const attribute_t access_support
1 if access is supported, 0 otherwise
Definition: peer_to_peer.hpp:30

cuda::device::peer_to_peer::link_performance_rank
constexpr const attribute_t link_performance_rank
Aliases for CUDA driver GPU attribute codes.
Definition: peer_to_peer.hpp:27

current_context.hpp

cuda::device::peer_to_peer::native_atomics_support
constexpr const attribute_t native_atomics_support
1 if the first device can perform native atomic operations on the second device, 0 otherwise ...
Definition: peer_to_peer.hpp:33

cuda::device::peer_to_peer::attribute_t
CUdevice_P2PAttribute attribute_t
While individual CUDA devices have individual "attributes" (attribute_t), there are also attributes c...
Definition: types.hpp:869

throw_if_error_lazy
#define throw_if_error_lazy(status__,...)
A macro for only throwing an error if we've failed - which also ensures no string is constructed unle...
Definition: error.hpp:316

cuda::device::peer_to_peer::disable_access
void disable_access(const device_t &accessor, const device_t &peer)
Disable access by one CUDA device to the global memory of another.
Definition: device.hpp:78

cuda::device::peer_to_peer::enable_access
void enable_access(const device_t &accessor, const device_t &peer)
Enable access by one CUDA device to the global memory of another.
Definition: device.hpp:73

cuda::device::peer_to_peer::enable_bidirectional_access
void enable_bidirectional_access(const device_t &first, const device_t &second)
Enable access both by the first to the second device and the other way around.
Definition: device.hpp:93

cuda::device_t
Wrapper class for a CUDA device.
Definition: device.hpp:135

cuda::device::peer_to_peer::disable_bidirectional_access
void disable_bidirectional_access(const device_t &first, const device_t &second)
Disable access both by the first to the second device and the other way around.
Definition: device.hpp:103