eyalroz/cuda-api-wrappers/device__properties_8hpp_source.html

 #pragma once
 #ifndef CUDA_API_WRAPPERS_DEVICE_PROPERTIES_HPP_
 #define CUDA_API_WRAPPERS_DEVICE_PROPERTIES_HPP_

 #include "constants.hpp"
 #include "pci_id.hpp"

 #include "types.hpp"

 #include <cuda_runtime_api.h>

 #include <stdexcept>


 // The following un-definitions avoid warnings about
 // the use of `major` and `minor` in certain versions
 // of the GNU C library
 #ifdef major
 #undef major
 #endif

 #ifdef minor
 #undef minor
 #endif

 namespace cuda {

 namespace device {

 /// Type of the number of multiprocessors within a single GPU.
 using multiprocessor_count_t = int;

 /**
  * A numeric designator of an architectural generation of CUDA devices.
  *
  * The type has a single public data member and no constructors, so it can
  * be brace-initialized directly from the major number.
  */
 struct compute_architecture_t {
     /// The "major" number of a compute capability, indicating the architecture.
     unsigned major;

     /// @return true if this designator is considered valid. Only declared
     /// here; the definition lives outside this section of the file.
     constexpr bool is_valid() const noexcept;

     /// @return a C string for this architecture (presumably its marketing
     /// name - confirm against the out-of-line definition).
     char const* name() const;
 };

 /**
  * A numeric designator of the computational capabilities of a CUDA device.
  *
  * Made up of an architecture (the "major" number) and a minor number. The
  * type has only public data members and no constructors, so it can be
  * brace-initialized as `{ { major }, minor }`.
  */
 struct compute_capability_t {

     /// The major capability designator.
     compute_architecture_t architecture;

     /// The minor designator. The trailing underscore keeps the name distinct
     /// from the `minor()` accessor below.
     unsigned minor_;

     /// Named constructor from a single combined number. Only declared here;
     /// the exact encoding is set by the out-of-line definition (presumably
     /// major * 10 + minor - confirm there).
     static constexpr compute_capability_t from_combined_number(unsigned combined) noexcept;

     /// @return the major number, i.e. `architecture.major`.
     /// Marked noexcept for consistency with the other constexpr members;
     /// it merely reads a data member.
     constexpr unsigned major() const noexcept { return architecture.major; }

     /// @return the minor number, i.e. `minor_`.
     constexpr unsigned minor() const noexcept { return minor_; }

     /// @return this capability as a single combined number (counterpart of
     /// `from_combined_number()`); defined out-of-line.
     constexpr unsigned as_combined_number() const noexcept;

     /// @return true if this capability is considered valid; defined out-of-line.
     constexpr bool is_valid() const noexcept;

     // The queries below are only declared here. Their values are supplied
     // by the out-of-line definitions, which are not visible in this header
     // section.

     unsigned max_warp_schedulings_per_processor_cycle() const;
     unsigned max_resident_warps_per_processor() const;

     unsigned max_in_flight_threads_per_processor() const;

     memory::shared::size_t max_shared_memory_per_block() const;
 };

 /**
  * A named constructor idiom for {@ref compute_capability_t}, taking a single
  * combined number.
  *
  * @param combined the capability as one number; the encoding is set by the
  * out-of-line definition (presumably major * 10 + minor - TODO confirm)
  */
 constexpr compute_capability_t make_compute_capability(unsigned combined) noexcept;

 /**
  * A named constructor idiom for {@ref compute_capability_t}, taking the
  * major and minor numbers separately.
  *
  * @param major the major (architecture) number
  * @param minor the minor number
  */
 constexpr compute_capability_t make_compute_capability(unsigned major, unsigned minor) noexcept;

 /**
  * A structure holding a collection of various properties of a device.
  *
  * It publicly derives from the CUDA runtime's `cudaDeviceProp`, so all of
  * that struct's raw fields stay directly accessible; the members added here
  * are typed convenience accessors over those fields.
  */
 struct properties_t : public cudaDeviceProp {

     properties_t() = default;

     /// Implicit conversion from the raw runtime-API structure (copies it).
     properties_t(const cudaDeviceProp& cdp) noexcept
         : cudaDeviceProp(cdp)
     { }

     /// Same as above for rvalues; `cdp` is an lvalue inside the initializer,
     /// so the base is copy-constructed here as well.
     properties_t(cudaDeviceProp&& cdp) noexcept
         : cudaDeviceProp(cdp)
     { }

     /// Only declared here; the criteria are set by the out-of-line definition.
     bool usable_for_compute() const noexcept;

     /// @return the device's compute capability, built from the raw
     /// `major` and `minor` fields.
     compute_capability_t compute_capability() const noexcept
     {
         return { { static_cast<unsigned>(major) }, static_cast<unsigned>(minor) };
     }

     /// @return the device's compute architecture, built from the raw
     /// `major` field.
     compute_architecture_t compute_architecture() const noexcept
     {
         return { static_cast<unsigned>(major) };
     }

     /// @return the device's PCI location, built from the raw domain, bus and
     /// device IDs; the final field is value-initialized.
     pci_location_t pci_id() const noexcept
     {
         return { pciDomainID, pciBusID, pciDeviceID, {} };
     }

     /// @return the per-multiprocessor in-flight thread maximum for this
     /// device's compute capability, multiplied by the multiprocessor count.
     unsigned max_in_flight_threads_on_device() const
     {
         return compute_capability().max_in_flight_threads_per_processor() * multiProcessorCount;
     }

     /// @return the raw `maxThreadsPerBlock` field.
     grid::block_dimension_t max_threads_per_block() const noexcept
     {
         return maxThreadsPerBlock;
     }

     /// @return `maxThreadsPerBlock` divided by `warp_size` (integer division).
     grid::block_dimension_t max_warps_per_block() const noexcept
     {
         return maxThreadsPerBlock / warp_size;
     }

     /// @return the raw `sharedMemPerBlock` field.
     size_t max_shared_memory_per_block() const noexcept
     {
         return sharedMemPerBlock;
     }

     /// @return the raw `totalGlobalMem` field.
     size_t global_memory_size() const noexcept
     {
         return totalGlobalMem;
     }

     /// @return true if the raw `canMapHostMemory` flag is non-zero.
     bool can_map_host_memory() const noexcept
     {
         return canMapHostMemory != 0;
     }
 };

 } // namespace device
 } // namespace cuda

 #include "detail/device_properties.hpp"

 #endif // CUDA_API_WRAPPERS_DEVICE_PROPERTIES_HPP_
cuda
Definitions and functionality wrapping CUDA APIs.
Definition: array.hpp:22

cuda::grid::block_dimension_t
dimension_t block_dimension_t
CUDA kernels are launched in grids of blocks of threads, in 3 dimensions.
Definition: types.hpp:312

cuda::device::compute_capability_t
A numeric designator of the computational capabilities of a CUDA device.
Definition: device_properties.hpp:75

cuda::memory::shared::size_t
unsigned size_t
Each physical core ("Streaming Multiprocessor") on an NVIDIA GPU has a space of shared memory (see th...
Definition: types.hpp:730

cuda::device::compute_architecture_t::name
const char * name() const

cuda::device::compute_architecture_t::major
unsigned major
A compute_capability_t has a "major" and a "minor" number, with "major" indicating the architecture; ...
Definition: device_properties.hpp:51

cuda::device::pci_location_t
Location "coordinates" for a CUDA device on a PCIe bus.
Definition: pci_id.hpp:24

cuda::device::compute_capability_t::architecture
compute_architecture_t architecture
The major capability designator.
Definition: device_properties.hpp:78

constants.hpp
Fundamental CUDA-related constants and enumerations, not dependent on any more complex abstractions...

cuda::device::compute_architecture_t
A numeric designator of an architectural generation of CUDA devices.
Definition: device_properties.hpp:45

cuda::device::make_compute_capability
constexpr compute_capability_t make_compute_capability(unsigned combined) noexcept
A named constructor idiom for {compute_capability_t}.

cuda::device::properties_t
A structure holding a collection of various properties of a device.
Definition: device_properties.hpp:149

cuda::device::compute_architecture_t::is_valid
constexpr bool is_valid() const noexcept

cuda::device::compute_capability_t::minor_
unsigned minor_
The minor designator, indicating mostly numeric choices of capabilities (e.g.
Definition: device_properties.hpp:83

cuda::device::multiprocessor_count_t
int multiprocessor_count_t
Type of the number of multiprocessors within a single GPU.
Definition: device_properties.hpp:37

types.hpp
Fundamental CUDA-related type definitions.

pci_id.hpp
Definition of a wrapper class for CUDA PCI device ID information.