// pinned_memory_resource.hpp
5 #pragma once
6 
7 #include <cstddef>
8 #include <memory>
9 
10 #include <cuda.h>
11 #include <cuda_runtime_api.h>
12 
13 #include <cuda/memory_resource>
14 
15 #include <rmm/aligned.hpp>
16 #include <rmm/cuda_device.hpp>
17 #include <rmm/cuda_stream_view.hpp>
18 #include <rmm/device_buffer.hpp>
19 
20 #include <rapidsmpf/error.hpp>
21 #include <rapidsmpf/memory/host_memory_resource.hpp>
22 #include <rapidsmpf/system_info.hpp>
23 #include <rapidsmpf/utils.hpp>
24 
25 
27 // NOLINTBEGIN(modernize-macro-to-enum)
28 #define RAPIDSMPF_PINNED_MEM_RES_MIN_CUDA_VERSION 12060
29 #define RAPIDSMPF_PINNED_MEM_RES_MIN_CUDA_VERSION_STR "v12.6"
30 
31 // NOLINTEND(modernize-macro-to-enum)
32 
33 namespace rapidsmpf {
34 
40 inline bool is_pinned_memory_resources_supported() {
41  static const bool supported = [] {
42  // check if the device supports async memory pools
43  int cuda_pool_supported{};
44  auto attr_result = cudaDeviceGetAttribute(
45  &cuda_pool_supported,
46  cudaDevAttrMemoryPoolsSupported,
48  );
49  if (attr_result != cudaSuccess || cuda_pool_supported != 1) {
50  return false;
51  }
52 
53  int cuda_driver_version{};
54  auto driver_result = cudaDriverGetVersion(&cuda_driver_version);
55  int cuda_runtime_version{};
56  auto runtime_result = cudaRuntimeGetVersion(&cuda_runtime_version);
57  return driver_result == cudaSuccess && runtime_result == cudaSuccess
58  && cuda_driver_version >= RAPIDSMPF_PINNED_MEM_RES_MIN_CUDA_VERSION
59  && cuda_runtime_version >= RAPIDSMPF_PINNED_MEM_RES_MIN_CUDA_VERSION;
60  }();
61  return supported;
62 }
63 
64 class PinnedMemoryResource;
65 
74  public:
76  static constexpr auto Disabled = nullptr;
77 
90  PinnedMemoryResource(int numa_id = get_current_numa_node());
91 
103  static std::shared_ptr<PinnedMemoryResource> make_if_available(
104  int numa_id = get_current_numa_node()
105  );
106 
107  ~PinnedMemoryResource() override;
108 
120  void* allocate(
121  rmm::cuda_stream_view stream,
122  std::size_t size,
123  std::size_t alignment = rmm::CUDA_ALLOCATION_ALIGNMENT
124  ) override;
125 
135  rmm::cuda_stream_view stream,
136  void* ptr,
137  std::size_t size,
138  std::size_t alignment = rmm::CUDA_ALLOCATION_ALIGNMENT
139  ) noexcept override;
140 
150  [[nodiscard]] bool is_equal(HostMemoryResource const& other) const noexcept override;
151 
157  friend void get_property(
158  PinnedMemoryResource const&, cuda::mr::device_accessible
159  ) noexcept {}
160 
161  private:
162  // using PImpl idiom to hide cudax .cuh headers from rapidsmpf. cudax cuh headers will
163  // only be used by the impl in .cu file.
164  struct PinnedMemoryResourceImpl;
165  std::shared_ptr<PinnedMemoryResourceImpl> impl_;
166 };
167 
// Compile-time checks that PinnedMemoryResource satisfies the libcu++ memory
// resource concept and advertises both host and device accessibility.
static_assert(cuda::mr::resource<PinnedMemoryResource>);
static_assert(cuda::mr::resource_with<PinnedMemoryResource, cuda::mr::host_accessible>);
static_assert(cuda::mr::resource_with<PinnedMemoryResource, cuda::mr::device_accessible>);
171 
172 } // namespace rapidsmpf
/*
 * Extracted API summary (documentation-tooling residue appended after the
 * namespace; kept here as a comment so the header remains well-formed):
 *
 * - HostMemoryResource: host memory resource using standard CPU allocation.
 * - PinnedMemoryResource: memory resource that provides pinned (page-locked)
 *   host memory using a pool.
 * - bool is_equal(HostMemoryResource const& other) const noexcept override:
 *   compares this resource to another resource.
 * - PinnedMemoryResource(int numa_id = get_current_numa_node()): construct a
 *   pinned (page-locked) host memory resource.
 * - static constexpr auto Disabled: sentinel value used to disable pinned host
 *   memory.
 * - void* allocate(rmm::cuda_stream_view stream, std::size_t size,
 *   std::size_t alignment = rmm::CUDA_ALLOCATION_ALIGNMENT) override:
 *   allocates pinned host memory associated with a CUDA stream.
 * - void deallocate(rmm::cuda_stream_view stream, void* ptr, std::size_t size,
 *   std::size_t alignment = rmm::CUDA_ALLOCATION_ALIGNMENT) noexcept override:
 *   deallocates pinned host memory associated with a CUDA stream.
 * - friend void get_property(PinnedMemoryResource const&,
 *   cuda::mr::device_accessible) noexcept: enables the
 *   cuda::mr::device_accessible property.
 * - static std::shared_ptr<PinnedMemoryResource> make_if_available(
 *   int numa_id = get_current_numa_node()): create a pinned memory resource if
 *   the system supports pinned memory.
 * - cuda_device_id get_current_cuda_device()
 * - static constexpr std::size_t CUDA_ALLOCATION_ALIGNMENT
 */