rapidsmpf: /__w/rapidsmpf/rapidsmpf/cpp/include/rapidsmpf/memory/buffer_resource.hpp Source File

 #pragma once


 #include <array>

 #include <memory>

 #include <mutex>

 #include <optional>

 #include <ranges>

 #include <unordered_map>

 #include <utility>


 #include <cuda/memory_resource>


 #include <rmm/cuda_stream_pool.hpp>


 #include <rapidsmpf/error.hpp>

 #include <rapidsmpf/memory/buffer.hpp>

 #include <rapidsmpf/memory/host_memory_resource.hpp>

 #include <rapidsmpf/memory/memory_reservation.hpp>

 #include <rapidsmpf/memory/pinned_memory_resource.hpp>

 #include <rapidsmpf/memory/resource_types.hpp>

 #include <rapidsmpf/memory/spill_manager.hpp>

 #include <rapidsmpf/rmm_resource_adaptor.hpp>

 #include <rapidsmpf/statistics.hpp>

 #include <rapidsmpf/utils/misc.hpp>


 namespace rapidsmpf {


 /**
  * @brief Policy controlling whether a memory reservation is allowed to overbook.
  *
  * Backed by `bool`, so the two enumerators map onto `false` / `true`.
  */
 enum class AllowOverbooking : bool {
     NO = false,  ///< Overbooking is not allowed.
     YES = true,  ///< Overbooking is allowed.
 };


 /**
  * @brief Class managing buffer resources.
  *
  * Bundles the device, pinned-host and host memory resources together with
  * per-memory-type reservation counters, a CUDA stream pool, a spill manager
  * and a statistics handle.
  */
 class BufferResource {
   public:
     /// @brief Callback function to determine available memory.
     using MemoryAvailable = std::function<std::int64_t()>;

     /**
      * @brief Constructs a buffer resource.
      *
      * @param device_mr Owning, type-erased device-accessible memory resource.
      * @param pinned_mr Pinned host memory resource, or
      * `PinnedMemoryResource::Disabled` (the default) when pinned memory is off.
      * @param memory_available Map from memory type to its availability callback
      * (empty by default).
      * @param periodic_spill_check Optional duration, one millisecond by default.
      * NOTE(review): how the duration (or its absence) drives spilling is decided
      * in the implementation, which is not visible in this header.
      * @param stream_pool Shared CUDA stream pool; by default a new pool of 16
      * non-blocking streams.
      * @param statistics Shared statistics object; by default the disabled
      * instance returned by `Statistics::disabled()`.
      */
     BufferResource(
         cuda::mr::any_resource<cuda::mr::device_accessible> device_mr,
         std::optional<PinnedMemoryResource> pinned_mr = PinnedMemoryResource::Disabled,
         std::unordered_map<MemoryType, MemoryAvailable> memory_available = {},
         std::optional<Duration> periodic_spill_check = std::chrono::milliseconds{1},
         std::shared_ptr<rmm::cuda_stream_pool> stream_pool = std::make_shared<
             rmm::cuda_stream_pool>(16, rmm::cuda_stream::flags::non_blocking),
         std::shared_ptr<Statistics> statistics = Statistics::disabled()
     );

     /**
      * @brief Construct a BufferResource from configuration options.
      *
      * @param mr RMM resource adaptor handed to the new instance.
      * @param options Configuration options to read from.
      * @return Shared pointer to the newly constructed buffer resource.
      */
     static std::shared_ptr<BufferResource> from_options(
         RmmResourceAdaptor mr, config::Options options
     );

     ~BufferResource() noexcept = default;

     /// @brief Get the RMM device memory resource.
     [[nodiscard]] rmm::device_async_resource_ref device_mr() const noexcept;

     /// @brief Get the RMM host memory resource.
     [[nodiscard]] rmm::host_async_resource_ref host_mr() noexcept;

     /**
      * @brief Get the RMM pinned host memory resource.
      *
      * Unlike `try_pinned_mr()`, this accessor is not `noexcept`.
      * NOTE(review): presumably it fails when pinned memory is disabled — confirm
      * against the implementation.
      */
     [[nodiscard]] rmm::host_device_async_resource_ref pinned_mr();

     /**
      * @brief Get the pinned host memory resource if available.
      *
      * @return The resource wrapped in an optional; presumably `std::nullopt`
      * when pinned memory is disabled (verify in the implementation).
      */
     [[nodiscard]] std::optional<any_host_device_resource> try_pinned_mr() const noexcept;

     /**
      * @brief Retrieves the memory availability function for a given memory type.
      *
      * @param mem_type Memory type to look up.
      * @return Reference to the stored callback.
      * @throws std::out_of_range if no callback is registered for `mem_type`
      * (the lookup uses `std::unordered_map::at`).
      */
     [[nodiscard]] MemoryAvailable const& memory_available(MemoryType mem_type) const {
         auto const& available_fn = memory_available_.at(mem_type);
         return available_fn;
     }

     /**
      * @brief Get the current reserved memory of the specified memory type.
      *
      * @param mem_type Memory type whose counter is read; its underlying value is
      * used directly as the array index, without a bounds check.
      * @return The reserved counter for `mem_type`.
      */
     [[nodiscard]] std::size_t memory_reserved(MemoryType mem_type) const {
         auto const slot = static_cast<std::size_t>(mem_type);
         return memory_reserved_[slot];
     }

     /**
      * @brief Reserve an amount of the specified memory type.
      *
      * @param mem_type Memory type to reserve from.
      * @param size Requested size.
      * @param allow_overbooking Whether the reservation may overbook.
      * @return The reservation paired with a `std::size_t`.
      * NOTE(review): the meaning of the second element is not visible in this
      * header — presumably the overbooked amount; confirm in the implementation.
      */
     std::pair<MemoryReservation, std::size_t> reserve(
         MemoryType mem_type, std::size_t size, AllowOverbooking allow_overbooking
     );

     /**
      * @brief Reserve device memory and spill if necessary.
      *
      * @param size Requested size.
      * @param allow_overbooking Whether the reservation may overbook.
      * @return The resulting reservation.
      */
     MemoryReservation reserve_device_memory_and_spill(
         std::size_t size, AllowOverbooking allow_overbooking
     );

     /**
      * @brief Make a memory reservation or fail based on the given order of
      * memory types.
      *
      * The memory types are tried in iteration order, each without overbooking.
      * The first reservation whose size equals `size` is returned.
      * `MemoryType::PINNED_HOST` is skipped while no pinned memory resource is
      * configured.
      *
      * @tparam Range Input range whose values convert to `MemoryType`.
      * @param size Requested size.
      * @param mem_types Memory types to try, in order of preference.
      * @return The first full-size reservation obtained.
      *
      * If no memory type yields a full-size reservation, the failure is raised
      * through `RAPIDSMPF_FAIL` with `std::runtime_error` as its exception type
      * argument.
      */
     template <std::ranges::input_range Range>
         requires std::convertible_to<std::ranges::range_value_t<Range>, MemoryType>
     [[nodiscard]] MemoryReservation reserve_or_fail(std::size_t size, Range mem_types) {
         for (auto const& candidate : mem_types) {
             // Pinned host memory can only be reserved when a pinned memory
             // resource has been configured.
             bool const pinned_unavailable =
                 candidate == MemoryType::PINNED_HOST
                 && pinned_mr_ == PinnedMemoryResource::Disabled;
             if (!pinned_unavailable) {
                 auto attempt = reserve(candidate, size, AllowOverbooking::NO);
                 if (attempt.first.size() == size) {
                     // A pair member is not implicitly moved on return, so the
                     // explicit move is required here.
                     return std::move(attempt.first);
                 }
             }
         }
         RAPIDSMPF_FAIL("failed to reserve memory", std::runtime_error);
     }

     /**
      * @brief Make a memory reservation or fail.
      *
      * Forwards to the range overload with a one-element view over `mem_type`.
      *
      * @param size Requested size.
      * @param mem_type The only memory type to try.
      * @return The full-size reservation.
      */
     [[nodiscard]] MemoryReservation reserve_or_fail(
         std::size_t size, MemoryType mem_type
     ) {
         std::ranges::single_view<MemoryType> const only_type{mem_type};
         return reserve_or_fail(size, only_type);
     }

     /**
      * @brief Consume a portion of the reserved memory.
      *
      * @param reservation Reservation to consume from.
      * @param size Amount to consume.
      * @return A `std::size_t`; presumably the size remaining in the reservation
      * (confirm in the implementation).
      */
     std::size_t release(MemoryReservation& reservation, std::size_t size);

     /**
      * @brief Allocate a buffer of the specified memory type by the reservation.
      *
      * @param size Size of the buffer.
      * @param stream CUDA stream passed to the allocation.
      * @param reservation Reservation the allocation is drawn from.
      * @return The newly allocated buffer.
      */
     std::unique_ptr<Buffer> allocate(
         std::size_t size, rmm::cuda_stream_view stream, MemoryReservation& reservation
     );

     /**
      * @brief Allocate a buffer consuming the entire reservation.
      *
      * @param stream CUDA stream passed to the allocation.
      * @param reservation Reservation to consume; taken by rvalue reference.
      * @return The newly allocated buffer.
      */
     std::unique_ptr<Buffer> allocate(
         rmm::cuda_stream_view stream, MemoryReservation&& reservation
     );

     /**
      * @brief Move device buffer data into a Buffer.
      *
      * @param data Device buffer whose ownership is handed over.
      * @param stream CUDA stream associated with the data.
      * @return The resulting Buffer.
      */
     std::unique_ptr<Buffer> move(
         std::unique_ptr<rmm::device_buffer> data, rmm::cuda_stream_view stream
     );

     /**
      * @brief Move a Buffer to the memory type specified by the reservation.
      *
      * @param buffer Buffer whose ownership is handed over.
      * @param reservation Reservation that determines the target memory type.
      * @return The resulting Buffer.
      */
     std::unique_ptr<Buffer> move(
         std::unique_ptr<Buffer> buffer, MemoryReservation& reservation
     );

     /**
      * @brief Move a Buffer to a device buffer.
      *
      * @param buffer Buffer whose ownership is handed over.
      * @param reservation Reservation used for the move.
      * @return The resulting device buffer.
      */
     std::unique_ptr<rmm::device_buffer> move_to_device_buffer(
         std::unique_ptr<Buffer> buffer, MemoryReservation& reservation
     );

     /**
      * @brief Move a Buffer into a host buffer.
      *
      * @param buffer Buffer whose ownership is handed over.
      * @param reservation Reservation used for the move.
      * @return The resulting host buffer.
      */
     std::unique_ptr<HostBuffer> move_to_host_buffer(
         std::unique_ptr<Buffer> buffer, MemoryReservation& reservation
     );

     /// @brief Returns the CUDA stream pool used by this buffer resource.
     rmm::cuda_stream_pool const& stream_pool() const;

     /// @brief Gets a reference to the spill manager used.
     SpillManager& spill_manager();

     /// @brief Gets a shared pointer to the statistics associated with this
     /// buffer resource.
     std::shared_ptr<Statistics> statistics();

   private:
     std::mutex mutex_;
     cuda::mr::any_resource<cuda::mr::device_accessible> device_mr_;
     std::optional<PinnedMemoryResource> pinned_mr_;
     HostMemoryResource host_mr_;
     std::unordered_map<MemoryType, MemoryAvailable> memory_available_;
     // One reserved-memory counter per memory type, value-initialized to zero.
     std::array<std::size_t, MEMORY_TYPES.size()> memory_reserved_ = {};
     std::shared_ptr<rmm::cuda_stream_pool> stream_pool_;
     SpillManager spill_manager_;
     std::shared_ptr<Statistics> statistics_;
 };


 /**
  * @brief A functor for querying the remaining available memory within a
  * defined limit.
  *
  * Stores a fixed limit together with an `RmmResourceAdaptor` and reports the
  * limit minus the adaptor's currently allocated byte count.
  */
 class LimitAvailableMemory {
   public:
     /// The memory limit.
     std::int64_t const limit;

     /**
      * @brief Constructs a LimitAvailableMemory instance.
      *
      * @param mr RMM resource adaptor whose current allocation is queried.
      * @param limit The memory limit that allocations are measured against.
      */
     LimitAvailableMemory(RmmResourceAdaptor mr, std::int64_t limit)
         : limit{limit}, mr_{std::move(mr)} {}

     /**
      * @brief Returns the remaining available memory within the defined limit.
      *
      * @return `limit` minus the adaptor's current allocation; the value is
      * negative when the current allocation exceeds the limit.
      */
     std::int64_t operator()() const {
         std::int64_t const in_use = mr_.current_allocated();
         return limit - in_use;
     }

   private:
     RmmResourceAdaptor const mr_;
 };


 /**
  * @brief Construct a map of memory-available functions from configuration
  * options.
  *
  * @param mr RMM resource adaptor made available to the constructed callbacks.
  * @param options Configuration options to read from.
  * @return Map from memory type to its `BufferResource::MemoryAvailable`
  * callback.
  */
 std::unordered_map<MemoryType, BufferResource::MemoryAvailable>

 memory_available_from_options(RmmResourceAdaptor mr, config::Options options);


 /**
  * @brief Get the `periodic_spill_check` parameter from configuration options.
  *
  * @param options Configuration options to read from.
  * @return The configured duration, or an empty optional.
  * NOTE(review): which option value yields an empty optional is decided in the
  * implementation, which is not visible here.
  */
 std::optional<Duration> periodic_spill_check_from_options(config::Options options);


 /**
  * @brief Get a new CUDA stream pool from configuration options.
  *
  * @param options Configuration options to read from.
  * @return Shared pointer to the newly created stream pool.
  */
 std::shared_ptr<rmm::cuda_stream_pool> stream_pool_from_options(config::Options options);


 }  // namespace rapidsmpf

rapidsmpf::BufferResource
Class managing buffer resources.
Definition: buffer_resource.hpp:55

rapidsmpf::BufferResource::release
std::size_t release(MemoryReservation &reservation, std::size_t size)
Consume a portion of the reserved memory.

rapidsmpf::BufferResource::allocate
std::unique_ptr< Buffer > allocate(std::size_t size, rmm::cuda_stream_view stream, MemoryReservation &reservation)
Allocate a buffer of the specified memory type by the reservation.

rapidsmpf::BufferResource::statistics
std::shared_ptr< Statistics > statistics()
Gets a shared pointer to the statistics associated with this buffer resource.

rapidsmpf::BufferResource::host_mr
rmm::host_async_resource_ref host_mr() noexcept
Get the RMM host memory resource.

rapidsmpf::BufferResource::device_mr
rmm::device_async_resource_ref device_mr() const noexcept
Get the RMM device memory resource.

rapidsmpf::BufferResource::allocate
std::unique_ptr< Buffer > allocate(rmm::cuda_stream_view stream, MemoryReservation &&reservation)
Allocate a buffer consuming the entire reservation.

rapidsmpf::BufferResource::BufferResource
BufferResource(cuda::mr::any_resource< cuda::mr::device_accessible > device_mr, std::optional< PinnedMemoryResource > pinned_mr=PinnedMemoryResource::Disabled, std::unordered_map< MemoryType, MemoryAvailable > memory_available={}, std::optional< Duration > periodic_spill_check=std::chrono::milliseconds{1}, std::shared_ptr< rmm::cuda_stream_pool > stream_pool=std::make_shared< rmm::cuda_stream_pool >(16, rmm::cuda_stream::flags::non_blocking), std::shared_ptr< Statistics > statistics=Statistics::disabled())
Constructs a buffer resource.

rapidsmpf::BufferResource::move
std::unique_ptr< Buffer > move(std::unique_ptr< Buffer > buffer, MemoryReservation &reservation)
Move a Buffer to the memory type specified by the reservation.

rapidsmpf::BufferResource::try_pinned_mr
std::optional< any_host_device_resource > try_pinned_mr() const noexcept
Get the pinned host memory resource if available.

rapidsmpf::BufferResource::memory_reserved
std::size_t memory_reserved(MemoryType mem_type) const
Get the current reserved memory of the specified memory type.
Definition: buffer_resource.hpp:167

rapidsmpf::BufferResource::move_to_device_buffer
std::unique_ptr< rmm::device_buffer > move_to_device_buffer(std::unique_ptr< Buffer > buffer, MemoryReservation &reservation)
Move a Buffer to a device buffer.

rapidsmpf::BufferResource::reserve_device_memory_and_spill
MemoryReservation reserve_device_memory_and_spill(std::size_t size, AllowOverbooking allow_overbooking)
Reserve device memory and spill if necessary.

rapidsmpf::BufferResource::reserve_or_fail
MemoryReservation reserve_or_fail(std::size_t size, MemoryType mem_type)
Make a memory reservation or fail.
Definition: buffer_resource.hpp:260

rapidsmpf::BufferResource::reserve_or_fail
requires std::convertible_to< std::ranges::range_value_t< Range >, MemoryType > MemoryReservation reserve_or_fail(std::size_t size, Range mem_types)
Make a memory reservation or fail based on the given order of memory types.
Definition: buffer_resource.hpp:233

rapidsmpf::BufferResource::from_options
static std::shared_ptr< BufferResource > from_options(RmmResourceAdaptor mr, config::Options options)
Construct a BufferResource from configuration options.

rapidsmpf::BufferResource::memory_available
MemoryAvailable const & memory_available(MemoryType mem_type) const
Retrieves the memory availability function for a given memory type.
Definition: buffer_resource.hpp:157

rapidsmpf::BufferResource::pinned_mr
rmm::host_device_async_resource_ref pinned_mr()
Get the RMM pinned host memory resource.

rapidsmpf::BufferResource::MemoryAvailable
std::function< std::int64_t()> MemoryAvailable
Callback function to determine available memory.
Definition: buffer_resource.hpp:67

rapidsmpf::BufferResource::spill_manager
SpillManager & spill_manager()
Gets a reference to the spill manager used.

rapidsmpf::BufferResource::stream_pool
rmm::cuda_stream_pool const & stream_pool() const
Returns the CUDA stream pool used by this buffer resource.

rapidsmpf::BufferResource::move_to_host_buffer
std::unique_ptr< HostBuffer > move_to_host_buffer(std::unique_ptr< Buffer > buffer, MemoryReservation &reservation)
Move a Buffer into a host buffer.

rapidsmpf::BufferResource::reserve
std::pair< MemoryReservation, std::size_t > reserve(MemoryType mem_type, std::size_t size, AllowOverbooking allow_overbooking)
Reserve an amount of the specified memory type.

rapidsmpf::BufferResource::move
std::unique_ptr< Buffer > move(std::unique_ptr< rmm::device_buffer > data, rmm::cuda_stream_view stream)
Move device buffer data into a Buffer.

rapidsmpf::HostMemoryResource
Host memory resource using standard CPU allocation.
Definition: host_memory_resource.hpp:32

rapidsmpf::LimitAvailableMemory
A functor for querying the remaining available memory within a defined limit from an RMM statistics resource.
Definition: buffer_resource.hpp:433

rapidsmpf::LimitAvailableMemory::operator()
std::int64_t operator()() const
Returns the remaining available memory within the defined limit.
Definition: buffer_resource.hpp:454

rapidsmpf::LimitAvailableMemory::limit
std::int64_t const limit
The memory limit.
Definition: buffer_resource.hpp:459

rapidsmpf::LimitAvailableMemory::LimitAvailableMemory
LimitAvailableMemory(RmmResourceAdaptor mr, std::int64_t limit)
Constructs a LimitAvailableMemory instance.
Definition: buffer_resource.hpp:442

rapidsmpf::MemoryReservation
Represents a reservation for future memory allocation.
Definition: memory_reservation.hpp:23

rapidsmpf::PinnedMemoryResource::Disabled
static constexpr std::nullopt_t Disabled
Sentinel value indicating that pinned host memory is disabled.
Definition: pinned_memory_resource.hpp:101

rapidsmpf::RmmResourceAdaptor
A RMM memory resource adaptor tailored to RapidsMPF.
Definition: rmm_resource_adaptor.hpp:33

rapidsmpf::RmmResourceAdaptor::current_allocated
std::int64_t current_allocated() const noexcept
Get the total current allocated memory from both primary and fallback.

rapidsmpf::SpillManager
Manages memory spilling to free up device memory when needed.
Definition: spill_manager.hpp:25

rapidsmpf::Statistics::disabled
static std::shared_ptr< Statistics > disabled()
Returns a shared pointer to a disabled (no-op) Statistics instance.

rapidsmpf::config::Options
Manages configuration options for RapidsMPF operations.
Definition: config.hpp:140

rmm::cuda_stream_pool

rmm::cuda_stream_view

rmm::cuda_stream::flags::non_blocking
@ non_blocking

cuda_stream_pool.hpp

host_async_resource_ref
cuda::mr::resource_ref< cuda::mr::host_accessible > host_async_resource_ref

device_async_resource_ref
cuda::mr::resource_ref< cuda::mr::device_accessible > device_async_resource_ref

host_device_async_resource_ref
cuda::mr::resource_ref< cuda::mr::host_accessible, cuda::mr::device_accessible > host_device_async_resource_ref

rapidsmpf
RAPIDS Multi-Processor interfaces.
Definition: backend.hpp:14

rapidsmpf::periodic_spill_check_from_options
std::optional< Duration > periodic_spill_check_from_options(config::Options options)
Get the periodic_spill_check parameter from configuration options.

rapidsmpf::AllowOverbooking
AllowOverbooking
Policy controlling whether a memory reservation is allowed to overbook.
Definition: buffer_resource.hpp:40

rapidsmpf::AllowOverbooking::YES
@ YES
Overbooking is allowed.

rapidsmpf::AllowOverbooking::NO
@ NO
Overbooking is not allowed.

rapidsmpf::MEMORY_TYPES
constexpr std::array< MemoryType, 3 > MEMORY_TYPES
All memory types sorted in decreasing order of preference.
Definition: memory_type.hpp:23

rapidsmpf::MemoryType
MemoryType
Enum representing the type of memory sorted in decreasing order of preference.
Definition: memory_type.hpp:16

rapidsmpf::MemoryType::PINNED_HOST
@ PINNED_HOST
Pinned host memory.

rapidsmpf::any_host_device_resource
cuda::mr::any_resource< cuda::mr::host_accessible, cuda::mr::device_accessible > any_host_device_resource
Owning type-erased host- and device-accessible memory resource.
Definition: resource_types.hpp:17

rapidsmpf::memory_available_from_options
std::unordered_map< MemoryType, BufferResource::MemoryAvailable > memory_available_from_options(RmmResourceAdaptor mr, config::Options options)
Construct a map of memory-available functions from configuration options.

rapidsmpf::stream_pool_from_options
std::shared_ptr< rmm::cuda_stream_pool > stream_pool_from_options(config::Options options)
Get a new CUDA stream pool from configuration options.

rmm