librmm/25.04/limiting__resource__adaptor_8hpp_source

 /*

  * Copyright (c) 2021-2025, NVIDIA CORPORATION.

  *

  * Licensed under the Apache License, Version 2.0 (the "License");

  * you may not use this file except in compliance with the License.

  * You may obtain a copy of the License at

  *

  *     http://www.apache.org/licenses/LICENSE-2.0

  *

  * Unless required by applicable law or agreed to in writing, software

  * distributed under the License is distributed on an "AS IS" BASIS,

  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

  * See the License for the specific language governing permissions and

  * limitations under the License.

  */

 #pragma once


 #include <rmm/aligned.hpp>
 #include <rmm/detail/error.hpp>
 #include <rmm/detail/export.hpp>
 #include <rmm/detail/format.hpp>
 #include <rmm/mr/device/device_memory_resource.hpp>
 #include <rmm/mr/device/per_device_resource.hpp>
 #include <rmm/resource_ref.hpp>

 #include <atomic>
 #include <cstddef>
 #include <string>


 namespace RMM_NAMESPACE {

 namespace mr {

 /**
  * @brief Resource that uses `Upstream` to allocate memory and limits the total
  * number of bytes that may be outstanding at any one time.
  *
  * Every request is rounded up to a multiple of the configured alignment for
  * accounting purposes; the upstream resource still receives the caller's
  * original byte count. When a request would push the accounted total above the
  * limit, `rmm::out_of_memory` is raised and nothing is forwarded upstream.
  *
  * The running total is held in a `std::atomic` counter.
  *
  * @tparam Upstream Type of the upstream resource used for allocation/deallocation.
  */
 template <typename Upstream>
 class limiting_resource_adaptor final : public device_memory_resource {
  public:
   /**
    * @brief Construct a limiting adaptor on top of an upstream resource reference.
    *
    * @param upstream The resource used for allocating/deallocating device memory.
    * @param allocation_limit Maximum number of (alignment-rounded) bytes that may be
    * allocated through this adaptor at once.
    * @param alignment Granularity used when accounting for each allocation. It is
    * passed to `align_up`, which expects a power of 2.
    */
   limiting_resource_adaptor(device_async_resource_ref upstream,
                             std::size_t allocation_limit,
                             std::size_t alignment = CUDA_ALLOCATION_ALIGNMENT)
     : upstream_{upstream},
       allocation_limit_{allocation_limit},
       allocated_bytes_(0),
       alignment_(alignment)
   {
   }

   /**
    * @brief Construct a limiting adaptor on top of an upstream resource pointer.
    *
    * The pointer is converted with `to_device_async_resource_ref_checked`, which
    * checks it for `nullptr`.
    *
    * @param upstream The resource used for allocating/deallocating device memory.
    * @param allocation_limit Maximum number of (alignment-rounded) bytes that may be
    * allocated through this adaptor at once.
    * @param alignment Granularity used when accounting for each allocation. It is
    * passed to `align_up`, which expects a power of 2.
    */
   limiting_resource_adaptor(Upstream* upstream,
                             std::size_t allocation_limit,
                             std::size_t alignment = CUDA_ALLOCATION_ALIGNMENT)
     : upstream_{to_device_async_resource_ref_checked(upstream)},
       allocation_limit_{allocation_limit},
       allocated_bytes_(0),
       alignment_(alignment)
   {
   }

   limiting_resource_adaptor()                                 = delete;
   ~limiting_resource_adaptor() override                       = default;
   limiting_resource_adaptor(limiting_resource_adaptor const&) = delete;
   // NOTE(review): `allocated_bytes_` is a std::atomic, which is neither copyable
   // nor movable, so the two defaulted move operations below are presumably
   // defined as deleted by the compiler -- confirm whether movability is intended.
   limiting_resource_adaptor(limiting_resource_adaptor&&) noexcept = default;
   limiting_resource_adaptor& operator=(limiting_resource_adaptor const&) = delete;
   limiting_resource_adaptor& operator=(limiting_resource_adaptor&&) noexcept = default;

   /**
    * @brief Returns the reference to the upstream resource.
    *
    * @return The `device_async_resource_ref` this adaptor forwards requests to.
    */
   [[nodiscard]] device_async_resource_ref get_upstream_resource() const noexcept
   {
     return upstream_;
   }

   /**
    * @brief Query the number of bytes currently accounted as allocated.
    *
    * The value is the sum of the alignment-rounded sizes of outstanding
    * allocations. It may briefly include a reservation made by an in-flight
    * `do_allocate` call that is subsequently rolled back.
    *
    * @return Current value of the allocation counter, in bytes.
    */
   [[nodiscard]] std::size_t get_allocated_bytes() const { return allocated_bytes_; }

   /**
    * @brief Query the maximum number of bytes this adaptor is allowed to allocate.
    *
    * @return The limit supplied at construction, in bytes.
    */
   [[nodiscard]] std::size_t get_allocation_limit() const { return allocation_limit_; }

  private:
   /**
    * @brief Allocate `bytes` from the upstream resource if the limit permits it.
    *
    * The alignment-rounded size is added to the counter first, and the
    * reservation is undone if the limit would be exceeded or the upstream
    * allocation throws.
    *
    * @throws rmm::out_of_memory if the rounded request does not fit below the limit.
    * Any exception thrown by the upstream resource is propagated unchanged.
    *
    * @param bytes The size, in bytes, of the allocation.
    * @param stream Stream on which to perform the allocation.
    * @return Pointer to the newly allocated memory.
    */
   void* do_allocate(std::size_t bytes, cuda_stream_view stream) override
   {
     auto const proposed_size = align_up(bytes, alignment_);

     // Rounding up can only grow the value, so a smaller result means the
     // unsigned arithmetic inside align_up wrapped around. Such a request can
     // never fit and must not be allowed to slip past the limit check.
     bool const rounding_wrapped = proposed_size < bytes;

     if (!rounding_wrapped) {
       auto const old = allocated_bytes_.fetch_add(proposed_size);

       // Compare by subtraction rather than `old + proposed_size` so the check
       // cannot overflow and wrongly accept an over-limit request.
       bool const fits = (old <= allocation_limit_) && (proposed_size <= allocation_limit_ - old);
       if (fits) {
         try {
           return get_upstream_resource().allocate_async(bytes, stream);
         } catch (...) {
           // Upstream failed: release the reservation before propagating.
           allocated_bytes_ -= proposed_size;
           throw;
         }
       }

       // Over the limit: release the reservation taken by fetch_add above.
       allocated_bytes_ -= proposed_size;
     }

     auto const msg = std::string("Exceeded memory limit (failed to allocate ") +
                      rmm::detail::format_bytes(bytes) + ")";
     RMM_FAIL(msg.c_str(), rmm::out_of_memory);
   }

   /**
    * @brief Return memory to the upstream resource and release its accounted size.
    *
    * @param ptr Pointer to be deallocated.
    * @param bytes Size of the allocation, in bytes; the same rounding as in
    * `do_allocate` is applied to compute the amount to subtract.
    * @param stream Stream on which to perform the deallocation.
    */
   void do_deallocate(void* ptr, std::size_t bytes, cuda_stream_view stream) override
   {
     std::size_t allocated_size = align_up(bytes, alignment_);
     get_upstream_resource().deallocate_async(ptr, bytes, stream);
     // The counter is decreased only after the upstream call has returned.
     allocated_bytes_ -= allocated_size;
   }

   /**
    * @brief Compare this resource to another.
    *
    * @param other The other resource to compare to.
    * @return true if `other` is this object, or is a `limiting_resource_adaptor`
    * of the same `Upstream` type whose upstream reference compares equal.
    */
   [[nodiscard]] bool do_is_equal(device_memory_resource const& other) const noexcept override
   {
     if (this == &other) { return true; }
     auto const* cast = dynamic_cast<limiting_resource_adaptor<Upstream> const*>(&other);
     if (cast == nullptr) { return false; }
     return get_upstream_resource() == cast->get_upstream_resource();
   }

   // The upstream resource used for satisfying allocation requests
   device_async_resource_ref upstream_;

   // Maximum number of bytes this allocator is allowed to allocate.
   std::size_t allocation_limit_;

   // Number of currently-allocated bytes (sum of alignment-rounded sizes).
   std::atomic<std::size_t> allocated_bytes_;

   // Accounting granularity for each allocation.
   // TODO: there should be some way to ask the upstream for this instead.
   std::size_t alignment_;
 };

   // end of group

 }  // namespace mr

 }  // namespace RMM_NAMESPACE

aligned.hpp

rmm::cuda_stream_view
Strongly-typed non-owning wrapper for CUDA streams with default constructor.
Definition: cuda_stream_view.hpp:39

rmm::mr::device_memory_resource
Base class for all librmm device memory allocation.
Definition: device_memory_resource.hpp:93

rmm::mr::limiting_resource_adaptor
Resource that uses Upstream to allocate memory and limits the total allocations possible.
Definition: limiting_resource_adaptor.hpp:49

rmm::mr::limiting_resource_adaptor::limiting_resource_adaptor
limiting_resource_adaptor(device_async_resource_ref upstream, std::size_t allocation_limit, std::size_t alignment=CUDA_ALLOCATION_ALIGNMENT)
Construct a new limiting resource adaptor using upstream to satisfy allocation requests and limiting ...
Definition: limiting_resource_adaptor.hpp:59

rmm::mr::limiting_resource_adaptor::limiting_resource_adaptor
limiting_resource_adaptor(limiting_resource_adaptor &&) noexcept=default
Default move constructor.

rmm::mr::limiting_resource_adaptor::get_allocated_bytes
std::size_t get_allocated_bytes() const
Query the number of bytes that have been allocated. Note that this can not be used to know how large ...
Definition: limiting_resource_adaptor.hpp:115

rmm::mr::limiting_resource_adaptor::get_allocation_limit
std::size_t get_allocation_limit() const
Query the maximum number of bytes that this allocator is allowed to allocate. This is the limit on th...
Definition: limiting_resource_adaptor.hpp:124

rmm::mr::limiting_resource_adaptor::limiting_resource_adaptor
limiting_resource_adaptor(Upstream *upstream, std::size_t allocation_limit, std::size_t alignment=CUDA_ALLOCATION_ALIGNMENT)
Construct a new limiting resource adaptor using upstream to satisfy allocation requests and limiting ...
Definition: limiting_resource_adaptor.hpp:79

rmm::out_of_memory
Exception thrown when RMM runs out of memory.
Definition: error.hpp:87

device_memory_resource.hpp

rmm::device_async_resource_ref
cuda::mr::async_resource_ref< cuda::mr::device_accessible > device_async_resource_ref
Alias for a cuda::mr::async_resource_ref with the property cuda::mr::device_accessible.
Definition: resource_ref.hpp:41

rmm::to_device_async_resource_ref_checked
device_async_resource_ref to_device_async_resource_ref_checked(Resource *res)
Convert pointer to memory resource into device_async_resource_ref, checking for nullptr
Definition: resource_ref.hpp:79

rmm::CUDA_ALLOCATION_ALIGNMENT
static constexpr std::size_t CUDA_ALLOCATION_ALIGNMENT
Default alignment used for CUDA memory allocation.
Definition: aligned.hpp:43

rmm::align_up
constexpr std::size_t align_up(std::size_t value, std::size_t alignment) noexcept
Align up to nearest multiple of specified power of 2.
Definition: aligned.hpp:77

per_device_resource.hpp
Management of per-device device_memory_resources.

resource_ref.hpp