librmm/25.12/binning__memory__resource_8hpp_source

 /*

  * SPDX-FileCopyrightText: Copyright (c) 2020-2025, NVIDIA CORPORATION.

  * SPDX-License-Identifier: Apache-2.0

  */

 #pragma once


 #include <rmm/aligned.hpp>
 #include <rmm/detail/export.hpp>
 #include <rmm/mr/device_memory_resource.hpp>
 #include <rmm/mr/fixed_size_memory_resource.hpp>
 #include <rmm/resource_ref.hpp>

 #include <cuda_runtime_api.h>

 #include <cassert>
 #include <cstddef>
 #include <cstdint>
 #include <limits>
 #include <map>
 #include <memory>
 #include <optional>
 #include <vector>


 namespace RMM_NAMESPACE {

 namespace mr {

 /**
  * @brief Allocates memory from upstream resources associated with bin sizes.
  *
  * Bins are kept in a map ordered by their (aligned) allocation size. A request is served by the
  * bin with the smallest size that is greater than or equal to the requested size; a request
  * larger than every bin is forwarded to the upstream resource.
  *
  * @tparam Upstream Type of the upstream resource. It is also the template argument of the
  * `fixed_size_memory_resource` bins this class creates for itself.
  */
 template <typename Upstream>
 class binning_memory_resource final : public device_memory_resource {
  public:
   /**
    * @brief Construct a binning memory resource with no bins.
    *
    * Until bins are added with `add_bin`, every allocation goes to the upstream resource.
    *
    * @param upstream_resource Resource used for requests larger than every bin, and as the upstream
    * of the bins created by `add_bin`.
    */
   explicit binning_memory_resource(device_async_resource_ref upstream_resource)
     : upstream_mr_{upstream_resource}
   {
   }

   /**
    * @brief Construct a binning memory resource with no bins.
    *
    * @param upstream_resource Pointer to the upstream resource; it is converted with
    * `to_device_async_resource_ref_checked`, which checks for nullptr.
    */
   explicit binning_memory_resource(Upstream* upstream_resource)
     : upstream_mr_{to_device_async_resource_ref_checked(upstream_resource)}
   {
   }

   /**
    * @brief Construct a binning memory resource with a range of initial power-of-two bins.
    *
    * One owned bin of size `2^e` is added for every `e` in
    * `[min_size_exponent, max_size_exponent]`. Nothing is added if the range is empty.
    *
    * @param upstream_resource Resource used for requests larger than every bin, and as the upstream
    * of the created bins.
    * @param min_size_exponent Base-2 exponent of the smallest bin size. Must be non-negative.
    * @param max_size_exponent Base-2 exponent of the largest bin size. Must be smaller than the
    * number of bits in `std::size_t`.
    */
   binning_memory_resource(device_async_resource_ref upstream_resource,
                           int8_t min_size_exponent,  // NOLINT(bugprone-easily-swappable-parameters)
                           int8_t max_size_exponent)
     : upstream_mr_{upstream_resource}
   {
     add_power_of_two_bins(min_size_exponent, max_size_exponent);
   }

   /**
    * @brief Construct a binning memory resource with a range of initial power-of-two bins.
    *
    * One owned bin of size `2^e` is added for every `e` in
    * `[min_size_exponent, max_size_exponent]`. Nothing is added if the range is empty.
    *
    * @param upstream_resource Pointer to the upstream resource; it is converted with
    * `to_device_async_resource_ref_checked`, which checks for nullptr.
    * @param min_size_exponent Base-2 exponent of the smallest bin size. Must be non-negative.
    * @param max_size_exponent Base-2 exponent of the largest bin size. Must be smaller than the
    * number of bits in `std::size_t`.
    */
   binning_memory_resource(Upstream* upstream_resource,
                           int8_t min_size_exponent,  // NOLINT(bugprone-easily-swappable-parameters)
                           int8_t max_size_exponent)
     : upstream_mr_{to_device_async_resource_ref_checked(upstream_resource)}
   {
     add_power_of_two_bins(min_size_exponent, max_size_exponent);
   }

   /**
    * @brief Destroy the binning_memory_resource, including every bin resource it owns.
    */
   ~binning_memory_resource() override = default;

   binning_memory_resource()                                          = delete;
   binning_memory_resource(binning_memory_resource const&)            = delete;
   binning_memory_resource(binning_memory_resource&&)                 = delete;
   binning_memory_resource& operator=(binning_memory_resource const&) = delete;
   binning_memory_resource& operator=(binning_memory_resource&&)      = delete;

   /**
    * @brief Get a reference to the upstream resource.
    *
    * @return device_async_resource_ref to the upstream resource
    */
   [[nodiscard]] device_async_resource_ref get_upstream_resource() const noexcept
   {
     return upstream_mr_;
   }

   /**
    * @brief Add a bin allocator to this resource.
    *
    * `allocation_size` is first rounded up to a multiple of `CUDA_ALLOCATION_ALIGNMENT`. If
    * `bin_resource` is provided it is registered for that size; otherwise a
    * `fixed_size_memory_resource<Upstream>` owned by this object is created on top of the upstream
    * resource. In both cases an already existing bin of the same (aligned) size is left unchanged.
    *
    * NOTE(review): no synchronization is visible here, so this presumably must not be called
    * concurrently with allocation or deallocation -- confirm. A caller-supplied `bin_resource` is
    * stored as a reference type, so presumably the caller must keep it alive -- confirm.
    *
    * @param allocation_size The maximum size that this bin allocates
    * @param bin_resource Optional resource to use for the bin
    */
   void add_bin(std::size_t allocation_size,
                std::optional<device_async_resource_ref> bin_resource = std::nullopt)
   {
     allocation_size = align_up(allocation_size, CUDA_ALLOCATION_ALIGNMENT);

     if (bin_resource.has_value()) {
       // std::map::insert keeps the existing entry when the key is already present.
       resource_bins_.insert({allocation_size, bin_resource.value()});
       return;
     }

     // Do nothing if a bin of this size already exists.
     if (resource_bins_.count(allocation_size) != 0) { return; }

     owned_bin_resources_.push_back(
       std::make_unique<fixed_size_memory_resource<Upstream>>(upstream_mr_, allocation_size));
     resource_bins_.insert({allocation_size, owned_bin_resources_.back().get()});
   }

  private:
   /**
    * @brief Compute `2^exponent` as a `std::size_t`.
    *
    * The shift is done on `std::size_t` rather than `int`, so exponents of 31 and above do not
    * overflow a 32-bit `int`.
    *
    * @param exponent Base-2 exponent; must be in `[0, number of bits in std::size_t)`.
    * @return The bin size in bytes
    */
   static std::size_t bin_size_from_exponent(int exponent) noexcept
   {
     assert(exponent >= 0 && exponent < std::numeric_limits<std::size_t>::digits);
     return std::size_t{1} << exponent;
   }

   /**
    * @brief Add one owned bin of size `2^e` for each `e` in `[min_size_exponent, max_size_exponent]`.
    *
    * The counter is an `int` so that incrementing past the largest `int8_t` value cannot wrap
    * around and loop forever.
    *
    * @param min_size_exponent Base-2 exponent of the smallest bin size
    * @param max_size_exponent Base-2 exponent of the largest bin size
    */
   void add_power_of_two_bins(int min_size_exponent, int max_size_exponent)
   {
     for (int exponent = min_size_exponent; exponent <= max_size_exponent; ++exponent) {
       add_bin(bin_size_from_exponent(exponent));
     }
   }

   /**
    * @brief Select the resource that serves an allocation of `bytes` bytes.
    *
    * @param bytes Requested allocation size in bytes
    * @return The bin with the smallest size not less than `bytes`, or the upstream resource when no
    * bin is large enough
    */
   device_async_resource_ref get_resource_ref(std::size_t bytes)
   {
     auto const bin = resource_bins_.lower_bound(bytes);
     if (bin == resource_bins_.cend()) { return get_upstream_resource(); }
     return bin->second;
   }

   /**
    * @brief Allocate at least `bytes` bytes from the matching bin or from upstream.
    *
    * @param bytes The size in bytes of the allocation
    * @param stream Stream on which to perform the allocation
    * @return Pointer to the allocated memory, or nullptr when `bytes` is zero
    */
   void* do_allocate(std::size_t bytes, cuda_stream_view stream) override
   {
     if (bytes == 0) { return nullptr; }
     return get_resource_ref(bytes).allocate(stream, bytes);
   }

   /**
    * @brief Return memory to the resource selected for `bytes`.
    *
    * `bytes` must match the size passed at allocation, because it is what selects the bin.
    *
    * @param ptr Pointer to be deallocated; a nullptr is ignored
    * @param bytes The size in bytes of the allocation
    * @param stream Stream on which to perform the deallocation
    */
   void do_deallocate(void* ptr, std::size_t bytes, cuda_stream_view stream) noexcept override
   {
     // do_allocate hands out nullptr for zero-byte requests without touching any bin, so a
     // nullptr must not be forwarded to a bin either.
     if (ptr == nullptr) { return; }
     get_resource_ref(bytes).deallocate(stream, ptr, bytes);
   }

   // The upstream memory_resource from which to allocate blocks.
   device_async_resource_ref upstream_mr_;

   // Bin resources created by add_bin; kept here so they live as long as this object.
   std::vector<std::unique_ptr<fixed_size_memory_resource<Upstream>>> owned_bin_resources_;

   // All bins (owned and caller-supplied), ordered by aligned allocation size.
   std::map<std::size_t, device_async_resource_ref> resource_bins_;
 };

   // end of group

 }  // namespace mr

 }  // namespace RMM_NAMESPACE

aligned.hpp

rmm::cuda_stream_view
Strongly-typed non-owning wrapper for CUDA streams with default constructor.
Definition: cuda_stream_view.hpp:28

rmm::mr::binning_memory_resource
Allocates memory from upstream resources associated with bin sizes.
Definition: binning_memory_resource.hpp:36

rmm::mr::binning_memory_resource::binning_memory_resource
binning_memory_resource(Upstream *upstream_resource)
Construct a new binning memory resource object.
Definition: binning_memory_resource.hpp:61

rmm::mr::binning_memory_resource::get_upstream_resource
device_async_resource_ref get_upstream_resource() const noexcept
Returns a device_async_resource_ref to the upstream resource.
Definition: binning_memory_resource.hpp:127

rmm::mr::binning_memory_resource::binning_memory_resource
binning_memory_resource(device_async_resource_ref upstream_resource, int8_t min_size_exponent, int8_t max_size_exponent)
Construct a new binning memory resource object with a range of initial bins.
Definition: binning_memory_resource.hpp:78

rmm::mr::binning_memory_resource::~binning_memory_resource
~binning_memory_resource() override=default
Destroy the binning_memory_resource and free all memory allocated from the upstream resource.

rmm::mr::binning_memory_resource::binning_memory_resource
binning_memory_resource(Upstream *upstream_resource, int8_t min_size_exponent, int8_t max_size_exponent)
Construct a new binning memory resource object with a range of initial bins.
Definition: binning_memory_resource.hpp:102

rmm::mr::binning_memory_resource::binning_memory_resource
binning_memory_resource(device_async_resource_ref upstream_resource)
Construct a new binning memory resource object.
Definition: binning_memory_resource.hpp:46

rmm::mr::binning_memory_resource::add_bin
void add_bin(std::size_t allocation_size, std::optional< device_async_resource_ref > bin_resource=std::nullopt)
Add a bin allocator to this resource.
Definition: binning_memory_resource.hpp:147

rmm::mr::device_memory_resource
Base class for all librmm device memory allocation.
Definition: device_memory_resource.hpp:83

rmm::mr::fixed_size_memory_resource
A device_memory_resource which allocates memory blocks of a single fixed size.
Definition: fixed_size_memory_resource.hpp:42

device_memory_resource.hpp

fixed_size_memory_resource.hpp

rmm::to_device_async_resource_ref_checked
device_async_resource_ref to_device_async_resource_ref_checked(Resource *res)
Convert pointer to memory resource into device_async_resource_ref, checking for nullptr
Definition: resource_ref.hpp:72

rmm::device_async_resource_ref
detail::cccl_async_resource_ref< cuda::mr::resource_ref< cuda::mr::device_accessible > > device_async_resource_ref
Alias for a cuda::mr::async_resource_ref with the property cuda::mr::device_accessible.
Definition: resource_ref.hpp:32

rmm::CUDA_ALLOCATION_ALIGNMENT
static constexpr std::size_t CUDA_ALLOCATION_ALIGNMENT
Default alignment used for CUDA memory allocation.
Definition: aligned.hpp:33

rmm::align_up
std::size_t align_up(std::size_t value, std::size_t alignment) noexcept
Align up to nearest multiple of specified power of 2.

resource_ref.hpp