9 #include <initializer_list>
18 #include <string_view>
22 #include <rapidsmpf/config.hpp>
23 #include <rapidsmpf/memory/memory_type.hpp>
24 #include <rapidsmpf/memory/pinned_memory_resource.hpp>
25 #include <rapidsmpf/rmm_resource_adaptor.hpp>
26 #include <rapidsmpf/utils/misc.hpp>
30 class StreamOrderedTiming;
171 return enabled_.load(std::memory_order_acquire);
178 enabled_.store(
true, std::memory_order_release);
185 enabled_.store(
false, std::memory_order_release);
206 std::string
report(std::string
const& header =
"Statistics:")
const;
228 void write_json(std::filesystem::path
const& filepath)
const;
237 [[nodiscard]] std::shared_ptr<Statistics>
copy()
const;
246 [[nodiscard]] std::vector<std::uint8_t>
serialize()
const;
258 std::span<std::uint8_t const> data
282 [[nodiscard]]
static std::shared_ptr<Statistics>
merge(
283 std::span<std::shared_ptr<Statistics>
const> stats
329 [[nodiscard]] std::size_t
count() const noexcept;
336 [[nodiscard]]
double value() const noexcept;
344 [[nodiscard]]
double max() const noexcept;
355 return sizeof(std::uint64_t) +
sizeof(
double) +
sizeof(double);
376 [[nodiscard]]
static std::pair<Stat, std::span<std::uint8_t const>>
deserialize(
377 std::span<std::uint8_t const> data
391 std::size_t count_{0};
393 double max_{-std::numeric_limits<double>::infinity()};
414 void add_stat(std::string
const& name,
double value);
433 std::string
const& report_entry_name,
434 std::initializer_list<std::string_view> stat_names,
446 std::string
const& report_entry_name,
447 std::vector<std::string> stat_names,
586 std::optional<RmmResourceAdaptor> mr_;
612 std::vector<std::string> stat_names;
616 mutable std::mutex mutex_;
617 std::atomic<bool> enabled_;
618 std::map<std::string, Stat> stats_;
619 std::map<std::string, ReportEntry> report_entries_;
620 std::unordered_map<std::string, MemoryRecord> memory_records_;
621 std::optional<RmmResourceAdaptor> mr_;
622 std::shared_ptr<PinnedMemoryResource>
649 #define RAPIDSMPF_MEMORY_PROFILE(...) \
650 RAPIDSMPF_OVERLOAD_BY_ARG_COUNT( \
651 __VA_ARGS__, RAPIDSMPF_MEMORY_PROFILE_2, RAPIDSMPF_MEMORY_PROFILE_1 \
656 #define RAPIDSMPF_MEMORY_PROFILE_1(stats) RAPIDSMPF_MEMORY_PROFILE_2(stats, __func__)
659 #define RAPIDSMPF_MEMORY_PROFILE_2(stats, funcname) \
660 auto&& RAPIDSMPF_CONCAT(_rapidsmpf_stats_, __LINE__) = (stats); \
661 auto const RAPIDSMPF_CONCAT(_rapidsmpf_memory_recorder_, __LINE__) = \
662 ((rapidsmpf::detail::to_pointer(RAPIDSMPF_CONCAT(_rapidsmpf_stats_, __LINE__)) \
663 && rapidsmpf::detail::to_pointer( \
664 RAPIDSMPF_CONCAT(_rapidsmpf_stats_, __LINE__) \
665 ) -> is_memory_profiling_enabled()) \
666 ? rapidsmpf::detail::to_pointer( \
667 RAPIDSMPF_CONCAT(_rapidsmpf_stats_, __LINE__) \
669 ->create_memory_recorder( \
670 std::string(__FILE__) + ":" + RAPIDSMPF_STRINGIFY(__LINE__) + "(" \
671 + std::string(funcname) + ")" \
673 : rapidsmpf::Statistics::MemoryRecorder{})
static constexpr auto Disabled
Sentinel value used to disable pinned host memory.
A RMM memory resource adaptor tailored to RapidsMPF.
RAII-style object for scoped memory usage tracking.
MemoryRecorder(MemoryRecorder const &)=delete
Deleted copy and move constructors/assignments.
~MemoryRecorder()
Destructor.
MemoryRecorder()=default
Constructs a no-op MemoryRecorder (disabled state).
MemoryRecorder(Statistics *stats, RmmResourceAdaptor mr, std::string name)
Constructs an active MemoryRecorder.
Represents a single tracked statistic.
void add(double value)
Adds a value to this statistic.
std::size_t count() const noexcept
Returns the number of updates applied to this statistic.
double max() const noexcept
Returns the maximum value seen across all add() calls.
std::uint8_t * serialize(std::uint8_t *out) const
Serializes this Stat to a byte buffer.
Stat merge(Stat const &other) const
Merges another Stat into this one, returning the combined result.
Stat(std::size_t count, double value, double max)
Constructs a Stat with explicit field values.
double value() const noexcept
Returns the total accumulated value.
auto operator<=>(Stat const &) const noexcept=default
Three-way comparison operator.
static std::pair< Stat, std::span< std::uint8_t const > > deserialize(std::span< std::uint8_t const > data)
Deserializes a Stat from a byte buffer.
Stat()=default
Default-constructs a Stat.
static constexpr std::size_t serialized_size() noexcept
Returns the serialized size of this Stat in bytes.
Tracks statistics across rapidsmpf operations.
std::string report(std::string const &header="Statistics:") const
Generates a formatted report of all collected statistics.
Formatter
Identifies a predefined formatter used by report().
@ _Count
Sentinel; must remain last.
bool is_memory_profiling_enabled() const
Checks whether memory profiling is enabled.
Stat get_stat(std::string const &name) const
Retrieves a statistic by name.
static std::shared_ptr< Statistics > from_options(RmmResourceAdaptor mr, config::Options options, std::shared_ptr< PinnedMemoryResource > pinned_mr=PinnedMemoryResource::Disabled)
Construct from configuration options.
void clear()
Clears all statistics.
MemoryRecorder create_memory_recorder(std::string name)
Creates a scoped memory recorder for the given name.
static std::shared_ptr< Statistics > disabled()
Returns a shared pointer to a disabled (no-op) Statistics instance.
void write_json(std::ostream &os) const
Writes a JSON representation of all collected statistics to a stream.
std::shared_ptr< Statistics > copy() const
Creates a deep copy of this Statistics object.
void add_bytes_stat(std::string const &name, std::size_t nbytes)
Adds a byte count to the named statistic.
void enable() noexcept
Enable statistics tracking for this instance.
void record_alloc(MemoryType mem_type, std::size_t nbytes, StreamOrderedTiming &&timing)
Record size and wall-clock duration for a buffer allocation.
void add_duration_stat(std::string const &name, Duration seconds)
Adds a duration to the named statistic.
void add_report_entry(std::string const &report_entry_name, std::vector< std::string > stat_names, Formatter formatter)
Associate a formatter with one or more named statistics for report rendering.
std::vector< std::string > list_stat_names() const
Get the names of all statistics.
Statistics(bool enabled=true)
Constructs a Statistics object without memory profiling.
void add_stat(std::string const &name, double value)
Adds a numeric value to the named statistic.
static std::shared_ptr< Statistics > merge(std::span< std::shared_ptr< Statistics > const > stats)
Merge a set of Statistics into a new instance.
std::vector< std::uint8_t > serialize() const
Serializes the stats and report entries to a binary byte vector.
void record_copy(MemoryType src, MemoryType dst, std::size_t nbytes, StreamOrderedTiming &&timing)
Record byte count and wall-clock duration for a memory copy operation.
bool enabled() const noexcept
Checks if statistics tracking is enabled.
void write_json(std::filesystem::path const &filepath) const
Writes a JSON report of all collected statistics to a file.
static std::shared_ptr< Statistics > deserialize(std::span< std::uint8_t const > data)
Deserializes a Statistics object from a binary byte vector.
void disable() noexcept
Disable statistics tracking for this instance.
Statistics(RmmResourceAdaptor mr, std::shared_ptr< PinnedMemoryResource > pinned_mr=PinnedMemoryResource::Disabled)
Constructs a Statistics object with memory profiling enabled.
void add_report_entry(std::string const &report_entry_name, std::initializer_list< std::string_view > stat_names, Formatter formatter)
Associate a formatter with one or more named statistics for report rendering.
std::unordered_map< std::string, MemoryRecord > const & get_memory_records() const
Retrieves all memory profiling records stored by this instance.
Stream-ordered wall-clock timer that records its result into Statistics.
Manages configuration options for RapidsMPF operations.
RAPIDS Multi-Processor interfaces.
std::chrono::duration< double > Duration
Alias for a duration type representing time in seconds as a double.
MemoryType
Enum representing the type of memory sorted in decreasing order of preference.
Memory statistics for a specific scope.
Holds memory profiling information for a named scope.
std::int64_t global_peak
Peak global memory usage during the scope.
ScopedMemoryRecord scoped
Scoped memory stats.
std::uint64_t num_calls
Number of times the scope was invoked.