key_remapping.hpp
Go to the documentation of this file.
1 /*
2  * SPDX-FileCopyrightText: Copyright (c) 2026, NVIDIA CORPORATION.
3  * SPDX-License-Identifier: Apache-2.0
4  */
5 
6 #pragma once
7 
8 #include <cudf/column/column.hpp>
10 #include <cudf/types.hpp>
12 #include <cudf/utilities/export.hpp>
14 
15 #include <rmm/cuda_stream_view.hpp>
16 
17 #include <memory>
18 
19 namespace CUDF_EXPORT cudf {
20 
30 enum class compute_metrics : bool { NO = false, YES = true };
31 
32 namespace detail {
36 class key_remapping_impl;
37 } // namespace detail
38 
47 
56 
70  public:
71  key_remapping() = delete;
72  ~key_remapping();
73  key_remapping(key_remapping const&) = delete;
74  key_remapping(key_remapping&&) = delete;
75  key_remapping& operator=(key_remapping const&) = delete;
76  key_remapping& operator=(key_remapping&&) = delete;
77 
94  null_equality compare_nulls = null_equality::EQUAL,
95  cudf::compute_metrics metrics = cudf::compute_metrics::YES,
97 
113  [[nodiscard]] std::unique_ptr<cudf::column> remap_build_keys(
116 
134  [[nodiscard]] std::unique_ptr<cudf::column> remap_probe_keys(
135  cudf::table_view const& keys,
138 
144  [[nodiscard]] bool has_metrics() const;
145 
153  [[nodiscard]] size_type get_distinct_count() const;
154 
162  [[nodiscard]] size_type get_max_duplicate_count() const;
163 
164  private:
165  using impl_type = cudf::detail::key_remapping_impl;
166 
167  std::unique_ptr<impl_type> _impl;
168 };
169  // end of group
171 
172 } // namespace CUDF_EXPORT cudf
Remaps keys to unique integer IDs.
std::unique_ptr< cudf::column > remap_probe_keys(cudf::table_view const &keys, rmm::cuda_stream_view stream=cudf::get_default_stream(), rmm::device_async_resource_ref mr=cudf::get_current_device_resource_ref()) const
Remap probe keys to integer IDs.
bool has_metrics() const
Check if metrics (distinct_count, max_duplicate_count) were computed.
key_remapping(cudf::table_view const &build, null_equality compare_nulls=null_equality::EQUAL, cudf::compute_metrics metrics=cudf::compute_metrics::YES, rmm::cuda_stream_view stream=cudf::get_default_stream())
Constructs a key remapping structure from the given build keys.
size_type get_max_duplicate_count() const
Get the maximum number of times any single key appears.
std::unique_ptr< cudf::column > remap_build_keys(rmm::cuda_stream_view stream=cudf::get_default_stream(), rmm::device_async_resource_ref mr=cudf::get_current_device_resource_ref()) const
Remap build keys to integer IDs.
size_type get_distinct_count() const
Get the number of distinct keys in the build table.
A set of cudf::column_view's of the same size.
Definition: table_view.hpp:189
Class definition for cudf::column.
constexpr size_type KEY_REMAP_NOT_FOUND
Sentinel value for probe-side keys not found in build table.
constexpr size_type KEY_REMAP_BUILD_NULL
Sentinel value for build-side rows with null keys (when nulls are not equal)
compute_metrics
Enum to control whether key remapping metrics should be computed.
rmm::cuda_stream_view const get_default_stream()
Get the current default stream.
rmm::device_async_resource_ref get_current_device_resource_ref()
Get the current device memory resource reference.
detail::cccl_async_resource_ref< cuda::mr::resource_ref< cuda::mr::device_accessible > > device_async_resource_ref
null_equality
Enum to consider two nulls as equal or unequal.
Definition: types.hpp:140
int32_t size_type
Row index type for columns and tables.
Definition: types.hpp:84
cuDF interfaces
Definition: host_udf.hpp:26
Class definitions for (mutable)_table_view
Type declarations for libcudf.