filtered_join.hpp
Go to the documentation of this file.
1 /*
2  * SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION.
3  * SPDX-License-Identifier: Apache-2.0
4  */
5 
6 #pragma once
7 
9 #include <cudf/types.hpp>
11 #include <cudf/utilities/export.hpp>
13 
14 #include <rmm/cuda_stream_view.hpp>
15 #include <rmm/device_uvector.hpp>
16 
17 #include <utility>
18 
19 namespace CUDF_EXPORT cudf {
20 
27 namespace detail {
31 class filtered_join;  // forward declaration only; the public filtered_join owns an instance through its std::unique_ptr member _impl
32 } // namespace detail
33 
38 enum class set_as_build_table { LEFT, RIGHT };  // selects which table (LEFT or RIGHT) is used as the build table in a hash join operation
39 
55  public:
56  filtered_join() = delete;
57  ~filtered_join();
58  filtered_join(filtered_join const&) = delete;
59  filtered_join(filtered_join&&) = delete;
60  filtered_join& operator=(filtered_join const&) = delete;
61  filtered_join& operator=(filtered_join&&) = delete;
62 
75  cudf::null_equality compare_nulls = null_equality::EQUAL,
76  set_as_build_table reuse_tbl = set_as_build_table::RIGHT,
78 
94  null_equality compare_nulls = null_equality::EQUAL,
95  set_as_build_table reuse_tbl = set_as_build_table::RIGHT,
96  double load_factor = 0.5,
98 
121  [[nodiscard]] std::unique_ptr<rmm::device_uvector<size_type>> semi_join(
122  cudf::table_view const& probe,
125 
148  [[nodiscard]] std::unique_ptr<rmm::device_uvector<size_type>> anti_join(
149  cudf::table_view const& probe,
152 
153  private:
154  set_as_build_table _reuse_tbl;
155  std::unique_ptr<cudf::detail::filtered_join> _impl;
156 };
157  // end of group
159 
160 } // namespace CUDF_EXPORT cudf
Filtered hash join that builds hash table on creation and probes results in subsequent *_join member ...
filtered_join(cudf::table_view const &build, cudf::null_equality compare_nulls=null_equality::EQUAL, set_as_build_table reuse_tbl=set_as_build_table::RIGHT, rmm::cuda_stream_view stream=cudf::get_default_stream())
Constructs a filtered hash join object for subsequent probe calls.
std::unique_ptr< rmm::device_uvector< size_type > > semi_join(cudf::table_view const &probe, rmm::cuda_stream_view stream=cudf::get_default_stream(), rmm::device_async_resource_ref mr=cudf::get_current_device_resource_ref()) const
Returns a vector of row indices corresponding to a semi-join between the specified tables.
filtered_join(cudf::table_view const &build, null_equality compare_nulls=null_equality::EQUAL, set_as_build_table reuse_tbl=set_as_build_table::RIGHT, double load_factor=0.5, rmm::cuda_stream_view stream=cudf::get_default_stream())
Constructs a filtered hash join object for subsequent probe calls.
std::unique_ptr< rmm::device_uvector< size_type > > anti_join(cudf::table_view const &probe, rmm::cuda_stream_view stream=cudf::get_default_stream(), rmm::device_async_resource_ref mr=cudf::get_current_device_resource_ref()) const
Returns a vector of row indices corresponding to an anti-join between the specified tables.
A set of cudf::column_view's of the same size.
Definition: table_view.hpp:189
set_as_build_table
Specifies which table to use as the build table in a hash join operation.
rmm::cuda_stream_view const get_default_stream()
Get the current default stream.
rmm::device_async_resource_ref get_current_device_resource_ref()
Get the current device memory resource reference.
detail::cccl_async_resource_ref< cuda::mr::resource_ref< cuda::mr::device_accessible > > device_async_resource_ref
null_equality
Enum to consider two nulls as equal or unequal.
Definition: types.hpp:140
cuDF interfaces
Definition: host_udf.hpp:26
Class definitions for (mutable)_table_view
Type declarations for libcudf.