join.hpp
Go to the documentation of this file.
1 /*
2  * SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION.
3  * SPDX-License-Identifier: Apache-2.0
4  */
5 
6 #pragma once
7 
10 #include <cudf/types.hpp>
12 #include <cudf/utilities/export.hpp>
14 
15 #include <rmm/cuda_stream_view.hpp>
16 #include <rmm/device_uvector.hpp>
17 
18 #include <cuda/std/limits>
19 
20 #include <cstdint>
21 
22 namespace CUDF_EXPORT cudf {
23 
37 enum class join_kind : int32_t {  // Specifies the type of join operation to perform.
38  INNER_JOIN = 0,  ///< Inner join: only matching rows from both tables.
39  LEFT_JOIN = 1,  ///< Left join: all rows from left table plus matching rows from right.
40  FULL_JOIN = 2,  ///< Full outer join: all rows from both tables.
41  LEFT_SEMI_JOIN = 3,  ///< Left semi join: left rows that have matches in right table.
42  LEFT_ANTI_JOIN = 4  ///< Left anti join: left rows that have no matches in right table.
43 };
44 
55 CUDF_HOST_DEVICE constexpr size_type JoinNoMatch = cuda::std::numeric_limits<size_type>::min();  ///< Sentinel value used to indicate an unmatched row index in join operations; equal to the smallest value representable by size_type.
56 
66  std::unique_ptr<rmm::device_uvector<size_type>>
69 };
70 
86 };
87 
121 std::pair<std::unique_ptr<rmm::device_uvector<size_type>>,
122  std::unique_ptr<rmm::device_uvector<size_type>>>
123 inner_join(cudf::table_view const& left_keys,
124  cudf::table_view const& right_keys,
125  null_equality compare_nulls = null_equality::EQUAL,
128 
162 std::pair<std::unique_ptr<rmm::device_uvector<size_type>>,
163  std::unique_ptr<rmm::device_uvector<size_type>>>
164 left_join(cudf::table_view const& left_keys,
165  cudf::table_view const& right_keys,
166  null_equality compare_nulls = null_equality::EQUAL,
169 
203 std::pair<std::unique_ptr<rmm::device_uvector<size_type>>,
204  std::unique_ptr<rmm::device_uvector<size_type>>>
205 full_join(cudf::table_view const& left_keys,
206  cudf::table_view const& right_keys,
207  null_equality compare_nulls = null_equality::EQUAL,
210 
234 std::unique_ptr<cudf::table> cross_join(
235  cudf::table_view const& left,
236  cudf::table_view const& right,
239 
308 std::pair<std::unique_ptr<rmm::device_uvector<size_type>>,
309  std::unique_ptr<rmm::device_uvector<size_type>>>
311  cudf::table_view const& right,
314  cudf::ast::expression const& predicate,
318  // end of group
320 
321 } // namespace CUDF_EXPORT cudf
A set of cudf::column_view's of the same size.
Definition: table_view.hpp:189
std::pair< std::unique_ptr< rmm::device_uvector< size_type > >, std::unique_ptr< rmm::device_uvector< size_type > > > left_join(cudf::table_view const &left_keys, cudf::table_view const &right_keys, null_equality compare_nulls=null_equality::EQUAL, rmm::cuda_stream_view stream=cudf::get_default_stream(), rmm::device_async_resource_ref mr=cudf::get_current_device_resource_ref())
Returns a pair of row index vectors corresponding to a left join between the specified tables.
std::pair< std::unique_ptr< rmm::device_uvector< size_type > >, std::unique_ptr< rmm::device_uvector< size_type > > > full_join(cudf::table_view const &left_keys, cudf::table_view const &right_keys, null_equality compare_nulls=null_equality::EQUAL, rmm::cuda_stream_view stream=cudf::get_default_stream(), rmm::device_async_resource_ref mr=cudf::get_current_device_resource_ref())
Returns a pair of row index vectors corresponding to a full join between the specified tables.
std::pair< std::unique_ptr< rmm::device_uvector< size_type > >, std::unique_ptr< rmm::device_uvector< size_type > > > filter_join_indices(cudf::table_view const &left, cudf::table_view const &right, cudf::device_span< size_type const > left_indices, cudf::device_span< size_type const > right_indices, cudf::ast::expression const &predicate, cudf::join_kind join_kind, rmm::cuda_stream_view stream=cudf::get_default_stream(), rmm::device_async_resource_ref mr=cudf::get_current_device_resource_ref())
Filters join result indices based on a conditional predicate and join type.
constexpr CUDF_HOST_DEVICE size_type JoinNoMatch
Sentinel value used to indicate an unmatched row index in join operations.
Definition: join.hpp:55
std::pair< std::unique_ptr< rmm::device_uvector< size_type > >, std::unique_ptr< rmm::device_uvector< size_type > > > inner_join(cudf::table_view const &left_keys, cudf::table_view const &right_keys, null_equality compare_nulls=null_equality::EQUAL, rmm::cuda_stream_view stream=cudf::get_default_stream(), rmm::device_async_resource_ref mr=cudf::get_current_device_resource_ref())
Returns a pair of row index vectors corresponding to an inner join between the specified tables.
join_kind
Specifies the type of join operation to perform.
Definition: join.hpp:37
std::unique_ptr< cudf::table > cross_join(cudf::table_view const &left, cudf::table_view const &right, rmm::cuda_stream_view stream=cudf::get_default_stream(), rmm::device_async_resource_ref mr=cudf::get_current_device_resource_ref())
Performs a cross join on two tables (left, right).
@ LEFT_ANTI_JOIN
Left anti join: left rows that have no matches in right table.
@ LEFT_SEMI_JOIN
Left semi join: left rows that have matches in right table.
@ FULL_JOIN
Full outer join: all rows from both tables.
@ LEFT_JOIN
Left join: all rows from left table plus matching rows from right.
@ INNER_JOIN
Inner join: only matching rows from both tables.
rmm::cuda_stream_view const get_default_stream()
Get the current default stream.
rmm::device_async_resource_ref get_current_device_resource_ref()
Get the current device memory resource reference.
detail::cccl_async_resource_ref< cuda::mr::resource_ref< cuda::mr::device_accessible > > device_async_resource_ref
null_equality
Enum to consider two nulls as equal or unequal.
Definition: types.hpp:140
int32_t size_type
Row index type for columns and tables.
Definition: types.hpp:84
cuDF interfaces
Definition: host_udf.hpp:26
A generic expression that can be evaluated to return a value.
Definition: expressions.hpp:61
Device version of C++20 std::span with reduced feature set.
Definition: span.hpp:323
Holds context information about matches between tables during a join operation.
Definition: join.hpp:64
std::unique_ptr< rmm::device_uvector< size_type > > _match_counts
Definition: join.hpp:67
table_view _left_table
View of the left table involved in the join operation.
Definition: join.hpp:65
Stores context information for partitioned join operations.
Definition: join.hpp:81
size_type left_start_idx
The starting row index of the current left table partition.
Definition: join.hpp:84
join_match_context left_table_context
The match context from a previous inner_join_match_context call.
Definition: join.hpp:83
size_type left_end_idx
The ending row index (exclusive) of the current left table partition.
Definition: join.hpp:85
Class definitions for (mutable)_table_view
Type declarations for libcudf.
#define CUDF_HOST_DEVICE
Indicates that the function or method is usable on host and device.
Definition: types.hpp:21