join.hpp
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2019-2024, NVIDIA CORPORATION.
3  *
4  * Licensed under the Apache License, Version 2.0 (the "License");
5  * you may not use this file except in compliance with the License.
6  * You may obtain a copy of the License at
7  *
8  * http://www.apache.org/licenses/LICENSE-2.0
9  *
10  * Unless required by applicable law or agreed to in writing, software
11  * distributed under the License is distributed on an "AS IS" BASIS,
12  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13  * See the License for the specific language governing permissions and
14  * limitations under the License.
15  */
16 
17 #pragma once
18 
19 #include <cudf/ast/expressions.hpp>
20 #include <cudf/hashing.hpp>
22 #include <cudf/types.hpp>
24 #include <cudf/utilities/span.hpp>
25 
26 #include <rmm/cuda_stream_view.hpp>
27 #include <rmm/device_uvector.hpp>
28 #include <rmm/mr/device/per_device_resource.hpp>
29 #include <rmm/resource_ref.hpp>
30 
31 #include <optional>
32 #include <utility>
33 #include <vector>
34 
35 namespace cudf {
36 
/**
 * @brief Enum to indicate whether the distinct join table has nested columns or not.
 *
 * Note: the underlying type is `bool` and the enumerators are declared in the order
 * `YES, NO`, so `YES` has the underlying value `false` and `NO` has the underlying value
 * `true`. Compare against the enumerators rather than casting to `bool`.
 */
42 enum class has_nested : bool { YES, NO };
43 
44 // forward declaration
45 namespace hashing::detail {
// NOTE(review): listing line 47, the declaration introduced by the template header below, is
// absent from this extract. The `impl_type` entry in the index at the end of this file refers
// to cudf::hashing::detail::MurmurHash3_x86_32<...>, so this is presumably the forward
// declaration of that class template - confirm against the original header.
46 template <typename T>
48 } // namespace hashing::detail
49 namespace detail {
// Forward declaration of the class template cudf::detail::hash_join<T>.
50 template <typename T>
51 class hash_join;
52 
// NOTE(review): listing line 54, the declaration introduced by the template header below, is
// absent from this extract. cudf::distinct_hash_join later aliases
// cudf::detail::distinct_hash_join<HasNested>, so this is presumably that class template's
// forward declaration - confirm against the original header.
53 template <cudf::has_nested HasNested>
55 } // namespace detail
56 
/**
 * @brief Returns a pair of row index vectors corresponding to an inner join between the
 * specified tables.
 *
 * @param left_keys Table view holding the left-side join keys
 * @param right_keys Table view holding the right-side join keys
 * @param compare_nulls Whether two nulls are considered equal or unequal; defaults to
 * `null_equality::EQUAL`
 * @param mr Device memory resource reference; defaults to the current device resource.
 * Presumably used to allocate the returned vectors - TODO confirm
 * @return Pair of owning pointers to device vectors of `size_type` row indices (presumably
 * left indices first, right indices second - TODO confirm)
 */
95 std::pair<std::unique_ptr<rmm::device_uvector<size_type>>,
96  std::unique_ptr<rmm::device_uvector<size_type>>>
97 inner_join(cudf::table_view const& left_keys,
98  cudf::table_view const& right_keys,
99  null_equality compare_nulls = null_equality::EQUAL,
100  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource());
101 
/**
 * @brief Returns a pair of row index vectors corresponding to a left join between the
 * specified tables.
 *
 * @param left_keys Table view holding the left-side join keys
 * @param right_keys Table view holding the right-side join keys
 * @param compare_nulls Whether two nulls are considered equal or unequal; defaults to
 * `null_equality::EQUAL`
 * @param mr Device memory resource reference; defaults to the current device resource.
 * Presumably used to allocate the returned vectors - TODO confirm
 * @return Pair of owning pointers to device vectors of `size_type` row indices (presumably
 * left indices first, right indices second - TODO confirm)
 */
135 std::pair<std::unique_ptr<rmm::device_uvector<size_type>>,
136  std::unique_ptr<rmm::device_uvector<size_type>>>
137 left_join(cudf::table_view const& left_keys,
138  cudf::table_view const& right_keys,
139  null_equality compare_nulls = null_equality::EQUAL,
140  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource());
141 
/**
 * @brief Returns a pair of row index vectors corresponding to a full join between the
 * specified tables.
 *
 * @param left_keys Table view holding the left-side join keys
 * @param right_keys Table view holding the right-side join keys
 * @param compare_nulls Whether two nulls are considered equal or unequal; defaults to
 * `null_equality::EQUAL`
 * @param mr Device memory resource reference; defaults to the current device resource.
 * Presumably used to allocate the returned vectors - TODO confirm
 * @return Pair of owning pointers to device vectors of `size_type` row indices (presumably
 * left indices first, right indices second - TODO confirm)
 */
174 std::pair<std::unique_ptr<rmm::device_uvector<size_type>>,
175  std::unique_ptr<rmm::device_uvector<size_type>>>
176 full_join(cudf::table_view const& left_keys,
177  cudf::table_view const& right_keys,
178  null_equality compare_nulls = null_equality::EQUAL,
179  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource());
180 
/**
 * @brief Returns a vector of row indices corresponding to a left semi-join between the
 * specified tables.
 *
 * @param left_keys Table view holding the left-side join keys
 * @param right_keys Table view holding the right-side join keys
 * @param compare_nulls Whether two nulls are considered equal or unequal; defaults to
 * `null_equality::EQUAL`
 * @param mr Device memory resource reference; defaults to the current device resource.
 * Presumably used to allocate the returned vector - TODO confirm
 * @return Owning pointer to a device vector of `size_type` row indices
 */
203 std::unique_ptr<rmm::device_uvector<size_type>> left_semi_join(
204  cudf::table_view const& left_keys,
205  cudf::table_view const& right_keys,
206  null_equality compare_nulls = null_equality::EQUAL,
207  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource());
208 
/**
 * @brief Returns a vector of row indices corresponding to a left anti join between the
 * specified tables.
 *
 * @param left_keys Table view holding the left-side join keys
 * @param right_keys Table view holding the right-side join keys
 * @param compare_nulls Whether two nulls are considered equal or unequal; defaults to
 * `null_equality::EQUAL`
 * @param mr Device memory resource reference; defaults to the current device resource.
 * Presumably used to allocate the returned vector - TODO confirm
 * @return Owning pointer to a device vector of `size_type` row indices
 */
234 std::unique_ptr<rmm::device_uvector<size_type>> left_anti_join(
235  cudf::table_view const& left_keys,
236  cudf::table_view const& right_keys,
237  null_equality compare_nulls = null_equality::EQUAL,
238  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource());
239 
/**
 * @brief Performs a cross join on two tables (`left`, `right`).
 *
 * Unlike the index-returning joins declared alongside it, this function returns an owning
 * pointer to a `cudf::table` rather than row index vectors.
 *
 * @param left The left table view
 * @param right The right table view
 * @param mr Device memory resource reference; defaults to the current device resource.
 * Presumably used to allocate the returned table - TODO confirm
 * @return Owning pointer to the resulting table
 */
262 std::unique_ptr<cudf::table> cross_join(
263  cudf::table_view const& left,
264  cudf::table_view const& right,
265  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource());
266 
/**
 * @brief Specifies a property of the input join tables (the build table and any later probe
 * table).
 *
 * NOTE(review): the summary for this enum is truncated in the index at the end of this
 * listing; presumably it states whether any of those tables has nulls - confirm.
 *
 * Note: the underlying type is `bool` and the enumerators are declared in the order
 * `YES, NO`, so `YES` has the underlying value `false` and `NO` has the underlying value
 * `true`.
 */
275 enum class nullable_join : bool { YES, NO };
276 
/**
 * @brief Hash join that builds its hash table on construction and probes it in the
 * subsequent `*_join` member functions.
 *
 * Default construction, copying and moving are all deleted, so an instance can only be
 * created through one of the build-table constructors and cannot be reassigned afterwards.
 */
284 class hash_join {
285  public:
  // NOTE(review): listing lines 286-287 are absent from this extract. The index at the end
  // of this file places the `impl_type` alias (cudf::detail::hash_join instantiated with
  // cudf::hashing::detail::MurmurHash3_x86_32<cudf::hash_value_type>) at line 287.
288 
289  hash_join() = delete;
290  ~hash_join();
291  hash_join(hash_join const&) = delete;
292  hash_join(hash_join&&) = delete;
293  hash_join& operator=(hash_join const&) = delete;
294  hash_join& operator=(hash_join&&) = delete;
295 
  /**
   * @brief Construct a hash join object for subsequent probe calls.
   *
   * NOTE(review): listing line 306 (constructor name and leading parameter) is absent from
   * this extract. The index lists `hash_join(build, compare_nulls, stream)`, which matches
   * the trailing parameters below - confirm against the original header.
   *
   * @param compare_nulls Whether two nulls are considered equal or unequal
   * @param stream CUDA stream view; defaults to `cudf::get_default_stream()`
   */
307  null_equality compare_nulls,
308  rmm::cuda_stream_view stream = cudf::get_default_stream());
309 
  /**
   * @brief Construct a hash join object for subsequent probe calls.
   *
   * NOTE(review): listing lines 316-317 (constructor name and leading parameters) are absent
   * from this extract. The index lists `hash_join(build, has_nulls, compare_nulls, stream)`,
   * which matches the trailing parameters below - confirm against the original header.
   *
   * @param compare_nulls Whether two nulls are considered equal or unequal
   * @param stream CUDA stream view; defaults to `cudf::get_default_stream()`
   */
318  null_equality compare_nulls,
319  rmm::cuda_stream_view stream = cudf::get_default_stream());
320 
  // NOTE(review): the line carrying the member name and the `probe` parameter (listing line
  // 341) is absent from this extract. The index lists `inner_join`, `left_join` and
  // `full_join` members that all share this signature; which one this is cannot be
  // determined from the extract alone.
  //
  // Returns a pair of owning pointers to device vectors of `size_type`. `output_size` is
  // optional and defaults to empty; `stream` defaults to `cudf::get_default_stream()` and
  // `mr` to the current device resource.
339  std::pair<std::unique_ptr<rmm::device_uvector<size_type>>,
340  std::unique_ptr<rmm::device_uvector<size_type>>>
342  std::optional<std::size_t> output_size = {},
343  rmm::cuda_stream_view stream = cudf::get_default_stream(),
344  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource()) const;
345 
  // NOTE(review): member name / `probe` line (listing line 366) is absent from this extract;
  // one of `inner_join`, `left_join` or `full_join` (identical signatures) - confirm.
364  std::pair<std::unique_ptr<rmm::device_uvector<size_type>>,
365  std::unique_ptr<rmm::device_uvector<size_type>>>
367  std::optional<std::size_t> output_size = {},
368  rmm::cuda_stream_view stream = cudf::get_default_stream(),
369  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource()) const;
370 
  // NOTE(review): member name / `probe` line (listing line 391) is absent from this extract;
  // one of `inner_join`, `left_join` or `full_join` (identical signatures) - confirm.
389  std::pair<std::unique_ptr<rmm::device_uvector<size_type>>,
390  std::unique_ptr<rmm::device_uvector<size_type>>>
392  std::optional<std::size_t> output_size = {},
393  rmm::cuda_stream_view stream = cudf::get_default_stream(),
394  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource()) const;
395 
  /**
   * @brief Size query for an inner join of `probe` against this object.
   *
   * Presumably the value that can be passed as `output_size` to the matching join member -
   * TODO confirm.
   *
   * @param probe The probe table view
   * @param stream CUDA stream view; defaults to `cudf::get_default_stream()`
   * @return The size as `std::size_t`; the result must not be discarded
   */
409  [[nodiscard]] std::size_t inner_join_size(
410  cudf::table_view const& probe, rmm::cuda_stream_view stream = cudf::get_default_stream()) const;
411 
  /**
   * @brief Size query for a left join of `probe` against this object.
   *
   * Presumably the value that can be passed as `output_size` to the matching join member -
   * TODO confirm.
   *
   * @param probe The probe table view
   * @param stream CUDA stream view; defaults to `cudf::get_default_stream()`
   * @return The size as `std::size_t`; the result must not be discarded
   */
425  [[nodiscard]] std::size_t left_join_size(
426  cudf::table_view const& probe, rmm::cuda_stream_view stream = cudf::get_default_stream()) const;
427 
  /**
   * @brief Size query for a full join of `probe` against this object.
   *
   * Marked `[[nodiscard]]` for consistency with `inner_join_size` and `left_join_size`:
   * the only product of the call is the returned size. Unlike those two, this overload also
   * takes a memory resource.
   *
   * @param probe The probe table view
   * @param stream CUDA stream view; defaults to `cudf::get_default_stream()`
   * @param mr Device memory resource reference; defaults to the current device resource.
   * Presumably used for temporary allocations - TODO confirm
   * @return The size as `std::size_t`; the result must not be discarded
   */
443  [[nodiscard]] std::size_t full_join_size(
444  cudf::table_view const& probe,
445  rmm::cuda_stream_view stream = cudf::get_default_stream(),
446  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource()) const;
447 
448  private:
  // Owning pointer to the implementation object; both the pointer and the pointee are const.
449  const std::unique_ptr<impl_type const> _impl;
450 };
451 
/**
 * @brief Distinct hash join that builds its hash table on construction and probes results
 * in the subsequent `*_join` member functions.
 *
 * NOTE(review): the class head (listing line 463) is absent from this extract; the index at
 * the end of this file places the definition of `distinct_hash_join` at that line.
 *
 * @tparam HasNested Flag (see `cudf::has_nested`) selecting the implementation instantiation
 */
461 // TODO: `HasNested` to be removed via dispatching
462 template <cudf::has_nested HasNested>
464  public:
465  distinct_hash_join() = delete;
  // NOTE(review): listing lines 466 and 468 are absent from this extract (presumably the
  // destructor and the move constructor - confirm against the original header).
467  distinct_hash_join(distinct_hash_join const&) = delete;
469  distinct_hash_join& operator=(distinct_hash_join const&) = delete;
470  distinct_hash_join& operator=(distinct_hash_join&&) = delete;
471 
  /**
   * @brief Constructs a distinct hash join object for subsequent probe calls.
   *
   * NOTE(review): listing line 482 (constructor name and leading parameter) is absent from
   * this extract; the index lists
   * `distinct_hash_join(build, probe, has_nulls, compare_nulls, stream)`.
   *
   * @param probe The probe table view
   * @param has_nulls Nullability flag for the input tables; defaults to `nullable_join::YES`
   * @param compare_nulls Whether two nulls are considered equal or unequal; defaults to
   * `null_equality::EQUAL`
   * @param stream CUDA stream view; defaults to `cudf::get_default_stream()`
   */
483  cudf::table_view const& probe,
484  nullable_join has_nulls = nullable_join::YES,
485  null_equality compare_nulls = null_equality::EQUAL,
486  rmm::cuda_stream_view stream = cudf::get_default_stream());
487 
  /**
   * @brief Returns the row indices that can be used to construct the result of performing
   * an inner join (between the tables supplied at construction, presumably - the index
   * summary is truncated; confirm).
   *
   * @param stream CUDA stream view; defaults to `cudf::get_default_stream()`
   * @param mr Device memory resource reference; defaults to the current device resource
   * @return Pair of owning pointers to device vectors of `size_type` row indices
   */
499  std::pair<std::unique_ptr<rmm::device_uvector<size_type>>,
500  std::unique_ptr<rmm::device_uvector<size_type>>>
501  inner_join(rmm::cuda_stream_view stream = cudf::get_default_stream(),
502  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource()) const;
503 
  /**
   * @brief Returns the build table indices that can be used to construct the result of
   * performing a left join (the index summary is truncated beyond this point).
   *
   * Unlike `inner_join`, only a single index vector is returned.
   *
   * @param stream CUDA stream view; defaults to `cudf::get_default_stream()`
   * @param mr Device memory resource reference; defaults to the current device resource
   * @return Owning pointer to a device vector of `size_type` build table indices
   */
518  std::unique_ptr<rmm::device_uvector<size_type>> left_join(
519  rmm::cuda_stream_view stream = cudf::get_default_stream(),
520  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource()) const;
521 
522  private:
  // Implementation type: the detail class template instantiated with the same `HasNested`.
523  using impl_type = typename cudf::detail::distinct_hash_join<HasNested>;
524 
  // Owning pointer to the implementation object.
525  std::unique_ptr<impl_type> _impl;
526 };
527 
// NOTE(review): the line carrying the function name and the `left` parameter (listing line
// 565) is absent from this extract. The index at the end of this file lists both
// `conditional_inner_join` and `conditional_left_join` with exactly this signature; which of
// the two this declaration is cannot be determined from the extract - confirm against the
// original header.
//
// Per the index, both return a pair of row index vectors corresponding to pairs of rows
// between the specified tables, selected using `binary_predicate`. `output_size` is optional
// and defaults to empty; `mr` defaults to the current device resource.
563 std::pair<std::unique_ptr<rmm::device_uvector<size_type>>,
564  std::unique_ptr<rmm::device_uvector<size_type>>>
566  table_view const& right,
567  ast::expression const& binary_predicate,
568  std::optional<std::size_t> output_size = {},
569  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource());
570 
// NOTE(review): the line carrying the function name and the `left` parameter (listing line
// 610) is absent from this extract. The index at the end of this file lists both
// `conditional_inner_join` and `conditional_left_join` with exactly this signature; which of
// the two this declaration is cannot be determined from the extract - confirm against the
// original header.
//
// Per the index, both return a pair of row index vectors corresponding to pairs of rows
// between the specified tables, selected using `binary_predicate`. `output_size` is optional
// and defaults to empty; `mr` defaults to the current device resource.
608 std::pair<std::unique_ptr<rmm::device_uvector<size_type>>,
609  std::unique_ptr<rmm::device_uvector<size_type>>>
611  table_view const& right,
612  ast::expression const& binary_predicate,
613  std::optional<std::size_t> output_size = {},
614  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource());
615 
// NOTE(review): the line carrying the function name and the `left` parameter (listing line
// 653) is absent from this extract. `conditional_full_join` is the only entry in the index at
// the end of this file with this return type and parameter list (no `output_size`), so this
// is presumably its declaration - confirm against the original header.
//
// Per the index, it returns a pair of row index vectors corresponding to pairs of rows
// between the specified tables, selected using `binary_predicate`. `mr` defaults to the
// current device resource.
651 std::pair<std::unique_ptr<rmm::device_uvector<size_type>>,
652  std::unique_ptr<rmm::device_uvector<size_type>>>
654  table_view const& right,
655  ast::expression const& binary_predicate,
656  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource());
657 
/**
 * @brief Returns an index vector corresponding to all rows in the left table for which there
 * exists some matching row (presumably a row in the right table for which `binary_predicate`
 * holds - the index summary is truncated; confirm).
 *
 * @param left The left table view
 * @param right The right table view
 * @param binary_predicate Expression evaluated to decide the match
 * @param output_size Optional size hint; defaults to empty. Presumably the exact output row
 * count, letting the call skip its own size computation - TODO confirm
 * @param mr Device memory resource reference; defaults to the current device resource
 * @return Owning pointer to a device vector of `size_type` row indices into the left table
 */
690 std::unique_ptr<rmm::device_uvector<size_type>> conditional_left_semi_join(
691  table_view const& left,
692  table_view const& right,
693  ast::expression const& binary_predicate,
694  std::optional<std::size_t> output_size = {},
695  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource());
696 
/**
 * @brief Returns an index vector corresponding to all rows in the left table for which there
 * does not exist a matching row (presumably a row in the right table for which
 * `binary_predicate` holds - the index summary is truncated; confirm).
 *
 * @param left The left table view
 * @param right The right table view
 * @param binary_predicate Expression evaluated to decide the match
 * @param output_size Optional size hint; defaults to empty. Presumably the exact output row
 * count, letting the call skip its own size computation - TODO confirm
 * @param mr Device memory resource reference; defaults to the current device resource
 * @return Owning pointer to a device vector of `size_type` row indices into the left table
 */
729 std::unique_ptr<rmm::device_uvector<size_type>> conditional_left_anti_join(
730  table_view const& left,
731  table_view const& right,
732  ast::expression const& binary_predicate,
733  std::optional<std::size_t> output_size = {},
734  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource());
735 
// NOTE(review): the line carrying the function name (listing line 784) is absent from this
// extract. The index at the end of this file lists `mixed_inner_join`, `mixed_left_join` and
// `mixed_full_join` with exactly this signature; which of the three this declaration is
// cannot be determined from the extract - confirm against the original header.
//
// Per the index, each returns a pair of row index vectors corresponding to pairs of rows
// between the specified tables. The `*_equality` tables and the `*_conditional` tables are
// passed separately, together with `binary_predicate`; `compare_nulls` defaults to
// `null_equality::EQUAL`, `output_size_data` is optional (empty by default) and `mr` defaults
// to the current device resource.
782 std::pair<std::unique_ptr<rmm::device_uvector<size_type>>,
783  std::unique_ptr<rmm::device_uvector<size_type>>>
785  table_view const& left_equality,
786  table_view const& right_equality,
787  table_view const& left_conditional,
788  table_view const& right_conditional,
789  ast::expression const& binary_predicate,
790  null_equality compare_nulls = null_equality::EQUAL,
791  std::optional<std::pair<std::size_t, device_span<size_type const>>> output_size_data = {},
792  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource());
793 
// NOTE(review): the line carrying the function name (listing line 844) is absent from this
// extract. The index at the end of this file lists `mixed_inner_join`, `mixed_left_join` and
// `mixed_full_join` with exactly this signature; which of the three this declaration is
// cannot be determined from the extract - confirm against the original header.
//
// Per the index, each returns a pair of row index vectors corresponding to pairs of rows
// between the specified tables. The `*_equality` tables and the `*_conditional` tables are
// passed separately, together with `binary_predicate`; `compare_nulls` defaults to
// `null_equality::EQUAL`, `output_size_data` is optional (empty by default) and `mr` defaults
// to the current device resource.
842 std::pair<std::unique_ptr<rmm::device_uvector<size_type>>,
843  std::unique_ptr<rmm::device_uvector<size_type>>>
845  table_view const& left_equality,
846  table_view const& right_equality,
847  table_view const& left_conditional,
848  table_view const& right_conditional,
849  ast::expression const& binary_predicate,
850  null_equality compare_nulls = null_equality::EQUAL,
851  std::optional<std::pair<std::size_t, device_span<size_type const>>> output_size_data = {},
852  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource());
853 
// NOTE(review): the line carrying the function name (listing line 904) is absent from this
// extract. The index at the end of this file lists `mixed_inner_join`, `mixed_left_join` and
// `mixed_full_join` with exactly this signature; which of the three this declaration is
// cannot be determined from the extract - confirm against the original header.
//
// Per the index, each returns a pair of row index vectors corresponding to pairs of rows
// between the specified tables. The `*_equality` tables and the `*_conditional` tables are
// passed separately, together with `binary_predicate`; `compare_nulls` defaults to
// `null_equality::EQUAL`, `output_size_data` is optional (empty by default) and `mr` defaults
// to the current device resource.
902 std::pair<std::unique_ptr<rmm::device_uvector<size_type>>,
903  std::unique_ptr<rmm::device_uvector<size_type>>>
905  table_view const& left_equality,
906  table_view const& right_equality,
907  table_view const& left_conditional,
908  table_view const& right_conditional,
909  ast::expression const& binary_predicate,
910  null_equality compare_nulls = null_equality::EQUAL,
911  std::optional<std::pair<std::size_t, device_span<size_type const>>> output_size_data = {},
912  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource());
913 
/**
 * @brief Returns an index vector corresponding to all rows in the left tables selected by a
 * mixed left semi join.
 *
 * NOTE(review): the index summary is truncated after "where the columns of the equalit...";
 * presumably a row is selected when the equality tables match and `binary_predicate` holds
 * on the conditional tables - confirm.
 *
 * @param left_equality Left table view used for the equality part of the join
 * @param right_equality Right table view used for the equality part of the join
 * @param left_conditional Left table view used for the conditional part of the join
 * @param right_conditional Right table view used for the conditional part of the join
 * @param binary_predicate Expression evaluated for the conditional part of the join
 * @param compare_nulls Whether two nulls are considered equal or unequal; defaults to
 * `null_equality::EQUAL`
 * @param mr Device memory resource reference; defaults to the current device resource
 * @return Owning pointer to a device vector of `size_type` row indices
 */
952 std::unique_ptr<rmm::device_uvector<size_type>> mixed_left_semi_join(
953  table_view const& left_equality,
954  table_view const& right_equality,
955  table_view const& left_conditional,
956  table_view const& right_conditional,
957  ast::expression const& binary_predicate,
958  null_equality compare_nulls = null_equality::EQUAL,
959  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource());
960 
/**
 * @brief Returns an index vector corresponding to all rows in the left tables for which
 * there is no matching row (the index summary is truncated after "no row in the...";
 * presumably no row in the right tables that satisfies both the equality and the
 * conditional part - confirm).
 *
 * @param left_equality Left table view used for the equality part of the join
 * @param right_equality Right table view used for the equality part of the join
 * @param left_conditional Left table view used for the conditional part of the join
 * @param right_conditional Right table view used for the conditional part of the join
 * @param binary_predicate Expression evaluated for the conditional part of the join
 * @param compare_nulls Whether two nulls are considered equal or unequal; defaults to
 * `null_equality::EQUAL`
 * @param mr Device memory resource reference; defaults to the current device resource
 * @return Owning pointer to a device vector of `size_type` row indices
 */
1000 std::unique_ptr<rmm::device_uvector<size_type>> mixed_left_anti_join(
1001  table_view const& left_equality,
1002  table_view const& right_equality,
1003  table_view const& left_conditional,
1004  table_view const& right_conditional,
1005  ast::expression const& binary_predicate,
1006  null_equality compare_nulls = null_equality::EQUAL,
1007  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource());
1008 
/**
 * @brief Returns the exact number of matches (rows) when performing a mixed inner join
 * between the specified tables.
 *
 * @param left_equality Left table view used for the equality part of the join
 * @param right_equality Right table view used for the equality part of the join
 * @param left_conditional Left table view used for the conditional part of the join
 * @param right_conditional Right table view used for the conditional part of the join
 * @param binary_predicate Expression evaluated for the conditional part of the join
 * @param compare_nulls Whether two nulls are considered equal or unequal; defaults to
 * `null_equality::EQUAL`
 * @param mr Device memory resource reference; defaults to the current device resource
 * @return Pair of the match count and an owning pointer to a device vector of `size_type`.
 * The meaning of the vector is not shown in this listing; presumably per-row match counts
 * that can be forwarded as `output_size_data` to the mixed joins - TODO confirm
 */
1040 std::pair<std::size_t, std::unique_ptr<rmm::device_uvector<size_type>>> mixed_inner_join_size(
1041  table_view const& left_equality,
1042  table_view const& right_equality,
1043  table_view const& left_conditional,
1044  table_view const& right_conditional,
1045  ast::expression const& binary_predicate,
1046  null_equality compare_nulls = null_equality::EQUAL,
1047  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource());
1048 
/**
 * @brief Returns the exact number of matches (rows) when performing a mixed left join
 * between the specified tables.
 *
 * @param left_equality Left table view used for the equality part of the join
 * @param right_equality Right table view used for the equality part of the join
 * @param left_conditional Left table view used for the conditional part of the join
 * @param right_conditional Right table view used for the conditional part of the join
 * @param binary_predicate Expression evaluated for the conditional part of the join
 * @param compare_nulls Whether two nulls are considered equal or unequal; defaults to
 * `null_equality::EQUAL`
 * @param mr Device memory resource reference; defaults to the current device resource
 * @return Pair of the match count and an owning pointer to a device vector of `size_type`.
 * The meaning of the vector is not shown in this listing; presumably per-row match counts
 * that can be forwarded as `output_size_data` to the mixed joins - TODO confirm
 */
1080 std::pair<std::size_t, std::unique_ptr<rmm::device_uvector<size_type>>> mixed_left_join_size(
1081  table_view const& left_equality,
1082  table_view const& right_equality,
1083  table_view const& left_conditional,
1084  table_view const& right_conditional,
1085  ast::expression const& binary_predicate,
1086  null_equality compare_nulls = null_equality::EQUAL,
1087  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource());
1088 
// NOTE(review): the line carrying the return type and function name (listing line 1106) is
// absent from this extract. The index at the end of this file lists four functions with this
// parameter list, all returning `std::size_t`: `conditional_inner_join_size`,
// `conditional_left_join_size`, `conditional_left_semi_join_size` and
// `conditional_left_anti_join_size`. Which one this is cannot be determined from the
// extract - confirm against the original header.
//
// Per the index, each returns the exact number of matches (rows) for the corresponding
// conditional join. `mr` defaults to the current device resource.
1107  table_view const& left,
1108  table_view const& right,
1109  ast::expression const& binary_predicate,
1110  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource());
1111 
// NOTE(review): the line carrying the return type and function name (listing line 1129) is
// absent from this extract. The index at the end of this file lists four functions with this
// parameter list, all returning `std::size_t`: `conditional_inner_join_size`,
// `conditional_left_join_size`, `conditional_left_semi_join_size` and
// `conditional_left_anti_join_size`. Which one this is cannot be determined from the
// extract - confirm against the original header.
//
// Per the index, each returns the exact number of matches (rows) for the corresponding
// conditional join. `mr` defaults to the current device resource.
1130  table_view const& left,
1131  table_view const& right,
1132  ast::expression const& binary_predicate,
1133  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource());
1134 
// NOTE(review): the line carrying the return type and function name (listing line 1152) is
// absent from this extract. The index at the end of this file lists four functions with this
// parameter list, all returning `std::size_t`: `conditional_inner_join_size`,
// `conditional_left_join_size`, `conditional_left_semi_join_size` and
// `conditional_left_anti_join_size`. Which one this is cannot be determined from the
// extract - confirm against the original header.
//
// Per the index, each returns the exact number of matches (rows) for the corresponding
// conditional join. `mr` defaults to the current device resource.
1153  table_view const& left,
1154  table_view const& right,
1155  ast::expression const& binary_predicate,
1156  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource());
1157 
// NOTE(review): the line carrying the return type and function name (listing line 1175) is
// absent from this extract. The index at the end of this file lists four functions with this
// parameter list, all returning `std::size_t`: `conditional_inner_join_size`,
// `conditional_left_join_size`, `conditional_left_semi_join_size` and
// `conditional_left_anti_join_size`. Which one this is cannot be determined from the
// extract - confirm against the original header.
//
// Per the index, each returns the exact number of matches (rows) for the corresponding
// conditional join. `mr` defaults to the current device resource.
1176  table_view const& left,
1177  table_view const& right,
1178  ast::expression const& binary_predicate,
1179  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource()); // end of group
1181 } // namespace cudf
Distinct hash join that builds hash table in creation and probes results in subsequent *_join member ...
Definition: join.hpp:463
std::pair< std::unique_ptr< rmm::device_uvector< size_type > >, std::unique_ptr< rmm::device_uvector< size_type > > > inner_join(rmm::cuda_stream_view stream=cudf::get_default_stream(), rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource()) const
Returns the row indices that can be used to construct the result of performing an inner join between ...
std::unique_ptr< rmm::device_uvector< size_type > > left_join(rmm::cuda_stream_view stream=cudf::get_default_stream(), rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource()) const
Returns the build table indices that can be used to construct the result of performing a left join be...
distinct_hash_join(cudf::table_view const &build, cudf::table_view const &probe, nullable_join has_nulls=nullable_join::YES, null_equality compare_nulls=null_equality::EQUAL, rmm::cuda_stream_view stream=cudf::get_default_stream())
Constructs a distinct hash join object for subsequent probe calls.
Hash join that builds hash table in creation and probes results in subsequent *_join member functions...
Definition: join.hpp:284
std::pair< std::unique_ptr< rmm::device_uvector< size_type > >, std::unique_ptr< rmm::device_uvector< size_type > > > left_join(cudf::table_view const &probe, std::optional< std::size_t > output_size={}, rmm::cuda_stream_view stream=cudf::get_default_stream(), rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource()) const
std::pair< std::unique_ptr< rmm::device_uvector< size_type > >, std::unique_ptr< rmm::device_uvector< size_type > > > full_join(cudf::table_view const &probe, std::optional< std::size_t > output_size={}, rmm::cuda_stream_view stream=cudf::get_default_stream(), rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource()) const
std::size_t full_join_size(cudf::table_view const &probe, rmm::cuda_stream_view stream=cudf::get_default_stream(), rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource()) const
hash_join(cudf::table_view const &build, nullable_join has_nulls, null_equality compare_nulls, rmm::cuda_stream_view stream=cudf::get_default_stream())
Construct a hash join object for subsequent probe calls.
typename cudf::detail::hash_join< cudf::hashing::detail::MurmurHash3_x86_32< cudf::hash_value_type > > impl_type
Implementation type.
Definition: join.hpp:287
std::size_t left_join_size(cudf::table_view const &probe, rmm::cuda_stream_view stream=cudf::get_default_stream()) const
std::pair< std::unique_ptr< rmm::device_uvector< size_type > >, std::unique_ptr< rmm::device_uvector< size_type > > > inner_join(cudf::table_view const &probe, std::optional< std::size_t > output_size={}, rmm::cuda_stream_view stream=cudf::get_default_stream(), rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource()) const
std::size_t inner_join_size(cudf::table_view const &probe, rmm::cuda_stream_view stream=cudf::get_default_stream()) const
hash_join(cudf::table_view const &build, null_equality compare_nulls, rmm::cuda_stream_view stream=cudf::get_default_stream())
Construct a hash join object for subsequent probe calls.
A set of cudf::column_view's of the same size.
Definition: table_view.hpp:187
std::size_t conditional_left_semi_join_size(table_view const &left, table_view const &right, ast::expression const &binary_predicate, rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource())
Returns the exact number of matches (rows) when performing a conditional left semi join between the s...
std::pair< std::unique_ptr< rmm::device_uvector< size_type > >, std::unique_ptr< rmm::device_uvector< size_type > > > conditional_full_join(table_view const &left, table_view const &right, ast::expression const &binary_predicate, rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource())
Returns a pair of row index vectors corresponding to all pairs of rows between the specified tables w...
std::unique_ptr< rmm::device_uvector< size_type > > mixed_left_anti_join(table_view const &left_equality, table_view const &right_equality, table_view const &left_conditional, table_view const &right_conditional, ast::expression const &binary_predicate, null_equality compare_nulls=null_equality::EQUAL, rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource())
Returns an index vector corresponding to all rows in the left tables for which there is no row in the...
std::unique_ptr< rmm::device_uvector< size_type > > left_semi_join(cudf::table_view const &left_keys, cudf::table_view const &right_keys, null_equality compare_nulls=null_equality::EQUAL, rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource())
Returns a vector of row indices corresponding to a left semi-join between the specified tables.
std::pair< std::unique_ptr< rmm::device_uvector< size_type > >, std::unique_ptr< rmm::device_uvector< size_type > > > conditional_inner_join(table_view const &left, table_view const &right, ast::expression const &binary_predicate, std::optional< std::size_t > output_size={}, rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource())
Returns a pair of row index vectors corresponding to all pairs of rows between the specified tables w...
std::size_t conditional_left_anti_join_size(table_view const &left, table_view const &right, ast::expression const &binary_predicate, rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource())
Returns the exact number of matches (rows) when performing a conditional left anti join between the s...
std::pair< std::unique_ptr< rmm::device_uvector< size_type > >, std::unique_ptr< rmm::device_uvector< size_type > > > conditional_left_join(table_view const &left, table_view const &right, ast::expression const &binary_predicate, std::optional< std::size_t > output_size={}, rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource())
Returns a pair of row index vectors corresponding to all pairs of rows between the specified tables w...
std::pair< std::size_t, std::unique_ptr< rmm::device_uvector< size_type > > > mixed_inner_join_size(table_view const &left_equality, table_view const &right_equality, table_view const &left_conditional, table_view const &right_conditional, ast::expression const &binary_predicate, null_equality compare_nulls=null_equality::EQUAL, rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource())
Returns the exact number of matches (rows) when performing a mixed inner join between the specified t...
std::pair< std::unique_ptr< rmm::device_uvector< size_type > >, std::unique_ptr< rmm::device_uvector< size_type > > > full_join(cudf::table_view const &left_keys, cudf::table_view const &right_keys, null_equality compare_nulls=null_equality::EQUAL, rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource())
Returns a pair of row index vectors corresponding to a full join between the specified tables.
std::unique_ptr< rmm::device_uvector< size_type > > conditional_left_anti_join(table_view const &left, table_view const &right, ast::expression const &binary_predicate, std::optional< std::size_t > output_size={}, rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource())
Returns an index vector corresponding to all rows in the left table for which there does not exist an...
std::size_t conditional_inner_join_size(table_view const &left, table_view const &right, ast::expression const &binary_predicate, rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource())
Returns the exact number of matches (rows) when performing a conditional inner join between the speci...
std::pair< std::unique_ptr< rmm::device_uvector< size_type > >, std::unique_ptr< rmm::device_uvector< size_type > > > mixed_left_join(table_view const &left_equality, table_view const &right_equality, table_view const &left_conditional, table_view const &right_conditional, ast::expression const &binary_predicate, null_equality compare_nulls=null_equality::EQUAL, std::optional< std::pair< std::size_t, device_span< size_type const >>> output_size_data={}, rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource())
Returns a pair of row index vectors corresponding to all pairs of rows between the specified tables w...
std::unique_ptr< rmm::device_uvector< size_type > > left_anti_join(cudf::table_view const &left_keys, cudf::table_view const &right_keys, null_equality compare_nulls=null_equality::EQUAL, rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource())
Returns a vector of row indices corresponding to a left anti join between the specified tables.
std::unique_ptr< rmm::device_uvector< size_type > > mixed_left_semi_join(table_view const &left_equality, table_view const &right_equality, table_view const &left_conditional, table_view const &right_conditional, ast::expression const &binary_predicate, null_equality compare_nulls=null_equality::EQUAL, rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource())
Returns an index vector corresponding to all rows in the left tables where the columns of the equalit...
std::pair< std::unique_ptr< rmm::device_uvector< size_type > >, std::unique_ptr< rmm::device_uvector< size_type > > > mixed_inner_join(table_view const &left_equality, table_view const &right_equality, table_view const &left_conditional, table_view const &right_conditional, ast::expression const &binary_predicate, null_equality compare_nulls=null_equality::EQUAL, std::optional< std::pair< std::size_t, device_span< size_type const >>> output_size_data={}, rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource())
Returns a pair of row index vectors corresponding to all pairs of rows between the specified tables w...
has_nested
Enum to indicate whether the distinct join table has nested columns or not.
Definition: join.hpp:42
std::pair< std::unique_ptr< rmm::device_uvector< size_type > >, std::unique_ptr< rmm::device_uvector< size_type > > > mixed_full_join(table_view const &left_equality, table_view const &right_equality, table_view const &left_conditional, table_view const &right_conditional, ast::expression const &binary_predicate, null_equality compare_nulls=null_equality::EQUAL, std::optional< std::pair< std::size_t, device_span< size_type const >>> output_size_data={}, rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource())
Returns a pair of row index vectors corresponding to all pairs of rows between the specified tables w...
std::pair< std::size_t, std::unique_ptr< rmm::device_uvector< size_type > > > mixed_left_join_size(table_view const &left_equality, table_view const &right_equality, table_view const &left_conditional, table_view const &right_conditional, ast::expression const &binary_predicate, null_equality compare_nulls=null_equality::EQUAL, rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource())
Returns the exact number of matches (rows) when performing a mixed left join between the specified ta...
nullable_join
The enum class to specify if any of the input join tables (build table and any later probe table) has...
Definition: join.hpp:275
std::pair< std::unique_ptr< rmm::device_uvector< size_type > >, std::unique_ptr< rmm::device_uvector< size_type > > > left_join(cudf::table_view const &left_keys, cudf::table_view const &right_keys, null_equality compare_nulls=null_equality::EQUAL, rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource())
Returns a pair of row index vectors corresponding to a left join between the specified tables.
std::pair< std::unique_ptr< rmm::device_uvector< size_type > >, std::unique_ptr< rmm::device_uvector< size_type > > > inner_join(cudf::table_view const &left_keys, cudf::table_view const &right_keys, null_equality compare_nulls=null_equality::EQUAL, rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource())
Returns a pair of row index vectors corresponding to an inner join between the specified tables.
std::unique_ptr< cudf::table > cross_join(cudf::table_view const &left, cudf::table_view const &right, rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource())
Performs a cross join on two tables (left, right)
std::unique_ptr< rmm::device_uvector< size_type > > conditional_left_semi_join(table_view const &left, table_view const &right, ast::expression const &binary_predicate, std::optional< std::size_t > output_size={}, rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource())
Returns an index vector corresponding to all rows in the left table for which there exists some row i...
std::size_t conditional_left_join_size(table_view const &left, table_view const &right, ast::expression const &binary_predicate, rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource())
Returns the exact number of matches (rows) when performing a conditional left join between the specif...
rmm::cuda_stream_view const get_default_stream()
Get the current default stream.
null_equality
Enum to consider two nulls as equal or unequal.
Definition: types.hpp:149
@ EQUAL
nulls compare equal
cuDF interfaces
Definition: aggregation.hpp:34
bool has_nulls(table_view const &view)
Returns True if the table has nulls in any of its columns.
APIs for spans.
A generic expression that can be evaluated to return a value.
Definition: expressions.hpp:46
Device version of C++20 std::span with reduced feature set.
Definition: span.hpp:291
Class definitions for (mutable)_table_view
Type declarations for libcudf.