Namespaces | Functions
deduplicate.hpp File Reference
#include <cudf/column/column.hpp>
#include <cudf/strings/strings_column_view.hpp>
#include <cudf/utilities/export.hpp>
#include <cudf/utilities/memory_resource.hpp>
#include <rmm/cuda_stream_view.hpp>
#include <rmm/device_uvector.hpp>

Go to the source code of this file.

Namespaces

 nvtext
 NVText APIs.
 

Functions

std::unique_ptr< rmm::device_uvector< cudf::size_type > > nvtext::build_suffix_array (cudf::strings_column_view const &input, cudf::size_type min_width, rmm::cuda_stream_view stream=cudf::get_default_stream(), rmm::device_async_resource_ref mr=cudf::get_current_device_resource_ref())
 Builds a suffix array for the input strings column. More...
 
std::unique_ptr< cudf::column > nvtext::resolve_duplicates (cudf::strings_column_view const &input, cudf::device_span< cudf::size_type const > indices, cudf::size_type min_width, rmm::cuda_stream_view stream=cudf::get_default_stream(), rmm::device_async_resource_ref mr=cudf::get_current_device_resource_ref())
 Returns duplicate strings found in the given input. More...
 
std::unique_ptr< cudf::column > nvtext::resolve_duplicates_pair (cudf::strings_column_view const &input1, cudf::device_span< cudf::size_type const > indices1, cudf::strings_column_view const &input2, cudf::device_span< cudf::size_type const > indices2, cudf::size_type min_width, rmm::cuda_stream_view stream=cudf::get_default_stream(), rmm::device_async_resource_ref mr=cudf::get_current_device_resource_ref())
 Returns duplicate strings from input1 that are also found in the given input2. More...