infer.hpp
/*
 * Copyright (c) 2023-2025, NVIDIA CORPORATION.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
#pragma once
#include <cuml/fil/detail/index_type.hpp>
#include <cuml/fil/detail/infer/cpu.hpp>
#include <cuml/fil/detail/postprocessor.hpp>
#include <cuml/fil/detail/raft_proto/cuda_stream.hpp>
#include <cuml/fil/detail/raft_proto/device_id.hpp>
#include <cuml/fil/detail/raft_proto/device_type.hpp>
#include <cuml/fil/exceptions.hpp>
#include <cuml/fil/infer_kind.hpp>

#include <cstddef>
#include <iostream>
#include <optional>
#include <type_traits>

#ifdef CUML_ENABLE_GPU
#include <cuml/fil/detail/infer/gpu.hpp>
#endif

namespace ML {
namespace fil {
namespace detail {

/*
 * Perform inference based on the given forest and input parameters
 *
 * @tparam D The device type (CPU/GPU) used to perform inference
 * @tparam forest_t The type of the forest
 * @param forest The forest to be evaluated
 * @param postproc The postprocessor object used to execute postprocessing
 * @param output Pointer to where the output should be written
 * @param input Pointer to where the input data can be read from
 * @param row_count The number of rows in the input data
 * @param col_count The number of columns in the input data
 * @param output_count The number of outputs per row
 * @param has_categorical_nodes Whether or not any node within the forest has
 * a categorical split
 * @param vector_output Pointer to the beginning of storage for vector
 * outputs of leaves (nullptr for no vector output)
 * @param categorical_data Pointer to external categorical data storage, if
 * required
 * @param infer_type The type of inference to perform. The default sums the
 * outputs of all trees and produces one output per row. If set to
 * "per_tree", the outputs of each individual tree are returned instead. If
 * set to "leaf_id", the integer ID of the leaf node reached in each tree is
 * returned.
 * @param specified_chunk_size If non-nullopt, the size of the "mini-batches"
 * used for distributing work across threads
 * @param device The device on which to execute evaluation
 * @param stream Optionally, the CUDA stream to use
 */
template <raft_proto::device_type D, typename forest_t>
void infer(forest_t const& forest,
           postprocessor<typename forest_t::io_type> const& postproc,
           typename forest_t::io_type* output,
           typename forest_t::io_type* input,
           index_type row_count,
           index_type col_count,
           index_type output_count,
           bool has_categorical_nodes,
           typename forest_t::io_type* vector_output                  = nullptr,
           typename forest_t::node_type::index_type* categorical_data = nullptr,
           infer_kind infer_type                          = infer_kind::default_kind,
           std::optional<index_type> specified_chunk_size = std::nullopt,
           raft_proto::device_id<D> device                = raft_proto::device_id<D>{},
           raft_proto::cuda_stream stream                 = raft_proto::cuda_stream{})
{
  // The caller's runtime configuration is translated into compile-time
  // template arguments here: one specialization per combination of
  // categorical-node support, vector leaf output, and external categorical
  // storage.
  if (vector_output == nullptr) {
    if (categorical_data == nullptr) {
      if (!has_categorical_nodes) {
        // Scalar leaves, purely numerical splits
        inference::infer<D, false, forest_t, std::nullptr_t, std::nullptr_t>(
          forest, postproc, output, input, row_count, col_count, output_count,
          nullptr, nullptr, infer_type, specified_chunk_size, device, stream);
      } else {
        // Scalar leaves, categorical splits stored inline in the nodes
        inference::infer<D, true, forest_t, std::nullptr_t, std::nullptr_t>(
          forest, postproc, output, input, row_count, col_count, output_count,
          nullptr, nullptr, infer_type, specified_chunk_size, device, stream);
      }
    } else {
      // Scalar leaves, categorical splits backed by external storage
      inference::infer<D, true, forest_t>(
        forest, postproc, output, input, row_count, col_count, output_count,
        nullptr, categorical_data, infer_type, specified_chunk_size, device, stream);
    }
  } else {
    if (categorical_data == nullptr) {
      if (!has_categorical_nodes) {
        // Vector leaves, purely numerical splits
        inference::infer<D, false, forest_t>(
          forest, postproc, output, input, row_count, col_count, output_count,
          vector_output, nullptr, infer_type, specified_chunk_size, device, stream);
      } else {
        // Vector leaves, categorical splits stored inline in the nodes
        inference::infer<D, true, forest_t>(
          forest, postproc, output, input, row_count, col_count, output_count,
          vector_output, nullptr, infer_type, specified_chunk_size, device, stream);
      }
    } else {
      // Vector leaves, categorical splits backed by external storage
      inference::infer<D, true, forest_t>(
        forest, postproc, output, input, row_count, col_count, output_count,
        vector_output, categorical_data, infer_type, specified_chunk_size, device, stream);
    }
  }
}

}  // namespace detail
}  // namespace fil
}  // namespace ML
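
/*
 * Usage sketch (illustrative; not part of the original header). The concrete
 * forest type and the `forest` and `postproc` objects are assumed to come
 * from FIL's model-import machinery and are hypothetical stand-ins here;
 * only the call shape of detail::infer is taken from the listing above.
 * With the trailing parameters left at their defaults, this sums the outputs
 * of all trees and writes one set of outputs per row on the CPU.
 */
template <typename forest_t>
void example_cpu_infer(forest_t const& forest,
                       ML::fil::detail::postprocessor<typename forest_t::io_type> const& postproc,
                       typename forest_t::io_type* input,   // row_count * col_count values, row-major
                       typename forest_t::io_type* output,  // space for row_count * output_count values
                       ML::fil::index_type row_count,
                       ML::fil::index_type col_count,
                       ML::fil::index_type output_count,
                       bool has_categorical_nodes)
{
  ML::fil::detail::infer<raft_proto::device_type::cpu>(forest,
                                                       postproc,
                                                       output,
                                                       input,
                                                       row_count,
                                                       col_count,
                                                       output_count,
                                                       has_categorical_nodes);
}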
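#ifdef CUML_ENABLE_GPU
/*
 * GPU sketch under the same assumptions, with the defaulted arguments
 * spelled out: no vector leaf output, no external categorical storage, the
 * default inference kind, and an unspecified chunk size (letting the backend
 * choose). For GPU execution, `input` and `output` must point to
 * device-accessible memory, and the caller supplies the stream on which the
 * work is enqueued.
 */
template <typename forest_t>
void example_gpu_infer(forest_t const& forest,
                       ML::fil::detail::postprocessor<typename forest_t::io_type> const& postproc,
                       typename forest_t::io_type* input,
                       typename forest_t::io_type* output,
                       ML::fil::index_type row_count,
                       ML::fil::index_type col_count,
                       ML::fil::index_type output_count,
                       bool has_categorical_nodes,
                       raft_proto::cuda_stream stream)
{
  ML::fil::detail::infer<raft_proto::device_type::gpu>(
    forest,
    postproc,
    output,
    input,
    row_count,
    col_count,
    output_count,
    has_categorical_nodes,
    nullptr,                            // vector_output: scalar leaves only
    nullptr,                            // categorical_data: none stored externally
    ML::fil::infer_kind::default_kind,
    std::nullopt,                       // specified_chunk_size: let the backend pick
    raft_proto::device_id<raft_proto::device_type::gpu>{},  // default device
    stream);
}
#endif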