cuML C++ API: src/svm/workingset.h Source File

 /*

  * Copyright (c) 2019-2024, NVIDIA CORPORATION.

  *

  * Licensed under the Apache License, Version 2.0 (the "License");

  * you may not use this file except in compliance with the License.

  * You may obtain a copy of the License at

  *

  *     http://www.apache.org/licenses/LICENSE-2.0

  *

  * Unless required by applicable law or agreed to in writing, software

  * distributed under the License is distributed on an "AS IS" BASIS,

  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

  * See the License for the specific language governing permissions and

  * limitations under the License.

  */


 #pragma once


 #include <cuml/common/logger.hpp>

 #include <cuml/svm/svm_parameter.h>


 #include <raft/core/handle.hpp>


 #include <rmm/device_scalar.hpp>

 #include <rmm/device_uvector.hpp>


 #include <algorithm>

 #include <cstddef>

 #include <limits>


 namespace ML {

 namespace SVM {


 /**
  * @brief Manage a working set.
  *
  * Owns the buffers used for working set selection and exposes the currently
  * selected indices through GetIndices(). Buffers are grouped into those sized
  * by the number of training vectors (n_train) and those sized by the working
  * set (n_ws).
  *
  * For EPSILON_SVR the number of training vectors is twice the number of rows
  * (n_train = 2 * n_rows); otherwise n_train = n_rows.
  *
  * @tparam math_t floating point type of the f, alpha, y and C arrays
  */
 template <typename math_t>
 class WorkingSet {
  public:
   //!> Workspace selection strategy. Note that only FIFO is tested so far.
   bool FIFO_strategy = true;

   /**
    * @brief Create a working set and allocate its buffers.
    *
    * @param handle  handle kept by reference; it must outlive this object
    * @param stream  stream used for buffer allocation and copies
    * @param n_rows  number of rows in the training data
    * @param n_ws    requested working set size; values <= 0 or > n_train
    *                select n_train, and the result is capped at 1024
    * @param svmType type of SVM problem (EPSILON_SVR doubles n_train)
    */
   WorkingSet(const raft::handle_t& handle,
              cudaStream_t stream,
              int n_rows      = 0,
              int n_ws        = 0,
              SvmType svmType = C_SVC)
     // Initializers are listed in member declaration order, which is the order
     // in which they are actually executed.
     : handle(handle),
       stream(stream),
       n_rows(n_rows),
       svmType(svmType),
       f_idx(0, stream),
       f_idx_sorted(0, stream),
       idx_tmp(0, stream),
       f_sorted(0, stream),
       available(0, stream),
       available_sorted(0, stream),
       idx(0, stream),
       ws_idx_sorted(0, stream),
       ws_idx_selected(0, stream),
       ws_idx_save(0, stream),
       ws_priority(0, stream),
       ws_priority_sorted(0, stream),
       d_num_selected(stream),
       cub_storage(0, stream)
   {
     // Epsilon-SVR works on a problem with twice as many training vectors.
     n_train = (svmType == EPSILON_SVR) ? n_rows * 2 : n_rows;
     SetSize(n_train, n_ws);
   }

   ~WorkingSet() {}

   /**
    * @brief Set the size of the working set and allocate buffers accordingly.
    *
    * The effective size is min(1024, n_ws), where a non-positive n_ws or an
    * n_ws larger than n_train is first replaced by n_train.
    *
    * NOTE(review): the n_train argument is only used to clamp n_ws; the
    * n_train member is not updated here. Callers other than the constructor
    * should confirm they pass the same value as the member.
    *
    * @param n_train number of training vectors
    * @param n_ws    requested working set size (<= 0 selects the default)
    */
   void SetSize(int n_train, int n_ws = 0)
   {
     // A negative request is meaningless as a buffer size; treat it like 0
     // ("use the default") instead of letting it through as the size.
     if (n_ws <= 0 || n_ws > n_train) { n_ws = n_train; }
     n_ws       = std::min(1024, n_ws);
     this->n_ws = n_ws;
     CUML_LOG_DEBUG("Creating working set with %d elements", n_ws);
     AllocateBuffers();
   }

   /** @brief Return the size of the working set. */
   int GetSize() const { return n_ws; }

   /** @brief Return a device pointer to the working set indices. */
   int* GetIndices() { return idx.data(); }

   /**
    * @brief Select new elements for a working set.
    *
    * Defined outside this header section. Select() passes the number of
    * entries it has already placed at the front of the index buffer as
    * n_already_selected.
    *
    * @param f     passed through from Select()
    * @param alpha passed through from Select()
    * @param y     passed through from Select()
    * @param C     passed through from Select()
    * @param n_already_selected number of working set entries already chosen
    */
   void SimpleSelect(
     math_t* f, math_t* alpha, math_t* y, const math_t* C, int n_already_selected = 0);

   /**
    * @brief Select working set indices.
    *
    * If the working set covers all training vectors nothing is done. On the
    * first call (and on every call when n_ws < 4) the whole working set is
    * chosen by SimpleSelect(). On later calls part of the previous working
    * set is kept, either the entries [2*nc, 4*nc) of the saved indices (FIFO)
    * or those returned by PrioritySelect(), with nc = n_ws / 4; the remaining
    * entries are filled by SimpleSelect(). The resulting indices are saved for
    * the next call.
    *
    * @param f     forwarded to SimpleSelect()
    * @param alpha forwarded to SimpleSelect() and PrioritySelect()
    * @param y     forwarded to SimpleSelect()
    * @param C     forwarded to SimpleSelect() and PrioritySelect()
    */
   void Select(math_t* f, math_t* alpha, math_t* y, const math_t* C)
   {
     if (n_ws >= n_train) {
       // All elements are selected, we have initialized idx to cover this case
       return;
     }

     const int nc   = n_ws / 4;
     int n_selected = 0;

     if (firstcall) {
       // nc == 0 can only happen for n_ws < 4. In that case we stay in
       // first-call mode for good: only SimpleSelect is used because there
       // are not enough elements for the advanced strategies.
       if (nc >= 1) { firstcall = false; }
     } else if (FIFO_strategy) {
       // Keep 1/2 of the old working set: FIFO selection following ThunderSVM
       raft::copy(idx.data(), ws_idx_save.data() + 2 * nc, 2 * nc, stream);
       n_selected = nc * 2;
     } else {
       // Priority based selection preferring to keep newer elements in ws
       n_selected = PrioritySelect(alpha, C, nc);
     }

     SimpleSelect(f, alpha, y, C, n_selected);
     // Remember the current working set for the next call.
     raft::copy(ws_idx_save.data(), idx.data(), n_ws, stream);
   }

   /**
    * @brief Select elements from the previous working set based on their
    * priority.
    *
    * Defined outside this header section. Select() uses the return value as
    * the number of entries already selected.
    *
    * @param alpha passed through from Select()
    * @param C     passed through from Select()
    * @param nc    n_ws / 4 as computed by Select()
    * @return number of elements selected
    */
   int PrioritySelect(math_t* alpha, const math_t* C, int nc);

  private:
   const raft::handle_t& handle;
   cudaStream_t stream;

   bool firstcall = true;  // true until Select() has run once with n_ws >= 4
   int n_train    = 0;     // number of training vectors (2 * n_rows for EPSILON_SVR)
   int n_rows     = 0;     // number of rows given to the constructor
   int n_ws       = 0;     // working set size, at most 1024

   SvmType svmType;

   int TPB = 256;  // presumably threads per block for kernel launches - confirm

   // Buffers for the domain size [n_train]
   rmm::device_uvector<int> f_idx;
   rmm::device_uvector<int> f_idx_sorted;
   rmm::device_uvector<int> idx_tmp;
   rmm::device_uvector<math_t> f_sorted;
   rmm::device_uvector<bool> available;
   rmm::device_uvector<bool> available_sorted;

   // working set buffers size [n_ws]
   rmm::device_uvector<int> idx;  // current working set, see GetIndices()
   rmm::device_uvector<int> ws_idx_sorted;
   rmm::device_uvector<int> ws_idx_selected;
   rmm::device_uvector<int> ws_idx_save;  // copy of idx made at the end of Select()

   rmm::device_uvector<int> ws_priority;
   rmm::device_uvector<int> ws_priority_sorted;

   rmm::device_scalar<int> d_num_selected;
   std::size_t cub_bytes = 0;
   rmm::device_uvector<char> cub_storage;

   /** Allocate the buffers; called by SetSize() after n_ws has been set. */
   void AllocateBuffers();

   int GatherAvailable(int n_already_selected, int n_needed, bool copy_front);

   void Initialize();

   template <typename select_op>
   int SelectPrevWs(int n_needed, int n_already_selected, select_op op);
 };


 };  // end namespace SVM

 };  // end namespace ML

ML::SVM::WorkingSet
Definition: workingset.h:45

ML::SVM::WorkingSet::GetSize
int GetSize()
Definition: workingset.h:105

ML::SVM::WorkingSet::Select
void Select(math_t *f, math_t *alpha, math_t *y, const math_t *C)
Select working set indices.
Definition: workingset.h:159

ML::SVM::WorkingSet::WorkingSet
WorkingSet(const raft::handle_t &handle, cudaStream_t stream, int n_rows=0, int n_ws=0, SvmType svmType=C_SVC)
Manage a working set.
Definition: workingset.h:59

ML::SVM::WorkingSet::FIFO_strategy
bool FIFO_strategy
Workspace selection strategy. Note that only FIFO is tested so far.
Definition: workingset.h:48

ML::SVM::WorkingSet::SetSize
void SetSize(int n_train, int n_ws=0)
Set the size of the working set and allocate buffers accordingly.
Definition: workingset.h:95

ML::SVM::WorkingSet::~WorkingSet
~WorkingSet()
Definition: workingset.h:87

ML::SVM::WorkingSet::SimpleSelect
void SimpleSelect(math_t *f, math_t *alpha, math_t *y, const math_t *C, int n_already_selected=0)
Select new elements for a working set.

ML::SVM::WorkingSet::GetIndices
int * GetIndices()
Return a device pointer to the working set indices.
Definition: workingset.h:112

ML::SVM::WorkingSet::PrioritySelect
int PrioritySelect(math_t *alpha, const math_t *C, int nc)
Select elements from the previous working set based on their priority.

logger.hpp

ML::SVM::SvmType
SvmType
Definition: svm_parameter.h:23

ML::SVM::EPSILON_SVR
@ EPSILON_SVR
Definition: svm_parameter.h:23

ML::SVM::C_SVC
@ C_SVC
Definition: svm_parameter.h:23

ML
Definition: dbscan.hpp:30

raft_proto::copy
const_agnostic_same_t< T, U > copy(buffer< T > &dst, buffer< U > const &src, typename buffer< T >::index_type dst_offset, typename buffer< U >::index_type src_offset, typename buffer< T >::index_type size, cuda_stream stream)
Definition: buffer.hpp:327

svm_parameter.h