Functions
MLCommon::Matrix::opg Namespace Reference

Functions

template<bool rowMajor, bool bcastAlongRows>
void matrixVectorBinaryDivSkipZero (std::vector< Matrix::Data< double > * > &data, const Matrix::PartDescriptor &inDesc, const Matrix::Data< double > &vec, bool return_zero, const raft::comms::comms_t &comm, cudaStream_t *streams, int n_streams)
 
template<bool rowMajor, bool bcastAlongRows>
void matrixVectorBinaryDivSkipZero (std::vector< Matrix::Data< float > * > &data, const Matrix::PartDescriptor &inDesc, const Matrix::Data< float > &vec, bool return_zero, const raft::comms::comms_t &comm, cudaStream_t *streams, int n_streams)
 
template<bool rowMajor, bool bcastAlongRows>
void matrixVectorBinaryMult (std::vector< Matrix::Data< double > * > &data, const Matrix::PartDescriptor &inDesc, const Matrix::Data< double > &vec, const raft::comms::comms_t &comm, cudaStream_t *streams, int n_streams)
 
template<bool rowMajor, bool bcastAlongRows>
void matrixVectorBinaryMult (std::vector< Matrix::Data< float > * > &data, const Matrix::PartDescriptor &inDesc, const Matrix::Data< float > &vec, const raft::comms::comms_t &comm, cudaStream_t *streams, int n_streams)
 
void gatherPart (const raft::handle_t &h, float *gatheredPart, std::vector< Matrix::Data< float > * > &parts, Matrix::PartDescriptor &desc, int partIndex, int rootRank, int myRank, cudaStream_t stream)
 
void allGatherPart (const raft::handle_t &h, float *gatheredPart, std::vector< Matrix::Data< float > * > &parts, Matrix::PartDescriptor &desc, int partIndex, int myRank, cudaStream_t stream)
 
void gather (const raft::handle_t &h, float *gatheredMatrix, std::vector< Matrix::Data< float > * > &parts, Matrix::PartDescriptor &desc, int rootRank, int myRank, cudaStream_t stream)
 
void allGather (const raft::handle_t &h, float *gatheredMatrix, std::vector< Matrix::Data< float > * > &parts, Matrix::PartDescriptor &desc, int myRank, cudaStream_t stream)
 
void allocate (const raft::handle_t &h, std::vector< Matrix::Data< float > * > &parts, Matrix::PartDescriptor &desc, int myRank, cudaStream_t stream)
 
void deallocate (const raft::handle_t &h, std::vector< Matrix::Data< float > * > &parts, Matrix::PartDescriptor &desc, int myRank, cudaStream_t stream)
 
void randomize (const raft::handle_t &h, raft::random::Rng &r, std::vector< Matrix::Data< float > * > &parts, Matrix::PartDescriptor &desc, int myRank, cudaStream_t stream, float low=-1.0f, float high=1.0f)
 
void reset (const raft::handle_t &h, std::vector< Matrix::Data< float > * > &parts, Matrix::PartDescriptor &desc, int myRank, cudaStream_t stream)
 
void printRaw2D (float *buffer, int rows, int cols, bool isColMajor, cudaStream_t stream)
 
void print (const raft::handle_t &h, std::vector< Matrix::Data< float > * > &parts, Matrix::PartDescriptor &desc, const char *matrixName, int myRank, cudaStream_t stream)
 
void gatherPart (const raft::handle_t &h, double *gatheredPart, std::vector< Matrix::Data< double > * > &parts, Matrix::PartDescriptor &desc, int partIndex, int rootRank, int myRank, cudaStream_t stream)
 
void allGatherPart (const raft::handle_t &h, double *gatheredPart, std::vector< Matrix::Data< double > * > &parts, Matrix::PartDescriptor &desc, int partIndex, int myRank, cudaStream_t stream)
 
void gather (const raft::handle_t &h, double *gatheredMatrix, std::vector< Matrix::Data< double > * > &parts, Matrix::PartDescriptor &desc, int rootRank, int myRank, cudaStream_t stream)
 
void allGather (const raft::handle_t &h, double *gatheredMatrix, std::vector< Matrix::Data< double > * > &parts, Matrix::PartDescriptor &desc, int myRank, cudaStream_t stream)
 
void allocate (const raft::handle_t &h, std::vector< Matrix::Data< double > * > &parts, Matrix::PartDescriptor &desc, int myRank, cudaStream_t stream)
 
void deallocate (const raft::handle_t &h, std::vector< Matrix::Data< double > * > &parts, Matrix::PartDescriptor &desc, int myRank, cudaStream_t stream)
 
void randomize (const raft::handle_t &h, raft::random::Rng &r, std::vector< Matrix::Data< double > * > &parts, Matrix::PartDescriptor &desc, int myRank, cudaStream_t stream, double low=-1.0, double high=1.0)
 
void reset (const raft::handle_t &h, std::vector< Matrix::Data< double > * > &parts, Matrix::PartDescriptor &desc, int myRank, cudaStream_t stream)
 
void printRaw2D (double *buffer, int rows, int cols, bool isColMajor, cudaStream_t stream)
 
void print (const raft::handle_t &h, std::vector< Matrix::Data< double > * > &parts, Matrix::PartDescriptor &desc, const char *matrixName, int myRank, cudaStream_t stream)
 

Function Documentation

◆ allGather() [1/2]

void MLCommon::Matrix::opg::allGather ( const raft::handle_t &  h,
double *  gatheredMatrix,
std::vector< Matrix::Data< double > * > &  parts,
Matrix::PartDescriptor &  desc,
int  myRank,
cudaStream_t  stream 
)

◆ allGather() [2/2]

void MLCommon::Matrix::opg::allGather ( const raft::handle_t &  h,
float *  gatheredMatrix,
std::vector< Matrix::Data< float > * > &  parts,
Matrix::PartDescriptor &  desc,
int  myRank,
cudaStream_t  stream 
)

◆ allGatherPart() [1/2]

void MLCommon::Matrix::opg::allGatherPart ( const raft::handle_t &  h,
double *  gatheredPart,
std::vector< Matrix::Data< double > * > &  parts,
Matrix::PartDescriptor &  desc,
int  partIndex,
int  myRank,
cudaStream_t  stream 
)

◆ allGatherPart() [2/2]

void MLCommon::Matrix::opg::allGatherPart ( const raft::handle_t &  h,
float *  gatheredPart,
std::vector< Matrix::Data< float > * > &  parts,
Matrix::PartDescriptor &  desc,
int  partIndex,
int  myRank,
cudaStream_t  stream 
)

◆ allocate() [1/2]

void MLCommon::Matrix::opg::allocate ( const raft::handle_t &  h,
std::vector< Matrix::Data< double > * > &  parts,
Matrix::PartDescriptor &  desc,
int  myRank,
cudaStream_t  stream 
)

◆ allocate() [2/2]

void MLCommon::Matrix::opg::allocate ( const raft::handle_t &  h,
std::vector< Matrix::Data< float > * > &  parts,
Matrix::PartDescriptor &  desc,
int  myRank,
cudaStream_t  stream 
)

◆ deallocate() [1/2]

void MLCommon::Matrix::opg::deallocate ( const raft::handle_t &  h,
std::vector< Matrix::Data< double > * > &  parts,
Matrix::PartDescriptor &  desc,
int  myRank,
cudaStream_t  stream 
)

◆ deallocate() [2/2]

void MLCommon::Matrix::opg::deallocate ( const raft::handle_t &  h,
std::vector< Matrix::Data< float > * > &  parts,
Matrix::PartDescriptor &  desc,
int  myRank,
cudaStream_t  stream 
)

◆ gather() [1/2]

void MLCommon::Matrix::opg::gather ( const raft::handle_t &  h,
double *  gatheredMatrix,
std::vector< Matrix::Data< double > * > &  parts,
Matrix::PartDescriptor &  desc,
int  rootRank,
int  myRank,
cudaStream_t  stream 
)

◆ gather() [2/2]

void MLCommon::Matrix::opg::gather ( const raft::handle_t &  h,
float *  gatheredMatrix,
std::vector< Matrix::Data< float > * > &  parts,
Matrix::PartDescriptor &  desc,
int  rootRank,
int  myRank,
cudaStream_t  stream 
)

◆ gatherPart() [1/2]

void MLCommon::Matrix::opg::gatherPart ( const raft::handle_t &  h,
double *  gatheredPart,
std::vector< Matrix::Data< double > * > &  parts,
Matrix::PartDescriptor &  desc,
int  partIndex,
int  rootRank,
int  myRank,
cudaStream_t  stream 
)

◆ gatherPart() [2/2]

void MLCommon::Matrix::opg::gatherPart ( const raft::handle_t &  h,
float *  gatheredPart,
std::vector< Matrix::Data< float > * > &  parts,
Matrix::PartDescriptor &  desc,
int  partIndex,
int  rootRank,
int  myRank,
cudaStream_t  stream 
)

◆ matrixVectorBinaryDivSkipZero() [1/2]

template<bool rowMajor, bool bcastAlongRows>
void MLCommon::Matrix::opg::matrixVectorBinaryDivSkipZero ( std::vector< Matrix::Data< double > * > &  data,
const Matrix::PartDescriptor &  inDesc,
const Matrix::Data< double > &  vec,
bool  return_zero,
const raft::comms::comms_t &  comm,
cudaStream_t *  streams,
int  n_streams 
)

◆ matrixVectorBinaryDivSkipZero() [2/2]

template<bool rowMajor, bool bcastAlongRows>
void MLCommon::Matrix::opg::matrixVectorBinaryDivSkipZero ( std::vector< Matrix::Data< float > * > &  data,
const Matrix::PartDescriptor &  inDesc,
const Matrix::Data< float > &  vec,
bool  return_zero,
const raft::comms::comms_t &  comm,
cudaStream_t *  streams,
int  n_streams 
)

◆ matrixVectorBinaryMult() [1/2]

template<bool rowMajor, bool bcastAlongRows>
void MLCommon::Matrix::opg::matrixVectorBinaryMult ( std::vector< Matrix::Data< double > * > &  data,
const Matrix::PartDescriptor &  inDesc,
const Matrix::Data< double > &  vec,
const raft::comms::comms_t &  comm,
cudaStream_t *  streams,
int  n_streams 
)

◆ matrixVectorBinaryMult() [2/2]

template<bool rowMajor, bool bcastAlongRows>
void MLCommon::Matrix::opg::matrixVectorBinaryMult ( std::vector< Matrix::Data< float > * > &  data,
const Matrix::PartDescriptor &  inDesc,
const Matrix::Data< float > &  vec,
const raft::comms::comms_t &  comm,
cudaStream_t *  streams,
int  n_streams 
)

◆ print() [1/2]

void MLCommon::Matrix::opg::print ( const raft::handle_t &  h,
std::vector< Matrix::Data< double > * > &  parts,
Matrix::PartDescriptor &  desc,
const char *  matrixName,
int  myRank,
cudaStream_t  stream 
)

◆ print() [2/2]

void MLCommon::Matrix::opg::print ( const raft::handle_t &  h,
std::vector< Matrix::Data< float > * > &  parts,
Matrix::PartDescriptor &  desc,
const char *  matrixName,
int  myRank,
cudaStream_t  stream 
)

◆ printRaw2D() [1/2]

void MLCommon::Matrix::opg::printRaw2D ( double *  buffer,
int  rows,
int  cols,
bool  isColMajor,
cudaStream_t  stream 
)

◆ printRaw2D() [2/2]

void MLCommon::Matrix::opg::printRaw2D ( float *  buffer,
int  rows,
int  cols,
bool  isColMajor,
cudaStream_t  stream 
)

◆ randomize() [1/2]

void MLCommon::Matrix::opg::randomize ( const raft::handle_t &  h,
raft::random::Rng &  r,
std::vector< Matrix::Data< double > * > &  parts,
Matrix::PartDescriptor &  desc,
int  myRank,
cudaStream_t  stream,
double  low = -1.0,
double  high = 1.0 
)

◆ randomize() [2/2]

void MLCommon::Matrix::opg::randomize ( const raft::handle_t &  h,
raft::random::Rng &  r,
std::vector< Matrix::Data< float > * > &  parts,
Matrix::PartDescriptor &  desc,
int  myRank,
cudaStream_t  stream,
float  low = -1.0f,
float  high = 1.0f 
)

◆ reset() [1/2]

void MLCommon::Matrix::opg::reset ( const raft::handle_t &  h,
std::vector< Matrix::Data< double > * > &  parts,
Matrix::PartDescriptor &  desc,
int  myRank,
cudaStream_t  stream 
)

◆ reset() [2/2]

void MLCommon::Matrix::opg::reset ( const raft::handle_t &  h,
std::vector< Matrix::Data< float > * > &  parts,
Matrix::PartDescriptor &  desc,
int  myRank,
cudaStream_t  stream 
)