9 #include <raft/core/handle.hpp>
10 #include <raft/random/rng.cuh>
33 float* gatheredMatrix,
41 float* gatheredMatrix,
68 void reset(
const raft::handle_t& h,
74 void printRaw2D(
float* buffer,
int rows,
int cols,
bool isColMajor, cudaStream_t stream);
76 void print(
const raft::handle_t& h,
79 const char* matrixName,
100 cudaStream_t stream);
103 double* gatheredMatrix,
108 cudaStream_t stream);
111 double* gatheredMatrix,
115 cudaStream_t stream);
121 cudaStream_t stream);
127 cudaStream_t stream);
130 raft::random::Rng& r,
142 cudaStream_t stream);
144 void printRaw2D(
double* buffer,
int rows,
int cols,
bool isColMajor, cudaStream_t stream);
149 const char* matrixName,
151 cudaStream_t stream);
void printRaw2D(float *buffer, int rows, int cols, bool isColMajor, cudaStream_t stream)
void allGather(const raft::handle_t &h, float *gatheredMatrix, std::vector< Matrix::Data< float > * > &parts, Matrix::PartDescriptor &desc, int myRank, cudaStream_t stream)
void gather(const raft::handle_t &h, float *gatheredMatrix, std::vector< Matrix::Data< float > * > &parts, Matrix::PartDescriptor &desc, int rootRank, int myRank, cudaStream_t stream)
void deallocate(const raft::handle_t &h, std::vector< Matrix::Data< float > * > &parts, Matrix::PartDescriptor &desc, int myRank, cudaStream_t stream)
void allGatherPart(const raft::handle_t &h, float *gatheredPart, std::vector< Matrix::Data< float > * > &parts, Matrix::PartDescriptor &desc, int partIndex, int myRank, cudaStream_t stream)
void randomize(const raft::handle_t &h, raft::random::Rng &r, std::vector< Matrix::Data< float > * > &parts, Matrix::PartDescriptor &desc, int myRank, cudaStream_t stream, float low=-1.0f, float high=1.0f)
void reset(const raft::handle_t &h, std::vector< Matrix::Data< float > * > &parts, Matrix::PartDescriptor &desc, int myRank, cudaStream_t stream)
void print(const raft::handle_t &h, std::vector< Matrix::Data< float > * > &parts, Matrix::PartDescriptor &desc, const char *matrixName, int myRank, cudaStream_t stream)
void gatherPart(const raft::handle_t &h, float *gatheredPart, std::vector< Matrix::Data< float > * > &parts, Matrix::PartDescriptor &desc, int partIndex, int rootRank, int myRank, cudaStream_t stream)
void allocate(const raft::handle_t &h, std::vector< Matrix::Data< float > * > &parts, Matrix::PartDescriptor &desc, int myRank, cudaStream_t stream)
Definition: comm_utils.h:11
This is a helper wrapper around the multi-gpu data blocks owned by a worker. Its design is NOT final...
Definition: data.hpp:18
Definition: part_descriptor.hpp:40