|
| AllreduceNCCLTest (const std::string &path, int worldSize) |
|
std::shared_ptr< c10d::ProcessGroup::Work > | run () |
|
| NCCLTest (const std::string &path, int worldSize) |
|
void | wait (std::shared_ptr< ProcessGroup::Work > &work) |
|
std::vector< at::Tensor > | getTensors () |
|
std::vector< std::vector< at::Tensor > > | getOutputTensors () |
|
int | numDevices () const |
|
| NCCLTestBase (const std::string &path) |
|
| NCCLTestBase (NCCLTestBase &&other) |
|
::c10d::ProcessGroupNCCL & | getProcessGroup () |
|
void | initialize (int rank, int size) |
|
|
const int | numDevices_ |
|
THCState * | state_ |
|
int | worldSize_ |
|
std::vector< at::Tensor > | inputs_ |
|
std::vector< std::vector< at::Tensor > > | outputs_ |
|
std::vector< CUDAStream > | streams_ |
|
std::string | path_ |
|
std::unique_ptr< ::c10d::ProcessGroupNCCL > | pg_ |
|
Definition at line 128 of file ProcessGroupNCCLTest.cpp.
The documentation for this class was generated from the following file: