fastvideo.v1.distributed.device_communicators.pynccl_wrapper
Module Contents
Classes
Data
API
- class fastvideo.v1.distributed.device_communicators.pynccl_wrapper.NCCLLibrary(so_file: Optional[str] = None) [source]
Initialization
- NCCL_CHECK(result: fastvideo.v1.distributed.device_communicators.pynccl_wrapper.ncclResult_t) -> None [source]
- ncclAllGather(sendbuff: fastvideo.v1.distributed.device_communicators.pynccl_wrapper.buffer_type, recvbuff: fastvideo.v1.distributed.device_communicators.pynccl_wrapper.buffer_type, count: int, datatype: int, comm: fastvideo.v1.distributed.device_communicators.pynccl_wrapper.ncclComm_t, stream: fastvideo.v1.distributed.device_communicators.pynccl_wrapper.cudaStream_t) -> None [source]
- ncclAllReduce(sendbuff: fastvideo.v1.distributed.device_communicators.pynccl_wrapper.buffer_type, recvbuff: fastvideo.v1.distributed.device_communicators.pynccl_wrapper.buffer_type, count: int, datatype: int, op: int, comm: fastvideo.v1.distributed.device_communicators.pynccl_wrapper.ncclComm_t, stream: fastvideo.v1.distributed.device_communicators.pynccl_wrapper.cudaStream_t) -> None [source]
- ncclBroadcast(sendbuff: fastvideo.v1.distributed.device_communicators.pynccl_wrapper.buffer_type, recvbuff: fastvideo.v1.distributed.device_communicators.pynccl_wrapper.buffer_type, count: int, datatype: int, root: int, comm: fastvideo.v1.distributed.device_communicators.pynccl_wrapper.ncclComm_t, stream: fastvideo.v1.distributed.device_communicators.pynccl_wrapper.cudaStream_t) -> None [source]
- ncclCommDestroy(comm: fastvideo.v1.distributed.device_communicators.pynccl_wrapper.ncclComm_t) -> None [source]
- ncclCommInitRank(world_size: int, unique_id: fastvideo.v1.distributed.device_communicators.pynccl_wrapper.ncclUniqueId, rank: int) -> fastvideo.v1.distributed.device_communicators.pynccl_wrapper.ncclComm_t [source]
- ncclGetErrorString(result: fastvideo.v1.distributed.device_communicators.pynccl_wrapper.ncclResult_t) -> str [source]
- ncclGetUniqueId() -> fastvideo.v1.distributed.device_communicators.pynccl_wrapper.ncclUniqueId [source]
- ncclRecv(recvbuff: fastvideo.v1.distributed.device_communicators.pynccl_wrapper.buffer_type, count: int, datatype: int, src: int, comm: fastvideo.v1.distributed.device_communicators.pynccl_wrapper.ncclComm_t, stream: fastvideo.v1.distributed.device_communicators.pynccl_wrapper.cudaStream_t) -> None [source]
- ncclReduceScatter(sendbuff: fastvideo.v1.distributed.device_communicators.pynccl_wrapper.buffer_type, recvbuff: fastvideo.v1.distributed.device_communicators.pynccl_wrapper.buffer_type, count: int, datatype: int, op: int, comm: fastvideo.v1.distributed.device_communicators.pynccl_wrapper.ncclComm_t, stream: fastvideo.v1.distributed.device_communicators.pynccl_wrapper.cudaStream_t) -> None [source]
- ncclSend(sendbuff: fastvideo.v1.distributed.device_communicators.pynccl_wrapper.buffer_type, count: int, datatype: int, dest: int, comm: fastvideo.v1.distributed.device_communicators.pynccl_wrapper.ncclComm_t, stream: fastvideo.v1.distributed.device_communicators.pynccl_wrapper.cudaStream_t) -> None [source]
- class fastvideo.v1.distributed.device_communicators.pynccl_wrapper.ncclDataTypeEnum [source]
- classmethod from_torch(dtype: torch.dtype) -> int [source]
- class fastvideo.v1.distributed.device_communicators.pynccl_wrapper.ncclRedOpTypeEnum [source]
- classmethod from_torch(op: torch.distributed.ReduceOp) -> int [source]
- class fastvideo.v1.distributed.device_communicators.pynccl_wrapper.ncclUniqueId [source]
Bases: ctypes.Structure