diff --git a/torch/csrc/distributed/c10d/ProcessGroupNCCL.cpp b/torch/csrc/distributed/c10d/ProcessGroupNCCL.cpp index d6f3e0d42e1..2da127e5b26 100644 --- a/torch/csrc/distributed/c10d/ProcessGroupNCCL.cpp +++ b/torch/csrc/distributed/c10d/ProcessGroupNCCL.cpp @@ -1371,9 +1371,6 @@ void ProcessGroupNCCL::abortCommsFromMap( const std::optional& abortReason) { // The process may control multiple devices, loop through the communicators on // each device - // NCCL expects Group abort when there are multiple communicators created in a - // device. - groupStart(); for (auto& it : ncclCommsMap) { auto& devName = it.first; auto& ncclComm = it.second; @@ -1394,7 +1391,6 @@ void ProcessGroupNCCL::abortCommsFromMap( VLOG(2) << logPrefix() << "ProcessGroupNCCL destroyed " << " communicator on CUDA device: " << devName; } - groupEnd(); } // Abort all communicators on this rank