From e7c8825b0b5344c2b3d3317986b7b9ef257df928 Mon Sep 17 00:00:00 2001
From: David Addison
Date: Tue, 3 Jun 2025 10:36:53 -0700
Subject: [PATCH] Wrap ncclCommWindowRegister() calls within ncclGroup

---
 src/common.cu | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/src/common.cu b/src/common.cu
index 3987d89..69b892a 100644
--- a/src/common.cu
+++ b/src/common.cu
@@ -659,6 +659,7 @@ testResult_t threadInit(struct threadArgs* args) {
   }
   NCCLCHECK(ncclGroupEnd());
 #if NCCL_VERSION_CODE >= NCCL_VERSION(2,19,0)
+  NCCLCHECK(ncclGroupStart());
   void **sendRegHandles = (local_register) ? (void **)malloc(sizeof(*sendRegHandles)*args->nGpus) : NULL;
   void **recvRegHandles = (local_register) ? (void **)malloc(sizeof(*recvRegHandles)*args->nGpus) : NULL;
   for (int i=0; i<args->nGpus; i++) {
@@ -673,6 +674,7 @@ testResult_t threadInit(struct threadArgs* args) {
       if (local_register) NCCLCHECK(ncclCommRegister(args->comms[i], args->recvbuffs[i], args->maxbytes, &recvRegHandles[i]));
     }
   }
+  NCCLCHECK(ncclGroupEnd());
 #endif
 
   TESTCHECK(threadRunTests(args));
@@ -1124,6 +1126,7 @@ testResult_t run() {
     NCCLCHECK(ncclGroupEnd());
   }
 #if NCCL_VERSION_CODE >= NCCL_VERSION(2,19,0)
+  NCCLCHECK(ncclGroupStart());
   sendRegHandles = (local_register) ? (void **)malloc(sizeof(*sendRegHandles)*nThreads*nGpus) : NULL;
   recvRegHandles = (local_register) ? (void **)malloc(sizeof(*recvRegHandles)*nThreads*nGpus) : NULL;
   for (int i=0; i