Do not allocate memory for expected buffer if checking disabled

This allows the tests to be run with larger buffers
2026-05-01 11:58:19 +08:00 · 2021-01-20 17:08:40 -08:00 · 2021-01-20 17:08:40 -08:00 · 7677f3f608
commit 7677f3f608
parent 2f9bba9f20
1 changed files with 3 additions and 3 deletions
--- a/src/common.cu
+++ b/src/common.cu
@ -559,7 +559,7 @@ testResult_t threadLaunch(struct testThread* thread) {
 testResult_t AllocateBuffs(void **sendbuff, size_t sendBytes, void **recvbuff, size_t recvBytes, void **expected, size_t nbytes, int nranks) {
    CUDACHECK(cudaMalloc(sendbuff, nbytes));
    CUDACHECK(cudaMalloc(recvbuff, nbytes));
-    CUDACHECK(cudaMalloc(expected, recvBytes));
+    if (datacheck) CUDACHECK(cudaMalloc(expected, recvBytes));
    return testSuccess;
 }

@ -764,7 +764,7 @@ testResult_t run() {

  for (int i=0; i<nGpus*nThreads; i++) {
    CUDACHECK(cudaSetDevice(localRank*nThreads*nGpus+i));
-    AllocateBuffs(sendbuffs+i, sendBytes, recvbuffs+i, recvBytes, expected+i, (size_t)maxBytes, nProcs*nThreads*nGpus);
+    TESTCHECK(AllocateBuffs(sendbuffs+i, sendBytes, recvbuffs+i, recvBytes, expected+i, (size_t)maxBytes, nProcs*nThreads*nGpus));
    CUDACHECK(cudaStreamCreateWithFlags(streams+i, cudaStreamNonBlocking));
  }

@ -868,7 +868,7 @@ testResult_t run() {
  for (int i=0; i<nGpus*nThreads; i++) {
    CUDACHECK(cudaFree(sendbuffs[i]));
    CUDACHECK(cudaFree(recvbuffs[i]));
-    CUDACHECK(cudaFree(expected[i]));
+    if (datacheck) CUDACHECK(cudaFree(expected[i]));
  }
  CUDACHECK(cudaFreeHost(delta));