replace std::min with min inside CUDA kernel

2026-01-13 22:18:36 +08:00 · 2024-08-23 15:11:37 +08:00 · 2024-08-23 15:11:37 +08:00 · 6dfa8df479
commit 6dfa8df479
parent ca34331e98
1 changed files with 1 additions and 1 deletions
--- a/cpp/tensorrt_llm/kernels/customAllReduceKernels.cu
+++ b/cpp/tensorrt_llm/kernels/customAllReduceKernels.cu
@ -612,7 +612,7 @@ static __global__ void oneShotAllReduceKernel(AllReduceParams params)

    // Start and end offsets of the thread
    size_t const chunk_start = bidx * params.elts_per_block + tidx * PACKED_ELTS;
-    size_t const chunk_end = std::min((bidx + 1) * params.elts_per_block, params.elts_total);
+    size_t const chunk_end = min((bidx + 1) * params.elts_per_block, params.elts_total);

    T* buffers[RANKS_PER_NODE];
 #pragma unroll