From caea58aba405f02c3ff6b6f19c9974e60a9d8b48 Mon Sep 17 00:00:00 2001 From: Xiwen Yu <13230610+VALLIS-NERIA@users.noreply.github.com> Date: Mon, 8 Sep 2025 11:28:39 +0800 Subject: [PATCH] increase build memory Signed-off-by: Xiwen Yu <13230610+VALLIS-NERIA@users.noreply.github.com> --- .../moe_gemm/launchers/moe_gemm_tma_ws_launcher.inl | 10 ++-------- jenkins/Build.groovy | 6 +++--- 2 files changed, 5 insertions(+), 11 deletions(-) diff --git a/cpp/tensorrt_llm/kernels/cutlass_kernels/moe_gemm/launchers/moe_gemm_tma_ws_launcher.inl b/cpp/tensorrt_llm/kernels/cutlass_kernels/moe_gemm/launchers/moe_gemm_tma_ws_launcher.inl index 4223f5fddf..fdd00f7b2c 100644 --- a/cpp/tensorrt_llm/kernels/cutlass_kernels/moe_gemm/launchers/moe_gemm_tma_ws_launcher.inl +++ b/cpp/tensorrt_llm/kernels/cutlass_kernels/moe_gemm/launchers/moe_gemm_tma_ws_launcher.inl @@ -141,14 +141,8 @@ void tma_warp_specialized_generic_moe_gemm_kernelLauncher(TmaWarpSpecializedGrou #ifndef COMPILE_BLACKWELL_SM103_TMA_GROUPED_GEMMS else if constexpr (ArchTag::kMinComputeCapability == 103) { - static bool first_time = true; - if (first_time) - { - TLLM_LOG_WARNING( - "Falling back to sm100f version. For best performance please recompile with support for blackwell by " - "passing 103-real as an arch to build_wheel.py."); - first_time = false; - } + // fallback sm100f logic is done in dispatchMoeGemmFinalDispatchTmaWarpSpecialized + TLLM_THROW("Please recompile with support for blackwell by passing 103-real as an arch to build_wheel.py."); } #endif #ifndef COMPILE_BLACKWELL_SM120_TMA_GROUPED_GEMMS diff --git a/jenkins/Build.groovy b/jenkins/Build.groovy index e8522118dd..a5594d0e2e 100644 --- a/jenkins/Build.groovy +++ b/jenkins/Build.groovy @@ -112,7 +112,7 @@ def BUILD_CONFIGS = [ (WHEEL_EXTRA_ARGS) : "--extra-cmake-vars WARNING_IS_ERROR=ON -DCMAKE_C_COMPILER=clang -DCMAKE_CXX_COMPILER=clang++ -DCMAKE_CUDA_HOST_COMPILER=clang -DCMAKE_LINKER_TYPE=LLD", (TARNAME) : "llvm-TensorRT-LLM-GH200.tar.gz", (WHEEL_ARCHS): "90-real;100-real;103-real;120-real", - (BUILD_JOBS_FOR_CONFIG): "4", // TODO: Remove after fix the build OOM issue on SBSA + // (BUILD_JOBS_FOR_CONFIG): "4", // TODO: Remove after fix the build OOM issue on SBSA ], ] @@ -131,8 +131,8 @@ def globalVars = [ // TODO: Move common variables to an unified location BUILD_CORES_REQUEST = "8" BUILD_CORES_LIMIT = "8" -BUILD_MEMORY_REQUEST = "48Gi" -BUILD_MEMORY_LIMIT = "64Gi" +BUILD_MEMORY_REQUEST = "64Gi" +BUILD_MEMORY_LIMIT = "80Gi" BUILD_JOBS = "8" TESTER_CORES = "12"