diff --git a/docker/Dockerfile.multi b/docker/Dockerfile.multi index c41b600d1a..bd9f927182 100644 --- a/docker/Dockerfile.multi +++ b/docker/Dockerfile.multi @@ -1,8 +1,8 @@ # Multi-stage Dockerfile ARG BASE_IMAGE=gitlab-master.nvidia.com:5005/dl/dgx/pytorch -ARG TRITON_IMAGE=nvcr.io/nvidia/tritonserver +ARG TRITON_IMAGE=gitlab-master.nvidia.com:5005/dl/dgx/tritonserver ARG BASE_TAG=25.08-py3.32224057-base -ARG TRITON_BASE_TAG=25.06-py3 +ARG TRITON_BASE_TAG=25.08-RC-py3.32078257 ARG DEVEL_IMAGE=devel FROM ${BASE_IMAGE}:${BASE_TAG} AS base diff --git a/jenkins/Build.groovy b/jenkins/Build.groovy index d689de393b..dbd3cc3ec7 100644 --- a/jenkins/Build.groovy +++ b/jenkins/Build.groovy @@ -447,7 +447,7 @@ def runLLMBuild(pipeline, buildFlags, tarName, is_linux_x86_64) def llmPath = sh (script: "realpath ${LLM_ROOT}",returnStdout: true).trim() // TODO: Remove after the cmake version is upgraded to 3.31.8 // Get triton tag from docker/dockerfile.multi - def tritonShortTag = sh(script: "${LLM_ROOT}/jenkins/scripts/get_triton_tag.sh ${LLM_ROOT}", returnStdout: true).trim() + def tritonShortTag = "r25.08" sh "cd ${LLM_ROOT}/triton_backend/inflight_batcher_llm && mkdir build && cd build && cmake .. -DTRTLLM_DIR=${llmPath} -DTRITON_COMMON_REPO_TAG=${tritonShortTag} -DTRITON_CORE_REPO_TAG=${tritonShortTag} -DTRITON_THIRD_PARTY_REPO_TAG=${tritonShortTag} -DTRITON_BACKEND_REPO_TAG=${tritonShortTag} -DUSE_CXX11_ABI=ON && make -j${BUILD_JOBS} install" // Step 3: packaging wheels into tarfile