Skip to content

TPRD-1540: Update 'build.sh' #755

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Draft
Draft — wants to merge 1 commit into base branch mchrornyi/0.19.
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
20 changes: 10 additions & 10 deletions build.sh
Diff of build.sh (original line numbers vs. changed line numbers):
@@ -1,14 +1,14 @@
#!/bin/bash

git lfs install
(git lfs env) || git lfs install
git submodule update --init --recursive

# Default values will be used if not set
BASE_IMAGE=${BASE_IMAGE:-nvcr.io/nvidia/tritonserver:24.11-py3-min}
PYTORCH_IMAGE=${PYTORCH_IMAGE:-nvcr.io/nvidia/pytorch:24.11-py3}
TRT_VERSION=${TRT_VERSION:-10.7.0.23}
TRT_URL_x86=${TRT_URL_x86:-https://developer.nvidia.com/downloads/compute/machine-learning/tensorrt/10.7.0/tars/TensorRT-${TRT_VERSION}.Linux.x86_64-gnu.cuda-12.6.tar.gz}
TRT_URL_ARM=${TRT_URL_ARM:-https://developer.nvidia.com/downloads/compute/machine-learning/tensorrt/10.7.0/tars/TensorRT-${TRT_VERSION}.ubuntu-24.04.aarch64-gnu.cuda-12.6.tar.gz}
BASE_IMAGE=${BASE_IMAGE:-nvcr.io/nvidia/tritonserver:25.03-py3-min}
PYTORCH_IMAGE=${PYTORCH_IMAGE:-nvcr.io/nvidia/pytorch:25.03-py3}
TRT_VERSION=${TRT_VERSION:-10.9.0.34}
TRT_URL_x86=${TRT_URL_x86:-https://developer.nvidia.com/downloads/compute/machine-learning/tensorrt/10.9.0/tars/TensorRT-${TRT_VERSION}.Linux.x86_64-gnu.cuda-12.8.tar.gz}
TRT_URL_ARM=${TRT_URL_ARM:-https://developer.nvidia.com/downloads/compute/machine-learning/tensorrt/10.9.0/tars/TensorRT-${TRT_VERSION}.ubuntu-24.04.aarch64-gnu.cuda-12.8.tar.gz}

# Build the TRT-LLM base image that has TRT-LLM installed and will be used as
# the base image for building Triton server and TRT-LLM backend.
@@ -24,7 +24,7 @@ docker build -t trtllm_base \
cd ../
# Need to use the aligned version of the Triton server repository.
# Refer to the support matrix for the aligned version: https://docs.nvidia.com/deeplearning/frameworks/support-matrix/index.html
TRITON_SERVER_REPO_TAG=${TRITON_SERVER_REPO_TAG:-r24.11}
TRITON_SERVER_REPO_TAG=${TRITON_SERVER_REPO_TAG:-r25.05}
git clone -b ${TRITON_SERVER_REPO_TAG} https://github.com/triton-inference-server/server.git
cd server

@@ -33,8 +33,8 @@ cd server
# the tags of the TensorRT-LLM backend and Python backend repositories that will
# be used to build the container.
TRTLLM_BASE_IMAGE=${TRTLLM_BASE_IMAGE:-trtllm_base}
TENSORRTLLM_BACKEND_REPO_TAG=${TENSORRTLLM_BACKEND_REPO_TAG:-v0.15.0}
PYTHON_BACKEND_REPO_TAG=${PYTHON_BACKEND_REPO_TAG:-r24.11}
TENSORRTLLM_BACKEND_REPO_TAG=${TENSORRTLLM_BACKEND_REPO_TAG:-v0.19.0}
PYTHON_BACKEND_REPO_TAG=${PYTHON_BACKEND_REPO_TAG:-r25.05}

TRITON_GITHUB_ORGANIZATION=${TRITON_GITHUB_ORGANIZATION:-}
if [ "$TRITON_GITHUB_ORGANIZATION" != "" ]
@@ -62,4 +62,4 @@ fi
--image=base,${TRTLLM_BASE_IMAGE} \
--backend=tensorrtllm:${TENSORRTLLM_BACKEND_REPO_TAG} \
--backend=python:${PYTHON_BACKEND_REPO_TAG} \
"${GITHUB_ORGANIZATION}" "${CONTAINER_PREBUILD_COMMAND}"
${GITHUB_ORGANIZATION} ${CONTAINER_PREBUILD_COMMAND}