triton-inference-server · kaiyux · Mar 18, 2025 · Mar 18, 2025 · Mar 18, 2025
diff --git a/ci/L0_backend_trtllm/generate_engines.sh b/ci/L0_backend_trtllm/generate_engines.sh
@@ -61,9 +61,6 @@ function build_tensorrt_engine_inflight_batcher {
     cd ${BASE_DIR}
 }
 
-# Downgrade to legacy version to accommodate Triton CI runners
-pip install pynvml==11.4.0
-
 # Generate the TRT_LLM model engines
 NUM_GPUS_TO_TEST=("1" "2" "4")
 for NUM_GPU in "${NUM_GPUS_TO_TEST[@]}"; do

diff --git a/tensorrt_llm b/tensorrt_llm
diff --git a/tools/version.txt b/tools/version.txt
@@ -1 +1 @@
-cf950ea521ca66fa3e3383545e60e4212d2de547
+85bc9eaf686c2a77c364b30c51e7f844ad6b47eb
Original file line number	Diff line number	Diff line change
		@@ -1 +1 @@
		cf950ea521ca66fa3e3383545e60e4212d2de547
		85bc9eaf686c2a77c364b30c51e7f844ad6b47eb