From dc564aa022f97543af94d1757dfa29eb2456dbd8 Mon Sep 17 00:00:00 2001
From: Morgan Funtowicz
Date: Tue, 21 Jan 2025 14:46:21 +0100
Subject: [PATCH] backend(trtllm): update to 0.16.0

---
Notes (review):
    - Hunk 1 swaps the pinned GIT_TAG commit of the TensorRT-LLM fetch.
    - Hunk 2 moves TRT_VER_BASE from 10.6.0 to 10.7.0 and the TRT_VER_FULL
      suffix from .26 to .23.
    - NOTE(review): GIT_SHALLOW ON is kept (unchanged context) while GIT_TAG
      is a commit hash; CMake's ExternalProject documentation restricts
      shallow clones to branch names and tags -- TODO confirm the fetch
      still resolves this hash.
    - NOTE(review): leading whitespace of the cmake context lines below was
      reconstructed -- verify against the target tree before applying.

 backends/trtllm/cmake/trtllm.cmake          | 2 +-
 backends/trtllm/scripts/install_tensorrt.sh | 4 ++--
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/backends/trtllm/cmake/trtllm.cmake b/backends/trtllm/cmake/trtllm.cmake
index d789b1eb..5a0715bc 100644
--- a/backends/trtllm/cmake/trtllm.cmake
+++ b/backends/trtllm/cmake/trtllm.cmake
@@ -28,7 +28,7 @@ find_package(Python3 REQUIRED Interpreter)
 fetchcontent_declare(
         trtllm
         GIT_REPOSITORY https://github.com/huggingface/TensorRT-LLM.git
-        GIT_TAG 1bb9ca4688805444f203647674bac1d7219d0579
+        GIT_TAG 42a7b0922fc9e095f173eab9a7efa0bcdceadd0d
         GIT_SHALLOW ON
         DOWNLOAD_EXTRACT_TIMESTAMP
 )
diff --git a/backends/trtllm/scripts/install_tensorrt.sh b/backends/trtllm/scripts/install_tensorrt.sh
index 7deb2fe8..f3e7270a 100755
--- a/backends/trtllm/scripts/install_tensorrt.sh
+++ b/backends/trtllm/scripts/install_tensorrt.sh
@@ -2,8 +2,8 @@
 
 set -ex
 
-TRT_VER_BASE="10.6.0"
-TRT_VER_FULL="${TRT_VER_BASE}.26"
+TRT_VER_BASE="10.7.0"
+TRT_VER_FULL="${TRT_VER_BASE}.23"
 CUDA_VER="12.6"
 CUDNN_VER="9.5.0.50-1"
 NCCL_VER="2.22.3-1+cuda12.6"