mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 12:24:53 +00:00
backend(trtllm): update to 0.16.0
This commit is contained in:
parent
bdb3e488e4
commit
dc564aa022
@ -28,7 +28,7 @@ find_package(Python3 REQUIRED Interpreter)
|
|||||||
fetchcontent_declare(
|
fetchcontent_declare(
|
||||||
trtllm
|
trtllm
|
||||||
GIT_REPOSITORY https://github.com/huggingface/TensorRT-LLM.git
|
GIT_REPOSITORY https://github.com/huggingface/TensorRT-LLM.git
|
||||||
GIT_TAG 1bb9ca4688805444f203647674bac1d7219d0579
|
GIT_TAG 42a7b0922fc9e095f173eab9a7efa0bcdceadd0d
|
||||||
GIT_SHALLOW ON
|
GIT_SHALLOW ON
|
||||||
DOWNLOAD_EXTRACT_TIMESTAMP
|
DOWNLOAD_EXTRACT_TIMESTAMP
|
||||||
)
|
)
|
||||||
|
@ -2,8 +2,8 @@
|
|||||||
|
|
||||||
set -ex
|
set -ex
|
||||||
|
|
||||||
TRT_VER_BASE="10.6.0"
|
TRT_VER_BASE="10.7.0"
|
||||||
TRT_VER_FULL="${TRT_VER_BASE}.26"
|
TRT_VER_FULL="${TRT_VER_BASE}.23"
|
||||||
CUDA_VER="12.6"
|
CUDA_VER="12.6"
|
||||||
CUDNN_VER="9.5.0.50-1"
|
CUDNN_VER="9.5.0.50-1"
|
||||||
NCCL_VER="2.22.3-1+cuda12.6"
|
NCCL_VER="2.22.3-1+cuda12.6"
|
||||||
|
Loading…
Reference in New Issue
Block a user