mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-04-23 16:02:10 +00:00
chore(trtllm): update dependency towards 0.15.0
This commit is contained in:
parent
cc6bc339e5
commit
b6dbf605af
@ -10,7 +10,7 @@ COPY . .
|
|||||||
RUN cargo chef prepare --recipe-path recipe.json
|
RUN cargo chef prepare --recipe-path recipe.json
|
||||||
|
|
||||||
# CUDA dependent dependencies resolver stage
|
# CUDA dependent dependencies resolver stage
|
||||||
FROM nvidia/cuda:12.6.1-cudnn-devel-ubuntu24.04 AS cuda-builder
|
FROM nvidia/cuda:12.6.3-cudnn-devel-ubuntu24.04 AS cuda-builder
|
||||||
|
|
||||||
RUN --mount=type=cache,target=/var/cache/apt,sharing=locked \
|
RUN --mount=type=cache,target=/var/cache/apt,sharing=locked \
|
||||||
--mount=type=cache,target=/var/lib/apt,sharing=locked \
|
--mount=type=cache,target=/var/lib/apt,sharing=locked \
|
||||||
@ -18,8 +18,8 @@ RUN --mount=type=cache,target=/var/cache/apt,sharing=locked \
|
|||||||
build-essential \
|
build-essential \
|
||||||
cmake \
|
cmake \
|
||||||
curl \
|
curl \
|
||||||
gcc \
|
gcc-14 \
|
||||||
g++ \
|
g++-14 \
|
||||||
git \
|
git \
|
||||||
git-lfs \
|
git-lfs \
|
||||||
libssl-dev \
|
libssl-dev \
|
||||||
@ -86,7 +86,7 @@ RUN mkdir $TGI_INSTALL_PREFIX && mkdir "$TGI_INSTALL_PREFIX/include" && mkdir "$
|
|||||||
cd backends/trtllm && \
|
cd backends/trtllm && \
|
||||||
CMAKE_INSTALL_PREFIX=$TGI_INSTALL_PREFIX cargo build --release
|
CMAKE_INSTALL_PREFIX=$TGI_INSTALL_PREFIX cargo build --release
|
||||||
|
|
||||||
FROM nvidia/cuda:12.6.1-cudnn-runtime-ubuntu24.04 AS runtime
|
FROM nvidia/cuda:12.6.3-cudnn-runtime-ubuntu24.04 AS runtime
|
||||||
RUN apt update && apt install -y libucx0 pipx python3-minimal python3-dev python3-pip python3-venv && \
|
RUN apt update && apt install -y libucx0 pipx python3-minimal python3-dev python3-pip python3-venv && \
|
||||||
rm -rf /var/lib/{apt,dpkg,cache,log}/ && \
|
rm -rf /var/lib/{apt,dpkg,cache,log}/ && \
|
||||||
pipx ensurepath && \
|
pipx ensurepath && \
|
||||||
@ -94,6 +94,7 @@ RUN apt update && apt install -y libucx0 pipx python3-minimal python3-dev python
|
|||||||
|
|
||||||
WORKDIR /usr/local/tgi/bin
|
WORKDIR /usr/local/tgi/bin
|
||||||
|
|
||||||
|
ENV PATH=/root/.local/share/pipx/venvs/transformers/bin/:$PATH
|
||||||
ENV LD_LIBRARY_PATH="/usr/local/tgi/lib:/usr/local/mpi/lib:/usr/local/tensorrt/lib:/usr/local/cuda/lib64/stubs:$LD_LIBRARY_PATH"
|
ENV LD_LIBRARY_PATH="/usr/local/tgi/lib:/usr/local/mpi/lib:/usr/local/tensorrt/lib:/usr/local/cuda/lib64/stubs:$LD_LIBRARY_PATH"
|
||||||
ENV TOKENIZERS_PARALLELISM=false
|
ENV TOKENIZERS_PARALLELISM=false
|
||||||
ENV OMPI_MCA_plm_rsh_agent=""
|
ENV OMPI_MCA_plm_rsh_agent=""
|
||||||
|
@ -25,9 +25,9 @@ find_package(Python3 REQUIRED Interpreter)
|
|||||||
|
|
||||||
fetchcontent_declare(
|
fetchcontent_declare(
|
||||||
trtllm
|
trtllm
|
||||||
GIT_REPOSITORY https://github.com/NVIDIA/TensorRT-LLM.git
|
GIT_REPOSITORY https://github.com/huggingface/TensorRT-LLM.git
|
||||||
GIT_TAG 385626572df16175dd327fa785e4434cb7866a64
|
GIT_TAG 1bb9ca4688805444f203647674bac1d7219d0579
|
||||||
GIT_SHALLOW OFF
|
GIT_SHALLOW ON
|
||||||
DOWNLOAD_EXTRACT_TIMESTAMP
|
DOWNLOAD_EXTRACT_TIMESTAMP
|
||||||
)
|
)
|
||||||
fetchcontent_makeavailable(trtllm)
|
fetchcontent_makeavailable(trtllm)
|
||||||
|
@ -2,7 +2,7 @@
|
|||||||
|
|
||||||
set -ex
|
set -ex
|
||||||
|
|
||||||
TRT_VER_BASE="10.4.0"
|
TRT_VER_BASE="10.6.0"
|
||||||
TRT_VER_FULL="${TRT_VER_BASE}.26"
|
TRT_VER_FULL="${TRT_VER_BASE}.26"
|
||||||
CUDA_VER="12.6"
|
CUDA_VER="12.6"
|
||||||
CUDNN_VER="9.5.0.50-1"
|
CUDNN_VER="9.5.0.50-1"
|
||||||
|
Loading…
Reference in New Issue
Block a user