diff --git a/Dockerfile_trtllm b/Dockerfile_trtllm
index 3330abdf..da507e3d 100644
--- a/Dockerfile_trtllm
+++ b/Dockerfile_trtllm
@@ -5,8 +5,11 @@ ARG sccache_gha_enabled=off
 ARG actions_cache_url=""
 ARG actions_runtime_token=""
 
+# Must be ARG, not ENV: only ARGs declared before the first FROM can be used in FROM lines.
+ARG CUDA_BASE=12.8.0
+
 # CUDA dependent dependencies resolver stage
-FROM nvidia/cuda:12.6.3-cudnn-devel-ubuntu24.04 AS cuda-builder
+FROM nvidia/cuda:${CUDA_BASE}-cudnn-devel-ubuntu24.04 AS cuda-builder
 
 RUN apt-get update && DEBIAN_FRONTEND=noninteractive apt-get install -y \
     build-essential \
@@ -105,7 +108,7 @@ RUN export CMAKE_C_COMPILER_LAUNCHER=sccache && \
     cargo build --profile ${build_type} --package text-generation-backends-trtllm --bin text-generation-backends-trtllm && \
     sccache --show-stats
 
-FROM nvidia/cuda:12.8.0-cudnn-runtime-ubuntu24.04 AS runtime
+FROM nvidia/cuda:${CUDA_BASE}-cudnn-runtime-ubuntu24.04 AS runtime
 RUN apt update && apt install -y libucx0 pipx python3-minimal python3-dev python3-pip python3-venv && \
     rm -rf /var/lib/{apt,dpkg,cache,log}/ && \
     pipx ensurepath && \
@@ -124,7 +127,7 @@ COPY --from=tgi-builder /usr/local/tgi /usr/local/tgi
 COPY --from=tgi-builder /usr/src/text-generation-inference/target/release/text-generation-backends-trtllm /usr/local/tgi/bin/text-generation-launcher
 
 # This is used only for the CI/CD
-FROM nvidia/cuda:12.8.0-cudnn-runtime-ubuntu24.04 AS ci-runtime
+FROM nvidia/cuda:${CUDA_BASE}-cudnn-runtime-ubuntu24.04 AS ci-runtime
 RUN apt update && apt install -y libasan8 libubsan1 libucx0 pipx python3-minimal python3-dev python3-pip python3-venv && \
     rm -rf /var/lib/{apt,dpkg,cache,log}/ && \
     pipx ensurepath && \