From c632f8a95aefb8a549acf53939bdd0941dd5bf34 Mon Sep 17 00:00:00 2001 From: Morgan Funtowicz Date: Sun, 26 Jan 2025 11:38:00 +0100 Subject: [PATCH] backend(trtllm): Cache mode max to cache intermediate layers --- .github/workflows/build.yaml | 4 ++-- Dockerfile_trtllm | 9 ++++++--- 2 files changed, 8 insertions(+), 5 deletions(-) diff --git a/.github/workflows/build.yaml b/.github/workflows/build.yaml index 92696497..73a55efe 100644 --- a/.github/workflows/build.yaml +++ b/.github/workflows/build.yaml @@ -196,8 +196,8 @@ jobs: tags: ${{ steps.meta.outputs.tags || steps.meta-pr.outputs.tags }} labels: ${{ steps.meta.outputs.labels || steps.meta-pr.outputs.labels }} - cache-from: type=s3,region=us-east-1,bucket=ci-docker-buildx-cache,name=text-generation-inference-cache${{ env.LABEL }},mode=min,access_key_id=${{ secrets.S3_CI_DOCKER_BUILDX_CACHE_ACCESS_KEY_ID }},secret_access_key=${{ secrets.S3_CI_DOCKER_BUILDX_CACHE_SECRET_ACCESS_KEY }},mode=min - cache-to: type=s3,region=us-east-1,bucket=ci-docker-buildx-cache,name=text-generation-inference-cache${{ env.LABEL }},mode=min,access_key_id=${{ secrets.S3_CI_DOCKER_BUILDX_CACHE_ACCESS_KEY_ID }},secret_access_key=${{ secrets.S3_CI_DOCKER_BUILDX_CACHE_SECRET_ACCESS_KEY }},mode=min + cache-from: type=s3,region=us-east-1,bucket=ci-docker-buildx-cache,name=text-generation-inference-cache${{ env.LABEL }},mode=min,access_key_id=${{ secrets.S3_CI_DOCKER_BUILDX_CACHE_ACCESS_KEY_ID }},secret_access_key=${{ secrets.S3_CI_DOCKER_BUILDX_CACHE_SECRET_ACCESS_KEY }},mode=max + cache-to: type=s3,region=us-east-1,bucket=ci-docker-buildx-cache,name=text-generation-inference-cache${{ env.LABEL }},mode=min,access_key_id=${{ secrets.S3_CI_DOCKER_BUILDX_CACHE_ACCESS_KEY_ID }},secret_access_key=${{ secrets.S3_CI_DOCKER_BUILDX_CACHE_SECRET_ACCESS_KEY }},mode=max - name: Final id: final run: | diff --git a/Dockerfile_trtllm b/Dockerfile_trtllm index 42cc48c5..148d29e0 100644 --- a/Dockerfile_trtllm +++ b/Dockerfile_trtllm @@ -1,5 +1,6 @@ ARG cuda_arch_list="75-real;80-real;86-real;89-real;90-real" ARG build_type=release +ARG ompi_version=4.1.7 ARG sccache_gha_enabled=no ARG actions_cache_url="" ARG actions_runtime_token="" @@ -37,14 +38,16 @@ ENV TENSORRT_INSTALL_PREFIX=/usr/local/tensorrt FROM cuda-builder AS mpi-builder WORKDIR /opt/src/mpi +ENV OMPI_VERSION=${ompi_version} +ENV OMPI_TARBALL_FILENAME=openmpi-${OMPI_VERSION}.tar.bz2 ADD --checksum=sha256:54a33cb7ad81ff0976f15a6cc8003c3922f0f3d8ceed14e1813ef3603f22cd34 \ - https://download.open-mpi.org/release/open-mpi/v4.1/openmpi-4.1.7.tar.bz2 . + https://download.open-mpi.org/release/open-mpi/v4.1/${OMPI_TARBALL_FILENAME} . -RUN tar --strip-components=1 -xf openmpi-4.1.7.tar.bz2 &&\ +RUN tar --strip-components=1 -xf ${OMPI_TARBALL_FILENAME} &&\ ./configure --prefix=/usr/local/mpi --with-cuda=/usr/local/cuda --with-slurm && \ make -j all && \ make install && \ - rm -rf "/opt/src/openmpi-4.1.7.tar.bz2" + rm -rf ${OMPI_TARBALL_FILENAME}/.. # Install TensorRT FROM cuda-builder AS trt-builder