From b7b0fd0e35501151cedd81281b919da6acf2bfe8 Mon Sep 17 00:00:00 2001 From: Morgan Funtowicz Date: Sat, 21 Dec 2024 12:12:45 +0100 Subject: [PATCH] misc(backend): attempt to run the testS? --- .github/workflows/build_trtllm.yaml | 13 +++++++++++++ 1 file changed, 13 insertions(+) diff --git a/.github/workflows/build_trtllm.yaml b/.github/workflows/build_trtllm.yaml index 19fc4bfc..63c36403 100644 --- a/.github/workflows/build_trtllm.yaml +++ b/.github/workflows/build_trtllm.yaml @@ -118,5 +118,18 @@ jobs: cache-from: type=s3,region=us-east-1,bucket=ci-docker-buildx-cache,name=text-generation-inference-cache-${{ env.LABEL }},mode=min,access_key_id=${{ secrets.S3_CI_DOCKER_BUILDX_CACHE_ACCESS_KEY_ID }},secret_access_key=${{ secrets.S3_CI_DOCKER_BUILDX_CACHE_SECRET_ACCESS_KEY }},mode=min cache-to: type=s3,region=us-east-1,bucket=ci-docker-buildx-cache,name=text-generation-inference-cache-${{ env.LABEL }},mode=min,access_key_id=${{ secrets.S3_CI_DOCKER_BUILDX_CACHE_ACCESS_KEY_ID }},secret_access_key=${{ secrets.S3_CI_DOCKER_BUILDX_CACHE_SECRET_ACCESS_KEY }},mode=min + tests: + runs-on: + group: aws-g6-12xl-plus-priv-cache + container: + image: + registry.internal.huggingface.tech/api-inference/community/text-generation-inference/tensorrt-llm:${{ env.LABEL }} + credentials: + username: ${{ secrets.REGISTRY_USERNAME }} + password: ${{ secrets.REGISTRY_PASSWORD }} + options: --gpus all --net=host + steps: + - name: Run C++/CUDA tests + run: /usr/local/tgi/tgi_trtllm_backend_tests
# Review notes for the patch above (commentary only; the patch text is unchanged).
#
# Purpose: the hunk adds a `tests` job to .github/workflows/build_trtllm.yaml.
# The job runs on the `aws-g6-12xl-plus-priv-cache` runner group, inside the
# `tensorrt-llm:<LABEL>` container image pulled from
# registry.internal.huggingface.tech with the REGISTRY_USERNAME /
# REGISTRY_PASSWORD secrets, and its single step executes
# /usr/local/tgi/tgi_trtllm_backend_tests.
#
# NOTE(review): the added job declares no `needs:`. As written it is not
# sequenced after whichever job builds and pushes the image it pulls, so it
# may start before that image exists. The build job's id is outside this
# hunk - confirm it and add `needs: <that job>`.
#
# NOTE(review): `container.image` interpolates `${{ env.LABEL }}`. GitHub's
# context-availability table does not list `env` for
# `jobs.<job_id>.container.image`, and where LABEL is defined is not visible
# here. If it is exported through GITHUB_ENV by a step in another job, it
# will not be visible in this job either. Presumably the label has to be
# published as a job output and read via `needs.<job>.outputs.<name>` - TODO
# confirm against the rest of the workflow.
#
# NOTE(review): `options:` passes `--net=host`. GitHub's workflow-syntax
# documentation states that `--network` is not supported in
# `container.options` - confirm the runner accepts this flag.
#
# NOTE(review): there is no checkout step; the test binary is invoked by
# absolute path, so it is presumably baked into the image - verify.