mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 12:24:53 +00:00
misc(ci): wtfinfini
This commit is contained in:
parent
3c7710c0db
commit
79469be32a
26
.github/workflows/build_trtllm.yaml
vendored
26
.github/workflows/build_trtllm.yaml
vendored
@ -16,7 +16,7 @@ on:
|
|||||||
value: ${{ jobs.build-and-push.outputs.label }}
|
value: ${{ jobs.build-and-push.outputs.label }}
|
||||||
|
|
||||||
jobs:
|
jobs:
|
||||||
build-trtllm-and-push:
|
build-and-push:
|
||||||
permissions:
|
permissions:
|
||||||
contents: read # Required to check out repository.
|
contents: read # Required to check out repository.
|
||||||
id-token: write # Required to authenticate via OIDC.
|
id-token: write # Required to authenticate via OIDC.
|
||||||
@ -131,4 +131,28 @@ jobs:
|
|||||||
echo "docker_image=registry.internal.huggingface.tech/api-inference/community/text-generation-inference/tensorrt-llm:sha-${{ env.GITHUB_SHA_SHORT }}${{ env.LABEL }}" >> "$GITHUB_OUTPUT"
|
echo "docker_image=registry.internal.huggingface.tech/api-inference/community/text-generation-inference/tensorrt-llm:sha-${{ env.GITHUB_SHA_SHORT }}${{ env.LABEL }}" >> "$GITHUB_OUTPUT"
|
||||||
echo "label=${{ env.LABEL }}" >> "$GITHUB_OUTPUT"
|
echo "label=${{ env.LABEL }}" >> "$GITHUB_OUTPUT"
|
||||||
|
|
||||||
|
run-tests:
|
||||||
|
needs: build-and-push
|
||||||
|
concurrency:
|
||||||
|
group: ${{ github.workflow }}-${{ github.job }}-trtllm-${{ github.head_ref || github.run_id }}
|
||||||
|
cancel-in-progress: true
|
||||||
|
runs-on:
|
||||||
|
group: aws-g6-12xl-plus-priv-cache
|
||||||
|
container:
|
||||||
|
image: ${{ needs.build-and-push.outputs.docker_image }}
|
||||||
|
credentials:
|
||||||
|
username: ${{ secrets.REGISTRY_USERNAME }}
|
||||||
|
password: ${{ secrets.REGISTRY_PASSWORD }}
|
||||||
|
options: --gpus all --shm-size=8g
|
||||||
|
|
||||||
|
steps:
|
||||||
|
- name: whoami
|
||||||
|
run: |
|
||||||
|
echo "Container: ${{ needs.build-and-push.outputs.docker_image }}"
|
||||||
|
|
||||||
|
- name: List binaries
|
||||||
|
run: ls -alh /usr/local/tgi
|
||||||
|
|
||||||
|
- name: Run C++/CUDA tests
|
||||||
|
run: /usr/local/tgi/bin/tgi_trtllm_backend_tests
|
||||||
|
|
||||||
|
56
.github/workflows/trtllm_tests.yaml
vendored
56
.github/workflows/trtllm_tests.yaml
vendored
@ -1,56 +0,0 @@
|
|||||||
name: "TensorRT-LLM C/C++/CUDA Test Suite"
|
|
||||||
on:
|
|
||||||
push:
|
|
||||||
branches:
|
|
||||||
- 'main'
|
|
||||||
- 'trtllm/ci'
|
|
||||||
tags:
|
|
||||||
- 'v*'
|
|
||||||
pull_request:
|
|
||||||
paths:
|
|
||||||
- "backends/trtllm"
|
|
||||||
- "server/**"
|
|
||||||
- "proto/**"
|
|
||||||
- "router/**"
|
|
||||||
- "launcher/**"
|
|
||||||
- "Cargo.lock"
|
|
||||||
- "rust-toolchain.toml"
|
|
||||||
- ".github/workflows/build_trtllm.yaml"
|
|
||||||
- ".github/workflows/trtllm_tests.yaml"
|
|
||||||
branches:
|
|
||||||
- "main"
|
|
||||||
|
|
||||||
jobs:
|
|
||||||
build-backend:
|
|
||||||
permissions:
|
|
||||||
contents: write
|
|
||||||
packages: write
|
|
||||||
id-token: write
|
|
||||||
uses: ./.github/workflows/build_trtllm.yaml
|
|
||||||
with:
|
|
||||||
runs-on: aws-highmemory-64-plus-priv
|
|
||||||
secrets: inherit
|
|
||||||
|
|
||||||
run-tests:
|
|
||||||
needs: build-backend
|
|
||||||
concurrency:
|
|
||||||
group: ${{ github.workflow }}-${{ github.job }}-trtllm-${{ github.head_ref || github.run_id }}
|
|
||||||
cancel-in-progress: true
|
|
||||||
runs-on:
|
|
||||||
group: aws-g6-12xl-plus-priv-cache
|
|
||||||
container:
|
|
||||||
image: ${{ needs.build-backend.outputs.docker_image }}
|
|
||||||
credentials:
|
|
||||||
username: ${{ secrets.REGISTRY_USERNAME }}
|
|
||||||
password: ${{ secrets.REGISTRY_PASSWORD }}
|
|
||||||
options: --gpus all --shm-size=8g
|
|
||||||
|
|
||||||
steps:
|
|
||||||
- name: whoami
|
|
||||||
run: |
|
|
||||||
echo "Container: ${{ needs.build-backend.outputs.docker_image }}"
|
|
||||||
- name: List binaries
|
|
||||||
run: ls -alh /usr/local/tgi
|
|
||||||
|
|
||||||
- name: Run C++/CUDA tests
|
|
||||||
run: /usr/local/tgi/bin/tgi_trtllm_backend_tests
|
|
Loading…
Reference in New Issue
Block a user