From 43b0229da0e28846707669a660c2c2be210f88d4 Mon Sep 17 00:00:00 2001
From: OlivierDehaene <23298448+OlivierDehaene@users.noreply.github.com>
Date: Tue, 23 May 2023 15:53:09 +0200
Subject: [PATCH] run on host

---
Note: this hunk adds an "Install k6" step that downloads and unpacks the
k6 v0.44.0 linux-amd64 release tarball, and replaces the k6io/action@v0.1
step with a plain `run` step that invokes ./k6 on k6/starcoder_load.js.

 .github/workflows/load_test.yaml | 11 +++++++----
 1 file changed, 7 insertions(+), 4 deletions(-)

diff --git a/.github/workflows/load_test.yaml b/.github/workflows/load_test.yaml
index 1ded9abb..e5b61e92 100644
--- a/.github/workflows/load_test.yaml
+++ b/.github/workflows/load_test.yaml
@@ -64,16 +64,19 @@ jobs:
           sudo mkdir ${{ env.DOCKER_VOLUME }}
           sudo mount /dev/nvme1n1 ${{ env.DOCKER_VOLUME }}
 
+      - name: Install k6
+        run: |
+          curl https://github.com/grafana/k6/releases/download/v0.44.0/k6-v0.44.0-linux-amd64.tar.gz -L | tar xvz --strip-components 1
+
       - name: Start starcoder
         run: |
           docker run --name tgi-starcoder --rm --gpus all -p 3000:80 -v ${{ env.DOCKER_VOLUME }}:/data -e HUGGING_FACE_HUB_TOKEN=${{ secrets.HUGGING_FACE_HUB_TOKEN }} --pull always -d ghcr.io/huggingface/text-generation-inference:latest --model-id bigcode/starcoder --num-shard 2 --max-batch-total-tokens 32768
           sleep 10
           wget --timeout 10 --retry-on-http-error --waitretry=1 --tries=240 http://localhost:3000/health
 
-      - name: Run k6 cloud test
-        uses: k6io/action@v0.1
-        with:
-          filename: k6/starcoder_load.js
+      - name: Run k6
+        run: |
+          ./k6 run k6/starcoder_load.js
 
       - name: Stop starcoder
         if: ${{ always() }}