From 772c3774dfaf547a4c0954e2d1ebcbdb6ac79e24 Mon Sep 17 00:00:00 2001 From: OlivierDehaene <23298448+OlivierDehaene@users.noreply.github.com> Date: Fri, 12 Apr 2024 14:18:58 +0200 Subject: [PATCH] remove unused kernels --- Dockerfile | 1 + server/Makefile-vllm | 2 +- 2 files changed, 2 insertions(+), 1 deletion(-) diff --git a/Dockerfile b/Dockerfile index 54b160eb..53f0f8d3 100644 --- a/Dockerfile +++ b/Dockerfile @@ -248,6 +248,7 @@ ENTRYPOINT ["./entrypoint.sh"] FROM base COPY ./tgi-entrypoint.sh /tgi-entrypoint.sh +RUN chmod +x /tgi-entrypoint.sh ENTRYPOINT ["/tgi-entrypoint.sh"] CMD ["--json-output"] diff --git a/server/Makefile-vllm b/server/Makefile-vllm index ada484a6..9999ad89 100644 --- a/server/Makefile-vllm +++ b/server/Makefile-vllm @@ -4,7 +4,7 @@ vllm-cuda: git clone https://github.com/OlivierDehaene/vllm.git vllm build-vllm-cuda: vllm-cuda - cd vllm && git fetch && git checkout 4bec8cee87f6bb8cebaec297029713cd2082e0b2 + cd vllm && git fetch && git checkout 3d4693536dcb69f036c26b016a35839b99ebed59 cd vllm && python setup.py build install-vllm-cuda: build-vllm-cuda