Change deploy.

This commit is contained in:
Nicolas Patry 2023-09-25 09:01:07 +00:00
parent 27ecef5153
commit a8f870aa75
3 changed files with 13 additions and 1 deletions

View File

@ -157,7 +157,6 @@ WORKDIR /usr/src
# Install the system packages needed in this stage, then drop the apt package
# lists so they do not stay in the image layer.
RUN apt-get update && DEBIAN_FRONTEND=noninteractive apt-get install -y --no-install-recommends \
    libssl-dev \
    ca-certificates \
    # git: necessary for non-standard package AWQ.
    # (Kept on its own line: a comment placed after the trailing backslash
    # stops that line from being a continuation.)
    git \
    make \
    && rm -rf /var/lib/apt/lists/*

1
server/.gitignore vendored
View File

@ -159,3 +159,4 @@ safetensors
flash-attention/
flash-attention-v2/
vllm/
llm-awq/

12
server/Makefile-awq Normal file
View File

@ -0,0 +1,12 @@
# Pinned llm-awq commit; build-awq checks this revision out before building
# the extension under llm-awq/awq/kernels.
awq_commit := f084f40bd996f3cf3a0633c1ad7d9d476c318aaa
# awq: fetch the llm-awq sources into ./llm-awq.
# Declared phony because the recipe does not create a file named "awq".
# The clone is skipped when a checkout is already present, so targets that
# depend on this one can be re-run (a plain `git clone` fails when the
# destination directory already exists and is not empty).
.PHONY: awq
awq:
	test -d llm-awq/.git || git clone https://github.com/mit-han-lab/llm-awq
# build-awq: check out the pinned revision and build the extension that lives
# in llm-awq/awq/kernels.
# Declared phony because no file named "build-awq" is produced.
# Each recipe line runs in its own shell, hence the repeated `cd`.
.PHONY: build-awq
build-awq: awq
	cd llm-awq/ && git fetch && git checkout $(awq_commit)
	cd llm-awq/awq/kernels && python setup.py build
# install-awq: install the extension built from llm-awq/awq/kernels into the
# active Python environment.
# Declared phony because no file named "install-awq" is produced.
.PHONY: install-awq
install-awq: build-awq
	# Best-effort removal of a previously installed copy; `|| true` keeps the
	# target going if the uninstall step reports a failure.
	pip uninstall awq_inference_engine -y || true
	cd llm-awq/awq/kernels && python setup.py install