From e27438aac0af934f9fd721cfc5a417d8d1cfe678 Mon Sep 17 00:00:00 2001 From: Nicolas Patry Date: Mon, 25 Sep 2023 12:46:26 +0000 Subject: [PATCH] Fix dockerfile. --- Dockerfile | 6 +++--- server/Makefile-awq | 3 ++- 2 files changed, 5 insertions(+), 4 deletions(-) diff --git a/Dockerfile b/Dockerfile index f29fa107..1d57d110 100644 --- a/Dockerfile +++ b/Dockerfile @@ -121,7 +121,7 @@ FROM kernel-builder as awq-kernels-builder WORKDIR /usr/src COPY server/Makefile-awq Makefile # Build specific version of transformers -RUN TORCH_CUDA_ARCH_LIST="8.0;8.6" make build-awq +RUN TORCH_CUDA_ARCH_LIST="8.0;8.6+PTX" make build-awq # Build Transformers CUDA kernels FROM kernel-builder as custom-kernels-builder @@ -175,8 +175,8 @@ COPY --from=flash-att-v2-builder /usr/src/flash-attention-v2/build/lib.linux-x86 COPY --from=custom-kernels-builder /usr/src/build/lib.linux-x86_64-cpython-39 /opt/conda/lib/python3.9/site-packages # Copy build artifacts from exllama kernels builder COPY --from=exllama-kernels-builder /usr/src/build/lib.linux-x86_64-cpython-39 /opt/conda/lib/python3.9/site-packages -# Copy build artifacts from exllama kernels builder -COPY --from=awq-kernels-builder /usr/src/build/lib.linux-x86_64-cpython-39 /opt/conda/lib/python3.9/site-packages +# Copy build artifacts from awq kernels builder +COPY --from=awq-kernels-builder /usr/src/llm-awq/awq/kernels/build/lib.linux-x86_64-cpython-39 /opt/conda/lib/python3.9/site-packages # Copy builds artifacts from vllm builder COPY --from=vllm-builder /usr/src/vllm/build/lib.linux-x86_64-cpython-39 /opt/conda/lib/python3.9/site-packages diff --git a/server/Makefile-awq b/server/Makefile-awq index 05f3e742..80e78c08 100644 --- a/server/Makefile-awq +++ b/server/Makefile-awq @@ -1,6 +1,7 @@ awq_commit := f084f40bd996f3cf3a0633c1ad7d9d476c318aaa -awq: +awq: + rm -rf llm-awq git clone https://github.com/mit-han-lab/llm-awq build-awq: awq