Dockerfile: switch the server dependency install to `uv sync`.

Summary of the hunk below:
  * comments out `make gen-server` and `uv pip install -r requirements_cuda.txt`;
  * runs `uv sync --frozen` with the listed extras, then moves the contents of
    ./.venv/lib/python3.11/site-packages into
    /opt/conda/lib/python3.11/site-packages;
  * comments out the LD_PRELOAD of libnccl.so.2.

NOTE(review): line breaks were restored to agree with the hunk header (12 old /
14 new lines). The leading indentation of the RUN continuation lines is assumed
to be four spaces, and the blank context line is assumed to sit just before the
LD_PRELOAD line -- confirm against the target Dockerfile before applying.
NOTE(review): `mv site-packages/*` presumably fails when a same-named, non-empty
directory already exists in the destination -- confirm this is safe here.

diff --git a/Dockerfile b/Dockerfile
index 4f272679..fd777f51 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -232,12 +232,14 @@ COPY server server
 COPY server/Makefile server/Makefile
 ENV UV_SYSTEM_PYTHON=1
 RUN cd server && \
-    make gen-server && \
+    # make gen-server && \
     pip install -U pip uv && \
-    uv pip install -r requirements_cuda.txt
+    # uv pip install -r requirements_cuda.txt
+    uv sync --frozen --extra attention --extra bnb --extra accelerate --extra compressed-tensors --extra marlin --extra moe --extra quantize --extra peft --extra outlines && \
+    mv ./.venv/lib/python3.11/site-packages/* /opt/conda/lib/python3.11/site-packages/
     # uv pip install nvidia-nccl-cu12==2.22.3
 
-ENV LD_PRELOAD=/opt/conda/lib/python3.11/site-packages/nvidia/nccl/lib/libnccl.so.2
+# ENV LD_PRELOAD=/opt/conda/lib/python3.11/site-packages/nvidia/nccl/lib/libnccl.so.2
 # Required to find libpython within the rust binaries
 ENV LD_LIBRARY_PATH="$LD_LIBRARY_PATH:/opt/conda/lib/"
 # This is needed because exl2 tries to load flash-attn