mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-06-19 15:52:08 +00:00
The good old monkey.
This commit is contained in:
parent
830c25dd5a
commit
19ea893956
@@ -232,12 +232,14 @@ COPY server server
|
||||
COPY server/Makefile server/Makefile
|
||||
ENV UV_SYSTEM_PYTHON=1
|
||||
RUN cd server && \
|
||||
make gen-server && \
|
||||
# make gen-server && \
|
||||
pip install -U pip uv && \
|
||||
uv pip install -r requirements_cuda.txt
|
||||
# uv pip install -r requirements_cuda.txt
|
||||
uv sync --frozen --extra attention --extra bnb --extra accelerate --extra compressed-tensors --extra marlin --extra moe --extra quantize --extra peft --extra outlines && \
|
||||
mv ./.venv/lib/python3.11/site-packages/* /opt/conda/lib/python3.11/site-packages/
|
||||
# uv pip install nvidia-nccl-cu12==2.22.3
|
||||
|
||||
ENV LD_PRELOAD=/opt/conda/lib/python3.11/site-packages/nvidia/nccl/lib/libnccl.so.2
|
||||
# ENV LD_PRELOAD=/opt/conda/lib/python3.11/site-packages/nvidia/nccl/lib/libnccl.so.2
|
||||
# Required to find libpython within the rust binaries
|
||||
ENV LD_LIBRARY_PATH="$LD_LIBRARY_PATH:/opt/conda/lib/"
|
||||
# This is needed because exl2 tries to load flash-attn
|
||||
|
Loading…
Reference in New Issue
Block a user