mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-06-19 15:52:08 +00:00
.
This commit is contained in:
parent
e3326e6b0b
commit
0d382c4508
@ -232,10 +232,12 @@ COPY server server
|
||||
COPY server/Makefile server/Makefile
|
||||
ENV UV_SYSTEM_PYTHON=1
|
||||
RUN cd server && \
|
||||
# make gen-server && \
|
||||
make gen-server && \
|
||||
pip install -U pip uv && \
|
||||
uv pip install -r requirements_cuda.txt && \
|
||||
uv pip install -e .
|
||||
uv pip install -e . &&
|
||||
text-generation-server --help
|
||||
|
||||
# uv sync --frozen --extra attention --extra bnb --extra accelerate --extra compressed-tensors --extra marlin --extra moe --extra quantize --extra peft --extra outlines && \
|
||||
# mv ./.venv/lib/python3.11/site-packages/* /opt/conda/lib/python3.11/site-packages/
|
||||
# uv pip install nvidia-nccl-cu12==2.22.3
|
||||
|
Loading…
Reference in New Issue
Block a user