mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-06-19 15:52:08 +00:00
Cleanup Dockerfile
Signed-off-by: Adrien Gallouët <angt@huggingface.co>
This commit is contained in:
parent
df2a4fbb8a
commit
906c265aef
@@ -55,9 +55,6 @@ RUN cargo build \
|
||||
--profile release-opt \
|
||||
--package text-generation-router-llamacpp --frozen
|
||||
|
||||
# fix libcuda.so.1 ?
|
||||
RUN cp "$(pkg-config --variable=libdir cuda-12.6)"/stubs/libcuda.so /usr/lib/libcuda.so.1
|
||||
|
||||
FROM nvidia/cuda:12.6.3-cudnn-runtime-ubuntu24.04
|
||||
|
||||
RUN apt update && apt install -y \
|
||||
@@ -72,7 +69,6 @@ RUN pip3 install --no-cache-dir -r requirements.txt
|
||||
|
||||
COPY --from=builder /usr/lib/libllama.so /usr/lib/
|
||||
COPY --from=builder /usr/lib/libggml*.so /usr/lib/
|
||||
COPY --from=builder /usr/lib/libcuda.so.1 /usr/lib/
|
||||
COPY --from=builder /app/target/release-opt/text-generation-router-llamacpp /usr/bin/
|
||||
|
||||
ENTRYPOINT ["text-generation-router-llamacpp"]
|
||||
|
Loading…
Reference in New Issue
Block a user