mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-04-27 21:12:07 +00:00
Bump llama.cpp
Signed-off-by: Adrien Gallouët <angt@huggingface.co>
This commit is contained in:
parent
2d4aa25b9c
commit
46bc8e6bc7
@ -1,6 +1,6 @@
|
|||||||
FROM nvidia/cuda:12.8.0-cudnn-devel-ubuntu24.04 AS deps
|
FROM nvidia/cuda:12.8.0-cudnn-devel-ubuntu24.04 AS deps
|
||||||
|
|
||||||
ARG llamacpp_version=b4651
|
ARG llamacpp_version=b4714
|
||||||
ARG llamacpp_cuda=OFF
|
ARG llamacpp_cuda=OFF
|
||||||
ARG cuda_arch=75-real;80-real;86-real;89-real;90-real
|
ARG cuda_arch=75-real;80-real;86-real;89-real;90-real
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user