mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-04-27 13:02:12 +00:00
Bump llama.cpp
Signed-off-by: Adrien Gallouët <angt@huggingface.co>
This commit is contained in:
parent
2d4aa25b9c
commit
46bc8e6bc7
@ -1,6 +1,6 @@
|
||||
FROM nvidia/cuda:12.8.0-cudnn-devel-ubuntu24.04 AS deps
|
||||
|
||||
ARG llamacpp_version=b4651
|
||||
ARG llamacpp_version=b4714
|
||||
ARG llamacpp_cuda=OFF
|
||||
ARG cuda_arch=75-real;80-real;86-real;89-real;90-real
|
||||
|
||||
|
Loading…
Reference in New Issue
Block a user