diff --git a/backends/llamacpp/csrc/backend.cpp b/backends/llamacpp/csrc/backend.cpp index 17709b72..46052435 100644 --- a/backends/llamacpp/csrc/backend.cpp +++ b/backends/llamacpp/csrc/backend.cpp @@ -28,7 +28,10 @@ namespace huggingface::tgi::backends::llamacpp { false, false )); - llama_sampler_chain_add(pSampler, llama_sampler_init_top_k(static_cast(top_k))); + + if (top_k > 0) { + llama_sampler_chain_add(pSampler, llama_sampler_init_top_k(static_cast(top_k))); + } if (0 < top_p && top_p < 1) { llama_sampler_chain_add(pSampler, llama_sampler_init_top_p(top_p, 1));