mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-04-21 23:12:07 +00:00
feat(backend): fix invalid reference to ctx instead of context in release build
This commit is contained in:
parent
3e82f14f57
commit
bd8f0f15e1
@ -105,7 +105,7 @@ namespace huggingface::tgi::backends::llamacpp {
|
|||||||
const auto latency = std::chrono::duration_cast<std::chrono::milliseconds>(end - start);
|
const auto latency = std::chrono::duration_cast<std::chrono::milliseconds>(end - start);
|
||||||
SPDLOG_DEBUG(FMT_STRING("Successfully decoded {:d} token(s) in {}"), batch.n_tokens, latency);
|
SPDLOG_DEBUG(FMT_STRING("Successfully decoded {:d} token(s) in {}"), batch.n_tokens, latency);
|
||||||
#else
|
#else
|
||||||
const auto status = llama_decode(ctx, batch);
|
const auto status = llama_decode(context, batch);
|
||||||
#endif
|
#endif
|
||||||
batch.n_tokens = 0;
|
batch.n_tokens = 0;
|
||||||
if (LLAMA_SUCCESS(status)) {
|
if (LLAMA_SUCCESS(status)) {
|
||||||
|
Loading…
Reference in New Issue
Block a user