mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-04-24 00:12:08 +00:00
feat(backend): fix invalid reference to context in release mode
This commit is contained in:
parent
7e2890fe2c
commit
488ba93898
@@ -74,7 +74,7 @@ namespace huggingface::tgi::backends::llamacpp {
|
||||
const auto latency = std::chrono::duration_cast<std::chrono::milliseconds>(end - start);
|
||||
SPDLOG_DEBUG(FMT_STRING("Successfully decoded {:d} token(s) in {}"), batch.n_tokens, latency);
|
||||
#else
|
||||
- const auto status = llama_decode(context, batch);
|
||||
+ const auto status = llama_decode(context_.get(), batch);
|
||||
#endif
|
||||
batch.n_tokens = 0;
|
||||
if (LLAMA_SUCCESS(status)) [[likely]] {
|
||||
|
Loading…
Reference in New Issue
Block a user