use all tokens

2025-06-19 15:52:08 +00:00 · 2023-04-05 17:18:16 +02:00 · 2023-04-05 17:18:16 +02:00 · 70637b4170
commit 70637b4170
parent b5233f9c3c
1 changed file with 1 addition and 1 deletion
--- a/server/text_generation_server/models/flash_causal_lm.py
+++ b/server/text_generation_server/models/flash_causal_lm.py
@@ -355,7 +355,7 @@ class FlashCausalLM(Model):
            # Generated token
            next_token_logprob = logprobs[-1, next_token_id_item]
            next_token_text, offset, token_offset = self.decode_token(
-                all_input_ids[-(stopping_criteria.current_tokens + 1) :],
+                all_input_ids,
                offset,
                token_offset,
            )