"Fixing" double BOS for mistral too.

2025-09-11 12:24:53 +00:00 · 2024-05-01 18:20:44 +02:00 · 2024-05-01 18:20:44 +02:00 · d1639a5827
commit d1639a5827
parent 6073ece4fc
1 changed file with 5 additions and 0 deletions
--- a/server/text_generation_server/models/flash_mistral.py
+++ b/server/text_generation_server/models/flash_mistral.py
@@ -121,6 +121,11 @@ class FlashMistralBatch(FlashCausalLMBatch):
            requests_idx_mapping[r.id] = i

            tokenized_input = tokenized_input[-r.truncate :]
+            if (
+                tokenized_input[0] == tokenizer.bos_token_id
+                and tokenized_input[1] == tokenizer.bos_token_id
+            ):
+                tokenized_input = tokenized_input[1:]

            input_length = len(tokenized_input)
            input_lengths.append(input_length)