"Fixing" double BOS for mistral too.

This commit is contained in:
Nicolas Patry 2024-05-01 18:20:44 +02:00
parent 6073ece4fc
commit d1639a5827

View File

@@ -121,6 +121,11 @@ class FlashMistralBatch(FlashCausalLMBatch):
requests_idx_mapping[r.id] = i
tokenized_input = tokenized_input[-r.truncate :]
if (
tokenized_input[0] == tokenizer.bos_token_id
and tokenized_input[1] == tokenizer.bos_token_id
):
tokenized_input = tokenized_input[1:]
input_length = len(tokenized_input)
input_lengths.append(input_length)