mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 20:34:54 +00:00
"Fixing" double BOS for mistral too.
This commit is contained in:
parent
6073ece4fc
commit
d1639a5827
@@ -121,6 +121,11 @@ class FlashMistralBatch(FlashCausalLMBatch):
|
|||||||
requests_idx_mapping[r.id] = i
|
requests_idx_mapping[r.id] = i
|
||||||
|
|
||||||
tokenized_input = tokenized_input[-r.truncate :]
|
tokenized_input = tokenized_input[-r.truncate :]
|
||||||
|
if (
|
||||||
|
tokenized_input[0] == tokenizer.bos_token_id
|
||||||
|
and tokenized_input[1] == tokenizer.bos_token_id
|
||||||
|
):
|
||||||
|
tokenized_input = tokenized_input[1:]
|
||||||
|
|
||||||
input_length = len(tokenized_input)
|
input_length = len(tokenized_input)
|
||||||
input_lengths.append(input_length)
|
input_lengths.append(input_length)
|
||||||
|
Loading…
Reference in New Issue
Block a user