Easiest fix.

Nicolas Patry 2022-12-20 15:24:42 +01:00
parent 611e21cb13
commit d8e1ce669b


@@ -354,7 +354,8 @@ class CausalLM(Model):
         if stop:
             # Decode all tokens
             output_text = self.tokenizer.decode(
-                all_input_ids.squeeze(-1), skip_special_tokens=True
+                all_input_ids.squeeze(-1), skip_special_tokens=True,
+                clean_up_tokenization_spaces=False
             )
             # Slice with input_length to remove padding
             token_ids = all_input_ids[-new_input_length:]
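
The added keyword stops the tokenizer from normalizing spaces around punctuation during decoding, so the returned text matches the raw token stream instead of a prettified version. Note the parameter is spelled clean_up_tokenization_spaces in the transformers decode API. Below is a minimal sketch of the difference; the gpt2 tokenizer and the sample string are purely illustrative and not taken from this commit:

from transformers import AutoTokenizer

# Illustrative tokenizer; most tokenizers show the same effect.
tokenizer = AutoTokenizer.from_pretrained("gpt2")

ids = tokenizer("Hello , world !")["input_ids"]

# Default decoding applies clean_up_tokenization_spaces (True by default in
# transformers at the time of this commit), which rewrites spacing around
# punctuation:
print(tokenizer.decode(ids, skip_special_tokens=True))
# -> "Hello, world!"

# Disabling the cleanup preserves the text exactly as it was tokenized,
# which is what the decoding path above relies on:
print(tokenizer.decode(ids, skip_special_tokens=True,
                       clean_up_tokenization_spaces=False))
# -> "Hello , world !"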