Mirror of https://github.com/huggingface/text-generation-inference.git (synced 2025-04-21 23:12:07 +00:00)
Merge branch 'habana-main' into 2.3.0
Commit: c23584f626
Changes to `class CausalLM(Model)`:

```diff
@@ -731,13 +731,11 @@ class CausalLM(Model):
         }
 
-        if model.config.model_type in ["llama", "mistral", "starcoder2", "qwen2", "falcon", "gemma"]:
+        if model.config.model_type in ["llama", "mistral", "starcoder2", "qwen2", "falcon"]:
             if model.config.model_type not in ["falcon"]:
                 self.kwargs["attn_softmax_bf16"] = True
 
-            if model.config.model_type not in ["gemma"]:
-                self.kwargs["trim_logits"] = True
+            self.kwargs["trim_logits"] = True
 
             if os.getenv("USE_FLASH_ATTENTION", "false").lower() == "true":
                 self.kwargs["use_flash_attention"] = True
```
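As a rough standalone illustration of what the merged code configures, here is a minimal sketch. The helper name `build_hpu_kwargs` is hypothetical; the model-type list, the kwarg names (`attn_softmax_bf16`, `trim_logits`, `use_flash_attention`), and the `USE_FLASH_ATTENTION` environment variable are taken from the hunk above.

```python
import os

# Minimal sketch of the kwargs selection after the merge; the helper name is
# hypothetical, but the flags and checks mirror the hunk above.
def build_hpu_kwargs(model_type: str) -> dict:
    kwargs = {}
    if model_type in ["llama", "mistral", "starcoder2", "qwen2", "falcon"]:
        # bf16 attention softmax for every listed type except falcon
        if model_type not in ["falcon"]:
            kwargs["attn_softmax_bf16"] = True
        # trim_logits is now set unconditionally for the listed model types
        kwargs["trim_logits"] = True
        # flash attention stays opt-in via an environment variable
        if os.getenv("USE_FLASH_ATTENTION", "false").lower() == "true":
            kwargs["use_flash_attention"] = True
    return kwargs

print(build_hpu_kwargs("llama"))   # {'attn_softmax_bf16': True, 'trim_logits': True}
print(build_hpu_kwargs("falcon"))  # {'trim_logits': True}
```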