Mirror of https://github.com/huggingface/text-generation-inference.git
fix: prefer comparing model enum over str
commit 72c97676fd (parent 9bfa340e34)
@@ -298,8 +298,12 @@ class ModelType(enum.Enum):
        "multimodal": True,
    }

    def __str__(self):
        return self.value["type"]

    @classmethod
    def from_str(cls, model_type: str) -> "ModelType":
        for model in cls:
            if model.value["type"] == model_type:
                return model
        raise ValueError(f"Unknown model type {model_type}")


def get_model(
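For context, the from_str helper added above maps the model_type string reported by a model's configuration back to the corresponding ModelType member, so downstream checks can compare enum members instead of raw strings. A minimal, self-contained sketch of that pattern, assuming an enum whose members carry a metadata dict with a "type" key (the two members shown are illustrative, not the full set defined in TGI):

import enum


class ModelType(enum.Enum):
    # Illustrative members only; TGI defines many more, each with extra
    # metadata such as "name" and "url".
    DEEPSEEK_V2 = {"type": "deepseek_v2", "name": "Deepseek V2"}
    LLAMA = {"type": "llama", "name": "Llama"}

    def __str__(self):
        # The config-style string, e.g. "deepseek_v2".
        return self.value["type"]

    @classmethod
    def from_str(cls, model_type: str) -> "ModelType":
        # Linear scan over members; fails loudly on unknown strings.
        for model in cls:
            if model.value["type"] == model_type:
                return model
        raise ValueError(f"Unknown model type {model_type}")


assert ModelType.from_str("llama") is ModelType.LLAMA
assert str(ModelType.DEEPSEEK_V2) == "deepseek_v2"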
@@ -488,6 +492,9 @@ def get_model(
            f"The backend {SYSTEM} does not support sliding window attention that is used by the model type {model_type}. To use this model nonetheless with the {SYSTEM} backend, please launch TGI with the argument `--max-input-tokens` smaller than sliding_window={sliding_window} (got here max_input_tokens={max_input_tokens})."
        )

    # convert model_type to ModelType enum
    model_type = ModelType.from_str(model_type)

    if model_type == ModelType.DEEPSEEK_V2:
        if FLASH_ATTENTION:
            head_size = max(
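Building on the ModelType sketch above, the effect of the second hunk is that the config-supplied string is converted exactly once near the top of get_model, and every later branch compares enum members rather than strings; an unknown or misspelled model type now raises immediately in from_str instead of silently falling through each string comparison. A hypothetical dispatch sketch (the config payload and print are illustrative, not TGI code):

# Hypothetical config payload; in TGI the string ultimately comes from the
# model's config, but any source of a model_type string works here.
config_dict = {"model_type": "deepseek_v2"}

# Convert once at the boundary...
model_type = ModelType.from_str(config_dict["model_type"])

# ...then dispatch on enum members rather than strings.
if model_type == ModelType.DEEPSEEK_V2:
    print("dispatching to the Deepseek V2 code path")

# A typo such as "deepseek-v2" would raise ValueError("Unknown model type ...")
# up front instead of skipping every branch.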