diff --git a/server/text_generation_server/models/__init__.py b/server/text_generation_server/models/__init__.py index 22cd0f57..9c0a5eaa 100644 --- a/server/text_generation_server/models/__init__.py +++ b/server/text_generation_server/models/__init__.py @@ -146,7 +146,9 @@ def get_model( medusa_model_id, revision=revision, filename="config.json" ) hf_hub_download( - medusa_model_id, revision=revision, filename="medusa_lm_head.pt" + medusa_model_id, + revision=revision, + filename="medusa_lm_head.safetensors", ) use_medusa = Path(medusa_config).parent else: