Tied embeddings for Qwen2

This commit is contained in:
matvey-kolbasov-hs 2024-07-24 11:59:56 +03:00
parent 8642250602
commit f73f57ca21

View File

@@ -959,6 +959,10 @@ def get_model(
                 dtype=dtype,
                 trust_remote_code=trust_remote_code,
                 lora_adapter_ids=lora_adapter_ids,
+                aliases={
+                    "lm_head.weight": ["model.word_embeddings.weight"],
+                    "model.word_embeddings.weight": ["lm_head.weight"],
+                },
             )
         elif sharded:
             raise NotImplementedError(FLASH_ATT_ERROR_MESSAGE.format("Sharded Qwen2"))