Modified fix.

2025-09-10 20:04:52 +00:00 · 2023-07-04 11:30:59 +02:00 · 2023-07-04 11:30:59 +02:00 · 742199aa0d
commit 742199aa0d
parent 81f234ec61
1 changed files with 7 additions and 1 deletions
--- a/server/text_generation_server/models/flash_rw.py
+++ b/server/text_generation_server/models/flash_rw.py
@@ -48,7 +48,13 @@ class FlashRWSharded(FlashCausalLM):
        torch.distributed.barrier(group=self.process_group)
        filenames = weight_files(model_id, revision=revision, extension=".safetensors")
-        weights = Weights(filenames, device, dtype, process_group=self.process_group)
+        weights = Weights(
+            filenames,
+            device,
+            dtype,
+            process_group=self.process_group,
+            aliases={"transformer.word_embeddings.weight": ["lm_head.weight"]},
+        )
        config.quantize = quantize