mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-10 03:44:54 +00:00
fix
This commit is contained in:
parent
f6438ac352
commit
f652788d54
@ -90,7 +90,7 @@ class FlashSantacoder(FlashCausalLM):
|
||||
filename, framework="pt", device=str(device) if quantize is None else "cpu"
|
||||
) as f:
|
||||
for key in f.keys():
|
||||
value = f.get_slice(key)
|
||||
value = f.get_tensor(key)
|
||||
value = value.to(device if quantize is None else "cpu").to(dtype)
|
||||
|
||||
layer_name = ".".join(key.split(".")[:4])
|
||||
|
Loading…
Reference in New Issue
Block a user