mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-10 11:54:52 +00:00
fix
This commit is contained in:
parent
f6438ac352
commit
f652788d54
@@ -90,7 +90,7 @@ class FlashSantacoder(FlashCausalLM):
     filename, framework="pt", device=str(device) if quantize is None else "cpu"
 ) as f:
     for key in f.keys():
-        value = f.get_slice(key)
+        value = f.get_tensor(key)
         value = value.to(device if quantize is None else "cpu").to(dtype)
 
         layer_name = ".".join(key.split(".")[:4])
Loading…
Reference in New Issue
Block a user