mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-09 19:34:53 +00:00
Update server/text_generation_server/models/flash_neox.py
This commit is contained in:
parent
89ff4e901a
commit
7fc999b7bd
@@ -150,4 +150,4 @@ class FlashNeoXSharded(FlashNeoX):
|
||||
else:
|
||||
module._buffers[param_name] = tensor
|
||||
|
||||
# model.post_load_weights(quantize)
|
||||
model.post_load_weights(quantize)
|
||||
|
Loading…
Reference in New Issue
Block a user