diff --git a/server/text_generation_server/models/flash_neox.py b/server/text_generation_server/models/flash_neox.py index 470fb73b..fc741f55 100644 --- a/server/text_generation_server/models/flash_neox.py +++ b/server/text_generation_server/models/flash_neox.py @@ -150,4 +150,4 @@ class FlashNeoXSharded(FlashNeoX): else: module._buffers[param_name] = tensor - # model.post_load_weights(quantize) + model.post_load_weights(quantize)