mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-10 11:54:52 +00:00
Update quantize.py
This commit is contained in:
parent
5a1512c025
commit
d6649411c4
@@ -864,7 +864,7 @@ def quantize(
|
||||
)
|
||||
|
||||
with init_empty_weights():
|
||||
model = AutoModelForCausalLM.from_config(config, torch_dtype=torch.float16)
|
||||
model = AutoModelForCausalLM.from_config(config, torch_dtype=torch.float16,trust_remote_code=trust_remote_code)
|
||||
model = model.eval()
|
||||
|
||||
print("LOADED model")
|
||||
|
Loading…
Reference in New Issue
Block a user