mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-10 20:04:52 +00:00
Update quantize.py
This commit is contained in:
parent
5a1512c025
commit
d6649411c4
@@ -864,7 +864,7 @@ def quantize(
|
|||||||
)
|
)
|
||||||
|
|
||||||
with init_empty_weights():
|
with init_empty_weights():
|
||||||
model = AutoModelForCausalLM.from_config(config, torch_dtype=torch.float16)
|
model = AutoModelForCausalLM.from_config(config, torch_dtype=torch.float16,trust_remote_code=trust_remote_code)
|
||||||
model = model.eval()
|
model = model.eval()
|
||||||
|
|
||||||
print("LOADED model")
|
print("LOADED model")
|
||||||
|
Loading…
Reference in New Issue
Block a user