Update quantize.py: pass trust_remote_code to AutoModelForCausalLM.from_config

2025-09-10 11:54:52 +00:00 · 2023-07-19 17:43:49 +02:00 · 2023-07-19 17:43:49 +02:00 · d6649411c4
commit d6649411c4
parent 5a1512c025
1 changed files with 1 additions and 1 deletions
--- a/server/text_generation_server/utils/gptq/quantize.py
+++ b/server/text_generation_server/utils/gptq/quantize.py
@@ -864,7 +864,7 @@ def quantize(
    )

    with init_empty_weights():
-        model = AutoModelForCausalLM.from_config(config, torch_dtype=torch.float16)
+        model = AutoModelForCausalLM.from_config(config, torch_dtype=torch.float16,trust_remote_code=trust_remote_code)
    model = model.eval()

    print("LOADED model")