Load quantize_config.json from local path

2025-09-10 11:54:52 +00:00 · 2023-07-27 18:03:04 -07:00 · 2023-07-27 18:03:04 -07:00 · 987b0fff3a
commit 987b0fff3a
parent 9f18f4c006
1 changed file with 6 additions and 2 deletions
--- a/server/text_generation_server/utils/weights.py
+++ b/server/text_generation_server/utils/weights.py
@@ -220,9 +220,13 @@ class Weights:

        return bits, groupsize

-    def _set_gptq_params(self, model_id):
+    def _set_gptq_params(self, model_id: str):
        try:
-            filename = hf_hub_download(model_id, filename="quantize_config.json")
+            potential_local_path = Path(model_id, "quantize_config.json")
+            if potential_local_path.exists():
+                filename = potential_local_path
+            else:
+                filename = hf_hub_download(model_id, filename="quantize_config.json")
            with open(filename, "r") as f:
                data = json.load(f)
            self.gptq_bits = data["bits"]