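Small fix: call `weights._set_gptq_params` in flash_santacoder.py and import `hf_hub_download` and `json` in weights.py.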

2025-09-10 20:04:52 +00:00 · 2023-07-21 10:20:01 +00:00 · 2023-07-21 10:20:01 +00:00 · 95583ee257
commit 95583ee257
parent c07ee68b60
2 changed files with 3 additions and 1 deletion
--- a/server/text_generation_server/models/flash_santacoder.py
+++ b/server/text_generation_server/models/flash_santacoder.py
@@ -63,7 +63,7 @@ class FlashSantacoderSharded(FlashCausalLM):
            aliases={"transformer.wte.weight": ["lm_head.weight"]},
        )
        if config.quantize == "gptq":
-            weights.set_gptq_params(model_id)
+            weights._set_gptq_params(model_id)

        model = FlashSantacoderForCausalLM(config, weights)

--- a/server/text_generation_server/utils/weights.py
+++ b/server/text_generation_server/utils/weights.py
@@ -3,6 +3,8 @@ from typing import List, Dict, Optional, Tuple
 from safetensors import safe_open, SafetensorError
 import torch
 from loguru import logger
+from huggingface_hub import hf_hub_download
+import json


 class Weights: