mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-10 20:04:52 +00:00
Support TheBloke exported models.
This commit is contained in:
parent
2d8c034df3
commit
cbf047b4ae
@@ -345,4 +345,15 @@ class Weights:
|
|||||||
self.gptq_bits = data["bits"]
|
self.gptq_bits = data["bits"]
|
||||||
self.gptq_groupsize = data["group_size"]
|
self.gptq_groupsize = data["group_size"]
|
||||||
except Exception:
|
except Exception:
|
||||||
pass
|
filename = "quant_config.json"
|
||||||
|
try:
|
||||||
|
if os.path.exists(os.path.join(model_id, filename)):
|
||||||
|
filename = os.path.join(model_id, filename)
|
||||||
|
else:
|
||||||
|
filename = hf_hub_download(model_id, filename=filename)
|
||||||
|
with open(filename, "r") as f:
|
||||||
|
data = json.load(f)
|
||||||
|
self.gptq_bits = data["w_bit"]
|
||||||
|
self.gptq_groupsize = data["q_group_size"]
|
||||||
|
except Exception:
|
||||||
|
pass
|
||||||
|
Loading…
Reference in New Issue
Block a user