mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-10 20:04:52 +00:00
Small fix.
This commit is contained in:
parent
c07ee68b60
commit
95583ee257
@@ -63,7 +63,7 @@ class FlashSantacoderSharded(FlashCausalLM):
|
||||
aliases={"transformer.wte.weight": ["lm_head.weight"]},
|
||||
)
|
||||
if config.quantize == "gptq":
|
||||
- weights.set_gptq_params(model_id)
|
||||
+ weights._set_gptq_params(model_id)
|
||||
|
||||
model = FlashSantacoderForCausalLM(config, weights)
|
||||
|
||||
|
@@ -3,6 +3,8 @@ from typing import List, Dict, Optional, Tuple
|
||||
from safetensors import safe_open, SafetensorError
|
||||
import torch
|
||||
from loguru import logger
|
||||
from huggingface_hub import hf_hub_download
|
||||
import json
|
||||
|
||||
|
||||
class Weights:
|
||||
|
Loading…
Reference in New Issue
Block a user