mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-04-25 20:12:07 +00:00
More typing fixes
This commit is contained in:
parent
ed5bfe4241
commit
0a9f0dc53a
@@ -188,8 +188,6 @@ class GPTQWeightsLoader(WeightsLoader):
|
||||
def is_layer_skipped_quantization(
|
||||
self, prefix: str, modules_to_not_convert: List[str]
|
||||
):
|
||||
if modules_to_not_convert is None:
|
||||
return False
|
||||
return any(module_name in prefix for module_name in modules_to_not_convert)
|
||||
|
||||
def get_weights_col_packed(
|
||||
|
@@ -21,7 +21,7 @@ class _QuantizerConfig:
|
||||
quant_method: str
|
||||
sym: bool
|
||||
weight_block_size: Optional[List[int]]
|
||||
modules_to_not_convert: Optional[List[str]]
|
||||
modules_to_not_convert: List[str]
|
||||
|
||||
|
||||
@dataclass
|
||||
@@ -52,7 +52,7 @@ def _get_quantizer_config(model_id, revision):
|
||||
sym = False
|
||||
desc_act = False
|
||||
weight_block_size = None
|
||||
modules_to_not_convert = None
|
||||
modules_to_not_convert = []
|
||||
|
||||
filename = "config.json"
|
||||
try:
|
||||
|
Loading…
Reference in New Issue
Block a user