Small test and typing fixes (#3078)

* test_weights: add modules_to_not_convert

* More typing fixes
This commit is contained in:
Daniël de Kok 2025-03-10 15:08:23 +01:00 committed by GitHub
parent cae0cbe87d
commit c5ecc7a4de
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
3 changed files with 4 additions and 4 deletions

View File

@@ -25,6 +25,7 @@ def gptq_weights_loader():
         quant_method="gptq",
         quantize="gptq",
         sym=True,
+        modules_to_not_convert=[],
     )
@@ -37,6 +38,7 @@ def gptq_weights_loader_awq():
         quant_method="awq",
         quantize="awq",
         sym=True,
+        modules_to_not_convert=[],
     )

View File

@@ -188,8 +188,6 @@ class GPTQWeightsLoader(WeightsLoader):
     def is_layer_skipped_quantization(
         self, prefix: str, modules_to_not_convert: List[str]
     ):
-        if modules_to_not_convert is None:
-            return False
         return any(module_name in prefix for module_name in modules_to_not_convert)

     def get_weights_col_packed(

View File

@@ -21,7 +21,7 @@ class _QuantizerConfig:
     quant_method: str
     sym: bool
     weight_block_size: Optional[List[int]]
-    modules_to_not_convert: Optional[List[str]]
+    modules_to_not_convert: List[str]


 @dataclass
@@ -52,7 +52,7 @@ def _get_quantizer_config(model_id, revision):
     sym = False
     desc_act = False
     weight_block_size = None
-    modules_to_not_convert = None
+    modules_to_not_convert = []
     filename = "config.json"
     try: