Mirror of https://github.com/huggingface/text-generation-inference.git, synced 2025-09-11 12:24:53 +00:00
Fix incorrect use of bias in awq

commit 74d9dfa89e
parent dd304cf14c
@@ -35,10 +35,7 @@ class WQLinear(nn.Module):
         self.qweight = qweight
         self.qzeros = qzeros
         self.scales = scales
-        if bias:
-            self.bias = bias
-        else:
-            self.bias = None
+        self.bias = bias
 
     @torch.no_grad()
     def forward(self, x):
@@ -335,7 +335,7 @@ def get_linear(weight, bias, quantize):
             qweight=qweight,
             qzeros=qzeros,
             scales=scales,
-            bias=bias is not None,
+            bias=bias,
         )
     else:
         raise NotImplementedError(f"Quantization `{quantize}` is not implemented yet.")
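
For context, here is a minimal sketch (not the actual TGI module; the quantization tensors are stand-ins) of why the old call site was wrong: `get_linear` passed `bias is not None`, a Python bool, where `WQLinear` expected the bias tensor itself, so the layer stored `True` instead of the tensor. After the fix, the tensor (or `None`) is forwarded and stored directly.

```python
import torch
import torch.nn as nn


class WQLinear(nn.Module):
    """Simplified stand-in for the AWQ WQLinear layer (illustrative only)."""

    def __init__(self, qweight, qzeros, scales, bias):
        super().__init__()
        self.qweight = qweight
        self.qzeros = qzeros
        self.scales = scales
        # After the fix: store the bias tensor (or None) directly instead of
        # gating on a truthiness check.
        self.bias = bias


bias = torch.zeros(16)

# Before the fix: the call site passed `bias is not None` (a Python bool),
# so the layer ended up holding `True` rather than the bias tensor.
broken = WQLinear(qweight=None, qzeros=None, scales=None, bias=bias is not None)
print(type(broken.bias))  # <class 'bool'>

# After the fix: the bias tensor itself is forwarded.
fixed = WQLinear(qweight=None, qzeros=None, scales=None, bias=bias)
print(type(fixed.bias))  # <class 'torch.Tensor'>
```

Dropping the `if bias:` branch also avoids truth-testing a tensor, which would raise "Boolean value of Tensor with more than one element is ambiguous" if a multi-element bias tensor were ever passed to the old constructor.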