Fix quantization for bit widths other than 4.

This commit is contained in:
Nicolas Patry 2023-08-07 12:19:02 +02:00
parent 16fadcec57
commit a217b4df5a

View File

@@ -263,7 +263,7 @@ class QuantLinear(nn.Module):
self.groupsize = groupsize
self.outfeatures = qweight.shape[1]
-self.infeatures = qweight.shape[0] * 32 // 4
+self.infeatures = qweight.shape[0] * 32 // bits
@classmethod
def new(cls, bits, groupsize, infeatures, outfeatures, bias):