mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 04:14:52 +00:00
none g_idx
This commit is contained in:
parent
994ed8e10d
commit
af2c589cef
@ -177,6 +177,8 @@ class Weights:
|
||||
dtype=torch.int32,
|
||||
device=qweight.device,
|
||||
)
|
||||
else:
|
||||
g_idx = None
|
||||
|
||||
weight = (qweight, qzeros, scales, g_idx, bits, groupsize, False)
|
||||
else:
|
||||
@ -242,6 +244,8 @@ class Weights:
|
||||
dtype=torch.int32,
|
||||
device=qweight.device,
|
||||
)
|
||||
else:
|
||||
g_idx = None
|
||||
|
||||
from text_generation_server.utils.layers import HAS_EXLLAMA
|
||||
|
||||
|
Loading…
Reference in New Issue
Block a user