mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 12:24:53 +00:00
none g_idx
This commit is contained in:
parent
bbe5bedea5
commit
76834c9989
@ -177,6 +177,8 @@ class Weights:
|
|||||||
dtype=torch.int32,
|
dtype=torch.int32,
|
||||||
device=qweight.device,
|
device=qweight.device,
|
||||||
)
|
)
|
||||||
|
else:
|
||||||
|
g_idx = None
|
||||||
|
|
||||||
weight = (qweight, qzeros, scales, g_idx, bits, groupsize, False)
|
weight = (qweight, qzeros, scales, g_idx, bits, groupsize, False)
|
||||||
else:
|
else:
|
||||||
@ -242,6 +244,8 @@ class Weights:
|
|||||||
dtype=torch.int32,
|
dtype=torch.int32,
|
||||||
device=qweight.device,
|
device=qweight.device,
|
||||||
)
|
)
|
||||||
|
else:
|
||||||
|
g_idx = None
|
||||||
|
|
||||||
from text_generation_server.utils.layers import HAS_EXLLAMA
|
from text_generation_server.utils.layers import HAS_EXLLAMA
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user