mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 20:34:54 +00:00
Update server/text_generation_server/layers/gptq/__init__.py
This commit is contained in:
parent
8673bb050d
commit
0229c71b21
@@ -325,6 +325,7 @@ class GPTQWeightsLoader(WeightsLoader):
         if g_idx is not None:
             if (
                 not torch.equal(
+                    # Remove g_idx[0] to adapt the check with TP>1.
                     (g_idx - g_idx[0]).cpu(),
                     torch.tensor(
                         [i // self.groupsize for i in range(g_idx.shape[0])],
Loading…
Reference in New Issue
Block a user