From 0229c71b21e4ea023bb8883e4fab790192dc968d Mon Sep 17 00:00:00 2001 From: Nicolas Patry Date: Fri, 18 Oct 2024 17:55:36 +0200 Subject: [PATCH] Update server/text_generation_server/layers/gptq/__init__.py --- server/text_generation_server/layers/gptq/__init__.py | 1 + 1 file changed, 1 insertion(+) diff --git a/server/text_generation_server/layers/gptq/__init__.py b/server/text_generation_server/layers/gptq/__init__.py index 86856887..63131dee 100644 --- a/server/text_generation_server/layers/gptq/__init__.py +++ b/server/text_generation_server/layers/gptq/__init__.py @@ -325,6 +325,7 @@ class GPTQWeightsLoader(WeightsLoader): if g_idx is not None: if ( not torch.equal( + # Subtract g_idx[0] so the check also works with TP>1. (g_idx - g_idx[0]).cpu(), torch.tensor( [i // self.groupsize for i in range(g_idx.shape[0])],