From 849d8821abaa5ed39ef8024bc412442e0f7ce1a5 Mon Sep 17 00:00:00 2001 From: Nicolas Patry Date: Wed, 23 Oct 2024 18:02:50 +0800 Subject: [PATCH] QuantLinear is rocm compatible. --- server/text_generation_server/layers/gptq/__init__.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/server/text_generation_server/layers/gptq/__init__.py b/server/text_generation_server/layers/gptq/__init__.py index 63131dee..c6db32d3 100644 --- a/server/text_generation_server/layers/gptq/__init__.py +++ b/server/text_generation_server/layers/gptq/__init__.py @@ -10,7 +10,7 @@ from text_generation_server.utils.weights import Weight, Weights, WeightsLoader if SYSTEM == "ipex": from .ipex import QuantLinear -elif SYSTEM == "cuda": +elif SYSTEM in {"cuda", "rocm"}: from .cuda import QuantLinear