Fix ROCm GPTQ by using the Triton code path too (renamed the `cuda` module to `triton`).

This commit is contained in:
Nicolas Patry 2024-10-25 07:26:33 +02:00
parent 43df056eee
commit 7dc2adf7e9
No known key found for this signature in database
GPG Key ID: D2920555C90F704C
2 changed files with 2 additions and 2 deletions

View File

@@ -10,8 +10,8 @@ from text_generation_server.utils.weights import Weight, Weights, WeightsLoader
 if SYSTEM == "ipex":
     from .ipex import QuantLinear
-elif SYSTEM == "cuda":
-    from .cuda import QuantLinear
+elif SYSTEM in {"cuda", "rocm"}:
+    from .triton import QuantLinear
 @dataclass