Better error message on non-ROCm systems.

This commit is contained in:
Nicolas Patry 2024-02-09 09:44:53 +00:00
parent a76821e0b2
commit 326f8e30ac

View File

@ -354,6 +354,8 @@ def get_linear(weight, bias, quantize):
"AWQ GEMM kernel can't be used on ROCm systems, please use `--quantize gptq` instead "
"to use Exllama/GPTQ kernels for AWQ inference."
)
if not HAS_AWQ:
raise NotImplementedError("You do not seem to have awq installed, either install it (cd server && make install-awq), or try using GPTQ `---quantize gptq` a conversion AWQ->GPTQ will happen on the fly")
linear = WQLinear(
w_bit=bits,
group_size=groupsize,