From 06a3d19142a5d765590cee219fe54cefcc64df4d Mon Sep 17 00:00:00 2001 From: Maxime Laboissonniere Date: Wed, 6 Sep 2023 19:41:42 -0400 Subject: [PATCH] fixing condition --- server/text_generation_server/utils/weights.py | 9 +++++---- 1 file changed, 5 insertions(+), 4 deletions(-) diff --git a/server/text_generation_server/utils/weights.py b/server/text_generation_server/utils/weights.py index 261456bd..71cc1971 100644 --- a/server/text_generation_server/utils/weights.py +++ b/server/text_generation_server/utils/weights.py @@ -173,10 +173,11 @@ class Weights: from text_generation_server.utils.layers import HAS_EXLLAMA, CAN_EXLLAMA if use_exllama: - if not HAS_EXLLAMA and CAN_EXLLAMA: - logger.warning( - "Exllama GPTQ cuda kernels (which are faster) could have been used, but are not currently installed, try using BUILD_EXTENSIONS=True" - ) + if not HAS_EXLLAMA: + if CAN_EXLLAMA: + logger.warning( + "Exllama GPTQ cuda kernels (which are faster) could have been used, but are not currently installed, try using BUILD_EXTENSIONS=True" + ) use_exllama = False else: logger.info("Using exllama kernels")