fixing condition

This commit is contained in:
Maxime Laboissonniere 2023-09-06 20:02:23 -04:00
parent a9fdfb2464
commit afe9c07476

View File

@@ -173,10 +173,11 @@ class Weights:
 from text_generation_server.utils.layers import HAS_EXLLAMA, CAN_EXLLAMA
 if use_exllama:
-    if not HAS_EXLLAMA and CAN_EXLLAMA:
-        logger.warning(
-            "Exllama GPTQ cuda kernels (which are faster) could have been used, but are not currently installed, try using BUILD_EXTENSIONS=True"
-        )
+    if not HAS_EXLLAMA:
+        if CAN_EXLLAMA:
+            logger.warning(
+                "Exllama GPTQ cuda kernels (which are faster) could have been used, but are not currently installed, try using BUILD_EXTENSIONS=True"
+            )
         use_exllama = False
     else:
         logger.info("Using exllama kernels")