mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 04:14:52 +00:00
fixing condition
This commit is contained in:
parent
a9fdfb2464
commit
afe9c07476
@ -173,10 +173,11 @@ class Weights:
|
|||||||
from text_generation_server.utils.layers import HAS_EXLLAMA, CAN_EXLLAMA
|
from text_generation_server.utils.layers import HAS_EXLLAMA, CAN_EXLLAMA
|
||||||
|
|
||||||
if use_exllama:
|
if use_exllama:
|
||||||
if not HAS_EXLLAMA and CAN_EXLLAMA:
|
if not HAS_EXLLAMA:
|
||||||
logger.warning(
|
if CAN_EXLLAMA:
|
||||||
"Exllama GPTQ cuda kernels (which are faster) could have been used, but are not currently installed, try using BUILD_EXTENSIONS=True"
|
logger.warning(
|
||||||
)
|
"Exllama GPTQ cuda kernels (which are faster) could have been used, but are not currently installed, try using BUILD_EXTENSIONS=True"
|
||||||
|
)
|
||||||
use_exllama = False
|
use_exllama = False
|
||||||
else:
|
else:
|
||||||
logger.info("Using exllama kernels")
|
logger.info("Using exllama kernels")
|
||||||
|
Loading…
Reference in New Issue
Block a user