remove v2 for now

This commit is contained in:
OlivierDehaene 2023-12-21 15:24:41 +01:00
parent 672f290901
commit 96a520ec78

View File

@@ -33,7 +33,7 @@ except Exception:
HAS_EXLLAMA = False
CAN_EXLLAMA = major >= 8
-V2 = os.getenv("EXLLAMA_VERSION", "2") == "2"
+V2 = os.getenv("EXLLAMA_VERSION", "1") == "2"
if V2 and int(os.getenv("WORLD_SIZE", "1")) > 1:
logger.warning(
"Disabling exllama v2 and using v1 instead because there are issues when sharding"