mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 04:14:52 +00:00
remove v2 for now
This commit is contained in:
parent
672f290901
commit
96a520ec78
@@ -33,7 +33,7 @@ except Exception:

 HAS_EXLLAMA = False
 CAN_EXLLAMA = major >= 8
-V2 = os.getenv("EXLLAMA_VERSION", "2") == "2"
+V2 = os.getenv("EXLLAMA_VERSION", "1") == "2"
 if V2 and int(os.getenv("WORLD_SIZE", "1")) > 1:
     logger.warning(
         "Disabling exllama v2 and using v1 instead because there are issues when sharding"
Loading…
Reference in New Issue
Block a user