mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 04:14:52 +00:00
fix env var
This commit is contained in:
parent
9904f66966
commit
8260dc00d8
@@ -777,7 +777,7 @@ class FlashCausalLM(Model):
|
||||
self.device,
|
||||
)
|
||||
|
||||
- if os.getenv("ENABLE_CUDA_GRAPHS", "false") == "true":
|
||||
+ if os.getenv("ENABLE_CUDA_GRAPHS", "False") == "True":
|
||||
try:
|
||||
# Warmup cuda graphs for all power of twos until 64
|
||||
for i in range(6):
|
||||
|
Loading…
Reference in New Issue
Block a user