fix env var

2025-09-11 04:14:52 +00:00 · 2024-01-10 17:17:19 +01:00 · 2024-01-10 17:17:19 +01:00 · 8260dc00d8
commit 8260dc00d8
parent 9904f66966
1 changed file with 1 addition and 1 deletion
--- a/server/text_generation_server/models/flash_causal_lm.py
+++ b/server/text_generation_server/models/flash_causal_lm.py
@@ -777,7 +777,7 @@ class FlashCausalLM(Model):
            self.device,
        )

-        if os.getenv("ENABLE_CUDA_GRAPHS", "false") == "true":
+        if os.getenv("ENABLE_CUDA_GRAPHS", "False") == "True":
            try:
                # Warmup cuda graphs for all power of twos until 64
                for i in range(6):