mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 12:24:53 +00:00
fix value
This commit is contained in:
parent
15fdd40587
commit
9904f66966
@@ -319,7 +319,7 @@ def launcher(event_loop):
     env = {
         "LOG_LEVEL": "info,text_generation_router=debug",
-        "ENABLE_CUDA_GRAPHS": "True",
+        "ENABLE_CUDA_GRAPHS": "true",
     }
     if not use_flash_attention:
         env["USE_FLASH_ATTENTION"] = "false"
|
@@ -777,7 +777,7 @@ class FlashCausalLM(Model):
             self.device,
         )

-        if os.getenv("ENABLE_CUDA_GRAPHS", "False") == "True":
+        if os.getenv("ENABLE_CUDA_GRAPHS", "false") == "true":
            try:
                # Warmup cuda graphs for all power of twos until 64
                for i in range(6):
|
Loading…
Reference in New Issue
Block a user