Mirror of https://github.com/huggingface/text-generation-inference.git
Synced 2025-09-11 20:34:54 +00:00
Fix the prefix_caching variable and remove defaults in the server (they were confusing a lot of the time).
This commit is contained in:
parent 594a2b4a3d
commit 5c72f269b6
@@ -5,9 +5,9 @@ from typing import Dict, Optional
 from text_generation_server.utils.log import log_master
-ATTENTION = os.getenv("ATTENTION", "flashinfer")
-default_prefix_caching = "1" if ATTENTION in {"flashinfer", "flashdecoding"} else "0"
-PREFIX_CACHING = os.getenv("PREFIX_CACHING", default_prefix_caching).lower() in {
+ATTENTION = os.environ["ATTENTION"]
+# default_prefix_caching = "1" if ATTENTION in {"flashinfer", "flashdecoding"} else "0"
+PREFIX_CACHING = os.environ["PREFIX_CACHING"].lower() in {
     "1",
     "true",
 }
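The practical effect of the change is easiest to see side by side. The sketch below is illustrative only and not part of the commit: it contrasts the old os.getenv fallback with the new os.environ lookup, which raises KeyError when the caller (e.g. the launcher) has not exported the variable, so a missing or misspelled variable now fails fast instead of silently falling back to a default.

import os

# Before the change: an unset ATTENTION silently became "flashinfer".
attention_before = os.getenv("ATTENTION", "flashinfer")

# After the change: the variable must be exported by the caller,
# otherwise the lookup raises KeyError instead of guessing a default.
try:
    attention_after = os.environ["ATTENTION"]
except KeyError:
    print("ATTENTION is not set: the server now fails instead of guessing")

# PREFIX_CACHING is parsed the same way and then interpreted as a boolean:
# any of "1" or "true" (case-insensitive) enables prefix caching.
prefix_caching = os.environ.get("PREFIX_CACHING", "0").lower() in {"1", "true"}

Note that the example uses os.environ.get only to keep the snippet runnable without the launcher; the server code itself now uses the strict os.environ["PREFIX_CACHING"] lookup shown in the diff.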