This commit is contained in:
Cyril Vallez 2024-12-19 17:49:06 +00:00
parent 2e2631e093
commit 44b367937b

View File

@ -8,7 +8,7 @@ from text_generation_server.utils.log import log_master
# Module-level feature flags, all read from the process environment.

# True when REQUEST_LOGPROBS is set to "1" or "true" (compared after
# lowercasing); an unset variable falls back to "0", i.e. False.
REQUEST_LOGPROBS = os.getenv("REQUEST_LOGPROBS", "0").lower() in {"1", "true"}
# Subscript access on os.environ: there is no default, so an unset ATTENTION
# raises KeyError when this line executes.
ATTENTION = os.environ["ATTENTION"]
# default_prefix_caching = "1" if ATTENTION in {"flashinfer", "flashdecoding"} else "0"
# NOTE(review): the next two lines differ only in the environment variable
# name, and the first one opens a set literal that is never closed before the
# second begins. This looks like the removed/added pair of a diff hunk whose
# -/+ markers were stripped (the hunk header reports 7 lines per side) --
# presumably the "USE_PREFIX_CACHING" line is the old one; confirm against the
# repository before treating either line as live code.
PREFIX_CACHING = os.environ["USE_PREFIX_CACHING"].lower() in {
# Same membership test as REQUEST_LOGPROBS ("1" or "true" after lowercasing),
# but read via os.environ[...], so an unset variable raises KeyError instead
# of defaulting to False.
PREFIX_CACHING = os.environ["PREFIX_CACHING"].lower() in {
"1",
"true",
}