diff --git a/server/text_generation_server/models/globals.py b/server/text_generation_server/models/globals.py index 6373f796..89f920bb 100644 --- a/server/text_generation_server/models/globals.py +++ b/server/text_generation_server/models/globals.py @@ -8,7 +8,7 @@ from text_generation_server.utils.log import log_master REQUEST_LOGPROBS = os.getenv("REQUEST_LOGPROBS", "0").lower() in {"1", "true"} ATTENTION = os.environ["ATTENTION"] # default_prefix_caching = "1" if ATTENTION in {"flashinfer", "flashdecoding"} else "0" -PREFIX_CACHING = os.environ["USE_PREFIX_CACHING"].lower() in { +PREFIX_CACHING = os.environ["PREFIX_CACHING"].lower() in { "1", "true", }