From e9b9a96ba8a2da72bd4677c1a56d758beab778fc Mon Sep 17 00:00:00 2001 From: fxmarty <9808326+fxmarty@users.noreply.github.com> Date: Thu, 6 Jun 2024 12:35:18 +0000 Subject: [PATCH] update --- server/text_generation_server/models/__init__.py | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/server/text_generation_server/models/__init__.py b/server/text_generation_server/models/__init__.py index 2e280ff4..d9b59de4 100644 --- a/server/text_generation_server/models/__init__.py +++ b/server/text_generation_server/models/__init__.py @@ -412,9 +412,8 @@ def get_model( sliding_window = config_dict.get("sliding_window", -1) if sliding_window != -1 and not SUPPORTS_WINDOWING: logger.warning( - f"Flash attention is available, but doesn't support windowing which is required by model {model_id} for best performance." + f"Flash attention is available, but doesn't support windowing which is required by model {model_id} for long contexts." ) - # FLASH_ATTENTION = False if model_type == MAMBA: return Mamba(