mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 20:34:54 +00:00
update
This commit is contained in:
parent
0d3cc033ad
commit
e9b9a96ba8
@@ -412,9 +412,8 @@ def get_model(
|
||||
sliding_window = config_dict.get("sliding_window", -1)
|
||||
if sliding_window != -1 and not SUPPORTS_WINDOWING:
|
||||
logger.warning(
|
||||
f"Flash attention is available, but doesn't support windowing which is required by model {model_id} for best performance."
|
||||
f"Flash attention is available, but doesn't support windowing which is required by model {model_id} for long contexts."
|
||||
)
|
||||
# FLASH_ATTENTION = False
|
||||
|
||||
if model_type == MAMBA:
|
||||
return Mamba(
|
||||
|
Loading…
Reference in New Issue
Block a user