mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 04:14:52 +00:00
Fix window_size_left for flash attention v1
This fixes flash attention v1 by no longer raising NotImplementedError when window_size_left is left at its default value of -1.
This commit is contained in:
parent
5ba53d44a1
commit
891b18a0c3
@@ -80,7 +80,7 @@ def attention(
|
|||||||
)
|
)
|
||||||
|
|
||||||
if HAS_FLASH_ATTN:
|
if HAS_FLASH_ATTN:
|
||||||
if window_size_left != 0:
|
if window_size_left != -1:
|
||||||
raise NotImplementedError(
|
raise NotImplementedError(
|
||||||
"window_size_left is only available with flash attn v2"
|
"window_size_left is only available with flash attn v2"
|
||||||
)
|
)
|
||||||
|
Loading…
Reference in New Issue
Block a user