Update server/text_generation_server/layers/attention/xpu.py

This commit is contained in:
Nicolas Patry 2024-05-31 17:56:08 +02:00 committed by GitHub
parent d44688b6ac
commit b0c168d249
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -14,9 +14,6 @@ def attention(
softmax_scale,
window_size_left=-1,
):
if window_size_left <= 0 and window_size_left != -1:
raise ValueError("`window_size_left` must be > 0 or -1")
if window_size_left != -1:
raise ValueError(
f"XPU version of Flash Attention does not support window attention (window_size_left != -1, got window_size_left={window_size_left})."