From 1b53c7052326df738409b1b280d2862fd5a4a855 Mon Sep 17 00:00:00 2001 From: seungrokjung Date: Wed, 5 Jun 2024 12:45:53 +0000 Subject: [PATCH] rocm ck flash attn api fix --- server/text_generation_server/layers/attention/rocm.py | 7 +------ 1 file changed, 1 insertion(+), 6 deletions(-) diff --git a/server/text_generation_server/layers/attention/rocm.py b/server/text_generation_server/layers/attention/rocm.py index 2d3601c8..31e26107 100644 --- a/server/text_generation_server/layers/attention/rocm.py +++ b/server/text_generation_server/layers/attention/rocm.py @@ -186,17 +186,12 @@ if ENGINE == "ck": out, cu_seqlens, cu_seqlens, - None, - None, - None, max_s, max_s, 0.0, softmax_scale, False, - causal, - window_size_left, - 0, + True, False, None, )