Fix Cohere.

This commit is contained in:
Nicolas Patry 2024-05-31 22:54:43 +00:00
parent 66081e6ae7
commit b98b94d695

View File

@@ -306,7 +306,7 @@ class FlashCohereAttention(torch.nn.Module):
)
# Decode
else:
-paged_attention(
+attn_output = paged_attention(
attn_output,
query,
kv_cache[0],