mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-12 04:44:52 +00:00
Fix Cohere.
This commit is contained in:
parent
66081e6ae7
commit
b98b94d695
@ -306,7 +306,7 @@ class FlashCohereAttention(torch.nn.Module):
|
||||
)
|
||||
# Decode
|
||||
else:
|
||||
paged_attention(
|
||||
attn_output = paged_attention(
|
||||
attn_output,
|
||||
query,
|
||||
kv_cache[0],
|
||||
|
Loading…
Reference in New Issue
Block a user