mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-10 11:54:52 +00:00
fix
This commit is contained in:
parent
107fcfe9b6
commit
2d4b31070e
@ -178,7 +178,6 @@ class FlashLlamaAttention(torch.nn.Module):
|
||||
False,
|
||||
True,
|
||||
False,
|
||||
0,
|
||||
None,
|
||||
)
|
||||
# Decode
|
||||
|
@ -167,7 +167,6 @@ class FlashNeoxAttention(torch.nn.Module):
|
||||
False,
|
||||
True,
|
||||
False,
|
||||
0,
|
||||
None,
|
||||
)
|
||||
# Decode
|
||||
|
@ -201,7 +201,6 @@ class FlashRWAttention(torch.nn.Module):
|
||||
False,
|
||||
True,
|
||||
False,
|
||||
0,
|
||||
None,
|
||||
)
|
||||
# Decode
|
||||
@ -336,7 +335,6 @@ class FlashRWLargeAttention(torch.nn.Module):
|
||||
False,
|
||||
True,
|
||||
False,
|
||||
0,
|
||||
None,
|
||||
)
|
||||
# Decode
|
||||
|
@ -289,7 +289,6 @@ class FlashMQAttention(torch.nn.Module):
|
||||
False,
|
||||
True,
|
||||
False,
|
||||
0,
|
||||
None,
|
||||
)
|
||||
# Decode
|
||||
|
Loading…
Reference in New Issue
Block a user