mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-04-22 15:32:08 +00:00
fix: adds causal to attention params (#2408)
fix: adds causal to attention params to check when using flash attn v1
This commit is contained in:
parent
7a4d831d17
commit
ffc8fb0850
@ -293,6 +293,7 @@ else:
|
||||
max_s,
|
||||
softmax_scale,
|
||||
window_size_left=-1,
|
||||
causal=None,
|
||||
softcap=None,
|
||||
):
|
||||
if window_size_left != -1:
|
||||
|
Loading…
Reference in New Issue
Block a user