mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-04-22 15:32:08 +00:00
fix: return the out tensor rather than the function's return value (#2361)
This commit is contained in:
parent
8b0f5feb02
commit
83d1f23fea
@ -292,8 +292,7 @@ else:
|
||||
)
|
||||
|
||||
out = torch.empty_like(q)
|
||||
|
||||
return flash_attn_cuda.fwd(
|
||||
flash_attn_cuda.fwd(
|
||||
q,
|
||||
k,
|
||||
v,
|
||||
@ -309,4 +308,5 @@ else:
|
||||
False,
|
||||
0,
|
||||
None,
|
||||
)[0]
|
||||
)
|
||||
return out
|
||||
|
Loading…
Reference in New Issue
Block a user