mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-09 11:24:53 +00:00
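minor fix: check `query.device.type` instead of `query.device.dtype` when testing for "xpu" in Qwen2_5VLAttention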
Signed-off-by: Wang, Yi A <yi.a.wang@intel.com>
This commit is contained in:
parent
9f6d1704fe
commit
db11fe1f95
@@ -460,7 +460,7 @@ class Qwen2_5VLAttention(nn.Module):
|
|||||||
# execute flash attention
|
# execute flash attention
|
||||||
if SYSTEM == "ipex":
|
if SYSTEM == "ipex":
|
||||||
attn_output = torch.empty_like(query)
|
attn_output = torch.empty_like(query)
|
||||||
if query.device.dtype == "xpu":
|
if query.device.type == "xpu":
|
||||||
ipex.llm.functional.varlen_attention(
|
ipex.llm.functional.varlen_attention(
|
||||||
query.contiguous(),
|
query.contiguous(),
|
||||||
key.contiguous(),
|
key.contiguous(),
|
||||||
|
Loading…
Reference in New Issue
Block a user