fix Qwen VL break in intel platform

Signed-off-by: Wang, Yi A <yi.a.wang@intel.com>
2025-07-29 11:20:16 +00:00 · 2025-02-09 18:01:20 -08:00 · 2025-02-09 18:01:20 -08:00 · 57385c5463
commit 57385c5463
parent 4b8cda684b
1 changed files with 13 additions and 7 deletions
--- a/server/text_generation_server/layers/rotary.py
+++ b/server/text_generation_server/layers/rotary.py
@ -577,6 +577,12 @@ class RotaryPositionEmbeddingMultimodalSections(PositionRotaryEmbedding):
        cos: torch.Tensor,
        sin: torch.Tensor,
    ):
        if SYSTEM == "ipex":
            ipex.llm.functional.rotary_embedding(
                query, key, sin, cos, query.size(-1), True
            )
        else:
            # rotate half the sequence length
            rot = cos.shape[-1] // 2
            q2 = torch.cat([-query[..., rot:], query[..., :rot]], dim=-1)