Fix Qwen2-VL failure on Intel CPU

Signed-off-by: Wang, Yi A <yi.a.wang@intel.com>
2025-09-11 20:34:54 +00:00 · 2024-10-31 22:39:07 +00:00 · 2024-10-31 22:39:07 +00:00 · 17de5998e5
commit 17de5998e5
parent bfa16a5857
1 changed files with 4 additions and 4 deletions
--- a/server/text_generation_server/models/custom_modeling/qwen2_vl.py
+++ b/server/text_generation_server/models/custom_modeling/qwen2_vl.py
@@ -516,7 +516,7 @@ class Qwen2VLForConditionalGeneration(nn.Module):
            prefill_cache_indices=prefill_cache_indices,
        )
        hidden_states, _ = self.norm(hidden_states)
-        print("lm_head_indices", lm_head_indices)
-        logits, speculative_logits = self.lm_head(hidden_states)
-        # import ipdb; ipdb.set_trace()
-        return logits, speculative_logits
+        if lm_head_indices is not None:
+            hidden_states = hidden_states[lm_head_indices]
+        logits = self.lm_head(hidden_states)
+        return logits, None