From 3836c3fe7248b445421ed7312b868e0b32388b2f Mon Sep 17 00:00:00 2001
From: "Wang, Yi A"
Date: Wed, 30 Oct 2024 22:29:05 -0700
Subject: [PATCH] fix qwen2 failure in intel cpu

Signed-off-by: Wang, Yi A
---
 .../text_generation_server/models/custom_modeling/qwen2_vl.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/server/text_generation_server/models/custom_modeling/qwen2_vl.py b/server/text_generation_server/models/custom_modeling/qwen2_vl.py
index 6ebc3d4e..f920c2a7 100644
--- a/server/text_generation_server/models/custom_modeling/qwen2_vl.py
+++ b/server/text_generation_server/models/custom_modeling/qwen2_vl.py
@@ -505,5 +505,7 @@ class Qwen2VLForConditionalGeneration(nn.Module):
             prefill_cache_indices=prefill_cache_indices,
         )
         hidden_states, _ = self.norm(hidden_states)
+        if lm_head_indices is not None:
+            hidden_states = hidden_states[lm_head_indices]
         logits = self.lm_head(hidden_states)
         return logits, None