diff --git a/server/text_generation_server/models/custom_modeling/qwen2_vl.py b/server/text_generation_server/models/custom_modeling/qwen2_vl.py index 6ebc3d4e..f920c2a7 100644 --- a/server/text_generation_server/models/custom_modeling/qwen2_vl.py +++ b/server/text_generation_server/models/custom_modeling/qwen2_vl.py @@ -505,5 +505,7 @@ class Qwen2VLForConditionalGeneration(nn.Module): prefill_cache_indices=prefill_cache_indices, ) hidden_states, _ = self.norm(hidden_states) + if lm_head_indices is not None: + hidden_states = hidden_states[lm_head_indices] logits = self.lm_head(hidden_states) return logits, None