mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-09 11:24:53 +00:00
Fix the image_token_id issue
Signed-off-by: yuanwu <yuan.wu@intel.com>
This commit is contained in:
parent
50ecfc625a
commit
f5aaa18d8e
@@ -1397,7 +1397,9 @@ class Llama4ForConditionalGeneration(nn.Module):
|
||||
vision_flat = image_features.view(-1, image_features.size(-1))
|
||||
projected_vision_flat = self.multi_modal_projector(vision_flat)
|
||||
|
||||
- special_image_mask = (input_ids == self.config.image_token_id).unsqueeze(-1)
|
||||
+ special_image_mask = (input_ids == self.config.image_token_index).unsqueeze(
|
||||
+     -1
|
||||
+ )
|
||||
final_mask = special_image_mask.to(inputs_embeds.device)
|
||||
inputs_embeds = inputs_embeds.view(-1, inputs_embeds.size(-1))
|
||||
|
||||
|
Loading…
Reference in New Issue
Block a user