Fix qwen vl (#3096)

* Fixing qwen2.5 VL.
* Fixing the CI.
2025-07-22 07:40:17 +00:00 · 2025-03-11 11:00:41 +01:00 · 2025-03-11 11:00:41 +01:00 · b447f7e821
commit b447f7e821
parent 094975c3a8
2 changed files with 2 additions and 3 deletions
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -4754,7 +4754,7 @@ dependencies = [
 "async-trait",
 "bindgen 0.71.1",
 "clap 4.5.30",
- "hf-hub 0.3.2",
+ "hf-hub 0.4.2",
 "num_cpus",
 "pkg-config",
 "text-generation-router",
--- a/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py
+++ b/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py
@@ -313,7 +313,6 @@ class Qwen2_5_VLVisionConfig(PretrainedConfig):


 class Qwen2_5_VLConfig(PretrainedConfig):
-
    def __init__(
        self,
        vocab_size=152064,
@@ -702,7 +701,6 @@ class Qwen2_5VisionModel(nn.Module):
        pixel_values: torch.Tensor,
        grid_thw: Optional[torch.LongTensor] = None,
    ) -> torch.Tensor:
-
        # reshape the input tensor for processing
        shape = (
            -1,
@@ -967,6 +965,7 @@ class Qwen2_5VLForConditionalGeneration(nn.Module):
            max_s=max_s,
            true_max_s=max_s,
            prefill_cache_indices=prefill_cache_indices,
+            adapter_data=adapter_data,
        )
        if lm_head_indices is not None:
            hidden_states = hidden_states[lm_head_indices]