Mirror of https://github.com/huggingface/text-generation-inference.git, synced 2025-09-09 03:14:53 +00:00
Make style 2
commit 4ee34f64c6
parent afbebe6990
@@ -232,7 +232,7 @@ class VlmCausalLMBatch(CausalLMBatch):
         self.prefilling = prefilling

     @property
-    def token_idx(self):
+    def token_idx(self):  # noqa: F811
         if self.prefilling:
             # no right padding for prefill
             token_idx_scalar = self.attention_mask.shape[-1] - 1
@@ -1534,8 +1534,8 @@ class VlmCausalLM(Model):

         except Exception:
             raise RuntimeError(
-                f"Not enough memory to handle following prefill and decode warmup."
-                f"You need to decrease `--max-batch-prefill-tokens`"
+                "Not enough memory to handle following prefill and decode warmup."
+                "You need to decrease `--max-batch-prefill-tokens`"
             )

         mem_stats = get_hpu_memory_stats(self.device)