fmt

Signed-off-by: Wang, Yi A <yi.a.wang@intel.com>
2025-09-09 11:24:53 +00:00 · 2025-05-16 06:07:56 -07:00 · 2025-05-16 06:07:56 -07:00 · becf36f5e4
commit becf36f5e4
parent b5e1ae9209
1 changed files with 2 additions and 1 deletions
--- a/backends/v3/src/queue.rs
+++ b/backends/v3/src/queue.rs
@ -16,6 +16,7 @@ use text_generation_router::validation::{
 use tokio::sync::{mpsc, oneshot};
 use tokio::time::Instant;
 use tracing::{info_span, instrument, Instrument, Span};
+
 /// Queue entry
 #[derive(Debug)]
 pub(crate) struct Entry {
@ -372,8 +373,8 @@ impl State {
                        }
                    }

-                    //HPU padding for the prefill
                    if self.is_hpu_device {
+                        //HPU needs to pad for the prefill
                        max_input_length = max_input_length.max(entry.request.input_length);
                        let actual_prefill_tokens_for_hpu =
                            (batch.len() + 1) as u32 * max_input_length;