From 55e29c956412753c75f676f6b8363a5c683dd3cc Mon Sep 17 00:00:00 2001
From: OlivierDehaene <23298448+OlivierDehaene@users.noreply.github.com>
Date: Thu, 8 Feb 2024 17:28:54 +0100
Subject: [PATCH] my b

---
 router/src/infer.rs | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/router/src/infer.rs b/router/src/infer.rs
index d6dbd842..d7b9b52b 100644
--- a/router/src/infer.rs
+++ b/router/src/infer.rs
@@ -387,7 +387,7 @@ async fn batching_task(
                 };
 
                 let token_budget = max_batch_total_tokens.saturating_sub(batch_max_tokens);
-                let max_size = max_batch_size.map(|max_size| batch_size as usize - max_size);
+                let max_size = max_batch_size.map(|max_size| max_size - batch_size as usize);
 
                 // Try to get a new batch
                 if let Some((mut new_entries, new_batch, span)) = queue