Mirror of https://github.com/huggingface/text-generation-inference.git, synced 2025-04-24 16:32:12 +00:00
Update docstring in launcher/src/main.rs instead

commit a1b3887846
parent 7a40844734
@@ -702,8 +702,8 @@ struct Args {
     /// Overall this number should be the largest possible amount that fits the
     /// remaining memory (after the model is loaded). Since the actual memory overhead
     /// depends on other parameters like if you're using quantization, flash attention
-    /// or the model implementation, text-generation-inference cannot infer this number
-    /// automatically.
+    /// or the model implementation, text-generation-inference infers this number automatically
+    /// if not provided ensuring that the value is as large as possible.
     #[clap(long, env)]
     max_batch_total_tokens: Option<u32>,
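For context, here is a minimal stand-alone sketch of how an `Option<u32>` clap field declared like the one in this diff behaves. This is illustrative only, not the launcher's actual code, and it assumes clap with the `derive` and `env` features enabled; the printed messages are hypothetical.

// Illustrative sketch only: shows the behavior of an `Option<u32>` clap field
// declared like `max_batch_total_tokens` in the diff above. Assumes clap with
// the `derive` and `env` features; the println! messages are hypothetical.
use clap::Parser;

#[derive(Parser, Debug)]
struct Args {
    /// Total token budget for a batch; inferred automatically when absent.
    #[clap(long, env)]
    max_batch_total_tokens: Option<u32>,
}

fn main() {
    let args = Args::parse();
    match args.max_batch_total_tokens {
        // Set explicitly via `--max-batch-total-tokens` or the
        // MAX_BATCH_TOTAL_TOKENS environment variable.
        Some(n) => println!("using explicit batch token budget: {n}"),
        // Left unset: per the updated docstring, text-generation-inference
        // infers the largest value that fits the memory remaining after the
        // model is loaded.
        None => println!("no budget provided; inferring from free memory"),
    }
}

With a declaration like this, passing `--max-batch-total-tokens 32000` (the number is arbitrary here) pins the budget explicitly, while omitting both the flag and the environment variable leaves the value to the automatic inference the new docstring describes.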