diff --git a/launcher/src/main.rs b/launcher/src/main.rs
index 54b8342b..be2426ee 100644
--- a/launcher/src/main.rs
+++ b/launcher/src/main.rs
@@ -257,7 +257,7 @@ struct Args {
     /// Limits the number of tokens for the prefill operation.
     /// Since this operation take the most memory and is compute bound, it is interesting
     /// to limit the number of requests that can be sent.
-    /// Default to `max_input_length + 50` to give a bit of room.
+    /// Default to `max_input_tokens + 50` to give a bit of room.
     #[clap(long, env)]
     max_batch_prefill_tokens: Option,