mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-04-21 14:52:20 +00:00
fix
This commit is contained in:
parent
2fa5e31839
commit
09fee2f6fb
@ -128,11 +128,11 @@ example = json ! ({"error": "Model is overloaded"})),
|
||||
example = json ! ({"error": "Input validation error"})),
|
||||
(status = 500, description = "Incomplete generation", body = ErrorResponse,
|
||||
example = json ! ({"error": "Incomplete generation"})),
|
||||
params(("max_input_length" = usize, Path, description = "This is the maximum allowed input
|
||||
params("max_input_length" = usize, Path, description = "This is the maximum allowed input
|
||||
length (expressed in number of tokens) for users. The larger this value, the longer prompt
|
||||
users can send which can impact the overall memory required to handle the load.
|
||||
Please note that some models have a finite range of sequence they can handle."),
|
||||
)),
|
||||
),
|
||||
)
|
||||
)]
|
||||
#[instrument(
|
||||
|
Loading…
Reference in New Issue
Block a user