mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-05-14 22:12:06 +00:00
Update server.rs
This commit is contained in:
parent
c4422e5678
commit
2fa5e31839
@ -128,6 +128,11 @@ example = json ! ({"error": "Model is overloaded"})),
|
||||
example = json ! ({"error": "Input validation error"})),
|
||||
(status = 500, description = "Incomplete generation", body = ErrorResponse,
|
||||
example = json ! ({"error": "Incomplete generation"})),
|
||||
params(("max_input_length" = usize, Path, description = "This is the maximum allowed input
|
||||
length (expressed in number of tokens) for users. The larger this value, the longer prompt
|
||||
users can send which can impact the overall memory required to handle the load.
|
||||
Please note that some models have a finite range of sequence they can handle."),
|
||||
)),
|
||||
)
|
||||
)]
|
||||
#[instrument(
|
||||
|
Loading…
Reference in New Issue
Block a user