mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-04-21 23:12:07 +00:00
fix
This commit is contained in:
parent
2fa5e31839
commit
09fee2f6fb
@ -128,11 +128,11 @@ example = json ! ({"error": "Model is overloaded"})),
|
|||||||
example = json ! ({"error": "Input validation error"})),
|
example = json ! ({"error": "Input validation error"})),
|
||||||
(status = 500, description = "Incomplete generation", body = ErrorResponse,
|
(status = 500, description = "Incomplete generation", body = ErrorResponse,
|
||||||
example = json ! ({"error": "Incomplete generation"})),
|
example = json ! ({"error": "Incomplete generation"})),
|
||||||
params(("max_input_length" = usize, Path, description = "This is the maximum allowed input
|
params("max_input_length" = usize, Path, description = "This is the maximum allowed input
|
||||||
length (expressed in number of tokens) for users. The larger this value, the longer prompt
|
length (expressed in number of tokens) for users. The larger this value, the longer prompt
|
||||||
users can send which can impact the overall memory required to handle the load.
|
users can send which can impact the overall memory required to handle the load.
|
||||||
Please note that some models have a finite range of sequence they can handle."),
|
Please note that some models have a finite range of sequence they can handle."),
|
||||||
)),
|
),
|
||||||
)
|
)
|
||||||
)]
|
)]
|
||||||
#[instrument(
|
#[instrument(
|
||||||
|
Loading…
Reference in New Issue
Block a user