Add ignore_eos_token to HTTP interface

This commit is contained in:
Chirag Jain 2023-10-06 18:22:12 +05:30
parent 00b8f36fba
commit 017f3de464
No known key found for this signature in database
GPG Key ID: D6A7538AE0A6D9AF
2 changed files with 6 additions and 1 deletion

View File

@ -138,6 +138,9 @@ pub(crate) struct GenerateParameters {
#[serde(default)] #[serde(default)]
#[schema(exclusive_minimum = 0, nullable = true, default = "null", example = 5)] #[schema(exclusive_minimum = 0, nullable = true, default = "null", example = 5)]
pub top_n_tokens: Option<u32>, pub top_n_tokens: Option<u32>,
#[serde(default)]
#[schema(default = "false")]
pub ignore_eos_token: bool
} }
fn default_max_new_tokens() -> Option<u32> { fn default_max_new_tokens() -> Option<u32> {
@ -162,6 +165,7 @@ fn default_parameters() -> GenerateParameters {
decoder_input_details: false, decoder_input_details: false,
seed: None, seed: None,
top_n_tokens: None, top_n_tokens: None,
ignore_eos_token: false,
} }
} }

View File

@ -156,6 +156,7 @@ impl Validation {
watermark, watermark,
decoder_input_details, decoder_input_details,
top_n_tokens, top_n_tokens,
ignore_eos_token,
.. ..
} = request.parameters; } = request.parameters;
@ -274,7 +275,7 @@ impl Validation {
let stopping_parameters = StoppingCriteriaParameters { let stopping_parameters = StoppingCriteriaParameters {
max_new_tokens, max_new_tokens,
stop_sequences, stop_sequences,
ignore_eos_token: false, ignore_eos_token: ignore_eos_token,
}; };
metrics::histogram!("tgi_request_max_new_tokens", max_new_tokens as f64); metrics::histogram!("tgi_request_max_new_tokens", max_new_tokens as f64);